From 3c5c90498f5ceba3c40c7c4f80ed0692313b9627 Mon Sep 17 00:00:00 2001 From: Amaury Chamayou Date: Wed, 27 Sep 2023 12:59:11 +0000 Subject: [PATCH 01/11] Add basic backpressure mechanism if primary has too many in-flight transactions --- include/ccf/odata_error.h | 1 + src/consensus/aft/raft.h | 8 ++++++++ src/kv/kv_types.h | 1 + src/kv/test/stub_consensus.h | 5 +++++ src/node/rpc/frontend.h | 12 ++++++++++++ tests/infra/basicperf.py | 15 +++++++++++++++ 6 files changed, 42 insertions(+) diff --git a/include/ccf/odata_error.h b/include/ccf/odata_error.h index bc6f9e88ec2b..928b0bd22a6b 100644 --- a/include/ccf/odata_error.h +++ b/include/ccf/odata_error.h @@ -112,6 +112,7 @@ namespace ccf ERROR(ProposalCreatedTooLongAgo) ERROR(InvalidCreatedAt) ERROR(JSException) + ERROR(TooManyPendingTransactions) // node-to-node (/join and /create): ERROR(ConsensusTypeMismatch) diff --git a/src/consensus/aft/raft.h b/src/consensus/aft/raft.h index c157d3a790f4..687bbad980bd 100644 --- a/src/consensus/aft/raft.h +++ b/src/consensus/aft/raft.h @@ -255,6 +255,14 @@ namespace aft return can_replicate_unsafe(); } + bool is_at_max_capacity() override + { + std::unique_lock guard(state->lock); + return state->last_idx - state->commit_idx >= + 10000; // Make configurable, and should this be a number of tx + // (committable_indices.size()) instead? + } + Consensus::SignatureDisposition get_signature_disposition() override { std::unique_lock guard(state->lock); diff --git a/src/kv/kv_types.h b/src/kv/kv_types.h index 92887ba42be8..3a664e962302 100644 --- a/src/kv/kv_types.h +++ b/src/kv/kv_types.h @@ -440,6 +440,7 @@ namespace kv virtual bool is_backup() = 0; virtual bool is_candidate() = 0; virtual bool can_replicate() = 0; + virtual bool is_at_max_capacity() = 0; enum class SignatureDisposition { diff --git a/src/kv/test/stub_consensus.h b/src/kv/test/stub_consensus.h index 978634741924..01f56b89a306 100644 --- a/src/kv/test/stub_consensus.h +++ b/src/kv/test/stub_consensus.h @@ -59,6 +59,11 @@ namespace kv::test return state == Primary; } + virtual bool is_at_max_capacity() override + { + return false; + } + virtual Consensus::SignatureDisposition get_signature_disposition() override { if (state == Primary) diff --git a/src/node/rpc/frontend.h b/src/node/rpc/frontend.h index 40b0b1f02bb2..7ee6e5fd8873 100644 --- a/src/node/rpc/frontend.h +++ b/src/node/rpc/frontend.h @@ -397,6 +397,18 @@ namespace ccf while (attempts < max_attempts) { + if (consensus != nullptr) + { + if (consensus->is_at_max_capacity()) + { + ctx->set_error( + HTTP_STATUS_SERVICE_UNAVAILABLE, + ccf::errors::TooManyPendingTransactions, + "Too many transactions pending commit on the service."); + return; + } + } + std::unique_ptr tx_p = tables.create_tx_ptr(); set_root_on_proposals(*ctx, *tx_p); diff --git a/tests/infra/basicperf.py b/tests/infra/basicperf.py index 77c8b1881e28..004760bf9c89 100644 --- a/tests/infra/basicperf.py +++ b/tests/infra/basicperf.py @@ -428,6 +428,14 @@ def table(): # if args.stop_primary_after_s: # overall = overall.filter(pl.col("responseStatus") < 500) + number_of_errors = overall.filter( + pl.col("responseStatus") >= 500 + ).height + total_number_of_requests = overall.height + print( + f"Errors: {number_of_errors} ({number_of_errors / total_number_of_requests * 100:.2f}%)" + ) + overall = overall.with_columns( pl.col("receiveTime").alias("latency") - pl.col("sendTime") ) @@ -449,6 +457,13 @@ def table(): agg = pl.concat(agg, rechunk=True) LOG.info("Aggregate results") print(agg) + + number_of_errors = agg.filter(pl.col("responseStatus") >= 500).height + total_number_of_requests = agg.height + print( + f"Errors: {number_of_errors} ({number_of_errors / total_number_of_requests * 100:.2f}%)" + ) + agg_path = os.path.join( network.common_dir, "aggregated_basicperf_output.parquet" ) From 791dde0f67c7d75c81e1e944069dee4cee557761 Mon Sep 17 00:00:00 2001 From: Amaury Chamayou Date: Wed, 27 Sep 2023 17:12:44 +0000 Subject: [PATCH 02/11] Add max_uncommitted_tx_count setting --- doc/host_config_schema/cchost_config.json | 5 +++++ include/ccf/service/consensus_config.h | 1 + src/consensus/aft/raft.h | 10 +++++++--- src/consensus/aft/test/test_common.h | 3 ++- src/consensus/consensus_types.h | 2 +- tests/config.jinja | 3 ++- tests/infra/basicperf.py | 22 +++++++++++++++------- tests/infra/remote.py | 2 ++ 8 files changed, 35 insertions(+), 13 deletions(-) diff --git a/doc/host_config_schema/cchost_config.json b/doc/host_config_schema/cchost_config.json index 04fcc1babb27..a580550b817e 100644 --- a/doc/host_config_schema/cchost_config.json +++ b/doc/host_config_schema/cchost_config.json @@ -562,6 +562,11 @@ "type": "string", "default": "5000ms", "description": "Maximum timeout (time string) after which backup nodes that have not received any message from the primary node (or voted for a candidate) will trigger a new election. This timeout is also used by candidates to restart unsuccessful elections. This should be set to a significantly greater value than 'message_timeout' plus the expected network delay" + }, + "max_uncommitted_tx_count": { + "type": "integer", + "default": 10000, + "description": "Maximum number of uncommitted transactions allowed before the primary refuses new transactions" } }, "description": "This section includes configuration for the consensus protocol (note: should be the same for all other nodes in the service)", diff --git a/include/ccf/service/consensus_config.h b/include/ccf/service/consensus_config.h index 55c5fcf018e4..322a5b2702df 100644 --- a/include/ccf/service/consensus_config.h +++ b/include/ccf/service/consensus_config.h @@ -11,6 +11,7 @@ namespace consensus { ds::TimeString message_timeout = {"100ms"}; ds::TimeString election_timeout = {"5000ms"}; + size_t max_uncommitted_tx_count = 0; bool operator==(const Configuration&) const = default; bool operator!=(const Configuration&) const = default; diff --git a/src/consensus/aft/raft.h b/src/consensus/aft/raft.h index 687bbad980bd..c16df04d8808 100644 --- a/src/consensus/aft/raft.h +++ b/src/consensus/aft/raft.h @@ -146,6 +146,7 @@ namespace aft // Timeouts std::chrono::milliseconds request_timeout; std::chrono::milliseconds election_timeout; + size_t max_uncommitted_tx_count = 0; bool ticking = false; // Configurations @@ -212,6 +213,7 @@ namespace aft request_timeout(settings_.message_timeout), election_timeout(settings_.election_timeout), + max_uncommitted_tx_count(settings_.max_uncommitted_tx_count), reconfiguration_type(reconfiguration_type_), node_client(rpc_request_context_), @@ -257,10 +259,12 @@ namespace aft bool is_at_max_capacity() override { + if (max_uncommitted_tx_count == 0) + { + return false; + } std::unique_lock guard(state->lock); - return state->last_idx - state->commit_idx >= - 10000; // Make configurable, and should this be a number of tx - // (committable_indices.size()) instead? + return state->last_idx - state->commit_idx >= max_uncommitted_tx_count; } Consensus::SignatureDisposition get_signature_disposition() override diff --git a/src/consensus/aft/test/test_common.h b/src/consensus/aft/test/test_common.h index 07dccf0a134a..2e90359a1341 100644 --- a/src/consensus/aft/test/test_common.h +++ b/src/consensus/aft/test/test_common.h @@ -19,12 +19,13 @@ static std::vector cert; static const ds::TimeString request_timeout_ = {"10ms"}; static const ds::TimeString election_timeout_ = {"100ms"}; +static const size_t max_uncommitted_tx_count_ = 0; static const std::chrono::milliseconds request_timeout = request_timeout_; static const std::chrono::milliseconds election_timeout = election_timeout_; static const consensus::Configuration raft_settings{ - request_timeout_, election_timeout_}; + request_timeout_, election_timeout_, max_uncommitted_tx_count_}; static auto hooks = std::make_shared(); diff --git a/src/consensus/consensus_types.h b/src/consensus/consensus_types.h index 9ede9dc6b03b..e65ce57e5056 100644 --- a/src/consensus/consensus_types.h +++ b/src/consensus/consensus_types.h @@ -15,7 +15,7 @@ namespace consensus DECLARE_JSON_TYPE_WITH_OPTIONAL_FIELDS(Configuration); DECLARE_JSON_REQUIRED_FIELDS(Configuration); DECLARE_JSON_OPTIONAL_FIELDS( - Configuration, message_timeout, election_timeout); + Configuration, message_timeout, election_timeout, max_uncommitted_tx_count); #pragma pack(push, 1) template diff --git a/tests/config.jinja b/tests/config.jinja index 140f30e3e091..872b96467c25 100644 --- a/tests/config.jinja +++ b/tests/config.jinja @@ -69,7 +69,8 @@ "consensus": { "message_timeout": "{{ message_timeout }}", - "election_timeout": "{{ election_timeout }}" + "election_timeout": "{{ election_timeout }}", + "max_uncommitted_tx_count": {{ max_uncommitted_tx_count|tojson or 0 }} }, "ledger_signatures": { diff --git a/tests/infra/basicperf.py b/tests/infra/basicperf.py index 004760bf9c89..91256fed3620 100644 --- a/tests/infra/basicperf.py +++ b/tests/infra/basicperf.py @@ -421,12 +421,6 @@ def table(): requestSize=pl.col("request").map_elements(len), responseSize=pl.col("rawResponse").map_elements(len), ) - # 50x are expected when we stop the primary, 500 when we drop the session - # to maintain consistency, and 504 when we try to write to the future primary - # before their election. Since these requests effectively do nothing, they - # should not count towards latency statistics. - # if args.stop_primary_after_s: - # overall = overall.filter(pl.col("responseStatus") < 500) number_of_errors = overall.filter( pl.col("responseStatus") >= 500 @@ -471,6 +465,8 @@ def table(): agg.write_parquet(f) print(f"Aggregated results written to {agg_path}") + # agg = agg.filter(pl.col("responseStatus") < 500) + start_send = agg["sendTime"].min() end_recv = agg["receiveTime"].max() duration_s = (end_recv - start_send).total_seconds() @@ -550,8 +546,20 @@ def table(): .count() .rename({"count": "rcvd"}) ) + errors_per_sec = ( + agg.with_columns( + ( + (pl.col("receiveTime").alias("second") - start_send) + / 1000000 + ).cast(pl.Int64) + ) + .filter(pl.col("responseStatus") >= 500) + .group_by("second") + .count() + .rename({"count": "errors"}) + ) - per_sec = sent_per_sec.join(recv_per_sec, on="second").sort("second") + per_sec = sent_per_sec.join(recv_per_sec, on="second").join(errors_per_sec, on="second", how="outer").sort("second") print(per_sec) per_sec = per_sec.with_columns( sent_rate=pl.col("sent") / per_sec["sent"].max(), diff --git a/tests/infra/remote.py b/tests/infra/remote.py index 503bc2781bf4..0acec80f8982 100644 --- a/tests/infra/remote.py +++ b/tests/infra/remote.py @@ -618,6 +618,7 @@ def __init__( ignore_first_sigterm=False, node_container_image=None, follow_redirect=True, + max_uncommitted_tx_count=0, **kwargs, ): """ @@ -793,6 +794,7 @@ def __init__( ignore_first_sigterm=ignore_first_sigterm, node_address=remote_class.get_node_address(node_address), follow_redirect=follow_redirect, + max_uncommitted_tx_count=max_uncommitted_tx_count, **kwargs, ) From 2a00f6f9c587f8bf97c1b75f8393fec0bfe5f2b6 Mon Sep 17 00:00:00 2001 From: Amaury Chamayou Date: Wed, 27 Sep 2023 17:16:11 +0000 Subject: [PATCH 03/11] Error on errors --- tests/infra/basicperf.py | 13 ++++++++++--- 1 file changed, 10 insertions(+), 3 deletions(-) diff --git a/tests/infra/basicperf.py b/tests/infra/basicperf.py index 91256fed3620..a25a6b6ee335 100644 --- a/tests/infra/basicperf.py +++ b/tests/infra/basicperf.py @@ -465,8 +465,6 @@ def table(): agg.write_parquet(f) print(f"Aggregated results written to {agg_path}") - # agg = agg.filter(pl.col("responseStatus") < 500) - start_send = agg["sendTime"].min() end_recv = agg["receiveTime"].max() duration_s = (end_recv - start_send).total_seconds() @@ -559,7 +557,11 @@ def table(): .rename({"count": "errors"}) ) - per_sec = sent_per_sec.join(recv_per_sec, on="second").join(errors_per_sec, on="second", how="outer").sort("second") + per_sec = ( + sent_per_sec.join(recv_per_sec, on="second") + .join(errors_per_sec, on="second", how="outer") + .sort("second") + ) print(per_sec) per_sec = per_sec.with_columns( sent_rate=pl.col("sent") / per_sec["sent"].max(), @@ -570,6 +572,11 @@ def table(): r = "R" * int(row["rcvd_rate"] * 20) print(f"{row['second']:>3}: {s:>20}|{r:<20}") + if number_of_errors and not args.stop_primary_after_s: + raise RuntimeError( + f"Errors: {number_of_errors} ({number_of_errors / total_number_of_requests * 100:.2f}%)" + ) + with cimetrics.upload.metrics(complete=False) as metrics: LOG.success("Uploading results") metrics.put(args.label, round(throughput, 1)) From dca91b5eda784f7a9e21db272886467131ae27f3 Mon Sep 17 00:00:00 2001 From: Amaury Chamayou Date: Thu, 28 Sep 2023 09:59:23 +0000 Subject: [PATCH 04/11] Backpressure on primary only --- src/consensus/aft/raft.h | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/src/consensus/aft/raft.h b/src/consensus/aft/raft.h index c16df04d8808..a352195f31d4 100644 --- a/src/consensus/aft/raft.h +++ b/src/consensus/aft/raft.h @@ -257,6 +257,11 @@ namespace aft return can_replicate_unsafe(); } + /** + * Returns true if the node is primary, max_uncommitted_tx_count is non-zero + * and the number of transactions replicated but not yet committed exceeds + * max_uncommitted_tx_count. + */ bool is_at_max_capacity() override { if (max_uncommitted_tx_count == 0) @@ -264,7 +269,8 @@ namespace aft return false; } std::unique_lock guard(state->lock); - return state->last_idx - state->commit_idx >= max_uncommitted_tx_count; + return state->leadership_state == kv::LeadershipState::Leader && + (state->last_idx - state->commit_idx >= max_uncommitted_tx_count); } Consensus::SignatureDisposition get_signature_disposition() override From ccbb86c94537a3c6ec19ab611944cbed31cd745d Mon Sep 17 00:00:00 2001 From: Amaury Chamayou Date: Thu, 28 Sep 2023 10:36:44 +0000 Subject: [PATCH 05/11] Do not apply backpressure on node frontend --- include/ccf/endpoint_registry.h | 5 +++++ src/node/rpc/frontend.h | 4 +++- src/node/rpc/node_frontend.h | 8 ++++++++ tests/infra/basicperf.py | 21 +++++++++++++++++++++ tests/requirements.txt | 1 + 5 files changed, 38 insertions(+), 1 deletion(-) diff --git a/include/ccf/endpoint_registry.h b/include/ccf/endpoint_registry.h index 2052dd72df26..8be93dbb3746 100644 --- a/include/ccf/endpoint_registry.h +++ b/include/ccf/endpoint_registry.h @@ -285,5 +285,10 @@ namespace ccf::endpoints const EndpointDefinitionPtr& endpoint); virtual void increment_metrics_retries( const EndpointDefinitionPtr& endpoint); + + virtual bool apply_uncommitted_tx_backpressure() const + { + return true; + } }; } diff --git a/src/node/rpc/frontend.h b/src/node/rpc/frontend.h index 71db3f09dcb1..b9863acf77cf 100644 --- a/src/node/rpc/frontend.h +++ b/src/node/rpc/frontend.h @@ -399,7 +399,9 @@ namespace ccf { if (consensus != nullptr) { - if (consensus->is_at_max_capacity()) + if ( + endpoints.apply_uncommitted_tx_backpressure() && + consensus->is_at_max_capacity()) { ctx->set_error( HTTP_STATUS_SERVICE_UNAVAILABLE, diff --git a/src/node/rpc/node_frontend.h b/src/node/rpc/node_frontend.h index f6e216a0aaf9..4bd2de5577c4 100644 --- a/src/node/rpc/node_frontend.h +++ b/src/node/rpc/node_frontend.h @@ -144,6 +144,14 @@ namespace ccf class NodeEndpoints : public CommonEndpointRegistry { + public: + // The node frontend is exempt from backpressure rules to enable an operator + // to access a node that is not making progress. + bool apply_uncommitted_tx_backpressure() const override + { + return false; + } + private: NetworkState& network; ccf::AbstractNodeOperation& node_operation; diff --git a/tests/infra/basicperf.py b/tests/infra/basicperf.py index a25a6b6ee335..d5c0b6f45426 100644 --- a/tests/infra/basicperf.py +++ b/tests/infra/basicperf.py @@ -19,6 +19,7 @@ import shutil import datetime import ccf.ledger +import plotext as plt def configure_remote_client(args, client_id, client_host, common_dir): @@ -561,12 +562,32 @@ def table(): sent_per_sec.join(recv_per_sec, on="second") .join(errors_per_sec, on="second", how="outer") .sort("second") + .fill_null(0) ) print(per_sec) per_sec = per_sec.with_columns( sent_rate=pl.col("sent") / per_sec["sent"].max(), rcvd_rate=pl.col("rcvd") / per_sec["rcvd"].max(), ) + + plt.simple_bar( + list(per_sec["second"]), + list(per_sec["sent"]), + width=100, + title="Sent requests per second", + ) + plt.show() + + plt.simple_stacked_bar( + list(per_sec["second"]), + [list(per_sec["rcvd"]), list(per_sec["errors"])], + width=100, + labels=["rcvd", "errors"], + colors=["green", "red"], + title="Received requests per second", + ) + plt.show() + for row in per_sec.iter_rows(named=True): s = "S" * int(row["sent_rate"] * 20) r = "R" * int(row["rcvd_rate"] * 20) diff --git a/tests/requirements.txt b/tests/requirements.txt index f98b45a225bf..c9360e3e078e 100644 --- a/tests/requirements.txt +++ b/tests/requirements.txt @@ -23,3 +23,4 @@ pycose fastparquet==2023.* prettytable==3.* polars +plotext \ No newline at end of file From d229da3e4a570bb7d09dd458bac4dec2d711a4bd Mon Sep 17 00:00:00 2001 From: Amaury Chamayou Date: Thu, 28 Sep 2023 13:24:41 +0000 Subject: [PATCH 06/11] Add e2e test --- tests/e2e_operations.py | 42 +++++++++++++++++++++++++++++++++++++++++ 1 file changed, 42 insertions(+) diff --git a/tests/e2e_operations.py b/tests/e2e_operations.py index b3a5fb5e3b46..649a8eb7c554 100644 --- a/tests/e2e_operations.py +++ b/tests/e2e_operations.py @@ -523,7 +523,49 @@ def run_pid_file_check(args): network.ignoring_shutdown_errors = True +def run_max_uncommitted_tx_count(args): + with infra.network.network( + ["local://localhost", "local://localhost"], + args.binary_dir, + args.debug_nodes, + args.perf_nodes, + pdb=args.pdb, + ) as network: + uncommitted_cap = 20 + network.per_node_args_override[0] = { + "max_uncommitted_tx_count": uncommitted_cap + } + network.start_and_open(args) + LOG.info( + f"Start network with max_uncommitted_tx_count set to {uncommitted_cap}" + ) + # Stop the backup node, to freeze commit + primary, backups = network.find_nodes() + backups[0].stop() + unavailable_count = 0 + last_accepted_index = 0 + + with primary.client(identity="user0") as c: + for idx in range(uncommitted_cap + 1): + r = c.post( + "/app/log/public?scope=test_large_snapshot", + body={"id": idx, "msg": "X" * 42}, + log_capture=[], + ) + if r.status_code == http.HTTPStatus.SERVICE_UNAVAILABLE: + unavailable_count += 1 + if last_accepted_index == 0: + last_accepted_index = idx - 1 + LOG.info(f"Last accepted: {last_accepted_index}, {unavailable_count} 503s") + assert unavailable_count > 0, "Expected at least one SERVICE_UNAVAILABLE" + + with primary.client() as c: + r = c.get("/node/network") + assert r.status_code == http.HTTPStatus.OK.value, r + + def run(args): + run_max_uncommitted_tx_count(args) run_file_operations(args) run_tls_san_checks(args) run_config_timeout_check(args) From 8d9167ad6f9450a98290c28f78c178c5d17626b1 Mon Sep 17 00:00:00 2001 From: Amaury Chamayou Date: Thu, 28 Sep 2023 14:26:47 +0000 Subject: [PATCH 07/11] max_uncommitted_tx_count always inited by ctor --- src/consensus/aft/raft.h | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/consensus/aft/raft.h b/src/consensus/aft/raft.h index a352195f31d4..40e86f58273e 100644 --- a/src/consensus/aft/raft.h +++ b/src/consensus/aft/raft.h @@ -146,7 +146,7 @@ namespace aft // Timeouts std::chrono::milliseconds request_timeout; std::chrono::milliseconds election_timeout; - size_t max_uncommitted_tx_count = 0; + size_t max_uncommitted_tx_count; bool ticking = false; // Configurations From f9abf6ef38ca8178590dc810a3ddf5d37e476ea6 Mon Sep 17 00:00:00 2001 From: Amaury Chamayou Date: Thu, 28 Sep 2023 14:27:31 +0000 Subject: [PATCH 08/11] Correctly set default in config struct --- include/ccf/service/consensus_config.h | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/include/ccf/service/consensus_config.h b/include/ccf/service/consensus_config.h index 322a5b2702df..ba1443949d96 100644 --- a/include/ccf/service/consensus_config.h +++ b/include/ccf/service/consensus_config.h @@ -11,7 +11,7 @@ namespace consensus { ds::TimeString message_timeout = {"100ms"}; ds::TimeString election_timeout = {"5000ms"}; - size_t max_uncommitted_tx_count = 0; + size_t max_uncommitted_tx_count = 10000; bool operator==(const Configuration&) const = default; bool operator!=(const Configuration&) const = default; From fbc6d8e16788db19bbc8b17535398720018410e3 Mon Sep 17 00:00:00 2001 From: Amaury Chamayou Date: Thu, 28 Sep 2023 15:22:39 +0000 Subject: [PATCH 09/11] CHANGELOG --- CHANGELOG.md | 6 ++++++ doc/host_config_schema/cchost_config.json | 2 +- 2 files changed, 7 insertions(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 07537a284ce5..95bd4fd03184 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -5,6 +5,12 @@ All notable changes to this project will be documented in this file. The format is based on [Keep a Changelog](http://keepachangelog.com/en/1.0.0/) and this project adheres to [Semantic Versioning](http://semver.org/spec/v2.0.0.html). +## [5.0.0-dev3] + +[5.0.0-dev3]: https://github.com/microsoft/CCF/releases/tag/ccf-5.0.0-dev3 + +- Added a `consensus.max_uncommitted_tx_count` configuration option, which if set specifies the maximum number of transactions that can be pending on the primary. When that threshold is exceeded, a `503 Service Unavailable` is temporarily returned on all but the `/node/*` paths (#5692). + ## [5.0.0-dev2] [5.0.0-dev2]: https://github.com/microsoft/CCF/releases/tag/ccf-5.0.0-dev2 diff --git a/doc/host_config_schema/cchost_config.json b/doc/host_config_schema/cchost_config.json index a580550b817e..481115d8520f 100644 --- a/doc/host_config_schema/cchost_config.json +++ b/doc/host_config_schema/cchost_config.json @@ -566,7 +566,7 @@ "max_uncommitted_tx_count": { "type": "integer", "default": 10000, - "description": "Maximum number of uncommitted transactions allowed before the primary refuses new transactions" + "description": "Maximum number of uncommitted transactions allowed before the primary refuses new transactions. Unlimited if set to 0." } }, "description": "This section includes configuration for the consensus protocol (note: should be the same for all other nodes in the service)", From efbf50d07b64ce99b91b428b73f942af8c54c106 Mon Sep 17 00:00:00 2001 From: Amaury Chamayou Date: Thu, 28 Sep 2023 16:29:06 +0100 Subject: [PATCH 10/11] Update CHANGELOG.md Co-authored-by: Eddy Ashton --- CHANGELOG.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 95bd4fd03184..015bf145b3e3 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -9,7 +9,7 @@ and this project adheres to [Semantic Versioning](http://semver.org/spec/v2.0.0. [5.0.0-dev3]: https://github.com/microsoft/CCF/releases/tag/ccf-5.0.0-dev3 -- Added a `consensus.max_uncommitted_tx_count` configuration option, which if set specifies the maximum number of transactions that can be pending on the primary. When that threshold is exceeded, a `503 Service Unavailable` is temporarily returned on all but the `/node/*` paths (#5692). +- Added a `consensus.max_uncommitted_tx_count` configuration option, which specifies the maximum number of transactions that can be pending on the primary. When that threshold is exceeded, a `503 Service Unavailable` is temporarily returned on all but the `/node/*` paths (#5692). ## [5.0.0-dev2] From 89ebc7c1eae02f52fed29f3e198e006129024413 Mon Sep 17 00:00:00 2001 From: Amaury Chamayou Date: Thu, 28 Sep 2023 15:37:21 +0000 Subject: [PATCH 11/11] Remove now redundant plot --- tests/infra/basicperf.py | 10 ---------- 1 file changed, 10 deletions(-) diff --git a/tests/infra/basicperf.py b/tests/infra/basicperf.py index d5c0b6f45426..963390aaff9d 100644 --- a/tests/infra/basicperf.py +++ b/tests/infra/basicperf.py @@ -564,11 +564,6 @@ def table(): .sort("second") .fill_null(0) ) - print(per_sec) - per_sec = per_sec.with_columns( - sent_rate=pl.col("sent") / per_sec["sent"].max(), - rcvd_rate=pl.col("rcvd") / per_sec["rcvd"].max(), - ) plt.simple_bar( list(per_sec["second"]), @@ -588,11 +583,6 @@ def table(): ) plt.show() - for row in per_sec.iter_rows(named=True): - s = "S" * int(row["sent_rate"] * 20) - r = "R" * int(row["rcvd_rate"] * 20) - print(f"{row['second']:>3}: {s:>20}|{r:<20}") - if number_of_errors and not args.stop_primary_after_s: raise RuntimeError( f"Errors: {number_of_errors} ({number_of_errors / total_number_of_requests * 100:.2f}%)"