From a8abaedc7ec8cf4e8dfb0411ab33558d46138815 Mon Sep 17 00:00:00 2001 From: driftluo Date: Wed, 24 Mar 2021 15:29:40 +0800 Subject: [PATCH 1/2] feat: disable penalty when download nodes are scarce --- sync/src/tests/inflight_blocks.rs | 2 ++ sync/src/types/mod.rs | 45 ++++++++++++++++++++++++------- test/src/specs/sync/get_blocks.rs | 6 ++--- 3 files changed, 41 insertions(+), 12 deletions(-) diff --git a/sync/src/tests/inflight_blocks.rs b/sync/src/tests/inflight_blocks.rs index a2732e99bf..64d97ad49c 100644 --- a/sync/src/tests/inflight_blocks.rs +++ b/sync/src/tests/inflight_blocks.rs @@ -94,6 +94,7 @@ fn inflight_blocks_timeout() { let faketime_file = faketime::millis_tempfile(0).expect("create faketime file"); faketime::enable(&faketime_file); let mut inflight_blocks = InflightBlocks::default(); + inflight_blocks.protect_num = 0; assert!(inflight_blocks.insert(1.into(), (1, h256!("0x1").pack()).into())); assert!(inflight_blocks.insert(1.into(), (2, h256!("0x2").pack()).into())); @@ -147,6 +148,7 @@ fn inflight_trace_number_state() { faketime::enable(&faketime_file); let mut inflight_blocks = InflightBlocks::default(); + inflight_blocks.protect_num = 0; assert!(inflight_blocks.insert(1.into(), (1, h256!("0x1").pack()).into())); assert!(inflight_blocks.insert(2.into(), (2, h256!("0x2").pack()).into())); diff --git a/sync/src/types/mod.rs b/sync/src/types/mod.rs index 121445fb19..e9bc0609c2 100644 --- a/sync/src/types/mod.rs +++ b/sync/src/types/mod.rs @@ -7,8 +7,8 @@ use ckb_chain_spec::consensus::Consensus; use ckb_constant::sync::{ BLOCK_DOWNLOAD_TIMEOUT, HEADERS_DOWNLOAD_HEADERS_PER_SECOND, HEADERS_DOWNLOAD_INSPECT_WINDOW, HEADERS_DOWNLOAD_TOLERABLE_BIAS_FOR_SINGLE_SAMPLE, INIT_BLOCKS_IN_TRANSIT_PER_PEER, - MAX_BLOCKS_IN_TRANSIT_PER_PEER, MAX_HEADERS_LEN, POW_INTERVAL, RETRY_ASK_TX_TIMEOUT_INCREASE, - SUSPEND_SYNC_TIME, + MAX_BLOCKS_IN_TRANSIT_PER_PEER, MAX_HEADERS_LEN, MAX_OUTBOUND_PEERS_TO_PROTECT_FROM_DISCONNECT, + POW_INTERVAL, RETRY_ASK_TX_TIMEOUT_INCREASE, SUSPEND_SYNC_TIME, }; use ckb_error::AnyError; use ckb_logger::{debug, debug_target, error, trace}; @@ -565,6 +565,7 @@ pub struct InflightBlocks { pub(crate) restart_number: BlockNumber, time_analyzer: TimeAnalyzer, pub(crate) adjustment: bool, + pub(crate) protect_num: usize, } impl Default for InflightBlocks { @@ -577,6 +578,7 @@ impl Default for InflightBlocks { restart_number: 0, time_analyzer: TimeAnalyzer::default(), adjustment: true, + protect_num: MAX_OUTBOUND_PEERS_TO_PROTECT_FROM_DISCONNECT, } } } @@ -683,6 +685,16 @@ impl InflightBlocks { pub fn prune(&mut self, tip: BlockNumber) -> HashSet { let now = unix_time_as_millis(); let mut disconnect_list = HashSet::new(); + // Since statistics are currently disturbed by the processing block time, when the number + // of transactions increases, the node will be accidentally evicted. + // + // Especially on machines with poor CPU performance, the node connection will be frequently + // disconnected due to statistics. + // + // In order to protect the decentralization of the network and ensure the survival of low-performance + // nodes, the penalty mechanism will be closed when the number of download nodes is less than the number of protected nodes + let should_punish = self.download_schedulers.len() > self.protect_num; + let adjustment = self.adjustment; let trace = &mut self.trace_number; let download_schedulers = &mut self.download_schedulers; @@ -702,7 +714,9 @@ impl InflightBlocks { if value.timestamp + BLOCK_DOWNLOAD_TIMEOUT < now { if let Some(set) = download_schedulers.get_mut(&value.peer) { set.hashes.remove(key); - set.punish(2); + if should_punish { + set.punish(2); + } }; if !trace.is_empty() { trace.remove(&key); @@ -742,13 +756,17 @@ impl InflightBlocks { if now > 1000 + *time { if let Some(state) = states.remove(key) { if let Some(d) = download_schedulers.get_mut(&state.peer) { - d.punish(1); + if should_punish { + d.punish(1); + } d.hashes.remove(key); }; } else if let Some(v) = compact_inflight.remove(&key.hash) { - for peer in v { - if let Some(d) = download_schedulers.get_mut(&peer) { - d.punish(1); + if should_punish && adjustment { + for peer in v { + if let Some(d) = download_schedulers.get_mut(&peer) { + d.punish(1); + } } } } @@ -817,6 +835,7 @@ impl InflightBlocks { } pub fn remove_by_block(&mut self, block: BlockNumberAndHash) -> bool { + let should_punish = self.download_schedulers.len() > self.protect_num; let download_schedulers = &mut self.download_schedulers; let trace = &mut self.trace_number; let compact = &mut self.compact_reconstruct_inflight; @@ -835,8 +854,16 @@ impl InflightBlocks { match time_analyzer.push_time(elapsed) { TimeQuantile::MinToFast => set.increase(2), TimeQuantile::FastToNormal => set.increase(1), - TimeQuantile::NormalToUpper => set.decrease(1), - TimeQuantile::UpperToMax => set.decrease(2), + TimeQuantile::NormalToUpper => { + if should_punish { + set.decrease(1) + } + } + TimeQuantile::UpperToMax => { + if should_punish { + set.decrease(2) + } + } } } if !trace.is_empty() { diff --git a/test/src/specs/sync/get_blocks.rs b/test/src/specs/sync/get_blocks.rs index 855bab3bb0..843c836420 100644 --- a/test/src/specs/sync/get_blocks.rs +++ b/test/src/specs/sync/get_blocks.rs @@ -53,14 +53,14 @@ impl Spec for GetBlocksTimeout { let received = wait_get_blocks_point(&net, &node1, block_download_timeout_secs * 2, 1); assert!( - received.is_none(), - "Should not received GetBlocks anymore, the timeout could be any number." + received.is_some(), + "Should received GetBlocks anymore, the timeout could be any number." ); let rpc_client = node1.rpc_client(); let result = wait_until(10, || { let peers = rpc_client.get_peers(); - peers.is_empty() + !peers.is_empty() }); if !result { panic!("node1 must disconnect net"); From 34055d60069fcc86286a3e595e230317f68c7fc1 Mon Sep 17 00:00:00 2001 From: driftluo Date: Wed, 24 Mar 2021 15:39:53 +0800 Subject: [PATCH 2/2] feat: allow the protection node to be disconnected due to sync judgment --- sync/src/synchronizer/mod.rs | 7 ++++++- test/src/specs/sync/get_blocks.rs | 4 ++-- 2 files changed, 8 insertions(+), 3 deletions(-) diff --git a/sync/src/synchronizer/mod.rs b/sync/src/synchronizer/mod.rs index 2ebbc853dd..5c45a83758 100644 --- a/sync/src/synchronizer/mod.rs +++ b/sync/src/synchronizer/mod.rs @@ -576,10 +576,15 @@ impl Synchronizer { }; for peer in disconnect_list.iter() { + // It is not forbidden to evict protected nodes: + // - First of all, this node is not designated by the user for protection, + // but is connected randomly. It does not represent the will of the user + // - Secondly, in the synchronization phase, the nodes with zero download tasks are + // retained, apart from reducing the download efficiency, there is no benefit. if self .peers() .get_flag(*peer) - .map(|flag| flag.is_whitelist || flag.is_protect) + .map(|flag| flag.is_whitelist) .unwrap_or(false) { continue; diff --git a/test/src/specs/sync/get_blocks.rs b/test/src/specs/sync/get_blocks.rs index 843c836420..69c83d7a1b 100644 --- a/test/src/specs/sync/get_blocks.rs +++ b/test/src/specs/sync/get_blocks.rs @@ -54,7 +54,7 @@ impl Spec for GetBlocksTimeout { let received = wait_get_blocks_point(&net, &node1, block_download_timeout_secs * 2, 1); assert!( received.is_some(), - "Should received GetBlocks anymore, the timeout could be any number." + "in the case of sparse connections, even if download times out, net should continue to receive GetBlock requests" ); let rpc_client = node1.rpc_client(); @@ -63,7 +63,7 @@ impl Spec for GetBlocksTimeout { !peers.is_empty() }); if !result { - panic!("node1 must disconnect net"); + panic!("node1 must not disconnect net"); } } }