Refactor in replicate #2723

Closed · wants to merge 4 commits
97 changes: 50 additions & 47 deletions ant-networking/src/cmd.rs
@@ -993,7 +993,7 @@
pub(crate) fn record_node_issue(&mut self, peer_id: PeerId, issue: NodeIssue) {
info!("Peer {peer_id:?} is reported as having issue {issue:?}");
let (issue_vec, is_bad) = self.bad_nodes.entry(peer_id).or_default();
let mut new_bad_behaviour = None;
let mut _new_bad_behaviour = None;
let mut is_connection_issue = false;

// If being considered as bad already, skip certain operations
@@ -1033,7 +1033,7 @@
} else {
*is_bad = true;
}
new_bad_behaviour = Some(issue.clone());
_new_bad_behaviour = Some(issue.clone());
info!("Peer {peer_id:?} accumulated {issue_counts} times of issue {issue:?}. Consider it as a bad node now.");
// Once a bad behaviour detected, no point to continue
break;
@@ -1049,53 +1049,56 @@
if let Some(dead_peer) = self.swarm.behaviour_mut().kademlia.remove_peer(&peer_id) {
self.update_on_peer_removal(*dead_peer.node.key.preimage());
}
return;
// TODO: re-enable once confirmed with upscale test
// return;
}

if *is_bad {
info!("Evicting bad peer {peer_id:?} from RT.");
if let Some(dead_peer) = self.swarm.behaviour_mut().kademlia.remove_peer(&peer_id) {
self.update_on_peer_removal(*dead_peer.node.key.preimage());
}

if let Some(bad_behaviour) = new_bad_behaviour {
// inform the bad node about it and add to the blocklist after that (not for connection issues)
self.record_metrics(Marker::PeerConsideredAsBad { bad_peer: &peer_id });

warn!("Peer {peer_id:?} is considered as bad due to {bad_behaviour:?}. Informing the peer and adding to blocklist.");
// response handling
let (tx, rx) = oneshot::channel();
let local_swarm_cmd_sender = self.local_cmd_sender.clone();
tokio::spawn(async move {
match rx.await {
Ok(result) => {
debug!("Got response for Cmd::PeerConsideredAsBad from {peer_id:?} {result:?}");
if let Err(err) = local_swarm_cmd_sender
.send(LocalSwarmCmd::AddPeerToBlockList { peer_id })
.await
{
error!("SwarmDriver failed to send LocalSwarmCmd: {err}");
}
}
Err(err) => {
error!("Failed to get response from one shot channel for Cmd::PeerConsideredAsBad : {err:?}");
}
}
});

// request
let request = Request::Cmd(Cmd::PeerConsideredAsBad {
detected_by: NetworkAddress::from_peer(self.self_peer_id),
bad_peer: NetworkAddress::from_peer(peer_id),
bad_behaviour: bad_behaviour.to_string(),
});
self.queue_network_swarm_cmd(NetworkSwarmCmd::SendRequest {
req: request,
peer: peer_id,
sender: Some(tx),
});
}
}
// Disable disconnection and blocking triggered by issues other than connection issues.
// TODO: re-enable once confirmed with upscale test
// if *is_bad {
// info!("Evicting bad peer {peer_id:?} from RT.");
// if let Some(dead_peer) = self.swarm.behaviour_mut().kademlia.remove_peer(&peer_id) {
// self.update_on_peer_removal(*dead_peer.node.key.preimage());
// }

// if let Some(bad_behaviour) = new_bad_behaviour {
// // inform the bad node about it and add to the blocklist after that (not for connection issues)
// self.record_metrics(Marker::PeerConsideredAsBad { bad_peer: &peer_id });

// warn!("Peer {peer_id:?} is considered as bad due to {bad_behaviour:?}. Informing the peer and adding to blocklist.");
// // response handling
// let (tx, rx) = oneshot::channel();
// let local_swarm_cmd_sender = self.local_cmd_sender.clone();
// tokio::spawn(async move {
// match rx.await {
// Ok(result) => {
// debug!("Got response for Cmd::PeerConsideredAsBad from {peer_id:?} {result:?}");
// if let Err(err) = local_swarm_cmd_sender
// .send(LocalSwarmCmd::AddPeerToBlockList { peer_id })
// .await
// {
// error!("SwarmDriver failed to send LocalSwarmCmd: {err}");
// }
// }
// Err(err) => {
// error!("Failed to get response from one shot channel for Cmd::PeerConsideredAsBad : {err:?}");
// }
// }
// });

// // request
// let request = Request::Cmd(Cmd::PeerConsideredAsBad {
// detected_by: NetworkAddress::from_peer(self.self_peer_id),
// bad_peer: NetworkAddress::from_peer(peer_id),
// bad_behaviour: bad_behaviour.to_string(),
// });
// self.queue_network_swarm_cmd(NetworkSwarmCmd::SendRequest {
// req: request,
// peer: peer_id,
// sender: Some(tx),
// });
// }
// }
}

fn verify_peer_quote(&mut self, peer_id: PeerId, quote: PaymentQuote) {
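In effect, this hunk keeps only the bookkeeping: issues are still recorded per peer, the bad flag is still set after repeated offences, and connection-issue peers are still removed from the routing table, while the early return, the eviction of other bad peers, and the `PeerConsideredAsBad`/blocklist round-trip are parked behind a TODO. Below is a minimal sketch of the retained flow, using simplified stand-in types and an illustrative three-strikes count rather than the crate's real `SwarmDriver`/`PeerId` API.

```rust
// Simplified sketch (hypothetical types): what record_node_issue still does
// after this PR. Eviction and blocklisting for non-connection issues are the
// parts left out, mirroring the commented-out block above.
use std::collections::HashMap;

#[derive(Clone, Debug, PartialEq)]
enum NodeIssue {
    ConnectionIssue,
    FailedChunkProof,
}

#[derive(Default)]
struct IssueTracker {
    // peer id -> (recorded issues, "considered bad" flag)
    bad_nodes: HashMap<u64, (Vec<NodeIssue>, bool)>,
    routing_table: Vec<u64>,
}

impl IssueTracker {
    fn record_node_issue(&mut self, peer: u64, issue: NodeIssue) {
        let (issues, is_bad) = self.bad_nodes.entry(peer).or_default();
        issues.push(issue.clone());

        // Accumulate: repeated occurrences of the same issue mark the peer as bad.
        let strikes = issues.iter().filter(|i| **i == issue).count();
        if strikes >= 3 {
            *is_bad = true;
        }

        // Connection issues still lead to removal from the routing table, but the
        // early return and the eviction/blocklist path for other bad behaviour
        // are skipped in this PR.
        if issue == NodeIssue::ConnectionIssue {
            self.routing_table.retain(|p| p != &peer);
        }
    }
}

fn main() {
    let mut tracker = IssueTracker { routing_table: vec![1, 2], ..Default::default() };
    tracker.record_node_issue(1, NodeIssue::ConnectionIssue);
    assert!(!tracker.routing_table.contains(&1));
    for _ in 0..3 {
        tracker.record_node_issue(2, NodeIssue::FailedChunkProof);
    }
    assert!(tracker.bad_nodes[&2].1); // flagged as bad, but still kept in the routing table
    assert!(tracker.routing_table.contains(&2));
}
```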
1 change: 1 addition & 0 deletions ant-networking/src/driver.rs
@@ -699,6 +699,7 @@ pub struct SwarmDriver {
pub(crate) metrics_recorder: Option<NetworkMetricsRecorder>,

network_cmd_sender: mpsc::Sender<NetworkSwarmCmd>,
#[allow(dead_code)]
pub(crate) local_cmd_sender: mpsc::Sender<LocalSwarmCmd>,
local_cmd_receiver: mpsc::Receiver<LocalSwarmCmd>,
network_cmd_receiver: mpsc::Receiver<NetworkSwarmCmd>,
1 change: 1 addition & 0 deletions ant-networking/src/log_markers.rs
@@ -22,6 +22,7 @@ pub enum Marker<'a> {
/// Quoting metrics
QuotingMetrics { quoting_metrics: &'a QuotingMetrics },
/// The peer has been considered as bad
#[allow(dead_code)]
PeerConsideredAsBad { bad_peer: &'a PeerId },
/// We have been flagged as a bad node by a peer.
FlaggedAsBadNode { flagged_by: &'a PeerId },
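The `driver.rs` and `log_markers.rs` hunks only add `#[allow(dead_code)]`, since the sole users of `local_cmd_sender` and `Marker::PeerConsideredAsBad` now sit inside the commented-out block above, presumably to keep the build warning-free. A tiny, hypothetical illustration of the pattern:

```rust
// Hypothetical illustration: once every call site is commented out, rustc
// reports "field is never read" / "enum is never used" unless the item is
// annotated with #[allow(dead_code)].
struct Driver {
    #[allow(dead_code)]
    local_cmd_sender: String, // stand-in for the mpsc::Sender kept for later re-enablement
}

#[allow(dead_code)]
enum Marker {
    PeerConsideredAsBad,
}

fn main() {
    let _driver = Driver {
        local_cmd_sender: String::new(),
    };
}
```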
32 changes: 17 additions & 15 deletions ant-networking/src/replication_fetcher.rs
@@ -21,7 +21,7 @@ use std::collections::{hash_map::Entry, BTreeMap, HashMap, HashSet, VecDeque};
use tokio::{sync::mpsc, time::Duration};

// Max parallel fetches that can be undertaken at the same time.
const MAX_PARALLEL_FETCH: usize = K_VALUE.get();
const MAX_PARALLEL_FETCH: usize = K_VALUE.get() / 2;

// The duration after which a peer will be considered failed to fetch data from,
// if no response got from that peer.
@@ -495,20 +495,22 @@ impl ReplicationFetcher {
// * Some(true) : peer is trustworthy
// * Some(false) : peer is not trustworthy
// * None : not having enough knowledge to tell
fn is_peer_trustworthy(&self, holder: &PeerId) -> Option<bool> {
if let Some((scores, _last_seen)) = self.peers_scores.get(holder) {
if scores.len() > 1 {
let is_healthy = scores.iter().filter(|is_health| **is_health).count() > 1;
if !is_healthy {
info!("Peer {holder:?} is not a trustworthy replication source, as bearing scores of {scores:?}");
}
Some(is_healthy)
} else {
None
}
} else {
None
}
fn is_peer_trustworthy(&self, _holder: &PeerId) -> Option<bool> {
// TODO: re-enable once confirmed with upscaled test
Some(true)
// if let Some((scores, _last_seen)) = self.peers_scores.get(holder) {
// if scores.len() > 1 {
// let is_healthy = scores.iter().filter(|is_health| **is_health).count() >= 1;
// if !is_healthy {
// info!("Peer {holder:?} is not a trustworthy replication source, as bearing scores of {scores:?}");
// }
// Some(is_healthy)
// } else {
// None
// }
// } else {
// None
// }
}

// Just remove outdated entries in `on_going_fetch`, indicates a failure to fetch from network.
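Two behavioural changes land in this file: the fetch concurrency cap drops from `K_VALUE` to `K_VALUE / 2` (10, assuming libp2p's default `K_VALUE` of 20), and `is_peer_trustworthy` now answers `Some(true)` unconditionally instead of consulting the per-peer health scores. For reference, below is a hedged sketch of the score-based check that the commented-out block would restore, using simplified types; note that the commented-out variant also relaxes the healthy-count test from `> 1` to `>= 1`.

```rust
// Simplified sketch of the score-based trust check this PR bypasses.
// `peers_scores` maps a peer to its recent health observations; the real code
// keys by PeerId and also tracks a last-seen instant.
use std::collections::HashMap;

struct ReplicationFetcher {
    peers_scores: HashMap<u64, (Vec<bool>, ())>,
}

impl ReplicationFetcher {
    // Some(true)  : peer is trustworthy
    // Some(false) : peer is not trustworthy
    // None        : not enough observations to tell
    fn is_peer_trustworthy(&self, holder: &u64) -> Option<bool> {
        let (scores, _last_seen) = self.peers_scores.get(holder)?;
        if scores.len() > 1 {
            // Healthy if more than one recent observation was good
            // (the commented-out variant in the diff would accept "at least one").
            Some(scores.iter().filter(|healthy| **healthy).count() > 1)
        } else {
            None
        }
    }
}

fn main() {
    let mut peers_scores = HashMap::new();
    peers_scores.insert(7u64, (vec![true, false, true], ()));
    peers_scores.insert(8u64, (vec![false, false], ()));
    let fetcher = ReplicationFetcher { peers_scores };
    assert_eq!(fetcher.is_peer_trustworthy(&7), Some(true));
    assert_eq!(fetcher.is_peer_trustworthy(&8), Some(false));
    assert_eq!(fetcher.is_peer_trustworthy(&9), None);
}
```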
2 changes: 1 addition & 1 deletion ant-node/src/node.rs
@@ -69,7 +69,7 @@ const HIGHEST_SCORE: usize = 100;

/// Any nodes bearing a score below this shall be considered as bad.
/// Max is to be 100 * 100
const MIN_ACCEPTABLE_HEALTHY_SCORE: usize = 3000;
const MIN_ACCEPTABLE_HEALTHY_SCORE: usize = 1000;

/// in ms, expecting average StorageChallenge complete time to be around 250ms.
const TIME_STEP: usize = 20;
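The node-side change relaxes what counts as healthy: with `HIGHEST_SCORE = 100` and the stated maximum of `100 * 100 = 10_000`, lowering `MIN_ACCEPTABLE_HEALTHY_SCORE` from 3_000 to 1_000 means a peer now needs only 10% of the maximum score (rather than 30%) to avoid being treated as bad. A small arithmetic sketch follows; the direction of the comparison is an assumption based on the constant's doc comment.

```rust
// Hedged sketch: how the lowered threshold changes the verdict for a given
// accumulated score ("any nodes bearing a score below this shall be
// considered as bad").
const HIGHEST_SCORE: usize = 100;
const MAX_SCORE: usize = 100 * HIGHEST_SCORE; // 10_000, per the doc comment
const OLD_MIN_ACCEPTABLE_HEALTHY_SCORE: usize = 3_000;
const NEW_MIN_ACCEPTABLE_HEALTHY_SCORE: usize = 1_000;

fn is_bad(score: usize, threshold: usize) -> bool {
    score < threshold
}

fn main() {
    let score = 2_500; // 25% of MAX_SCORE
    assert!(is_bad(score, OLD_MIN_ACCEPTABLE_HEALTHY_SCORE)); // bad under the old 30% bar
    assert!(!is_bad(score, NEW_MIN_ACCEPTABLE_HEALTHY_SCORE)); // acceptable under the new 10% bar
    assert_eq!(MAX_SCORE, 10_000);
}
```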