From 20937149a59d9dee5968180ead258f2da1ad9f6d Mon Sep 17 00:00:00 2001 From: Eugene Date: Wed, 18 Dec 2024 10:28:14 +0100 Subject: [PATCH] fix(nemesis): filter raft-topology errors when starting/stopping nodes raft is generating the following errors: raft_topology - topology change coordinator fiber got error std::runtime_error when one of the nodes is stopped, it was decided we can safely ignore those errors fixes:9031 --- sdcm/nemesis.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/sdcm/nemesis.py b/sdcm/nemesis.py index 4d240a3262..6b813f7838 100644 --- a/sdcm/nemesis.py +++ b/sdcm/nemesis.py @@ -672,6 +672,7 @@ def _kill_scylla_daemon(self): self.target_node.wait_jmx_up() self.cluster.wait_for_schema_agreement() + @decorate_with_context(ignore_raft_topology_cmd_failing) @target_all_nodes def disrupt_stop_wait_start_scylla_server(self, sleep_time=300): # pylint: disable=invalid-name self.target_node.stop_scylla_server(verify_up=False, verify_down=True) @@ -1140,7 +1141,7 @@ def get_all_sstables(self, tables: list[str], node: BaseNode = None): return sstables - @decorate_with_context(ignore_ycsb_connection_refused) + @decorate_with_context([ignore_ycsb_connection_refused, ignore_raft_topology_cmd_failing]) def _destroy_data_and_restart_scylla(self, keyspaces_for_destroy: list = None, sstables_to_destroy_perc: int = 50): # pylint: disable=too-many-statements tables = self.cluster.get_non_system_ks_cf_list(db_node=self.target_node, filter_empty_tables=False, filter_by_keyspace=keyspaces_for_destroy) @@ -1360,7 +1361,7 @@ def _add_and_init_new_cluster_nodes(self, count, timeout=MAX_TIME_WAIT_FOR_NEW_N InfoEvent(message="FinishEvent - New Nodes are up and normal").publish() return new_nodes - @decorate_with_context(ignore_ycsb_connection_refused) + @decorate_with_context([ignore_ycsb_connection_refused, ignore_raft_topology_cmd_failing]) def _terminate_cluster_node(self, node): self.cluster.terminate_node(node) self.monitoring_set.reconfigure_scylla_monitoring() @@ -1683,7 +1684,7 @@ def wait_for_old_node_to_removed(): new_node.set_seed_flag(True) self.cluster.update_seed_provider() - @decorate_with_context(ignore_ycsb_connection_refused) + @decorate_with_context([ignore_ycsb_connection_refused, ignore_raft_topology_cmd_failing]) @target_all_nodes def disrupt_kill_scylla(self): self._kill_scylla_daemon()