Skip to content

Commit

Permalink
tests: added test validating status reporting consistency after upgrade
Browse files Browse the repository at this point in the history
Signed-off-by: Michal Maslanka <michal@redpanda.com>
  • Loading branch information
mmaslankaprv committed Aug 29, 2023
1 parent 78472e3 commit 8df8a3a
Showing 1 changed file with 53 additions and 1 deletion.
54 changes: 53 additions & 1 deletion tests/rptest/tests/nodes_decommissioning_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,7 @@
from time import sleep
from rptest.clients.default import DefaultClient
from rptest.services.kgo_verifier_services import KgoVerifierConsumerGroupConsumer, KgoVerifierProducer
from rptest.services.redpanda_installer import RedpandaInstaller
from rptest.tests.prealloc_nodes import PreallocNodesTest

from rptest.utils.mode_checks import skip_debug_mode
Expand Down Expand Up @@ -165,14 +166,23 @@ def _state_consistent():
brokers = self.admin.get_brokers(n)
config_ids = [s['node_id'] for s in cfg_status]
brokers_ids = [b['node_id'] for b in brokers]
self.logger.info(
f"broker_ids: {brokers_ids}, ids from configuration status: {config_ids}"
)
if sorted(brokers_ids) != sorted(config_ids):
return False
if decommissioned_id in brokers_ids:
return False

return True

wait_until(_state_consistent, 10, 1)
wait_until(
_state_consistent,
10,
1,
err_msg=
"Timeout waiting for nodes reported from configuration and cluster state to be consistent"
)

def _wait_for_node_removed(self, decommissioned_id):

Expand Down Expand Up @@ -828,6 +838,48 @@ def tried_to_join():

assert len(self.admin.get_brokers(node=self.redpanda.nodes[0])) == 5

@cluster(
num_nodes=6,
# A decom can look like a restart in terms of logs from peers dropping
# connections with it
log_allow_list=RESTART_LOG_ALLOW_LIST)
def test_decommissioning_and_upgrade(self):
self.installer = self.redpanda._installer
# upgrade from previous to current version
versions = [
self.installer.highest_from_prior_feature_version(
RedpandaInstaller.HEAD), RedpandaInstaller.HEAD
]
to_decommission = None
to_decommission_id = None
for v in self.upgrade_through_versions(versions_in=versions,
auto_assign_node_id=True):
if v == versions[0]:
self._create_topics()

self.start_producer()
self.start_consumer()
# decommission node
to_decommission = self.redpanda.nodes[-1]
to_decommission_id = self.redpanda.node_id(to_decommission)
self.logger.info(f"decommissioning node: {to_decommission_id}")
self._decommission(to_decommission_id)

self._wait_for_node_removed(to_decommission_id)
self.redpanda.stop_node(to_decommission)
self.redpanda.clean_node(to_decommission,
preserve_logs=True,
preserve_current_install=True)
self.redpanda.start_node(to_decommission,
auto_assign_node_id=True)
# refresh node ids for rolling restarter
self.redpanda.node_id(to_decommission, force_refresh=True)

# check that the nodes reported from configuration status and
# brokers endpoint is consistent

self._check_state_consistent(to_decommission_id)


class NodeDecommissionFailureReportingTest(RedpandaTest):
def __init__(self, *args, **kwargs):
Expand Down

0 comments on commit 8df8a3a

Please sign in to comment.