From b2cd1ca13c1d4ceecd0fb2eed157ee2770e4b4c5 Mon Sep 17 00:00:00 2001
From: Liapkovich
Date: Mon, 10 Jun 2024 14:26:22 +0200
Subject: [PATCH] test(manager): introduce test for mixed db (vnodes + tablets)

The new test performs sanity checks for a cluster that uses vnodes-based
and tablets-based keyspaces simultaneously.
---
 ...buntu22-manager-vnodes-tablets.jenkinsfile | 17 +++++
 mgmt_cli_test.py                              | 63 +++++++++++++------
 2 files changed, 62 insertions(+), 18 deletions(-)
 create mode 100644 jenkins-pipelines/manager/ubuntu22-manager-vnodes-tablets.jenkinsfile

diff --git a/jenkins-pipelines/manager/ubuntu22-manager-vnodes-tablets.jenkinsfile b/jenkins-pipelines/manager/ubuntu22-manager-vnodes-tablets.jenkinsfile
new file mode 100644
index 0000000000..67cd9f8b07
--- /dev/null
+++ b/jenkins-pipelines/manager/ubuntu22-manager-vnodes-tablets.jenkinsfile
@@ -0,0 +1,17 @@
+#!groovy
+
+// trick from https://github.com/jenkinsci/workflow-cps-global-lib-plugin/pull/43
+def lib = library identifier: 'sct@snapshot', retriever: legacySCM(scm)
+
+managerPipeline(
+    backend: 'aws',
+    region: 'us-east-1',
+    test_name: 'mgmt_cli_test.MgmtCliTest.test_manager_sanity_vnodes_tablets_cluster',
+    test_config: 'test-cases/manager/manager-regression-singleDC-set-distro.yaml',
+
+    scylla_version: '6.0',
+
+    post_behavior_db_nodes: 'destroy',
+    post_behavior_loader_nodes: 'destroy',
+    post_behavior_monitor_nodes: 'destroy',
+)
diff --git a/mgmt_cli_test.py b/mgmt_cli_test.py
index d4f510a6cc..26bbbcf416 100644
--- a/mgmt_cli_test.py
+++ b/mgmt_cli_test.py
@@ -42,6 +42,7 @@
 from sdcm.sct_events.group_common_events import ignore_no_space_errors, ignore_stream_mutation_fragments_errors
 from sdcm.utils.gce_utils import get_gce_storage_client
 from sdcm.utils.azure_utils import AzureService
+from sdcm.utils.tablets.common import TabletsConfiguration
 from sdcm.exceptions import FilesNotCorrupted
 
 
@@ -172,21 +173,24 @@ def restore_backup_from_backup_task(self, mgr_cluster, backup_task, keyspace_and
                                             keyspace_and_table_list=keyspace_and_table_list)
 
     # pylint: disable=too-many-arguments
-    def verify_backup_success(self, mgr_cluster, backup_task, keyspace_name='keyspace1', tables_names=None,
+    def verify_backup_success(self, mgr_cluster, backup_task, ks_names: list = None, tables_names: list = None,
                               truncate=True, restore_data_with_task=False, timeout=None):
+        if ks_names is None:
+            ks_names = ['keyspace1']
         if tables_names is None:
             tables_names = ['standard1']
-        per_keyspace_tables_dict = {keyspace_name: tables_names}
+        ks_tables_map = {keyspace: tables_names for keyspace in ks_names}
         if truncate:
-            for table_name in tables_names:
-                self.log.info(f'running truncate on {keyspace_name}.{table_name}')
-                self.db_cluster.nodes[0].run_cqlsh(f'TRUNCATE {keyspace_name}.{table_name}')
+            for ks, tables in ks_tables_map.items():
+                for table_name in tables:
+                    self.log.info(f'running truncate on {ks}.{table_name}')
+                    self.db_cluster.nodes[0].run_cqlsh(f'TRUNCATE {ks}.{table_name}')
         if restore_data_with_task:
             self.restore_backup_with_task(mgr_cluster=mgr_cluster, snapshot_tag=backup_task.get_snapshot_tag(),
                                           timeout=timeout, restore_data=True)
         else:
             self.restore_backup_from_backup_task(mgr_cluster=mgr_cluster, backup_task=backup_task,
-                                                 keyspace_and_table_list=per_keyspace_tables_dict)
+                                                 keyspace_and_table_list=ks_tables_map)
 
     def restore_backup_with_task(self, mgr_cluster, snapshot_tag, timeout, restore_schema=False, restore_data=False,
                                  location_list=None):
@@ -335,7 +339,7 @@ def _create_keyspace_and_basic_table(self, keyspace_name, table_name="example_ta
self.log.info("creating the table {} in the keyspace {}".format(table_name, keyspace_name)) self.create_table(table_name, keyspace_name=keyspace_name) - def test_manager_sanity(self): + def test_manager_sanity(self, prepared_ks: bool = False, ks_names: list = None): """ Test steps: 1) Run the repair test. @@ -343,11 +347,12 @@ def test_manager_sanity(self): 3) test_mgmt_cluster_healthcheck 4) test_client_encryption """ - self.generate_load_and_wait_for_results() + if not prepared_ks: + self.generate_load_and_wait_for_results() with self.subTest('Basic Backup Test'): - self.test_basic_backup() + self.test_basic_backup(ks_names=ks_names) with self.subTest('Restore Backup Test'): - self.test_restore_backup_with_task() + self.test_restore_backup_with_task(ks_names=ks_names) with self.subTest('Repair Multiple Keyspace Types'): self.test_repair_multiple_keyspace_types() with self.subTest('Mgmt Cluster CRUD'): @@ -364,6 +369,26 @@ def test_manager_sanity(self): # Since this test activates encryption, it has to be the last test in the sanity self.test_client_encryption() + def test_manager_sanity_vnodes_tablets_cluster(self): + """ + Test steps: + 1) Create tablets keyspace and propagate some data. + 2) Create vnodes keyspace and propagate some data. + 3) Run sanity test (test_manager_sanity). + """ + self.log.info('starting test_manager_sanity_vnodes_tablets_cluster') + + ks_config = [("tablets_keyspace", True), ("vnodes_keyspace", False)] + ks_names = [i[0] for i in ks_config] + for ks_name, tablets_enabled in ks_config: + tablets_config = TabletsConfiguration(enabled=tablets_enabled) + self.create_keyspace(ks_name, replication_factor=3, tablets_config=tablets_config) + self.generate_load_and_wait_for_results(keyspace_name=ks_name) + + self.test_manager_sanity(prepared_ks=True, ks_names=ks_names) + + self.log.info('finishing test_manager_sanity_vnodes_tablets_cluster') + def test_repair_intensity_feature_on_multiple_node(self): self._repair_intensity_feature(fault_multiple_nodes=True) @@ -522,7 +547,7 @@ def create_ks_and_tables(self, num_ks, num_table): # self.populate_data_parallel() return table_name - def test_basic_backup(self): + def test_basic_backup(self, ks_names: list = None): self.log.info('starting test_basic_backup') manager_tool = mgmt.get_scylla_manager_tool(manager_node=self.monitors.nodes[0]) mgr_cluster = self._ensure_and_get_cluster(manager_tool) @@ -530,25 +555,27 @@ def test_basic_backup(self): backup_task_status = backup_task.wait_and_get_final_status(timeout=1500) assert backup_task_status == TaskStatus.DONE, \ f"Backup task ended in {backup_task_status} instead of {TaskStatus.DONE}" - self.verify_backup_success(mgr_cluster=mgr_cluster, backup_task=backup_task) - self.run_verification_read_stress() + self.verify_backup_success(mgr_cluster=mgr_cluster, backup_task=backup_task, ks_names=ks_names) + self.run_verification_read_stress(ks_names) mgr_cluster.delete() # remove cluster at the end of the test self.log.info('finishing test_basic_backup') - def test_restore_backup_with_task(self): + def test_restore_backup_with_task(self, ks_names: list = None): self.log.info('starting test_restore_backup_with_task') manager_tool = mgmt.get_scylla_manager_tool(manager_node=self.monitors.nodes[0]) mgr_cluster = self._ensure_and_get_cluster(manager_tool) - backup_task = mgr_cluster.create_backup_task(location_list=self.locations, keyspace_list=["keyspace1"]) + if not ks_names: + ks_names = ['keyspace1'] + backup_task = mgr_cluster.create_backup_task(location_list=self.locations, 
         backup_task_status = backup_task.wait_and_get_final_status(timeout=1500)
         assert backup_task_status == TaskStatus.DONE, \
             f"Backup task ended in {backup_task_status} instead of {TaskStatus.DONE}"
         soft_timeout = 36 * 60
         hard_timeout = 50 * 60
         with adaptive_timeout(Operations.MGMT_REPAIR, self.db_cluster.nodes[0], timeout=soft_timeout):
-            self.verify_backup_success(mgr_cluster=mgr_cluster, backup_task=backup_task, restore_data_with_task=True,
-                                       timeout=hard_timeout)
-        self.run_verification_read_stress()
+            self.verify_backup_success(mgr_cluster=mgr_cluster, backup_task=backup_task, ks_names=ks_names,
+                                       restore_data_with_task=True, timeout=hard_timeout)
+        self.run_verification_read_stress(ks_names)
         mgr_cluster.delete()  # remove cluster at the end of the test
         self.log.info('finishing test_restore_backup_with_task')
 
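Note for reviewers: the TabletsConfiguration(enabled=...) object used by the new
test controls the per-keyspace `tablets` replication option introduced in
Scylla 6.0. The sketch below (not part of the patch) shows the CQL this setup
is expected to boil down to; the helper name create_keyspace_cql and the
localhost contact point are assumptions for illustration only.

    # Minimal sketch, assuming a reachable Scylla 6.0 node and the
    # `scylla-driver` package (pip install scylla-driver); it mirrors the
    # mixed keyspace setup built by test_manager_sanity_vnodes_tablets_cluster.
    from cassandra.cluster import Cluster  # scylla-driver keeps the cassandra namespace

    def create_keyspace_cql(session, name: str, rf: int, tablets_enabled: bool) -> None:
        """Create a keyspace with tablets explicitly enabled or disabled."""
        enabled = 'true' if tablets_enabled else 'false'
        session.execute(
            f"CREATE KEYSPACE IF NOT EXISTS {name} "
            f"WITH replication = {{'class': 'NetworkTopologyStrategy', 'replication_factor': {rf}}} "
            f"AND tablets = {{'enabled': {enabled}}}"
        )

    if __name__ == '__main__':
        session = Cluster(['127.0.0.1']).connect()
        # One tablets-based and one vnodes-based keyspace, as in the test
        create_keyspace_cql(session, 'tablets_keyspace', rf=3, tablets_enabled=True)
        create_keyspace_cql(session, 'vnodes_keyspace', rf=3, tablets_enabled=False)

Running both CREATE KEYSPACE statements against the same cluster is what makes
the sanity flow exercise vnodes and tablets replication side by side.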