From 15a56930484d5f589b349fb6cd06e7aaaf07ebd6 Mon Sep 17 00:00:00 2001
From: Lakshmipathi
Date: Mon, 21 Oct 2024 16:29:50 +0530
Subject: [PATCH] full_storage_utilization_test: Storage utilization at 90% cluster size

Populate data until it reaches over 90% disk storage and perform db and cluster operations.

Signed-off-by: Lakshmipathi
---
 defaults/test_default.yaml | 3 +
 docs/configuration_options.md | 3 +
 full_storage_utilization_test.py | 237 ++++++++++++++++++
 .../oss/full-storage-utilization.jenkinsfile | 12 +
 sdcm/cluster.py | 8 +
 sdcm/sct_config.py | 8 +
 .../full-storage-utilization-scalein.yaml | 17 ++
 .../full-storage-utilization-scaleout.yaml | 17 ++
 8 files changed, 305 insertions(+)
 create mode 100644 full_storage_utilization_test.py
 create mode 100644 jenkins-pipelines/oss/full-storage-utilization.jenkinsfile
 create mode 100644 test-cases/scale/full-storage-utilization-scalein.yaml
 create mode 100644 test-cases/scale/full-storage-utilization-scaleout.yaml

diff --git a/defaults/test_default.yaml b/defaults/test_default.yaml
index 020b021033a..6e1a7352719 100644
--- a/defaults/test_default.yaml
+++ b/defaults/test_default.yaml
@@ -274,3 +274,6 @@ skip_test_stages: {}
 n_db_zero_token_nodes: 0
 zero_token_instance_type_db: 'i4i.large'
 use_zero_nodes: false
+# Storage utilization default values
+diskusage_softlimit: 70
+diskusage_hardlimit: 90
diff --git a/docs/configuration_options.md b/docs/configuration_options.md
index a5b868d6c63..8ea4f7c31b1 100644
--- a/docs/configuration_options.md
+++ b/docs/configuration_options.md
@@ -371,3 +371,6 @@
 | **n_db_zero_token_nodes** | Number of zero token nodes in cluster. Value should be set as "0 1 1"<br>for multidc configuration in same manner as 'n_db_nodes' and should be equal<br>number of regions | N/A | SCT_N_DB_ZERO_TOKEN_NODES
 | **zero_token_instance_type_db** | Instance type for zero token node | i4i.large | SCT_ZERO_TOKEN_INSTANCE_TYPE_DB
 | **use_zero_nodes** | If True, enable support in sct of zero nodes(configuration, nemesis) | false | SCT_USE_ZERO_NODES
+| **scaling_action_type** | Scaling action (scale_out or scale_in) to perform once disk usage reaches the hard limit | N/A | SCT_SCALING_ACTION_TYPE
+| **diskusage_softlimit** | Soft disk usage limit in percent; data is written until this usage is reached before filling up to the hard limit | 70 | SCT_DISKUSAGE_SOFTLIMIT
+| **diskusage_hardlimit** | Maximum disk usage in percent; the scaling action is performed once this usage is reached | 90 | SCT_DISKUSAGE_HARDLIMIT
diff --git a/full_storage_utilization_test.py b/full_storage_utilization_test.py
new file mode 100644
index 00000000000..465ad7bb877
--- /dev/null
+++ b/full_storage_utilization_test.py
@@ -0,0 +1,237 @@
+from enum import Enum
+import time
+from sdcm.tester import ClusterTester
+from sdcm.utils.tablets.common import wait_for_tablets_balanced
+
+class ScalingActionType(Enum):
+    SCALE_OUT = "scale_out"
+    SCALE_IN = "scale_in"
+
+class FullStorageUtilizationTest(ClusterTester):
+    def __init__(self, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+        self.num_stress_threads = 10
+        self.sleep_time_before_scale = 120
+        self.sleep_time_fill_disk = 1800
+        self.softlimit = self.params.get('diskusage_softlimit')
+        self.hardlimit = self.params.get('diskusage_hardlimit')
+        self.stress_cmd_w = self.params.get('stress_cmd_w')
+        self.stress_cmd_r = self.params.get('stress_cmd_r')
+        self.add_node_cnt = self.params.get('add_node_cnt')
+        self.scaling_action_type = self.params.get('scaling_action_type')
+        self.total_large_ks = 0
+        self.total_small_ks = 0
+
+    def prepare_dataset_layout(self, dataset_size, row_size=10240):
+        n = dataset_size * 1024 * 1024 * 1024 // row_size
+        seq_end = n * 100
+        cores = self.db_cluster.nodes[0].cpu_cores
+        if not cores:
+            self.num_stress_threads = 10
+        else:
+            self.num_stress_threads = int(cores) * 8
+
+        return f'cassandra-stress write cl=ONE n={n} -mode cql3 native -rate threads={self.num_stress_threads} -pop dist="uniform(1..{seq_end})" ' \
+               f'-col "size=FIXED({row_size}) n=FIXED(1)" -schema "replication(strategy=NetworkTopologyStrategy,replication_factor=3)"'
+
+    def setUp(self):
+        super().setUp()
+        self.start_time = time.time()
+
+    def start_throttle_write(self):
+        """Start the throttled write load; <THREADS_PLACE_HOLDER> in stress_cmd_w is replaced by the thread count."""
+        self.stress_cmd_w = self.stress_cmd_w.replace("<THREADS_PLACE_HOLDER>", str(self.num_stress_threads))
+        self.run_stress_thread(stress_cmd=self.stress_cmd_w)
+        # During the scaling operation keep some read/write load running to
+        # simulate a real-world workload. Wait sleep_time_before_scale seconds
+        # (2 minutes by default) so that the c-s tool has started running.
+        time.sleep(self.sleep_time_before_scale)
+
+    def start_throttle_read(self):
+        """Start the throttled read load; <THREADS_PLACE_HOLDER> in stress_cmd_r is replaced by the thread count."""
+        self.stress_cmd_r = self.stress_cmd_r.replace("<THREADS_PLACE_HOLDER>", str(self.num_stress_threads))
+        self.run_stress_thread(stress_cmd=self.stress_cmd_r)
+        time.sleep(self.sleep_time_before_scale)
+
+    def start_throttle_rw(self):
+        self.start_throttle_write()
+        self.start_throttle_read()
+
+    def scale_out(self):
+        self.start_throttle_rw()
+        self.log.info("Started adding a new node")
+        start_time = time.time()
+        self.add_new_node()
+        duration = time.time() - start_time
+        self.log.info(f"Adding a node finished with time: {duration}")
+
+    def scale_in(self):
+        self.start_throttle_rw()
+        self.log.info("Started removing a node")
+        start_time = time.time()
+        self.remove_node()
+        duration = time.time() - start_time
+        self.log.info(f"Removing a node finished with time: {duration}")
+
+    def drop_data(self, keyspace_name):
+        '''
+        Drop the given keyspace and log the resulting disk usage.
+        '''
+        node = self.db_cluster.nodes[0]
+        self.log.info("Dropping some data")
+        query = f"DROP KEYSPACE {keyspace_name}"
+        with self.db_cluster.cql_connection_patient(node) as session:
+            session.execute(query)
+        # TODO: decide whether node.run_nodetool("clearsnapshot") is needed here to actually free the space
+        self.log_disk_usage()
+
+    def perform_scale_in(self):
+        '''
+        If we are already at 90% disk utilization, first scale-out then
+        drop 20% of data to make space for scale-in operation.
+
+        If we are at 67% disk utilization, scale-in without scale-out or
+        dropping data.
+        Any other hard limit is not handled; an error is logged instead.
+        '''
+        if self.hardlimit == 90:
+            self.scale_out()
+            # Before removing a node, make sure the other nodes have enough
+            # space so that they can accommodate data from the removed node.
+            # Remove 20% of data from the cluster.
+            self.drop_data("keyspace_large1")
+            self.drop_data("keyspace_large2")
+            self.scale_in()
+        elif self.hardlimit == 67:
+            self.scale_in()
+        else:
+            self.log.error(f"No scale-in flow defined for diskusage_hardlimit={self.hardlimit}")
+
+    def perform_action(self):
+        self.log_disk_usage()
+        # Trigger specific action
+        if self.scaling_action_type == ScalingActionType.SCALE_OUT.value:
+            self.scale_out()
+        elif self.scaling_action_type == ScalingActionType.SCALE_IN.value:
+            self.perform_scale_in()
+        else:
+            self.log.info(f"Invalid ActionType {self.scaling_action_type}")
+        self.log_disk_usage()
+
+    def test_storage_utilization(self):
+        """
+        Write data until the soft limit, then until the hard limit of disk usage is reached.
+        Sleep for sleep_time_fill_disk seconds (30 minutes by default) after each stage.
+        Perform the scaling action selected by scaling_action_type.
+        """
+        self.run_stress(self.softlimit, sleep_time=self.sleep_time_fill_disk)
+        self.run_stress(self.hardlimit, sleep_time=self.sleep_time_fill_disk)
+        self.perform_action()
+
+    def run_stress(self, target_usage, sleep_time=600):
+        target_used_size = self.calculate_target_used_size(target_usage)
+        self.run_stress_until_target(target_used_size, target_usage)
+
+        self.log_disk_usage()
+        self.log.info(f"Wait for {sleep_time} seconds")
+        time.sleep(sleep_time)
+        self.log_disk_usage()
+
+    def run_stress_until_target(self, target_used_size, target_usage):
+        current_usage, current_used = self.get_max_disk_usage()
+        smaller_dataset = False
+
+        space_needed = target_used_size - current_used
+        # Chunk size is 10% of the space needed at the start (computed once, not per iteration)
+        chunk_size = int(space_needed * 0.1)
+        while current_used < target_used_size and current_usage < target_usage:
+            # Write smaller dataset near the threshold (15% or 30GB of the target)
+            smaller_dataset = (((target_used_size - current_used) < 30) or ((target_usage - current_usage) <= 15))
+            if not smaller_dataset:
+                self.total_large_ks += 1
+            else:
+                self.total_small_ks += 1
+
+            # Use 1GB chunks near threshold, otherwise use the precomputed chunk size
+            dataset_size = 1 if smaller_dataset else chunk_size
+            ks_name = "keyspace_small" if smaller_dataset else "keyspace_large"
+            num = self.total_small_ks if smaller_dataset else self.total_large_ks
+            self.log.info(f"Writing chunk of size: {dataset_size} GB")
+            stress_cmd = self.prepare_dataset_layout(dataset_size)
+            stress_queue = self.run_stress_thread(stress_cmd=stress_cmd, keyspace_name=f"{ks_name}{num}", stress_num=1, keyspace_num=num)
+
+            self.verify_stress_thread(cs_thread_pool=stress_queue)
+            self.get_stress_results(queue=stress_queue)
+
+            # Run "nodetool flush" on all nodes before re-measuring disk usage
+            self.db_cluster.flush_all_nodes()
+
+            current_usage, current_used = self.get_max_disk_usage()
+            self.log.info(f"Current max disk usage after writing to {ks_name}{num}: {current_usage}% ({current_used} GB / {target_used_size} GB)")
+
+    def add_new_node(self):
+        new_nodes = self.db_cluster.add_nodes(count=self.add_node_cnt, enable_auto_bootstrap=True)
+        self.db_cluster.wait_for_init(node_list=new_nodes)
+        self.db_cluster.wait_for_nodes_up_and_normal(nodes=new_nodes)
+        total_nodes_in_cluster = len(self.db_cluster.nodes)
+        self.log.info(f"New node added, total nodes in cluster: {total_nodes_in_cluster}")
+        self.monitors.reconfigure_scylla_monitoring()
+        wait_for_tablets_balanced(self.db_cluster.nodes[0])
+
+    def remove_node(self):
+        self.log.info('Removing a second node from the cluster')
+        node_to_remove = self.db_cluster.nodes[1]
+        self.log.info(f"Node to be removed: {node_to_remove.name}")
+        self.db_cluster.decommission(node_to_remove)
+        self.log.info(f"Node {node_to_remove.name} has been removed from the cluster")
+        self.monitors.reconfigure_scylla_monitoring()
+        wait_for_tablets_balanced(self.db_cluster.nodes[0])
+
+    def get_max_disk_usage(self):
+        max_usage = 0
+        max_used = 0
+        for node in self.db_cluster.nodes:
+            result = node.remoter.run("df -h -BG --output=used,pcent /var/lib/scylla | sed 1d | sed 's/G//' | sed 's/%//'")
+            used, usage = result.stdout.strip().split()
+            max_usage = max(max_usage, int(usage))
+            max_used = max(max_used, int(used))
+        return max_usage, max_used
+
+    def get_disk_info(self, node):
+        result = node.remoter.run("df -h -BG --output=size,used,avail,pcent /var/lib/scylla | sed 1d | sed 's/G//g' | sed 's/%//'")
+        size, used, avail, pcent = result.stdout.strip().split()
+        return {
+            'total': int(size),
+            'used': int(used),
+            'available': int(avail),
+            'used_percent': int(pcent)
+        }
+
+    def calculate_target_used_size(self, target_percent):
+        max_total = 0
+        for node in self.db_cluster.nodes:
+            info = self.get_disk_info(node)
+            max_total = max(max_total, info['total'])
+
+        target_used_size = (target_percent / 100) * max_total
+        current_usage, current_used = self.get_max_disk_usage()
+        additional_usage_needed = target_used_size - current_used
+
+        self.log.info(f"Current max disk usage: {current_usage:.2f}%")
+        self.log.info(f"Current max used space: {current_used:.2f} GB")
+        self.log.info(f"Max total disk space: {max_total:.2f} GB")
+        self.log.info(f"Target used space to reach {target_percent}%: {target_used_size:.2f} GB")
+        self.log.info(f"Additional space to be used: {additional_usage_needed:.2f} GB")
+
+        return target_used_size
+
+    def log_disk_usage(self):
+        for node in self.db_cluster.nodes:
+            info = self.get_disk_info(node)
+            self.log.info(f"Disk usage for node {node.name}:")
+            self.log.info(f" Total: {info['total']} GB")
+            self.log.info(f" Used: {info['used']} GB")
+            self.log.info(f" Available: {info['available']} GB")
+            self.log.info(f" Used %: {info['used_percent']}%")
+
+
diff --git a/jenkins-pipelines/oss/full-storage-utilization.jenkinsfile b/jenkins-pipelines/oss/full-storage-utilization.jenkinsfile
new file mode 100644
index 00000000000..b62422eb0bd
--- /dev/null
+++ b/jenkins-pipelines/oss/full-storage-utilization.jenkinsfile
@@ -0,0 +1,12 @@
+#!groovy
+
+// trick from https://github.com/jenkinsci/workflow-cps-global-lib-plugin/pull/43
+def lib = library identifier: 'sct@snapshot', retriever: legacySCM(scm)
+
+longevityPipeline(
+    backend: 'aws',
+    region: 'eu-west-1',
+    test_name: 'full_storage_utilization_test.FullStorageUtilizationTest.test_storage_utilization',
+    test_config: 'test-cases/scale/full-storage-utilization-scaleout.yaml',
+    timeout: [time: 300, unit: 'MINUTES']
+)
diff --git a/sdcm/cluster.py b/sdcm/cluster.py
index 86395f823c0..31b16819bd4 100644
--- a/sdcm/cluster.py
+++ b/sdcm/cluster.py
@@ -4451,6 +4451,14 @@ def get_nodes_up_and_normal(self, verification_node=None):
             up_nodes.append(node)
         return up_nodes
 
+    def flush_all_nodes(self):
+        """
+        Run the "nodetool flush" command on every db node in the cluster, one node after another.
+        :return: None
+        """
+        for node in self.nodes:
+            node.run_nodetool("flush")
+
     def get_node_status_dictionary(self, ip_address=None, verification_node=None):
         """Get node status dictionary via nodetool (in case it's not found return None)"""
         node_status = None
diff --git a/sdcm/sct_config.py b/sdcm/sct_config.py
index 7a7e97d9d11..902a7aa7a89 100644
--- a/sdcm/sct_config.py
+++ b/sdcm/sct_config.py
@@ -1233,6 +1233,14 @@ class SCTConfiguration(dict):
         dict(name="perf_gradual_throttle_steps", env="SCT_PERF_GRADUAL_THROTTLE_STEPS", type=dict,
              help="Used for gradual performance test. Define throttle for load step in ops. Example: {'read': ['100000', '150000'], 'mixed': ['300']}"),
 
+        # StorageUtilizationTest
+        dict(name="scaling_action_type", env="SCT_SCALING_ACTION_TYPE", type=str,
+             help="Refers to type of action (scale_in,scale_out etc) that needs to be performed when specific disk usage threshold is reached."),
+        dict(name="diskusage_softlimit", env="SCT_DISKUSAGE_SOFTLIMIT", type=int,
+             help="Soft limit threshold, data will populate as 10% chunk until this limit reached."),
+        dict(name="diskusage_hardlimit", env="SCT_DISKUSAGE_HARDLIMIT", type=int,
+             help="Maximum limit for disk usage."),
+
         # RefreshTest
         dict(name="skip_download", env="SCT_SKIP_DOWNLOAD", type=boolean,
              help=""),
diff --git a/test-cases/scale/full-storage-utilization-scalein.yaml b/test-cases/scale/full-storage-utilization-scalein.yaml
new file mode 100644
index 00000000000..f32aead6206
--- /dev/null
+++ b/test-cases/scale/full-storage-utilization-scalein.yaml
@@ -0,0 +1,17 @@
+test_duration: 3600
+n_db_nodes: 4
+n_loaders: 1
+n_monitor_nodes: 1
+user_prefix: 'storage-utilization'
+instance_type_db: 'i4i.xlarge'
+instance_provision: 'spot'
+
+enterprise_disable_kms: true
+scaling_action_type: "scale_in"
+diskusage_softlimit: 45
+diskusage_hardlimit: 67
+
+stress_cmd_w: 'cassandra-stress write duration=30m -rate threads=<THREADS_PLACE_HOLDER> "throttle=1400/s" -mode cql3 native -pop seq=1..5000000 -col "size=FIXED(10240) n=FIXED(1)" -schema "replication(strategy=NetworkTopologyStrategy,replication_factor=3)"'
+stress_cmd_r: 'cassandra-stress read duration=30m -rate threads=<THREADS_PLACE_HOLDER> "throttle=1400/s" -mode cql3 native -pop seq=1..5000000 -col "size=FIXED(10240) n=FIXED(1)" -schema "replication(strategy=NetworkTopologyStrategy,replication_factor=3)"'
+append_scylla_yaml:
+  enable_tablets: true
diff --git a/test-cases/scale/full-storage-utilization-scaleout.yaml b/test-cases/scale/full-storage-utilization-scaleout.yaml
new file mode 100644
index 00000000000..1d94b4835e2
--- /dev/null
+++ b/test-cases/scale/full-storage-utilization-scaleout.yaml
@@ -0,0 +1,17 @@
+test_duration: 3600
+n_db_nodes: 3
+n_loaders: 1
+n_monitor_nodes: 1
+user_prefix: 'storage-utilization'
+instance_type_db: 'i4i.xlarge'
+instance_provision: 'spot'
+
+enterprise_disable_kms: true
+scaling_action_type: "scale_out"
+diskusage_softlimit: 70
+diskusage_hardlimit: 90
+
+stress_cmd_w: 'cassandra-stress write duration=30m -rate threads=<THREADS_PLACE_HOLDER> "throttle=1400/s" -mode cql3 native -pop seq=1..5000000 -col "size=FIXED(10240) n=FIXED(1)" -schema "replication(strategy=NetworkTopologyStrategy,replication_factor=3)"'
+stress_cmd_r: 'cassandra-stress read duration=30m -rate threads=<THREADS_PLACE_HOLDER> "throttle=1400/s" -mode cql3 native -pop seq=1..5000000 -col "size=FIXED(10240) n=FIXED(1)" -schema "replication(strategy=NetworkTopologyStrategy,replication_factor=3)"'
+append_scylla_yaml:
+  enable_tablets: true