-
Notifications
You must be signed in to change notification settings - Fork 95
/
performance_regression_alternator_test.py
307 lines (245 loc) · 14 KB
/
performance_regression_alternator_test.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation; either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
#
# See LICENSE for more details.
#
# Copyright (c) 2020 ScyllaDB
import contextlib
from performance_regression_test import PerformanceRegressionTest
from sdcm.sct_events.group_common_events import ignore_operation_errors, ignore_alternator_client_errors
from sdcm.utils import alternator
from sdcm.utils.decorators import optional_stage
class PerformanceRegressionAlternatorTest(PerformanceRegressionTest):
    """Performance regression tests that compare CQL with Alternator.

    Every test runs the same stress command three times and stores each run
    under its own ``sub_type``:

    * ``cql``         - the command with ``dynamodb`` replaced by ``cassandra-cql``
    * ``without-lwt`` - Alternator with ``WriteIsolation.FORBID_RMW``
    * ``with-lwt``    - Alternator with ``WriteIsolation.ALWAYS_USE_LWT``

    and then calls ``check_regression_with_baseline('cql')``.
    """

    def __init__(self, *args):
        super().__init__(*args)

        # suppress YCSB client error and timeout to warnings for all the test in this class
        # NOTE(review): the stack is entered here but never closed in this class,
        # so the two contexts stay active for the lifetime of the instance.
        self.stack = contextlib.ExitStack()
        self.stack.enter_context(ignore_alternator_client_errors())
        self.stack.enter_context(ignore_operation_errors())

    def _workload(self, stress_cmd, stress_num, test_name=None, sub_type=None, keyspace_num=1, prefix='', debug_message='',  # pylint: disable=too-many-arguments,arguments-differ
                  save_stats=True, is_alternator=True):
        """Run a single stress workload and optionally record its statistics.

        :param stress_cmd: stress command to run; when ``is_alternator`` is false,
            every ``dynamodb`` occurrence in it is replaced by ``cassandra-cql``.
        :param stress_num: forwarded to ``run_stress_thread``.
        :param test_name: forwarded to ``create_test_stats`` (only when ``save_stats``).
        :param sub_type: forwarded to ``create_test_stats`` (only when ``save_stats``).
        :param keyspace_num: forwarded to ``run_stress_thread``.
        :param prefix: forwarded to ``run_stress_thread``.
        :param debug_message: logged at debug level when non-empty.
        :param save_stats: when true, create the test stats before the run and
            update the test details after it.
        :param is_alternator: whether the command targets Alternator (default) or CQL.
        """
        if not is_alternator:
            stress_cmd = stress_cmd.replace('dynamodb', 'cassandra-cql')

        if debug_message:
            self.log.debug(debug_message)

        if save_stats:
            self.create_test_stats(test_name=test_name, sub_type=sub_type,
                                   doc_id_with_timestamp=True, append_sub_test_to_name=False)
        stress_queue = self.run_stress_thread(stress_cmd=stress_cmd, stress_num=stress_num, keyspace_num=keyspace_num,
                                              prefix=prefix, stats_aggregate_cmds=False)
        self.get_stress_results(queue=stress_queue, store_results=True)
        if save_stats:
            self.update_test_details(scylla_conf=True, alternator=is_alternator)

    def create_alternator_table(self, schema, alternator_write_isolation):
        """(Re)create the Alternator table used by the workloads.

        An existing table named ``alternator.consts.TABLE_NAME`` is deleted first.
        After the table is created, fstrim is run on all DB nodes and the method
        waits until no compactions are running.

        :param schema: forwarded as ``schema`` to ``self.alternator.create_table``.
        :param alternator_write_isolation: forwarded as ``isolation`` to
            ``self.alternator.create_table``.
        """
        node = self.db_cluster.nodes[0]

        # drop tables
        table_name = alternator.consts.TABLE_NAME
        if self.alternator.is_table_exists(node=node, table_name=table_name):
            self.alternator.delete_table(node=node, table_name=table_name)

        # create new tables
        self.log.info("Going to create alternator tables")
        self.alternator.create_table(node=node, schema=schema, isolation=alternator_write_isolation)

        self.run_fstrim_on_all_db_nodes()
        self.wait_no_compactions_running()

    def create_cql_ks_and_table(self, field_number):
        """Create the ``ycsb`` keyspace and the ``ycsb.usertable`` table over CQL.

        The table has a ``y_id varchar`` primary key and ``field_number`` varchar
        columns named ``field0`` .. ``field<field_number - 1>``.

        :param field_number: number of ``fieldN`` columns to create.
        """
        node = self.db_cluster.nodes[0]
        with self.db_cluster.cql_connection_patient(node) as session:
            session.execute(
                """create keyspace ycsb WITH REPLICATION = {'class' : 'NetworkTopologyStrategy', 'replication_factor': 3 };""")
            fields = ', '.join([f"field{i} varchar" for i in range(field_number)])
            session.execute(f"""CREATE TABLE ycsb.usertable (
                                y_id varchar primary key,
                                {fields});""")

    @optional_stage('perf_preload_data')
    def preload_data(self, compaction_strategy=None):
        """Pre-populate data through both Alternator and CQL.

        Reads ``prepare_write_cmd`` from the test params. It may be a single
        command string or a sequence of commands. Each command is started twice:
        once as-is in terms of stress type (``dynamodb``) and once with
        ``dynamodb`` replaced by ``cassandra-cql``. All started stress threads are
        then waited for; their results are not stored.

        When no prepare command is configured, only a warning is logged.

        :param compaction_strategy: not used by this implementation.
        """
        # if test require a pre-population of data
        prepare_write_cmd = self.params.get('prepare_write_cmd')
        if not prepare_write_cmd:
            self.log.warning("No prepare command defined in YAML!")
            return

        # Normalise to a list of commands. A one-element list used to fall into
        # the single-command branch and fail on ``list.replace``.
        if isinstance(prepare_write_cmd, str):
            prepare_cmds = [prepare_write_cmd]
        else:
            prepare_cmds = list(prepare_write_cmd)

        # create new document in ES with doc_id = test_id + timestamp
        # allow to correctly save results for future compare
        self.create_test_stats(sub_type='write-prepare', doc_id_with_timestamp=True)
        stress_queue = []
        params = {'prefix': 'preload-'}
        for stress_type in ['dynamodb', 'cassandra-cql']:
            # Check if the prepare_cmd is a list of commands
            if len(prepare_cmds) > 1:
                # Check if it should be round_robin across loaders
                if self.params.get('round_robin'):
                    self.log.debug('Populating data using round_robin')
                    params.update({'stress_num': 1, 'round_robin': True})

                for stress_cmd in prepare_cmds:
                    typed_cmd = stress_cmd.replace('dynamodb', stress_type)
                    params.update({'stress_cmd': typed_cmd})

                    # Run all stress commands
                    params.update(dict(stats_aggregate_cmds=False))
                    self.log.debug('RUNNING stress cmd: %s', typed_cmd)
                    stress_queue.append(self.run_stress_thread(**params))

            # One stress cmd command
            else:
                stress_queue.append(self.run_stress_thread(
                    stress_cmd=prepare_cmds[0].replace('dynamodb', stress_type), stress_num=1,
                    prefix='preload-', stats_aggregate_cmds=False))

        # Wait for every preload thread that was started for both stress types.
        for stress in stress_queue:
            self.get_stress_results(queue=stress, store_results=False)

        self.update_test_details()

    def test_write(self):
        """
        Test steps:

        1. Run a write workload with cql
        2. Run a write workload without lwt
        3. Run a write workload with lwt enabled
        """
        # run a write workload
        base_cmd_w = self.params.get('stress_cmd_w')
        stress_multiplier = self.params.get('stress_multiplier')

        self.create_cql_ks_and_table(field_number=10)

        self._workload(sub_type='cql', stress_cmd=base_cmd_w,
                       stress_num=stress_multiplier, keyspace_num=1, is_alternator=False)

        schema = self.params.get("dynamodb_primarykey_type")
        # run a workload without lwt as baseline
        # (the Alternator table is recreated before each Alternator run)
        self.create_alternator_table(
            schema=schema, alternator_write_isolation=alternator.enums.WriteIsolation.FORBID_RMW)
        self._workload(sub_type='without-lwt', stress_cmd=base_cmd_w, stress_num=stress_multiplier, keyspace_num=1)

        # run a workload with lwt
        self.create_alternator_table(
            schema=schema, alternator_write_isolation=alternator.enums.WriteIsolation.ALWAYS_USE_LWT)
        self._workload(sub_type='with-lwt', stress_cmd=base_cmd_w, stress_num=stress_multiplier, keyspace_num=1)

        self.check_regression_with_baseline('cql')

    def test_read(self):
        """
        Test steps:

        1. Run a write workload as a preparation
        2. Run a read workload with cql
        3. Run a read workload without lwt
        4. Run a read workload with lwt enabled
        """
        node = self.db_cluster.nodes[0]

        base_cmd_r = self.params.get('stress_cmd_r')
        stress_multiplier = self.params.get('stress_multiplier')
        self.run_fstrim_on_all_db_nodes()
        # run a prepare write workload
        self.create_cql_ks_and_table(field_number=10)
        self.create_alternator_table(schema=self.params.get("dynamodb_primarykey_type"),
                                     alternator_write_isolation=alternator.enums.WriteIsolation.FORBID_RMW)

        self.preload_data()

        self._workload(sub_type='cql', stress_cmd=base_cmd_r,
                       stress_num=stress_multiplier, keyspace_num=1, is_alternator=False)

        # run a workload without lwt as baseline
        self.alternator.set_write_isolation(node=node, isolation=alternator.enums.WriteIsolation.FORBID_RMW)
        self._workload(sub_type='without-lwt', stress_cmd=base_cmd_r, stress_num=stress_multiplier, keyspace_num=1)

        # run a workload with lwt
        self.alternator.set_write_isolation(node=node, isolation=alternator.enums.WriteIsolation.ALWAYS_USE_LWT)
        self._workload(sub_type='with-lwt', stress_cmd=base_cmd_r, stress_num=stress_multiplier, keyspace_num=1)

        self.check_regression_with_baseline('cql')

    def test_mixed(self):
        """
        Test steps:

        1. Run a write workload as a preparation
        2. Run a mixed workload with cql
        3. Run a mixed workload without lwt
        4. Run a mixed workload with lwt
        """
        node = self.db_cluster.nodes[0]

        base_cmd_m = self.params.get('stress_cmd_m')
        stress_multiplier = self.params.get('stress_multiplier')
        self.run_fstrim_on_all_db_nodes()

        self.create_cql_ks_and_table(field_number=10)
        self.create_alternator_table(schema=self.params.get("dynamodb_primarykey_type"),
                                     alternator_write_isolation=alternator.enums.WriteIsolation.FORBID_RMW)
        # run a write workload as a preparation
        self.preload_data()

        self._workload(sub_type='cql', stress_cmd=base_cmd_m,
                       stress_num=stress_multiplier, keyspace_num=1, is_alternator=False)

        # run a mixed workload
        # run a workload without lwt as baseline
        self.alternator.set_write_isolation(node=node, isolation=alternator.enums.WriteIsolation.FORBID_RMW)
        self._workload(sub_type='without-lwt', stress_cmd=base_cmd_m, stress_num=stress_multiplier, keyspace_num=1)

        # run a workload with lwt
        self.alternator.set_write_isolation(node=node, isolation=alternator.enums.WriteIsolation.ALWAYS_USE_LWT)
        self._workload(sub_type='with-lwt', stress_cmd=base_cmd_m, stress_num=stress_multiplier, keyspace_num=1)

        self.check_regression_with_baseline('cql')

    def test_latency(self):
        """
        Test steps:

        1. Prepare cluster with data (reach steady state of compactions and ~x10 capacity than RAM).
           With round_robin and a list of stress_cmd the data will load several times faster.
        2. Run READ workload with cql.
        3. Run READ workload without lwt.
        4. Run READ workload with lwt.
        5. Run WRITE workload with cql.
        6. Run WRITE workload without lwt.
        7. Run WRITE workload with lwt.
        8. Run MIXED workload with cql.
        9. Run MIXED workload without lwt.
        10. Run MIXED workload with lwt.
        """
        node = self.db_cluster.nodes[0]

        self.create_alternator_table(schema=self.params.get("dynamodb_primarykey_type"),
                                     alternator_write_isolation=alternator.enums.WriteIsolation.FORBID_RMW)
        self.alternator.set_write_isolation(node=node, isolation=alternator.enums.WriteIsolation.FORBID_RMW)

        self.create_cql_ks_and_table(field_number=10)
        self.run_fstrim_on_all_db_nodes()
        self.preload_data()

        base_cmd_w = self.params.get('stress_cmd_w')
        base_cmd_r = self.params.get('stress_cmd_r')
        base_cmd_m = self.params.get('stress_cmd_m')

        # ---- READ stage ----
        stress_multiplier = 2
        self.wait_no_compactions_running(n=120)
        self.run_fstrim_on_all_db_nodes()

        self._workload(
            test_name=self.id() + '_read', sub_type='cql', stress_cmd=base_cmd_r, stress_num=stress_multiplier,
            keyspace_num=1, is_alternator=False)

        # run a workload without lwt as baseline
        self.alternator.set_write_isolation(node=node, isolation=alternator.enums.WriteIsolation.FORBID_RMW)
        self._workload(
            test_name=self.id() + '_read', sub_type='without-lwt', stress_cmd=base_cmd_r, stress_num=stress_multiplier,
            keyspace_num=1)

        self.wait_no_compactions_running()
        # run a workload with lwt
        self.alternator.set_write_isolation(node=node, isolation=alternator.enums.WriteIsolation.ALWAYS_USE_LWT)
        self._workload(
            test_name=self.id() + '_read', sub_type='with-lwt', stress_cmd=base_cmd_r, stress_num=stress_multiplier,
            keyspace_num=1)
        self.check_regression_with_baseline('cql')

        # ---- WRITE stage ----
        stress_multiplier = 1
        self.run_fstrim_on_all_db_nodes()
        self.wait_no_compactions_running()

        self._workload(
            test_name=self.id() + '_write', sub_type='cql', stress_cmd=base_cmd_w + " -target 10000",
            stress_num=stress_multiplier, keyspace_num=1, is_alternator=False)

        self.wait_no_compactions_running()
        # run a workload without lwt as baseline
        self.alternator.set_write_isolation(node=node, isolation=alternator.enums.WriteIsolation.FORBID_RMW)
        self._workload(
            test_name=self.id() + '_write', sub_type='without-lwt', stress_cmd=base_cmd_w + " -target 10000",
            stress_num=stress_multiplier, keyspace_num=1)

        self.wait_no_compactions_running(n=120)
        # run a workload with lwt
        # NOTE(review): the LWT run uses a lower "-target" (3000) than the other
        # write runs (10000); the reason is not stated in this file.
        self.alternator.set_write_isolation(node=node, isolation=alternator.enums.WriteIsolation.ALWAYS_USE_LWT)
        self._workload(
            test_name=self.id() + '_write', sub_type='with-lwt', stress_cmd=base_cmd_w + " -target 3000",
            stress_num=stress_multiplier, keyspace_num=1)
        self.check_regression_with_baseline('cql')

        # ---- MIXED stage ----
        stress_multiplier = 1
        self.wait_no_compactions_running(n=120)
        self.run_fstrim_on_all_db_nodes()

        self._workload(
            test_name=self.id() + '_mixed', sub_type='cql', stress_cmd=base_cmd_m + " -target 10000",
            stress_num=stress_multiplier, keyspace_num=1, is_alternator=False)

        self.wait_no_compactions_running()
        # run a workload without lwt as baseline
        self.alternator.set_write_isolation(node=node, isolation=alternator.enums.WriteIsolation.FORBID_RMW)
        self._workload(test_name=self.id() + '_mixed', sub_type='without-lwt',
                       stress_cmd=base_cmd_m + " -target 10000", stress_num=stress_multiplier, keyspace_num=1)

        self.wait_no_compactions_running()
        # run a workload with lwt
        # NOTE(review): the LWT run uses a lower "-target" (5000) than the other
        # mixed runs (10000); the reason is not stated in this file.
        self.alternator.set_write_isolation(node=node, isolation=alternator.enums.WriteIsolation.ALWAYS_USE_LWT)
        self._workload(test_name=self.id() + '_mixed', sub_type='with-lwt',
                       stress_cmd=base_cmd_m + " -target 5000", stress_num=stress_multiplier, keyspace_num=1)
        self.check_regression_with_baseline('cql')