-
Notifications
You must be signed in to change notification settings - Fork 964
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
[wip -- do not review] feat: add support for big values in SeederV2 #4222
base: main
Are you sure you want to change the base?
Changes from all commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -18,12 +18,15 @@ local total_ops = tonumber(ARGV[6]) | |
local min_dev = tonumber(ARGV[7]) | ||
local data_size = tonumber(ARGV[8]) | ||
local collection_size = tonumber(ARGV[9]) | ||
-- Probability of each key in key_target to be a big value | ||
local huge_value_percentage = tonumber(ARGV[10]) | ||
local huge_value_size = tonumber(ARGV[11]) | ||
|
||
-- collect all keys belonging to this script | ||
-- assumes exclusive ownership | ||
local keys = LU_collect_keys(prefix, type) | ||
|
||
LG_funcs.init(data_size, collection_size) | ||
LG_funcs.init(data_size, collection_size, huge_value_percentage, huge_value_size) | ||
local addfunc = LG_funcs['add_' .. string.lower(type)] | ||
local modfunc = LG_funcs['mod_' .. string.lower(type)] | ||
|
||
|
@@ -85,6 +88,7 @@ while true do | |
if counter % 10 == 0 then | ||
-- calculate intensity (not normalized probabilities) | ||
-- please see attached plots in PR to understand convergence | ||
-- https://github.com/dragonflydb/dragonfly/pull/2556 | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. took me a few seconds to find this so I thought I should include the link. Now we can jump straight to the pr if needed (and it will be needed for anyone who changes this code). |
||
|
||
-- the add intensity is monotonically decreasing with keycount growing, | ||
-- the delete intensity is monotonically increasing with keycount growing, | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,9 +1,19 @@ | ||
local LG_funcs = {} | ||
|
||
function LG_funcs.init(dsize, csize) | ||
function LG_funcs.init(dsize, csize, large_val_perc, large_val_sz) | ||
LG_funcs.dsize = dsize | ||
LG_funcs.csize = csize | ||
LG_funcs.esize = math.ceil(dsize / csize) | ||
LG_funcs.huge_value_percentage = large_val_perc | ||
LG_funcs.huge_value_size = large_val_sz | ||
end | ||
|
||
-- Decides whether the next generated value should be a huge one.
-- Reads LG_funcs.huge_value_percentage, interpreted as a percentage (it is
-- divided by 100 before the comparison).
-- Returns true when that fraction is strictly greater than a fresh random draw.
local function huge_entry()
  -- init may have been called without the huge-value arguments; treat a
  -- missing percentage as 0% instead of failing on nil arithmetic
  local threshold = (LG_funcs.huge_value_percentage or 0) / 100
  -- math.random() without arguments yields a float in [0, 1), so a
  -- threshold of 0 never selects a huge value and 1 always does
  return threshold > math.random()
end
|
||
-- strings | ||
|
@@ -27,12 +37,18 @@ end | |
-- lists | ||
-- store list of random blobs of default container/element sizes | ||
|
||
function LG_funcs.add_list(key) | ||
local elements = dragonfly.randstr(LG_funcs.esize, LG_funcs.csize) | ||
function LG_funcs.add_list(key, huge_value) | ||
local elements | ||
if huge_entry() then | ||
elements = dragonfly.randstr(LG_funcs.huge_value_size, LG_funcs.csize) | ||
else | ||
elements = dragonfly.randstr(LG_funcs.esize, LG_funcs.csize) | ||
end | ||
|
||
redis.apcall('LPUSH', key, unpack(elements)) | ||
end | ||
|
||
function LG_funcs.mod_list(key) | ||
function LG_funcs.mod_list(key, huge_value) | ||
-- equally likely pops and pushes, we rely on the list size being large enough | ||
-- to "highly likely" not get emptied out by consecutive pops | ||
local action = math.random(1, 4) | ||
|
@@ -41,9 +57,23 @@ function LG_funcs.mod_list(key) | |
elseif action == 2 then | ||
redis.apcall('LPOP', key) | ||
elseif action == 3 then | ||
redis.apcall('LPUSH', key, dragonfly.randstr(LG_funcs.esize)) | ||
local str | ||
if huge_entry() then | ||
str = dragonfly.randstr(LG_funcs.huge_value_size) | ||
else | ||
str = dragonfly.randstr(LG_funcs.esize) | ||
end | ||
|
||
redis.apcall('LPUSH', key, str) | ||
else | ||
redis.apcall('RPUSH', key, dragonfly.randstr(LG_funcs.esize)) | ||
local str | ||
if huge_entry() then | ||
str = dragonfly.randstr(LG_funcs.huge_value_size) | ||
else | ||
str = dragonfly.randstr(LG_funcs.esize) | ||
end | ||
|
||
redis.apcall('RPUSH', key, str) | ||
end | ||
end | ||
|
||
|
@@ -62,7 +92,15 @@ function LG_funcs.add_set(key, keys) | |
end | ||
redis.apcall('SDIFFSTORE', key, keys[i1], keys[i2]) | ||
else | ||
local elements = dragonfly.randstr(LG_funcs.esize, LG_funcs.csize) | ||
local elements | ||
if huge_entry() then | ||
-- Hard coded 10 here, meaning up to 10 huge entries per set | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. //TODO so I don't forget to fix it. Replace |
||
-- TODO make this configurable | ||
-- the huge element size is stored by LG_funcs.init as huge_value_size
elements = dragonfly.randstr(LG_funcs.huge_value_size, 10)
else | ||
elements = dragonfly.randstr(LG_funcs.esize, LG_funcs.csize) | ||
end | ||
|
||
redis.apcall('SADD', key, unpack(elements)) | ||
end | ||
end | ||
|
@@ -72,7 +110,14 @@ function LG_funcs.mod_set(key) | |
if math.random() < 0.5 then | ||
redis.apcall('SPOP', key) | ||
else | ||
redis.apcall('SADD', key, dragonfly.randstr(LG_funcs.esize)) | ||
local rand_str | ||
if huge_entry() then | ||
rand_str = dragonfly.randstr(LG_funcs.huge_value_size) | ||
else | ||
rand_str = dragonfly.randstr(LG_funcs.esize) | ||
end | ||
|
||
redis.apcall('SADD', key, rand_str) | ||
end | ||
end | ||
|
||
|
@@ -82,7 +127,13 @@ end | |
-- where `value` is a random string for even indices and a number for odd indices | ||
|
||
function LG_funcs.add_hash(key) | ||
local blobs = dragonfly.randstr(LG_funcs.esize, LG_funcs.csize / 2) | ||
local blobs | ||
if huge_entry() then | ||
blobs = dragonfly.randstr(LG_funcs.huge_value_size, LG_funcs.csize / 2) | ||
else | ||
blobs = dragonfly.randstr(LG_funcs.esize, LG_funcs.csize / 2) | ||
end | ||
|
||
local htable = {} | ||
for i = 1, LG_funcs.csize, 2 do | ||
htable[i * 2 - 1] = tostring(i) | ||
|
@@ -100,15 +151,28 @@ function LG_funcs.mod_hash(key) | |
if idx % 2 == 1 then | ||
redis.apcall('HINCRBY', key, tostring(idx), 1) | ||
else | ||
redis.apcall('HSET', key, tostring(idx), dragonfly.randstr(LG_funcs.esize)) | ||
local str | ||
if huge_entry() then | ||
-- the huge element size is stored by LG_funcs.init as huge_value_size
str = dragonfly.randstr(LG_funcs.huge_value_size)
else | ||
str = dragonfly.randstr(LG_funcs.esize) | ||
end | ||
|
||
redis.apcall('HSET', key, tostring(idx), str) | ||
end | ||
end | ||
|
||
-- sorted sets | ||
|
||
function LG_funcs.add_zset(key, keys) | ||
-- TODO: We don't support ZDIFFSTORE | ||
local blobs = dragonfly.randstr(LG_funcs.esize, LG_funcs.csize) | ||
local blobs | ||
if huge_entry() then | ||
blobs = dragonfly.randstr(LG_funcs.huge_value_size, LG_funcs.csize) | ||
else | ||
-- regular entries use the default element size (esize), not the element count
blobs = dragonfly.randstr(LG_funcs.esize, LG_funcs.csize)
end | ||
|
||
local ztable = {} | ||
for i = 1, LG_funcs.csize do | ||
ztable[i * 2 - 1] = tostring(i) | ||
|
@@ -120,7 +184,14 @@ end | |
function LG_funcs.mod_zset(key, dbsize) | ||
local action = math.random(1, 4) | ||
if action <= 2 then | ||
redis.apcall('ZADD', key, math.random(0, LG_funcs.csize * 2), dragonfly.randstr(LG_funcs.esize)) | ||
local str | ||
if huge_entry() then | ||
-- the huge element size is stored by LG_funcs.init as huge_value_size
str = dragonfly.randstr(LG_funcs.huge_value_size)
else | ||
str = dragonfly.randstr(LG_funcs.esize) | ||
end | ||
|
||
redis.apcall('ZADD', key, math.random(0, LG_funcs.csize * 2), str) | ||
elseif action == 3 then | ||
redis.apcall('ZPOPMAX', key) | ||
else | ||
|
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
For now I will keep a flat probability for each key in the key target to contain a
huge value