Files
dolt/.github/scripts/merge-perf/data.py
2023-02-28 10:27:55 -08:00

110 lines
3.9 KiB
Python

import os
import shutil
import sys
import random
if len(sys.argv) != 7:
print("usage: python3 data.py <output-dir> <table-num> <row-num> <add-num> <delete-num> <update-num>")
sys.exit(1)
table_dir = sys.argv[1]
tables = int(sys.argv[2])
rows = int(sys.argv[3])
adds = int(sys.argv[4])
deletes = int(sys.argv[5])
updates = int(sys.argv[6])
if __name__=="__main__":
if deletes + updates > rows:
raise ValueError(f"deletes({deletes}) + updates({updates}) = {updates+deletes} > total rows({rows})")
if not os.path.exists(table_dir):
shutil.rmtree(table_dir, ignore_errors=True)
os.makedirs(table_dir)
ys = [i for i in range(rows+adds+deletes+updates)]
random.shuffle(ys)
with open(f"{table_dir}/create.sql", "+w") as f:
for i in range(tables):
if i == 0:
f.write(f"create table table{i} (x int primary key, y int, z int, key y_idx(y));\n")
else:
f.write(f"create table table{i} (x int primary key, y int, z int, key y_idx(y), foreign key (y) references table{i-1}(y));\n")
for j in range(tables):
with open(f"{table_dir}/table{j}.csv", "+w") as f:
f.write("x,y,z\n")
for i in range(rows+deletes+updates):
f.write(f"{i},{ys[i]},{i}\n")
with open(f"{table_dir}/branch.sql", "+w") as f:
for i in range(tables):
f.write(f"set foreign_key_checks = 0;\n")
f.write(f"set unique_checks = 0;\n")
if adds > 0:
f.write(f"insert into table{i} values\n")
for j,k in enumerate(ys[rows+deletes+updates:rows+deletes+updates+adds]):
if j == 0:
f.write(f" ")
else:
f.write(f", ")
f.write(f"({rows+deletes+updates+j},{k},{rows+deletes+updates+j})")
f.write(f";\n")
if deletes > 0:
f.write(f"delete from table{i} where x in\n")
for j, y in enumerate(ys[:deletes]):
if j == 0:
f.write(f" (")
else:
f.write(f", ")
f.write(f"{y}")
f.write(f");\n")
if updates > 0:
f.write(f"update table{i} set y=y+1 where x in\n")
for j, y in enumerate(ys[deletes:deletes+updates]):
if j == 0:
f.write(f" (")
else:
f.write(f", ")
f.write(f"{y}")
f.write(f");\n")
with open(f"{table_dir}/diverge_main.sql", "+w") as f:
for i in range(tables):
f.write(f"set foreign_key_checks = 0;\n")
f.write(f"set unique_checks = 0;\n")
if adds > 0:
# y value is one higher, conflict
f.write(f"insert into table{i} values\n")
for j,k in enumerate(ys[rows+deletes+updates:rows+deletes+updates+adds]):
if j == 0:
f.write(f" ")
else:
f.write(f", ")
f.write(f"({rows+deletes+updates+j},{k+1},{rows+deletes+updates+j})")
f.write(f";\n")
if deletes > 0:
f.write(f"delete from table{i} where y in\n")
for j, y in enumerate(ys[:deletes]):
if j == 0:
f.write(f" (")
else:
f.write(f", ")
f.write(f"{y}")
f.write(f");\n")
if updates > 0:
f.write(f"update table{i} set y=y+1 where y in\n")
for j, y in enumerate(ys[deletes:deletes+updates]):
if j == 0:
f.write(f" (")
else:
f.write(f", ")
f.write(f"{y}")
f.write(f");\n")