more merge perf tests

This commit is contained in:
Max Hoffman
2023-02-28 10:27:55 -08:00
parent bdee61c2ef
commit ed6fcdb51f
3 changed files with 97 additions and 36 deletions

View File

@@ -3,8 +3,8 @@ import shutil
import sys
import random
if len(sys.argv) != 5:
print("usage: python3 data.py <output-dir> <table-num> <row-num> <add-num>")
if len(sys.argv) != 7:
print("usage: python3 data.py <output-dir> <table-num> <row-num> <add-num> <delete-num> <update-num>")
sys.exit(1)
table_dir = sys.argv[1]
@@ -12,13 +12,17 @@ tables = int(sys.argv[2])
rows = int(sys.argv[3])
adds = int(sys.argv[4])
deletes = int(sys.argv[5])
updates = int(sys.argv[6])
if __name__=="__main__":
if deletes + updates > rows:
raise ValueError(f"deletes({deletes}) + updates({updates}) = {updates+deletes} > total rows({rows})")
if not os.path.exists(table_dir):
shutil.rmtree(table_dir, ignore_errors=True)
os.makedirs(table_dir)
ys = [i for i in range(rows+adds)]
ys = [i for i in range(rows+adds+deletes+updates)]
random.shuffle(ys)
with open(f"{table_dir}/create.sql", "+w") as f:
@@ -32,30 +36,74 @@ if __name__=="__main__":
for j in range(tables):
with open(f"{table_dir}/table{j}.csv", "+w") as f:
f.write("x,y,z\n")
for i in range(rows):
for i in range(rows+deletes+updates):
f.write(f"{i},{ys[i]},{i}\n")
with open(f"{table_dir}/branch.sql", "+w") as f:
for i in range(tables):
f.write(f"set foreign_key_checks = 0;\n")
f.write(f"set unique_checks = 0;\n")
f.write(f"insert into table{i} values\n")
for j,k in enumerate(ys[rows:rows+adds]):
if j == 0:
f.write(f" ")
else:
f.write(f", ")
f.write(f"({rows+j},{k},{rows+j})")
f.write(f";\n")
if adds > 0:
f.write(f"insert into table{i} values\n")
for j,k in enumerate(ys[rows+deletes+updates:rows+deletes+updates+adds]):
if j == 0:
f.write(f" ")
else:
f.write(f", ")
f.write(f"({rows+deletes+updates+j},{k},{rows+deletes+updates+j})")
f.write(f";\n")
if deletes > 0:
f.write(f"delete from table{i} where x in\n")
for j, y in enumerate(ys[:deletes]):
if j == 0:
f.write(f" (")
else:
f.write(f", ")
f.write(f"{y}")
f.write(f");\n")
if updates > 0:
f.write(f"update table{i} set y=y+1 where x in\n")
for j, y in enumerate(ys[deletes:deletes+updates]):
if j == 0:
f.write(f" (")
else:
f.write(f", ")
f.write(f"{y}")
f.write(f");\n")
with open(f"{table_dir}/diverge_main.sql", "+w") as f:
for i in range(tables):
f.write(f"set foreign_key_checks = 0;\n")
f.write(f"set unique_checks = 0;\n")
f.write(f"insert into table{i} values\n")
for j,k in enumerate(ys[rows:rows+adds]):
if j == 0:
f.write(f" ")
else:
f.write(f", ")
f.write(f"({rows+j},{k+1},{rows+j})")
f.write(f";\n")
if adds > 0:
# y value is one higher, conflict
f.write(f"insert into table{i} values\n")
for j,k in enumerate(ys[rows+deletes+updates:rows+deletes+updates+adds]):
if j == 0:
f.write(f" ")
else:
f.write(f", ")
f.write(f"({rows+deletes+updates+j},{k+1},{rows+deletes+updates+j})")
f.write(f";\n")
if deletes > 0:
f.write(f"delete from table{i} where y in\n")
for j, y in enumerate(ys[:deletes]):
if j == 0:
f.write(f" (")
else:
f.write(f", ")
f.write(f"{y}")
f.write(f");\n")
if updates > 0:
f.write(f"update table{i} set y=y+1 where y in\n")
for j, y in enumerate(ys[deletes:deletes+updates]):
if j == 0:
f.write(f" (")
else:
f.write(f", ")
f.write(f"{y}")
f.write(f");\n")

View File

@@ -36,3 +36,4 @@ dolt sql < $DATA/branch.sql
dolt commit -Am "new branch"
dolt merge --no-edit main