mirror of
https://github.com/dolthub/dolt.git
synced 2026-01-13 10:26:13 -06:00
110 lines
3.9 KiB
Python
110 lines
3.9 KiB
Python
import os
|
|
import shutil
|
|
import sys
|
|
import random
|
|
|
|
if len(sys.argv) != 7:
|
|
print("usage: python3 data.py <output-dir> <table-num> <row-num> <add-num> <delete-num> <update-num>")
|
|
sys.exit(1)
|
|
|
|
table_dir = sys.argv[1]
|
|
tables = int(sys.argv[2])
|
|
rows = int(sys.argv[3])
|
|
|
|
adds = int(sys.argv[4])
|
|
deletes = int(sys.argv[5])
|
|
updates = int(sys.argv[6])
|
|
|
|
if __name__=="__main__":
|
|
if deletes + updates > rows:
|
|
raise ValueError(f"deletes({deletes}) + updates({updates}) = {updates+deletes} > total rows({rows})")
|
|
if not os.path.exists(table_dir):
|
|
shutil.rmtree(table_dir, ignore_errors=True)
|
|
os.makedirs(table_dir)
|
|
|
|
ys = [i for i in range(rows+adds+deletes+updates)]
|
|
random.shuffle(ys)
|
|
|
|
with open(f"{table_dir}/create.sql", "+w") as f:
|
|
for i in range(tables):
|
|
if i == 0:
|
|
f.write(f"create table table{i} (x int primary key, y int, z int, key y_idx(y));\n")
|
|
else:
|
|
f.write(f"create table table{i} (x int primary key, y int, z int, key y_idx(y), foreign key (y) references table{i-1}(y));\n")
|
|
|
|
|
|
for j in range(tables):
|
|
with open(f"{table_dir}/table{j}.csv", "+w") as f:
|
|
f.write("x,y,z\n")
|
|
for i in range(rows+deletes+updates):
|
|
f.write(f"{i},{ys[i]},{i}\n")
|
|
|
|
with open(f"{table_dir}/branch.sql", "+w") as f:
|
|
for i in range(tables):
|
|
f.write(f"set foreign_key_checks = 0;\n")
|
|
f.write(f"set unique_checks = 0;\n")
|
|
if adds > 0:
|
|
f.write(f"insert into table{i} values\n")
|
|
for j,k in enumerate(ys[rows+deletes+updates:rows+deletes+updates+adds]):
|
|
if j == 0:
|
|
f.write(f" ")
|
|
else:
|
|
f.write(f", ")
|
|
f.write(f"({rows+deletes+updates+j},{k},{rows+deletes+updates+j})")
|
|
f.write(f";\n")
|
|
|
|
if deletes > 0:
|
|
f.write(f"delete from table{i} where x in\n")
|
|
for j, y in enumerate(ys[:deletes]):
|
|
if j == 0:
|
|
f.write(f" (")
|
|
else:
|
|
f.write(f", ")
|
|
f.write(f"{y}")
|
|
f.write(f");\n")
|
|
|
|
if updates > 0:
|
|
f.write(f"update table{i} set y=y+1 where x in\n")
|
|
for j, y in enumerate(ys[deletes:deletes+updates]):
|
|
if j == 0:
|
|
f.write(f" (")
|
|
else:
|
|
f.write(f", ")
|
|
f.write(f"{y}")
|
|
f.write(f");\n")
|
|
|
|
with open(f"{table_dir}/diverge_main.sql", "+w") as f:
|
|
for i in range(tables):
|
|
f.write(f"set foreign_key_checks = 0;\n")
|
|
f.write(f"set unique_checks = 0;\n")
|
|
if adds > 0:
|
|
# y value is one higher, conflict
|
|
f.write(f"insert into table{i} values\n")
|
|
for j,k in enumerate(ys[rows+deletes+updates:rows+deletes+updates+adds]):
|
|
if j == 0:
|
|
f.write(f" ")
|
|
else:
|
|
f.write(f", ")
|
|
f.write(f"({rows+deletes+updates+j},{k+1},{rows+deletes+updates+j})")
|
|
f.write(f";\n")
|
|
|
|
if deletes > 0:
|
|
f.write(f"delete from table{i} where y in\n")
|
|
for j, y in enumerate(ys[:deletes]):
|
|
if j == 0:
|
|
f.write(f" (")
|
|
else:
|
|
f.write(f", ")
|
|
f.write(f"{y}")
|
|
f.write(f");\n")
|
|
|
|
if updates > 0:
|
|
f.write(f"update table{i} set y=y+1 where y in\n")
|
|
for j, y in enumerate(ys[deletes:deletes+updates]):
|
|
if j == 0:
|
|
f.write(f" (")
|
|
else:
|
|
f.write(f", ")
|
|
f.write(f"{y}")
|
|
f.write(f");\n")
|