mirror of
https://github.com/dolthub/dolt.git
synced 2026-04-22 19:43:51 -05:00
d019cce6f7
* Stats auto refresh prototype * fix bugs * test stats update * add tests, fix bugs * fix test * fmt * delete test * more tests * delete table test * [ga-format-pr] Run go/utils/repofmt/format_repo.sh and go/Godeps/update.sh * add and delete stats hooks * fmt * concurrency improvements * [ga-format-pr] Run go/utils/repofmt/format_repo.sh and go/Godeps/update.sh * write bug * more tests and stats functions * working dolt_stat funcs * test fixes * bump * fmt * fix wg panic * [ga-format-pr] Run go/utils/repofmt/format_repo.sh and go/Godeps/update.sh * nick comments --------- Co-authored-by: max-hoffman <max-hoffman@users.noreply.github.com>
351 lines
9.6 KiB
Bash
351 lines
9.6 KiB
Bash
#!/usr/bin/env bats
|
|
load $BATS_TEST_DIRNAME/helper/common.bash
|
|
load $BATS_TEST_DIRNAME/helper/query-server-common.bash
|
|
|
|
# Per-test fixture. Creates two freshly initialised dolt repositories under
# $TMPDIRS and leaves the working directory at $TMPDIRS:
#   repo1 - table ab (primary key a, secondary key (b,a))
#   repo2 - table xy (primary key x, secondary key (y,x)) and table ab as above
# Globals: TMPDIRS (written), SQL_ENGINE (read)
setup() {
    skiponwindows "tests are flaky on Windows"
    if [ "$SQL_ENGINE" = "remote-engine" ]; then
        skip "This test tests remote connections directly, SQL_ENGINE is not needed."
    fi

    setup_common

    # Every expansion of TMPDIRS is quoted so a working directory containing
    # whitespace or glob characters cannot split the path into several words.
    TMPDIRS="$(pwd)/tmpdirs"
    mkdir -p "$TMPDIRS"/{repo1,repo2}

    cd "$TMPDIRS/repo1"
    dolt init

    dolt sql <<SQL
create table ab (a int primary key, b int, key (b,a));
SQL

    cd "$TMPDIRS/repo2"
    dolt init

    dolt sql <<SQL
create table xy (x int primary key, y int, key (y,x));
create table ab (a int primary key, b int, key (b,a));
SQL

    cd "$TMPDIRS"
}
|
|
|
|
# Per-test cleanup: runs the shared teardown helper, stops the sql server,
# removes the repositories created by setup and moves to $BATS_TMPDIR.
# Globals: TMPDIRS (read), BATS_TMPDIR (read)
teardown() {
    teardown_common
    stop_sql_server 1

    # setup can call `skip` before TMPDIRS is assigned, so it may be empty here.
    # Guard and quote the path so the recursive delete only ever targets the
    # single directory setup created, even when the path contains whitespace.
    if [ -n "${TMPDIRS:-}" ]; then
        rm -rf -- "$TMPDIRS"
    fi

    cd "$BATS_TMPDIR"
}
|
|
|
|
@test "stats: empty initial stats" {
|
|
cd repo2
|
|
|
|
dolt sql -q "insert into xy values (0,0), (1,1)"
|
|
|
|
start_sql_server
|
|
sleep 1
|
|
stop_sql_server
|
|
|
|
# no statistics error if ref does not exist
|
|
run dolt sql -r csv -q "select database_name, table_name, index_name from dolt_statistics"
|
|
[ "$status" -eq 1 ]
|
|
[[ "$output" =~ "no statistics found" ]] || false
|
|
|
|
# setting variables doesn't hang or error
|
|
dolt sql -q "set @@PERSIST.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "set @@PERSIST.dolt_stats_auto_refresh_threshold = .5"
|
|
dolt sql -q "set @@PERSIST.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
# auto refresh can only initialize at server startup
|
|
start_sql_server
|
|
|
|
# need to trigger at least one refresh cycle
|
|
sleep 1
|
|
|
|
# only statistics for non-empty tables are collected
|
|
run dolt sql -r csv -q "select database_name, table_name, index_name from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[0]}" = "database_name,table_name,index_name" ]
|
|
[ "${lines[1]}" = "repo2,xy,primary" ]
|
|
[ "${lines[2]}" = "repo2,xy,yx" ]
|
|
|
|
# appending new chunks picked up
|
|
dolt sql -q "insert into xy select x, 1 from (with recursive inputs(x) as (select 4 union select x+1 from inputs where x < 1000) select * from inputs) dt;"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "8" ]
|
|
|
|
# updates picked up
|
|
dolt sql -q "update xy set y = 2 where x between 100 and 800"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "8" ]
|
|
}
|
|
|
|
@test "stats: deletes refresh" {
|
|
cd repo2
|
|
|
|
dolt sql -q "insert into xy select x, 1 from (with recursive inputs(x) as (select 4 union select x+1 from inputs where x < 1000) select * from inputs) dt;"
|
|
|
|
# setting variables doesn't hang or error
|
|
dolt sql -q "set @@persist.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "set @@persist.dolt_stats_auto_refresh_threshold = .5"
|
|
dolt sql -q "set @@persist.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
start_sql_server
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "8" ]
|
|
|
|
# delete >50% of rows
|
|
dolt sql -q "delete from xy where x > 500"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "4" ]
|
|
}
|
|
|
|
@test "stats: add/delete table" {
|
|
cd repo1
|
|
|
|
dolt sql -q "insert into ab values (0,0), (1,0), (2,0)"
|
|
|
|
# setting variables doesn't hang or error
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_threshold = .5"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
start_sql_server
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "2" ]
|
|
|
|
# add table
|
|
dolt sql -q "create table xy (x int primary key, y int)"
|
|
# schema changes don't impact the table hash
|
|
dolt sql -q "insert into xy values (0,0)"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics where table_name = 'xy'"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "1" ]
|
|
|
|
dolt sql -q "truncate table xy"
|
|
|
|
sleep 1
|
|
|
|
dolt sql -q "select * from xy"
|
|
|
|
dolt sql -q "select * from dolt_statistics where table_name = 'xy'"
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics where table_name = 'xy'"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "0" ]
|
|
|
|
dolt sql -q "drop table xy"
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics where table_name = 'xy'"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "0" ]
|
|
}
|
|
|
|
@test "stats: add/delete index" {
|
|
cd repo2
|
|
|
|
dolt sql -q "insert into xy values (0,0), (1,0), (2,0)"
|
|
|
|
# setting variables doesn't hang or error
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_threshold = .5"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
start_sql_server
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "2" ]
|
|
|
|
# delete secondary
|
|
dolt sql -q "alter table xy drop index yx"
|
|
# schema changes don't impact the table hash
|
|
dolt sql -q "insert into xy values (3,0)"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "1" ]
|
|
|
|
dolt sql -q "alter table xy add index yx (y,x)"
|
|
# row change to impact table hash
|
|
dolt sql -q "insert into xy values (4,0)"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "2" ]
|
|
}
|
|
|
|
@test "stats: most common values" {
|
|
cd repo2
|
|
|
|
dolt sql -q "alter table xy add index (y)"
|
|
dolt sql -q "insert into xy values (0,0), (1,0), (2,0), (3,0), (4,0), (5,0)"
|
|
|
|
# setting variables doesn't hang or error
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_threshold = .5"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
# auto refresh can only initialize at server startup
|
|
start_sql_server
|
|
|
|
# need to trigger at least one refresh cycle
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select mcv1 from dolt_statistics where index_name = 'y'"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "0" ]
|
|
|
|
sleep 1
|
|
|
|
dolt sql -q "update xy set y = 2 where x between 0 and 3"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select mcv1 as mcv from dolt_statistics where index_name = 'y' union select mcv2 as mcv from dolt_statistics where index_name = 'y' order by mcv"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "0" ]
|
|
[ "${lines[2]}" = "2" ]
|
|
}
|
|
|
|
@test "stats: multi db" {
|
|
cd repo1
|
|
dolt sql -q "insert into ab values (0,0), (1,1)"
|
|
|
|
cd ../repo2
|
|
dolt sql -q "insert into ab values (0,0), (1,1)"
|
|
dolt sql -q "insert into xy values (0,0), (1,1)"
|
|
|
|
cd ..
|
|
start_sql_server
|
|
sleep 1
|
|
stop_sql_server
|
|
|
|
run dolt sql -r csv -q "select database_name, table_name, index_name from dolt_statistics"
|
|
[ "$status" -eq 1 ]
|
|
[[ "$output" =~ "no statistics found" ]] || false
|
|
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_threshold = 0.5"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
start_sql_server
|
|
sleep 1
|
|
|
|
dolt sql -q "use repo1"
|
|
run dolt sql -r csv -q "select database_name, table_name, index_name from dolt_statistics order by index_name"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[0]}" = "database_name,table_name,index_name" ]
|
|
[ "${lines[1]}" = "repo1,ab,ba" ]
|
|
[ "${lines[2]}" = "repo1,ab,primary" ]
|
|
|
|
run dolt sql -r csv -q "select database_name, table_name, index_name from repo2.dolt_statistics order by index_name"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[0]}" = "database_name,table_name,index_name" ]
|
|
[ "${lines[1]}" = "repo2,ab,ba" ]
|
|
[ "${lines[2]}" = "repo2,ab,primary" ]
|
|
[ "${lines[3]}" = "repo2,xy,primary" ]
|
|
[ "${lines[4]}" = "repo2,xy,yx" ]
|
|
}
|
|
|
|
@test "stats: add/delete database" {
|
|
cd repo1
|
|
|
|
# setting variables doesn't hang or error
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_threshold = .5"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
start_sql_server
|
|
|
|
dolt sql -q "insert into ab values (0,0), (1,0), (2,0)"
|
|
dolt sql <<SQL
|
|
create database repo2;
|
|
create table repo2.xy (x int primary key, y int, key(y,x));
|
|
insert into repo2.xy values (0,0), (1,0), (2,0);
|
|
SQL
|
|
|
|
sleep 1
|
|
|
|
# specify database_name filter even though can only see active db stats
|
|
run dolt sql -r csv <<SQL
|
|
use repo2;
|
|
select count(*) from dolt_statistics where database_name = 'repo2';
|
|
SQL
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[2]}" = "2" ]
|
|
|
|
# drop repo2
|
|
dolt sql -q "drop database repo2"
|
|
|
|
sleep 1
|
|
|
|
# we can't access repo2 stats, but still try
|
|
run dolt sql -r csv <<SQL
|
|
select count(*) from dolt_statistics where database_name = 'repo2';
|
|
SQL
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "0" ]
|
|
|
|
dolt sql <<SQL
|
|
create database repo2;
|
|
create table repo2.xy (x int primary key, y int, key(y,x));
|
|
SQL
|
|
|
|
sleep 1
|
|
|
|
# no rows yet
|
|
run dolt sql -r csv <<SQL
|
|
use repo2;
|
|
select count(*) from dolt_statistics where database_name = 'repo2';
|
|
SQL
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[2]}" = "0" ]
|
|
|
|
dolt sql <<SQL
|
|
use repo2;
|
|
insert into xy values (0,0);
|
|
SQL
|
|
|
|
sleep 1
|
|
|
|
# insert initializes stats
|
|
run dolt sql -r csv <<SQL
|
|
use repo2;
|
|
select count(*) from dolt_statistics where database_name = 'repo2';
|
|
SQL
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[2]}" = "2" ]
|
|
}
|
|
|