mirror of
https://github.com/dolthub/dolt.git
synced 2026-05-05 02:45:34 -05:00
801a82a3af
* starter * prog * flush out statsdb interface fork, and noms implementation * more progress on tests * StatsIO tests passing * pretty close, thread canceller still broken * check context dropped inside refresh loop * tidy * nil panic * dolt harness setup imports setup statistics * lot of test fixes * bump * fmt * fix providers race * don't load in create database hook * bump * bump * fix integration tests * fix more bugs * fix drop * more test fixes * cleanup * missing updateActive * simplify bucket merging * nick comments * bump * fix bad merge * tidy and edits * [ga-format-pr] Run go/utils/repofmt/format_repo.sh and go/Godeps/update.sh * bump test fixes * bump * fix bats * bump * [ga-format-pr] Run go/utils/repofmt/format_repo.sh and go/Godeps/update.sh * redo create db to account for variety of edge cases * try path.join --------- Co-authored-by: max-hoffman <max-hoffman@users.noreply.github.com>
350 lines
9.4 KiB
Bash
350 lines
9.4 KiB
Bash
#!/usr/bin/env bats
|
|
load $BATS_TEST_DIRNAME/helper/common.bash
|
|
load $BATS_TEST_DIRNAME/helper/query-server-common.bash
|
|
|
|
# Per-test fixture.
#
# Skips on Windows and when SQL_ENGINE is "remote-engine", then builds two
# dolt repositories under "$(pwd)/tmpdirs":
#   repo1: table ab (primary key a, secondary index on (b,a))
#   repo2: tables xy (primary key x, secondary index on (y,x)) and ab
# The test body starts with its working directory set to $TMPDIRS.
#
# Globals: SQL_ENGINE (read), TMPDIRS (written)
setup() {
    skiponwindows "tests are flaky on Windows"
    if [ "$SQL_ENGINE" = "remote-engine" ]; then
        skip "This test tests remote connections directly, SQL_ENGINE is not needed."
    fi

    setup_common

    # Quote every expansion of TMPDIRS so a working directory that contains
    # whitespace does not get word-split into several paths.
    TMPDIRS="$(pwd)/tmpdirs"
    mkdir -p "$TMPDIRS"/{repo1,repo2}

    cd "$TMPDIRS/repo1"
    dolt init

    dolt sql <<SQL
create table ab (a int primary key, b int, key (b,a));
SQL

    cd "$TMPDIRS/repo2"
    dolt init

    dolt sql <<SQL
create table xy (x int primary key, y int, key (y,x));
create table ab (a int primary key, b int, key (b,a));
SQL

    cd "$TMPDIRS"
}
|
|
|
|
# Per-test cleanup: runs the shared teardown, stops the SQL server, removes
# the repositories created by setup(), and leaves the deleted tree by
# changing to $BATS_TMPDIR.
#
# Globals: TMPDIRS (read), BATS_TMPDIR (read)
teardown() {
    teardown_common
    stop_sql_server 1

    # TMPDIRS is only assigned once setup() gets past its skip checks, so it
    # may be unset here. Quote it (and stop option parsing with --) so a path
    # containing whitespace can never make rm delete unrelated files.
    if [ -n "${TMPDIRS:-}" ]; then
        rm -rf -- "$TMPDIRS"
    fi
    cd "$BATS_TMPDIR"
}
|
|
|
|
@test "stats: empty initial stats" {
|
|
cd repo2
|
|
|
|
dolt sql -q "insert into xy values (0,0), (1,1)"
|
|
|
|
start_sql_server
|
|
sleep 1
|
|
stop_sql_server
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "0" ]
|
|
|
|
# setting variables doesn't hang or error
|
|
dolt sql -q "set @@PERSIST.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "set @@PERSIST.dolt_stats_auto_refresh_threshold = .5"
|
|
dolt sql -q "set @@PERSIST.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
# auto refresh initialize at server startup
|
|
start_sql_server
|
|
|
|
# need to trigger at least one refresh cycle
|
|
sleep 1
|
|
|
|
# only statistics for non-empty tables are collected
|
|
run dolt sql -r csv -q "select database_name, table_name, index_name from dolt_statistics order by index_name"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[0]}" = "database_name,table_name,index_name" ]
|
|
[ "${lines[1]}" = "repo2,xy,primary" ]
|
|
[ "${lines[2]}" = "repo2,xy,yx" ]
|
|
|
|
# appending new chunks picked up
|
|
dolt sql -q "insert into xy select x, 1 from (with recursive inputs(x) as (select 4 union select x+1 from inputs where x < 1000) select * from inputs) dt;"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "8" ]
|
|
|
|
# updates picked up
|
|
dolt sql -q "update xy set y = 2 where x between 100 and 800"
|
|
|
|
sleep 1
|
|
|
|
dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "8" ]
|
|
}
|
|
|
|
@test "stats: deletes refresh" {
|
|
cd repo2
|
|
|
|
dolt sql -q "insert into xy select x, 1 from (with recursive inputs(x) as (select 4 union select x+1 from inputs where x < 1000) select * from inputs) dt;"
|
|
|
|
# setting variables doesn't hang or error
|
|
dolt sql -q "set @@persist.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "set @@persist.dolt_stats_auto_refresh_threshold = .5"
|
|
dolt sql -q "set @@persist.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
start_sql_server
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "8" ]
|
|
|
|
# delete >50% of rows
|
|
dolt sql -q "delete from xy where x > 600"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "4" ]
|
|
}
|
|
|
|
@test "stats: add/delete table" {
|
|
cd repo1
|
|
|
|
dolt sql -q "insert into ab values (0,0), (1,0), (2,0)"
|
|
|
|
# setting variables doesn't hang or error
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_threshold = .5"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
start_sql_server
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "2" ]
|
|
|
|
# add table
|
|
dolt sql -q "create table xy (x int primary key, y int)"
|
|
# schema changes don't impact the table hash
|
|
dolt sql -q "insert into xy values (0,0)"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics where table_name = 'xy'"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "1" ]
|
|
|
|
dolt sql -q "truncate table xy"
|
|
|
|
sleep 1
|
|
|
|
dolt sql -q "select * from xy"
|
|
|
|
dolt sql -q "select * from dolt_statistics where table_name = 'xy'"
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics where table_name = 'xy'"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "0" ]
|
|
|
|
dolt sql -q "drop table xy"
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics where table_name = 'xy'"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "0" ]
|
|
}
|
|
|
|
@test "stats: add/delete index" {
|
|
cd repo2
|
|
|
|
dolt sql -q "insert into xy values (0,0), (1,0), (2,0)"
|
|
|
|
# setting variables doesn't hang or error
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_threshold = .5"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
start_sql_server
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "2" ]
|
|
|
|
# delete secondary
|
|
dolt sql -q "alter table xy drop index yx"
|
|
# schema changes don't impact the table hash
|
|
dolt sql -q "insert into xy values (3,0)"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "1" ]
|
|
|
|
dolt sql -q "alter table xy add index yx (y,x)"
|
|
# row change to impact table hash
|
|
dolt sql -q "insert into xy values (4,0)"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "2" ]
|
|
}
|
|
|
|
@test "stats: most common values" {
|
|
cd repo2
|
|
|
|
dolt sql -q "alter table xy add index (y)"
|
|
dolt sql -q "insert into xy values (0,0), (1,0), (2,0), (3,0), (4,0), (5,0)"
|
|
|
|
# setting variables doesn't hang or error
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_threshold = .5"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
# auto refresh can only initialize at server startup
|
|
start_sql_server
|
|
|
|
# need to trigger at least one refresh cycle
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select mcv1 from dolt_statistics where index_name = 'y'"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "0" ]
|
|
|
|
sleep 1
|
|
|
|
dolt sql -q "update xy set y = 2 where x between 0 and 3"
|
|
|
|
sleep 1
|
|
|
|
run dolt sql -r csv -q "select mcv1 as mcv from dolt_statistics where index_name = 'y' union select mcv2 as mcv from dolt_statistics where index_name = 'y' order by mcv"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "0" ]
|
|
[ "${lines[2]}" = "2" ]
|
|
}
|
|
|
|
@test "stats: multi db" {
|
|
cd repo1
|
|
dolt sql -q "insert into ab values (0,0), (1,1)"
|
|
|
|
cd ../repo2
|
|
dolt sql -q "insert into ab values (0,0), (1,1)"
|
|
dolt sql -q "insert into xy values (0,0), (1,1)"
|
|
|
|
cd ..
|
|
start_sql_server
|
|
sleep 1
|
|
stop_sql_server
|
|
|
|
run dolt sql -r csv -q "select count(*) from dolt_statistics"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "0" ]
|
|
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_threshold = 0.5"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
start_sql_server
|
|
sleep 1
|
|
|
|
dolt sql -q "use repo1"
|
|
run dolt sql -r csv -q "select database_name, table_name, index_name from dolt_statistics order by index_name"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[0]}" = "database_name,table_name,index_name" ]
|
|
[ "${lines[1]}" = "repo1,ab,ba" ]
|
|
[ "${lines[2]}" = "repo1,ab,primary" ]
|
|
|
|
run dolt sql -r csv -q "select database_name, table_name, index_name from repo2.dolt_statistics order by index_name"
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[0]}" = "database_name,table_name,index_name" ]
|
|
[ "${lines[1]}" = "repo2,ab,ba" ]
|
|
[ "${lines[2]}" = "repo2,ab,primary" ]
|
|
[ "${lines[3]}" = "repo2,xy,primary" ]
|
|
[ "${lines[4]}" = "repo2,xy,yx" ]
|
|
}
|
|
|
|
@test "stats: add/delete database" {
|
|
cd repo1
|
|
|
|
# setting variables doesn't hang or error
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_enabled = 1;"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_threshold = .5"
|
|
dolt sql -q "SET @@persist.dolt_stats_auto_refresh_interval = 1;"
|
|
|
|
start_sql_server
|
|
|
|
dolt sql -q "insert into ab values (0,0), (1,0), (2,0)"
|
|
dolt sql <<SQL
|
|
create database repo2;
|
|
create table repo2.xy (x int primary key, y int, key(y,x));
|
|
insert into repo2.xy values (0,0), (1,0), (2,0);
|
|
SQL
|
|
|
|
sleep 1
|
|
|
|
# specify database_name filter even though can only see active db stats
|
|
run dolt sql -r csv <<SQL
|
|
use repo2;
|
|
select count(*) from dolt_statistics where database_name = 'repo2';
|
|
SQL
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[2]}" = "2" ]
|
|
|
|
# drop repo2
|
|
dolt sql -q "drop database repo2"
|
|
|
|
sleep 1
|
|
|
|
# we can't access repo2 stats, but still try
|
|
run dolt sql -r csv <<SQL
|
|
select count(*) from dolt_statistics where database_name = 'repo2';
|
|
SQL
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[1]}" = "0" ]
|
|
|
|
dolt sql <<SQL
|
|
create database repo2;
|
|
create table repo2.xy (x int primary key, y int, key(y,x));
|
|
SQL
|
|
|
|
sleep 1
|
|
|
|
# no rows yet
|
|
run dolt sql -r csv <<SQL
|
|
use repo2;
|
|
select count(*) from dolt_statistics where database_name = 'repo2';
|
|
SQL
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[2]}" = "0" ]
|
|
|
|
dolt sql <<SQL
|
|
use repo2;
|
|
insert into xy values (0,0);
|
|
SQL
|
|
|
|
sleep 1
|
|
|
|
# insert initializes stats
|
|
run dolt sql -r csv <<SQL
|
|
use repo2;
|
|
select count(*) from dolt_statistics where database_name = 'repo2';
|
|
SQL
|
|
[ "$status" -eq 0 ]
|
|
[ "${lines[2]}" = "2" ]
|
|
}
|
|
|