Files
percona-toolkit/t/pt-table-checksum/basics.t
Sveta Smirnova 19baa34872 PT-2295 - Fix tests on distributions
- Fixed sporadic pt-tc failures on rolled back SHOW MASTER STATUS code
- Added better diagnostic info for sporadically failing t/pt-table-checksum/basics.t
- Decreased chunk size it t/pt-table-checksum/progress.t, so this test
  has less chances to fail, because pt-osc finishes faster than expected
2024-02-13 20:03:32 +03:00

600 lines
18 KiB
Perl

#!/usr/bin/env perl
BEGIN {
die "The PERCONA_TOOLKIT_BRANCH environment variable is not set.\n"
unless $ENV{PERCONA_TOOLKIT_BRANCH} && -d $ENV{PERCONA_TOOLKIT_BRANCH};
unshift @INC, "$ENV{PERCONA_TOOLKIT_BRANCH}/lib";
};
use strict;
use warnings FATAL => 'all';
use English qw(-no_match_vars);
use Test::More;
# Hostnames make testing less accurate. Tests need to see
# that such-and-such happened on specific slave hosts, but
# the sandbox servers are all on one host so all slaves have
# the same hostname.
$ENV{PERCONA_TOOLKIT_TEST_USE_DSN_NAMES} = 1;
use Data::Dumper;
use PerconaTest;
use Sandbox;
require "$trunk/bin/pt-table-checksum";
# We need to restart, so environment is clean for the
# "Default checksum" test
diag(`$trunk/sandbox/test-env restart`);
my $dp = new DSNParser(opts=>$dsn_opts);
my $sb = new Sandbox(basedir => '/tmp', DSNParser => $dp);
my $master_dbh = $sb->get_dbh_for('master');
my $slave1_dbh = $sb->get_dbh_for('slave1');
my $slave2_dbh = $sb->get_dbh_for('slave2');
if ( !$master_dbh ) {
plan skip_all => 'Cannot connect to sandbox master';
}
elsif ( !$slave1_dbh ) {
plan skip_all => 'Cannot connect to sandbox slave1';
}
elsif ( !@{$master_dbh->selectall_arrayref("show databases like 'sakila'")} ) {
plan skip_all => 'sakila database is not loaded';
} else {
plan tests => 40;
}
# The sandbox servers run with lock_wait_timeout=3 and it's not dynamic
# so we need to specify --set-vars innodb_lock_wait_timeout=3 else the tool will die.
my $master_dsn = 'h=127.1,P=12345,u=msandbox,p=msandbox';
my $slave2_dsn = 'h=127.1,P=12347,u=msandbox,p=msandbox';
my @args = ($master_dsn, qw(--set-vars innodb_lock_wait_timeout=3 --ignore-tables load_data));
my $row;
my $output;
my $exit_status;
my $sample = "t/pt-table-checksum/samples/";
my $outfile = '/tmp/pt-table-checksum-results';
my $repl_db = 'percona';
sub reset_repl_db {
$master_dbh->do("drop database if exists $repl_db");
$master_dbh->do("create database $repl_db");
$master_dbh->do("use $repl_db");
}
# ############################################################################
# Default checksum and results. The tool does not technically require any
# options on well-configured systems (which the test env cannot be). With
# nothing but defaults, it should create the repl table, checksum and check
# all tables, dynamically adjust the chunk size, and throttle itself and based
# on all slaves' lag. We don't explicitly test throttling here; that's done
# in throttle.t.
# ############################################################################
# 1
# We need to remove mysql.plugin and percona_test.checksums tables from the
# result and the sample, because they have different number of rows than default
# if run test with enabled MyRocks or TokuDB SE.
# We also need to remove mysql.global_grants because it contains dynamic privileges
# that could be modified by other tests. At the same time, privileges are not removed
# from this table after they have been added, so we cannot remove them when wipe cleaning
# sandbox. See https://dev.mysql.com/doc/refman/8.0/en/privileges-provided.html#static-dynamic-privileges
# This test often fails if run after other tests, we need to see what is wrong
# So we will re-run failed code if test does not pass.
my $cmd = sub { pt_table_checksum::main(@args) };
#diag(output($cmd))
ok(
no_diff(
$cmd,
"$sample/default-results-$sandbox_version.txt",
sed_out => '\'/mysql.plugin$/d; /percona_test.checksums$/d; /mysql.help_category$/d; /mysql.help_keyword$/d; /mysql.help_relation$/d; /mysql.help_topic$/d\'',
post_pipe => 'sed \'/mysql.plugin$/d; /percona_test.checksums$/d; /mysql.help_category$/d; /mysql.help_keyword$/d; /mysql.help_relation$/d; /mysql.help_topic$/d; /mysql.ndb_binlog_index$/d; /mysql.global_grants$/d\' | ' .
'awk \'{print $2 " " $3 " " $4 " " $7 " " $9}\'',
keep_ouput => 1,
),
"Default checksum"
) or diag($test_diff);
# On fast machines, the chunk size will probably be be auto-adjusted so
# large that all tables will be done in a single chunk without an index.
# Since this varies by default, there's no use checking the checksums
# other than to ensure that there's at least one for each table.
# 2
$row = $master_dbh->selectrow_arrayref("select count(*) from percona.checksums");
my $max_chunks = $sandbox_version < '5.7' ? 60 : 100;
ok(
$row->[0] > 25 && $row->[0] < $max_chunks,
"Between 25 and $max_chunks chunks"
) or diag($row->[0]);
# ############################################################################
# Static chunk size (disable --chunk-time)
# ############################################################################
# 3
# We need to remove mysql.plugin and percona_test.checksums tables from the
# result and the sample, because they have different number of rows than default
# if run test with enabled MyRocks or TokuDB SE
ok(
no_diff(
sub { pt_table_checksum::main(@args, qw(--chunk-time 0 --ignore-databases mysql)) },
"$sample/static-chunk-size-results-$sandbox_version.txt",
sed_out => '\'/mysql.plugin$/d; /percona_test.checksums$/d\'',
post_pipe => 'sed \'/mysql.plugin$/d; /percona_test.checksums$/d\' | ' .
'awk \'{print $2 " " $3 " " $4 " " $6 " " $7 " " $9}\'',
),
"Static chunk size (--chunk-time 0)"
);
$row = $master_dbh->selectrow_arrayref("select count(*) from percona.checksums");
my $max_rows = $sandbox_version >= '8.0' ? 102 : $sandbox_version < '5.7' ? 90 : 100;
ok(
$row->[0] >= 75 && $row->[0] <= $max_rows,
'Between 75 and 90 chunks on master'
) or diag($row->[0]);
my $row2 = $slave1_dbh->selectrow_arrayref("select count(*) from percona.checksums");
is(
$row2->[0],
$row->[0],
'... same number of chunks on slave'
) or diag($row->[0], ' ', $row2->[0]);
# ############################################################################
# --[no]replicate-check and, implicitly, the tool's exit status.
# ############################################################################
# Make one row on the slave differ.
$row = $slave1_dbh->selectrow_arrayref("select city, last_update from sakila.city where city_id=1");
$slave1_dbh->do("update sakila.city set city='test' where city_id=1");
$exit_status = pt_table_checksum::main(@args,
qw(--quiet -t sakila.city --chunk-size 1));
is(
$exit_status,
16, # = TABLE_DIFF but nothing else; https://bugs.launchpad.net/percona-toolkit/+bug/944051
"--replicate-check on by default, detects diff"
) or diag("exit status: $exit_status");
$exit_status = pt_table_checksum::main(@args,
qw(--quiet --quiet -t sakila.city --no-replicate-check));
is(
$exit_status,
0,
"--no-replicate-check, no diff detected"
);
# Restore the row on the slave, else other tests will fail.
$slave1_dbh->do("update sakila.city set city='$row->[0]', last_update='$row->[1]' where city_id=1");
# #############################################################################
# --[no]empty-replicate-table
# Issue 21: --empty-replicate-table doesn't empty if previous runs leave info
# #############################################################################
$sb->wipe_clean($master_dbh);
$sb->load_file('master', 't/pt-table-checksum/samples/issue_21.sql');
# Run once to populate the repl table.
pt_table_checksum::main(@args, qw(--quiet --quiet -t test.issue_21),
qw(--chunk-time 0 --chunk-size 2));
# Insert two fake rows into the repl table. The first row tests that
# --empty-replicate-table deletes all rows for each checksummed table,
# and the second row tests that if a table isn't checksummed, then its
# rows aren't deleted.
$master_dbh->do("INSERT INTO percona.checksums VALUES ('test', 'issue_21', 999, 0.00, 'idx', '0', '0', '0', 0, '0', 0, NOW())");
$master_dbh->do("INSERT INTO percona.checksums VALUES ('test', 'other_tbl', 1, 0.00, 'idx', '0', '0', '0', 0, '0', 0, NOW())");
pt_table_checksum::main(@args, qw(--quiet --quiet -t test.issue_21),
qw(--chunk-time 0 --chunk-size 2));
$row = $master_dbh->selectall_arrayref("SELECT tbl, chunk FROM percona.checksums WHERE db='test' ORDER BY tbl, chunk");
is_deeply(
$row,
[
[qw(issue_21 1)],
[qw(issue_21 2)],
[qw(issue_21 3)],
[qw(issue_21 4)], # lower oob
[qw(issue_21 5)], # upper oob
# fake row for chunk 999 is gone
[qw(other_tbl 1)], # this row is still here
],
"--emptry-replicate-table on by default"
) or print STDERR Dumper($row);
# ############################################################################
# --[no]recheck
# ############################################################################
$exit_status = pt_table_checksum::main(@args,
qw(--quiet --quiet --chunk-time 0 --chunk-size 100 -t sakila.city));
$slave1_dbh->do("update percona.checksums set this_crc='' where db='sakila' and tbl='city' and (chunk=1 or chunk=6)");
PerconaTest::wait_for_table($slave2_dbh, "percona.checksums", "db='sakila' and tbl='city' and (chunk=1 or chunk=6) and thic_crc=''");
# 9
ok(
no_diff(
sub { pt_table_checksum::main(@args, qw(--replicate-check-only)) },
"$sample/no-recheck.txt",
),
"--no-recheck (just --replicate-check)"
);
# ############################################################################
# Detect infinite loop.
# ############################################################################
$sb->load_file('master', "t/pt-table-checksum/samples/oversize-chunks.sql");
$output = output(
sub { pt_table_checksum::main(@args, qw(-t osc.t --chunk-size 10)) },
stderr => 1,
);
# 10
like(
$output,
qr/infinite loop detected/,
"Detects infinite loop"
);
# ############################################################################
# Oversize chunk.
# ############################################################################
# 11
ok(
no_diff(
sub { pt_table_checksum::main(@args,
qw(-t osc.t2 --chunk-size 8 --explain --explain)) },
"$sample/oversize-chunks.txt",
),
"Upper boundary same as next lower boundary",
);
$output = output(
sub { pt_table_checksum::main(@args,
qw(-t osc.t2 --chunk-time 0 --chunk-size 8 --chunk-size-limit 1)) },
stderr => 1,
);
is(
PerconaTest::count_checksum_results($output, 'skipped'),
2,
"Skipped oversize chunks"
);
is(
PerconaTest::count_checksum_results($output, 'errors'),
0,
"Oversize chunks are not errors"
);
# SKIPPED should be accurate if the first skipped chunk # > 1.
# https://bugs.launchpad.net/percona-toolkit/+bug/1011738
$output = output(
sub { pt_table_checksum::main(@args,
qw(-t osc.t --chunk-size 6 --chunk-size-limit 1)) },
stderr => 1,
);
like(
$output,
qr/Skipping chunk 2/i,
"Skipped chunk 2"
);
is(
PerconaTest::count_checksum_results($output, 'skipped'),
1,
"Skipped 1 chunk (bug 1011738)"
) or diag($output);
# ############################################################################
# Check slave table row est. if doing doing 1=1 on master table.
# ############################################################################
$master_dbh->do('truncate table percona.checksums');
$sb->load_file('master', "t/pt-table-checksum/samples/3tbl-resume.sql");
$master_dbh->do('set sql_log_bin=0');
$master_dbh->do('truncate table test.t1');
$master_dbh->do('set sql_log_bin=1');
$output = output(
sub {
$exit_status = pt_table_checksum::main(@args, qw(-d test --chunk-size 2))
},
stderr => 1,
);
like(
$output,
qr/Skipping table test.t1/,
"Warns about skipping large slave table"
);
is_deeply(
$master_dbh->selectall_arrayref("select distinct tbl from percona.checksums where db='test'"),
[ ['t2'], ['t3'] ],
"Does not checksum large slave table on master"
);
is_deeply(
$slave1_dbh->selectall_arrayref("select distinct tbl from percona.checksums where db='test'"),
[ ['t2'], ['t3'] ],
"Does not checksum large slave table on slave"
);
is(
$exit_status,
64, # SKIP_TABLE
"Non-zero exit status"
);
is(
PerconaTest::count_checksum_results($output, 'skipped'),
0,
"0 skipped"
);
is(
PerconaTest::count_checksum_results($output, 'errors'),
0,
"0 errors"
);
is(
PerconaTest::count_checksum_results($output, 'rows'),
52,
"52 rows checksummed"
);
# #############################################################################
# pt-table-checksum chunk-size-limit of 0 does not disable chunk size limit
# checking
# https://bugs.launchpad.net/percona-toolkit/+bug/938660
# #############################################################################
# Decided _not_ to do this; we want to always check slave table size when
# single-chunking a table on the master.
$output = output(
sub {
$exit_status = pt_table_checksum::main(@args,
qw(-d test --chunk-size 2 --chunk-size-limit 0))
},
stderr => 1,
);
like(
$output,
qr/Skipping table test.t1/,
"--chunk-size-limit=0 does not disable #-of-rows checks on slaves"
);
# #############################################################################
# Crash if no host in DSN.
# https://bugs.launchpad.net/percona-toolkit/+bug/819450
# http://code.google.com/p/maatkit/issues/detail?id=1332
# #############################################################################
$output = output(
sub { $exit_status = pt_table_checksum::main(
qw(--user msandbox --pass msandbox),
qw(-S /tmp/12345/mysql_sandbox12345.sock --set-vars innodb_lock_wait_timeout=3 --run-time 8)) },
stderr => 1,
);
# This test no longer works because of
# https://bugs.launchpad.net/percona-toolkit/+bug/1087804
# So comment out this test...
#is(
# $exit_status,
# 0,
# "No host in DSN, zero exit status"
#) or diag($output);
# ... and use this one instead:
# Aaaaand this one also no longer works because of
# https://bugs.launchpad.net/percona-toolkit/+bug/1042727
# pt-table-checksum will keep trying to find a slave ... forever.
# (notice the --runtime in the original command otherwise it loops forever)
# So we comment out these other 2 tests
#like(
# $output,
# qr/sakila.store/,
# "No host in DSN, checksums happened"
#) or diag($output);
#is(
# PerconaTest::count_checksum_results($output, 'errors'),
# 0,
# "No host in DSN, 0 errors"
#) or diag($output);
# and instead check if it waits for slaves
# This test is no longer working
# TODO: double check messages
# like(
# $output,
# qr/replica.*stopped.*waiting/i,
# "Warns when waiting for replicas."
# ) or diag($output);
#
# Check if no slaves were found. Bug 1087804:
# Notice we simply execute the command but on 12347, the slaveless slave.
$output = output(
sub { $exit_status = pt_table_checksum::main(
qw(--user msandbox --pass msandbox),
('--set-vars', 'innodb_lock_wait_timeout=3', '--run-time', '5', $slave2_dsn )) },
stderr => 1,
);
like(
$output,
qr/no slaves were found/,
"Warns when no slave are found (bug 1087804)"
) or diag($output);
is(
$exit_status,
8, # https://bugs.launchpad.net/percona-toolkit/+bug/944051
"Exit status 8 when no slaves are found (bug 1087804)"
) or diag($output);
# #############################################################################
# Test --where.
# #############################################################################
$sb->load_file('master', 't/pt-table-checksum/samples/600cities.sql');
$master_dbh->do("LOAD DATA INFILE '$trunk/t/pt-table-checksum/samples/600cities.data' INTO TABLE test.t");
$output = output(
sub { $exit_status = pt_table_checksum::main(@args,
qw(-t test.t --chunk-size 20 --explain --explain),
"--where", "id>=100 AND id<=200"); },
stderr => 1,
);
like(
$output,
qr/^REPLACE INTO.+?id>=100 AND id<=200.+?checksum chunk/m,
"--where in checksum chunk query"
);
like(
$output,
qr/^REPLACE INTO.+?id>=100 AND id<=200.+?past lower chunk/m,
"--where in past lower chunk query"
);
like(
$output,
qr/^REPLACE INTO.+?id>=100 AND id<=200.+?past upper chunk/m,
"--where in past upper chunk query"
);
like(
$output,
qr/^SELECT.+?id>=100 AND id<=200.+?next chunk boundary/m,
"--where in next chunk boundary query"
);
like(
$output,
qr/^1\s+100\s+119/m,
"--where for first chunk"
);
like(
$output,
qr/^6\s+200\s+200/m,
"--where for last chunk"
);
like(
$output,
qr/^7\s+100$/m,
"--where for lower oob chunk"
);
like(
$output,
qr/^8\s+200\s+$/m,
"--where for upper oob chunk"
);
# #############################################################################
# Bug 932442: column with 2 spaces
# #############################################################################
$sb->load_file('master', "t/pt-table-checksum/samples/2-space-col.sql");
$output = output(
sub { $exit_status = pt_table_checksum::main(@args,
qw(-t test.t --chunk-size 3)) },
stderr => 1,
);
is(
$exit_status,
0,
"Bug 932442: 0 exit"
);
is(
PerconaTest::count_checksum_results($output, 'errors'),
0,
"Bug 932442: 0 errors"
);
# #############################################################################
# Bug 821675: can't parse column names containing periods
# #############################################################################
$sb->load_file('master', "t/pt-table-checksum/samples/dot.sql");
ok(
no_diff(
sub { pt_table_checksum::main(@args,
qw(-t test.t --chunk-size 3 --explain --explain))
},
"t/pt-table-checksum/samples/dot.out",
),
"Bug 821675 (dot): queries"
);
$output = output(
sub { $exit_status = pt_table_checksum::main(@args,
qw(-t test.t --chunk-size 3 --explain --explain)) },
stderr => 1,
);
is(
$exit_status,
0,
"Bug 821675 (dot): 0 exit"
);
is(
PerconaTest::count_checksum_results($output, 'errors'),
0,
"Bug 821675 (dot): 0 errors"
);
# #############################################################################
# Bug 1019479: does not work with sql_mode ONLY_FULL_GROUP_BY
# #############################################################################
# add a couple more modes to test that commas don't affect setting
$master_dbh->do("SET sql_mode = 'NO_ZERO_DATE,ONLY_FULL_GROUP_BY,STRICT_ALL_TABLES'");
# force chunk-size because bug doesn't show up if table done in one chunk
$exit_status = pt_table_checksum::main(@args,
qw(--quiet --quiet -t sakila.actor --chunk-size=50));
is(
$exit_status,
0,
"sql_mode ONLY_FULL_GROUP_BY is overidden"
);
DONE:
# #############################################################################
# Done.
# #############################################################################
$sb->wipe_clean($master_dbh);
ok($sb->ok(), "Sandbox servers") or BAIL_OUT(__FILE__ . " broke the sandbox");
done_testing;