Wait for --replicate table to repl on all slaves. Add wait_for arg to PerconaTest::full_output().

This commit is contained in:
Daniel Nichter
2012-06-05 12:29:26 -04:00
parent 95f7e53feb
commit 4f83cf4102
4 changed files with 104 additions and 5 deletions

View File

@@ -6274,6 +6274,7 @@ sub main {
check_repl_table( check_repl_table(
dbh => $master_dbh, dbh => $master_dbh,
repl_table => $repl_table, repl_table => $repl_table,
slaves => $slaves,
OptionParser => $o, OptionParser => $o,
TableParser => $tp, TableParser => $tp,
Quoter => $q, Quoter => $q,
@@ -7210,11 +7211,11 @@ sub print_checksum_diffs {
sub check_repl_table { sub check_repl_table {
my ( %args ) = @_; my ( %args ) = @_;
my @required_args = qw(dbh repl_table OptionParser TableParser Quoter); my @required_args = qw(dbh repl_table slaves OptionParser TableParser Quoter);
foreach my $arg ( @required_args ) { foreach my $arg ( @required_args ) {
die "I need a $arg argument" unless $args{$arg}; die "I need a $arg argument" unless $args{$arg};
} }
my ($dbh, $repl_table, $o, $tp, $q) = @args{@required_args}; my ($dbh, $repl_table, $slaves, $o, $tp, $q) = @args{@required_args};
PTDEBUG && _d('Checking --replicate table', $repl_table); PTDEBUG && _d('Checking --replicate table', $repl_table);
# If the repl db doesn't exist, auto-create it, maybe. # If the repl db doesn't exist, auto-create it, maybe.
@@ -7265,6 +7266,43 @@ sub check_repl_table {
. "$repl_table.\n" unless $have_tbl_privs; . "$repl_table.\n" unless $have_tbl_privs;
} }
# Check and wait for the repl table to appear on all slaves.
# https://bugs.launchpad.net/percona-toolkit/+bug/1008778
#
# Each slave is polled in turn with TableParser::check_table() until the
# check succeeds.  There is no timeout: a slave that never receives the
# table blocks here indefinitely.  If --progress is set, a Progress
# reporter prints which slave is being waited on to STDERR.
if ( scalar @$slaves ) {
   my $waiting_for;  # slave currently being polled; read by the callback
   my $pr;           # Progress reporter, only created if --progress is set
   if ( $o->get('progress') ) {
      # Direct method call instead of indirect-object "new Progress(...)".
      $pr = Progress->new(
         jobsize  => scalar @$slaves,
         spec     => $o->get('progress'),
         callback => sub {
            print STDERR "Waiting for the --replicate table to replicate to "
               . $waiting_for->name() . "...\n";
         },
      );
      $pr->start();
   }

   foreach my $slave ( @$slaves ) {
      PTDEBUG && _d('Checking if', $slave->name(), 'has repl table');
      $waiting_for = $slave;

      # Poll until the slave has the table.  The check runs once before
      # any progress update or sleep, so a slave that already has the
      # table costs a single check and no delay.
      until ( $tp->check_table(
                 dbh => $slave->dbh(),
                 db  => $db,
                 tbl => $tbl,
              ) )
      {
         # The update callback always returns 0.
         $pr->update(sub { return 0; }) if $pr;
         # NOTE(review): assumes Time::HiRes::sleep is imported in this
         # package; core sleep() would truncate 0.5 to 0 -- TODO confirm.
         sleep 0.5;
      }
   }
}
return; # success, repl table is ready to go return; # success, repl table is ready to go
} }

View File

@@ -742,7 +742,7 @@ sub _d {
# This is because otherwise, errors thrown during cleanup # This is because otherwise, errors thrown during cleanup
# would be skipped. # would be skipped.
sub full_output { sub full_output {
my ( $code ) = @_; my ( $code, %args ) = @_;
die "I need a code argument" unless $code; die "I need a code argument" unless $code;
my (undef, $file) = tempfile(); my (undef, $file) = tempfile();
@@ -755,6 +755,19 @@ sub full_output {
my $status; my $status;
warn $file; warn $file;
if (my $pid = fork) { if (my $pid = fork) {
if ( my $run_secs = $args{wait_for} ) {
   # Let the child run for the requested number of seconds, then
   # start trying to stop it.
   sleep $run_secs;

   # Send SIGTERM up to three times while the pid still exists,
   # because most tools require 2 interrupts to make them stop.
   my $attempts_left = 3;
   while ( kill(0, $pid) && $attempts_left-- ) {
      kill(SIGTERM, $pid);
      sleep 0.10;
   }

   # Child still there after the SIGTERMs?  Then kill -9 it.
   if ( kill(0, $pid) ) {
      kill(SIGKILL, $pid);
   }

   # Brief pause before the caller reaps the child.
   sleep 0.25;
}
waitpid($pid, 0); waitpid($pid, 0);
$status = $?; $status = $?;
} }

View File

@@ -39,10 +39,9 @@ elsif ( !$slave2_dbh ) {
plan skip_all => 'Cannot connect to sandbox slave2'; plan skip_all => 'Cannot connect to sandbox slave2';
} }
else { else {
plan tests => 4; plan tests => 5;
} }
# The sandbox servers run with lock_wait_timeout=3 and it's not dynamic # The sandbox servers run with lock_wait_timeout=3 and it's not dynamic
# so we need to specify --lock-wait-timeout=3 else the tool will die. # so we need to specify --lock-wait-timeout=3 else the tool will die.
# And --max-load "" prevents waiting for status variables. Setting # And --max-load "" prevents waiting for status variables. Setting
@@ -99,6 +98,40 @@ is(
# Now wait until the SQL thread is started again. # Now wait until the SQL thread is started again.
wait_until_slave_running($slave1_dbh, $slave2_dbh); wait_until_slave_running($slave1_dbh, $slave2_dbh);
# #############################################################################
# Wait for --replicate table to replicate.
# https://bugs.launchpad.net/percona-toolkit/+bug/1008778
# #############################################################################

# Drop the percona db on the master and wait until slave2 no longer has it.
$master_dbh->do("DROP DATABASE IF EXISTS percona");
wait_until(sub {
   my $dbs = $slave2_dbh->selectall_arrayref("SHOW DATABASES");
   return !grep { $_->[0] eq 'percona' } @$dbs;
});

# Load the DSN table used by --recursion-method dsn=... below.
$sb->load_file('master', "t/pt-table-checksum/samples/dsn-table.sql");

# Stop replication on slave2 and wait until it has really stopped.  The
# check must be for 'No': waiting for 'Yes' after STOP SLAVE can only
# succeed if the thread has not stopped yet.
$slave2_dbh->do("STOP SLAVE");
wait_until(sub {
   my $ss = $slave2_dbh->selectrow_hashref("SHOW SLAVE STATUS");
   return $ss->{slave_io_running} eq 'No';
});

# Run the tool for a few seconds and then kill it.  With slave2 stopped,
# the tool is expected to be printing its "Waiting for..." progress
# message for that slave.
($output) = PerconaTest::full_output(
   sub { pt_table_checksum::main(@args, qw(-t sakila.country),
      "--recursion-method", "dsn=F=/tmp/12345/my.sandbox.cnf,t=dsns.dsns");
   },
   wait_for => 3,  # wait this many seconds then kill that ^
);

like(
   $output,
   qr/Waiting for the --replicate table to replicate to h=127.1,P=12347/,
   "--progress for --replicate table (bug 1008778)"
);

# Restore replication on slave2 for whatever runs next.
$slave2_dbh->do("START SLAVE");
wait_until_slave_running($slave2_dbh);

# ############################################################################# # #############################################################################
# Done. # Done.
# ############################################################################# # #############################################################################

View File

@@ -0,0 +1,15 @@
-- Recreates the dsns database from scratch, with one dsns table that
-- holds one DSN string per row, each linked to a parent row by parent_id.
DROP DATABASE IF EXISTS dsns;
CREATE DATABASE dsns;
USE dsns;

CREATE TABLE dsns (
  id        INT AUTO_INCREMENT PRIMARY KEY,
  parent_id INT DEFAULT NULL,
  dsn       VARCHAR(255) NOT NULL
);

-- The master row is deliberately left commented out; only the rows for
-- ports 12346 and 12347 are inserted (presumably the two sandbox
-- slaves -- verify against the sandbox setup).
INSERT INTO dsns (id, parent_id, dsn) VALUES
  -- (1, null, 'h=127.1,P=12345,u=msandbox,p=msandbox'), -- master
  (2, 1, 'h=127.1,P=12346,u=msandbox,p=msandbox'),
  (3, 2, 'h=127.1,P=12347,u=msandbox,p=msandbox');