Commit 87679ac9 authored by Alfranio Correia's avatar Alfranio Correia

BUG#38197 Errors in @@init_slave not visible in 'show slave status'

      
Some errors that cause the slave SQL thread to stop are not shown in the
Slave_SQL_Error column of "SHOW SLAVE STATUS". Instead, the error is only 
in the server's error log.
      
That makes it difficult to analyze the error for the user. One example of an error
that stops the slave but is not shown by "SHOW SLAVE STATUS" is when @@global.init_slave
is set incorrectly (e.g., it contains something that is not valid SQL).
      
Three failures were not correctly reported:
      
1 - Failures during slave thread initialization
2 - Failures while initializing the relay log position right after
starting the slave thread.
3 - Failures while processing queries passed through the init_slave
option.
      
This patch fixes the issues by reporting the errors through relay-info->report.
parent 97362981
reset master; reset master;
call mtr.add_suppression("Failed during slave.*thread initialization"); call mtr.add_suppression("Failed during slave thread initialization");
stop slave; stop slave;
reset slave; reset slave;
SET GLOBAL debug="d,simulate_io_slave_error_on_init,simulate_sql_slave_error_on_init"; SET GLOBAL debug="d,simulate_io_slave_error_on_init,simulate_sql_slave_error_on_init";
...@@ -23,8 +23,8 @@ Replicate_Do_Table ...@@ -23,8 +23,8 @@ Replicate_Do_Table
Replicate_Ignore_Table Replicate_Ignore_Table
Replicate_Wild_Do_Table Replicate_Wild_Do_Table
Replicate_Wild_Ignore_Table Replicate_Wild_Ignore_Table
Last_Errno 0 Last_Errno #
Last_Error Last_Error Failed during slave thread initialization
Skip_Counter 0 Skip_Counter 0
Exec_Master_Log_Pos 0 Exec_Master_Log_Pos 0
Relay_Log_Space # Relay_Log_Space #
...@@ -41,6 +41,6 @@ Seconds_Behind_Master # ...@@ -41,6 +41,6 @@ Seconds_Behind_Master #
Master_SSL_Verify_Server_Cert No Master_SSL_Verify_Server_Cert No
Last_IO_Errno 0 Last_IO_Errno 0
Last_IO_Error Last_IO_Error
Last_SQL_Errno 0 Last_SQL_Errno #
Last_SQL_Error Last_SQL_Error Failed during slave thread initialization
SET GLOBAL debug=""; SET GLOBAL debug="";
stop slave;
drop table if exists t1,t2,t3,t4,t5,t6,t7,t8,t9;
reset master;
reset slave;
drop table if exists t1,t2,t3,t4,t5,t6,t7,t8,t9;
start slave;
stop slave;
reset slave;
SET GLOBAL debug= "d,simulate_io_slave_error_on_init,simulate_sql_slave_error_on_init";
start slave;
Reporting the following error: Failed during slave thread initialization
SET GLOBAL debug= "";
stop slave;
reset slave;
SET GLOBAL init_slave= "garbage";
start slave;
Reporting the following error: Slave SQL thread aborted. Can't execute init_slave query
SET GLOBAL init_slave= "";
...@@ -15,7 +15,7 @@ reset master; ...@@ -15,7 +15,7 @@ reset master;
connection slave; connection slave;
# Add suppression for expected warnings in slaves error log # Add suppression for expected warnings in slaves error log
call mtr.add_suppression("Failed during slave.*thread initialization"); call mtr.add_suppression("Failed during slave thread initialization");
--disable_warnings --disable_warnings
stop slave; stop slave;
...@@ -38,7 +38,7 @@ connection slave; ...@@ -38,7 +38,7 @@ connection slave;
source include/wait_for_slave_to_stop.inc; source include/wait_for_slave_to_stop.inc;
--replace_result $MASTER_MYPORT MASTER_PORT --replace_result $MASTER_MYPORT MASTER_PORT
--replace_column 1 # 8 # 9 # 23 # 33 # --replace_column 1 # 8 # 9 # 19 # 23 # 33 # 37 #
query_vertical show slave status; query_vertical show slave status;
# #
......
######################################################################
# Some errors that cause the slave SQL thread to stop are not shown in
# the Slave_SQL_Error column of "SHOW SLAVE STATUS". Instead, the error
# is only in the server's error log.
#
# Two failures and their respective reporting are verified:
#
# 1 - Failures during slave thread initialization
# 2 - Failures while processing queries passed through the init_slave
# option.
#
# In order to check the first type of failure, we inject a fault in the
# SQL/IO Threads through SET GLOBAL debug.
#
# To check the second type, we set @@global.init_slave to an invalid
# command thus preventing the initialization of the SQL Thread.
#
# Obs:
# 1 - Note that testing failures while initializing the relay log position
# is hard as the same function is called before the code reaches the point
# that we want to test.
#
# 2 - This test does not target failures that are reported while applying
# events such as duplicate keys, errors while reading the relay-log.bin*,
# etc. Such errors are already checked on other tests.
######################################################################
######################################################################
# Configuring the Environment
######################################################################
source include/have_debug.inc;
source include/master-slave.inc;
source include/have_log_bin.inc;
connection slave;
--disable_warnings
stop slave;
--enable_warnings
reset slave;
######################################################################
# Injecting faults in the threads' initialization
######################################################################
connection slave;
# Set debug flags on slave to force errors to occur
SET GLOBAL debug= "d,simulate_io_slave_error_on_init,simulate_sql_slave_error_on_init";
start slave;
#
# slave is going to stop because of emulated failures
# but there won't be any crashes nor asserts hit.
#
source include/wait_for_slave_to_stop.inc;
let $error= query_get_value(SHOW SLAVE STATUS, Last_Error, 1);
echo Reporting the following error: $error;
SET GLOBAL debug= "";
######################################################################
# Injecting faults in the init_slave option
######################################################################
connection slave;
--disable_warnings
stop slave;
--enable_warnings
source include/wait_for_slave_to_stop.inc;
reset slave;
SET GLOBAL init_slave= "garbage";
start slave;
source include/wait_for_slave_sql_to_stop.inc;
let $error= query_get_value(SHOW SLAVE STATUS, Last_Error, 1);
echo Reporting the following error: $error;
######################################################################
# Clean up
######################################################################
SET GLOBAL init_slave= "";
...@@ -2678,7 +2678,8 @@ pthread_handler_t handle_slave_sql(void *arg) ...@@ -2678,7 +2678,8 @@ pthread_handler_t handle_slave_sql(void *arg)
*/ */
pthread_cond_broadcast(&rli->start_cond); pthread_cond_broadcast(&rli->start_cond);
pthread_mutex_unlock(&rli->run_lock); pthread_mutex_unlock(&rli->run_lock);
sql_print_error("Failed during slave thread initialization"); rli->report(ERROR_LEVEL, ER_SLAVE_FATAL_ERROR,
"Failed during slave thread initialization");
goto err; goto err;
} }
thd->init_for_queries(); thd->init_for_queries();
...@@ -2723,8 +2724,8 @@ pthread_handler_t handle_slave_sql(void *arg) ...@@ -2723,8 +2724,8 @@ pthread_handler_t handle_slave_sql(void *arg)
1 /*need data lock*/, &errmsg, 1 /*need data lock*/, &errmsg,
1 /*look for a description_event*/)) 1 /*look for a description_event*/))
{ {
sql_print_error("Error initializing relay log position: %s", rli->report(ERROR_LEVEL, ER_SLAVE_FATAL_ERROR,
errmsg); "Error initializing relay log position: %s", errmsg);
goto err; goto err;
} }
THD_CHECK_SENTRY(thd); THD_CHECK_SENTRY(thd);
...@@ -2769,8 +2770,8 @@ log '%s' at position %s, relay log '%s' position: %s", RPL_LOG_NAME, ...@@ -2769,8 +2770,8 @@ log '%s' at position %s, relay log '%s' position: %s", RPL_LOG_NAME,
execute_init_command(thd, &sys_init_slave, &LOCK_sys_init_slave); execute_init_command(thd, &sys_init_slave, &LOCK_sys_init_slave);
if (thd->is_slave_error) if (thd->is_slave_error)
{ {
sql_print_error("\ rli->report(ERROR_LEVEL, thd->main_da.sql_errno(),
Slave SQL thread aborted. Can't execute init_slave query"); "Slave SQL thread aborted. Can't execute init_slave query");
goto err; goto err;
} }
} }
...@@ -2820,10 +2821,20 @@ Slave SQL thread aborted. Can't execute init_slave query"); ...@@ -2820,10 +2821,20 @@ Slave SQL thread aborted. Can't execute init_slave query");
thd->main_da.sql_errno(), last_errno)); thd->main_da.sql_errno(), last_errno));
if (last_errno == 0) if (last_errno == 0)
{ {
/*
This function is reporting an error which was not reported
while executing exec_relay_log_event().
*/
rli->report(ERROR_LEVEL, thd->main_da.sql_errno(), errmsg); rli->report(ERROR_LEVEL, thd->main_da.sql_errno(), errmsg);
} }
else if (last_errno != thd->main_da.sql_errno()) else if (last_errno != thd->main_da.sql_errno())
{ {
/*
* An error was reported while executing exec_relay_log_event()
* however the error code differs from what is in the thread.
* This function prints out more information to help finding
* what caused the problem.
*/
sql_print_error("Slave (additional info): %s Error_code: %d", sql_print_error("Slave (additional info): %s Error_code: %d",
errmsg, thd->main_da.sql_errno()); errmsg, thd->main_da.sql_errno());
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment