Commit 87fa6d2c authored by sjaakola's avatar sjaakola Committed by Jan Lindström

MDEV-24327 wsrep XID checkpointing order with log_slave_updates=OFF

If log_slave_updates==OFF, wsrep applier threads used to be configured
with option: thd->variables.option_bits&= ~(OPTION_BIN_LOG);
(i.e. like sql_log_bin=ON). And this was regardless of log-bin configuration.

With this, having configuration of: --log-bin && --log-slave-updates=OFF,
local threads used binlogging, but applier threads did not. And further:
local threads went through binlog group commit, while applier threads did
direct commits. This resulted in situation, where applier threads entered
earlier in wsrep XID checkpointing, and could sync their wsrep XID out of order.
Later local thread commit would see that higher seqno was already checkpointed,
and fire an assert because of this.

As a fix, applier threads are now forced to enable binlogging regardless of
log-slave-updates configuration.

This PR comes with new mtr test: galera.MDEV-24327, which causes a scenario
where applier transaction is applied and committed while earlier local transaction
is parked before commit order monitor enter. A buggy mariadb versoin would fail
for assertion because of wsrep XID checkpoint order violation.
parent d4c35fb2
connection node_2;
connection node_1;
CREATE TABLE t1 (f1 INTEGER PRIMARY KEY, f2 CHAR(1));
INSERT INTO t1 VALUES (1, 'f');
INSERT INTO t1 VALUES (2, 'g');
connection node_1;
SET AUTOCOMMIT=ON;
START TRANSACTION;
UPDATE t1 SET f2 = '1' WHERE f1 = 1;
connect node_1a, 127.0.0.1, root, , test, $NODE_MYPORT_1;
SET SESSION wsrep_sync_wait=0;
connection node_1a;
SET SESSION wsrep_on = 0;
SET SESSION wsrep_on = 1;
SET GLOBAL wsrep_provider_options = 'dbug=';
SET GLOBAL wsrep_provider_options = 'dbug=d,commit_monitor_master_enter_sync';
connection node_1;
COMMIT;
connection node_1a;
SET SESSION wsrep_on = 0;
SET SESSION wsrep_on = 1;
SET GLOBAL wsrep_provider_options = 'dbug=';
connection node_2;
UPDATE t1 SET f2 = '2' WHERE f1 = 2;
connection node_1a;
SET GLOBAL wsrep_provider_options = 'signal=commit_monitor_master_enter_sync';
SET GLOBAL wsrep_provider_options = 'dbug=';
connection node_1;
SELECT * FROM t1;
f1 f2
1 1
2 2
"node 1 is complete now"
connection node_2;
DROP TABLE t1;
!include ../galera_2nodes.cnf
[mysqld.1]
log-bin=mariadb-bin
log-slave-updates=OFF
#
# MDEV-24327 wsrep XID checkpointing order violation with log_slave_updates=OFF
#
# Here we have configure two node cluster with --log-bin=ON and --log-slave_-updates=OFF
#
# a transaction in node executes so far that it has replicated and reached
# commit phase, We have sync point before entering commit order monitor and
# the transaction is parked there
#
# Then another transaction is executed in node 2, it replicates and commits in node 2
# and is received and applied in node 1. After applying it will remain waiting for
# commit order monitor, as it has later seqno than the first transaction in node 1.
#
# control connection in node 1 waits to see the
#
# With the buggy version of MDEV-24327, the applier has however, already synced the
# wsrep XID checkpoint
#
#
#
--source include/galera_cluster.inc
--source include/have_innodb.inc
--source include/have_debug_sync.inc
--source include/galera_have_debug_sync.inc
CREATE TABLE t1 (f1 INTEGER PRIMARY KEY, f2 CHAR(1));
INSERT INTO t1 VALUES (1, 'f');
INSERT INTO t1 VALUES (2, 'g');
--connection node_1
SET AUTOCOMMIT=ON;
START TRANSACTION;
UPDATE t1 SET f2 = '1' WHERE f1 = 1;
--connect node_1a, 127.0.0.1, root, , test, $NODE_MYPORT_1
SET SESSION wsrep_sync_wait=0;
--connection node_1a
--let $expected_wsrep_received = `SELECT VARIABLE_VALUE+1 FROM INFORMATION_SCHEMA.GLOBAL_STATUS WHERE VARIABLE_NAME = 'wsrep_received'`
--source include/galera_wait_sync_point.inc
--source include/galera_clear_sync_point.inc
# Block the commit, send the COMMIT and wait until it gets blocked
--let $galera_sync_point = commit_monitor_master_enter_sync
--source include/galera_set_sync_point.inc
--connection node_1
--send COMMIT
--connection node_1a
# wait for the commit to block in sync point
--let $galera_sync_point = commit_monitor_master_enter_sync
--source include/galera_wait_sync_point.inc
--source include/galera_clear_sync_point.inc
#
# replicate non conflicting transaction from node 2
# it will get later seqno and should sync XID checkpoint after transaction in node 1
#
--connection node_2
UPDATE t1 SET f2 = '2' WHERE f1 = 2;
#
# wait until update from node 2 has been committed
# if XID checkpointing order was violated, node 1 would crash for assert
#
--connection node_1a
--let $wait_condition = SELECT VARIABLE_VALUE = $expected_wsrep_received FROM INFORMATION_SCHEMA.GLOBAL_STATUS WHERE VARIABLE_NAME = 'wsrep_received'
--source include/wait_condition.inc
--let $galera_sync_point = commit_monitor_master_enter_sync
--source include/galera_signal_sync_point.inc
--source include/galera_clear_sync_point.inc
--connection node_1
--reap
SELECT * FROM t1;
--echo "node 1 is complete now"
--connection node_2
DROP TABLE t1;
...@@ -142,11 +142,12 @@ Wsrep_high_priority_service::Wsrep_high_priority_service(THD* thd) ...@@ -142,11 +142,12 @@ Wsrep_high_priority_service::Wsrep_high_priority_service(THD* thd)
/* Disable general logging on applier threads */ /* Disable general logging on applier threads */
thd->variables.option_bits |= OPTION_LOG_OFF; thd->variables.option_bits |= OPTION_LOG_OFF;
/* Enable binlogging if opt_log_slave_updates is set */
if (opt_log_slave_updates) /* enable binlogging regardless of log_slave_updates setting
thd->variables.option_bits|= OPTION_BIN_LOG; this is for ensuring that both local and applier transaction go through
else same commit ordering algorithm in group commit control
thd->variables.option_bits&= ~(OPTION_BIN_LOG); */
thd->variables.option_bits|= OPTION_BIN_LOG;
thd->net.vio= 0; thd->net.vio= 0;
thd->reset_db(&db_str); thd->reset_db(&db_str);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment