mirror of
				https://github.com/MariaDB/server.git
				synced 2025-10-26 01:18:31 +02:00 
			
		
		
		
	 2cb5fb6019
			
		
	
	
	2cb5fb6019
	
	
	
		
			
			If log_slave_updates==OFF, wsrep applier threads used to be configured with option: thd->variables.option_bits&= ~(OPTION_BIN_LOG); (i.e. like sql_log_bin=ON). And this was regardless of log-bin configuration. With this, having configuration of: --log-bin && --log-slave-updates=OFF, local threads used binlogging, but applier threads did not. And further: local threads went through binlog group commit, while applier threads did direct commits. This resulted in situation, where applier threads entered earlier in wsrep XID checkpointing, and could sync their wsrep XID out of order. Later local thread commit would see that higher seqno was already checkpointed, and fire an assert because of this. As a fix, applier threads are now forced to enable binlogging regardless of log-slave-updates configuration. This PR comes with new mtr test: galera.MDEV-24327, which causes a scenario where applier transaction is applied and committed while earlier local transaction is parked before commit order monitor enter. A buggy mariadb versoin would fail for assertion because of wsrep XID checkpoint order violation. Reviewed-by: Jan Lindström <jan.lindstrom@mariadb.com>
		
			
				
	
	
		
			87 lines
		
	
	
	
		
			2.7 KiB
		
	
	
	
		
			Text
		
	
	
	
	
	
			
		
		
	
	
			87 lines
		
	
	
	
		
			2.7 KiB
		
	
	
	
		
			Text
		
	
	
	
	
	
| #
 | |
| # MDEV-24327 wsrep XID checkpointing order violation with log_slave_updates=OFF
 | |
| #
 | |
| # Here we have configure two node cluster with --log-bin=ON and --log-slave_-updates=OFF
 | |
| #
 | |
| # a transaction in node executes so far that it has replicated and reached
 | |
| # commit phase, We have sync point before entering commit order monitor and
 | |
| # the transaction is parked there
 | |
| #
 | |
| # Then another transaction is executed in node 2, it replicates and commits in node 2
 | |
| # and is received and applied in node 1. After applying it will remain waiting for
 | |
| # commit order monitor, as it has later seqno than the first transaction in node 1.
 | |
| #
 | |
| # control connection in node 1 waits to see the 
 | |
| # 
 | |
| # With the buggy version of MDEV-24327, the applier has however, already synced the
 | |
| # wsrep XID checkpoint
 | |
| #
 | |
| #
 | |
| #
 | |
| 
 | |
| --source include/galera_cluster.inc
 | |
| --source include/have_innodb.inc
 | |
| --source include/have_debug_sync.inc
 | |
| --source include/galera_have_debug_sync.inc
 | |
| 
 | |
| CREATE TABLE t1 (f1 INTEGER PRIMARY KEY, f2 CHAR(1));
 | |
| INSERT INTO t1 VALUES (1, 'f');
 | |
| INSERT INTO t1 VALUES (2, 'g');
 | |
| 
 | |
| --connection node_1
 | |
| SET AUTOCOMMIT=ON;
 | |
| START TRANSACTION;
 | |
| 
 | |
| UPDATE t1 SET f2 = '1' WHERE f1 = 1;
 | |
| 
 | |
| --connect node_1a, 127.0.0.1, root, , test, $NODE_MYPORT_1
 | |
| SET SESSION wsrep_sync_wait=0;
 | |
| --connection node_1a
 | |
| --let $expected_wsrep_received = `SELECT VARIABLE_VALUE+1 FROM INFORMATION_SCHEMA.GLOBAL_STATUS WHERE VARIABLE_NAME = 'wsrep_received'`
 | |
| --source include/galera_wait_sync_point.inc
 | |
| --source include/galera_clear_sync_point.inc
 | |
| 
 | |
| # Block the commit, send the COMMIT and wait until it gets blocked
 | |
| 
 | |
| --let $galera_sync_point = commit_monitor_master_enter_sync
 | |
| --source include/galera_set_sync_point.inc
 | |
| 
 | |
| --connection node_1
 | |
| --send COMMIT
 | |
| 
 | |
| --connection node_1a
 | |
| 
 | |
| # wait for the commit to block in sync point
 | |
| 
 | |
| --let $galera_sync_point = commit_monitor_master_enter_sync
 | |
| --source include/galera_wait_sync_point.inc
 | |
| --source include/galera_clear_sync_point.inc
 | |
| 
 | |
| #
 | |
| # replicate non conflicting transaction from node 2
 | |
| # it will get later seqno and should sync XID checkpoint after transaction in node 1
 | |
| #
 | |
| --connection node_2
 | |
| UPDATE t1 SET f2 = '2' WHERE f1 = 2;
 | |
| 
 | |
| #
 | |
| # wait until update from node 2 has been committed
 | |
| # if XID checkpointing order was violated, node 1 would crash for assert
 | |
| #
 | |
| 
 | |
| --connection node_1a
 | |
| --let $wait_condition = SELECT VARIABLE_VALUE = $expected_wsrep_received FROM INFORMATION_SCHEMA.GLOBAL_STATUS WHERE VARIABLE_NAME = 'wsrep_received'
 | |
| --source include/wait_condition.inc
 | |
| 
 | |
| --let $galera_sync_point = commit_monitor_master_enter_sync
 | |
| --source include/galera_signal_sync_point.inc
 | |
| --source include/galera_clear_sync_point.inc
 | |
| 
 | |
| --connection node_1
 | |
| --reap
 | |
| SELECT * FROM t1;
 | |
| --echo "node 1 is complete now"
 | |
| 
 | |
| 
 | |
| --connection node_2
 | |
| DROP TABLE t1;
 |