mirror of
https://github.com/MariaDB/server.git
synced 2025-01-23 15:24:16 +01:00
0b87de124d
Implement --semi-sync-master-wait-point=AFTER_SYNC|AFTER_COMMIT. When AFTER_SYNC, the semi-sync wait will be done earlier, before the storage engine commit rather than after. This means that a transaction will not be visible on the master until at least one slave has received it.
495 lines
13 KiB
C++
495 lines
13 KiB
C++
/* Copyright (C) 2007 Google Inc.
|
|
Copyright (c) 2008 MySQL AB, 2008-2009 Sun Microsystems, Inc.
|
|
Use is subject to license terms.
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; version 2 of the License.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; if not, write to the Free Software
|
|
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */
|
|
|
|
|
|
#include "semisync_master.h"
|
|
#include "sql_class.h" // THD
|
|
|
|
static ReplSemiSyncMaster repl_semisync;
|
|
|
|
C_MODE_START
|
|
|
|
/*
  Binlog storage observer hook (installed as report_update).

  While the semi-sync master is enabled, hands the binlog file name and
  position of the written transaction to repl_semisync so that it knows
  how far the binlog has to be replicated to the slave before a waiting
  transaction may continue.

  Returns 0 when the master is disabled, otherwise the result of
  writeTranxInBinlog(). 'param' and 'flags' are not used.
*/
int repl_semi_report_binlog_update(Binlog_storage_param *param,
                                   const char *log_file,
                                   my_off_t log_pos, uint32 flags)
{
  /* Nothing to record while semi-sync is switched off on the master. */
  if (!repl_semisync.getMasterEnabled())
    return 0;

  return repl_semisync.writeTranxInBinlog(log_file, log_pos);
}
|
|
|
|
/*
  Placeholder hook: performs no work and always reports success (0).
  'param' is not used.
*/
int repl_semi_request_commit(Trans_param *param)
{
  (void) param;
  return 0;
}
|
|
|
|
/*
  Binlog storage observer hook (installed as after_sync).

  When the configured wait point is AFTER_BINLOG_SYNC, calls
  repl_semisync.commitTrx() for the given binlog coordinates and returns
  its result. For any other wait point this is a no-op returning 0.
  'param' and 'flags' are not used.
*/
int repl_semi_report_binlog_sync(Binlog_storage_param *param,
                                 const char *log_file,
                                 my_off_t log_pos, uint32 flags)
{
  if (rpl_semi_sync_master_wait_point !=
      SEMI_SYNC_MASTER_WAIT_POINT_AFTER_BINLOG_SYNC)
    return 0;

  return repl_semisync.commitTrx(log_file, log_pos);
}
|
|
|
|
/*
  Transaction observer hook (installed as after_commit).

  Calls repl_semisync.commitTrx() only when all of the following hold:
    - the configured wait point is AFTER_STORAGE_COMMIT,
    - param->flags has TRANS_IS_REAL_TRANS set,
    - param->log_pos is non-zero.
  In every other case it returns 0 without doing anything.
*/
int repl_semi_report_commit(Trans_param *param)
{
  if (rpl_semi_sync_master_wait_point !=
      SEMI_SYNC_MASTER_WAIT_POINT_AFTER_STORAGE_COMMIT)
    return 0;

  if (!(param->flags & TRANS_IS_REAL_TRANS))
    return 0;

  if (!param->log_pos)
    return 0;

  return repl_semisync.commitTrx(param->log_file, param->log_pos);
}
|
|
|
|
/*
  Transaction observer hook (installed as after_rollback).

  A rollback is treated exactly like a commit: the call is forwarded to
  repl_semi_report_commit() and its result is returned unchanged.
*/
int repl_semi_report_rollback(Trans_param *param)
{
  const int result= repl_semi_report_commit(param);
  return result;
}
|
|
|
|
/*
  Binlog transmit observer hook (installed as start).

  If repl_semisync reports the connection as a semi-sync slave, the slave
  is counted via add_slave() and the requested binlog coordinates are
  reported as already acknowledged: the slave is assumed to have received
  every event before the file name and position it asks for.

  The start of the dump is logged in both cases. Always returns 0.
*/
int repl_semi_binlog_dump_start(Binlog_transmit_param *param,
                                const char *log_file,
                                my_off_t log_pos)
{
  const bool is_semi_sync= repl_semisync.is_semi_sync_slave();
  const char *dump_kind= is_semi_sync ? "semi-sync" : "asynchronous";

  if (is_semi_sync)
  {
    /* One more semi-sync slave */
    repl_semisync.add_slave();
    repl_semisync.reportReplyBinlog(param->server_id, log_file, log_pos);
  }

  sql_print_information("Start %s binlog_dump to slave (server_id: %d), pos(%s, %lu)",
                        dump_kind,
                        param->server_id, log_file, (unsigned long)log_pos);
  return 0;
}
|
|
|
|
/*
  Binlog transmit observer hook (installed as stop).

  Logs the end of the dump and, if repl_semisync reports the connection
  as a semi-sync slave, removes it from the slave count via
  remove_slave(). Always returns 0.
*/
int repl_semi_binlog_dump_end(Binlog_transmit_param *param)
{
  const bool is_semi_sync= repl_semisync.is_semi_sync_slave();
  const char *dump_kind= is_semi_sync ? "semi-sync" : "asynchronous";

  sql_print_information("Stop %s binlog_dump to slave (server_id: %d)",
                        dump_kind,
                        param->server_id);

  /* One less semi-sync slave */
  if (is_semi_sync)
    repl_semisync.remove_slave();

  return 0;
}
|
|
|
|
/*
  Binlog transmit observer hook (installed as reserve_header).

  Delegates to repl_semisync.reserveSyncHeader(header, size) and adds the
  value it returns to *len. Always returns 0. 'param' is not used.
*/
int repl_semi_reserve_header(Binlog_transmit_param *param,
                             unsigned char *header,
                             unsigned long size, unsigned long *len)
{
  *len= *len + repl_semisync.reserveSyncHeader(header, size);
  return 0;
}
|
|
|
|
/*
  Binlog transmit observer hook (installed as before_send_event).

  Forwards the outgoing packet together with its binlog coordinates and
  the receiving server's id to repl_semisync.updateSyncHeader() and
  returns that call's result. 'len' is not used.
*/
int repl_semi_before_send_event(Binlog_transmit_param *param,
                                unsigned char *packet, unsigned long len,
                                const char *log_file, my_off_t log_pos)
{
  const int result= repl_semisync.updateSyncHeader(packet, log_file, log_pos,
                                                   param->server_id);
  return result;
}
|
|
|
|
/*
  Binlog transmit observer hook (installed as after_send_event).

  For a semi-sync slave, reads the slave's reply from the current
  thread's network connection and then clears any error set on the THD.
  Always returns 0. 'len' is not used.
*/
int repl_semi_after_send_event(Binlog_transmit_param *param,
                               const char *event_buf, unsigned long len)
{
  if (!repl_semisync.is_semi_sync_slave())
    return 0;

  THD *dump_thd= current_thd;

  /*
    A failure to read the slave reply is ignored on purpose: the dump
    thread must not quit because of it, and the error has already been
    reported by the time we get here.
  */
  (void) repl_semisync.readSlaveReply(&dump_thd->net,
                                      param->server_id, event_buf);
  dump_thd->clear_error();

  return 0;
}
|
|
|
|
/*
  Binlog transmit observer hook (installed as reset).

  Calls repl_semisync.resetMaster() and normalises its result:
  returns 1 if it reported a non-zero value, 0 otherwise.
  'param' is not used.
*/
int repl_semi_reset_master(Binlog_transmit_param *param)
{
  return repl_semisync.resetMaster() ? 1 : 0;
}
|
|
|
|
C_MODE_END
|
|
|
|
/*
|
|
semisync system variables
|
|
*/
|
|
static void fix_rpl_semi_sync_master_timeout(MYSQL_THD thd,
|
|
SYS_VAR *var,
|
|
void *ptr,
|
|
const void *val);
|
|
|
|
static void fix_rpl_semi_sync_master_trace_level(MYSQL_THD thd,
|
|
SYS_VAR *var,
|
|
void *ptr,
|
|
const void *val);
|
|
|
|
static void fix_rpl_semi_sync_master_enabled(MYSQL_THD thd,
|
|
SYS_VAR *var,
|
|
void *ptr,
|
|
const void *val);
|
|
|
|
/*
  Boolean system variable "enabled", backed by
  rpl_semi_sync_master_enabled. Changes go through
  fix_rpl_semi_sync_master_enabled(); the default is 0 (disabled).
*/
static MYSQL_SYSVAR_BOOL(
  enabled,
  rpl_semi_sync_master_enabled,
  PLUGIN_VAR_OPCMDARG,
  "Enable semi-synchronous replication master (disabled by default). ",
  NULL,                                 // check
  &fix_rpl_semi_sync_master_enabled,    // update
  0);
|
|
|
|
/* NOTE: must match order of rpl_semi_sync_master_wait_point_t */
|
|
static const char *rpl_semi_sync_master_wait_point_names[] =
|
|
{
|
|
"AFTER_SYNC",
|
|
"AFTER_COMMIT",
|
|
NullS
|
|
};
|
|
|
|
/*
  TYPELIB describing the wait point names for the wait_point enum
  system variable. The element count excludes the NullS terminator of
  the name array.
*/
static TYPELIB rpl_semi_sync_master_wait_point_typelib =
{
  array_elements(rpl_semi_sync_master_wait_point_names) - 1,
  "",
  rpl_semi_sync_master_wait_point_names,
  NULL
};
|
|
|
|
/*
  Enum system variable "wait_point", backed by
  rpl_semi_sync_master_wait_point. It selects where a transaction waits
  for the semi-sync acknowledgement: after the binlog has been synced, or
  after the commit in the storage engine. The accepted names come from
  rpl_semi_sync_master_wait_point_typelib; the default is
  SEMI_SYNC_MASTER_WAIT_POINT_AFTER_STORAGE_COMMIT.

  No check or update callback is installed.
*/
static MYSQL_SYSVAR_ENUM(
  wait_point,
  rpl_semi_sync_master_wait_point,
  PLUGIN_VAR_RQCMDARG,
  "Should transaction wait for semi-sync ack after having synced binlog, "
  "or after having committed in storage engine.",
  NULL,                                 // check
  NULL,                                 // update
  SEMI_SYNC_MASTER_WAIT_POINT_AFTER_STORAGE_COMMIT,
  &rpl_semi_sync_master_wait_point_typelib);
|
|
|
|
/*
  Unsigned long system variable "timeout" (milliseconds, per its help
  text), backed by rpl_semi_sync_master_timeout. Changes go through
  fix_rpl_semi_sync_master_timeout().
*/
static MYSQL_SYSVAR_ULONG(
  timeout,
  rpl_semi_sync_master_timeout,
  PLUGIN_VAR_OPCMDARG,
  "The timeout value (in ms) for semi-synchronous replication in the master",
  NULL,                                 // check
  fix_rpl_semi_sync_master_timeout,     // update
  10000, 0, ~0UL, 1);
|
|
|
|
/*
  Boolean system variable "wait_no_slave", backed by
  rpl_semi_sync_master_wait_no_slave. The default is 1 (enabled) and no
  check or update callback is installed.
*/
static MYSQL_SYSVAR_BOOL(
  wait_no_slave,
  rpl_semi_sync_master_wait_no_slave,
  PLUGIN_VAR_OPCMDARG,
  "Wait until timeout when no semi-synchronous replication slave available (enabled by default). ",
  NULL,                                 // check
  NULL,                                 // update
  1);
|
|
|
|
/*
  Unsigned long system variable "trace_level", backed by
  rpl_semi_sync_master_trace_level. Changes go through
  fix_rpl_semi_sync_master_trace_level().
*/
static MYSQL_SYSVAR_ULONG(
  trace_level,
  rpl_semi_sync_master_trace_level,
  PLUGIN_VAR_OPCMDARG,
  "The tracing level for semi-sync replication.",
  NULL,                                     // check
  &fix_rpl_semi_sync_master_trace_level,    // update
  32, 0, ~0UL, 1);
|
|
|
|
/*
  NULL-terminated list of the system variables defined above; it is
  referenced from the plugin descriptor at the end of the file.
*/
static SYS_VAR* semi_sync_master_system_vars[]=
{
  MYSQL_SYSVAR(enabled),
  MYSQL_SYSVAR(wait_point),
  MYSQL_SYSVAR(timeout),
  MYSQL_SYSVAR(wait_no_slave),
  MYSQL_SYSVAR(trace_level),
  NULL,
};
|
|
|
|
|
|
/*
  Update callback of the "timeout" system variable.

  Copies the new unsigned long value from 'val' into the variable's
  storage 'ptr', then passes rpl_semi_sync_master_timeout on to
  repl_semisync.setWaitTimeout(). 'thd' and 'var' are not used.
*/
static void fix_rpl_semi_sync_master_timeout(MYSQL_THD thd,
                                             SYS_VAR *var,
                                             void *ptr,
                                             const void *val)
{
  unsigned long *storage= (unsigned long *) ptr;
  const unsigned long new_value= *(const unsigned long *) val;

  *storage= new_value;
  repl_semisync.setWaitTimeout(rpl_semi_sync_master_timeout);
}
|
|
|
|
/*
  Update callback of the "trace_level" system variable.

  Copies the new unsigned long value from 'val' into the variable's
  storage 'ptr', then passes rpl_semi_sync_master_trace_level on to
  repl_semisync.setTraceLevel(). 'thd' and 'var' are not used.
*/
static void fix_rpl_semi_sync_master_trace_level(MYSQL_THD thd,
                                                 SYS_VAR *var,
                                                 void *ptr,
                                                 const void *val)
{
  unsigned long *storage= (unsigned long *) ptr;
  const unsigned long new_value= *(const unsigned long *) val;

  *storage= new_value;
  repl_semisync.setTraceLevel(rpl_semi_sync_master_trace_level);
}
|
|
|
|
/*
  Update callback of the "enabled" system variable.

  Stores the new value and then switches the semi-sync master on or off
  accordingly. If enableMaster()/disableMaster() reports a non-zero
  result, rpl_semi_sync_master_enabled is set back to the opposite
  value. 'thd' and 'var' are not used.
*/
static void fix_rpl_semi_sync_master_enabled(MYSQL_THD thd,
                                             SYS_VAR *var,
                                             void *ptr,
                                             const void *val)
{
  *(char *) ptr= *(const char *) val;

  if (rpl_semi_sync_master_enabled)
  {
    /* Enabling failed: report the master as still disabled. */
    if (repl_semisync.enableMaster() != 0)
      rpl_semi_sync_master_enabled= false;
    return;
  }

  /* Disabling failed: report the master as still enabled. */
  if (repl_semisync.disableMaster() != 0)
    rpl_semi_sync_master_enabled= true;
}
|
|
|
|
/*
  Transaction observer: commit and rollback notifications are both
  routed to the semi-sync hooks defined above.
*/
Trans_observer trans_observer=
{
  sizeof(Trans_observer),               // len

  repl_semi_report_commit,              // after_commit
  repl_semi_report_rollback,            // after_rollback
};
|
|
|
|
/*
  Binlog storage observer: binlog update and sync notifications are
  routed to the semi-sync hooks defined above.
*/
Binlog_storage_observer storage_observer=
{
  sizeof(Binlog_storage_observer),      // len

  repl_semi_report_binlog_update,       // report_update
  repl_semi_report_binlog_sync,         // after_sync
};
|
|
|
|
/*
  Binlog transmit observer: the dump thread notifications are routed to
  the semi-sync hooks defined above.
*/
Binlog_transmit_observer transmit_observer=
{
  sizeof(Binlog_transmit_observer),     // len

  repl_semi_binlog_dump_start,          // start
  repl_semi_binlog_dump_end,            // stop
  repl_semi_reserve_header,             // reserve_header
  repl_semi_before_send_event,          // before_send_event
  repl_semi_after_send_event,           // after_send_event
  repl_semi_reset_master,               // reset
};
|
|
|
|
|
|
/* Name of the status callback generated for status variable 'name'. */
#define SHOW_FNAME(name) rpl_semi_sync_master_show_##name

/*
  Defines the status callback for 'name'. The generated function first
  calls repl_semisync.setExportStats(), then points the SHOW_VAR at
  rpl_semi_sync_master_<name> with the given show_type, and returns 0.
*/
#define DEF_SHOW_FUNC(name, show_type)                                  \
  static int SHOW_FNAME(name)(MYSQL_THD thd, SHOW_VAR *var, char *buff) \
  {                                                                     \
    repl_semisync.setExportStats();                                     \
    var->type= show_type;                                               \
    var->value= (char *)&rpl_semi_sync_master_##name;                   \
    return 0;                                                           \
  }
|
|
|
|
/* Status callbacks, one per value exported through DEF_SHOW_FUNC. */
DEF_SHOW_FUNC(status,            SHOW_BOOL)
DEF_SHOW_FUNC(clients,           SHOW_LONG)
DEF_SHOW_FUNC(wait_sessions,     SHOW_LONG)
DEF_SHOW_FUNC(trx_wait_time,     SHOW_LONGLONG)
DEF_SHOW_FUNC(trx_wait_num,      SHOW_LONGLONG)
DEF_SHOW_FUNC(net_wait_time,     SHOW_LONGLONG)
DEF_SHOW_FUNC(net_wait_num,      SHOW_LONGLONG)
DEF_SHOW_FUNC(avg_net_wait_time, SHOW_LONG)
DEF_SHOW_FUNC(avg_trx_wait_time, SHOW_LONG)
|
|
|
|
|
|
/* plugin status variables */
|
|
/*
  Plugin status variables.

  Entries of type SHOW_SIMPLE_FUNC point at a callback generated by
  DEF_SHOW_FUNC; entries of type SHOW_LONG point directly at the counter.
  The list ends with an entry whose name is NULL.
*/
static SHOW_VAR semi_sync_master_status_vars[]=
{
  {"Rpl_semi_sync_master_status",
   (char*) &SHOW_FNAME(status), SHOW_SIMPLE_FUNC},
  {"Rpl_semi_sync_master_clients",
   (char*) &SHOW_FNAME(clients), SHOW_SIMPLE_FUNC},
  {"Rpl_semi_sync_master_yes_tx",
   (char*) &rpl_semi_sync_master_yes_transactions, SHOW_LONG},
  {"Rpl_semi_sync_master_no_tx",
   (char*) &rpl_semi_sync_master_no_transactions, SHOW_LONG},
  {"Rpl_semi_sync_master_wait_sessions",
   (char*) &SHOW_FNAME(wait_sessions), SHOW_SIMPLE_FUNC},
  {"Rpl_semi_sync_master_no_times",
   (char*) &rpl_semi_sync_master_off_times, SHOW_LONG},
  {"Rpl_semi_sync_master_timefunc_failures",
   (char*) &rpl_semi_sync_master_timefunc_fails, SHOW_LONG},
  {"Rpl_semi_sync_master_wait_pos_backtraverse",
   (char*) &rpl_semi_sync_master_wait_pos_backtraverse, SHOW_LONG},
  {"Rpl_semi_sync_master_tx_wait_time",
   (char*) &SHOW_FNAME(trx_wait_time), SHOW_SIMPLE_FUNC},
  {"Rpl_semi_sync_master_tx_waits",
   (char*) &SHOW_FNAME(trx_wait_num), SHOW_SIMPLE_FUNC},
  {"Rpl_semi_sync_master_tx_avg_wait_time",
   (char*) &SHOW_FNAME(avg_trx_wait_time), SHOW_SIMPLE_FUNC},
  {"Rpl_semi_sync_master_net_wait_time",
   (char*) &SHOW_FNAME(net_wait_time), SHOW_SIMPLE_FUNC},
  {"Rpl_semi_sync_master_net_waits",
   (char*) &SHOW_FNAME(net_wait_num), SHOW_SIMPLE_FUNC},
  {"Rpl_semi_sync_master_net_avg_wait_time",
   (char*) &SHOW_FNAME(avg_net_wait_time), SHOW_SIMPLE_FUNC},
  {NULL, NULL, SHOW_LONG},
};
|
|
|
|
#ifdef HAVE_PSI_INTERFACE
/* Instrumentation keys for the semi-sync mutex and condition variable. */
PSI_mutex_key key_ss_mutex_LOCK_binlog_;
PSI_cond_key key_ss_cond_COND_binlog_send_;

/* Mutexes registered by init_semisync_psi_keys(). */
static PSI_mutex_info all_semisync_mutexes[]=
{
  { &key_ss_mutex_LOCK_binlog_, "LOCK_binlog_", 0}
};

/* Condition variables registered by init_semisync_psi_keys(). */
static PSI_cond_info all_semisync_conds[]=
{
  { &key_ss_cond_COND_binlog_send_, "COND_binlog_send_", 0}
};
#endif /* HAVE_PSI_INTERFACE */
|
|
|
|
/*
  Stage descriptor for waiting on a semi-sync ACK from a slave.
  Defined regardless of HAVE_PSI_INTERFACE.
*/
PSI_stage_info stage_waiting_for_semi_sync_ack_from_slave=
{
  0, "Waiting for semi-sync ACK from slave", 0
};
|
|
|
|
#ifdef HAVE_PSI_INTERFACE
/* Stages registered by init_semisync_psi_keys(). */
PSI_stage_info *all_semisync_stages[]=
{
  & stage_waiting_for_semi_sync_ack_from_slave
};

/*
  Registers the semi-sync mutexes, condition variables and stages under
  the "semisync" category.
*/
static void init_semisync_psi_keys(void)
{
  const char* category= "semisync";
  int n_mutexes= array_elements(all_semisync_mutexes);
  int n_conds= array_elements(all_semisync_conds);
  int n_stages= array_elements(all_semisync_stages);

  mysql_mutex_register(category, all_semisync_mutexes, n_mutexes);
  mysql_cond_register(category, all_semisync_conds, n_conds);
  mysql_stage_register(category, all_semisync_stages, n_stages);
}
#endif /* HAVE_PSI_INTERFACE */
|
|
|
|
static int semi_sync_master_plugin_init(void *p)
|
|
{
|
|
#ifdef HAVE_PSI_INTERFACE
|
|
init_semisync_psi_keys();
|
|
#endif
|
|
|
|
if (repl_semisync.initObject())
|
|
return 1;
|
|
if (register_trans_observer(&trans_observer, p))
|
|
return 1;
|
|
if (register_binlog_storage_observer(&storage_observer, p))
|
|
return 1;
|
|
if (register_binlog_transmit_observer(&transmit_observer, p))
|
|
return 1;
|
|
return 0;
|
|
}
|
|
|
|
static int semi_sync_master_plugin_deinit(void *p)
|
|
{
|
|
if (unregister_trans_observer(&trans_observer, p))
|
|
{
|
|
sql_print_error("unregister_trans_observer failed");
|
|
return 1;
|
|
}
|
|
if (unregister_binlog_storage_observer(&storage_observer, p))
|
|
{
|
|
sql_print_error("unregister_binlog_storage_observer failed");
|
|
return 1;
|
|
}
|
|
if (unregister_binlog_transmit_observer(&transmit_observer, p))
|
|
{
|
|
sql_print_error("unregister_binlog_transmit_observer failed");
|
|
return 1;
|
|
}
|
|
repl_semisync.cleanup();
|
|
sql_print_information("unregister_replicator OK");
|
|
return 0;
|
|
}
|
|
|
|
/*
  Replication plugin descriptor; it only carries the interface version
  and is referenced from the plugin library descriptor below.
*/
struct Mysql_replication semi_sync_master_plugin=
{
  MYSQL_REPLICATION_INTERFACE_VERSION
};
|
|
|
|
/*
|
|
Plugin library descriptor
|
|
*/
|
|
maria_declare_plugin(semisync_master)
|
|
{
|
|
MYSQL_REPLICATION_PLUGIN,
|
|
&semi_sync_master_plugin,
|
|
"rpl_semi_sync_master",
|
|
"He Zhenxing",
|
|
"Semi-synchronous replication master",
|
|
PLUGIN_LICENSE_GPL,
|
|
semi_sync_master_plugin_init, /* Plugin Init */
|
|
semi_sync_master_plugin_deinit, /* Plugin Deinit */
|
|
0x0100 /* 1.0 */,
|
|
semi_sync_master_status_vars, /* status variables */
|
|
semi_sync_master_system_vars, /* system variables */
|
|
"1.0",
|
|
MariaDB_PLUGIN_MATURITY_GAMMA
|
|
}
|
|
maria_declare_plugin_end;
|
|
|