mirror of
				https://github.com/MariaDB/server.git
				synced 2025-10-31 02:46:29 +01:00 
			
		
		
		
	 3d11313b6f
			
		
	
	
	3d11313b6f
	
	
	
		
			
			Replication filtering is not safe for cluster consistency. There is problem when two or more filtering rules are provided by user. Here, we disable replication filtering inside a Galera cluster for now. To support safe replication filereing in the Galera cluster it should also effect SST/IST. Signed-off-by: Julius Goryavsky <julius.goryavsky@mariadb.com>
		
			
				
	
	
		
			8833 lines
		
	
	
	
		
			283 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			8833 lines
		
	
	
	
		
			283 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*
 | |
|    Copyright (c) 2000, 2019, Oracle and/or its affiliates.
 | |
|    Copyright (c) 2009, 2022, MariaDB
 | |
| 
 | |
|    This program is free software; you can redistribute it and/or modify
 | |
|    it under the terms of the GNU General Public License as published by
 | |
|    the Free Software Foundation; version 2 of the License.
 | |
| 
 | |
|    This program is distributed in the hope that it will be useful,
 | |
|    but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
|    GNU General Public License for more details.
 | |
| 
 | |
|    You should have received a copy of the GNU General Public License
 | |
|    along with this program; if not, write to the Free Software
 | |
|    Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1335  USA */
 | |
| 
 | |
| 
 | |
| #include "mariadb.h"
 | |
| #include "sql_priv.h"
 | |
| 
 | |
| #ifdef MYSQL_CLIENT
 | |
| #error MYSQL_CLIENT must not be defined here
 | |
| #endif
 | |
| 
 | |
| #ifndef MYSQL_SERVER
 | |
| #error MYSQL_SERVER must be defined here
 | |
| #endif
 | |
| 
 | |
| #include "unireg.h"
 | |
| #include "log_event.h"
 | |
| #include "sql_base.h"                           // close_thread_tables
 | |
| #include "sql_cache.h"                       // QUERY_CACHE_FLAGS_SIZE
 | |
| #include "sql_locale.h" // MY_LOCALE, my_locale_by_number, my_locale_en_US
 | |
| #include "key.h"        // key_copy
 | |
| #include "lock.h"       // mysql_unlock_tables
 | |
| #include "sql_parse.h"  // mysql_test_parse_for_slave
 | |
| #include "tztime.h"     // struct Time_zone
 | |
| #include "sql_load.h"   // mysql_load
 | |
| #include "sql_db.h"     // load_db_opt_by_name
 | |
| #include "slave.h"
 | |
| #include "rpl_rli.h"
 | |
| #include "rpl_mi.h"
 | |
| #include "rpl_filter.h"
 | |
| #include "rpl_record.h"
 | |
| #include "transaction.h"
 | |
| #include <my_dir.h>
 | |
| #include "sql_show.h"    // append_identifier
 | |
| #include "debug_sync.h"  // debug_sync
 | |
| #include <mysql/psi/mysql_statement.h>
 | |
| #include <strfunc.h>
 | |
| #include "compat56.h"
 | |
| #include "wsrep_mysqld.h"
 | |
| #include "sql_insert.h"
 | |
| 
 | |
| #include <my_bitmap.h>
 | |
| #include "rpl_utility.h"
 | |
| #include "rpl_constants.h"
 | |
| #include "sql_digest.h"
 | |
| #include "zlib.h"
 | |
| 
 | |
| 
 | |
| #define log_cs  &my_charset_latin1
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| static int rows_event_stmt_cleanup(rpl_group_info *rgi, THD* thd);
 | |
| 
 | |
| static const char *HA_ERR(int i)
 | |
| {
 | |
|   /* 
 | |
|     This function should only be called in case of an error
 | |
|     was detected 
 | |
|    */
 | |
|   DBUG_ASSERT(i != 0);
 | |
|   switch (i) {
 | |
|   case HA_ERR_KEY_NOT_FOUND: return "HA_ERR_KEY_NOT_FOUND";
 | |
|   case HA_ERR_FOUND_DUPP_KEY: return "HA_ERR_FOUND_DUPP_KEY";
 | |
|   case HA_ERR_RECORD_CHANGED: return "HA_ERR_RECORD_CHANGED";
 | |
|   case HA_ERR_WRONG_INDEX: return "HA_ERR_WRONG_INDEX";
 | |
|   case HA_ERR_CRASHED: return "HA_ERR_CRASHED";
 | |
|   case HA_ERR_WRONG_IN_RECORD: return "HA_ERR_WRONG_IN_RECORD";
 | |
|   case HA_ERR_OUT_OF_MEM: return "HA_ERR_OUT_OF_MEM";
 | |
|   case HA_ERR_NOT_A_TABLE: return "HA_ERR_NOT_A_TABLE";
 | |
|   case HA_ERR_WRONG_COMMAND: return "HA_ERR_WRONG_COMMAND";
 | |
|   case HA_ERR_OLD_FILE: return "HA_ERR_OLD_FILE";
 | |
|   case HA_ERR_NO_ACTIVE_RECORD: return "HA_ERR_NO_ACTIVE_RECORD";
 | |
|   case HA_ERR_RECORD_DELETED: return "HA_ERR_RECORD_DELETED";
 | |
|   case HA_ERR_RECORD_FILE_FULL: return "HA_ERR_RECORD_FILE_FULL";
 | |
|   case HA_ERR_INDEX_FILE_FULL: return "HA_ERR_INDEX_FILE_FULL";
 | |
|   case HA_ERR_END_OF_FILE: return "HA_ERR_END_OF_FILE";
 | |
|   case HA_ERR_UNSUPPORTED: return "HA_ERR_UNSUPPORTED";
 | |
|   case HA_ERR_TO_BIG_ROW: return "HA_ERR_TO_BIG_ROW";
 | |
|   case HA_WRONG_CREATE_OPTION: return "HA_WRONG_CREATE_OPTION";
 | |
|   case HA_ERR_FOUND_DUPP_UNIQUE: return "HA_ERR_FOUND_DUPP_UNIQUE";
 | |
|   case HA_ERR_UNKNOWN_CHARSET: return "HA_ERR_UNKNOWN_CHARSET";
 | |
|   case HA_ERR_WRONG_MRG_TABLE_DEF: return "HA_ERR_WRONG_MRG_TABLE_DEF";
 | |
|   case HA_ERR_CRASHED_ON_REPAIR: return "HA_ERR_CRASHED_ON_REPAIR";
 | |
|   case HA_ERR_CRASHED_ON_USAGE: return "HA_ERR_CRASHED_ON_USAGE";
 | |
|   case HA_ERR_LOCK_WAIT_TIMEOUT: return "HA_ERR_LOCK_WAIT_TIMEOUT";
 | |
|   case HA_ERR_LOCK_TABLE_FULL: return "HA_ERR_LOCK_TABLE_FULL";
 | |
|   case HA_ERR_READ_ONLY_TRANSACTION: return "HA_ERR_READ_ONLY_TRANSACTION";
 | |
|   case HA_ERR_LOCK_DEADLOCK: return "HA_ERR_LOCK_DEADLOCK";
 | |
|   case HA_ERR_CANNOT_ADD_FOREIGN: return "HA_ERR_CANNOT_ADD_FOREIGN";
 | |
|   case HA_ERR_NO_REFERENCED_ROW: return "HA_ERR_NO_REFERENCED_ROW";
 | |
|   case HA_ERR_ROW_IS_REFERENCED: return "HA_ERR_ROW_IS_REFERENCED";
 | |
|   case HA_ERR_NO_SAVEPOINT: return "HA_ERR_NO_SAVEPOINT";
 | |
|   case HA_ERR_NON_UNIQUE_BLOCK_SIZE: return "HA_ERR_NON_UNIQUE_BLOCK_SIZE";
 | |
|   case HA_ERR_NO_SUCH_TABLE: return "HA_ERR_NO_SUCH_TABLE";
 | |
|   case HA_ERR_TABLE_EXIST: return "HA_ERR_TABLE_EXIST";
 | |
|   case HA_ERR_NO_CONNECTION: return "HA_ERR_NO_CONNECTION";
 | |
|   case HA_ERR_NULL_IN_SPATIAL: return "HA_ERR_NULL_IN_SPATIAL";
 | |
|   case HA_ERR_TABLE_DEF_CHANGED: return "HA_ERR_TABLE_DEF_CHANGED";
 | |
|   case HA_ERR_NO_PARTITION_FOUND: return "HA_ERR_NO_PARTITION_FOUND";
 | |
|   case HA_ERR_RBR_LOGGING_FAILED: return "HA_ERR_RBR_LOGGING_FAILED";
 | |
|   case HA_ERR_DROP_INDEX_FK: return "HA_ERR_DROP_INDEX_FK";
 | |
|   case HA_ERR_FOREIGN_DUPLICATE_KEY: return "HA_ERR_FOREIGN_DUPLICATE_KEY";
 | |
|   case HA_ERR_TABLE_NEEDS_UPGRADE: return "HA_ERR_TABLE_NEEDS_UPGRADE";
 | |
|   case HA_ERR_TABLE_READONLY: return "HA_ERR_TABLE_READONLY";
 | |
|   case HA_ERR_AUTOINC_READ_FAILED: return "HA_ERR_AUTOINC_READ_FAILED";
 | |
|   case HA_ERR_AUTOINC_ERANGE: return "HA_ERR_AUTOINC_ERANGE";
 | |
|   case HA_ERR_GENERIC: return "HA_ERR_GENERIC";
 | |
|   case HA_ERR_RECORD_IS_THE_SAME: return "HA_ERR_RECORD_IS_THE_SAME";
 | |
|   case HA_ERR_LOGGING_IMPOSSIBLE: return "HA_ERR_LOGGING_IMPOSSIBLE";
 | |
|   case HA_ERR_CORRUPT_EVENT: return "HA_ERR_CORRUPT_EVENT";
 | |
|   case HA_ERR_ROWS_EVENT_APPLY : return "HA_ERR_ROWS_EVENT_APPLY";
 | |
|   case HA_ERR_PARTITION_LIST : return "HA_ERR_PARTITION_LIST";
 | |
|   }
 | |
|   return "No Error!";
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   Return true if an error caught during event execution is a temporary error
 | |
|   that will cause automatic retry of the event group during parallel
 | |
|   replication, false otherwise.
 | |
| 
 | |
|   In parallel replication, conflicting transactions can occasionally cause
 | |
|   deadlocks; such errors are handled automatically by rolling back re-trying
 | |
|   the transactions, so should not pollute the error log.
 | |
| */
 | |
| static bool
 | |
| is_parallel_retry_error(rpl_group_info *rgi, int err)
 | |
| {
 | |
|   if (!rgi->is_parallel_exec)
 | |
|     return false;
 | |
|   if (rgi->speculation == rpl_group_info::SPECULATE_OPTIMISTIC)
 | |
|     return true;
 | |
|   if (rgi->killed_for_retry &&
 | |
|       (err == ER_QUERY_INTERRUPTED || err == ER_CONNECTION_KILLED))
 | |
|     return true;
 | |
|   return has_temporary_error(rgi->thd);
 | |
| }
 | |
| 
 | |
| /**
 | |
|   Accumulate a Diagnostics_area's errors and warnings into an output buffer
 | |
| 
 | |
|     @param errbuf       The output buffer to write error messages
 | |
|     @param errbuf_size  The size of the output buffer
 | |
|     @param da           The Diagnostics_area to check for errors
 | |
| */
 | |
| static void inline aggregate_da_errors(char *errbuf, size_t errbuf_size,
 | |
|                                        Diagnostics_area *da)
 | |
| {
 | |
|   const char *errbuf_end= errbuf + errbuf_size;
 | |
|   char *slider;
 | |
|   Diagnostics_area::Sql_condition_iterator it= da->sql_conditions();
 | |
|   const Sql_condition *err;
 | |
|   size_t len;
 | |
|   for (err= it++, slider= errbuf; err && slider < errbuf_end - 1;
 | |
|        slider += len, err= it++)
 | |
|   {
 | |
|     len= my_snprintf(slider, errbuf_end - slider,
 | |
|                      " %s, Error_code: %d;", err->get_message_text(),
 | |
|                      err->get_sql_errno());
 | |
|   }
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|    Error reporting facility for Rows_log_event::do_apply_event
 | |
| 
 | |
|    @param level     error, warning or info
 | |
|    @param ha_error  HA_ERR_ code
 | |
|    @param rli       pointer to the active Relay_log_info instance
 | |
|    @param thd       pointer to the slave thread's thd
 | |
|    @param table     pointer to the event's table object
 | |
|    @param type      the type of the event
 | |
|    @param log_name  the master binlog file name
 | |
|    @param pos       the master binlog file pos (the next after the event)
 | |
| 
 | |
| */
 | |
| static void inline slave_rows_error_report(enum loglevel level, int ha_error,
 | |
|                                            rpl_group_info *rgi, THD *thd,
 | |
|                                            TABLE *table, const char * type,
 | |
|                                            const char *log_name, my_off_t pos)
 | |
| {
 | |
|   const char *handler_error= (ha_error ? HA_ERR(ha_error) : NULL);
 | |
|   char buff[MAX_SLAVE_ERRMSG];
 | |
|   Relay_log_info const *rli= rgi->rli;
 | |
|   buff[0]= 0;
 | |
|   int errcode= thd->is_error() ? thd->get_stmt_da()->sql_errno() : 0;
 | |
| 
 | |
|   /*
 | |
|     In parallel replication, deadlocks or other temporary errors can happen
 | |
|     occasionally in normal operation, they will be handled correctly and
 | |
|     automatically by re-trying the transactions. So do not pollute the error
 | |
|     log with messages about them.
 | |
|   */
 | |
|   if (is_parallel_retry_error(rgi, errcode))
 | |
|     return;
 | |
| 
 | |
|   aggregate_da_errors(buff, sizeof(buff), thd->get_stmt_da());
 | |
| 
 | |
|   if (ha_error != 0)
 | |
|     rli->report(level, errcode, rgi->gtid_info(),
 | |
|                 "Could not execute %s event on table %s.%s;"
 | |
|                 "%s handler error %s; "
 | |
|                 "the event's master log %s, end_log_pos %llu",
 | |
|                 type, table->s->db.str, table->s->table_name.str,
 | |
|                 buff, handler_error == NULL ? "<unknown>" : handler_error,
 | |
|                 log_name, pos);
 | |
|   else
 | |
|     rli->report(level, errcode, rgi->gtid_info(),
 | |
|                 "Could not execute %s event on table %s.%s;"
 | |
|                 "%s the event's master log %s, end_log_pos %llu",
 | |
|                 type, table->s->db.str, table->s->table_name.str,
 | |
|                 buff, log_name, pos);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| static void set_thd_db(THD *thd, Rpl_filter *rpl_filter,
 | |
|                        const char *db, uint32 db_len)
 | |
| {
 | |
|   char lcase_db_buf[NAME_LEN +1];
 | |
|   LEX_CSTRING new_db;
 | |
|   new_db.length= db_len;
 | |
|   if (lower_case_table_names == 1)
 | |
|   {
 | |
|     strmov(lcase_db_buf, db);
 | |
|     my_casedn_str(system_charset_info, lcase_db_buf);
 | |
|     new_db.str= lcase_db_buf;
 | |
|   }
 | |
|   else
 | |
|     new_db.str= db;
 | |
|   /* TODO WARNING this makes rewrite_db respect lower_case_table_names values
 | |
|    * for more info look MDEV-17446 */
 | |
|   new_db.str= rpl_filter->get_rewrite_db(new_db.str, &new_db.length);
 | |
|   thd->set_db(&new_db);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| inline int idempotent_error_code(int err_code)
 | |
| {
 | |
|   int ret= 0;
 | |
| 
 | |
|   switch (err_code)
 | |
|   {
 | |
|     case 0:
 | |
|       ret= 1;
 | |
|     break;
 | |
|     /*
 | |
|       The following list of "idempotent" errors
 | |
|       means that an error from the list might happen
 | |
|       because of idempotent (more than once)
 | |
|       applying of a binlog file.
 | |
|       Notice, that binlog has a  ddl operation its
 | |
|       second applying may cause
 | |
| 
 | |
|       case HA_ERR_TABLE_DEF_CHANGED:
 | |
|       case HA_ERR_CANNOT_ADD_FOREIGN:
 | |
| 
 | |
|       which are not included into to the list.
 | |
| 
 | |
|       Note that HA_ERR_RECORD_DELETED is not in the list since
 | |
|       do_exec_row() should not return that error code.
 | |
|     */
 | |
|     case HA_ERR_RECORD_CHANGED:
 | |
|     case HA_ERR_KEY_NOT_FOUND:
 | |
|     case HA_ERR_END_OF_FILE:
 | |
|     case HA_ERR_FOUND_DUPP_KEY:
 | |
|     case HA_ERR_FOUND_DUPP_UNIQUE:
 | |
|     case HA_ERR_FOREIGN_DUPLICATE_KEY:
 | |
|     case HA_ERR_NO_REFERENCED_ROW:
 | |
|     case HA_ERR_ROW_IS_REFERENCED:
 | |
|       ret= 1;
 | |
|     break;
 | |
|     default:
 | |
|       ret= 0;
 | |
|     break;
 | |
|   }
 | |
|   return (ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|   Ignore error code specified on command line.
 | |
| */
 | |
| 
 | |
| inline int ignored_error_code(int err_code)
 | |
| {
 | |
|   if (use_slave_mask && bitmap_is_set(&slave_error_mask, err_code))
 | |
|   {
 | |
|     statistic_increment(slave_skipped_errors, LOCK_status);
 | |
|     return 1;
 | |
|   }
 | |
|   return err_code == ER_SLAVE_IGNORED_TABLE;
 | |
| }
 | |
| 
 | |
| /*
 | |
|   This function converts an engine's error to a server error.
 | |
|    
 | |
|   If the thread does not have an error already reported, it tries to 
 | |
|   define it by calling the engine's method print_error. However, if a 
 | |
|   mapping is not found, it uses the ER_UNKNOWN_ERROR and prints out a 
 | |
|   warning message.
 | |
| */ 
 | |
| int convert_handler_error(int error, THD* thd, TABLE *table)
 | |
| {
 | |
|   uint actual_error= (thd->is_error() ? thd->get_stmt_da()->sql_errno() :
 | |
|                            0);
 | |
| 
 | |
|   if (actual_error == 0)
 | |
|   {
 | |
|     table->file->print_error(error, MYF(0));
 | |
|     actual_error= (thd->is_error() ? thd->get_stmt_da()->sql_errno() :
 | |
|                         ER_UNKNOWN_ERROR);
 | |
|     if (actual_error == ER_UNKNOWN_ERROR)
 | |
|       if (global_system_variables.log_warnings)
 | |
|         sql_print_warning("Unknown error detected %d in handler", error);
 | |
|   }
 | |
| 
 | |
|   return (actual_error);
 | |
| }
 | |
| 
 | |
| inline bool concurrency_error_code(int error)
 | |
| {
 | |
|   switch (error)
 | |
|   {
 | |
|   case ER_LOCK_WAIT_TIMEOUT:
 | |
|   case ER_LOCK_DEADLOCK:
 | |
|   case ER_XA_RBDEADLOCK:
 | |
|     return TRUE;
 | |
|   default: 
 | |
|     return (FALSE);
 | |
|   }
 | |
| }
 | |
| 
 | |
| inline bool unexpected_error_code(int unexpected_error)
 | |
| {
 | |
|   switch (unexpected_error) 
 | |
|   {
 | |
|   case ER_NET_READ_ERROR:
 | |
|   case ER_NET_ERROR_ON_WRITE:
 | |
|   case ER_QUERY_INTERRUPTED:
 | |
|   case ER_STATEMENT_TIMEOUT:
 | |
|   case ER_CONNECTION_KILLED:
 | |
|   case ER_SERVER_SHUTDOWN:
 | |
|   case ER_NEW_ABORTING_CONNECTION:
 | |
|     return(TRUE);
 | |
|   default:
 | |
|     return(FALSE);
 | |
|   }
 | |
| }
 | |
| 
 | |
| /*
 | |
|   pretty_print_str()
 | |
| */
 | |
| 
 | |
| static void
 | |
| pretty_print_str(String *packet, const char *str, int len)
 | |
| {
 | |
|   const char *end= str + len;
 | |
|   packet->append(STRING_WITH_LEN("'"));
 | |
|   while (str < end)
 | |
|   {
 | |
|     char c;
 | |
|     switch ((c=*str++)) {
 | |
|     case '\n': packet->append(STRING_WITH_LEN("\\n")); break;
 | |
|     case '\r': packet->append(STRING_WITH_LEN("\\r")); break;
 | |
|     case '\\': packet->append(STRING_WITH_LEN("\\\\")); break;
 | |
|     case '\b': packet->append(STRING_WITH_LEN("\\b")); break;
 | |
|     case '\t': packet->append(STRING_WITH_LEN("\\t")); break;
 | |
|     case '\'': packet->append(STRING_WITH_LEN("\\'")); break;
 | |
|     case 0   : packet->append(STRING_WITH_LEN("\\0")); break;
 | |
|     default:
 | |
|       packet->append(&c, 1);
 | |
|       break;
 | |
|     }
 | |
|   }
 | |
|   packet->append(STRING_WITH_LEN("'"));
 | |
| }
 | |
| #endif /* HAVE_REPLICATION */
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| /**
 | |
|   Create a prefix for the temporary files that is to be used for
 | |
|   load data file name for this master
 | |
| 
 | |
|   @param name	           Store prefix of name here
 | |
|   @param connection_name   Connection name
 | |
|  
 | |
|   @return pointer to end of name
 | |
| 
 | |
|   @description
 | |
|   We assume that FN_REFLEN is big enough to hold
 | |
|   MAX_CONNECTION_NAME * MAX_FILENAME_MBWIDTH characters + 2 numbers +
 | |
|   a short extension.
 | |
| 
 | |
|   The resulting file name has the following parts, each separated with a '-'
 | |
|   - PREFIX_SQL_LOAD (SQL_LOAD-)
 | |
|   - If a connection name is given (multi-master setup):
 | |
|     - Add an extra '-' to mark that this is a multi-master file
 | |
|     - connection name in lower case, converted to safe file characters.
 | |
|     (see create_logfile_name_with_suffix()).
 | |
|   - server_id
 | |
|   - A last '-' (after server_id).
 | |
| */
 | |
| 
 | |
| static char *load_data_tmp_prefix(char *name,
 | |
|                                   LEX_CSTRING *connection_name)
 | |
| {
 | |
|   name= strmov(name, PREFIX_SQL_LOAD);
 | |
|   if (connection_name->length)
 | |
|   {
 | |
|     uint buf_length;
 | |
|     uint errors;
 | |
|     /* Add marker that this is a multi-master-file */
 | |
|     *name++='-';
 | |
|     /* Convert connection_name to a safe filename */
 | |
|     buf_length= strconvert(system_charset_info, connection_name->str, FN_REFLEN,
 | |
|                            &my_charset_filename, name, FN_REFLEN, &errors);
 | |
|     name+= buf_length;
 | |
|     *name++= '-';
 | |
|   }
 | |
|   name= int10_to_str(global_system_variables.server_id, name, 10);
 | |
|   *name++ = '-';
 | |
|   *name= '\0';                                  // For testing prefixes
 | |
|   return name;
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|   Creates a temporary name for LOAD DATA INFILE
 | |
| 
 | |
|   @param buf		      Store new filename here
 | |
|   @param file_id	      File_id (part of file name)
 | |
|   @param event_server_id      Event_id (part of file name)
 | |
|   @param ext		      Extension for file name
 | |
| 
 | |
|   @return
 | |
|     Pointer to start of extension
 | |
| */
 | |
| 
 | |
| static char *slave_load_file_stem(char *buf, uint file_id,
 | |
|                                   int event_server_id, const char *ext,
 | |
|                                   LEX_CSTRING *connection_name)
 | |
| {
 | |
|   char *res;
 | |
|   res= buf+ unpack_dirname(buf, slave_load_tmpdir);
 | |
|   to_unix_path(buf);
 | |
|   buf= load_data_tmp_prefix(res, connection_name);
 | |
|   buf= int10_to_str(event_server_id, buf, 10);
 | |
|   *buf++ = '-';
 | |
|   res= int10_to_str(file_id, buf, 10);
 | |
|   strmov(res, ext);                             // Add extension last
 | |
|   return res;                                   // Pointer to extension
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| /**
 | |
|   Delete all temporary files used for SQL_LOAD.
 | |
| */
 | |
| 
 | |
| static void cleanup_load_tmpdir(LEX_CSTRING *connection_name)
 | |
| {
 | |
|   MY_DIR *dirp;
 | |
|   FILEINFO *file;
 | |
|   uint i;
 | |
|   char dir[FN_REFLEN], fname[FN_REFLEN];
 | |
|   char prefbuf[31 + MAX_CONNECTION_NAME* MAX_FILENAME_MBWIDTH + 1];
 | |
|   DBUG_ENTER("cleanup_load_tmpdir");
 | |
| 
 | |
|   unpack_dirname(dir, slave_load_tmpdir);
 | |
|   if (!(dirp=my_dir(dir, MYF(MY_WME))))
 | |
|     return;
 | |
| 
 | |
|   /* 
 | |
|      When we are deleting temporary files, we should only remove
 | |
|      the files associated with the server id of our server.
 | |
|      We don't use event_server_id here because since we've disabled
 | |
|      direct binlogging of Create_file/Append_file/Exec_load events
 | |
|      we cannot meet Start_log event in the middle of events from one 
 | |
|      LOAD DATA.
 | |
|   */
 | |
| 
 | |
|   load_data_tmp_prefix(prefbuf, connection_name);
 | |
|   DBUG_PRINT("enter", ("dir: '%s'  prefix: '%s'", dir, prefbuf));
 | |
| 
 | |
|   for (i=0 ; i < (uint)dirp->number_of_files; i++)
 | |
|   {
 | |
|     file=dirp->dir_entry+i;
 | |
|     if (is_prefix(file->name, prefbuf))
 | |
|     {
 | |
|       fn_format(fname,file->name,slave_load_tmpdir,"",MY_UNPACK_FILENAME);
 | |
|       mysql_file_delete(key_file_misc, fname, MYF(0));
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   my_dirend(dirp);
 | |
|   DBUG_VOID_RETURN;
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| /**
 | |
|   Append a version of the 'str' string suitable for use in a query to
 | |
|   the 'to' string.  To generate a correct escaping, the character set
 | |
|   information in 'csinfo' is used.
 | |
| */
 | |
| 
 | |
| int append_query_string(CHARSET_INFO *csinfo, String *to,
 | |
|                         const char *str, size_t len, bool no_backslash)
 | |
| {
 | |
|   char *beg, *ptr;
 | |
|   my_bool overflow;
 | |
|   uint32 const orig_len= to->length();
 | |
|   if (to->reserve(orig_len + len * 2 + 4))
 | |
|     return 1;
 | |
| 
 | |
|   beg= (char*) to->ptr() + to->length();
 | |
|   ptr= beg;
 | |
|   if (csinfo->escape_with_backslash_is_dangerous)
 | |
|     ptr= str_to_hex(ptr, str, len);
 | |
|   else
 | |
|   {
 | |
|     *ptr++= '\'';
 | |
|     if (!no_backslash)
 | |
|     {
 | |
|       ptr+= escape_string_for_mysql(csinfo, ptr, 0, str, len, &overflow);
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       const char *frm_str= str;
 | |
| 
 | |
|       for (; frm_str < (str + len); frm_str++)
 | |
|       {
 | |
|         /* Using '' way to represent "'" */
 | |
|         if (*frm_str == '\'')
 | |
|           *ptr++= *frm_str;
 | |
| 
 | |
|         *ptr++= *frm_str;
 | |
|       }
 | |
|     }
 | |
| 
 | |
|     *ptr++= '\'';
 | |
|   }
 | |
|   to->length((uint32)(orig_len + ptr - beg));
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Log_event methods (= the parent class of all events)
 | |
| **************************************************************************/
 | |
| 
 | |
| Log_event::Log_event(THD* thd_arg, uint16 flags_arg, bool using_trans)
 | |
|   :log_pos(0), temp_buf(0), exec_time(0), thd(thd_arg),
 | |
|    checksum_alg(BINLOG_CHECKSUM_ALG_UNDEF)
 | |
| {
 | |
|   server_id=	thd->variables.server_id;
 | |
|   when=         thd->start_time;
 | |
|   when_sec_part=thd->start_time_sec_part;
 | |
| 
 | |
|   if (using_trans)
 | |
|     cache_type= Log_event::EVENT_TRANSACTIONAL_CACHE;
 | |
|   else
 | |
|     cache_type= Log_event::EVENT_STMT_CACHE;
 | |
|   flags= flags_arg |
 | |
|     (thd->variables.option_bits & OPTION_SKIP_REPLICATION ?
 | |
|      LOG_EVENT_SKIP_REPLICATION_F : 0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|   This minimal constructor is for when you are not even sure that there
 | |
|   is a valid THD. For example in the server when we are shutting down or
 | |
|   flushing logs after receiving a SIGHUP (then we must write a Rotate to
 | |
|   the binlog but we have no THD, so we need this minimal constructor).
 | |
| */
 | |
| 
 | |
| Log_event::Log_event()
 | |
|   :temp_buf(0), exec_time(0), flags(0), cache_type(EVENT_INVALID_CACHE),
 | |
|    thd(0), checksum_alg(BINLOG_CHECKSUM_ALG_UNDEF)
 | |
| {
 | |
|   server_id=	global_system_variables.server_id;
 | |
|   /*
 | |
|     We can't call my_time() here as this would cause a call before
 | |
|     my_init() is called
 | |
|   */
 | |
|   when=         0;
 | |
|   when_sec_part=0;
 | |
|   log_pos=	0;
 | |
| }
 | |
| 
 | |
| 
 | |
| 
 | |
| #ifdef HAVE_REPLICATION
 | |
| 
 | |
| int Log_event::do_update_pos(rpl_group_info *rgi)
 | |
| {
 | |
|   Relay_log_info *rli= rgi->rli;
 | |
|   DBUG_ENTER("Log_event::do_update_pos");
 | |
| 
 | |
|   DBUG_ASSERT(!rli->belongs_to_client());
 | |
|   /*
 | |
|     rli is null when (as far as I (Guilhem) know) the caller is
 | |
|     Load_log_event::do_apply_event *and* that one is called from
 | |
|     Execute_load_log_event::do_apply_event.  In this case, we don't
 | |
|     do anything here ; Execute_load_log_event::do_apply_event will
 | |
|     call Log_event::do_apply_event again later with the proper rli.
 | |
|     Strictly speaking, if we were sure that rli is null only in the
 | |
|     case discussed above, 'if (rli)' is useless here.  But as we are
 | |
|     not 100% sure, keep it for now.
 | |
| 
 | |
|     Matz: I don't think we will need this check with this refactoring.
 | |
|   */
 | |
|   if (rli)
 | |
|   {
 | |
|     /*
 | |
|       In parallel execution, delay position update for the events that are
 | |
|       not part of event groups (format description, rotate, and such) until
 | |
|       the actual event execution reaches that point.
 | |
|     */
 | |
|     if (!rgi->is_parallel_exec || is_group_event(get_type_code()))
 | |
|       rli->stmt_done(log_pos, thd, rgi);
 | |
|   }
 | |
|   DBUG_RETURN(0);                                  // Cannot fail currently
 | |
| }
 | |
| 
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   Relay_log_info *rli= rgi->rli;
 | |
|   DBUG_PRINT("info", ("ev->server_id: %lu, ::server_id: %lu,"
 | |
|                       " rli->replicate_same_server_id: %d,"
 | |
|                       " rli->slave_skip_counter: %llu",
 | |
|                       (ulong) server_id,
 | |
|                       (ulong) global_system_variables.server_id,
 | |
|                       rli->replicate_same_server_id,
 | |
|                       rli->slave_skip_counter));
 | |
|   if ((server_id == global_system_variables.server_id &&
 | |
|        !(rli->replicate_same_server_id || (flags &  LOG_EVENT_ACCEPT_OWN_F))) ||
 | |
|       (rli->slave_skip_counter == 1 && rli->is_in_group()) ||
 | |
|       (flags & LOG_EVENT_SKIP_REPLICATION_F &&
 | |
|        opt_replicate_events_marked_for_skip != RPL_SKIP_REPLICATE))
 | |
|     return EVENT_SKIP_IGNORE;
 | |
|   if (rli->slave_skip_counter > 0)
 | |
|     return EVENT_SKIP_COUNT;
 | |
|   return EVENT_SKIP_NOT;
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   Log_event::pack_info()
 | |
| */
 | |
| 
 | |
| void Log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   protocol->store("", 0, &my_charset_bin);
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|   Only called by SHOW BINLOG EVENTS
 | |
| */
 | |
| int Log_event::net_send(Protocol *protocol, const char* log_name, my_off_t pos)
 | |
| {
 | |
|   const char *p= strrchr(log_name, FN_LIBCHAR);
 | |
|   const char *event_type;
 | |
|   if (p)
 | |
|     log_name = p + 1;
 | |
| 
 | |
|   protocol->prepare_for_resend();
 | |
|   protocol->store(log_name, strlen(log_name), &my_charset_bin);
 | |
|   protocol->store((ulonglong) pos);
 | |
|   event_type = get_type_str();
 | |
|   protocol->store(event_type, strlen(event_type), &my_charset_bin);
 | |
|   protocol->store((uint32) server_id);
 | |
|   protocol->store((ulonglong) log_pos);
 | |
|   pack_info(protocol);
 | |
|   return protocol->write();
 | |
| }
 | |
| #endif /* HAVE_REPLICATION */
 | |
| 
 | |
| 
 | |
| /**
 | |
|   init_show_field_list() prepares the column names and types for the
 | |
|   output of SHOW BINLOG EVENTS; it is used only by SHOW BINLOG
 | |
|   EVENTS.
 | |
| */
 | |
| 
 | |
| void Log_event::init_show_field_list(THD *thd, List<Item>* field_list)
 | |
| {
 | |
|   MEM_ROOT *mem_root= thd->mem_root;
 | |
|   field_list->push_back(new (mem_root)
 | |
|                         Item_empty_string(thd, "Log_name", 20),
 | |
|                         mem_root);
 | |
|   field_list->push_back(new (mem_root)
 | |
|                         Item_return_int(thd, "Pos",
 | |
|                                         MY_INT64_NUM_DECIMAL_DIGITS,
 | |
|                                         MYSQL_TYPE_LONGLONG),
 | |
|                         mem_root);
 | |
|   field_list->push_back(new (mem_root)
 | |
|                         Item_empty_string(thd, "Event_type", 20),
 | |
|                         mem_root);
 | |
|   field_list->push_back(new (mem_root)
 | |
|                         Item_return_int(thd, "Server_id", 10,
 | |
|                                         MYSQL_TYPE_LONG),
 | |
|                         mem_root);
 | |
|   field_list->push_back(new (mem_root)
 | |
|                         Item_return_int(thd, "End_log_pos",
 | |
|                                         MY_INT64_NUM_DECIMAL_DIGITS,
 | |
|                                         MYSQL_TYPE_LONGLONG),
 | |
|                         mem_root);
 | |
|   field_list->push_back(new (mem_root) Item_empty_string(thd, "Info", 20),
 | |
|                         mem_root);
 | |
| }
 | |
| 
 | |
| /**
 | |
|    A decider of whether to trigger checksum computation or not.
 | |
|    To be invoked in Log_event::write() stack.
 | |
|    The decision is positive 
 | |
| 
 | |
|     S,M) if it's been marked for checksumming with @c checksum_alg
 | |
|     
 | |
|     M) otherwise, if @@global.binlog_checksum is not NONE and the event is 
 | |
|        directly written to the binlog file.
 | |
|        The to-be-cached event decides at @c write_cache() time.
 | |
| 
 | |
|    Otherwise the decision is negative.
 | |
| 
 | |
|    @note   A side effect of the method is altering Log_event::checksum_alg
 | |
|            it the latter was undefined at calling.
 | |
| 
 | |
|    @return true   Checksum should be used. Log_event::checksum_alg is set.
 | |
|    @return false  No checksum
 | |
| */
 | |
| 
 | |
| my_bool Log_event::need_checksum()
 | |
| {
 | |
|   my_bool ret;
 | |
|   DBUG_ENTER("Log_event::need_checksum");
 | |
| 
 | |
|   /* 
 | |
|      few callers of Log_event::write 
 | |
|      (incl FD::write, FD constructing code on the slave side, Rotate relay log
 | |
|      and Stop event) 
 | |
|      provides their checksum alg preference through Log_event::checksum_alg.
 | |
|   */
 | |
|   if (checksum_alg != BINLOG_CHECKSUM_ALG_UNDEF)
 | |
|     ret= checksum_alg != BINLOG_CHECKSUM_ALG_OFF;
 | |
|   else
 | |
|   {
 | |
|     ret= binlog_checksum_options && cache_type == Log_event::EVENT_NO_CACHE;
 | |
|     checksum_alg= ret ? (enum_binlog_checksum_alg)binlog_checksum_options
 | |
|                       : BINLOG_CHECKSUM_ALG_OFF;
 | |
|   }
 | |
|   /*
 | |
|     FD calls the methods before data_written has been calculated.
 | |
|     The following invariant claims if the current is not the first
 | |
|     call (and therefore data_written is not zero) then `ret' must be
 | |
|     TRUE. It may not be null because FD is always checksummed.
 | |
|   */
 | |
|   
 | |
|   DBUG_ASSERT(get_type_code() != FORMAT_DESCRIPTION_EVENT || ret ||
 | |
|               data_written == 0);
 | |
| 
 | |
|   DBUG_ASSERT(!ret || 
 | |
|               ((checksum_alg == binlog_checksum_options ||
 | |
|                /* 
 | |
|                   Stop event closes the relay-log and its checksum alg
 | |
|                   preference is set by the caller can be different
 | |
|                   from the server's binlog_checksum_options.
 | |
|                */
 | |
|                get_type_code() == STOP_EVENT ||
 | |
|                /* 
 | |
|                   Rotate:s can be checksummed regardless of the server's
 | |
|                   binlog_checksum_options. That applies to both
 | |
|                   the local RL's Rotate and the master's Rotate
 | |
|                   which IO thread instantiates via queue_binlog_ver_3_event.
 | |
|                */
 | |
|                get_type_code() == ROTATE_EVENT ||
 | |
|                get_type_code() == START_ENCRYPTION_EVENT ||
 | |
|                /* FD is always checksummed */
 | |
|                get_type_code() == FORMAT_DESCRIPTION_EVENT) && 
 | |
|                checksum_alg != BINLOG_CHECKSUM_ALG_OFF));
 | |
| 
 | |
|   DBUG_ASSERT(checksum_alg != BINLOG_CHECKSUM_ALG_UNDEF);
 | |
| 
 | |
|   DBUG_ASSERT(((get_type_code() != ROTATE_EVENT &&
 | |
|                 get_type_code() != STOP_EVENT) ||
 | |
|                get_type_code() != FORMAT_DESCRIPTION_EVENT) ||
 | |
|               cache_type == Log_event::EVENT_NO_CACHE);
 | |
| 
 | |
|   DBUG_RETURN(ret);
 | |
| }
 | |
| 
 | |
| int Log_event_writer::write_internal(const uchar *pos, size_t len)
 | |
| {
 | |
|   DBUG_ASSERT(!ctx || encrypt_or_write == &Log_event_writer::encrypt_and_write);
 | |
|   if (my_b_safe_write(file, pos, len))
 | |
|   {
 | |
|     DBUG_PRINT("error", ("write to log failed: %d", my_errno));
 | |
|     return 1;
 | |
|   }
 | |
|   bytes_written+= len;
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| /*
 | |
|   as soon as encryption produces the first output block, write event_len
 | |
|   where it should be in a valid event header
 | |
| */
 | |
| int Log_event_writer::maybe_write_event_len(uchar *pos, size_t len)
 | |
| {
 | |
|   if (len && event_len)
 | |
|   {
 | |
|     DBUG_ASSERT(len >= EVENT_LEN_OFFSET);
 | |
|     if (write_internal(pos + EVENT_LEN_OFFSET - 4, 4))
 | |
|       return 1;
 | |
|     int4store(pos + EVENT_LEN_OFFSET - 4, event_len);
 | |
|     event_len= 0;
 | |
|   }
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| int Log_event_writer::encrypt_and_write(const uchar *pos, size_t len)
 | |
| {
 | |
|   uchar *dst;
 | |
|   size_t dstsize;
 | |
|   uint dstlen;
 | |
|   int res;                                      // Safe as res is always set
 | |
|   DBUG_ASSERT(ctx);
 | |
| 
 | |
|   if (!len)
 | |
|     return 0;
 | |
| 
 | |
|   dstsize= encryption_encrypted_length((uint)len, ENCRYPTION_KEY_SYSTEM_DATA,
 | |
|                                        crypto->key_version);
 | |
|   if (!(dst= (uchar*)my_safe_alloca(dstsize)))
 | |
|     return 1;
 | |
| 
 | |
|   if (encryption_ctx_update(ctx, pos, (uint)len, dst, &dstlen))
 | |
|   {
 | |
|     res= 1;
 | |
|     goto err;
 | |
|   }
 | |
| 
 | |
|   if (maybe_write_event_len(dst, dstlen))
 | |
|   {
 | |
|     res= 1;
 | |
|     goto err;
 | |
|   }
 | |
| 
 | |
|   res= write_internal(dst, dstlen);
 | |
| 
 | |
| err:
 | |
|   my_safe_afree(dst, dstsize);
 | |
|   return res;
 | |
| }
 | |
| 
 | |
| int Log_event_writer::write_header(uchar *pos, size_t len)
 | |
| {
 | |
|   DBUG_ENTER("Log_event_writer::write_header");
 | |
|   /*
 | |
|     recording checksum of FD event computed with dropped
 | |
|     possibly active LOG_EVENT_BINLOG_IN_USE_F flag.
 | |
|     Similar step at verication: the active flag is dropped before
 | |
|     checksum computing.
 | |
|   */
 | |
|   if (checksum_len)
 | |
|   {
 | |
|     uchar save=pos[FLAGS_OFFSET];
 | |
|     pos[FLAGS_OFFSET]&= ~LOG_EVENT_BINLOG_IN_USE_F;
 | |
|     crc= my_checksum(0, pos, len);
 | |
|     pos[FLAGS_OFFSET]= save;
 | |
|   }
 | |
| 
 | |
|   if (ctx)
 | |
|   {
 | |
|     uchar iv[BINLOG_IV_LENGTH];
 | |
|     crypto->set_iv(iv, (uint32)my_b_safe_tell(file));
 | |
|     if (encryption_ctx_init(ctx, crypto->key, crypto->key_length,
 | |
|            iv, sizeof(iv), ENCRYPTION_FLAG_ENCRYPT | ENCRYPTION_FLAG_NOPAD,
 | |
|            ENCRYPTION_KEY_SYSTEM_DATA, crypto->key_version))
 | |
|       DBUG_RETURN(1);
 | |
| 
 | |
|     DBUG_ASSERT(len >= LOG_EVENT_HEADER_LEN);
 | |
|     event_len= uint4korr(pos + EVENT_LEN_OFFSET);
 | |
|     DBUG_ASSERT(event_len >= len);
 | |
|     memcpy(pos + EVENT_LEN_OFFSET, pos, 4);
 | |
|     pos+= 4;
 | |
|     len-= 4;
 | |
|   }
 | |
|   DBUG_RETURN((this->*encrypt_or_write)(pos, len));
 | |
| }
 | |
| 
 | |
| int Log_event_writer::write_data(const uchar *pos, size_t len)
 | |
| {
 | |
|   DBUG_ENTER("Log_event_writer::write_data");
 | |
| 
 | |
|   if (!len)
 | |
|     DBUG_RETURN(0);
 | |
| 
 | |
|   if (checksum_len)
 | |
|     crc= my_checksum(crc, pos, len);
 | |
| 
 | |
|   DBUG_RETURN((this->*encrypt_or_write)(pos, len));
 | |
| }
 | |
| 
 | |
| int Log_event_writer::write_footer()
 | |
| {
 | |
|   DBUG_ENTER("Log_event_writer::write_footer");
 | |
|   if (checksum_len)
 | |
|   {
 | |
|     uchar checksum_buf[BINLOG_CHECKSUM_LEN];
 | |
|     int4store(checksum_buf, crc);
 | |
|     if ((this->*encrypt_or_write)(checksum_buf, BINLOG_CHECKSUM_LEN))
 | |
|       DBUG_RETURN(ER_ERROR_ON_WRITE);
 | |
|   }
 | |
|   if (ctx)
 | |
|   {
 | |
|     uint dstlen;
 | |
|     uchar dst[MY_AES_BLOCK_SIZE*2];
 | |
|     if (encryption_ctx_finish(ctx, dst, &dstlen))
 | |
|       DBUG_RETURN(1);
 | |
|     if (maybe_write_event_len(dst, dstlen) || write_internal(dst, dstlen))
 | |
|       DBUG_RETURN(ER_ERROR_ON_WRITE);
 | |
|   }
 | |
|   DBUG_RETURN(0);
 | |
| }
 | |
| 
 | |
| /*
 | |
|   Log_event::write_header()
 | |
| */
 | |
| 
 | |
| bool Log_event::write_header(size_t event_data_length)
 | |
| {
 | |
|   uchar header[LOG_EVENT_HEADER_LEN];
 | |
|   ulong now;
 | |
|   DBUG_ENTER("Log_event::write_header");
 | |
|   DBUG_PRINT("enter", ("filepos: %lld  length: %zu type: %d",
 | |
|                        (longlong) writer->pos(), event_data_length,
 | |
|                        (int) get_type_code()));
 | |
| 
 | |
|   writer->checksum_len= need_checksum() ? BINLOG_CHECKSUM_LEN : 0;
 | |
| 
 | |
|   /* Store number of bytes that will be written by this event */
 | |
|   data_written= event_data_length + sizeof(header) + writer->checksum_len;
 | |
| 
 | |
|   /*
 | |
|     log_pos != 0 if this is relay-log event. In this case we should not
 | |
|     change the position
 | |
|   */
 | |
| 
 | |
|   if (is_artificial_event())
 | |
|   {
 | |
|     /*
 | |
|       Artificial events are automatically generated and do not exist
 | |
|       in master's binary log, so log_pos should be set to 0.
 | |
|     */
 | |
|     log_pos= 0;
 | |
|   }
 | |
|   else  if (!log_pos)
 | |
|   {
 | |
|     /*
 | |
|       Calculate the position of where the next event will start
 | |
|       (end of this event, that is).
 | |
|     */
 | |
| 
 | |
|     log_pos= writer->pos() + data_written;
 | |
|     
 | |
|     DBUG_EXECUTE_IF("dbug_master_binlog_over_2GB", log_pos += (1ULL <<31););
 | |
|   }
 | |
| 
 | |
|   now= get_time();                               // Query start time
 | |
| 
 | |
|   /*
 | |
|     Header will be of size LOG_EVENT_HEADER_LEN for all events, except for
 | |
|     FORMAT_DESCRIPTION_EVENT and ROTATE_EVENT, where it will be
 | |
|     LOG_EVENT_MINIMAL_HEADER_LEN (remember these 2 have a frozen header,
 | |
|     because we read them before knowing the format).
 | |
|   */
 | |
| 
 | |
|   int4store(header, now);              // timestamp
 | |
|   header[EVENT_TYPE_OFFSET]= get_type_code();
 | |
|   int4store(header+ SERVER_ID_OFFSET, server_id);
 | |
|   int4store(header+ EVENT_LEN_OFFSET, data_written);
 | |
|   int4store(header+ LOG_POS_OFFSET, log_pos);
 | |
|   int2store(header + FLAGS_OFFSET, flags);
 | |
| 
 | |
|   bool ret= writer->write_header(header, sizeof(header));
 | |
|   DBUG_RETURN(ret);
 | |
| }
 | |
| 
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| inline Log_event::enum_skip_reason
 | |
| Log_event::continue_group(rpl_group_info *rgi)
 | |
| {
 | |
|   if (rgi->rli->slave_skip_counter == 1)
 | |
|     return Log_event::EVENT_SKIP_IGNORE;
 | |
|   return Log_event::do_shall_skip(rgi);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Query_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| /**
 | |
|   This (which is used only for SHOW BINLOG EVENTS) could be updated to
 | |
|   print SET @@session_var=. But this is not urgent, as SHOW BINLOG EVENTS is
 | |
|   only an information, it does not produce suitable queries to replay (for
 | |
|   example it does not print LOAD DATA INFILE).
 | |
|   @todo
 | |
|     show the catalog ??
 | |
| */
 | |
| 
 | |
| void Query_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   // TODO: show the catalog ??
 | |
|   char buf_mem[1024];
 | |
|   String buf(buf_mem, sizeof(buf_mem), system_charset_info);
 | |
|   buf.real_alloc(9 + db_len + q_len);
 | |
|   if (!(flags & LOG_EVENT_SUPPRESS_USE_F)
 | |
|       && db && db_len)
 | |
|   {
 | |
|     buf.append(STRING_WITH_LEN("use "));
 | |
|     append_identifier(protocol->thd, &buf, db, db_len);
 | |
|     buf.append(STRING_WITH_LEN("; "));
 | |
|   }
 | |
| 
 | |
|   DBUG_ASSERT(!flags2 || flags2_inited);
 | |
| 
 | |
|   if (flags2 & (OPTION_NO_FOREIGN_KEY_CHECKS | OPTION_AUTO_IS_NULL |
 | |
|                 OPTION_RELAXED_UNIQUE_CHECKS |
 | |
|                 OPTION_NO_CHECK_CONSTRAINT_CHECKS |
 | |
|                 OPTION_IF_EXISTS))
 | |
|   {
 | |
|     buf.append(STRING_WITH_LEN("set "));
 | |
|     if (flags2 & OPTION_NO_FOREIGN_KEY_CHECKS)
 | |
|       buf.append(STRING_WITH_LEN("foreign_key_checks=1, "));
 | |
|     if (flags2 & OPTION_AUTO_IS_NULL)
 | |
|       buf.append(STRING_WITH_LEN("sql_auto_is_null, "));
 | |
|     if (flags2 & OPTION_RELAXED_UNIQUE_CHECKS)
 | |
|       buf.append(STRING_WITH_LEN("unique_checks=1, "));
 | |
|     if (flags2 & OPTION_NO_CHECK_CONSTRAINT_CHECKS)
 | |
|       buf.append(STRING_WITH_LEN("check_constraint_checks=1, "));
 | |
|     if (flags2 & OPTION_IF_EXISTS)
 | |
|       buf.append(STRING_WITH_LEN("@@sql_if_exists=1, "));
 | |
|     buf[buf.length()-2]=';';
 | |
|   }
 | |
|   if (query && q_len)
 | |
|     buf.append(query, q_len);
 | |
|   protocol->store(&buf);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| /**
 | |
|   Utility function for the next method (Query_log_event::write()) .
 | |
| */
 | |
| static void store_str_with_code_and_len(uchar **dst, const char *src,
 | |
|                                         uint len, uint code)
 | |
| {
 | |
|   /*
 | |
|     only 1 byte to store the length of catalog, so it should not
 | |
|     surpass 255
 | |
|   */
 | |
|   DBUG_ASSERT(len <= 255);
 | |
|   DBUG_ASSERT(src);
 | |
|   *((*dst)++)= (uchar) code;
 | |
|   *((*dst)++)= (uchar) len;
 | |
|   bmove(*dst, src, len);
 | |
|   (*dst)+= len;
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|   Query_log_event::write().
 | |
| 
 | |
|   @note
 | |
|     In this event we have to modify the header to have the correct
 | |
|     EVENT_LEN_OFFSET as we don't yet know how many status variables we
 | |
|     will print!
 | |
| */
 | |
| 
 | |
| bool Query_log_event::write()
 | |
| {
 | |
|   uchar buf[QUERY_HEADER_LEN + MAX_SIZE_LOG_EVENT_STATUS];
 | |
|   uchar *start, *start_of_status;
 | |
|   ulong event_length;
 | |
| 
 | |
|   if (!query)
 | |
|     return 1;                                   // Something wrong with event
 | |
| 
 | |
|   /*
 | |
|     We want to store the thread id:
 | |
|     (- as an information for the user when he reads the binlog)
 | |
|     - if the query uses temporary table: for the slave SQL thread to know to
 | |
|     which master connection the temp table belongs.
 | |
|     Now imagine we (write()) are called by the slave SQL thread (we are
 | |
|     logging a query executed by this thread; the slave runs with
 | |
|     --log-slave-updates). Then this query will be logged with
 | |
|     thread_id=the_thread_id_of_the_SQL_thread. Imagine that 2 temp tables of
 | |
|     the same name were created simultaneously on the master (in the master
 | |
|     binlog you have
 | |
|     CREATE TEMPORARY TABLE t; (thread 1)
 | |
|     CREATE TEMPORARY TABLE t; (thread 2)
 | |
|     ...)
 | |
|     then in the slave's binlog there will be
 | |
|     CREATE TEMPORARY TABLE t; (thread_id_of_the_slave_SQL_thread)
 | |
|     CREATE TEMPORARY TABLE t; (thread_id_of_the_slave_SQL_thread)
 | |
|     which is bad (same thread id!).
 | |
| 
 | |
|     To avoid this, we log the thread's thread id EXCEPT for the SQL
 | |
|     slave thread for which we log the original (master's) thread id.
 | |
|     Now this moves the bug: what happens if the thread id on the
 | |
|     master was 10 and when the slave replicates the query, a
 | |
|     connection number 10 is opened by a normal client on the slave,
 | |
|     and updates a temp table of the same name? We get a problem
 | |
|     again. To avoid this, in the handling of temp tables (sql_base.cc)
 | |
|     we use thread_id AND server_id.  TODO when this is merged into
 | |
|     4.1: in 4.1, slave_proxy_id has been renamed to pseudo_thread_id
 | |
|     and is a session variable: that's to make mysqlbinlog work with
 | |
|     temp tables. We probably need to introduce
 | |
| 
 | |
|     SET PSEUDO_SERVER_ID
 | |
|     for mysqlbinlog in 4.1. mysqlbinlog would print:
 | |
|     SET PSEUDO_SERVER_ID=
 | |
|     SET PSEUDO_THREAD_ID=
 | |
|     for each query using temp tables.
 | |
|   */
 | |
|   int4store(buf + Q_THREAD_ID_OFFSET, slave_proxy_id);
 | |
|   int4store(buf + Q_EXEC_TIME_OFFSET, exec_time);
 | |
|   buf[Q_DB_LEN_OFFSET] = (char) db_len;
 | |
|   int2store(buf + Q_ERR_CODE_OFFSET, error_code);
 | |
| 
 | |
|   /*
 | |
|     You MUST always write status vars in increasing order of code. This
 | |
|     guarantees that a slightly older slave will be able to parse those he
 | |
|     knows.
 | |
|   */
 | |
|   start_of_status= start= buf+QUERY_HEADER_LEN;
 | |
|   if (flags2_inited)
 | |
|   {
 | |
|     *start++= Q_FLAGS2_CODE;
 | |
|     int4store(start, flags2);
 | |
|     start+= 4;
 | |
|   }
 | |
|   if (sql_mode_inited)
 | |
|   {
 | |
|     *start++= Q_SQL_MODE_CODE;
 | |
|     int8store(start, (ulonglong)sql_mode);
 | |
|     start+= 8;
 | |
|   }
 | |
|   if (catalog_len) // i.e. this var is inited (false for 4.0 events)
 | |
|   {
 | |
|     store_str_with_code_and_len(&start,
 | |
|                                 catalog, catalog_len, Q_CATALOG_NZ_CODE);
 | |
|     /*
 | |
|       In 5.0.x where x<4 masters we used to store the end zero here. This was
 | |
|       a waste of one byte so we don't do it in x>=4 masters. We change code to
 | |
|       Q_CATALOG_NZ_CODE, because re-using the old code would make x<4 slaves
 | |
|       of this x>=4 master segfault (expecting a zero when there is
 | |
|       none). Remaining compatibility problems are: the older slave will not
 | |
|       find the catalog; but it is will not crash, and it's not an issue
 | |
|       that it does not find the catalog as catalogs were not used in these
 | |
|       older MySQL versions (we store it in binlog and read it from relay log
 | |
|       but do nothing useful with it). What is an issue is that the older slave
 | |
|       will stop processing the Q_* blocks (and jumps to the db/query) as soon
 | |
|       as it sees unknown Q_CATALOG_NZ_CODE; so it will not be able to read
 | |
|       Q_AUTO_INCREMENT*, Q_CHARSET and so replication will fail silently in
 | |
|       various ways. Documented that you should not mix alpha/beta versions if
 | |
|       they are not exactly the same version, with example of 5.0.3->5.0.2 and
 | |
|       5.0.4->5.0.3. If replication is from older to new, the new will
 | |
|       recognize Q_CATALOG_CODE and have no problem.
 | |
|     */
 | |
|   }
 | |
|   if (auto_increment_increment != 1 || auto_increment_offset != 1)
 | |
|   {
 | |
|     *start++= Q_AUTO_INCREMENT;
 | |
|     int2store(start, auto_increment_increment);
 | |
|     int2store(start+2, auto_increment_offset);
 | |
|     start+= 4;
 | |
|   }
 | |
|   if (charset_inited)
 | |
|   {
 | |
|     *start++= Q_CHARSET_CODE;
 | |
|     memcpy(start, charset, 6);
 | |
|     start+= 6;
 | |
|   }
 | |
|   if (time_zone_len)
 | |
|   {
 | |
|     /* In the TZ sys table, column Name is of length 64 so this should be ok */
 | |
|     DBUG_ASSERT(time_zone_len <= MAX_TIME_ZONE_NAME_LENGTH);
 | |
|     store_str_with_code_and_len(&start,
 | |
|                                 time_zone_str, time_zone_len, Q_TIME_ZONE_CODE);
 | |
|   }
 | |
|   if (lc_time_names_number)
 | |
|   {
 | |
|     DBUG_ASSERT(lc_time_names_number <= 0xFFFF);
 | |
|     *start++= Q_LC_TIME_NAMES_CODE;
 | |
|     int2store(start, lc_time_names_number);
 | |
|     start+= 2;
 | |
|   }
 | |
|   if (charset_database_number)
 | |
|   {
 | |
|     DBUG_ASSERT(charset_database_number <= 0xFFFF);
 | |
|     *start++= Q_CHARSET_DATABASE_CODE;
 | |
|     int2store(start, charset_database_number);
 | |
|     start+= 2;
 | |
|   }
 | |
|   if (table_map_for_update)
 | |
|   {
 | |
|     *start++= Q_TABLE_MAP_FOR_UPDATE_CODE;
 | |
|     int8store(start, table_map_for_update);
 | |
|     start+= 8;
 | |
|   }
 | |
|   if (master_data_written != 0)
 | |
|   {
 | |
|     /*
 | |
|       Q_MASTER_DATA_WRITTEN_CODE only exists in relay logs where the master
 | |
|       has binlog_version<4 and the slave has binlog_version=4. See comment
 | |
|       for master_data_written in log_event.h for details.
 | |
|     */
 | |
|     *start++= Q_MASTER_DATA_WRITTEN_CODE;
 | |
|     int4store(start, master_data_written);
 | |
|     start+= 4;
 | |
|   }
 | |
| 
 | |
|   if (thd && thd->need_binlog_invoker())
 | |
|   {
 | |
|     LEX_CSTRING user;
 | |
|     LEX_CSTRING host;
 | |
|     memset(&user, 0, sizeof(user));
 | |
|     memset(&host, 0, sizeof(host));
 | |
| 
 | |
|     if (thd->slave_thread && thd->has_invoker())
 | |
|     {
 | |
|       /* user will be null, if master is older than this patch */
 | |
|       user= thd->get_invoker_user();
 | |
|       host= thd->get_invoker_host();
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       Security_context *ctx= thd->security_ctx;
 | |
| 
 | |
|       if (thd->need_binlog_invoker() == THD::INVOKER_USER)
 | |
|       {
 | |
|         user.str= ctx->priv_user;
 | |
|         host.str= ctx->priv_host;
 | |
|         host.length= strlen(host.str);
 | |
|       }
 | |
|       else
 | |
|       {
 | |
|         user.str= ctx->priv_role;
 | |
|         host= empty_clex_str;
 | |
|       }
 | |
|       user.length= strlen(user.str);
 | |
|     }
 | |
| 
 | |
|     if (user.length > 0)
 | |
|     {
 | |
|       *start++= Q_INVOKER;
 | |
| 
 | |
|       /*
 | |
|         Store user length and user. The max length of use is 16, so 1 byte is
 | |
|         enough to store the user's length.
 | |
|        */
 | |
|       *start++= (uchar)user.length;
 | |
|       memcpy(start, user.str, user.length);
 | |
|       start+= user.length;
 | |
| 
 | |
|       /*
 | |
|         Store host length and host. The max length of host is 60, so 1 byte is
 | |
|         enough to store the host's length.
 | |
|        */
 | |
|       *start++= (uchar)host.length;
 | |
|       memcpy(start, host.str, host.length);
 | |
|       start+= host.length;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   if (thd && thd->query_start_sec_part_used)
 | |
|   {
 | |
|     *start++= Q_HRNOW;
 | |
|     get_time();
 | |
|     int3store(start, when_sec_part);
 | |
|     start+= 3;
 | |
|   }
 | |
| 
 | |
|   /* xid's is used with ddl_log handling */
 | |
|   if (thd && thd->binlog_xid)
 | |
|   {
 | |
|     *start++= Q_XID;
 | |
|     int8store(start, thd->binlog_xid);
 | |
|     start+= 8;
 | |
|   }
 | |
| 
 | |
|   /*
 | |
|     NOTE: When adding new status vars, please don't forget to update
 | |
|     the MAX_SIZE_LOG_EVENT_STATUS in log_event.h and update the function
 | |
|     code_name() in this file.
 | |
|    
 | |
|     Here there could be code like
 | |
|     if (command-line-option-which-says-"log_this_variable" && inited)
 | |
|     {
 | |
|     *start++= Q_THIS_VARIABLE_CODE;
 | |
|     int4store(start, this_variable);
 | |
|     start+= 4;
 | |
|     }
 | |
|   */
 | |
|   
 | |
|   /* Store length of status variables */
 | |
|   status_vars_len= (uint) (start-start_of_status);
 | |
|   DBUG_ASSERT(status_vars_len <= MAX_SIZE_LOG_EVENT_STATUS);
 | |
|   int2store(buf + Q_STATUS_VARS_LEN_OFFSET, status_vars_len);
 | |
| 
 | |
|   /*
 | |
|     Calculate length of whole event
 | |
|     The "1" below is the \0 in the db's length
 | |
|   */
 | |
|   event_length= ((uint) (start-buf) + get_post_header_size_for_derived() +
 | |
|                  db_len + 1 + q_len);
 | |
| 
 | |
|   return write_header(event_length) ||
 | |
|          write_data(buf, QUERY_HEADER_LEN) ||
 | |
|          write_post_header_for_derived() ||
 | |
|          write_data(start_of_status, (uint) status_vars_len) ||
 | |
|          write_data(db, db_len + 1) ||
 | |
|          write_data(query, q_len) ||
 | |
|          write_footer();
 | |
| }
 | |
| 
 | |
| bool Query_compressed_log_event::write()
 | |
| {
 | |
|   uchar *buffer;
 | |
|   uint32 alloc_size, compressed_size;
 | |
|   bool ret= true;
 | |
| 
 | |
|   compressed_size= alloc_size= binlog_get_compress_len(q_len);
 | |
|   buffer= (uchar*) my_safe_alloca(alloc_size);
 | |
|   if (buffer &&
 | |
|       !binlog_buf_compress((uchar*) query, buffer, q_len, &compressed_size))
 | |
|   {
 | |
|     /*
 | |
|       Write the compressed event. We have to temporarily store the event
 | |
|       in query and q_len as Query_log_event::write() uses these.
 | |
|     */
 | |
|     const char *query_tmp= query;
 | |
|     uint32 q_len_tmp= q_len;
 | |
|     query= (char*) buffer;
 | |
|     q_len= compressed_size;
 | |
|     ret= Query_log_event::write();
 | |
|     query= query_tmp;
 | |
|     q_len= q_len_tmp;
 | |
|   }
 | |
|   my_safe_afree(buffer, alloc_size);
 | |
|   return ret;
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|   The simplest constructor that could possibly work.  This is used for
 | |
|   creating static objects that have a special meaning and are invisible
 | |
|   to the log.  
 | |
| */
 | |
| Query_log_event::Query_log_event()
 | |
|   :Log_event(), data_buf(0)
 | |
| {
 | |
|   memset(&user, 0, sizeof(user));
 | |
|   memset(&host, 0, sizeof(host));
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   SYNOPSIS
 | |
|     Query_log_event::Query_log_event()
 | |
|       thd_arg           - thread handle
 | |
|       query_arg         - array of char representing the query
 | |
|       query_length      - size of the  `query_arg' array
 | |
|       using_trans       - there is a modified transactional table
 | |
|       direct            - Don't cache statement
 | |
|       suppress_use      - suppress the generation of 'USE' statements
 | |
|       errcode           - the error code of the query
 | |
|       
 | |
|   DESCRIPTION
 | |
|   Creates an event for binlogging
 | |
|   The value for `errcode' should be supplied by caller.
 | |
| */
 | |
| Query_log_event::Query_log_event(THD* thd_arg, const char* query_arg,
 | |
|                                  size_t query_length, bool using_trans,
 | |
| 				 bool direct, bool suppress_use, int errcode)
 | |
| 
 | |
|   :Log_event(thd_arg,
 | |
|              (thd_arg->thread_specific_used ? LOG_EVENT_THREAD_SPECIFIC_F :
 | |
|               0) |
 | |
|              (suppress_use ? LOG_EVENT_SUPPRESS_USE_F : 0),
 | |
| 	     using_trans),
 | |
|    data_buf(0), query(query_arg), catalog(thd_arg->catalog),
 | |
|    q_len((uint32) query_length),
 | |
|    thread_id(thd_arg->thread_id),
 | |
|    /* save the original thread id; we already know the server id */
 | |
|    slave_proxy_id((ulong)thd_arg->variables.pseudo_thread_id),
 | |
|    flags2_inited(1), sql_mode_inited(1), charset_inited(1), flags2(0),
 | |
|    sql_mode(thd_arg->variables.sql_mode),
 | |
|    auto_increment_increment(thd_arg->variables.auto_increment_increment),
 | |
|    auto_increment_offset(thd_arg->variables.auto_increment_offset),
 | |
|    lc_time_names_number(thd_arg->variables.lc_time_names->number),
 | |
|    charset_database_number(0),
 | |
|    table_map_for_update((ulonglong)thd_arg->table_map_for_update),
 | |
|    master_data_written(0)
 | |
| {
 | |
|   /* status_vars_len is set just before writing the event */
 | |
| 
 | |
|   time_t end_time;
 | |
| 
 | |
| #ifdef WITH_WSREP
 | |
|   /*
 | |
|     If Query_log_event will contain non trans keyword (not BEGIN, COMMIT,
 | |
|     SAVEPOINT or ROLLBACK) we disable PA for this transaction.
 | |
|     Note that here WSREP(thd) might not be true e.g. when wsrep_shcema
 | |
|     is created we create tables with thd->variables.wsrep_on=false
 | |
|     to avoid replicating wsrep_schema tables to other nodes.
 | |
|    */
 | |
|   if (WSREP_ON && !is_trans_keyword(false))
 | |
|   {
 | |
|     thd->wsrep_PA_safe= false;
 | |
|   }
 | |
| #endif /* WITH_WSREP */
 | |
| 
 | |
|   memset(&user, 0, sizeof(user));
 | |
|   memset(&host, 0, sizeof(host));
 | |
|   error_code= errcode;
 | |
| 
 | |
|   end_time= my_time(0);
 | |
|   exec_time = (ulong) (end_time  - thd_arg->start_time);
 | |
|   /**
 | |
|     @todo this means that if we have no catalog, then it is replicated
 | |
|     as an existing catalog of length zero. is that safe? /sven
 | |
|   */
 | |
|   catalog_len = (catalog) ? (uint32) strlen(catalog) : 0;
 | |
| 
 | |
|   if (!(db= thd->db.str))
 | |
|     db= "";
 | |
|   db_len= (uint32) strlen(db);
 | |
|   if (thd_arg->variables.collation_database != thd_arg->db_charset)
 | |
|     charset_database_number= thd_arg->variables.collation_database->number;
 | |
|   
 | |
|   /*
 | |
|     We only replicate over the bits of flags2 that we need: the rest
 | |
|     are masked out by "& OPTIONS_WRITTEN_TO_BINLOG".
 | |
| 
 | |
|     We also force AUTOCOMMIT=1.  Rationale (cf. BUG#29288): After
 | |
|     fixing BUG#26395, we always write BEGIN and COMMIT around all
 | |
|     transactions (even single statements in autocommit mode).  This is
 | |
|     so that replication from non-transactional to transactional table
 | |
|     and error recovery from XA to non-XA table should work as
 | |
|     expected.  The BEGIN/COMMIT are added in log.cc. However, there is
 | |
|     one exception: MyISAM bypasses log.cc and writes directly to the
 | |
|     binlog.  So if autocommit is off, master has MyISAM, and slave has
 | |
|     a transactional engine, then the slave will just see one long
 | |
|     never-ending transaction.  The only way to bypass explicit
 | |
|     BEGIN/COMMIT in the binlog is by using a non-transactional table.
 | |
|     So setting AUTOCOMMIT=1 will make this work as expected.
 | |
| 
 | |
|     Note: explicitly replicate AUTOCOMMIT=1 from master. We do not
 | |
|     assume AUTOCOMMIT=1 on slave; the slave still reads the state of
 | |
|     the autocommit flag as written by the master to the binlog. This
 | |
|     behavior may change after WL#4162 has been implemented.
 | |
|   */
 | |
|   flags2= (uint32) (thd_arg->variables.option_bits &
 | |
|                     (OPTIONS_WRITTEN_TO_BIN_LOG & ~OPTION_NOT_AUTOCOMMIT));
 | |
|   DBUG_ASSERT(thd_arg->variables.character_set_client->number < 256*256);
 | |
|   DBUG_ASSERT(thd_arg->variables.collation_connection->number < 256*256);
 | |
|   DBUG_ASSERT(thd_arg->variables.collation_server->number < 256*256);
 | |
|   DBUG_ASSERT(thd_arg->variables.character_set_client->mbminlen == 1);
 | |
|   int2store(charset, thd_arg->variables.character_set_client->number);
 | |
|   int2store(charset+2, thd_arg->variables.collation_connection->number);
 | |
|   int2store(charset+4, thd_arg->variables.collation_server->number);
 | |
|   if (thd_arg->time_zone_used)
 | |
|   {
 | |
|     /*
 | |
|       Note that our event becomes dependent on the Time_zone object
 | |
|       representing the time zone. Fortunately such objects are never deleted
 | |
|       or changed during mysqld's lifetime.
 | |
|     */
 | |
|     time_zone_len= thd_arg->variables.time_zone->get_name()->length();
 | |
|     time_zone_str= thd_arg->variables.time_zone->get_name()->ptr();
 | |
|   }
 | |
|   else
 | |
|     time_zone_len= 0;
 | |
| 
 | |
|   LEX *lex= thd->lex;
 | |
|   /*
 | |
|     Defines that the statement will be written directly to the binary log
 | |
|     without being wrapped by a BEGIN...COMMIT. Otherwise, the statement
 | |
|     will be written to either the trx-cache or stmt-cache.
 | |
| 
 | |
|     Note that a cache will not be used if the parameter direct is TRUE.
 | |
|   */
 | |
|   bool use_cache= FALSE;
 | |
|   /*
 | |
|     TRUE defines that the trx-cache must be used and by consequence the
 | |
|     use_cache is TRUE.
 | |
| 
 | |
|     Note that a cache will not be used if the parameter direct is TRUE.
 | |
|   */
 | |
|   bool trx_cache= FALSE;
 | |
|   cache_type= Log_event::EVENT_INVALID_CACHE;
 | |
| 
 | |
|   if (!direct)
 | |
|   {
 | |
|     switch (lex->sql_command)
 | |
|     {
 | |
|       case SQLCOM_DROP_TABLE:
 | |
|       case SQLCOM_DROP_SEQUENCE:
 | |
|         use_cache= (lex->tmp_table() && thd->in_multi_stmt_transaction_mode());
 | |
|         break;
 | |
| 
 | |
|       case SQLCOM_CREATE_TABLE:
 | |
|       case SQLCOM_CREATE_SEQUENCE:
 | |
|         /*
 | |
|            If we are using CREATE ... SELECT or if we are a slave
 | |
|            executing BEGIN...COMMIT (generated by CREATE...SELECT) we
 | |
|            have to use the transactional cache to ensure we don't
 | |
|            calculate any checksum for the CREATE part.
 | |
|          */
 | |
|         trx_cache= (lex->first_select_lex()->item_list.elements &&
 | |
|             thd->is_current_stmt_binlog_format_row()) ||
 | |
|           (thd->variables.option_bits & OPTION_GTID_BEGIN);
 | |
|         use_cache= (lex->tmp_table() &&
 | |
|             thd->in_multi_stmt_transaction_mode()) || trx_cache;
 | |
|         break;
 | |
|       case SQLCOM_SET_OPTION:
 | |
|         if (lex->autocommit)
 | |
|           use_cache= trx_cache= FALSE;
 | |
|         else
 | |
|           use_cache= TRUE;
 | |
|         break;
 | |
|       case SQLCOM_RELEASE_SAVEPOINT:
 | |
|       case SQLCOM_ROLLBACK_TO_SAVEPOINT:
 | |
|       case SQLCOM_SAVEPOINT:
 | |
|       case SQLCOM_XA_END:
 | |
|         use_cache= trx_cache= TRUE;
 | |
|         break;
 | |
|       default:
 | |
|         use_cache= sqlcom_can_generate_row_events(thd);
 | |
|         break;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   if (!use_cache || direct)
 | |
|   {
 | |
|     cache_type= Log_event::EVENT_NO_CACHE;
 | |
|   }
 | |
|   else if (using_trans || trx_cache || stmt_has_updated_trans_table(thd) ||
 | |
|            thd->lex->is_mixed_stmt_unsafe(thd->in_multi_stmt_transaction_mode(),
 | |
|                                           thd->variables.binlog_direct_non_trans_update,
 | |
|                                           trans_has_updated_trans_table(thd),
 | |
|                                           thd->tx_isolation))
 | |
|     cache_type= Log_event::EVENT_TRANSACTIONAL_CACHE;
 | |
|   else
 | |
|     cache_type= Log_event::EVENT_STMT_CACHE;
 | |
|   DBUG_ASSERT(cache_type != Log_event::EVENT_INVALID_CACHE);
 | |
|   DBUG_PRINT("info",("Query_log_event has flags2: %lu  sql_mode: %llu  cache_tye: %d",
 | |
|                      (ulong) flags2, sql_mode, cache_type));
 | |
| }
 | |
| 
 | |
| Query_compressed_log_event::Query_compressed_log_event(THD* thd_arg, const char* query_arg,
 | |
|     ulong query_length, bool using_trans,
 | |
|     bool direct, bool suppress_use, int errcode)
 | |
|     :Query_log_event(thd_arg, query_arg, query_length, using_trans, direct,
 | |
|                      suppress_use, errcode),
 | |
|      query_buf(0)
 | |
| {
 | |
| 
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| int Query_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   return do_apply_event(rgi, query, q_len);
 | |
| }
 | |
| 
 | |
| /**
 | |
|    Compare if two errors should be regarded as equal.
 | |
|    This is to handle the case when you can get slightly different errors
 | |
|    on master and slave for the same thing.
 | |
|    @param
 | |
|    expected_error	Error we got on master
 | |
|    actual_error		Error we got on slave
 | |
| 
 | |
|    @return
 | |
|    1 Errors are equal
 | |
|    0 Errors are different
 | |
| */
 | |
| 
 | |
| bool test_if_equal_repl_errors(int expected_error, int actual_error)
 | |
| {
 | |
|   if (expected_error == actual_error)
 | |
|     return 1;
 | |
|   switch (expected_error) {
 | |
|   case ER_DUP_ENTRY:
 | |
|   case ER_DUP_ENTRY_WITH_KEY_NAME:
 | |
|   case ER_DUP_KEY:
 | |
|   case ER_AUTOINC_READ_FAILED:
 | |
|     return (actual_error == ER_DUP_ENTRY ||
 | |
|             actual_error == ER_DUP_ENTRY_WITH_KEY_NAME ||
 | |
|             actual_error == ER_DUP_KEY ||
 | |
|             actual_error == ER_AUTOINC_READ_FAILED ||
 | |
|             actual_error == HA_ERR_AUTOINC_ERANGE);
 | |
|   case ER_UNKNOWN_TABLE:
 | |
|     return actual_error == ER_IT_IS_A_VIEW;
 | |
|   default:
 | |
|     break;
 | |
|   }
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|   @todo
 | |
|   Compare the values of "affected rows" around here. Something
 | |
|   like:
 | |
|   @code
 | |
|      if ((uint32) affected_in_event != (uint32) affected_on_slave)
 | |
|      {
 | |
|      sql_print_error("Slave: did not get the expected number of affected \
 | |
|      rows running query from master - expected %d, got %d (this numbers \
 | |
|      should have matched modulo 4294967296).", 0, ...);
 | |
|      thd->query_error = 1;
 | |
|      }
 | |
|   @endcode
 | |
|   We may also want an option to tell the slave to ignore "affected"
 | |
|   mismatch. This mismatch could be implemented with a new ER_ code, and
 | |
|   to ignore it you would use --slave-skip-errors...
 | |
| */
 | |
| int Query_log_event::do_apply_event(rpl_group_info *rgi,
 | |
|                                     const char *query_arg, uint32 q_len_arg)
 | |
| {
 | |
|   int expected_error,actual_error= 0;
 | |
|   Schema_specification_st db_options;
 | |
|   uint64 sub_id= 0;
 | |
|   void *hton= NULL;
 | |
|   rpl_gtid gtid;
 | |
|   Relay_log_info const *rli= rgi->rli;
 | |
|   Rpl_filter *rpl_filter= rli->mi->rpl_filter;
 | |
|   bool current_stmt_is_commit;
 | |
|   DBUG_ENTER("Query_log_event::do_apply_event");
 | |
| 
 | |
|   /*
 | |
|     Colleagues: please never free(thd->catalog) in MySQL. This would
 | |
|     lead to bugs as here thd->catalog is a part of an alloced block,
 | |
|     not an entire alloced block (see
 | |
|     Query_log_event::do_apply_event()). Same for thd->db.  Thank
 | |
|     you.
 | |
|   */
 | |
|   thd->catalog= catalog_len ? (char *) catalog : (char *)"";
 | |
| 
 | |
|   size_t valid_len= Well_formed_prefix(system_charset_info,
 | |
|                                        db, db_len, NAME_LEN).length();
 | |
| 
 | |
|   if (valid_len != db_len)
 | |
|   {
 | |
|     rli->report(ERROR_LEVEL, ER_SLAVE_FATAL_ERROR,
 | |
|                 ER_THD(thd, ER_SLAVE_FATAL_ERROR),
 | |
|                 "Invalid database name in Query event.");
 | |
|     thd->is_slave_error= true;
 | |
|     goto end;
 | |
|   }
 | |
| 
 | |
|   set_thd_db(thd, rpl_filter, db, db_len);
 | |
| 
 | |
|   /*
 | |
|     Setting the character set and collation of the current database thd->db.
 | |
|    */
 | |
|   load_db_opt_by_name(thd, thd->db.str, &db_options);
 | |
|   if (db_options.default_table_charset)
 | |
|     thd->db_charset= db_options.default_table_charset;
 | |
|   thd->variables.auto_increment_increment= auto_increment_increment;
 | |
|   thd->variables.auto_increment_offset=    auto_increment_offset;
 | |
| 
 | |
|   DBUG_PRINT("info", ("log_pos: %lu", (ulong) log_pos));
 | |
| 
 | |
|   thd->clear_error(1);
 | |
|   current_stmt_is_commit= is_commit();
 | |
| 
 | |
|   DBUG_ASSERT(!current_stmt_is_commit || !rgi->tables_to_lock);
 | |
|   rgi->slave_close_thread_tables(thd);
 | |
| 
 | |
|   /*
 | |
|     Note:   We do not need to execute reset_one_shot_variables() if this
 | |
|             db_ok() test fails.
 | |
|     Reason: The db stored in binlog events is the same for SET and for
 | |
|             its companion query.  If the SET is ignored because of
 | |
|             db_ok(), the companion query will also be ignored, and if
 | |
|             the companion query is ignored in the db_ok() test of
 | |
|             ::do_apply_event(), then the companion SET also have so
 | |
|             we don't need to reset_one_shot_variables().
 | |
|   */
 | |
|   if (rpl_filter->is_db_empty() ||
 | |
|       is_trans_keyword(
 | |
|           (rgi->gtid_ev_flags2 & (Gtid_log_event::FL_PREPARED_XA |
 | |
|                                   Gtid_log_event::FL_COMPLETED_XA))) ||
 | |
|       rpl_filter->db_ok(thd->db.str))
 | |
|   {
 | |
|     thd->set_time(when, when_sec_part);
 | |
|     thd->set_query_and_id((char*)query_arg, q_len_arg,
 | |
|                           thd->charset(), next_query_id());
 | |
|     thd->variables.pseudo_thread_id= thread_id;		// for temp tables
 | |
|     DBUG_PRINT("query",("%s", thd->query()));
 | |
| 
 | |
| #ifdef WITH_WSREP
 | |
|     if (WSREP(thd))
 | |
|     {
 | |
|       WSREP_DEBUG("Query_log_event thread=%llu for query=%s",
 | |
| 		  thd_get_thread_id(thd), wsrep_thd_query(thd));
 | |
|     }
 | |
| #endif
 | |
| 
 | |
|     if (unlikely(!(expected_error= error_code)) ||
 | |
|         ignored_error_code(expected_error) ||
 | |
|         !unexpected_error_code(expected_error))
 | |
|     {
 | |
|       thd->slave_expected_error= expected_error;
 | |
|       if (flags2_inited)
 | |
|       {
 | |
|         ulonglong mask= flags2_inited;
 | |
|         thd->variables.option_bits= (flags2 & mask) |
 | |
|                                     (thd->variables.option_bits & ~mask);
 | |
|       }
 | |
|       /*
 | |
|         else, we are in a 3.23/4.0 binlog; we previously received a
 | |
|         Rotate_log_event which reset thd->variables.option_bits and
 | |
|         sql_mode etc, so nothing to do.
 | |
|       */
 | |
|       /*
 | |
|         We do not replicate MODE_NO_DIR_IN_CREATE. That is, if the master is a
 | |
|         slave which runs with SQL_MODE=MODE_NO_DIR_IN_CREATE, this should not
 | |
|         force us to ignore the dir too. Imagine you are a ring of machines, and
 | |
|         one has a disk problem so that you temporarily need
 | |
|         MODE_NO_DIR_IN_CREATE on this machine; you don't want it to propagate
 | |
|         elsewhere (you don't want all slaves to start ignoring the dirs).
 | |
|       */
 | |
|       if (sql_mode_inited)
 | |
|         thd->variables.sql_mode=
 | |
|           (sql_mode_t) ((thd->variables.sql_mode & MODE_NO_DIR_IN_CREATE) |
 | |
|                         (sql_mode & ~(sql_mode_t) MODE_NO_DIR_IN_CREATE));
 | |
|       if (charset_inited)
 | |
|       {
 | |
|         rpl_sql_thread_info *sql_info= thd->system_thread_info.rpl_sql_info;
 | |
|         if (sql_info->cached_charset_compare(charset))
 | |
|         {
 | |
|           /* Verify that we support the charsets found in the event. */
 | |
|           if (!(thd->variables.character_set_client=
 | |
|                 get_charset(uint2korr(charset), MYF(MY_WME))) ||
 | |
|               !(thd->variables.collation_connection=
 | |
|                 get_charset(uint2korr(charset+2), MYF(MY_WME))) ||
 | |
|               !(thd->variables.collation_server=
 | |
|                 get_charset(uint2korr(charset+4), MYF(MY_WME))))
 | |
|           {
 | |
|             /*
 | |
|               We updated the thd->variables with nonsensical values (0). Let's
 | |
|               set them to something safe (i.e. which avoids crash), and we'll
 | |
|               stop with EE_UNKNOWN_CHARSET in compare_errors (unless set to
 | |
|               ignore this error).
 | |
|             */
 | |
|             set_slave_thread_default_charset(thd, rgi);
 | |
|             goto compare_errors;
 | |
|           }
 | |
|           thd->update_charset(); // for the charset change to take effect
 | |
|           /*
 | |
|             Reset thd->query_string.cs to the newly set value.
 | |
|             Note, there is a small flaw here. For a very short time frame
 | |
|             if the new charset is different from the old charset and
 | |
|             if another thread executes "SHOW PROCESSLIST" after
 | |
|             the above thd->set_query_and_id() and before this thd->set_query(),
 | |
|             and if the current query has some non-ASCII characters,
 | |
|             the another thread may see some '?' marks in the PROCESSLIST
 | |
|             result. This should be acceptable now. This is a reminder
 | |
|             to fix this if any refactoring happens here sometime.
 | |
|           */
 | |
|           thd->set_query((char*) query_arg, q_len_arg, thd->charset());
 | |
|         }
 | |
|       }
 | |
|       if (time_zone_len)
 | |
|       {
 | |
|         String tmp(time_zone_str, time_zone_len, &my_charset_bin);
 | |
|         if (!(thd->variables.time_zone= my_tz_find(thd, &tmp)))
 | |
|         {
 | |
|           my_error(ER_UNKNOWN_TIME_ZONE, MYF(0), tmp.c_ptr());
 | |
|           thd->variables.time_zone= global_system_variables.time_zone;
 | |
|           goto compare_errors;
 | |
|         }
 | |
|       }
 | |
|       if (lc_time_names_number)
 | |
|       {
 | |
|         if (!(thd->variables.lc_time_names=
 | |
|               my_locale_by_number(lc_time_names_number)))
 | |
|         {
 | |
|           my_printf_error(ER_UNKNOWN_ERROR,
 | |
|                       "Unknown locale: '%d'", MYF(0), lc_time_names_number);
 | |
|           thd->variables.lc_time_names= &my_locale_en_US;
 | |
|           goto compare_errors;
 | |
|         }
 | |
|       }
 | |
|       else
 | |
|         thd->variables.lc_time_names= &my_locale_en_US;
 | |
|       if (charset_database_number)
 | |
|       {
 | |
|         CHARSET_INFO *cs;
 | |
|         if (!(cs= get_charset(charset_database_number, MYF(0))))
 | |
|         {
 | |
|           char buf[20];
 | |
|           int10_to_str((int) charset_database_number, buf, -10);
 | |
|           my_error(ER_UNKNOWN_COLLATION, MYF(0), buf);
 | |
|           goto compare_errors;
 | |
|         }
 | |
|         thd->variables.collation_database= cs;
 | |
|       }
 | |
|       else
 | |
|         thd->variables.collation_database= thd->db_charset;
 | |
| 
 | |
|       {
 | |
|         const CHARSET_INFO *cs= thd->charset();
 | |
|         /*
 | |
|           We cannot ask for parsing a statement using a character set
 | |
|           without state_maps (parser internal data).
 | |
|         */
 | |
|         if (!cs->state_map)
 | |
|         {
 | |
|           rli->report(ERROR_LEVEL, ER_SLAVE_FATAL_ERROR,
 | |
|                       ER_THD(thd, ER_SLAVE_FATAL_ERROR),
 | |
|                       "character_set cannot be parsed");
 | |
|           thd->is_slave_error= true;
 | |
|           goto end;
 | |
|         }
 | |
|       }
 | |
| 
 | |
|       /*
 | |
|         Record any GTID in the same transaction, so slave state is
 | |
|         transactionally consistent.
 | |
|       */
 | |
|       if (current_stmt_is_commit)
 | |
|       {
 | |
|         thd->variables.option_bits&= ~OPTION_GTID_BEGIN;
 | |
|         if (rgi->gtid_pending)
 | |
|         {
 | |
|           sub_id= rgi->gtid_sub_id;
 | |
|           rgi->gtid_pending= false;
 | |
| 
 | |
|           gtid= rgi->current_gtid;
 | |
|           if (unlikely(rpl_global_gtid_slave_state->record_gtid(thd, >id,
 | |
|                                                                 sub_id,
 | |
|                                                                 true, false,
 | |
|                                                                 &hton)))
 | |
|           {
 | |
|             int errcode= thd->get_stmt_da()->sql_errno();
 | |
|             if (!is_parallel_retry_error(rgi, errcode))
 | |
|               rli->report(ERROR_LEVEL, ER_CANNOT_UPDATE_GTID_STATE,
 | |
|                           rgi->gtid_info(),
 | |
|                           "Error during COMMIT: failed to update GTID state in "
 | |
|                         "%s.%s: %d: %s",
 | |
|                           "mysql", rpl_gtid_slave_state_table_name.str,
 | |
|                           errcode,
 | |
|                           thd->get_stmt_da()->message());
 | |
|             sub_id= 0;
 | |
|             thd->is_slave_error= 1;
 | |
|             goto end;
 | |
|           }
 | |
|         }
 | |
|       }
 | |
| 
 | |
|       thd->table_map_for_update= (table_map)table_map_for_update;
 | |
|       thd->set_invoker(&user, &host);
 | |
|       /*
 | |
|         Flag if we need to rollback the statement transaction on
 | |
|         slave if it by chance succeeds.
 | |
|         If we expected a non-zero error code and get nothing and,
 | |
|         it is a concurrency issue or ignorable issue, effects
 | |
|         of the statement should be rolled back.
 | |
|       */
 | |
|       if (unlikely(expected_error) &&
 | |
|           (ignored_error_code(expected_error) ||
 | |
|            concurrency_error_code(expected_error)))
 | |
|       {
 | |
|         thd->variables.option_bits|= OPTION_MASTER_SQL_ERROR;
 | |
|         thd->variables.option_bits&= ~OPTION_GTID_BEGIN;
 | |
|       }
 | |
|       /* Execute the query (note that we bypass dispatch_command()) */
 | |
|       Parser_state parser_state;
 | |
|       if (!parser_state.init(thd, thd->query(), thd->query_length()))
 | |
|       {
 | |
|         DBUG_ASSERT(thd->m_digest == NULL);
 | |
|         thd->m_digest= & thd->m_digest_state;
 | |
|         DBUG_ASSERT(thd->m_statement_psi == NULL);
 | |
|         thd->m_statement_psi= MYSQL_START_STATEMENT(&thd->m_statement_state,
 | |
|                                                     stmt_info_rpl.m_key,
 | |
|                                                     thd->db.str, thd->db.length,
 | |
|                                                     thd->charset(), NULL);
 | |
|         THD_STAGE_INFO(thd, stage_starting);
 | |
|         MYSQL_SET_STATEMENT_TEXT(thd->m_statement_psi, thd->query(), thd->query_length());
 | |
|         if (thd->m_digest != NULL)
 | |
|           thd->m_digest->reset(thd->m_token_array, max_digest_length);
 | |
| 
 | |
|          if (thd->slave_thread)
 | |
|          {
 | |
|            /*
 | |
|              To be compatible with previous releases, the slave thread uses the global
 | |
|              log_slow_disabled_statements value, wich can be changed dynamically, so we
 | |
|              have to set the sql_log_slow respectively.
 | |
|            */
 | |
|            thd->variables.sql_log_slow= !MY_TEST(global_system_variables.log_slow_disabled_statements & LOG_SLOW_DISABLE_SLAVE);
 | |
|          }
 | |
| 
 | |
|         mysql_parse(thd, thd->query(), thd->query_length(), &parser_state);
 | |
|         /* Finalize server status flags after executing a statement. */
 | |
|         thd->update_server_status();
 | |
|         log_slow_statement(thd);
 | |
|         thd->lex->restore_set_statement_var();
 | |
| 
 | |
|         /*
 | |
|           When THD::slave_expected_error gets reset inside execution stack
 | |
|           that is the case of to be ignored event. In this case the expected
 | |
|           error must change to the reset value as well.
 | |
|         */
 | |
|         expected_error= thd->slave_expected_error;
 | |
|       }
 | |
| 
 | |
|       thd->variables.option_bits&= ~OPTION_MASTER_SQL_ERROR;
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       /*
 | |
|         The query got a really bad error on the master (thread killed etc),
 | |
|         which could be inconsistent. Parse it to test the table names: if the
 | |
|         replicate-*-do|ignore-table rules say "this query must be ignored" then
 | |
|         we exit gracefully; otherwise we warn about the bad error and tell DBA
 | |
|         to check/fix it.
 | |
|       */
 | |
|       if (mysql_test_parse_for_slave(thd, thd->query(), thd->query_length()))
 | |
|         thd->clear_error(1);
 | |
|       else
 | |
|       {
 | |
|         rli->report(ERROR_LEVEL, expected_error, rgi->gtid_info(),
 | |
|                           "\
 | |
| Query partially completed on the master (error on master: %d) \
 | |
| and was aborted. There is a chance that your master is inconsistent at this \
 | |
| point. If you are sure that your master is ok, run this query manually on the \
 | |
| slave and then restart the slave with SET GLOBAL SQL_SLAVE_SKIP_COUNTER=1; \
 | |
| START SLAVE; . Query: '%s'", expected_error, thd->query());
 | |
|         thd->is_slave_error= 1;
 | |
|       }
 | |
|       goto end;
 | |
|     }
 | |
| 
 | |
|     /* If the query was not ignored, it is printed to the general log */
 | |
|     if (likely(!thd->is_error()) ||
 | |
|         thd->get_stmt_da()->sql_errno() != ER_SLAVE_IGNORED_TABLE)
 | |
|       general_log_write(thd, COM_QUERY, thd->query(), thd->query_length());
 | |
|     else
 | |
|     {
 | |
|       /*
 | |
|         Bug#54201: If we skip an INSERT query that uses auto_increment, then we
 | |
|         should reset any @@INSERT_ID set by an Intvar_log_event associated with
 | |
|         the query; otherwise the @@INSERT_ID will linger until the next INSERT
 | |
|         that uses auto_increment and may affect extra triggers on the slave etc.
 | |
| 
 | |
|         We reset INSERT_ID unconditionally; it is probably cheaper than
 | |
|         checking if it is necessary.
 | |
|       */
 | |
|       thd->auto_inc_intervals_forced.empty();
 | |
|     }
 | |
| 
 | |
| compare_errors:
 | |
|     /*
 | |
|       In the slave thread, we may sometimes execute some DROP / * 40005
 | |
|       TEMPORARY * / TABLE that come from parts of binlogs (likely if we
 | |
|       use RESET SLAVE or CHANGE MASTER TO), while the temporary table
 | |
|       has already been dropped. To ignore such irrelevant "table does
 | |
|       not exist errors", we silently clear the error if TEMPORARY was used.
 | |
|     */
 | |
|     if ((thd->lex->sql_command == SQLCOM_DROP_TABLE ||
 | |
|          thd->lex->sql_command == SQLCOM_DROP_SEQUENCE) &&
 | |
|         thd->lex->tmp_table() &&
 | |
|         thd->is_error() && thd->get_stmt_da()->sql_errno() == ER_BAD_TABLE_ERROR &&
 | |
|         !expected_error)
 | |
|       thd->get_stmt_da()->reset_diagnostics_area();
 | |
|     /*
 | |
|       If we expected a non-zero error code, and we don't get the same error
 | |
|       code, and it should be ignored or is related to a concurrency issue.
 | |
|     */
 | |
|     actual_error= thd->is_error() ? thd->get_stmt_da()->sql_errno() : 0;
 | |
|     DBUG_PRINT("info",("expected_error: %d  sql_errno: %d",
 | |
|                        expected_error, actual_error));
 | |
| 
 | |
|     if ((unlikely(expected_error) &&
 | |
|          !test_if_equal_repl_errors(expected_error, actual_error) &&
 | |
|          !concurrency_error_code(expected_error)) &&
 | |
|         !ignored_error_code(actual_error) &&
 | |
|         !ignored_error_code(expected_error))
 | |
|     {
 | |
|       rli->report(ERROR_LEVEL, 0, rgi->gtid_info(),
 | |
|                   "Query caused different errors on master and slave.     "
 | |
|                   "Error on master: message (format)='%s' error code=%d ; "
 | |
|                   "Error on slave: actual message='%s', error code=%d. "
 | |
|                   "Default database: '%s'. Query: '%s'",
 | |
|                   ER_THD(thd, expected_error),
 | |
|                   expected_error,
 | |
|                   actual_error ? thd->get_stmt_da()->message() : "no error",
 | |
|                   actual_error,
 | |
|                   print_slave_db_safe(db), query_arg);
 | |
|       thd->is_slave_error= 1;
 | |
|     }
 | |
|     /*
 | |
|       If we get the same error code as expected and it is not a concurrency
 | |
|       issue, or should be ignored.
 | |
|     */
 | |
|     else if ((test_if_equal_repl_errors(expected_error, actual_error) &&
 | |
|               !concurrency_error_code(expected_error)) ||
 | |
|              ignored_error_code(actual_error))
 | |
|     {
 | |
|       DBUG_PRINT("info",("error ignored"));
 | |
|       thd->clear_error(1);
 | |
|       if (actual_error == ER_QUERY_INTERRUPTED ||
 | |
|           actual_error == ER_CONNECTION_KILLED)
 | |
|         thd->reset_killed();
 | |
|     }
 | |
|     else if (actual_error == ER_XAER_NOTA && !rpl_filter->db_ok(get_db()))
 | |
|     {
 | |
|       /*
 | |
|         If there is an XA query whos XID cannot be found, if the replication
 | |
|         filter is active and filters the target database, assume that the XID
 | |
|         cache has been cleared (e.g. by server restart) since it was prepared,
 | |
|         so we can just ignore this event.
 | |
|       */
 | |
|       thd->clear_error(1);
 | |
|     }
 | |
|     /*
 | |
|       Other cases: mostly we expected no error and get one.
 | |
|     */
 | |
|     else if (unlikely(thd->is_slave_error || thd->is_fatal_error))
 | |
|     {
 | |
|       if (!is_parallel_retry_error(rgi, actual_error))
 | |
|         rli->report(ERROR_LEVEL, actual_error, rgi->gtid_info(),
 | |
|                     "Error '%s' on query. Default database: '%s'. Query: '%s'",
 | |
|                     (actual_error ? thd->get_stmt_da()->message() :
 | |
|                      "unexpected success or fatal error"),
 | |
|                     thd->get_db(), query_arg);
 | |
|       thd->is_slave_error= 1;
 | |
| #ifdef WITH_WSREP
 | |
|       if (wsrep_thd_is_toi(thd) && wsrep_must_ignore_error(thd))
 | |
|       {
 | |
|         thd->clear_error(1);
 | |
|         thd->killed= NOT_KILLED;
 | |
|         thd->wsrep_has_ignored_error= true;
 | |
|       }
 | |
| #endif /* WITH_WSREP */
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|       TODO: compare the values of "affected rows" around here. Something
 | |
|       like:
 | |
|       if ((uint32) affected_in_event != (uint32) affected_on_slave)
 | |
|       {
 | |
|       sql_print_error("Slave: did not get the expected number of affected \
 | |
|       rows running query from master - expected %d, got %d (this numbers \
 | |
|       should have matched modulo 4294967296).", 0, ...);
 | |
|       thd->is_slave_error = 1;
 | |
|       }
 | |
|       We may also want an option to tell the slave to ignore "affected"
 | |
|       mismatch. This mismatch could be implemented with a new ER_ code, and
 | |
|       to ignore it you would use --slave-skip-errors...
 | |
| 
 | |
|       To do the comparison we need to know the value of "affected" which the
 | |
|       above mysql_parse() computed. And we need to know the value of
 | |
|       "affected" in the master's binlog. Both will be implemented later. The
 | |
|       important thing is that we now have the format ready to log the values
 | |
|       of "affected" in the binlog. So we can release 5.0.0 before effectively
 | |
|       logging "affected" and effectively comparing it.
 | |
|     */
 | |
|   } /* End of if (db_ok(... */
 | |
| 
 | |
|   {
 | |
|     /**
 | |
|       The following failure injecion works in cooperation with tests
 | |
|       setting @@global.debug= 'd,stop_slave_middle_group'.
 | |
|       The sql thread receives the killed status and will proceed
 | |
|       to shutdown trying to finish incomplete events group.
 | |
|     */
 | |
|     DBUG_EXECUTE_IF("stop_slave_middle_group",
 | |
|                     if (!current_stmt_is_commit && is_begin() == 0)
 | |
|                     {
 | |
|                       if (thd->transaction->all.modified_non_trans_table)
 | |
|                         const_cast<Relay_log_info*>(rli)->abort_slave= 1;
 | |
|                     };);
 | |
|   }
 | |
| 
 | |
| end:
 | |
|   if (unlikely(sub_id && !thd->is_slave_error))
 | |
|     rpl_global_gtid_slave_state->update_state_hash(sub_id, >id, hton, rgi);
 | |
| 
 | |
|   /*
 | |
|     Probably we have set thd->query, thd->db, thd->catalog to point to places
 | |
|     in the data_buf of this event. Now the event is going to be deleted
 | |
|     probably, so data_buf will be freed, so the thd->... listed above will be
 | |
|     pointers to freed memory.
 | |
|     So we must set them to 0, so that those bad pointers values are not later
 | |
|     used. Note that "cleanup" queries like automatic DROP TEMPORARY TABLE
 | |
|     don't suffer from these assignments to 0 as DROP TEMPORARY
 | |
|     TABLE uses the db.table syntax.
 | |
|   */
 | |
|   thd->catalog= 0;
 | |
|   thd->set_db(&null_clex_str);    /* will free the current database */
 | |
|   thd->reset_query();
 | |
|   DBUG_PRINT("info", ("end: query= 0"));
 | |
| 
 | |
|   /* Mark the statement completed. */
 | |
|   MYSQL_END_STATEMENT(thd->m_statement_psi, thd->get_stmt_da());
 | |
|   thd->m_statement_psi= NULL;
 | |
|   thd->m_digest= NULL;
 | |
| 
 | |
|   /*
 | |
|     As a disk space optimization, future masters will not log an event for
 | |
|     LAST_INSERT_ID() if that function returned 0 (and thus they will be able
 | |
|     to replace the THD::stmt_depends_on_first_successful_insert_id_in_prev_stmt
 | |
|     variable by (THD->first_successful_insert_id_in_prev_stmt > 0) ; with the
 | |
|     resetting below we are ready to support that.
 | |
|   */
 | |
|   thd->first_successful_insert_id_in_prev_stmt_for_binlog= 0;
 | |
|   thd->first_successful_insert_id_in_prev_stmt= 0;
 | |
|   thd->stmt_depends_on_first_successful_insert_id_in_prev_stmt= 0;
 | |
|   free_root(thd->mem_root,MYF(MY_KEEP_PREALLOC));
 | |
|   DBUG_RETURN(thd->is_slave_error);
 | |
| }
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Query_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   Relay_log_info *rli= rgi->rli;
 | |
|   DBUG_ENTER("Query_log_event::do_shall_skip");
 | |
|   DBUG_PRINT("debug", ("query: '%s'  q_len: %d", query, q_len));
 | |
|   DBUG_ASSERT(query && q_len > 0);
 | |
|   DBUG_ASSERT(thd == rgi->thd);
 | |
| 
 | |
|   /*
 | |
|     An event skipped due to @@skip_replication must not be counted towards the
 | |
|     number of events to be skipped due to @@sql_slave_skip_counter.
 | |
|   */
 | |
|   if (flags & LOG_EVENT_SKIP_REPLICATION_F &&
 | |
|       opt_replicate_events_marked_for_skip != RPL_SKIP_REPLICATE)
 | |
|     DBUG_RETURN(Log_event::EVENT_SKIP_IGNORE);
 | |
| 
 | |
|   if (rli->slave_skip_counter > 0)
 | |
|   {
 | |
|     if (is_begin())
 | |
|     {
 | |
|       thd->variables.option_bits|= OPTION_BEGIN | OPTION_GTID_BEGIN;
 | |
|       DBUG_RETURN(Log_event::continue_group(rgi));
 | |
|     }
 | |
| 
 | |
|     if (is_commit() || is_rollback())
 | |
|     {
 | |
|       thd->variables.option_bits&= ~(OPTION_BEGIN | OPTION_GTID_BEGIN);
 | |
|       DBUG_RETURN(Log_event::EVENT_SKIP_COUNT);
 | |
|     }
 | |
|   }
 | |
| #ifdef WITH_WSREP
 | |
|   else if (WSREP(thd) && wsrep_mysql_replication_bundle &&
 | |
|            opt_slave_domain_parallel_threads == 0 &&
 | |
|            thd->wsrep_mysql_replicated > 0 &&
 | |
|            (is_begin() || is_commit()))
 | |
|   {
 | |
|     if (++thd->wsrep_mysql_replicated < (int)wsrep_mysql_replication_bundle)
 | |
|     {
 | |
|       WSREP_DEBUG("skipping wsrep commit %d", thd->wsrep_mysql_replicated);
 | |
|       DBUG_RETURN(Log_event::EVENT_SKIP_IGNORE);
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       thd->wsrep_mysql_replicated = 0;
 | |
|     }
 | |
|   }
 | |
| #endif /* WITH_WSREP */
 | |
|   DBUG_RETURN(Log_event::do_shall_skip(rgi));
 | |
| }
 | |
| 
 | |
| 
 | |
| bool
 | |
| Query_log_event::peek_is_commit_rollback(const uchar *event_start,
 | |
|                                          size_t event_len,
 | |
|                                          enum enum_binlog_checksum_alg
 | |
|                                          checksum_alg)
 | |
| {
 | |
|   if (checksum_alg == BINLOG_CHECKSUM_ALG_CRC32)
 | |
|   {
 | |
|     if (event_len > BINLOG_CHECKSUM_LEN)
 | |
|       event_len-= BINLOG_CHECKSUM_LEN;
 | |
|     else
 | |
|       event_len= 0;
 | |
|   }
 | |
|   else
 | |
|     DBUG_ASSERT(checksum_alg == BINLOG_CHECKSUM_ALG_UNDEF ||
 | |
|                 checksum_alg == BINLOG_CHECKSUM_ALG_OFF);
 | |
| 
 | |
|   if (event_len < LOG_EVENT_HEADER_LEN + QUERY_HEADER_LEN || event_len < 9)
 | |
|     return false;
 | |
|   return !memcmp(event_start + (event_len-7), "\0COMMIT", 7) ||
 | |
|          !memcmp(event_start + (event_len-9), "\0ROLLBACK", 9);
 | |
| }
 | |
| 
 | |
| #endif
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Start_log_event_v3 methods
 | |
| **************************************************************************/
 | |
| 
 | |
| Start_log_event_v3::Start_log_event_v3()
 | |
|   :Log_event(), created(0), binlog_version(BINLOG_VERSION),
 | |
|    dont_set_created(0)
 | |
| {
 | |
|   memcpy(server_version, ::server_version, ST_SERVER_VER_LEN);
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Start_log_event_v3::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf[12 + ST_SERVER_VER_LEN + 14 + 22], *pos;
 | |
|   pos= strmov(buf, "Server ver: ");
 | |
|   pos= strmov(pos, server_version);
 | |
|   pos= strmov(pos, ", Binlog ver: ");
 | |
|   pos= int10_to_str(binlog_version, pos, 10);
 | |
|   protocol->store(buf, (uint) (pos-buf), &my_charset_bin);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| bool Start_log_event_v3::write()
 | |
| {
 | |
|   char buff[START_V3_HEADER_LEN];
 | |
|   int2store(buff + ST_BINLOG_VER_OFFSET,binlog_version);
 | |
|   memcpy(buff + ST_SERVER_VER_OFFSET,server_version,ST_SERVER_VER_LEN);
 | |
|   if (!dont_set_created)
 | |
|     created= get_time(); // this sets when and when_sec_part as a side effect
 | |
|   int4store(buff + ST_CREATED_OFFSET,created);
 | |
|   return write_header(sizeof(buff)) ||
 | |
|          write_data(buff, sizeof(buff)) ||
 | |
|          write_footer();
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| /**
 | |
|   Start_log_event_v3::do_apply_event() .
 | |
|   The master started
 | |
| 
 | |
|     IMPLEMENTATION
 | |
|     - To handle the case where the master died without having time to write
 | |
|     DROP TEMPORARY TABLE, DO RELEASE_LOCK (prepared statements' deletion is
 | |
|     TODO), we clean up all temporary tables that we got, if we are sure we
 | |
|     can (see below).
 | |
| 
 | |
|   @todo
 | |
|     - Remove all active user locks.
 | |
|     Guilhem 2003-06: this is true but not urgent: the worst it can cause is
 | |
|     the use of a bit of memory for a user lock which will not be used
 | |
|     anymore. If the user lock is later used, the old one will be released. In
 | |
|     other words, no deadlock problem.
 | |
| */
 | |
| 
 | |
| int Start_log_event_v3::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   DBUG_ENTER("Start_log_event_v3::do_apply_event");
 | |
|   int error= 0;
 | |
|   Relay_log_info *rli= rgi->rli;
 | |
| 
 | |
|   switch (binlog_version)
 | |
|   {
 | |
|   case 3:
 | |
|   case 4:
 | |
|     /*
 | |
|       This can either be 4.x (then a Start_log_event_v3 is only at master
 | |
|       startup so we are sure the master has restarted and cleared his temp
 | |
|       tables; the event always has 'created'>0) or 5.0 (then we have to test
 | |
|       'created').
 | |
|     */
 | |
|     if (created)
 | |
|     {
 | |
|       rli->close_temporary_tables();
 | |
|       
 | |
|       /*
 | |
|         The following is only false if we get here with a BINLOG statement
 | |
|       */
 | |
|       if (rli->mi)
 | |
|         cleanup_load_tmpdir(&rli->mi->cmp_connection_name);
 | |
|     }
 | |
|     break;
 | |
| 
 | |
|     /*
 | |
|        Now the older formats; in that case load_tmpdir is cleaned up by the I/O
 | |
|        thread.
 | |
|     */
 | |
|   case 1:
 | |
|     if (strncmp(rli->relay_log.description_event_for_exec->server_version,
 | |
|                 "3.23.57",7) >= 0 && created)
 | |
|     {
 | |
|       /*
 | |
|         Can distinguish, based on the value of 'created': this event was
 | |
|         generated at master startup.
 | |
|       */
 | |
|       rli->close_temporary_tables();
 | |
|     }
 | |
|     /*
 | |
|       Otherwise, can't distinguish a Start_log_event generated at
 | |
|       master startup and one generated by master FLUSH LOGS, so cannot
 | |
|       be sure temp tables have to be dropped. So do nothing.
 | |
|     */
 | |
|     break;
 | |
|   default:
 | |
|     /*
 | |
|       This case is not expected. It can be either an event corruption or an
 | |
|       unsupported binary log version.
 | |
|     */
 | |
|     rli->report(ERROR_LEVEL, ER_SLAVE_FATAL_ERROR,
 | |
|                 ER_THD(thd, ER_SLAVE_FATAL_ERROR),
 | |
|                 "Binlog version not supported");
 | |
|     DBUG_RETURN(1);
 | |
|   }
 | |
|   DBUG_RETURN(error);
 | |
| }
 | |
| #endif /* defined(HAVE_REPLICATION) */
 | |
| 
 | |
| /***************************************************************************
 | |
|        Format_description_log_event methods
 | |
| ****************************************************************************/
 | |
| 
 | |
| bool Format_description_log_event::write()
 | |
| {
 | |
|   bool ret;
 | |
|   bool no_checksum;
 | |
|   /*
 | |
|     We don't call Start_log_event_v3::write() because this would make 2
 | |
|     my_b_safe_write().
 | |
|   */
 | |
|   uchar buff[START_V3_HEADER_LEN+1];
 | |
|   size_t rec_size= sizeof(buff) + BINLOG_CHECKSUM_ALG_DESC_LEN +
 | |
|                    number_of_event_types;
 | |
|   int2store(buff + ST_BINLOG_VER_OFFSET,binlog_version);
 | |
|   memcpy((char*) buff + ST_SERVER_VER_OFFSET,server_version,ST_SERVER_VER_LEN);
 | |
|   if (!dont_set_created)
 | |
|     created= get_time();
 | |
|   int4store(buff + ST_CREATED_OFFSET,created);
 | |
|   buff[ST_COMMON_HEADER_LEN_OFFSET]= common_header_len;
 | |
|   /*
 | |
|     if checksum is requested
 | |
|     record the checksum-algorithm descriptor next to
 | |
|     post_header_len vector which will be followed by the checksum value.
 | |
|     Master is supposed to trigger checksum computing by binlog_checksum_options,
 | |
|     slave does it via marking the event according to
 | |
|     FD_queue checksum_alg value.
 | |
|   */
 | |
|   compile_time_assert(BINLOG_CHECKSUM_ALG_DESC_LEN == 1);
 | |
| #ifdef DBUG_ASSERT_EXISTS
 | |
|   data_written= 0; // to prepare for need_checksum assert
 | |
| #endif
 | |
|   uint8 checksum_byte= (uint8)
 | |
|     (need_checksum() ? checksum_alg : BINLOG_CHECKSUM_ALG_OFF);
 | |
|   /* 
 | |
|      FD of checksum-aware server is always checksum-equipped, (V) is in,
 | |
|      regardless of @@global.binlog_checksum policy.
 | |
|      Thereby a combination of (A) == 0, (V) != 0 means
 | |
|      it's the checksum-aware server's FD event that heads checksum-free binlog
 | |
|      file. 
 | |
|      Here 0 stands for checksumming OFF to evaluate (V) as 0 is that case.
 | |
|      A combination of (A) != 0, (V) != 0 denotes FD of the checksum-aware server
 | |
|      heading the checksummed binlog.
 | |
|      (A), (V) presence in FD of the checksum-aware server makes the event
 | |
|      1 + 4 bytes bigger comparing to the former FD.
 | |
|   */
 | |
| 
 | |
|   if ((no_checksum= (checksum_alg == BINLOG_CHECKSUM_ALG_OFF)))
 | |
|   {
 | |
|     checksum_alg= BINLOG_CHECKSUM_ALG_CRC32;  // Forcing (V) room to fill anyway
 | |
|   }
 | |
|   ret= write_header(rec_size) ||
 | |
|        write_data(buff, sizeof(buff)) ||
 | |
|        write_data(post_header_len, number_of_event_types) ||
 | |
|        write_data(&checksum_byte, sizeof(checksum_byte)) ||
 | |
|        write_footer();
 | |
|   if (no_checksum)
 | |
|     checksum_alg= BINLOG_CHECKSUM_ALG_OFF;
 | |
|   return ret;
 | |
| }
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| int Format_description_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   int ret= 0;
 | |
|   Relay_log_info *rli= rgi->rli;
 | |
|   DBUG_ENTER("Format_description_log_event::do_apply_event");
 | |
| 
 | |
|   /*
 | |
|     As a transaction NEVER spans on 2 or more binlogs:
 | |
|     if we have an active transaction at this point, the master died
 | |
|     while writing the transaction to the binary log, i.e. while
 | |
|     flushing the binlog cache to the binlog. XA guarantees that master has
 | |
|     rolled back. So we roll back.
 | |
|     Note: this event could be sent by the master to inform us of the
 | |
|     format of its binlog; in other words maybe it is not at its
 | |
|     original place when it comes to us; we'll know this by checking
 | |
|     log_pos ("artificial" events have log_pos == 0).
 | |
|   */
 | |
|   if (!thd->rli_fake &&
 | |
|       !is_artificial_event() && created && thd->transaction->all.ha_list)
 | |
|   {
 | |
|     /* This is not an error (XA is safe), just an information */
 | |
|     rli->report(INFORMATION_LEVEL, 0, NULL,
 | |
|                 "Rolling back unfinished transaction (no COMMIT "
 | |
|                 "or ROLLBACK in relay log). A probable cause is that "
 | |
|                 "the master died while writing the transaction to "
 | |
|                 "its binary log, thus rolled back too."); 
 | |
|     rgi->cleanup_context(thd, 1);
 | |
|   }
 | |
| 
 | |
|   /*
 | |
|     If this event comes from ourselves, there is no cleaning task to
 | |
|     perform, we don't call Start_log_event_v3::do_apply_event()
 | |
|     (this was just to update the log's description event).
 | |
|   */
 | |
|   if (server_id != (uint32) global_system_variables.server_id)
 | |
|   {
 | |
|     /*
 | |
|       If the event was not requested by the slave i.e. the master sent
 | |
|       it while the slave asked for a position >4, the event will make
 | |
|       rli->group_master_log_pos advance. Say that the slave asked for
 | |
|       position 1000, and the Format_desc event's end is 96. Then in
 | |
|       the beginning of replication rli->group_master_log_pos will be
 | |
|       0, then 96, then jump to first really asked event (which is
 | |
|       >96). So this is ok.
 | |
|     */
 | |
|     ret= Start_log_event_v3::do_apply_event(rgi);
 | |
|   }
 | |
| 
 | |
|   if (!ret)
 | |
|   {
 | |
|     /* Save the information describing this binlog */
 | |
|     copy_crypto_data(rli->relay_log.description_event_for_exec);
 | |
|     delete rli->relay_log.description_event_for_exec;
 | |
|     rli->relay_log.description_event_for_exec= this;
 | |
|   }
 | |
| 
 | |
|   DBUG_RETURN(ret);
 | |
| }
 | |
| 
 | |
| int Format_description_log_event::do_update_pos(rpl_group_info *rgi)
 | |
| {
 | |
|   if (server_id == (uint32) global_system_variables.server_id)
 | |
|   {
 | |
|     /*
 | |
|       We only increase the relay log position if we are skipping
 | |
|       events and do not touch any group_* variables, nor flush the
 | |
|       relay log info.  If there is a crash, we will have to re-skip
 | |
|       the events again, but that is a minor issue.
 | |
| 
 | |
|       If we do not skip stepping the group log position (and the
 | |
|       server id was changed when restarting the server), it might well
 | |
|       be that we start executing at a position that is invalid, e.g.,
 | |
|       at a Rows_log_event or a Query_log_event preceeded by a
 | |
|       Intvar_log_event instead of starting at a Table_map_log_event or
 | |
|       the Intvar_log_event respectively.
 | |
|      */
 | |
|     rgi->inc_event_relay_log_pos();
 | |
|     return 0;
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     return Log_event::do_update_pos(rgi);
 | |
|   }
 | |
| }
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Format_description_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   return Log_event::EVENT_SKIP_NOT;
 | |
| }
 | |
| 
 | |
| #endif
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| int Start_encryption_log_event::do_apply_event(rpl_group_info* rgi)
 | |
| {
 | |
|   return rgi->rli->relay_log.description_event_for_exec->start_decryption(this);
 | |
| }
 | |
| 
 | |
| int Start_encryption_log_event::do_update_pos(rpl_group_info *rgi)
 | |
| {
 | |
|   /*
 | |
|     master never sends Start_encryption_log_event, any SELE that a slave
 | |
|     might see was created locally in MYSQL_BIN_LOG::open() on the slave
 | |
|   */
 | |
|   rgi->inc_event_relay_log_pos();
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| #endif
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
|       Load_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| bool Load_log_event::print_query(THD *thd, bool need_db, const char *cs,
 | |
|                                  String *buf, my_off_t *fn_start,
 | |
|                                  my_off_t *fn_end, const char *qualify_db)
 | |
| {
 | |
|   if (need_db && db && db_len)
 | |
|   {
 | |
|     buf->append(STRING_WITH_LEN("use "));
 | |
|     append_identifier(thd, buf, db, db_len);
 | |
|     buf->append(STRING_WITH_LEN("; "));
 | |
|   }
 | |
| 
 | |
|   buf->append(STRING_WITH_LEN("LOAD DATA "));
 | |
| 
 | |
|   if (is_concurrent)
 | |
|     buf->append(STRING_WITH_LEN("CONCURRENT "));
 | |
| 
 | |
|   if (fn_start)
 | |
|     *fn_start= buf->length();
 | |
| 
 | |
|   if (check_fname_outside_temp_buf())
 | |
|     buf->append(STRING_WITH_LEN("LOCAL "));
 | |
|   buf->append(STRING_WITH_LEN("INFILE '"));
 | |
|   buf->append_for_single_quote(fname, fname_len);
 | |
|   buf->append(STRING_WITH_LEN("' "));
 | |
| 
 | |
|   if (sql_ex.opt_flags & REPLACE_FLAG)
 | |
|     buf->append(STRING_WITH_LEN("REPLACE "));
 | |
|   else if (sql_ex.opt_flags & IGNORE_FLAG)
 | |
|     buf->append(STRING_WITH_LEN("IGNORE "));
 | |
| 
 | |
|   buf->append(STRING_WITH_LEN("INTO"));
 | |
| 
 | |
|   if (fn_end)
 | |
|     *fn_end= buf->length();
 | |
| 
 | |
|   buf->append(STRING_WITH_LEN(" TABLE "));
 | |
|   if (qualify_db)
 | |
|   {
 | |
|     append_identifier(thd, buf, qualify_db, strlen(qualify_db));
 | |
|     buf->append(STRING_WITH_LEN("."));
 | |
|   }
 | |
|   append_identifier(thd, buf, table_name, table_name_len);
 | |
| 
 | |
|   if (cs != NULL)
 | |
|   {
 | |
|     buf->append(STRING_WITH_LEN(" CHARACTER SET "));
 | |
|     buf->append(cs, strlen(cs));
 | |
|   }
 | |
| 
 | |
|   /* We have to create all optional fields as the default is not empty */
 | |
|   buf->append(STRING_WITH_LEN(" FIELDS TERMINATED BY "));
 | |
|   pretty_print_str(buf, sql_ex.field_term, sql_ex.field_term_len);
 | |
|   if (sql_ex.opt_flags & OPT_ENCLOSED_FLAG)
 | |
|     buf->append(STRING_WITH_LEN(" OPTIONALLY "));
 | |
|   buf->append(STRING_WITH_LEN(" ENCLOSED BY "));
 | |
|   pretty_print_str(buf, sql_ex.enclosed, sql_ex.enclosed_len);
 | |
| 
 | |
|   buf->append(STRING_WITH_LEN(" ESCAPED BY "));
 | |
|   pretty_print_str(buf, sql_ex.escaped, sql_ex.escaped_len);
 | |
| 
 | |
|   buf->append(STRING_WITH_LEN(" LINES TERMINATED BY "));
 | |
|   pretty_print_str(buf, sql_ex.line_term, sql_ex.line_term_len);
 | |
|   if (sql_ex.line_start_len)
 | |
|   {
 | |
|     buf->append(STRING_WITH_LEN(" STARTING BY "));
 | |
|     pretty_print_str(buf, sql_ex.line_start, sql_ex.line_start_len);
 | |
|   }
 | |
| 
 | |
|   if ((long) skip_lines > 0)
 | |
|   {
 | |
|     buf->append(STRING_WITH_LEN(" IGNORE "));
 | |
|     buf->append_ulonglong(skip_lines);
 | |
|     buf->append(STRING_WITH_LEN(" LINES "));
 | |
|   }
 | |
| 
 | |
|   if (num_fields)
 | |
|   {
 | |
|     uint i;
 | |
|     const char *field= fields;
 | |
|     buf->append(STRING_WITH_LEN(" ("));
 | |
|     for (i = 0; i < num_fields; i++)
 | |
|     {
 | |
|       if (i)
 | |
|       {
 | |
|         /*
 | |
|           Yes, the space and comma is reversed here. But this is mostly dead
 | |
|           code, at most used when reading really old binlogs from old servers,
 | |
|           so better just leave it as is...
 | |
|         */
 | |
|         buf->append(STRING_WITH_LEN(" ,"));
 | |
|       }
 | |
|       append_identifier(thd, buf, field, field_lens[i]);
 | |
|       field+= field_lens[i]  + 1;
 | |
|     }
 | |
|     buf->append(STRING_WITH_LEN(")"));
 | |
|   }
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| 
 | |
| void Load_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char query_buffer[1024];
 | |
|   String query_str(query_buffer, sizeof(query_buffer), system_charset_info);
 | |
| 
 | |
|   query_str.length(0);
 | |
|   print_query(protocol->thd, TRUE, NULL, &query_str, 0, 0, NULL);
 | |
|   protocol->store(query_str.ptr(), query_str.length(), &my_charset_bin);
 | |
| }
 | |
| #endif /* defined(HAVE_REPLICATION) */
 | |
| 
 | |
| 
 | |
| bool Load_log_event::write_data_header()
 | |
| {
 | |
|   char buf[LOAD_HEADER_LEN];
 | |
|   int4store(buf + L_THREAD_ID_OFFSET, slave_proxy_id);
 | |
|   int4store(buf + L_EXEC_TIME_OFFSET, exec_time);
 | |
|   int4store(buf + L_SKIP_LINES_OFFSET, skip_lines);
 | |
|   buf[L_TBL_LEN_OFFSET] = (char)table_name_len;
 | |
|   buf[L_DB_LEN_OFFSET] = (char)db_len;
 | |
|   int4store(buf + L_NUM_FIELDS_OFFSET, num_fields);
 | |
|   return write_data(buf, LOAD_HEADER_LEN) != 0;
 | |
| }
 | |
| 
 | |
| 
 | |
| bool Load_log_event::write_data_body()
 | |
| {
 | |
|   if (sql_ex.write_data(writer))
 | |
|     return 1;
 | |
|   if (num_fields && fields && field_lens)
 | |
|   {
 | |
|     if (write_data(field_lens, num_fields) ||
 | |
| 	write_data(fields, field_block_len))
 | |
|       return 1;
 | |
|   }
 | |
|   return (write_data(table_name, table_name_len + 1) ||
 | |
| 	  write_data(db, db_len + 1) ||
 | |
| 	  write_data(fname, fname_len));
 | |
| }
 | |
| 
 | |
| 
 | |
| Load_log_event::Load_log_event(THD *thd_arg, const sql_exchange *ex,
 | |
| 			       const char *db_arg, const char *table_name_arg,
 | |
| 			       List<Item> &fields_arg,
 | |
|                                bool is_concurrent_arg,
 | |
| 			       enum enum_duplicates handle_dup,
 | |
| 			       bool ignore, bool using_trans)
 | |
|   :Log_event(thd_arg,
 | |
|              thd_arg->thread_specific_used ? LOG_EVENT_THREAD_SPECIFIC_F : 0,
 | |
|              using_trans),
 | |
|    thread_id(thd_arg->thread_id),
 | |
|    slave_proxy_id((ulong)thd_arg->variables.pseudo_thread_id),
 | |
|    num_fields(0),fields(0),
 | |
|    field_lens(0),field_block_len(0),
 | |
|    table_name(table_name_arg ? table_name_arg : ""),
 | |
|    db(db_arg), fname(ex->file_name), local_fname(FALSE),
 | |
|    is_concurrent(is_concurrent_arg)
 | |
| {
 | |
|   time_t end_time;
 | |
|   time(&end_time);
 | |
|   exec_time = (ulong) (end_time  - thd_arg->start_time);
 | |
|   /* db can never be a zero pointer in 4.0 */
 | |
|   db_len = (uint32) strlen(db);
 | |
|   table_name_len = (uint32) strlen(table_name);
 | |
|   fname_len = (fname) ? (uint) strlen(fname) : 0;
 | |
|   sql_ex.field_term = ex->field_term->ptr();
 | |
|   sql_ex.field_term_len = (uint8) ex->field_term->length();
 | |
|   sql_ex.enclosed = ex->enclosed->ptr();
 | |
|   sql_ex.enclosed_len = (uint8) ex->enclosed->length();
 | |
|   sql_ex.line_term = ex->line_term->ptr();
 | |
|   sql_ex.line_term_len = (uint8) ex->line_term->length();
 | |
|   sql_ex.line_start = ex->line_start->ptr();
 | |
|   sql_ex.line_start_len = (uint8) ex->line_start->length();
 | |
|   sql_ex.escaped = ex->escaped->ptr();
 | |
|   sql_ex.escaped_len = (uint8) ex->escaped->length();
 | |
|   sql_ex.opt_flags = 0;
 | |
|   sql_ex.cached_new_format = -1;
 | |
|     
 | |
|   if (ex->dumpfile)
 | |
|     sql_ex.opt_flags|= DUMPFILE_FLAG;
 | |
|   if (ex->opt_enclosed)
 | |
|     sql_ex.opt_flags|= OPT_ENCLOSED_FLAG;
 | |
| 
 | |
|   sql_ex.empty_flags= 0;
 | |
| 
 | |
|   switch (handle_dup) {
 | |
|   case DUP_REPLACE:
 | |
|     sql_ex.opt_flags|= REPLACE_FLAG;
 | |
|     break;
 | |
|   case DUP_UPDATE:				// Impossible here
 | |
|   case DUP_ERROR:
 | |
|     break;	
 | |
|   }
 | |
|   if (ignore)
 | |
|     sql_ex.opt_flags|= IGNORE_FLAG;
 | |
| 
 | |
|   if (!ex->field_term->length())
 | |
|     sql_ex.empty_flags |= FIELD_TERM_EMPTY;
 | |
|   if (!ex->enclosed->length())
 | |
|     sql_ex.empty_flags |= ENCLOSED_EMPTY;
 | |
|   if (!ex->line_term->length())
 | |
|     sql_ex.empty_flags |= LINE_TERM_EMPTY;
 | |
|   if (!ex->line_start->length())
 | |
|     sql_ex.empty_flags |= LINE_START_EMPTY;
 | |
|   if (!ex->escaped->length())
 | |
|     sql_ex.empty_flags |= ESCAPED_EMPTY;
 | |
|     
 | |
|   skip_lines = ex->skip_lines;
 | |
| 
 | |
|   List_iterator<Item> li(fields_arg);
 | |
|   field_lens_buf.length(0);
 | |
|   fields_buf.length(0);
 | |
|   Item* item;
 | |
|   while ((item = li++))
 | |
|   {
 | |
|     num_fields++;
 | |
|     uchar len= (uchar) item->name.length;
 | |
|     field_block_len += len + 1;
 | |
|     fields_buf.append(item->name.str, len + 1);
 | |
|     field_lens_buf.append((char*)&len, 1);
 | |
|   }
 | |
| 
 | |
|   field_lens = (const uchar*)field_lens_buf.ptr();
 | |
|   fields = fields_buf.ptr();
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|   Load_log_event::set_fields()
 | |
| 
 | |
|   @note
 | |
|     This function can not use the member variable 
 | |
|     for the database, since LOAD DATA INFILE on the slave
 | |
|     can be for a different database than the current one.
 | |
|     This is the reason for the affected_db argument to this method.
 | |
| */
 | |
| 
 | |
| void Load_log_event::set_fields(const char* affected_db, 
 | |
| 				List<Item> &field_list,
 | |
|                                 Name_resolution_context *context)
 | |
| {
 | |
|   uint i;
 | |
|   const char* field = fields;
 | |
|   for (i= 0; i < num_fields; i++)
 | |
|   {
 | |
|     LEX_CSTRING field_name= {field, field_lens[i] };
 | |
|     field_list.push_back(new (thd->mem_root)
 | |
|                          Item_field(thd, context,
 | |
|                                     Lex_cstring_strlen(affected_db),
 | |
|                                     Lex_cstring_strlen(table_name),
 | |
|                                     field_name),
 | |
|                          thd->mem_root);
 | |
|     field+= field_lens[i]  + 1;
 | |
|   }
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| /**
 | |
|   Does the data loading job when executing a LOAD DATA on the slave.
 | |
| 
 | |
|   @param net
 | |
|   @param rli
 | |
|   @param use_rli_only_for_errors     If set to 1, rli is provided to
 | |
|                                      Load_log_event::exec_event only for this
 | |
|                                      function to have RPL_LOG_NAME and
 | |
|                                      rli->last_slave_error, both being used by
 | |
|                                      error reports. rli's position advancing
 | |
|                                      is skipped (done by the caller which is
 | |
|                                      Execute_load_log_event::exec_event).
 | |
|                                      If set to 0, rli is provided for full use,
 | |
|                                      i.e. for error reports and position
 | |
|                                      advancing.
 | |
| 
 | |
|   @todo
 | |
|     fix this; this can be done by testing rules in
 | |
|     Create_file_log_event::exec_event() and then discarding Append_block and
 | |
|     al.
 | |
|   @todo
 | |
|     this is a bug - this needs to be moved to the I/O thread
 | |
| 
 | |
|   @retval
 | |
|     0           Success
 | |
|   @retval
 | |
|     1           Failure
 | |
| */
 | |
| 
 | |
| int Load_log_event::do_apply_event(NET* net, rpl_group_info *rgi,
 | |
|                                    bool use_rli_only_for_errors)
 | |
| {
 | |
|   Relay_log_info const *rli= rgi->rli;
 | |
|   Rpl_filter *rpl_filter= rli->mi->rpl_filter;
 | |
|   DBUG_ENTER("Load_log_event::do_apply_event");
 | |
| 
 | |
|   DBUG_ASSERT(thd->query() == 0);
 | |
|   set_thd_db(thd, rpl_filter, db, db_len);
 | |
|   thd->clear_error(1);
 | |
| 
 | |
|   /* see Query_log_event::do_apply_event() and BUG#13360 */
 | |
|   DBUG_ASSERT(!rgi->m_table_map.count());
 | |
|   /*
 | |
|     Usually lex_start() is called by mysql_parse(), but we need it here
 | |
|     as the present method does not call mysql_parse().
 | |
|   */
 | |
|   lex_start(thd);
 | |
|   thd->lex->local_file= local_fname;
 | |
|   thd->reset_for_next_command(0);               // Errors are cleared above
 | |
| 
 | |
|   /*
 | |
|     We test replicate_*_db rules. Note that we have already prepared
 | |
|     the file to load, even if we are going to ignore and delete it
 | |
|     now. So it is possible that we did a lot of disk writes for
 | |
|     nothing. In other words, a big LOAD DATA INFILE on the master will
 | |
|     still consume a lot of space on the slave (space in the relay log
 | |
|     + space of temp files: twice the space of the file to load...)
 | |
|     even if it will finally be ignored.  TODO: fix this; this can be
 | |
|     done by testing rules in Create_file_log_event::do_apply_event()
 | |
|     and then discarding Append_block and al. Another way is do the
 | |
|     filtering in the I/O thread (more efficient: no disk writes at
 | |
|     all).
 | |
| 
 | |
|     Note:   We do not need to execute reset_one_shot_variables() if this
 | |
|             db_ok() test fails.
 | |
|     Reason: The db stored in binlog events is the same for SET and for
 | |
|             its companion query.  If the SET is ignored because of
 | |
|             db_ok(), the companion query will also be ignored, and if
 | |
|             the companion query is ignored in the db_ok() test of
 | |
|             ::do_apply_event(), then the companion SET also have so
 | |
|             we don't need to reset_one_shot_variables().
 | |
|   */
 | |
|   if (rpl_filter->db_ok(thd->db.str))
 | |
|   {
 | |
|     thd->set_time(when, when_sec_part);
 | |
|     thd->set_query_id(next_query_id());
 | |
|     thd->get_stmt_da()->opt_clear_warning_info(thd->query_id);
 | |
| 
 | |
|     TABLE_LIST tables;
 | |
|     LEX_CSTRING db_name= { thd->strmake(thd->db.str, thd->db.length), thd->db.length };
 | |
|     if (lower_case_table_names)
 | |
|       my_casedn_str(system_charset_info, (char *)table_name);
 | |
|     LEX_CSTRING tbl_name=   { table_name, strlen(table_name) };
 | |
|     tables.init_one_table(&db_name, &tbl_name, 0, TL_WRITE);
 | |
|     tables.updating= 1;
 | |
| 
 | |
|     // the table will be opened in mysql_load    
 | |
|     if (rpl_filter->is_on() && !rpl_filter->tables_ok(thd->db.str, &tables))
 | |
|     {
 | |
|       // TODO: this is a bug - this needs to be moved to the I/O thread
 | |
|       if (net)
 | |
|         skip_load_data_infile(net);
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       enum enum_duplicates handle_dup;
 | |
|       bool ignore= 0;
 | |
|       char query_buffer[1024];
 | |
|       String query_str(query_buffer, sizeof(query_buffer), system_charset_info);
 | |
|       char *load_data_query;
 | |
| 
 | |
|       query_str.length(0);
 | |
|       /*
 | |
|         Forge LOAD DATA INFILE query which will be used in SHOW PROCESS LIST
 | |
|         and written to slave's binlog if binlogging is on.
 | |
|       */
 | |
|       print_query(thd, FALSE, NULL, &query_str, NULL, NULL, NULL);
 | |
|       if (!(load_data_query= (char *)thd->strmake(query_str.ptr(),
 | |
|                                                   query_str.length())))
 | |
|       {
 | |
|         /*
 | |
|           This will set thd->fatal_error in case of OOM. So we surely will notice
 | |
|           that something is wrong.
 | |
|         */
 | |
|         goto error;
 | |
|       }
 | |
| 
 | |
|       thd->set_query(load_data_query, (uint) (query_str.length()));
 | |
| 
 | |
|       if (sql_ex.opt_flags & REPLACE_FLAG)
 | |
|         handle_dup= DUP_REPLACE;
 | |
|       else if (sql_ex.opt_flags & IGNORE_FLAG)
 | |
|       {
 | |
|         ignore= 1;
 | |
|         handle_dup= DUP_ERROR;
 | |
|       }
 | |
|       else
 | |
|       {
 | |
|         /*
 | |
|           When replication is running fine, if it was DUP_ERROR on the
 | |
|           master then we could choose IGNORE here, because if DUP_ERROR
 | |
|           suceeded on master, and data is identical on the master and slave,
 | |
|           then there should be no uniqueness errors on slave, so IGNORE is
 | |
|           the same as DUP_ERROR. But in the unlikely case of uniqueness errors
 | |
|           (because the data on the master and slave happen to be different
 | |
|           (user error or bug), we want LOAD DATA to print an error message on
 | |
|           the slave to discover the problem.
 | |
| 
 | |
|           If reading from net (a 3.23 master), mysql_load() will change this
 | |
|           to IGNORE.
 | |
|         */
 | |
|         handle_dup= DUP_ERROR;
 | |
|       }
 | |
|       /*
 | |
|         We need to set thd->lex->sql_command and thd->lex->duplicates
 | |
|         since InnoDB tests these variables to decide if this is a LOAD
 | |
|         DATA ... REPLACE INTO ... statement even though mysql_parse()
 | |
|         is not called.  This is not needed in 5.0 since there the LOAD
 | |
|         DATA ... statement is replicated using mysql_parse(), which
 | |
|         sets the thd->lex fields correctly.
 | |
|       */
 | |
|       thd->lex->sql_command= SQLCOM_LOAD;
 | |
|       thd->lex->duplicates= handle_dup;
 | |
| 
 | |
|       sql_exchange ex((char*)fname, sql_ex.opt_flags & DUMPFILE_FLAG);
 | |
|       String field_term(sql_ex.field_term,sql_ex.field_term_len,log_cs);
 | |
|       String enclosed(sql_ex.enclosed,sql_ex.enclosed_len,log_cs);
 | |
|       String line_term(sql_ex.line_term,sql_ex.line_term_len,log_cs);
 | |
|       String line_start(sql_ex.line_start,sql_ex.line_start_len,log_cs);
 | |
|       String escaped(sql_ex.escaped,sql_ex.escaped_len, log_cs);
 | |
|       ex.field_term= &field_term;
 | |
|       ex.enclosed= &enclosed;
 | |
|       ex.line_term= &line_term;
 | |
|       ex.line_start= &line_start;
 | |
|       ex.escaped= &escaped;
 | |
| 
 | |
|       ex.opt_enclosed = (sql_ex.opt_flags & OPT_ENCLOSED_FLAG);
 | |
|       if (sql_ex.empty_flags & FIELD_TERM_EMPTY)
 | |
|         ex.field_term->length(0);
 | |
| 
 | |
|       ex.skip_lines = skip_lines;
 | |
|       List<Item> field_list;
 | |
|       thd->lex->first_select_lex()->context.resolve_in_table_list_only(&tables);
 | |
|       set_fields(tables.db.str,
 | |
|                  field_list, &thd->lex->first_select_lex()->context);
 | |
|       thd->variables.pseudo_thread_id= thread_id;
 | |
|       if (net)
 | |
|       {
 | |
|         // mysql_load will use thd->net to read the file
 | |
|         thd->net.vio = net->vio;
 | |
|         // Make sure the client does not get confused about the packet sequence
 | |
|         thd->net.pkt_nr = net->pkt_nr;
 | |
|       }
 | |
|       /*
 | |
|         It is safe to use tmp_list twice because we are not going to
 | |
|         update it inside mysql_load().
 | |
|       */
 | |
|       List<Item> tmp_list;
 | |
|       if (thd->open_temporary_tables(&tables) ||
 | |
|           mysql_load(thd, &ex, &tables, field_list, tmp_list, tmp_list,
 | |
|                      handle_dup, ignore, net != 0))
 | |
|         thd->is_slave_error= 1;
 | |
|       if (thd->cuted_fields)
 | |
|       {
 | |
|         /* log_pos is the position of the LOAD event in the master log */
 | |
|         sql_print_warning("Slave: load data infile on table '%s' at "
 | |
|                           "log position %llu in log '%s' produced %ld "
 | |
|                           "warning(s). Default database: '%s'",
 | |
|                           (char*) table_name, log_pos, RPL_LOG_NAME,
 | |
|                           (ulong) thd->cuted_fields,
 | |
|                           thd->get_db());
 | |
|       }
 | |
|       if (net)
 | |
|         net->pkt_nr= thd->net.pkt_nr;
 | |
|     }
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     /*
 | |
|       We will just ask the master to send us /dev/null if we do not
 | |
|       want to load the data.
 | |
|       TODO: this a bug - needs to be done in I/O thread
 | |
|     */
 | |
|     if (net)
 | |
|       skip_load_data_infile(net);
 | |
|   }
 | |
| 
 | |
| error:
 | |
|   thd->net.vio = 0; 
 | |
|   const char *remember_db= thd->get_db();
 | |
|   thd->catalog= 0;
 | |
|   thd->set_db(&null_clex_str);     /* will free the current database */
 | |
|   thd->reset_query();
 | |
|   thd->get_stmt_da()->set_overwrite_status(true);
 | |
|   thd->is_error() ? trans_rollback_stmt(thd) : trans_commit_stmt(thd);
 | |
|   thd->variables.option_bits&= ~(OPTION_BEGIN | OPTION_GTID_BEGIN);
 | |
|   thd->get_stmt_da()->set_overwrite_status(false);
 | |
|   close_thread_tables(thd);
 | |
|   /*
 | |
|     - If transaction rollback was requested due to deadlock
 | |
|       perform it and release metadata locks.
 | |
|     - If inside a multi-statement transaction,
 | |
|     defer the release of metadata locks until the current
 | |
|     transaction is either committed or rolled back. This prevents
 | |
|     other statements from modifying the table for the entire
 | |
|     duration of this transaction.  This provides commit ordering
 | |
|     and guarantees serializability across multiple transactions.
 | |
|     - If in autocommit mode, or outside a transactional context,
 | |
|     automatically release metadata locks of the current statement.
 | |
|   */
 | |
|   if (thd->transaction_rollback_request)
 | |
|   {
 | |
|     trans_rollback_implicit(thd);
 | |
|     thd->release_transactional_locks();
 | |
|   }
 | |
|   else if (! thd->in_multi_stmt_transaction_mode())
 | |
|     thd->release_transactional_locks();
 | |
|   else
 | |
|     thd->mdl_context.release_statement_locks();
 | |
| 
 | |
|   DBUG_EXECUTE_IF("LOAD_DATA_INFILE_has_fatal_error",
 | |
|                   thd->is_slave_error= 0; thd->is_fatal_error= 1;);
 | |
| 
 | |
|   if (unlikely(thd->is_slave_error))
 | |
|   {
 | |
|     /* this err/sql_errno code is copy-paste from net_send_error() */
 | |
|     const char *err;
 | |
|     int sql_errno;
 | |
|     if (thd->is_error())
 | |
|     {
 | |
|       err= thd->get_stmt_da()->message();
 | |
|       sql_errno= thd->get_stmt_da()->sql_errno();
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       sql_errno=ER_UNKNOWN_ERROR;
 | |
|       err= ER_THD(thd, sql_errno);
 | |
|     }
 | |
|     rli->report(ERROR_LEVEL, sql_errno, rgi->gtid_info(), "\
 | |
| Error '%s' running LOAD DATA INFILE on table '%s'. Default database: '%s'",
 | |
|                     err, (char*)table_name, remember_db);
 | |
|     free_root(thd->mem_root,MYF(MY_KEEP_PREALLOC));
 | |
|     DBUG_RETURN(1);
 | |
|   }
 | |
|   free_root(thd->mem_root,MYF(MY_KEEP_PREALLOC));
 | |
| 
 | |
|   if (unlikely(thd->is_fatal_error))
 | |
|   {
 | |
|     char buf[256];
 | |
|     my_snprintf(buf, sizeof(buf),
 | |
|                 "Running LOAD DATA INFILE on table '%-.64s'."
 | |
|                 " Default database: '%-.64s'",
 | |
|                 (char*)table_name,
 | |
|                 remember_db);
 | |
| 
 | |
|     rli->report(ERROR_LEVEL, ER_SLAVE_FATAL_ERROR, rgi->gtid_info(),
 | |
|                 ER_THD(thd, ER_SLAVE_FATAL_ERROR), buf);
 | |
|     DBUG_RETURN(1);
 | |
|   }
 | |
| 
 | |
|   DBUG_RETURN( use_rli_only_for_errors ? 0 : Log_event::do_apply_event(rgi) );
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
|   Rotate_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Rotate_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   StringBuffer<256> tmp(log_cs);
 | |
|   tmp.length(0);
 | |
|   tmp.append(new_log_ident, ident_len);
 | |
|   tmp.append(STRING_WITH_LEN(";pos="));
 | |
|   tmp.append_ulonglong(pos);
 | |
|   protocol->store(tmp.ptr(), tmp.length(), &my_charset_bin);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| Rotate_log_event::Rotate_log_event(const char* new_log_ident_arg,
 | |
|                                    uint ident_len_arg, ulonglong pos_arg,
 | |
|                                    uint flags_arg)
 | |
|   :Log_event(), new_log_ident(new_log_ident_arg),
 | |
|    pos(pos_arg),ident_len(ident_len_arg ? ident_len_arg :
 | |
|                           (uint) strlen(new_log_ident_arg)), flags(flags_arg)
 | |
| {
 | |
|   DBUG_ENTER("Rotate_log_event::Rotate_log_event(...,flags)");
 | |
|   DBUG_PRINT("enter",("new_log_ident: %s  pos: %llu  flags: %lu", new_log_ident_arg,
 | |
|                       pos_arg, (ulong) flags));
 | |
|   cache_type= EVENT_NO_CACHE;
 | |
|   if (flags & DUP_NAME)
 | |
|     new_log_ident= my_strndup(PSI_INSTRUMENT_ME, new_log_ident_arg, ident_len, MYF(MY_WME));
 | |
|   if (flags & RELAY_LOG)
 | |
|     set_relay_log_event();
 | |
|   DBUG_VOID_RETURN;
 | |
| }
 | |
| 
 | |
| 
 | |
| bool Rotate_log_event::write()
 | |
| {
 | |
|   char buf[ROTATE_HEADER_LEN];
 | |
|   int8store(buf + R_POS_OFFSET, pos);
 | |
|   return (write_header(ROTATE_HEADER_LEN + ident_len) ||
 | |
|           write_data(buf, ROTATE_HEADER_LEN) ||
 | |
|           write_data(new_log_ident, (uint) ident_len) ||
 | |
|           write_footer());
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| /*
 | |
|   Got a rotate log event from the master.
 | |
| 
 | |
|   This is mainly used so that we can later figure out the logname and
 | |
|   position for the master.
 | |
| 
 | |
|   We can't rotate the slave's BINlog as this will cause infinitive rotations
 | |
|   in a A -> B -> A setup.
 | |
|   The NOTES below is a wrong comment which will disappear when 4.1 is merged.
 | |
| 
 | |
|   This must only be called from the Slave SQL thread, since it calls
 | |
|   Relay_log_info::flush().
 | |
| 
 | |
|   @retval
 | |
|     0	ok
 | |
|     1   error
 | |
| */
 | |
| int Rotate_log_event::do_update_pos(rpl_group_info *rgi)
 | |
| {
 | |
|   int error= 0;
 | |
|   Relay_log_info *rli= rgi->rli;
 | |
|   DBUG_ENTER("Rotate_log_event::do_update_pos");
 | |
| 
 | |
|   DBUG_PRINT("info", ("server_id=%lu; ::server_id=%lu",
 | |
|                       (ulong) this->server_id, (ulong) global_system_variables.server_id));
 | |
|   DBUG_PRINT("info", ("new_log_ident: %s", this->new_log_ident));
 | |
|   DBUG_PRINT("info", ("pos: %llu", this->pos));
 | |
| 
 | |
|   /*
 | |
|     If we are in a transaction or in a group: the only normal case is
 | |
|     when the I/O thread was copying a big transaction, then it was
 | |
|     stopped and restarted: we have this in the relay log:
 | |
| 
 | |
|     BEGIN
 | |
|     ...
 | |
|     ROTATE (a fake one)
 | |
|     ...
 | |
|     COMMIT or ROLLBACK
 | |
| 
 | |
|     In that case, we don't want to touch the coordinates which
 | |
|     correspond to the beginning of the transaction.  Starting from
 | |
|     5.0.0, there also are some rotates from the slave itself, in the
 | |
|     relay log, which shall not change the group positions.
 | |
| 
 | |
|     In parallel replication, rotate event is executed out-of-band with normal
 | |
|     events, so we cannot update group_master_log_name or _pos here, it will
 | |
|     be updated with the next normal event instead.
 | |
|   */
 | |
|   if ((server_id != global_system_variables.server_id ||
 | |
|        rli->replicate_same_server_id) &&
 | |
|       !is_relay_log_event() &&
 | |
|       !rli->is_in_group() &&
 | |
|       !rgi->is_parallel_exec)
 | |
|   {
 | |
|     mysql_mutex_lock(&rli->data_lock);
 | |
|     DBUG_PRINT("info", ("old group_master_log_name: '%s'  "
 | |
|                         "old group_master_log_pos: %lu",
 | |
|                         rli->group_master_log_name,
 | |
|                         (ulong) rli->group_master_log_pos));
 | |
|     memcpy(rli->group_master_log_name, new_log_ident, ident_len+1);
 | |
|     rli->notify_group_master_log_name_update();
 | |
|     rli->inc_group_relay_log_pos(pos, rgi, TRUE /* skip_lock */);
 | |
|     DBUG_PRINT("info", ("new group_master_log_name: '%s'  "
 | |
|                         "new group_master_log_pos: %lu",
 | |
|                         rli->group_master_log_name,
 | |
|                         (ulong) rli->group_master_log_pos));
 | |
|     mysql_mutex_unlock(&rli->data_lock);
 | |
|     rpl_global_gtid_slave_state->record_and_update_gtid(thd, rgi);
 | |
|     error= rli->flush();
 | |
|     
 | |
|     /*
 | |
|       Reset thd->variables.option_bits and sql_mode etc, because this could
 | |
|       be the signal of a master's downgrade from 5.0 to 4.0.
 | |
|       However, no need to reset description_event_for_exec: indeed, if the next
 | |
|       master is 5.0 (even 5.0.1) we will soon get a Format_desc; if the next
 | |
|       master is 4.0 then the events are in the slave's format (conversion).
 | |
|     */
 | |
|     set_slave_thread_options(thd);
 | |
|     set_slave_thread_default_charset(thd, rgi);
 | |
|     thd->variables.sql_mode= global_system_variables.sql_mode;
 | |
|     thd->variables.auto_increment_increment=
 | |
|       thd->variables.auto_increment_offset= 1;
 | |
|   }
 | |
|   else
 | |
|     rgi->inc_event_relay_log_pos();
 | |
| 
 | |
|   DBUG_RETURN(error);
 | |
| }
 | |
| 
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Rotate_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   enum_skip_reason reason= Log_event::do_shall_skip(rgi);
 | |
| 
 | |
|   switch (reason) {
 | |
|   case Log_event::EVENT_SKIP_NOT:
 | |
|   case Log_event::EVENT_SKIP_COUNT:
 | |
|     return Log_event::EVENT_SKIP_NOT;
 | |
| 
 | |
|   case Log_event::EVENT_SKIP_IGNORE:
 | |
|     return Log_event::EVENT_SKIP_IGNORE;
 | |
|   }
 | |
|   DBUG_ASSERT(0);
 | |
|   return Log_event::EVENT_SKIP_NOT;             // To keep compiler happy
 | |
| }
 | |
| 
 | |
| #endif
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
|   Binlog_checkpoint_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Binlog_checkpoint_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   protocol->store(binlog_file_name, binlog_file_len, &my_charset_bin);
 | |
| }
 | |
| 
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Binlog_checkpoint_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   enum_skip_reason reason= Log_event::do_shall_skip(rgi);
 | |
|   if (reason == EVENT_SKIP_COUNT)
 | |
|     reason= EVENT_SKIP_NOT;
 | |
|   return reason;
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| Binlog_checkpoint_log_event::Binlog_checkpoint_log_event(
 | |
|         const char *binlog_file_name_arg,
 | |
|         uint binlog_file_len_arg)
 | |
|   :Log_event(),
 | |
|    binlog_file_name(my_strndup(PSI_INSTRUMENT_ME, binlog_file_name_arg, binlog_file_len_arg,
 | |
|                                MYF(MY_WME))),
 | |
|    binlog_file_len(binlog_file_len_arg)
 | |
| {
 | |
|   cache_type= EVENT_NO_CACHE;
 | |
| }
 | |
| 
 | |
| 
 | |
| bool Binlog_checkpoint_log_event::write()
 | |
| {
 | |
|   uchar buf[BINLOG_CHECKPOINT_HEADER_LEN];
 | |
|   int4store(buf, binlog_file_len);
 | |
|   return write_header(BINLOG_CHECKPOINT_HEADER_LEN + binlog_file_len) ||
 | |
|          write_data(buf, BINLOG_CHECKPOINT_HEADER_LEN) ||
 | |
|          write_data(binlog_file_name, binlog_file_len) ||
 | |
|          write_footer();
 | |
| }
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
|         Global transaction ID stuff
 | |
| **************************************************************************/
 | |
| 
 | |
| Gtid_log_event::Gtid_log_event(THD *thd_arg, uint64 seq_no_arg,
 | |
|                                uint32 domain_id_arg, bool standalone,
 | |
|                                uint16 flags_arg, bool is_transactional,
 | |
|                                uint64 commit_id_arg, bool has_xid,
 | |
|                                bool ro_1pc)
 | |
|   : Log_event(thd_arg, flags_arg, is_transactional),
 | |
|     seq_no(seq_no_arg), commit_id(commit_id_arg), domain_id(domain_id_arg),
 | |
|     flags2((standalone ? FL_STANDALONE : 0) |
 | |
|            (commit_id_arg ? FL_GROUP_COMMIT_ID : 0)),
 | |
|     flags_extra(0), extra_engines(0)
 | |
| {
 | |
|   cache_type= Log_event::EVENT_NO_CACHE;
 | |
|   bool is_tmp_table= thd_arg->lex->stmt_accessed_temp_table();
 | |
|   if (thd_arg->transaction->stmt.trans_did_wait() ||
 | |
|       thd_arg->transaction->all.trans_did_wait())
 | |
|     flags2|= FL_WAITED;
 | |
|   if (thd_arg->transaction->stmt.trans_did_ddl() ||
 | |
|       thd_arg->transaction->stmt.has_created_dropped_temp_table() ||
 | |
|       thd_arg->transaction->stmt.trans_executed_admin_cmd() ||
 | |
|       thd_arg->transaction->all.trans_did_ddl() ||
 | |
|       thd_arg->transaction->all.has_created_dropped_temp_table() ||
 | |
|       thd_arg->transaction->all.trans_executed_admin_cmd())
 | |
|     flags2|= FL_DDL;
 | |
|   else if (is_transactional && !is_tmp_table &&
 | |
|            !(thd_arg->transaction->all.modified_non_trans_table &&
 | |
|              thd->variables.binlog_direct_non_trans_update == 0 &&
 | |
|              !thd->is_current_stmt_binlog_format_row()))
 | |
|     flags2|= FL_TRANSACTIONAL;
 | |
|   if (!(thd_arg->variables.option_bits & OPTION_RPL_SKIP_PARALLEL))
 | |
|     flags2|= FL_ALLOW_PARALLEL;
 | |
|   /* Preserve any DDL or WAITED flag in the slave's binlog. */
 | |
|   if (thd_arg->rgi_slave)
 | |
|     flags2|= (thd_arg->rgi_slave->gtid_ev_flags2 & (FL_DDL|FL_WAITED));
 | |
| 
 | |
|   XID_STATE &xid_state= thd->transaction->xid_state;
 | |
|   if (is_transactional)
 | |
|   {
 | |
|     if (xid_state.is_explicit_XA() &&
 | |
|         (thd->lex->sql_command == SQLCOM_XA_PREPARE ||
 | |
|          xid_state.get_state_code() == XA_PREPARED))
 | |
|     {
 | |
|       DBUG_ASSERT(!(thd->lex->sql_command == SQLCOM_XA_COMMIT &&
 | |
|                     thd->lex->xa_opt == XA_ONE_PHASE));
 | |
| 
 | |
|       flags2|= thd->lex->sql_command == SQLCOM_XA_PREPARE ?
 | |
|         FL_PREPARED_XA : FL_COMPLETED_XA;
 | |
|       xid.set(xid_state.get_xid());
 | |
|     }
 | |
|     /* count non-zero extra recoverable engines; total = extra + 1 */
 | |
|     if (has_xid)
 | |
|     {
 | |
|       DBUG_ASSERT(ha_count_rw_2pc(thd_arg,
 | |
|                                   thd_arg->in_multi_stmt_transaction_mode()));
 | |
| 
 | |
|       extra_engines=
 | |
|         ha_count_rw_2pc(thd_arg, thd_arg->in_multi_stmt_transaction_mode()) - 1;
 | |
|     }
 | |
|     else if (ro_1pc)
 | |
|     {
 | |
|       extra_engines= UCHAR_MAX;
 | |
|     }
 | |
|     else if (thd->lex->sql_command == SQLCOM_XA_PREPARE)
 | |
|     {
 | |
|       DBUG_ASSERT(thd_arg->in_multi_stmt_transaction_mode());
 | |
| 
 | |
|       uint8 count= ha_count_rw_2pc(thd_arg, true);
 | |
|       extra_engines= count > 1 ? 0 : UCHAR_MAX;
 | |
|     }
 | |
|     if (extra_engines > 0)
 | |
|       flags_extra|= FL_EXTRA_MULTI_ENGINE;
 | |
|   }
 | |
| 
 | |
|   DBUG_ASSERT(thd_arg->lex->sql_command != SQLCOM_CREATE_SEQUENCE ||
 | |
|               (flags2 & FL_DDL) || thd_arg->in_multi_stmt_transaction_mode());
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   Used to record GTID while sending binlog to slave, without having to
 | |
|   fully contruct every Gtid_log_event() needlessly.
 | |
| */
 | |
| bool
 | |
| Gtid_log_event::peek(const uchar *event_start, size_t event_len,
 | |
|                      enum enum_binlog_checksum_alg checksum_alg,
 | |
|                      uint32 *domain_id, uint32 *server_id, uint64 *seq_no,
 | |
|                      uchar *flags2, const Format_description_log_event *fdev)
 | |
| {
 | |
|   const uchar *p;
 | |
| 
 | |
|   if (checksum_alg == BINLOG_CHECKSUM_ALG_CRC32)
 | |
|   {
 | |
|     if (event_len > BINLOG_CHECKSUM_LEN)
 | |
|       event_len-= BINLOG_CHECKSUM_LEN;
 | |
|     else
 | |
|       event_len= 0;
 | |
|   }
 | |
|   else
 | |
|     DBUG_ASSERT(checksum_alg == BINLOG_CHECKSUM_ALG_UNDEF ||
 | |
|                 checksum_alg == BINLOG_CHECKSUM_ALG_OFF);
 | |
| 
 | |
|   if (event_len < (uint32)fdev->common_header_len + GTID_HEADER_LEN)
 | |
|     return true;
 | |
|   *server_id= uint4korr(event_start + SERVER_ID_OFFSET);
 | |
|   p= event_start + fdev->common_header_len;
 | |
|   *seq_no= uint8korr(p);
 | |
|   p+= 8;
 | |
|   *domain_id= uint4korr(p);
 | |
|   p+= 4;
 | |
|   *flags2= *p;
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| 
 | |
| bool
 | |
| Gtid_log_event::write()
 | |
| {
 | |
|   uchar buf[GTID_HEADER_LEN+2+sizeof(XID) + /* flags_extra: */ 1+4];
 | |
|   size_t write_len= 13;
 | |
| 
 | |
|   int8store(buf, seq_no);
 | |
|   int4store(buf+8, domain_id);
 | |
|   buf[12]= flags2;
 | |
|   if (flags2 & FL_GROUP_COMMIT_ID)
 | |
|   {
 | |
|     DBUG_ASSERT(write_len + 8 == GTID_HEADER_LEN + 2);
 | |
| 
 | |
|     int8store(buf+write_len, commit_id);
 | |
|     write_len= GTID_HEADER_LEN + 2;
 | |
|   }
 | |
| 
 | |
|   if (flags2 & (FL_PREPARED_XA | FL_COMPLETED_XA)
 | |
| #ifndef DBUG_OFF
 | |
|       && DBUG_EVALUATE_IF("negate_xid_from_gtid", 0, 1)
 | |
| #endif
 | |
|   )
 | |
|   {
 | |
|     int4store(&buf[write_len],   xid.formatID);
 | |
|     buf[write_len +4]=   (uchar) xid.gtrid_length;
 | |
|     buf[write_len +4+1]= (uchar) xid.bqual_length;
 | |
|     write_len+= 6;
 | |
|     long data_length= xid.bqual_length + xid.gtrid_length;
 | |
| 
 | |
| #ifndef DBUG_OFF
 | |
|     if (DBUG_EVALUATE_IF("negate_xid_data_from_gtid", 0, 1))
 | |
|     {
 | |
| #endif
 | |
|     memcpy(buf+write_len, xid.data, data_length);
 | |
|     write_len+= data_length;
 | |
| #ifndef DBUG_OFF
 | |
|     }
 | |
| #endif
 | |
|   }
 | |
| 
 | |
|   DBUG_EXECUTE_IF("inject_fl_extra_multi_engine_into_gtid", {
 | |
|     flags_extra|= FL_EXTRA_MULTI_ENGINE;
 | |
|   });
 | |
|   if (flags_extra > 0)
 | |
|   {
 | |
|     buf[write_len]= flags_extra;
 | |
|     write_len++;
 | |
|   }
 | |
|   DBUG_EXECUTE_IF("inject_fl_extra_multi_engine_into_gtid", {
 | |
|     flags_extra&= ~FL_EXTRA_MULTI_ENGINE;
 | |
|   });
 | |
| 
 | |
|   if (flags_extra & FL_EXTRA_MULTI_ENGINE)
 | |
|   {
 | |
|     buf[write_len]= extra_engines;
 | |
|     write_len++;
 | |
|   }
 | |
| 
 | |
|   if (write_len < GTID_HEADER_LEN)
 | |
|   {
 | |
|     bzero(buf+write_len, GTID_HEADER_LEN-write_len);
 | |
|     write_len= GTID_HEADER_LEN;
 | |
|   }
 | |
|   return write_header(write_len) ||
 | |
|          write_data(buf, write_len) ||
 | |
|          write_footer();
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   Replace a GTID event with either a BEGIN event, dummy event, or nothing, as
 | |
|   appropriate to work with old slave that does not know global transaction id.
 | |
| 
 | |
|   The need_dummy_event argument is an IN/OUT argument. It is passed as TRUE
 | |
|   if slave has capability lower than MARIA_SLAVE_CAPABILITY_TOLERATE_HOLES.
 | |
|   It is returned TRUE if we return a BEGIN (or dummy) event to be sent to the
 | |
|   slave, FALSE if event should be skipped completely.
 | |
| */
 | |
| int
 | |
| Gtid_log_event::make_compatible_event(String *packet, bool *need_dummy_event,
 | |
|                                       ulong ev_offset,
 | |
|                                       enum enum_binlog_checksum_alg checksum_alg)
 | |
| {
 | |
|   uchar flags2;
 | |
|   if (packet->length() - ev_offset < LOG_EVENT_HEADER_LEN + GTID_HEADER_LEN)
 | |
|     return 1;
 | |
|   flags2= (*packet)[ev_offset + LOG_EVENT_HEADER_LEN + 12];
 | |
|   if (flags2 & FL_STANDALONE)
 | |
|   {
 | |
|     if (*need_dummy_event)
 | |
|       return Query_log_event::dummy_event(packet, ev_offset, checksum_alg);
 | |
|     return 0;
 | |
|   }
 | |
| 
 | |
|   *need_dummy_event= true;
 | |
|   return Query_log_event::begin_event(packet, ev_offset, checksum_alg);
 | |
| }
 | |
| 
 | |
| 
 | |
| #ifdef HAVE_REPLICATION
 | |
| void
 | |
| Gtid_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf[6+5+10+1+10+1+20+1+4+20+1+ ser_buf_size+5 /* sprintf */];
 | |
|   char *p;
 | |
|   p = strmov(buf, (flags2 & FL_STANDALONE  ? "GTID " :
 | |
|                    flags2 & FL_PREPARED_XA ? "XA START " : "BEGIN GTID "));
 | |
|   if (flags2 & FL_PREPARED_XA)
 | |
|   {
 | |
|     p+= sprintf(p, "%s GTID ", xid.serialize());
 | |
|   }
 | |
|   p= longlong10_to_str(domain_id, p, 10);
 | |
|   *p++= '-';
 | |
|   p= longlong10_to_str(server_id, p, 10);
 | |
|   *p++= '-';
 | |
|   p= longlong10_to_str(seq_no, p, 10);
 | |
|   if (flags2 & FL_GROUP_COMMIT_ID)
 | |
|   {
 | |
|     p= strmov(p, " cid=");
 | |
|     p= longlong10_to_str(commit_id, p, 10);
 | |
|   }
 | |
| 
 | |
|   protocol->store(buf, p-buf, &my_charset_bin);
 | |
| }
 | |
| 
 | |
| static char gtid_begin_string[] = "BEGIN";
 | |
| 
 | |
| int
 | |
| Gtid_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   ulonglong bits= thd->variables.option_bits;
 | |
|   thd->variables.server_id= this->server_id;
 | |
|   thd->variables.gtid_domain_id= this->domain_id;
 | |
|   thd->variables.gtid_seq_no= this->seq_no;
 | |
|   rgi->gtid_ev_flags2= flags2;
 | |
|   thd->reset_for_next_command();
 | |
| 
 | |
|   if (opt_gtid_strict_mode && opt_bin_log && opt_log_slave_updates)
 | |
|   {
 | |
|     if (mysql_bin_log.check_strict_gtid_sequence(this->domain_id,
 | |
|                                                  this->server_id, this->seq_no))
 | |
|       return 1;
 | |
|   }
 | |
| 
 | |
|   DBUG_ASSERT((bits & OPTION_GTID_BEGIN) == 0);
 | |
| 
 | |
|   Master_info *mi=rgi->rli->mi;
 | |
|   switch (flags2 & (FL_DDL | FL_TRANSACTIONAL))
 | |
|   {
 | |
|     case FL_TRANSACTIONAL:
 | |
|       mi->total_trans_groups++;
 | |
|       break;
 | |
|     case FL_DDL:
 | |
|       mi->total_ddl_groups++;
 | |
|     break;
 | |
|     default:
 | |
|       mi->total_non_trans_groups++;
 | |
|   }
 | |
| 
 | |
|   if (flags2 & FL_STANDALONE)
 | |
|     return 0;
 | |
| 
 | |
|   /* Execute this like a BEGIN query event. */
 | |
|   bits|= OPTION_GTID_BEGIN;
 | |
|   if (flags2 & FL_ALLOW_PARALLEL)
 | |
|     bits&= ~(ulonglong)OPTION_RPL_SKIP_PARALLEL;
 | |
|   else
 | |
|     bits|= (ulonglong)OPTION_RPL_SKIP_PARALLEL;
 | |
|   thd->variables.option_bits= bits;
 | |
|   DBUG_PRINT("info", ("Set OPTION_GTID_BEGIN"));
 | |
|   thd->is_slave_error= 0;
 | |
| 
 | |
|   char buf_xa[sizeof("XA START") + 1 + ser_buf_size];
 | |
|   if (flags2 & FL_PREPARED_XA)
 | |
|   {
 | |
|     const char fmt[]= "XA START %s";
 | |
| 
 | |
|     thd->lex->xid= &xid;
 | |
|     thd->lex->xa_opt= XA_NONE;
 | |
|     sprintf(buf_xa, fmt, xid.serialize());
 | |
|     thd->set_query_and_id(buf_xa, static_cast<uint32>(strlen(buf_xa)),
 | |
|                           &my_charset_bin, next_query_id());
 | |
|     thd->lex->sql_command= SQLCOM_XA_START;
 | |
|     if (trans_xa_start(thd))
 | |
|     {
 | |
|       DBUG_PRINT("error", ("trans_xa_start() failed"));
 | |
|       thd->is_slave_error= 1;
 | |
|     }
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     thd->set_query_and_id(gtid_begin_string, sizeof(gtid_begin_string)-1,
 | |
|                           &my_charset_bin, next_query_id());
 | |
|     thd->lex->sql_command= SQLCOM_BEGIN;
 | |
|     if (trans_begin(thd, 0))
 | |
|     {
 | |
|       DBUG_PRINT("error", ("trans_begin() failed"));
 | |
|       thd->is_slave_error= 1;
 | |
|     }
 | |
|   }
 | |
|   status_var_increment(thd->status_var.com_stat[thd->lex->sql_command]);
 | |
|   thd->update_stats();
 | |
| 
 | |
|   if (likely(!thd->is_slave_error))
 | |
|     general_log_write(thd, COM_QUERY, thd->query(), thd->query_length());
 | |
| 
 | |
|   thd->reset_query();
 | |
|   free_root(thd->mem_root,MYF(MY_KEEP_PREALLOC));
 | |
|   return thd->is_slave_error;
 | |
| }
 | |
| 
 | |
| 
 | |
| int
 | |
| Gtid_log_event::do_update_pos(rpl_group_info *rgi)
 | |
| {
 | |
|   rgi->inc_event_relay_log_pos();
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Gtid_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   Relay_log_info *rli= rgi->rli;
 | |
|   /*
 | |
|     An event skipped due to @@skip_replication must not be counted towards the
 | |
|     number of events to be skipped due to @@sql_slave_skip_counter.
 | |
|   */
 | |
|   if (flags & LOG_EVENT_SKIP_REPLICATION_F &&
 | |
|       opt_replicate_events_marked_for_skip != RPL_SKIP_REPLICATE)
 | |
|     return Log_event::EVENT_SKIP_IGNORE;
 | |
| 
 | |
|   if (rli->slave_skip_counter > 0)
 | |
|   {
 | |
|     if (!(flags2 & FL_STANDALONE))
 | |
|     {
 | |
|       thd->variables.option_bits|= OPTION_BEGIN;
 | |
|       DBUG_ASSERT(rgi->rli->get_flag(Relay_log_info::IN_TRANSACTION));
 | |
|     }
 | |
|     return Log_event::continue_group(rgi);
 | |
|   }
 | |
|   return Log_event::do_shall_skip(rgi);
 | |
| }
 | |
| 
 | |
| 
 | |
| #endif  /* HAVE_REPLICATION */
 | |
| 
 | |
| 
 | |
| 
 | |
| Gtid_list_log_event::Gtid_list_log_event(rpl_binlog_state *gtid_set,
 | |
|                                          uint32 gl_flags_)
 | |
|   : count(gtid_set->count()), gl_flags(gl_flags_), list(0), sub_id_list(0)
 | |
| {
 | |
|   cache_type= EVENT_NO_CACHE;
 | |
|   /* Failure to allocate memory will be caught by is_valid() returning false. */
 | |
|   if (count < (1<<28) &&
 | |
|       (list = (rpl_gtid *)my_malloc(PSI_INSTRUMENT_ME,
 | |
|                            count * sizeof(*list) + (count == 0), MYF(MY_WME))))
 | |
|     gtid_set->get_gtid_list(list, count);
 | |
| }
 | |
| 
 | |
| 
 | |
| Gtid_list_log_event::Gtid_list_log_event(slave_connection_state *gtid_set,
 | |
|                                          uint32 gl_flags_)
 | |
|   : count(gtid_set->count()), gl_flags(gl_flags_), list(0), sub_id_list(0)
 | |
| {
 | |
|   cache_type= EVENT_NO_CACHE;
 | |
|   /* Failure to allocate memory will be caught by is_valid() returning false. */
 | |
|   if (count < (1<<28) &&
 | |
|       (list = (rpl_gtid *)my_malloc(PSI_INSTRUMENT_ME,
 | |
|                           count * sizeof(*list) + (count == 0), MYF(MY_WME))))
 | |
|   {
 | |
|     gtid_set->get_gtid_list(list, count);
 | |
| #if defined(HAVE_REPLICATION)
 | |
|     if (gl_flags & FLAG_IGN_GTIDS)
 | |
|     {
 | |
|       uint32 i;
 | |
| 
 | |
|       if (!(sub_id_list= (uint64 *)my_malloc(PSI_INSTRUMENT_ME,
 | |
|                                          count * sizeof(uint64), MYF(MY_WME))))
 | |
|       {
 | |
|         my_free(list);
 | |
|         list= NULL;
 | |
|         return;
 | |
|       }
 | |
|       for (i= 0; i < count; ++i)
 | |
|       {
 | |
|         if (!(sub_id_list[i]=
 | |
|               rpl_global_gtid_slave_state->next_sub_id(list[i].domain_id)))
 | |
|         {
 | |
|           my_free(list);
 | |
|           my_free(sub_id_list);
 | |
|           list= NULL;
 | |
|           sub_id_list= NULL;
 | |
|           return;
 | |
|         }
 | |
|       }
 | |
|     }
 | |
| #endif
 | |
|   }
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| bool
 | |
| Gtid_list_log_event::to_packet(String *packet)
 | |
| {
 | |
|   uint32 i;
 | |
|   uchar *p;
 | |
|   uint32 needed_length;
 | |
| 
 | |
|   DBUG_ASSERT(count < 1<<28);
 | |
| 
 | |
|   needed_length= packet->length() + get_data_size();
 | |
|   if (packet->reserve(needed_length))
 | |
|     return true;
 | |
|   p= (uchar *)packet->ptr() + packet->length();;
 | |
|   packet->length(needed_length);
 | |
|   int4store(p, (count & ((1<<28)-1)) | gl_flags);
 | |
|   p += 4;
 | |
|   /* Initialise the padding for empty Gtid_list. */
 | |
|   if (count == 0)
 | |
|     int2store(p, 0);
 | |
|   for (i= 0; i < count; ++i)
 | |
|   {
 | |
|     int4store(p, list[i].domain_id);
 | |
|     int4store(p+4, list[i].server_id);
 | |
|     int8store(p+8, list[i].seq_no);
 | |
|     p += 16;
 | |
|   }
 | |
| 
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| 
 | |
| bool
 | |
| Gtid_list_log_event::write()
 | |
| {
 | |
|   char buf[128];
 | |
|   String packet(buf, sizeof(buf), system_charset_info);
 | |
| 
 | |
|   packet.length(0);
 | |
|   if (to_packet(&packet))
 | |
|     return true;
 | |
|   return write_header(get_data_size()) ||
 | |
|          write_data(packet.ptr(), packet.length()) ||
 | |
|          write_footer();
 | |
| }
 | |
| 
 | |
| 
 | |
| int
 | |
| Gtid_list_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   Relay_log_info *rli= const_cast<Relay_log_info*>(rgi->rli);
 | |
|   int ret;
 | |
|   if (gl_flags & FLAG_IGN_GTIDS)
 | |
|   {
 | |
|     void *hton= NULL;
 | |
|     uint32 i;
 | |
| 
 | |
|     for (i= 0; i < count; ++i)
 | |
|     {
 | |
|       if ((ret= rpl_global_gtid_slave_state->record_gtid(thd, &list[i],
 | |
|                                                          sub_id_list[i],
 | |
|                                                          false, false, &hton)))
 | |
|         return ret;
 | |
|       rpl_global_gtid_slave_state->update_state_hash(sub_id_list[i], &list[i],
 | |
|                                                      hton, NULL);
 | |
|     }
 | |
|   }
 | |
|   ret= Log_event::do_apply_event(rgi);
 | |
|   if (rli->until_condition == Relay_log_info::UNTIL_GTID &&
 | |
|       (gl_flags & FLAG_UNTIL_REACHED))
 | |
|   {
 | |
|     char str_buf[128];
 | |
|     String str(str_buf, sizeof(str_buf), system_charset_info);
 | |
|     rli->until_gtid_pos.to_string(&str);
 | |
|     sql_print_information("Slave SQL thread stops because it reached its"
 | |
|                           " UNTIL master_gtid_pos %s", str.c_ptr_safe());
 | |
|     rli->abort_slave= true;
 | |
|     rli->stop_for_until= true;
 | |
|   }
 | |
|   free_root(thd->mem_root, MYF(MY_KEEP_PREALLOC));
 | |
|   return ret;
 | |
| }
 | |
| 
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Gtid_list_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   enum_skip_reason reason= Log_event::do_shall_skip(rgi);
 | |
|   if (reason == EVENT_SKIP_COUNT)
 | |
|     reason= EVENT_SKIP_NOT;
 | |
|   return reason;
 | |
| }
 | |
| 
 | |
| 
 | |
| void
 | |
| Gtid_list_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf_mem[1024];
 | |
|   String buf(buf_mem, sizeof(buf_mem), system_charset_info);
 | |
|   uint32 i;
 | |
|   bool first;
 | |
| 
 | |
|   buf.length(0);
 | |
|   buf.append(STRING_WITH_LEN("["));
 | |
|   first= true;
 | |
|   for (i= 0; i < count; ++i)
 | |
|     rpl_slave_state_tostring_helper(&buf, &list[i], &first);
 | |
|   buf.append(STRING_WITH_LEN("]"));
 | |
| 
 | |
|   protocol->store(&buf);
 | |
| }
 | |
| #endif  /* HAVE_REPLICATION */
 | |
| 
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Intvar_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Intvar_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf[256], *pos;
 | |
|   pos= strmake(buf, get_var_type_name(), sizeof(buf)-23);
 | |
|   *pos++= '=';
 | |
|   pos= longlong10_to_str(val, pos, -10);
 | |
|   protocol->store(buf, (uint) (pos-buf), &my_charset_bin);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| bool Intvar_log_event::write()
 | |
| {
 | |
|   uchar buf[9];
 | |
|   buf[I_TYPE_OFFSET]= (uchar) type;
 | |
|   int8store(buf + I_VAL_OFFSET, val);
 | |
|   return write_header(sizeof(buf)) ||
 | |
|          write_data(buf, sizeof(buf)) ||
 | |
|          write_footer();
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| /*
 | |
|   Intvar_log_event::do_apply_event()
 | |
| */
 | |
| 
 | |
| int Intvar_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   DBUG_ENTER("Intvar_log_event::do_apply_event");
 | |
|   if (rgi->deferred_events_collecting)
 | |
|   {
 | |
|     DBUG_PRINT("info",("deferring event"));
 | |
|     DBUG_RETURN(rgi->deferred_events->add(this));
 | |
|   }
 | |
| 
 | |
|   switch (type) {
 | |
|   case LAST_INSERT_ID_EVENT:
 | |
|     thd->first_successful_insert_id_in_prev_stmt= val;
 | |
|     DBUG_PRINT("info",("last_insert_id_event: %ld", (long) val));
 | |
|     break;
 | |
|   case INSERT_ID_EVENT:
 | |
|     thd->force_one_auto_inc_interval(val);
 | |
|     break;
 | |
|   }
 | |
|   DBUG_RETURN(0);
 | |
| }
 | |
| 
 | |
| int Intvar_log_event::do_update_pos(rpl_group_info *rgi)
 | |
| {
 | |
|   rgi->inc_event_relay_log_pos();
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Intvar_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   /*
 | |
|     It is a common error to set the slave skip counter to 1 instead of
 | |
|     2 when recovering from an insert which used a auto increment,
 | |
|     rand, or user var.  Therefore, if the slave skip counter is 1, we
 | |
|     just say that this event should be skipped by ignoring it, meaning
 | |
|     that we do not change the value of the slave skip counter since it
 | |
|     will be decreased by the following insert event.
 | |
|   */
 | |
|   return continue_group(rgi);
 | |
| }
 | |
| 
 | |
| #endif
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
|   Rand_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Rand_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf1[256], *pos;
 | |
|   pos= strmov(buf1,"rand_seed1=");
 | |
|   pos= int10_to_str((long) seed1, pos, 10);
 | |
|   pos= strmov(pos, ",rand_seed2=");
 | |
|   pos= int10_to_str((long) seed2, pos, 10);
 | |
|   protocol->store(buf1, (uint) (pos-buf1), &my_charset_bin);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| bool Rand_log_event::write()
 | |
| {
 | |
|   uchar buf[16];
 | |
|   int8store(buf + RAND_SEED1_OFFSET, seed1);
 | |
|   int8store(buf + RAND_SEED2_OFFSET, seed2);
 | |
|   return write_header(sizeof(buf)) ||
 | |
|          write_data(buf, sizeof(buf)) ||
 | |
|          write_footer();
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| int Rand_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   if (rgi->deferred_events_collecting)
 | |
|     return rgi->deferred_events->add(this);
 | |
| 
 | |
|   thd->rand.seed1= (ulong) seed1;
 | |
|   thd->rand.seed2= (ulong) seed2;
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| int Rand_log_event::do_update_pos(rpl_group_info *rgi)
 | |
| {
 | |
|   rgi->inc_event_relay_log_pos();
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Rand_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   /*
 | |
|     It is a common error to set the slave skip counter to 1 instead of
 | |
|     2 when recovering from an insert which used a auto increment,
 | |
|     rand, or user var.  Therefore, if the slave skip counter is 1, we
 | |
|     just say that this event should be skipped by ignoring it, meaning
 | |
|     that we do not change the value of the slave skip counter since it
 | |
|     will be decreased by the following insert event.
 | |
|   */
 | |
|   return continue_group(rgi);
 | |
| }
 | |
| 
 | |
| /**
 | |
|    Exec deferred Int-, Rand- and User- var events prefixing
 | |
|    a Query-log-event event.
 | |
| 
 | |
|    @param thd THD handle
 | |
| 
 | |
|    @return false on success, true if a failure in an event applying occurred.
 | |
| */
 | |
| bool slave_execute_deferred_events(THD *thd)
 | |
| {
 | |
|   bool res= false;
 | |
|   rpl_group_info *rgi= thd->rgi_slave;
 | |
| 
 | |
|   DBUG_ASSERT(rgi && (!rgi->deferred_events_collecting || rgi->deferred_events));
 | |
| 
 | |
|   if (!rgi->deferred_events_collecting || rgi->deferred_events->is_empty())
 | |
|     return res;
 | |
| 
 | |
|   res= rgi->deferred_events->execute(rgi);
 | |
|   rgi->deferred_events->rewind();
 | |
| 
 | |
|   return res;
 | |
| }
 | |
| 
 | |
| #endif /* HAVE_REPLICATION */
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
|   Xid_apply_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| int Xid_apply_log_event::do_record_gtid(THD *thd, rpl_group_info *rgi,
 | |
|                                         bool in_trans, void **out_hton,
 | |
|                                         bool force_err)
 | |
| {
 | |
|   int err= 0;
 | |
|   Relay_log_info const *rli= rgi->rli;
 | |
| 
 | |
|   rgi->gtid_pending= false;
 | |
|   err= rpl_global_gtid_slave_state->record_gtid(thd, &rgi->current_gtid,
 | |
|                                                 rgi->gtid_sub_id,
 | |
|                                                 in_trans, false, out_hton);
 | |
| 
 | |
|   if (unlikely(err))
 | |
|   {
 | |
|     int ec= thd->get_stmt_da()->sql_errno();
 | |
|     /*
 | |
|       Do not report an error if this is really a kill due to a deadlock.
 | |
|       In this case, the transaction will be re-tried instead. Unless force_err
 | |
|       is set, as in the case of XA PREPARE, as the GTID state is updated as a
 | |
|       separate transaction, and if that fails, we should not retry but exit in
 | |
|       error immediately.
 | |
|     */
 | |
|     if (!is_parallel_retry_error(rgi, ec) || force_err)
 | |
|     {
 | |
|       char buff[MAX_SLAVE_ERRMSG];
 | |
|       buff[0]= 0;
 | |
|       aggregate_da_errors(buff, sizeof(buff), thd->get_stmt_da());
 | |
| 
 | |
|       if (force_err)
 | |
|         thd->clear_error();
 | |
| 
 | |
|       rli->report(ERROR_LEVEL, ER_CANNOT_UPDATE_GTID_STATE, rgi->gtid_info(),
 | |
|                   "Error during XID COMMIT: failed to update GTID state in "
 | |
|                   "%s.%s: %d: %s the event's master log %s, end_log_pos %llu",
 | |
|                   "mysql", rpl_gtid_slave_state_table_name.str, ec,
 | |
|                   buff, RPL_LOG_NAME, log_pos);
 | |
|     }
 | |
|     thd->is_slave_error= 1;
 | |
|   }
 | |
| 
 | |
|   return err;
 | |
| }
 | |
| 
 | |
| static bool wsrep_must_replay(THD *thd)
 | |
| {
 | |
| #ifdef WITH_WSREP
 | |
|   mysql_mutex_lock(&thd->LOCK_thd_data);
 | |
|   bool res= WSREP(thd) && thd->wsrep_trx().state() == wsrep::transaction::s_must_replay;
 | |
|   mysql_mutex_unlock(&thd->LOCK_thd_data);
 | |
|   return res;
 | |
| #else
 | |
|   return false;
 | |
| #endif
 | |
| }
 | |
| 
 | |
| 
 | |
| int Xid_apply_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   bool res;
 | |
|   int err;
 | |
|   uint64 sub_id= 0;
 | |
|   void *hton= NULL;
 | |
|   rpl_gtid gtid;
 | |
| 
 | |
|   /*
 | |
|     An instance of this class such as XID_EVENT works like a COMMIT
 | |
|     statement. It updates mysql.gtid_slave_pos with the GTID of the
 | |
|     current transaction.
 | |
|     Therefore, it acts much like a normal SQL statement, so we need to do
 | |
|     THD::reset_for_next_command() as if starting a new statement.
 | |
| 
 | |
|     XA_PREPARE_LOG_EVENT also updates the gtid table *but* the update gets
 | |
|     committed as separate "autocommit" transaction.
 | |
|   */
 | |
|   thd->reset_for_next_command();
 | |
|   /*
 | |
|     Record any GTID in the same transaction, so slave state is transactionally
 | |
|     consistent.
 | |
|   */
 | |
| #ifdef WITH_WSREP
 | |
|   thd->wsrep_affected_rows= 0;
 | |
| #endif
 | |
| 
 | |
| #ifndef DBUG_OFF
 | |
|   bool record_gtid_delayed_for_xa= false;
 | |
| #endif
 | |
|   if (rgi->gtid_pending)
 | |
|   {
 | |
|     sub_id= rgi->gtid_sub_id;
 | |
|     gtid= rgi->current_gtid;
 | |
| 
 | |
|     if (!thd->transaction->xid_state.is_explicit_XA())
 | |
|     {
 | |
|       if ((err= do_record_gtid(thd, rgi, true /* in_trans */, &hton)))
 | |
|         return err;
 | |
| 
 | |
|       DBUG_EXECUTE_IF("gtid_fail_after_record_gtid",
 | |
|                       {
 | |
|                         my_error(ER_ERROR_DURING_COMMIT, MYF(0),
 | |
|                                  HA_ERR_WRONG_COMMAND);
 | |
|                         thd->is_slave_error= 1;
 | |
|                         return 1;
 | |
|                       });
 | |
|     }
 | |
| #ifndef DBUG_OFF
 | |
|     else
 | |
|       record_gtid_delayed_for_xa= true;
 | |
| #endif
 | |
|   }
 | |
| 
 | |
|   general_log_print(thd, COM_QUERY, "%s", get_query());
 | |
|   thd->variables.option_bits&= ~OPTION_GTID_BEGIN;
 | |
|   res= do_commit();
 | |
|   if (!res && rgi->gtid_pending)
 | |
|   {
 | |
|     DBUG_ASSERT(!thd->transaction->xid_state.is_explicit_XA());
 | |
| 
 | |
|     DBUG_ASSERT(record_gtid_delayed_for_xa);
 | |
|     if (thd->rgi_slave->is_parallel_exec)
 | |
|     {
 | |
|       /*
 | |
|         With XA, since the transaction is prepared/committed without updating
 | |
|         the GTID pos (MDEV-32020...), we need here to clear any pending
 | |
|         deadlock kill.
 | |
| 
 | |
|         Otherwise if the kill happened after the prepare/commit completed, it
 | |
|         might end up killing the subsequent GTID position update, causing the
 | |
|         slave to fail with error.
 | |
|       */
 | |
|       wait_for_pending_deadlock_kill(thd, thd->rgi_slave);
 | |
|       thd->reset_killed();
 | |
|     }
 | |
| 
 | |
|     if ((err= do_record_gtid(thd, rgi, false, &hton, true)))
 | |
|       return err;
 | |
|   }
 | |
| 
 | |
|   if (sub_id && (!res || wsrep_must_replay(thd)))
 | |
|     rpl_global_gtid_slave_state->update_state_hash(sub_id, >id, hton, rgi);
 | |
|   /*
 | |
|     Increment the global status commit count variable
 | |
|   */
 | |
|   enum enum_sql_command cmd= !thd->transaction->xid_state.is_explicit_XA()
 | |
|     ? SQLCOM_COMMIT : SQLCOM_XA_PREPARE;
 | |
|   status_var_increment(thd->status_var.com_stat[cmd]);
 | |
| 
 | |
|   return res;
 | |
| }
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Xid_apply_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   DBUG_ENTER("Xid_apply_log_event::do_shall_skip");
 | |
|   if (rgi->rli->slave_skip_counter > 0)
 | |
|   {
 | |
|     DBUG_ASSERT(!rgi->rli->get_flag(Relay_log_info::IN_TRANSACTION));
 | |
|     thd->variables.option_bits&= ~(OPTION_BEGIN | OPTION_GTID_BEGIN);
 | |
|     DBUG_RETURN(Log_event::EVENT_SKIP_COUNT);
 | |
|   }
 | |
| #ifdef WITH_WSREP
 | |
|   else if (wsrep_mysql_replication_bundle && WSREP(thd) &&
 | |
|            opt_slave_domain_parallel_threads == 0)
 | |
|   {
 | |
|     if (++thd->wsrep_mysql_replicated < (int)wsrep_mysql_replication_bundle)
 | |
|     {
 | |
|       WSREP_DEBUG("skipping wsrep commit %d", thd->wsrep_mysql_replicated);
 | |
|       DBUG_RETURN(Log_event::EVENT_SKIP_IGNORE);
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       thd->wsrep_mysql_replicated = 0;
 | |
|     }
 | |
|   }
 | |
| #endif
 | |
|   DBUG_RETURN(Log_event::do_shall_skip(rgi));
 | |
| }
 | |
| #endif /* HAVE_REPLICATION */
 | |
| 
 | |
| /**************************************************************************
 | |
|   Xid_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Xid_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf[128], *pos;
 | |
|   pos= strmov(buf, "COMMIT /* xid=");
 | |
|   pos= longlong10_to_str(xid, pos, 10);
 | |
|   pos= strmov(pos, " */");
 | |
|   protocol->store(buf, (uint) (pos-buf), &my_charset_bin);
 | |
| }
 | |
| 
 | |
| 
 | |
| int Xid_log_event::do_commit()
 | |
| {
 | |
|   bool res;
 | |
|   res= trans_commit(thd); /* Automatically rolls back on error. */
 | |
|   thd->release_transactional_locks();
 | |
|   return res;
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| bool Xid_log_event::write()
 | |
| {
 | |
|   DBUG_EXECUTE_IF("do_not_write_xid", return 0;);
 | |
|   return write_header(sizeof(xid)) ||
 | |
|          write_data((uchar*)&xid, sizeof(xid)) ||
 | |
|          write_footer();
 | |
| }
 | |
| 
 | |
| /**************************************************************************
 | |
|   XA_prepare_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void XA_prepare_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char query[sizeof("XA COMMIT ONE PHASE") + 1 + ser_buf_size];
 | |
| 
 | |
|   sprintf(query,
 | |
|           (one_phase ? "XA COMMIT %s ONE PHASE" :  "XA PREPARE %s"),
 | |
|           m_xid.serialize());
 | |
| 
 | |
|   protocol->store(query, strlen(query), &my_charset_bin);
 | |
| }
 | |
| 
 | |
| 
 | |
| int XA_prepare_log_event::do_commit()
 | |
| {
 | |
|   int res;
 | |
|   xid_t xid;
 | |
|   xid.set(m_xid.formatID,
 | |
|           m_xid.data, m_xid.gtrid_length,
 | |
|           m_xid.data + m_xid.gtrid_length, m_xid.bqual_length);
 | |
| 
 | |
|   thd->lex->xid= &xid;
 | |
|   if (!one_phase)
 | |
|   {
 | |
|     if (thd->is_current_stmt_binlog_disabled() &&
 | |
|         (res= thd->wait_for_prior_commit()))
 | |
|       return res;
 | |
| 
 | |
|     thd->lex->sql_command= SQLCOM_XA_PREPARE;
 | |
|     res= trans_xa_prepare(thd);
 | |
|   }
 | |
|   else
 | |
|     res= trans_xa_commit(thd);
 | |
| 
 | |
|   return res;
 | |
| }
 | |
| #endif // HAVE_REPLICATION
 | |
| 
 | |
| 
 | |
| bool XA_prepare_log_event::write()
 | |
| {
 | |
|   uchar data[1 + 4 + 4 + 4]= {one_phase,};
 | |
|   uint8 one_phase_byte= one_phase;
 | |
| 
 | |
|   int4store(data+1, static_cast<XID*>(xid)->formatID);
 | |
|   int4store(data+(1+4), static_cast<XID*>(xid)->gtrid_length);
 | |
|   int4store(data+(1+4+4), static_cast<XID*>(xid)->bqual_length);
 | |
| 
 | |
|   DBUG_ASSERT(xid_subheader_no_data == sizeof(data) - 1);
 | |
| 
 | |
|   return write_header(sizeof(one_phase_byte) + xid_subheader_no_data +
 | |
|                       static_cast<XID*>(xid)->gtrid_length +
 | |
|                       static_cast<XID*>(xid)->bqual_length) ||
 | |
|          write_data(data, sizeof(data)) ||
 | |
|          write_data((uchar*) static_cast<XID*>(xid)->data,
 | |
|                      static_cast<XID*>(xid)->gtrid_length +
 | |
|                      static_cast<XID*>(xid)->bqual_length) ||
 | |
|          write_footer();
 | |
| }
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
|   User_var_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| static bool
 | |
| user_var_append_name_part(THD *thd, String *buf,
 | |
|                           const char *name, size_t name_len,
 | |
|                           const LEX_CSTRING &data_type_name)
 | |
| {
 | |
|   return buf->append('@') ||
 | |
|     append_identifier(thd, buf, name, name_len) ||
 | |
|     buf->append('=') ||
 | |
|     (data_type_name.length &&
 | |
|      (buf->append(STRING_WITH_LEN("/*")) ||
 | |
|       buf->append(data_type_name.str, data_type_name.length) ||
 | |
|       buf->append(STRING_WITH_LEN("*/"))));
 | |
| }
 | |
| 
 | |
| void User_var_log_event::pack_info(Protocol* protocol)
 | |
| {
 | |
|   if (is_null)
 | |
|   {
 | |
|     char buf_mem[FN_REFLEN+7];
 | |
|     String buf(buf_mem, sizeof(buf_mem), system_charset_info);
 | |
|     buf.length(0);
 | |
|     if (user_var_append_name_part(protocol->thd, &buf, name, name_len,
 | |
|                                   m_data_type_name) ||
 | |
|         buf.append(NULL_clex_str))
 | |
|       return;
 | |
|     protocol->store(buf.ptr(), buf.length(), &my_charset_bin);
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     switch (m_type) {
 | |
|     case REAL_RESULT:
 | |
|     {
 | |
|       double real_val;
 | |
|       char buf2[MY_GCVT_MAX_FIELD_WIDTH+1];
 | |
|       char buf_mem[FN_REFLEN + MY_GCVT_MAX_FIELD_WIDTH + 1];
 | |
|       String buf(buf_mem, sizeof(buf_mem), system_charset_info);
 | |
|       float8get(real_val, val);
 | |
|       buf.length(0);
 | |
|       if (user_var_append_name_part(protocol->thd, &buf, name, name_len,
 | |
|                                     m_data_type_name) ||
 | |
|           buf.append(buf2, my_gcvt(real_val, MY_GCVT_ARG_DOUBLE,
 | |
|                                    MY_GCVT_MAX_FIELD_WIDTH, buf2, NULL)))
 | |
|         return;
 | |
|       protocol->store(buf.ptr(), buf.length(), &my_charset_bin);
 | |
|       break;
 | |
|     }
 | |
|     case INT_RESULT:
 | |
|     {
 | |
|       char buf2[22];
 | |
|       char buf_mem[FN_REFLEN + 22];
 | |
|       String buf(buf_mem, sizeof(buf_mem), system_charset_info);
 | |
|       buf.length(0);
 | |
|       if (user_var_append_name_part(protocol->thd, &buf, name, name_len,
 | |
|                                     m_data_type_name) ||
 | |
|           buf.append(buf2,
 | |
|                  longlong10_to_str(uint8korr(val), buf2,
 | |
|                    (is_unsigned() ? 10 : -10))-buf2))
 | |
|         return;
 | |
|       protocol->store(buf.ptr(), buf.length(), &my_charset_bin);
 | |
|       break;
 | |
|     }
 | |
|     case DECIMAL_RESULT:
 | |
|     {
 | |
|       char buf_mem[FN_REFLEN + DECIMAL_MAX_STR_LENGTH];
 | |
|       String buf(buf_mem, sizeof(buf_mem), system_charset_info);
 | |
|       char buf2[DECIMAL_MAX_STR_LENGTH+1];
 | |
|       String str(buf2, sizeof(buf2), &my_charset_bin);
 | |
|       buf.length(0);
 | |
|       my_decimal((const uchar *) (val + 2), val[0], val[1]).to_string(&str);
 | |
|       if (user_var_append_name_part(protocol->thd, &buf, name, name_len,
 | |
|                                     m_data_type_name) ||
 | |
|           buf.append(str))
 | |
|         return;
 | |
|       protocol->store(buf.ptr(), buf.length(), &my_charset_bin);
 | |
| 
 | |
|       break;
 | |
|     }
 | |
|     case STRING_RESULT:
 | |
|     {
 | |
|       /* 15 is for 'COLLATE' and other chars */
 | |
|       char buf_mem[FN_REFLEN + 512 + 1 + 2*MY_CS_NAME_SIZE+15];
 | |
|       String buf(buf_mem, sizeof(buf_mem), system_charset_info);
 | |
|       CHARSET_INFO *cs;
 | |
|       buf.length(0);
 | |
|       if (!(cs= get_charset(m_charset_number, MYF(0))))
 | |
|       {
 | |
|         if (buf.append(STRING_WITH_LEN("???")))
 | |
|           return;
 | |
|       }
 | |
|       else
 | |
|       {
 | |
|         size_t old_len;
 | |
|         char *beg, *end;
 | |
|         if (user_var_append_name_part(protocol->thd, &buf, name, name_len,
 | |
|                                       m_data_type_name) ||
 | |
|             buf.append('_') ||
 | |
|             buf.append(cs->cs_name) ||
 | |
|             buf.append(' '))
 | |
|           return;
 | |
|         old_len= buf.length();
 | |
|         if (buf.reserve(old_len + val_len * 2 + 3 + sizeof(" COLLATE ") +
 | |
|                         MY_CS_NAME_SIZE))
 | |
|           return;
 | |
|         beg= const_cast<char *>(buf.ptr()) + old_len;
 | |
|         end= str_to_hex(beg, val, val_len);
 | |
|         buf.length(old_len + (end - beg));
 | |
|         if (buf.append(STRING_WITH_LEN(" COLLATE ")) ||
 | |
|             buf.append(cs->coll_name))
 | |
|           return;
 | |
|       }
 | |
|       protocol->store(buf.ptr(), buf.length(), &my_charset_bin);
 | |
|       break;
 | |
|     }
 | |
|     case ROW_RESULT:
 | |
|     default:
 | |
|       DBUG_ASSERT(0);
 | |
|       return;
 | |
|     }
 | |
|   }
 | |
| }
 | |
| #endif // HAVE_REPLICATION
 | |
| 
 | |
| 
 | |
| bool User_var_log_event::write()
 | |
| {
 | |
|   char buf[UV_NAME_LEN_SIZE];
 | |
|   char buf1[UV_VAL_IS_NULL + UV_VAL_TYPE_SIZE + 
 | |
| 	    UV_CHARSET_NUMBER_SIZE + UV_VAL_LEN_SIZE];
 | |
|   uchar buf2[MY_MAX(8, DECIMAL_MAX_FIELD_SIZE + 2)], *pos= buf2;
 | |
|   uint unsigned_len= 0;
 | |
|   uint buf1_length;
 | |
|   size_t event_length;
 | |
| 
 | |
|   int4store(buf, name_len);
 | |
|   
 | |
|   if ((buf1[0]= is_null))
 | |
|   {
 | |
|     buf1_length= 1;
 | |
|     val_len= 0;                                 // Length of 'pos'
 | |
|   }    
 | |
|   else
 | |
|   {
 | |
|     buf1[1]= m_type;
 | |
|     int4store(buf1 + 2, m_charset_number);
 | |
| 
 | |
|     switch (m_type) {
 | |
|     case REAL_RESULT:
 | |
|       float8store(buf2, *(double*) val);
 | |
|       break;
 | |
|     case INT_RESULT:
 | |
|       int8store(buf2, *(longlong*) val);
 | |
|       unsigned_len= 1;
 | |
|       break;
 | |
|     case DECIMAL_RESULT:
 | |
|     {
 | |
|       my_decimal *dec= (my_decimal *)val;
 | |
|       dec->fix_buffer_pointer();
 | |
|       buf2[0]= (char)(dec->intg + dec->frac);
 | |
|       buf2[1]= (char)dec->frac;
 | |
|       decimal2bin((decimal_t*)val, buf2+2, buf2[0], buf2[1]);
 | |
|       val_len= decimal_bin_size(buf2[0], buf2[1]) + 2;
 | |
|       break;
 | |
|     }
 | |
|     case STRING_RESULT:
 | |
|       pos= (uchar*) val;
 | |
|       break;
 | |
|     case ROW_RESULT:
 | |
|     default:
 | |
|       DBUG_ASSERT(0);
 | |
|       return 0;
 | |
|     }
 | |
|     int4store(buf1 + 2 + UV_CHARSET_NUMBER_SIZE, val_len);
 | |
|     buf1_length= 10;
 | |
|   }
 | |
| 
 | |
|   uchar data_type_name_chunk_signature= (uchar) CHUNK_DATA_TYPE_NAME;
 | |
|   uint data_type_name_chunk_signature_length= m_data_type_name.length ? 1 : 0;
 | |
|   uchar data_type_name_length_length= m_data_type_name.length ? 1 : 0;
 | |
| 
 | |
|   /* Length of the whole event */
 | |
|   event_length= sizeof(buf)+ name_len + buf1_length + val_len + unsigned_len +
 | |
|                 data_type_name_chunk_signature_length +
 | |
|                 data_type_name_length_length +
 | |
|                 (uint) m_data_type_name.length;
 | |
| 
 | |
|   uchar unsig= m_is_unsigned ? CHUNK_UNSIGNED : CHUNK_SIGNED;
 | |
|   uchar data_type_name_length= (uchar) m_data_type_name.length;
 | |
|   return write_header(event_length) ||
 | |
|          write_data(buf, sizeof(buf))   ||
 | |
|          write_data(name, name_len)     ||
 | |
|          write_data(buf1, buf1_length) ||
 | |
|          write_data(pos, val_len) ||
 | |
|          write_data(&unsig, unsigned_len) ||
 | |
|          write_data(&data_type_name_chunk_signature,
 | |
|                     data_type_name_chunk_signature_length) ||
 | |
|          write_data(&data_type_name_length, data_type_name_length_length) ||
 | |
|          write_data(m_data_type_name.str, (uint) m_data_type_name.length) ||
 | |
|          write_footer();
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| int User_var_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   Item *it= 0;
 | |
|   CHARSET_INFO *charset;
 | |
|   DBUG_ENTER("User_var_log_event::do_apply_event");
 | |
|   query_id_t sav_query_id= 0; /* memorize orig id when deferred applying */
 | |
| 
 | |
|   if (rgi->deferred_events_collecting)
 | |
|   {
 | |
|     set_deferred(current_thd->query_id);
 | |
|     DBUG_RETURN(rgi->deferred_events->add(this));
 | |
|   }
 | |
|   else if (is_deferred())
 | |
|   {
 | |
|     sav_query_id= current_thd->query_id;
 | |
|     current_thd->query_id= query_id; /* recreating original time context */
 | |
|   }
 | |
| 
 | |
|   if (!(charset= get_charset(m_charset_number, MYF(MY_WME))))
 | |
|   {
 | |
|     rgi->rli->report(ERROR_LEVEL, ER_SLAVE_FATAL_ERROR,
 | |
|                 ER_THD(thd, ER_SLAVE_FATAL_ERROR),
 | |
|                 "Invalid character set for User var event");
 | |
|     DBUG_RETURN(1);
 | |
|   }
 | |
|   LEX_CSTRING user_var_name;
 | |
|   user_var_name.str= name;
 | |
|   user_var_name.length= name_len;
 | |
|   double real_val;
 | |
|   longlong int_val;
 | |
| 
 | |
|   if (is_null)
 | |
|   {
 | |
|     it= new (thd->mem_root) Item_null(thd);
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     switch (m_type) {
 | |
|     case REAL_RESULT:
 | |
|       if (val_len != 8)
 | |
|       {
 | |
|         rgi->rli->report(ERROR_LEVEL, ER_SLAVE_FATAL_ERROR,
 | |
|                     ER_THD(thd, ER_SLAVE_FATAL_ERROR),
 | |
|                     "Invalid variable length at User var event");
 | |
|         return 1;
 | |
|       }
 | |
|       float8get(real_val, val);
 | |
|       it= new (thd->mem_root) Item_float(thd, real_val, 0);
 | |
|       val= (char*) &real_val;		// Pointer to value in native format
 | |
|       val_len= 8;
 | |
|       break;
 | |
|     case INT_RESULT:
 | |
|       if (val_len != 8)
 | |
|       {
 | |
|         rgi->rli->report(ERROR_LEVEL, ER_SLAVE_FATAL_ERROR,
 | |
|                     ER_THD(thd, ER_SLAVE_FATAL_ERROR),
 | |
|                     "Invalid variable length at User var event");
 | |
|         return 1;
 | |
|       }
 | |
|       int_val= (longlong) uint8korr(val);
 | |
|       it= new (thd->mem_root) Item_int(thd, int_val);
 | |
|       val= (char*) &int_val;		// Pointer to value in native format
 | |
|       val_len= 8;
 | |
|       break;
 | |
|     case DECIMAL_RESULT:
 | |
|     {
 | |
|       if (val_len < 3)
 | |
|       {
 | |
|         rgi->rli->report(ERROR_LEVEL, ER_SLAVE_FATAL_ERROR,
 | |
|                     ER_THD(thd, ER_SLAVE_FATAL_ERROR),
 | |
|                     "Invalid variable length at User var event");
 | |
|         return 1;
 | |
|       }
 | |
|       Item_decimal *dec= new (thd->mem_root) Item_decimal(thd, (uchar*) val+2, val[0], val[1]);
 | |
|       it= dec;
 | |
|       val= (char *)dec->val_decimal(NULL);
 | |
|       val_len= sizeof(my_decimal);
 | |
|       break;
 | |
|     }
 | |
|     case STRING_RESULT:
 | |
|       it= new (thd->mem_root) Item_string(thd, val, (uint)val_len, charset);
 | |
|       break;
 | |
|     case ROW_RESULT:
 | |
|     default:
 | |
|       DBUG_ASSERT(0);
 | |
|       DBUG_RETURN(0);
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   Item_func_set_user_var *e= new (thd->mem_root) Item_func_set_user_var(thd, &user_var_name, it);
 | |
|   /*
 | |
|     Item_func_set_user_var can't substitute something else on its place =>
 | |
|     0 can be passed as last argument (reference on item)
 | |
| 
 | |
|     Fix_fields() can fail, in which case a call of update_hash() might
 | |
|     crash the server, so if fix fields fails, we just return with an
 | |
|     error.
 | |
|   */
 | |
|   if (e->fix_fields(thd, 0))
 | |
|     DBUG_RETURN(1);
 | |
| 
 | |
|   const Type_handler *th= Type_handler::handler_by_log_event_data_type(thd,
 | |
|                                                                        *this);
 | |
|   e->update_hash((void*) val, val_len, th, charset);
 | |
| 
 | |
|   if (!is_deferred())
 | |
|     free_root(thd->mem_root, 0);
 | |
|   else
 | |
|     current_thd->query_id= sav_query_id; /* restore current query's context */
 | |
| 
 | |
|   DBUG_RETURN(0);
 | |
| }
 | |
| 
 | |
| int User_var_log_event::do_update_pos(rpl_group_info *rgi)
 | |
| {
 | |
|   rgi->inc_event_relay_log_pos();
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| User_var_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   /*
 | |
|     It is a common error to set the slave skip counter to 1 instead
 | |
|     of 2 when recovering from an insert which used a auto increment,
 | |
|     rand, or user var.  Therefore, if the slave skip counter is 1, we
 | |
|     just say that this event should be skipped by ignoring it, meaning
 | |
|     that we do not change the value of the slave skip counter since it
 | |
|     will be decreased by the following insert event.
 | |
|   */
 | |
|   return continue_group(rgi);
 | |
| }
 | |
| #endif // HAVE_REPLICATION
 | |
| 
 | |
| 
 | |
| #ifdef HAVE_REPLICATION
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Stop_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| /*
 | |
|   The master stopped.  We used to clean up all temporary tables but
 | |
|   this is useless as, as the master has shut down properly, it has
 | |
|   written all DROP TEMPORARY TABLE (prepared statements' deletion is
 | |
|   TODO only when we binlog prep stmts).  We used to clean up
 | |
|   slave_load_tmpdir, but this is useless as it has been cleared at the
 | |
|   end of LOAD DATA INFILE.  So we have nothing to do here.  The place
 | |
|   were we must do this cleaning is in
 | |
|   Start_log_event_v3::do_apply_event(), not here. Because if we come
 | |
|   here, the master was sane.
 | |
| 
 | |
|   This must only be called from the Slave SQL thread, since it calls
 | |
|   Relay_log_info::flush().
 | |
| */
 | |
| 
 | |
| int Stop_log_event::do_update_pos(rpl_group_info *rgi)
 | |
| {
 | |
|   int error= 0;
 | |
|   Relay_log_info *rli= rgi->rli;
 | |
|   DBUG_ENTER("Stop_log_event::do_update_pos");
 | |
|   /*
 | |
|     We do not want to update master_log pos because we get a rotate event
 | |
|     before stop, so by now group_master_log_name is set to the next log.
 | |
|     If we updated it, we will have incorrect master coordinates and this
 | |
|     could give false triggers in MASTER_POS_WAIT() that we have reached
 | |
|     the target position when in fact we have not.
 | |
|   */
 | |
|   if (rli->get_flag(Relay_log_info::IN_TRANSACTION))
 | |
|     rgi->inc_event_relay_log_pos();
 | |
|   else if (!rgi->is_parallel_exec)
 | |
|   {
 | |
|     rpl_global_gtid_slave_state->record_and_update_gtid(thd, rgi);
 | |
|     rli->inc_group_relay_log_pos(0, rgi);
 | |
|     if (rli->flush())
 | |
|       error= 1;
 | |
|   }
 | |
|   DBUG_RETURN(error);
 | |
| }
 | |
| 
 | |
| #endif /* HAVE_REPLICATION */
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Create_file_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| Create_file_log_event::
 | |
| Create_file_log_event(THD* thd_arg, sql_exchange* ex,
 | |
| 		      const char* db_arg, const char* table_name_arg,
 | |
|                       List<Item>& fields_arg,
 | |
|                       bool is_concurrent_arg,
 | |
|                       enum enum_duplicates handle_dup,
 | |
|                       bool ignore,
 | |
| 		      uchar* block_arg, uint block_len_arg, bool using_trans)
 | |
|   :Load_log_event(thd_arg, ex, db_arg, table_name_arg, fields_arg,
 | |
|                   is_concurrent_arg,
 | |
|                   handle_dup, ignore, using_trans),
 | |
|    fake_base(0), block(block_arg), event_buf(0), block_len(block_len_arg),
 | |
|    file_id(thd_arg->file_id = mysql_bin_log.next_file_id())
 | |
| {
 | |
|   DBUG_ENTER("Create_file_log_event");
 | |
|   sql_ex.force_new_format();
 | |
|   DBUG_VOID_RETURN;
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   Create_file_log_event::write_data_body()
 | |
| */
 | |
| 
 | |
| bool Create_file_log_event::write_data_body()
 | |
| {
 | |
|   bool res;
 | |
|   if ((res= Load_log_event::write_data_body()) || fake_base)
 | |
|     return res;
 | |
|   return write_data("", 1) ||
 | |
|          write_data(block, block_len);
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   Create_file_log_event::write_data_header()
 | |
| */
 | |
| 
 | |
| bool Create_file_log_event::write_data_header()
 | |
| {
 | |
|   bool res;
 | |
|   uchar buf[CREATE_FILE_HEADER_LEN];
 | |
|   if ((res= Load_log_event::write_data_header()) || fake_base)
 | |
|     return res;
 | |
|   int4store(buf + CF_FILE_ID_OFFSET, file_id);
 | |
|   return write_data(buf, CREATE_FILE_HEADER_LEN) != 0;
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   Create_file_log_event::write_base()
 | |
| */
 | |
| 
 | |
| bool Create_file_log_event::write_base()
 | |
| {
 | |
|   bool res;
 | |
|   fake_base= 1;                                 // pretend we are Load event
 | |
|   res= write();
 | |
|   fake_base= 0;
 | |
|   return res;
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Create_file_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf[SAFE_NAME_LEN*2 + 30 + 21*2], *pos;
 | |
|   pos= strmov(buf, "db=");
 | |
|   memcpy(pos, db, db_len);
 | |
|   pos= strmov(pos + db_len, ";table=");
 | |
|   memcpy(pos, table_name, table_name_len);
 | |
|   pos= strmov(pos + table_name_len, ";file_id=");
 | |
|   pos= int10_to_str((long) file_id, pos, 10);
 | |
|   pos= strmov(pos, ";block_len=");
 | |
|   pos= int10_to_str((long) block_len, pos, 10);
 | |
|   protocol->store(buf, (uint) (pos-buf), &my_charset_bin);
 | |
| }
 | |
| #endif /* defined(HAVE_REPLICATION) */
 | |
| 
 | |
| 
 | |
| /**
 | |
|   Create_file_log_event::do_apply_event()
 | |
|   Constructor for Create_file_log_event to intantiate an event
 | |
|   from the relay log on the slave.
 | |
| 
 | |
|   @retval
 | |
|     0           Success
 | |
|   @retval
 | |
|     1           Failure
 | |
| */
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| int Create_file_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   char fname_buf[FN_REFLEN];
 | |
|   char *ext;
 | |
|   int fd = -1;
 | |
|   IO_CACHE file;
 | |
|   Log_event_writer lew(&file, 0);
 | |
|   int error = 1;
 | |
|   Relay_log_info const *rli= rgi->rli;
 | |
| 
 | |
|   THD_STAGE_INFO(thd, stage_making_temp_file_create_before_load_data);
 | |
|   bzero((char*)&file, sizeof(file));
 | |
|   ext= slave_load_file_stem(fname_buf, file_id, server_id, ".info",
 | |
|                             &rli->mi->connection_name);
 | |
|   /* old copy may exist already */
 | |
|   mysql_file_delete(key_file_log_event_info, fname_buf, MYF(0));
 | |
|   if ((fd= mysql_file_create(key_file_log_event_info,
 | |
|                              fname_buf, CREATE_MODE,
 | |
|                              O_WRONLY | O_BINARY | O_EXCL | O_NOFOLLOW,
 | |
|                              MYF(MY_WME))) < 0 ||
 | |
|       init_io_cache(&file, fd, IO_SIZE, WRITE_CACHE, (my_off_t)0, 0,
 | |
| 		    MYF(MY_WME|MY_NABP)))
 | |
|   {
 | |
|     rli->report(ERROR_LEVEL, my_errno, rgi->gtid_info(),
 | |
|                 "Error in Create_file event: could not open file '%s'",
 | |
|                 fname_buf);
 | |
|     goto err;
 | |
|   }
 | |
| 
 | |
|   // a trick to avoid allocating another buffer
 | |
|   fname= fname_buf;
 | |
|   fname_len= (uint) (strmov(ext, ".data") - fname);
 | |
|   writer= &lew;
 | |
|   if (write_base())
 | |
|   {
 | |
|     strmov(ext, ".info"); // to have it right in the error message
 | |
|     rli->report(ERROR_LEVEL, my_errno, rgi->gtid_info(),
 | |
|                 "Error in Create_file event: could not write to file '%s'",
 | |
|                 fname_buf);
 | |
|     goto err;
 | |
|   }
 | |
|   end_io_cache(&file);
 | |
|   mysql_file_close(fd, MYF(0));
 | |
| 
 | |
|   // fname_buf now already has .data, not .info, because we did our trick
 | |
|   /* old copy may exist already */
 | |
|   mysql_file_delete(key_file_log_event_data, fname_buf, MYF(0));
 | |
|   if ((fd= mysql_file_create(key_file_log_event_data,
 | |
|                              fname_buf, CREATE_MODE,
 | |
|                              O_WRONLY | O_BINARY | O_EXCL | O_NOFOLLOW,
 | |
|                              MYF(MY_WME))) < 0)
 | |
|   {
 | |
|     rli->report(ERROR_LEVEL, my_errno, rgi->gtid_info(),
 | |
|                 "Error in Create_file event: could not open file '%s'",
 | |
|                 fname_buf);
 | |
|     goto err;
 | |
|   }
 | |
|   if (mysql_file_write(fd, (uchar*) block, block_len, MYF(MY_WME+MY_NABP)))
 | |
|   {
 | |
|     rli->report(ERROR_LEVEL, my_errno, rgi->gtid_info(),
 | |
|                 "Error in Create_file event: write to '%s' failed",
 | |
|                 fname_buf);
 | |
|     goto err;
 | |
|   }
 | |
|   error=0;					// Everything is ok
 | |
| 
 | |
| err:
 | |
|   if (unlikely(error))
 | |
|     end_io_cache(&file);
 | |
|   if (likely(fd >= 0))
 | |
|     mysql_file_close(fd, MYF(0));
 | |
|   return error != 0;
 | |
| }
 | |
| #endif /* defined(HAVE_REPLICATION) */
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Append_block_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| Append_block_log_event::Append_block_log_event(THD *thd_arg,
 | |
|                                                const char *db_arg,
 | |
| 					       uchar *block_arg,
 | |
| 					       uint block_len_arg,
 | |
| 					       bool using_trans)
 | |
|   :Log_event(thd_arg,0, using_trans), block(block_arg),
 | |
|    block_len(block_len_arg), file_id(thd_arg->file_id), db(db_arg)
 | |
| {
 | |
| }
 | |
| 
 | |
| 
 | |
| bool Append_block_log_event::write()
 | |
| {
 | |
|   uchar buf[APPEND_BLOCK_HEADER_LEN];
 | |
|   int4store(buf + AB_FILE_ID_OFFSET, file_id);
 | |
|   return write_header(APPEND_BLOCK_HEADER_LEN + block_len) ||
 | |
|          write_data(buf, APPEND_BLOCK_HEADER_LEN) ||
 | |
|          write_data(block, block_len) ||
 | |
|          write_footer();
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Append_block_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf[256];
 | |
|   uint length;
 | |
|   length= (uint) sprintf(buf, ";file_id=%u;block_len=%u", file_id, block_len);
 | |
|   protocol->store(buf, length, &my_charset_bin);
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   Append_block_log_event::get_create_or_append()
 | |
| */
 | |
| 
 | |
| int Append_block_log_event::get_create_or_append() const
 | |
| {
 | |
|   return 0; /* append to the file, fail if not exists */
 | |
| }
 | |
| 
 | |
| /*
 | |
|   Append_block_log_event::do_apply_event()
 | |
| */
 | |
| 
 | |
| int Append_block_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   char fname[FN_REFLEN];
 | |
|   int fd;
 | |
|   int error = 1;
 | |
|   Relay_log_info const *rli= rgi->rli;
 | |
|   DBUG_ENTER("Append_block_log_event::do_apply_event");
 | |
| 
 | |
|   THD_STAGE_INFO(thd, stage_making_temp_file_append_before_load_data);
 | |
|   slave_load_file_stem(fname, file_id, server_id, ".data",
 | |
|                        &rli->mi->cmp_connection_name);
 | |
|   if (get_create_or_append())
 | |
|   {
 | |
|     /*
 | |
|       Usually lex_start() is called by mysql_parse(), but we need it here
 | |
|       as the present method does not call mysql_parse().
 | |
|     */
 | |
|     lex_start(thd);
 | |
|     thd->reset_for_next_command();
 | |
|     /* old copy may exist already */
 | |
|     mysql_file_delete(key_file_log_event_data, fname, MYF(0));
 | |
|     if ((fd= mysql_file_create(key_file_log_event_data,
 | |
|                                fname, CREATE_MODE,
 | |
|                                O_WRONLY | O_BINARY | O_EXCL | O_NOFOLLOW,
 | |
|                                MYF(MY_WME))) < 0)
 | |
|     {
 | |
|       rli->report(ERROR_LEVEL, my_errno, rgi->gtid_info(),
 | |
|                   "Error in %s event: could not create file '%s'",
 | |
|                   get_type_str(), fname);
 | |
|       goto err;
 | |
|     }
 | |
|   }
 | |
|   else if ((fd= mysql_file_open(key_file_log_event_data,
 | |
|                                 fname,
 | |
|                                 O_WRONLY | O_APPEND | O_BINARY | O_NOFOLLOW,
 | |
|                                 MYF(MY_WME))) < 0)
 | |
|   {
 | |
|     rli->report(ERROR_LEVEL, my_errno, rgi->gtid_info(),
 | |
|                 "Error in %s event: could not open file '%s'",
 | |
|                 get_type_str(), fname);
 | |
|     goto err;
 | |
|   }
 | |
| 
 | |
|   DBUG_EXECUTE_IF("remove_slave_load_file_before_write",
 | |
|                   {
 | |
|                     my_delete(fname, MYF(0));
 | |
|                   });
 | |
| 
 | |
|   if (mysql_file_write(fd, (uchar*) block, block_len, MYF(MY_WME+MY_NABP)))
 | |
|   {
 | |
|     rli->report(ERROR_LEVEL, my_errno, rgi->gtid_info(),
 | |
|                 "Error in %s event: write to '%s' failed",
 | |
|                 get_type_str(), fname);
 | |
|     goto err;
 | |
|   }
 | |
|   error=0;
 | |
| 
 | |
| err:
 | |
|   if (fd >= 0)
 | |
|     mysql_file_close(fd, MYF(0));
 | |
|   DBUG_RETURN(error);
 | |
| }
 | |
| #endif // HAVE_REPLICATION
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Delete_file_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| Delete_file_log_event::Delete_file_log_event(THD *thd_arg, const char* db_arg,
 | |
| 					     bool using_trans)
 | |
|   :Log_event(thd_arg, 0, using_trans), file_id(thd_arg->file_id), db(db_arg)
 | |
| {
 | |
| }
 | |
| 
 | |
| 
 | |
| bool Delete_file_log_event::write()
 | |
| {
 | |
|  uchar buf[DELETE_FILE_HEADER_LEN];
 | |
|  int4store(buf + DF_FILE_ID_OFFSET, file_id);
 | |
|  return write_header(sizeof(buf)) ||
 | |
|         write_data(buf, sizeof(buf)) ||
 | |
|         write_footer();
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Delete_file_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf[64];
 | |
|   uint length;
 | |
|   length= (uint) sprintf(buf, ";file_id=%u", (uint) file_id);
 | |
|   protocol->store(buf, (int32) length, &my_charset_bin);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| int Delete_file_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   char fname[FN_REFLEN+10];
 | |
|   Relay_log_info const *rli= rgi->rli;
 | |
|   char *ext= slave_load_file_stem(fname, file_id, server_id, ".data",
 | |
|                                   &rli->mi->cmp_connection_name);
 | |
|   mysql_file_delete(key_file_log_event_data, fname, MYF(MY_WME));
 | |
|   strmov(ext, ".info");
 | |
|   mysql_file_delete(key_file_log_event_info, fname, MYF(MY_WME));
 | |
|   return 0;
 | |
| }
 | |
| #endif /* defined(HAVE_REPLICATION) */
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Execute_load_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| Execute_load_log_event::Execute_load_log_event(THD *thd_arg,
 | |
|                                                const char* db_arg,
 | |
| 					       bool using_trans)
 | |
|   :Log_event(thd_arg, 0, using_trans), file_id(thd_arg->file_id), db(db_arg)
 | |
| {
 | |
| }
 | |
|   
 | |
| 
 | |
| bool Execute_load_log_event::write()
 | |
| {
 | |
|   uchar buf[EXEC_LOAD_HEADER_LEN];
 | |
|   int4store(buf + EL_FILE_ID_OFFSET, file_id);
 | |
|   return write_header(sizeof(buf)) ||
 | |
|          write_data(buf, sizeof(buf)) ||
 | |
|          write_footer();
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Execute_load_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf[64];
 | |
|   uint length;
 | |
|   length= (uint) sprintf(buf, ";file_id=%u", (uint) file_id);
 | |
|   protocol->store(buf, (int32) length, &my_charset_bin);
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   Execute_load_log_event::do_apply_event()
 | |
| */
 | |
| 
 | |
| int Execute_load_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   char fname[FN_REFLEN+10];
 | |
|   char *ext;
 | |
|   int fd;
 | |
|   int error= 1, read_error;
 | |
|   IO_CACHE file;
 | |
|   Load_log_event *lev= 0;
 | |
|   Relay_log_info const *rli= rgi->rli;
 | |
| 
 | |
|   ext= slave_load_file_stem(fname, file_id, server_id, ".info",
 | |
|                             &rli->mi->cmp_connection_name);
 | |
|   if ((fd= mysql_file_open(key_file_log_event_info,
 | |
|                            fname, O_RDONLY | O_BINARY | O_NOFOLLOW,
 | |
|                            MYF(MY_WME))) < 0 ||
 | |
|       init_io_cache(&file, fd, IO_SIZE, READ_CACHE, (my_off_t)0, 0,
 | |
| 		    MYF(MY_WME|MY_NABP)))
 | |
|   {
 | |
|     rli->report(ERROR_LEVEL, my_errno, rgi->gtid_info(),
 | |
|                 "Error in Exec_load event: could not open file '%s'",
 | |
|                 fname);
 | |
|     goto err;
 | |
|   }
 | |
|   if (!(lev= (Load_log_event*)
 | |
|         Log_event::read_log_event(&file, &read_error,
 | |
|                                   rli->relay_log.description_event_for_exec,
 | |
|                                   opt_slave_sql_verify_checksum)) ||
 | |
|       lev->get_type_code() != NEW_LOAD_EVENT)
 | |
|   {
 | |
|     rli->report(ERROR_LEVEL, 0, rgi->gtid_info(), "Error in Exec_load event: "
 | |
|                     "file '%s' appears corrupted", fname);
 | |
|     goto err;
 | |
|   }
 | |
|   lev->thd = thd;
 | |
|   /*
 | |
|     lev->do_apply_event should use rli only for errors i.e. should
 | |
|     not advance rli's position.
 | |
| 
 | |
|     lev->do_apply_event is the place where the table is loaded (it
 | |
|     calls mysql_load()).
 | |
|   */
 | |
| 
 | |
|   if (lev->do_apply_event(0,rgi,1)) 
 | |
|   {
 | |
|     /*
 | |
|       We want to indicate the name of the file that could not be loaded
 | |
|       (SQL_LOADxxx).
 | |
|       But as we are here we are sure the error is in rli->last_slave_error and
 | |
|       rli->last_slave_errno (example of error: duplicate entry for key), so we
 | |
|       don't want to overwrite it with the filename.
 | |
|       What we want instead is add the filename to the current error message.
 | |
|     */
 | |
|     char *tmp= my_strdup(PSI_INSTRUMENT_ME, rli->last_error().message, MYF(MY_WME));
 | |
|     if (tmp)
 | |
|     {
 | |
|       rli->report(ERROR_LEVEL, rli->last_error().number, rgi->gtid_info(),
 | |
|                   "%s. Failed executing load from '%s'", tmp, fname);
 | |
|       my_free(tmp);
 | |
|     }
 | |
|     goto err;
 | |
|   }
 | |
|   /*
 | |
|     We have an open file descriptor to the .info file; we need to close it
 | |
|     or Windows will refuse to delete the file in mysql_file_delete().
 | |
|   */
 | |
|   if (fd >= 0)
 | |
|   {
 | |
|     mysql_file_close(fd, MYF(0));
 | |
|     end_io_cache(&file);
 | |
|     fd= -1;
 | |
|   }
 | |
|   mysql_file_delete(key_file_log_event_info, fname, MYF(MY_WME));
 | |
|   memcpy(ext, ".data", 6);
 | |
|   mysql_file_delete(key_file_log_event_data, fname, MYF(MY_WME));
 | |
|   error = 0;
 | |
| 
 | |
| err:
 | |
|   delete lev;
 | |
|   if (fd >= 0)
 | |
|   {
 | |
|     mysql_file_close(fd, MYF(0));
 | |
|     end_io_cache(&file);
 | |
|   }
 | |
|   return error;
 | |
| }
 | |
| 
 | |
| #endif /* defined(HAVE_REPLICATION) */
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Begin_load_query_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| Begin_load_query_log_event::
 | |
| Begin_load_query_log_event(THD* thd_arg, const char* db_arg, uchar* block_arg,
 | |
|                            uint block_len_arg, bool using_trans)
 | |
|   :Append_block_log_event(thd_arg, db_arg, block_arg, block_len_arg,
 | |
|                           using_trans)
 | |
| {
 | |
|    file_id= thd_arg->file_id= mysql_bin_log.next_file_id();
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined( HAVE_REPLICATION)
 | |
| int Begin_load_query_log_event::get_create_or_append() const
 | |
| {
 | |
|   return 1; /* create the file */
 | |
| }
 | |
| 
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Begin_load_query_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   /*
 | |
|     If the slave skip counter is 1, then we should not start executing
 | |
|     on the next event.
 | |
|   */
 | |
|   return continue_group(rgi);
 | |
| }
 | |
| #endif /* defined( HAVE_REPLICATION) */
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Execute_load_query_log_event methods
 | |
| **************************************************************************/
 | |
| 
 | |
| Execute_load_query_log_event::
 | |
| Execute_load_query_log_event(THD *thd_arg, const char* query_arg,
 | |
|                              ulong query_length_arg, uint fn_pos_start_arg,
 | |
|                              uint fn_pos_end_arg,
 | |
|                              enum_load_dup_handling dup_handling_arg,
 | |
|                              bool using_trans, bool direct, bool suppress_use,
 | |
|                              int errcode):
 | |
|   Query_log_event(thd_arg, query_arg, query_length_arg, using_trans, direct,
 | |
|                   suppress_use, errcode),
 | |
|   file_id(thd_arg->file_id), fn_pos_start(fn_pos_start_arg),
 | |
|   fn_pos_end(fn_pos_end_arg), dup_handling(dup_handling_arg)
 | |
| {
 | |
| }
 | |
| 
 | |
| 
 | |
| bool
 | |
| Execute_load_query_log_event::write_post_header_for_derived()
 | |
| {
 | |
|   uchar buf[EXECUTE_LOAD_QUERY_EXTRA_HEADER_LEN];
 | |
|   int4store(buf, file_id);
 | |
|   int4store(buf + 4, fn_pos_start);
 | |
|   int4store(buf + 4 + 4, fn_pos_end);
 | |
|   *(buf + 4 + 4 + 4)= (uchar) dup_handling;
 | |
|   return write_data(buf, EXECUTE_LOAD_QUERY_EXTRA_HEADER_LEN);
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Execute_load_query_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf_mem[1024];
 | |
|   String buf(buf_mem, sizeof(buf_mem), system_charset_info);
 | |
|   buf.real_alloc(9 + db_len + q_len + 10 + 21);
 | |
|   if (db && db_len)
 | |
|   {
 | |
|     if (buf.append(STRING_WITH_LEN("use ")) ||
 | |
|         append_identifier(protocol->thd, &buf, db, db_len) ||
 | |
|         buf.append(STRING_WITH_LEN("; ")))
 | |
|       return;
 | |
|   }
 | |
|   if (query && q_len && buf.append(query, q_len))
 | |
|     return;
 | |
|   if (buf.append(STRING_WITH_LEN(" ;file_id=")) ||
 | |
|       buf.append_ulonglong(file_id))
 | |
|     return;
 | |
|   protocol->store(buf.ptr(), buf.length(), &my_charset_bin);
 | |
| }
 | |
| 
 | |
| 
 | |
| int
 | |
| Execute_load_query_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   char *p;
 | |
|   char *buf;
 | |
|   char *fname;
 | |
|   char *fname_end;
 | |
|   int error;
 | |
|   Relay_log_info const *rli= rgi->rli;
 | |
| 
 | |
|   buf= (char*) my_malloc(PSI_INSTRUMENT_ME, q_len + 1 -
 | |
|      (fn_pos_end - fn_pos_start) + (FN_REFLEN + 10) + 10 + 8 + 5, MYF(MY_WME));
 | |
| 
 | |
|   DBUG_EXECUTE_IF("LOAD_DATA_INFILE_has_fatal_error", my_free(buf); buf= NULL;);
 | |
| 
 | |
|   /* Replace filename and LOCAL keyword in query before executing it */
 | |
|   if (buf == NULL)
 | |
|   {
 | |
|     rli->report(ERROR_LEVEL, ER_SLAVE_FATAL_ERROR, rgi->gtid_info(),
 | |
|                 ER_THD(rgi->thd, ER_SLAVE_FATAL_ERROR), "Not enough memory");
 | |
|     return 1;
 | |
|   }
 | |
| 
 | |
|   p= buf;
 | |
|   memcpy(p, query, fn_pos_start);
 | |
|   p+= fn_pos_start;
 | |
|   fname= (p= strmake(p, STRING_WITH_LEN(" INFILE \'")));
 | |
|   p= slave_load_file_stem(p, file_id, server_id, ".data",
 | |
|                           &rli->mi->cmp_connection_name);
 | |
|   fname_end= p= strend(p);                      // Safer than p=p+5
 | |
|   *(p++)='\'';
 | |
|   switch (dup_handling) {
 | |
|   case LOAD_DUP_IGNORE:
 | |
|     p= strmake(p, STRING_WITH_LEN(" IGNORE"));
 | |
|     break;
 | |
|   case LOAD_DUP_REPLACE:
 | |
|     p= strmake(p, STRING_WITH_LEN(" REPLACE"));
 | |
|     break;
 | |
|   default:
 | |
|     /* Ordinary load data */
 | |
|     break;
 | |
|   }
 | |
|   p= strmake(p, STRING_WITH_LEN(" INTO "));
 | |
|   p= strmake(p, query+fn_pos_end, q_len-fn_pos_end);
 | |
| 
 | |
|   error= Query_log_event::do_apply_event(rgi, buf, (uint32)(p-buf));
 | |
| 
 | |
|   /* Forging file name for deletion in same buffer */
 | |
|   *fname_end= 0;
 | |
| 
 | |
|   /*
 | |
|     If there was an error the slave is going to stop, leave the
 | |
|     file so that we can re-execute this event at START SLAVE.
 | |
|   */
 | |
|   if (unlikely(!error))
 | |
|     mysql_file_delete(key_file_log_event_data, fname, MYF(MY_WME));
 | |
| 
 | |
|   my_free(buf);
 | |
|   return error;
 | |
| }
 | |
| #endif // HAVE_REPLICATION
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
| 	sql_ex_info methods
 | |
| **************************************************************************/
 | |
| 
 | |
| static bool write_str(Log_event_writer *writer, const char *str, uint length)
 | |
| {
 | |
|   uchar tmp[1];
 | |
|   tmp[0]= (uchar) length;
 | |
|   return (writer->write_data(tmp, sizeof(tmp)) ||
 | |
| 	  writer->write_data((uchar*) str, length));
 | |
| }
 | |
| 
 | |
| bool sql_ex_info::write_data(Log_event_writer *writer)
 | |
| {
 | |
|   if (new_format())
 | |
|   {
 | |
|     return write_str(writer, field_term, field_term_len) ||
 | |
| 	   write_str(writer, enclosed,   enclosed_len) ||
 | |
| 	   write_str(writer, line_term,  line_term_len) ||
 | |
| 	   write_str(writer, line_start, line_start_len) ||
 | |
| 	   write_str(writer, escaped,    escaped_len) ||
 | |
| 	   writer->write_data((uchar*) &opt_flags, 1);
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     uchar old_ex[7];
 | |
|     old_ex[0]= *field_term;
 | |
|     old_ex[1]= *enclosed;
 | |
|     old_ex[2]= *line_term;
 | |
|     old_ex[3]= *line_start;
 | |
|     old_ex[4]= *escaped;
 | |
|     old_ex[5]=  opt_flags;
 | |
|     old_ex[6]=  empty_flags;
 | |
|     return writer->write_data(old_ex, sizeof(old_ex));
 | |
|   }
 | |
| }
 | |
| 
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Rows_log_event member functions
 | |
| **************************************************************************/
 | |
| 
 | |
| Rows_log_event::Rows_log_event(THD *thd_arg, TABLE *tbl_arg,
 | |
|                                ulonglong table_id,
 | |
|                                MY_BITMAP const *cols, bool is_transactional,
 | |
|                                Log_event_type event_type)
 | |
|   : Log_event(thd_arg, 0, is_transactional),
 | |
|     m_row_count(0),
 | |
|     m_table(tbl_arg),
 | |
|     m_table_id(table_id),
 | |
|     m_width(tbl_arg ? tbl_arg->s->fields : 1),
 | |
|     m_rows_buf(0), m_rows_cur(0), m_rows_end(0), m_flags(0),
 | |
|     m_type(event_type), m_extra_row_data(0)
 | |
| #ifdef HAVE_REPLICATION
 | |
|     , m_curr_row(NULL), m_curr_row_end(NULL),
 | |
|     m_key(NULL), m_key_info(NULL), m_key_nr(0),
 | |
|     master_had_triggers(0)
 | |
| #endif
 | |
| {
 | |
|   /*
 | |
|     We allow a special form of dummy event when the table, and cols
 | |
|     are null and the table id is UINT32_MAX.  This is a temporary
 | |
|     solution, to be able to terminate a started statement in the
 | |
|     binary log: the extraneous events will be removed in the future.
 | |
|    */
 | |
|   DBUG_ASSERT((tbl_arg && tbl_arg->s &&
 | |
|                (table_id & MAX_TABLE_MAP_ID) != UINT32_MAX) ||
 | |
|               (!tbl_arg && !cols && (table_id & MAX_TABLE_MAP_ID) == UINT32_MAX));
 | |
| 
 | |
|   if (thd_arg->variables.option_bits & OPTION_NO_FOREIGN_KEY_CHECKS)
 | |
|     set_flags(NO_FOREIGN_KEY_CHECKS_F);
 | |
|   if (thd_arg->variables.option_bits & OPTION_RELAXED_UNIQUE_CHECKS)
 | |
|     set_flags(RELAXED_UNIQUE_CHECKS_F);
 | |
|   if (thd_arg->variables.option_bits & OPTION_NO_CHECK_CONSTRAINT_CHECKS)
 | |
|     set_flags(NO_CHECK_CONSTRAINT_CHECKS_F);
 | |
|   /* if my_bitmap_init fails, caught in is_valid() */
 | |
|   if (likely(!my_bitmap_init(&m_cols,
 | |
|                              m_width <= sizeof(m_bitbuf)*8 ? m_bitbuf : NULL,
 | |
|                              m_width,
 | |
|                              false)))
 | |
|   {
 | |
|     /* Cols can be zero if this is a dummy binrows event */
 | |
|     if (likely(cols != NULL))
 | |
|       bitmap_copy(&m_cols, cols);
 | |
|   }
 | |
| }
 | |
| 
 | |
| 
 | |
| int Rows_log_event::do_add_row_data(uchar *row_data, size_t length)
 | |
| {
 | |
|   /*
 | |
|     When the table has a primary key, we would probably want, by default, to
 | |
|     log only the primary key value instead of the entire "before image". This
 | |
|     would save binlog space. TODO
 | |
|   */
 | |
|   DBUG_ENTER("Rows_log_event::do_add_row_data");
 | |
|   DBUG_PRINT("enter", ("row_data:%p  length: %lu", row_data,
 | |
|                        (ulong) length));
 | |
| 
 | |
|   /*
 | |
|     If length is zero, there is nothing to write, so we just
 | |
|     return. Note that this is not an optimization, since calling
 | |
|     realloc() with size 0 means free().
 | |
|    */
 | |
|   if (length == 0)
 | |
|   {
 | |
|     m_row_count++;
 | |
|     DBUG_RETURN(0);
 | |
|   }
 | |
| 
 | |
|   /*
 | |
|     Don't print debug messages when running valgrind since they can
 | |
|     trigger false warnings.
 | |
|    */
 | |
| #ifndef HAVE_valgrind
 | |
|   DBUG_DUMP("row_data", row_data, MY_MIN(length, 32));
 | |
| #endif
 | |
| 
 | |
|   DBUG_ASSERT(m_rows_buf <= m_rows_cur);
 | |
|   DBUG_ASSERT(!m_rows_buf || (m_rows_end && m_rows_buf < m_rows_end));
 | |
|   DBUG_ASSERT(m_rows_cur <= m_rows_end);
 | |
| 
 | |
|   /* The cast will always work since m_rows_cur <= m_rows_end */
 | |
|   if (static_cast<size_t>(m_rows_end - m_rows_cur) <= length)
 | |
|   {
 | |
|     size_t const block_size= 1024;
 | |
|     size_t cur_size= m_rows_cur - m_rows_buf;
 | |
|     DBUG_EXECUTE_IF("simulate_too_big_row_case1",
 | |
|                      cur_size= UINT_MAX32 - (block_size * 10);
 | |
|                      length= UINT_MAX32 - (block_size * 10););
 | |
|     DBUG_EXECUTE_IF("simulate_too_big_row_case2",
 | |
|                      cur_size= UINT_MAX32 - (block_size * 10);
 | |
|                      length= block_size * 10;);
 | |
|     DBUG_EXECUTE_IF("simulate_too_big_row_case3",
 | |
|                      cur_size= block_size * 10;
 | |
|                      length= UINT_MAX32 - (block_size * 10););
 | |
|     DBUG_EXECUTE_IF("simulate_too_big_row_case4",
 | |
|                      cur_size= UINT_MAX32 - (block_size * 10);
 | |
|                      length= (block_size * 10) - block_size + 1;);
 | |
|     size_t remaining_space= UINT_MAX32 - cur_size;
 | |
|     /* Check that the new data fits within remaining space and we can add
 | |
|        block_size without wrapping.
 | |
|      */
 | |
|     if (cur_size > UINT_MAX32 || length > remaining_space ||
 | |
|         ((length + block_size) > remaining_space))
 | |
|     {
 | |
|       sql_print_error("The row data is greater than 4GB, which is too big to "
 | |
|                       "write to the binary log.");
 | |
|       DBUG_RETURN(ER_BINLOG_ROW_LOGGING_FAILED);
 | |
|     }
 | |
|     size_t const new_alloc= 
 | |
|         block_size * ((cur_size + length + block_size - 1) / block_size);
 | |
| 
 | |
|     uchar* const new_buf= (uchar*)my_realloc(PSI_INSTRUMENT_ME, m_rows_buf,
 | |
|                                     new_alloc, MYF(MY_ALLOW_ZERO_PTR|MY_WME));
 | |
|     if (unlikely(!new_buf))
 | |
|       DBUG_RETURN(HA_ERR_OUT_OF_MEM);
 | |
| 
 | |
|     /* If the memory moved, we need to move the pointers */
 | |
|     if (new_buf != m_rows_buf)
 | |
|     {
 | |
|       m_rows_buf= new_buf;
 | |
|       m_rows_cur= m_rows_buf + cur_size;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|        The end pointer should always be changed to point to the end of
 | |
|        the allocated memory.
 | |
|     */
 | |
|     m_rows_end= m_rows_buf + new_alloc;
 | |
|   }
 | |
| 
 | |
|   DBUG_ASSERT(m_rows_cur + length <= m_rows_end);
 | |
|   memcpy(m_rows_cur, row_data, length);
 | |
|   m_rows_cur+= length;
 | |
|   m_row_count++;
 | |
|   DBUG_RETURN(0);
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| /**
 | |
|   Restores empty table list as it was before trigger processing.
 | |
| 
 | |
|   @note We have a lot of ASSERTS that check the lists when we close tables.
 | |
|   There was the same problem with MERGE MYISAM tables and so here we try to
 | |
|   go the same way.
 | |
| */
 | |
| inline void restore_empty_query_table_list(LEX *lex)
 | |
| {
 | |
|   if (lex->first_not_own_table())
 | |
|       (*lex->first_not_own_table()->prev_global)= NULL;
 | |
|   lex->query_tables= NULL;
 | |
|   lex->query_tables_last= &lex->query_tables;
 | |
| }
 | |
| 
 | |
| 
 | |
| int Rows_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   Relay_log_info const *rli= rgi->rli;
 | |
|   TABLE* table;
 | |
|   DBUG_ENTER("Rows_log_event::do_apply_event(Relay_log_info*)");
 | |
|   int error= 0;
 | |
|   LEX *lex= thd->lex;
 | |
|   uint8 new_trg_event_map= get_trg_event_map();
 | |
|   /*
 | |
|     If m_table_id == UINT32_MAX, then we have a dummy event that does not
 | |
|     contain any data.  In that case, we just remove all tables in the
 | |
|     tables_to_lock list, close the thread tables, and return with
 | |
|     success.
 | |
|    */
 | |
|   if (m_table_id == UINT32_MAX)
 | |
|   {
 | |
|     /*
 | |
|        This one is supposed to be set: just an extra check so that
 | |
|        nothing strange has happened.
 | |
|      */
 | |
|     DBUG_ASSERT(get_flags(STMT_END_F));
 | |
| 
 | |
|     rgi->slave_close_thread_tables(thd);
 | |
|     thd->clear_error();
 | |
|     DBUG_RETURN(0);
 | |
|   }
 | |
| 
 | |
|   /*
 | |
|     'thd' has been set by exec_relay_log_event(), just before calling
 | |
|     do_apply_event(). We still check here to prevent future coding
 | |
|     errors.
 | |
|   */
 | |
|   DBUG_ASSERT(rgi->thd == thd);
 | |
| 
 | |
|   /*
 | |
|     If there is no locks taken, this is the first binrow event seen
 | |
|     after the table map events.  We should then lock all the tables
 | |
|     used in the transaction and proceed with execution of the actual
 | |
|     event.
 | |
|   */
 | |
|   if (!thd->lock)
 | |
|   {
 | |
|     /*
 | |
|       Lock_tables() reads the contents of thd->lex, so they must be
 | |
|       initialized.
 | |
| 
 | |
|       We also call the THD::reset_for_next_command(), since this
 | |
|       is the logical start of the next "statement". Note that this
 | |
|       call might reset the value of current_stmt_binlog_format, so
 | |
|       we need to do any changes to that value after this function.
 | |
|     */
 | |
|     delete_explain_query(thd->lex);
 | |
|     lex_start(thd);
 | |
|     thd->reset_for_next_command();
 | |
|     /*
 | |
|       The current statement is just about to begin and 
 | |
|       has not yet modified anything. Note, all.modified is reset
 | |
|       by THD::reset_for_next_command().
 | |
|     */
 | |
|     thd->transaction->stmt.modified_non_trans_table= FALSE;
 | |
|     thd->transaction->stmt.m_unsafe_rollback_flags&= ~THD_TRANS::DID_WAIT;
 | |
|     /*
 | |
|       This is a row injection, so we flag the "statement" as
 | |
|       such. Note that this code is called both when the slave does row
 | |
|       injections and when the BINLOG statement is used to do row
 | |
|       injections.
 | |
|     */
 | |
|     thd->lex->set_stmt_row_injection();
 | |
| 
 | |
|     /*
 | |
|       There are a few flags that are replicated with each row event.
 | |
|       Make sure to set/clear them before executing the main body of
 | |
|       the event.
 | |
|     */
 | |
|     if (get_flags(NO_FOREIGN_KEY_CHECKS_F))
 | |
|         thd->variables.option_bits|= OPTION_NO_FOREIGN_KEY_CHECKS;
 | |
|     else
 | |
|         thd->variables.option_bits&= ~OPTION_NO_FOREIGN_KEY_CHECKS;
 | |
| 
 | |
|     if (get_flags(RELAXED_UNIQUE_CHECKS_F))
 | |
|         thd->variables.option_bits|= OPTION_RELAXED_UNIQUE_CHECKS;
 | |
|     else
 | |
|         thd->variables.option_bits&= ~OPTION_RELAXED_UNIQUE_CHECKS;
 | |
| 
 | |
|     if (get_flags(NO_CHECK_CONSTRAINT_CHECKS_F))
 | |
|       thd->variables.option_bits|= OPTION_NO_CHECK_CONSTRAINT_CHECKS;
 | |
|     else
 | |
|       thd->variables.option_bits&= ~OPTION_NO_CHECK_CONSTRAINT_CHECKS;
 | |
| 
 | |
|     /* A small test to verify that objects have consistent types */
 | |
|     DBUG_ASSERT(sizeof(thd->variables.option_bits) == sizeof(OPTION_RELAXED_UNIQUE_CHECKS));
 | |
| 
 | |
|     DBUG_EXECUTE_IF("rows_log_event_before_open_table",
 | |
|                     {
 | |
|                       const char action[] = "now SIGNAL before_open_table WAIT_FOR go_ahead_sql";
 | |
|                       DBUG_ASSERT(!debug_sync_set_action(thd, STRING_WITH_LEN(action)));
 | |
|                     };);
 | |
| 
 | |
| 
 | |
|     /*
 | |
|       Trigger's procedures work with global table list. So we have to add
 | |
|       rgi->tables_to_lock content there to get trigger's in the list.
 | |
| 
 | |
|       Then restore_empty_query_table_list() restore the list as it was
 | |
|     */
 | |
|     DBUG_ASSERT(lex->query_tables == NULL);
 | |
|     if ((lex->query_tables= rgi->tables_to_lock))
 | |
|       rgi->tables_to_lock->prev_global= &lex->query_tables;
 | |
| 
 | |
|     for (TABLE_LIST *tables= rgi->tables_to_lock; tables;
 | |
|          tables= tables->next_global)
 | |
|     {
 | |
|       if (slave_run_triggers_for_rbr)
 | |
|       {
 | |
|         tables->trg_event_map= new_trg_event_map;
 | |
|         lex->query_tables_last= &tables->next_global;
 | |
|       }
 | |
|       else
 | |
|       {
 | |
|         tables->slave_fk_event_map= new_trg_event_map;
 | |
|         lex->query_tables_last= &tables->next_global;
 | |
|       }
 | |
|     }
 | |
|     if (unlikely(open_and_lock_tables(thd, rgi->tables_to_lock, FALSE, 0)))
 | |
|     {
 | |
| #ifdef WITH_WSREP
 | |
|       if (WSREP(thd) && !thd->slave_thread)
 | |
|       {
 | |
|         WSREP_WARN("BF applier thread=%lu failed to open_and_lock_tables for "
 | |
|                    "%s, fatal: %d "
 | |
|                    "wsrep = (exec_mode: %d conflict_state: %d seqno: %lld)",
 | |
|                    thd_get_thread_id(thd),
 | |
|                    thd->get_stmt_da()->message(),
 | |
|                    thd->is_fatal_error,
 | |
|                    thd->wsrep_cs().mode(),
 | |
|                    thd->wsrep_trx().state(),
 | |
|                    wsrep_thd_trx_seqno(thd));
 | |
|       }
 | |
| #endif /* WITH_WSREP */
 | |
|       if (thd->is_error() &&
 | |
|           !is_parallel_retry_error(rgi, error= thd->get_stmt_da()->sql_errno()))
 | |
|       {
 | |
|         /*
 | |
|           Error reporting borrowed from Query_log_event with many excessive
 | |
|           simplifications.
 | |
|           We should not honour --slave-skip-errors at this point as we are
 | |
|           having severe errors which should not be skipped.
 | |
|         */
 | |
|         rli->report(ERROR_LEVEL, error, rgi->gtid_info(),
 | |
|                     "Error executing row event: '%s'",
 | |
|                     (error ? thd->get_stmt_da()->message() :
 | |
|                      "unexpected success or fatal error"));
 | |
|         thd->is_slave_error= 1;
 | |
|       }
 | |
|       /* remove trigger's tables */
 | |
|       goto err;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|       When the open and locking succeeded, we check all tables to
 | |
|       ensure that they still have the correct type.
 | |
|     */
 | |
| 
 | |
|     {
 | |
|       DBUG_PRINT("debug", ("Checking compatibility of tables to lock - tables_to_lock: %p",
 | |
|                            rgi->tables_to_lock));
 | |
| 
 | |
|       /**
 | |
|         When using RBR and MyISAM MERGE tables the base tables that make
 | |
|         up the MERGE table can be appended to the list of tables to lock.
 | |
|   
 | |
|         Thus, we just check compatibility for those that tables that have
 | |
|         a correspondent table map event (ie, those that are actually going
 | |
|         to be accessed while applying the event). That's why the loop stops
 | |
|         at rli->tables_to_lock_count .
 | |
| 
 | |
|         NOTE: The base tables are added here are removed when 
 | |
|               close_thread_tables is called.
 | |
|        */
 | |
|       TABLE_LIST *table_list_ptr= rgi->tables_to_lock;
 | |
|       for (uint i=0 ; table_list_ptr && (i < rgi->tables_to_lock_count);
 | |
|            table_list_ptr= table_list_ptr->next_global, i++)
 | |
|       {
 | |
|         /*
 | |
|           Below if condition takes care of skipping base tables that
 | |
|           make up the MERGE table (which are added by open_tables()
 | |
|           call). They are added next to the merge table in the list.
 | |
|           For eg: If RPL_TABLE_LIST is t3->t1->t2 (where t1 and t2
 | |
|           are base tables for merge table 't3'), open_tables will modify
 | |
|           the list by adding t1 and t2 again immediately after t3 in the
 | |
|           list (*not at the end of the list*). New table_to_lock list will
 | |
|           look like t3->t1'->t2'->t1->t2 (where t1' and t2' are TABLE_LIST
 | |
|           objects added by open_tables() call). There is no flag(or logic) in
 | |
|           open_tables() that can skip adding these base tables to the list.
 | |
|           So the logic here should take care of skipping them.
 | |
| 
 | |
|           tables_to_lock_count logic will take care of skipping base tables
 | |
|           that are added at the end of the list.
 | |
|           For eg: If RPL_TABLE_LIST is t1->t2->t3, open_tables will modify
 | |
|           the list into t1->t2->t3->t1'->t2'. t1' and t2' will be skipped
 | |
|           because tables_to_lock_count logic in this for loop.
 | |
|         */
 | |
|         if (table_list_ptr->parent_l)
 | |
|           continue;
 | |
|         /*
 | |
|           We can use a down cast here since we know that every table added
 | |
|           to the tables_to_lock is a RPL_TABLE_LIST (or child table which is
 | |
|           skipped above).
 | |
|         */
 | |
|         RPL_TABLE_LIST *ptr= static_cast<RPL_TABLE_LIST*>(table_list_ptr);
 | |
|         DBUG_ASSERT(ptr->m_tabledef_valid);
 | |
|         TABLE *conv_table;
 | |
|         if (!ptr->m_tabledef.compatible_with(thd, rgi, ptr->table, &conv_table))
 | |
|         {
 | |
|           DBUG_PRINT("debug", ("Table: %s.%s is not compatible with master",
 | |
|                                ptr->table->s->db.str,
 | |
|                                ptr->table->s->table_name.str));
 | |
|           /*
 | |
|             We should not honour --slave-skip-errors at this point as we are
 | |
|             having severe errors which should not be skiped.
 | |
|           */
 | |
|           thd->is_slave_error= 1;
 | |
|           /* remove trigger's tables */
 | |
|           error= ERR_BAD_TABLE_DEF;
 | |
|           goto err;
 | |
|         }
 | |
|         DBUG_PRINT("debug", ("Table: %s.%s is compatible with master"
 | |
|                              " - conv_table: %p",
 | |
|                              ptr->table->s->db.str,
 | |
|                              ptr->table->s->table_name.str, conv_table));
 | |
|         ptr->m_conv_table= conv_table;
 | |
|       }
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|       ... and then we add all the tables to the table map and but keep
 | |
|       them in the tables to lock list.
 | |
| 
 | |
|       We also invalidate the query cache for all the tables, since
 | |
|       they will now be changed.
 | |
| 
 | |
|       TODO [/Matz]: Maybe the query cache should not be invalidated
 | |
|       here? It might be that a table is not changed, even though it
 | |
|       was locked for the statement.  We do know that each
 | |
|       Rows_log_event contain at least one row, so after processing one
 | |
|       Rows_log_event, we can invalidate the query cache for the
 | |
|       associated table.
 | |
|      */
 | |
|     TABLE_LIST *ptr= rgi->tables_to_lock;
 | |
|     for (uint i=0 ;  ptr && (i < rgi->tables_to_lock_count); ptr= ptr->next_global, i++)
 | |
|     {
 | |
|       /*
 | |
|         Please see comment in above 'for' loop to know the reason
 | |
|         for this if condition
 | |
|       */
 | |
|       if (ptr->parent_l)
 | |
|         continue;
 | |
|       rgi->m_table_map.set_table(ptr->table_id, ptr->table);
 | |
|       /*
 | |
|         Following is passing flag about triggers on the server. The problem was
 | |
|         to pass it between table map event and row event. I do it via extended
 | |
|         TABLE_LIST (RPL_TABLE_LIST) but row event uses only TABLE so I need to
 | |
|         find somehow the corresponding TABLE_LIST.
 | |
|       */
 | |
|       if (m_table_id == ptr->table_id)
 | |
|       {
 | |
|         ptr->table->master_had_triggers=
 | |
|           ((RPL_TABLE_LIST*)ptr)->master_had_triggers;
 | |
|       }
 | |
|     }
 | |
| 
 | |
| #ifdef HAVE_QUERY_CACHE
 | |
|     /*
 | |
|       Moved invalidation right before the call to rows_event_stmt_cleanup(),
 | |
|       to avoid query cache being polluted with stale entries,
 | |
|     */
 | |
| # ifdef WITH_WSREP
 | |
|     /* Query cache is not invalidated on wsrep applier here */
 | |
|     if (!(WSREP(thd) && wsrep_thd_is_applying(thd)))
 | |
| # endif /* WITH_WSREP */
 | |
|       query_cache.invalidate_locked_for_write(thd, rgi->tables_to_lock);
 | |
| #endif /* HAVE_QUERY_CACHE */
 | |
|   }
 | |
| 
 | |
|   table= m_table= rgi->m_table_map.get_table(m_table_id);
 | |
| 
 | |
|   DBUG_PRINT("debug", ("m_table:%p, m_table_id: %llu%s",
 | |
|                        m_table, m_table_id,
 | |
|                        table && master_had_triggers ?
 | |
|                        " (master had triggers)" : ""));
 | |
|   if (table)
 | |
|   {
 | |
|     Rows_log_event::Db_restore_ctx restore_ctx(this);
 | |
|     master_had_triggers= table->master_had_triggers;
 | |
|     bool transactional_table= table->file->has_transactions_and_rollback();
 | |
|     table->file->prepare_for_insert(get_general_type_code() != WRITE_ROWS_EVENT);
 | |
| 
 | |
|     /*
 | |
|       table == NULL means that this table should not be replicated
 | |
|       (this was set up by Table_map_log_event::do_apply_event()
 | |
|       which tested replicate-* rules).
 | |
|     */
 | |
| 
 | |
|     /*
 | |
|       It's not needed to set_time() but
 | |
|       1) it continues the property that "Time" in SHOW PROCESSLIST shows how
 | |
|       much slave is behind
 | |
|       2) it will be needed when we allow replication from a table with no
 | |
|       TIMESTAMP column to a table with one.
 | |
|       So we call set_time(), like in SBR. Presently it changes nothing.
 | |
|     */
 | |
|     thd->set_time(when, when_sec_part);
 | |
| 
 | |
|     if (m_width == table->s->fields && bitmap_is_set_all(&m_cols))
 | |
|       set_flags(COMPLETE_ROWS_F);
 | |
| 
 | |
|     /*
 | |
|       Set tables write and read sets.
 | |
| 
 | |
|       Read_set contains all slave columns (in case we are going to fetch
 | |
|       a complete record from slave).
 | |
| 
 | |
|       Write_set equals the m_cols bitmap sent from master but it can be
 | |
|       longer if slave has extra columns.
 | |
|     */
 | |
| 
 | |
|     DBUG_PRINT_BITSET("debug", "Setting table's read_set from: %s", &m_cols);
 | |
| 
 | |
|     bitmap_set_all(table->read_set);
 | |
|     if (get_general_type_code() == DELETE_ROWS_EVENT ||
 | |
|         get_general_type_code() == UPDATE_ROWS_EVENT)
 | |
|       bitmap_intersect(table->read_set,&m_cols);
 | |
| 
 | |
|     bitmap_set_all(table->write_set);
 | |
|     table->rpl_write_set= table->write_set;
 | |
| 
 | |
|     /* WRITE ROWS EVENTS store the bitmap in m_cols instead of m_cols_ai */
 | |
|     MY_BITMAP *after_image= ((get_general_type_code() == UPDATE_ROWS_EVENT) ?
 | |
|                              &m_cols_ai : &m_cols);
 | |
|     bitmap_intersect(table->write_set, after_image);
 | |
| 
 | |
|     this->slave_exec_mode= slave_exec_mode_options; // fix the mode
 | |
| 
 | |
|     // Do event specific preparations 
 | |
|     error= do_before_row_operations(rli);
 | |
| 
 | |
|     /*
 | |
|       Bug#56662 Assertion failed: next_insert_id == 0, file handler.cc
 | |
|       Don't allow generation of auto_increment value when processing
 | |
|       rows event by setting 'MODE_NO_AUTO_VALUE_ON_ZERO'. The exception
 | |
|       to this rule happens when the auto_inc column exists on some
 | |
|       extra columns on the slave. In that case, do not force
 | |
|       MODE_NO_AUTO_VALUE_ON_ZERO.
 | |
|     */
 | |
|     sql_mode_t saved_sql_mode= thd->variables.sql_mode;
 | |
|     if (!is_auto_inc_in_extra_columns())
 | |
|       thd->variables.sql_mode= MODE_NO_AUTO_VALUE_ON_ZERO;
 | |
| 
 | |
|     // row processing loop
 | |
| 
 | |
|     /* 
 | |
|       set the initial time of this ROWS statement if it was not done
 | |
|       before in some other ROWS event. 
 | |
|      */
 | |
|     rgi->set_row_stmt_start_timestamp();
 | |
| 
 | |
|     THD_STAGE_INFO(thd, stage_executing);
 | |
|     do
 | |
|     {
 | |
|       /* in_use can have been set to NULL in close_tables_for_reopen */
 | |
|       THD* old_thd= table->in_use;
 | |
|       if (!table->in_use)
 | |
|         table->in_use= thd;
 | |
| 
 | |
|       error= do_exec_row(rgi);
 | |
| 
 | |
|       if (unlikely(error))
 | |
|         DBUG_PRINT("info", ("error: %s", HA_ERR(error)));
 | |
|       DBUG_ASSERT(error != HA_ERR_RECORD_DELETED);
 | |
| 
 | |
|       table->in_use = old_thd;
 | |
| 
 | |
|       if (unlikely(error))
 | |
|       {
 | |
|         int actual_error= convert_handler_error(error, thd, table);
 | |
|         bool idempotent_error= (idempotent_error_code(error) &&
 | |
|                                (slave_exec_mode == SLAVE_EXEC_MODE_IDEMPOTENT));
 | |
|         bool ignored_error= (idempotent_error == 0 ?
 | |
|                              ignored_error_code(actual_error) : 0);
 | |
| 
 | |
| #ifdef WITH_WSREP
 | |
|         if (WSREP(thd) && thd->wsrep_applier &&
 | |
|             wsrep_ignored_error_code(this, actual_error))
 | |
|         {
 | |
|           idempotent_error= true;
 | |
|           thd->wsrep_has_ignored_error= true;
 | |
|         }
 | |
| #endif /* WITH_WSREP */
 | |
|         if (idempotent_error || ignored_error)
 | |
|         {
 | |
|           if (global_system_variables.log_warnings)
 | |
|             slave_rows_error_report(WARNING_LEVEL, error, rgi, thd, table,
 | |
|                                     get_type_str(),
 | |
|                                     RPL_LOG_NAME, log_pos);
 | |
|           thd->clear_error(1);
 | |
|           error= 0;
 | |
|           if (idempotent_error == 0)
 | |
|             break;
 | |
|         }
 | |
|       }
 | |
| 
 | |
|       /*
 | |
|        If m_curr_row_end  was not set during event execution (e.g., because
 | |
|        of errors) we can't proceed to the next row. If the error is transient
 | |
|        (i.e., error==0 at this point) we must call unpack_current_row() to set 
 | |
|        m_curr_row_end.
 | |
|       */ 
 | |
|    
 | |
|       DBUG_PRINT("info", ("curr_row: %p; curr_row_end: %p; rows_end:%p",
 | |
|                           m_curr_row, m_curr_row_end, m_rows_end));
 | |
| 
 | |
|       if (!m_curr_row_end && likely(!error))
 | |
|         error= unpack_current_row(rgi);
 | |
| 
 | |
|       m_curr_row= m_curr_row_end;
 | |
|  
 | |
|       if (likely(error == 0) && !transactional_table)
 | |
|         thd->transaction->all.modified_non_trans_table=
 | |
|           thd->transaction->stmt.modified_non_trans_table= TRUE;
 | |
|     } // row processing loop
 | |
|     while (error == 0 && (m_curr_row != m_rows_end));
 | |
| 
 | |
|     /*
 | |
|       Restore the sql_mode after the rows event is processed.
 | |
|     */
 | |
|     thd->variables.sql_mode= saved_sql_mode;
 | |
| 
 | |
|     {/**
 | |
|          The following failure injecion works in cooperation with tests 
 | |
|          setting @@global.debug= 'd,stop_slave_middle_group'.
 | |
|          The sql thread receives the killed status and will proceed 
 | |
|          to shutdown trying to finish incomplete events group.
 | |
|      */
 | |
|       DBUG_EXECUTE_IF("stop_slave_middle_group",
 | |
|                       if (thd->transaction->all.modified_non_trans_table)
 | |
|                         const_cast<Relay_log_info*>(rli)->abort_slave= 1;);
 | |
|     }
 | |
| 
 | |
|     if (unlikely(error= do_after_row_operations(rli, error)) &&
 | |
|         ignored_error_code(convert_handler_error(error, thd, table)))
 | |
|     {
 | |
| 
 | |
|       if (global_system_variables.log_warnings)
 | |
|         slave_rows_error_report(WARNING_LEVEL, error, rgi, thd, table,
 | |
|                                 get_type_str(),
 | |
|                                 RPL_LOG_NAME, log_pos);
 | |
|       thd->clear_error(1);
 | |
|       error= 0;
 | |
|     }
 | |
|   } // if (table)
 | |
| 
 | |
|   
 | |
|   if (unlikely(error))
 | |
|   {
 | |
|     slave_rows_error_report(ERROR_LEVEL, error, rgi, thd, table,
 | |
|                              get_type_str(),
 | |
|                              RPL_LOG_NAME, log_pos);
 | |
|     /*
 | |
|       @todo We should probably not call
 | |
|       reset_current_stmt_binlog_format_row() from here.
 | |
| 
 | |
|       Note: this applies to log_event_old.cc too.
 | |
|       /Sven
 | |
|     */
 | |
|     thd->reset_current_stmt_binlog_format_row();
 | |
|     thd->is_slave_error= 1;
 | |
|     /* remove trigger's tables */
 | |
|     goto err;
 | |
|   }
 | |
| 
 | |
|   /* remove trigger's tables */
 | |
|   restore_empty_query_table_list(thd->lex);
 | |
| 
 | |
| #if defined(WITH_WSREP) && defined(HAVE_QUERY_CACHE)
 | |
|   if (WSREP(thd) && wsrep_thd_is_applying(thd))
 | |
|     query_cache.invalidate_locked_for_write(thd, rgi->tables_to_lock);
 | |
| #endif /* WITH_WSREP && HAVE_QUERY_CACHE */
 | |
| 
 | |
|   if (get_flags(STMT_END_F))
 | |
|   {
 | |
|     if (unlikely((error= rows_event_stmt_cleanup(rgi, thd))))
 | |
|       slave_rows_error_report(ERROR_LEVEL, thd->is_error() ? 0 : error,
 | |
|                               rgi, thd, table, get_type_str(),
 | |
|                               RPL_LOG_NAME, log_pos);
 | |
|     if (thd->slave_thread)
 | |
|       free_root(thd->mem_root, MYF(MY_KEEP_PREALLOC));
 | |
|   }
 | |
| 
 | |
|   DBUG_RETURN(error);
 | |
| 
 | |
| err:
 | |
|   restore_empty_query_table_list(thd->lex);
 | |
|   rgi->slave_close_thread_tables(thd);
 | |
|   DBUG_RETURN(error);
 | |
| }
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Rows_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   /*
 | |
|     If the slave skip counter is 1 and this event does not end a
 | |
|     statement, then we should not start executing on the next event.
 | |
|     Otherwise, we defer the decision to the normal skipping logic.
 | |
|   */
 | |
|   if (rgi->rli->slave_skip_counter == 1 && !get_flags(STMT_END_F))
 | |
|     return Log_event::EVENT_SKIP_IGNORE;
 | |
|   else
 | |
|     return Log_event::do_shall_skip(rgi);
 | |
| }
 | |
| 
 | |
| /**
 | |
|    The function is called at Rows_log_event statement commit time,
 | |
|    normally from Rows_log_event::do_update_pos() and possibly from
 | |
|    Query_log_event::do_apply_event() of the COMMIT.
 | |
|    The function commits the last statement for engines, binlog and
 | |
|    releases resources have been allocated for the statement.
 | |
|   
 | |
|    @retval  0         Ok.
 | |
|    @retval  non-zero  Error at the commit.
 | |
|  */
 | |
| 
 | |
| static int rows_event_stmt_cleanup(rpl_group_info *rgi, THD * thd)
 | |
| {
 | |
|   int error;
 | |
|   DBUG_ENTER("rows_event_stmt_cleanup");
 | |
| 
 | |
|   {
 | |
|     /*
 | |
|       This is the end of a statement or transaction, so close (and
 | |
|       unlock) the tables we opened when processing the
 | |
|       Table_map_log_event starting the statement.
 | |
| 
 | |
|       OBSERVER.  This will clear *all* mappings, not only those that
 | |
|       are open for the table. There is not good handle for on-close
 | |
|       actions for tables.
 | |
| 
 | |
|       NOTE. Even if we have no table ('table' == 0) we still need to be
 | |
|       here, so that we increase the group relay log position. If we didn't, we
 | |
|       could have a group relay log position which lags behind "forever"
 | |
|       (assume the last master's transaction is ignored by the slave because of
 | |
|       replicate-ignore rules).
 | |
|     */
 | |
|     error= thd->binlog_flush_pending_rows_event(TRUE);
 | |
| 
 | |
|     /*
 | |
|       If this event is not in a transaction, the call below will, if some
 | |
|       transactional storage engines are involved, commit the statement into
 | |
|       them and flush the pending event to binlog.
 | |
|       If this event is in a transaction, the call will do nothing, but a
 | |
|       Xid_log_event will come next which will, if some transactional engines
 | |
|       are involved, commit the transaction and flush the pending event to the
 | |
|       binlog.
 | |
|       We check for thd->transaction_rollback_request because it is possible
 | |
|       there was a deadlock that was ignored by slave-skip-errors. Normally, the
 | |
|       deadlock would have been rolled back already.
 | |
|     */
 | |
|     error|= (int) ((error || thd->transaction_rollback_request)
 | |
|                        ? trans_rollback_stmt(thd)
 | |
|                        : trans_commit_stmt(thd));
 | |
| 
 | |
|     /*
 | |
|       Now what if this is not a transactional engine? we still need to
 | |
|       flush the pending event to the binlog; we did it with
 | |
|       thd->binlog_flush_pending_rows_event(). Note that we imitate
 | |
|       what is done for real queries: a call to
 | |
|       ha_autocommit_or_rollback() (sometimes only if involves a
 | |
|       transactional engine), and a call to be sure to have the pending
 | |
|       event flushed.
 | |
|     */
 | |
| 
 | |
|     /*
 | |
|       @todo We should probably not call
 | |
|       reset_current_stmt_binlog_format_row() from here.
 | |
| 
 | |
|       Note: this applies to log_event_old.cc too
 | |
| 
 | |
|       Btw, the previous comment about transactional engines does not
 | |
|       seem related to anything that happens here.
 | |
|       /Sven
 | |
|     */
 | |
|     thd->reset_current_stmt_binlog_format_row();
 | |
| 
 | |
|     /*
 | |
|       Reset modified_non_trans_table that we have set in
 | |
|       rows_log_event::do_apply_event()
 | |
|     */
 | |
|     if (!thd->in_multi_stmt_transaction_mode())
 | |
|     {
 | |
|       thd->transaction->all.modified_non_trans_table= 0;
 | |
|       thd->transaction->all.m_unsafe_rollback_flags&= ~THD_TRANS::DID_WAIT;
 | |
|     }
 | |
| 
 | |
|     rgi->cleanup_context(thd, 0);
 | |
|   }
 | |
|   DBUG_RETURN(error);
 | |
| }
 | |
| 
 | |
| /**
 | |
|    The method either increments the relay log position or
 | |
|    commits the current statement and increments the master group 
 | |
|    possition if the event is STMT_END_F flagged and
 | |
|    the statement corresponds to the autocommit query (i.e replicated
 | |
|    without wrapping in BEGIN/COMMIT)
 | |
| 
 | |
|    @retval 0         Success
 | |
|    @retval non-zero  Error in the statement commit
 | |
|  */
 | |
| int
 | |
| Rows_log_event::do_update_pos(rpl_group_info *rgi)
 | |
| {
 | |
|   Relay_log_info *rli= rgi->rli;
 | |
|   int error= 0;
 | |
|   DBUG_ENTER("Rows_log_event::do_update_pos");
 | |
| 
 | |
|   DBUG_PRINT("info", ("flags: %s",
 | |
|                       get_flags(STMT_END_F) ? "STMT_END_F " : ""));
 | |
| 
 | |
|   if (get_flags(STMT_END_F))
 | |
|   {
 | |
|     /*
 | |
|       Indicate that a statement is finished.
 | |
|       Step the group log position if we are not in a transaction,
 | |
|       otherwise increase the event log position.
 | |
|     */
 | |
|     error= rli->stmt_done(log_pos, thd, rgi);
 | |
|     /*
 | |
|       Clear any errors in thd->net.last_err*. It is not known if this is
 | |
|       needed or not. It is believed that any errors that may exist in
 | |
|       thd->net.last_err* are allowed. Examples of errors are "key not
 | |
|       found", which is produced in the test case rpl_row_conflicts.test
 | |
|     */
 | |
|     thd->clear_error();
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     rgi->inc_event_relay_log_pos();
 | |
|   }
 | |
| 
 | |
|   DBUG_RETURN(error);
 | |
| }
 | |
| 
 | |
| #endif /* defined(HAVE_REPLICATION) */
 | |
| 
 | |
| 
 | |
| bool Rows_log_event::write_data_header()
 | |
| {
 | |
|   uchar buf[ROWS_HEADER_LEN_V2];        // No need to init the buffer
 | |
|   DBUG_ASSERT(m_table_id != UINT32_MAX);
 | |
|   DBUG_EXECUTE_IF("old_row_based_repl_4_byte_map_id_master",
 | |
|                   {
 | |
|                     int4store(buf + 0, (ulong) m_table_id);
 | |
|                     int2store(buf + 4, m_flags);
 | |
|                     return (write_data(buf, 6));
 | |
|                   });
 | |
|   int6store(buf + RW_MAPID_OFFSET, m_table_id);
 | |
|   int2store(buf + RW_FLAGS_OFFSET, m_flags);
 | |
|   return write_data(buf, ROWS_HEADER_LEN);
 | |
| }
 | |
| 
 | |
| bool Rows_log_event::write_data_body()
 | |
| {
 | |
|   /*
 | |
|      Note that this should be the number of *bits*, not the number of
 | |
|      bytes.
 | |
|   */
 | |
|   uchar sbuf[MAX_INT_WIDTH];
 | |
|   my_ptrdiff_t const data_size= m_rows_cur - m_rows_buf;
 | |
|   bool res= false;
 | |
|   uchar *const sbuf_end= net_store_length(sbuf, (size_t) m_width);
 | |
|   uint bitmap_size= no_bytes_in_export_map(&m_cols);
 | |
|   uchar *bitmap;
 | |
|   DBUG_ASSERT(static_cast<size_t>(sbuf_end - sbuf) <= sizeof(sbuf));
 | |
| 
 | |
|   DBUG_DUMP("m_width", sbuf, (size_t) (sbuf_end - sbuf));
 | |
|   res= res || write_data(sbuf, (size_t) (sbuf_end - sbuf));
 | |
| 
 | |
|   bitmap= (uchar*) my_alloca(bitmap_size);
 | |
|   bitmap_export(bitmap, &m_cols);
 | |
| 
 | |
|   DBUG_DUMP("m_cols", bitmap, bitmap_size);
 | |
|   res= res || write_data(bitmap, bitmap_size);
 | |
|   /*
 | |
|     TODO[refactor write]: Remove the "down cast" here (and elsewhere).
 | |
|    */
 | |
|   if (get_general_type_code() == UPDATE_ROWS_EVENT)
 | |
|   {
 | |
|     DBUG_ASSERT(m_cols.n_bits == m_cols_ai.n_bits);
 | |
|     bitmap_export(bitmap, &m_cols_ai);
 | |
| 
 | |
|     DBUG_DUMP("m_cols_ai", bitmap, bitmap_size);
 | |
|     res= res || write_data(bitmap, bitmap_size);
 | |
|   }
 | |
|   DBUG_DUMP("rows", m_rows_buf, data_size);
 | |
|   res= res || write_data(m_rows_buf, (size_t) data_size);
 | |
|   my_afree(bitmap);
 | |
| 
 | |
|   return res;
 | |
| }
 | |
| 
 | |
| 
 | |
| bool Rows_log_event::write_compressed()
 | |
| {
 | |
|   uchar *m_rows_buf_tmp= m_rows_buf;
 | |
|   uchar *m_rows_cur_tmp= m_rows_cur;
 | |
|   bool ret= true;
 | |
|   uint32 comlen, alloc_size;
 | |
|   comlen= alloc_size= binlog_get_compress_len((uint32)(m_rows_cur_tmp -
 | |
|                                                        m_rows_buf_tmp));
 | |
|   m_rows_buf= (uchar*) my_safe_alloca(alloc_size);
 | |
|   if(m_rows_buf &&
 | |
|      !binlog_buf_compress(m_rows_buf_tmp, m_rows_buf,
 | |
|                           (uint32)(m_rows_cur_tmp - m_rows_buf_tmp), &comlen))
 | |
|   {
 | |
|     m_rows_cur= comlen + m_rows_buf;
 | |
|     ret= Log_event::write();
 | |
|   }
 | |
|   my_safe_afree(m_rows_buf, alloc_size);
 | |
|   m_rows_buf= m_rows_buf_tmp;
 | |
|   m_rows_cur= m_rows_cur_tmp;
 | |
|   return ret;
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Rows_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf[256];
 | |
|   char const *const flagstr=
 | |
|     get_flags(STMT_END_F) ? " flags: STMT_END_F" : "";
 | |
|   size_t bytes= my_snprintf(buf, sizeof(buf),
 | |
|                                "table_id: %llu%s", m_table_id, flagstr);
 | |
|   protocol->store(buf, bytes, &my_charset_bin);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Annotate_rows_log_event member functions
 | |
| **************************************************************************/
 | |
| 
 | |
| Annotate_rows_log_event::Annotate_rows_log_event(THD *thd,
 | |
|                                                  bool using_trans,
 | |
|                                                  bool direct)
 | |
|   : Log_event(thd, 0, using_trans),
 | |
|     m_save_thd_query_txt(0),
 | |
|     m_save_thd_query_len(0),
 | |
|     m_saved_thd_query(false),
 | |
|     m_used_query_txt(0)
 | |
| {
 | |
|   m_query_txt= thd->query();
 | |
|   m_query_len= thd->query_length();
 | |
|   if (direct)
 | |
|     cache_type= Log_event::EVENT_NO_CACHE;
 | |
| }
 | |
| 
 | |
| 
 | |
| bool Annotate_rows_log_event::write_data_header()
 | |
| { 
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| 
 | |
| bool Annotate_rows_log_event::write_data_body()
 | |
| {
 | |
|   return write_data(m_query_txt, m_query_len);
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| void Annotate_rows_log_event::pack_info(Protocol* protocol)
 | |
| {
 | |
|   if (m_query_txt && m_query_len)
 | |
|     protocol->store(m_query_txt, m_query_len, &my_charset_bin);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| int Annotate_rows_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   rgi->free_annotate_event();
 | |
|   m_save_thd_query_txt= thd->query();
 | |
|   m_save_thd_query_len= thd->query_length();
 | |
|   m_saved_thd_query= true;
 | |
|   m_used_query_txt= 1;
 | |
|   thd->set_query(m_query_txt, m_query_len);
 | |
|   return 0;
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| int Annotate_rows_log_event::do_update_pos(rpl_group_info *rgi)
 | |
| {
 | |
|   rgi->inc_event_relay_log_pos();
 | |
|   return 0;
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| Log_event::enum_skip_reason
 | |
| Annotate_rows_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   return continue_group(rgi);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Table_map_log_event member functions and support functions
 | |
| **************************************************************************/
 | |
| 
 | |
| /**
 | |
|   Save the field metadata based on the real_type of the field.
 | |
|   The metadata saved depends on the type of the field. Some fields
 | |
|   store a single byte for pack_length() while others store two bytes
 | |
|   for field_length (max length).
 | |
|   
 | |
|   @retval  0  Ok.
 | |
| 
 | |
|   @todo
 | |
|   We may want to consider changing the encoding of the information.
 | |
|   Currently, the code attempts to minimize the number of bytes written to 
 | |
|   the tablemap. There are at least two other alternatives; 1) using 
 | |
|   net_store_length() to store the data allowing it to choose the number of
 | |
|   bytes that are appropriate thereby making the code much easier to 
 | |
|   maintain (only 1 place to change the encoding), or 2) use a fixed number
 | |
|   of bytes for each field. The problem with option 1 is that net_store_length()
 | |
|   will use one byte if the value < 251, but 3 bytes if it is > 250. Thus,
 | |
|   for fields like CHAR which can be no larger than 255 characters, the method
 | |
|   will use 3 bytes when the value is > 250. Further, every value that is
 | |
|   encoded using 2 parts (e.g., pack_length, field_length) will be numerically
 | |
|   > 250 therefore will use 3 bytes for eah value. The problem with option 2
 | |
|   is less wasteful for space but does waste 1 byte for every field that does
 | |
|   not encode 2 parts. 
 | |
| */
 | |
| int Table_map_log_event::save_field_metadata()
 | |
| {
 | |
|   DBUG_ENTER("Table_map_log_event::save_field_metadata");
 | |
|   int index= 0;
 | |
|   Binlog_type_info *info;
 | |
|   for (unsigned int i= 0 ; i < m_table->s->fields ; i++)
 | |
|   {
 | |
|     DBUG_PRINT("debug", ("field_type: %d", m_coltype[i]));
 | |
|     info= binlog_type_info_array + i;
 | |
|     int2store(&m_field_metadata[index], info->m_metadata);
 | |
|     index+= info->m_metadata_size;
 | |
|     DBUG_EXECUTE_IF("inject_invalid_blob_size",
 | |
|                     {
 | |
|                       if (m_coltype[i] == MYSQL_TYPE_BLOB)
 | |
|                         m_field_metadata[index-1] = 5;
 | |
|                     });
 | |
|   }
 | |
|   DBUG_RETURN(index);
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   Constructor used to build an event for writing to the binary log.
 | |
|   Mats says tbl->s lives longer than this event so it's ok to copy pointers
 | |
|   (tbl->s->db etc) and not pointer content.
 | |
|  */
 | |
| Table_map_log_event::Table_map_log_event(THD *thd, TABLE *tbl, ulonglong tid,
 | |
|                                          bool is_transactional)
 | |
|   : Log_event(thd, 0, is_transactional),
 | |
|     m_table(tbl),
 | |
|     m_dbnam(tbl->s->db.str),
 | |
|     m_dblen(m_dbnam ? tbl->s->db.length : 0),
 | |
|     m_tblnam(tbl->s->table_name.str),
 | |
|     m_tbllen(tbl->s->table_name.length),
 | |
|     m_colcnt(tbl->s->fields),
 | |
|     m_memory(NULL),
 | |
|     m_table_id(tid),
 | |
|     m_flags(TM_BIT_LEN_EXACT_F),
 | |
|     m_data_size(0),
 | |
|     m_field_metadata(0),
 | |
|     m_field_metadata_size(0),
 | |
|     m_null_bits(0),
 | |
|     m_meta_memory(NULL),
 | |
|     m_optional_metadata_len(0),
 | |
|     m_optional_metadata(NULL)
 | |
| {
 | |
|   uchar cbuf[MAX_INT_WIDTH];
 | |
|   uchar *cbuf_end;
 | |
|   DBUG_ENTER("Table_map_log_event::Table_map_log_event(TABLE)");
 | |
|   DBUG_ASSERT(m_table_id != UINT32_MAX);
 | |
|   /*
 | |
|     In TABLE_SHARE, "db" and "table_name" are 0-terminated (see this comment in
 | |
|     table.cc / alloc_table_share():
 | |
|       Use the fact the key is db/0/table_name/0
 | |
|     As we rely on this let's assert it.
 | |
|   */
 | |
|   DBUG_ASSERT((tbl->s->db.str == 0) ||
 | |
|               (tbl->s->db.str[tbl->s->db.length] == 0));
 | |
|   DBUG_ASSERT(tbl->s->table_name.str[tbl->s->table_name.length] == 0);
 | |
| 
 | |
|   binlog_type_info_array= (Binlog_type_info *)thd->alloc(m_table->s->fields *
 | |
|                                                    sizeof(Binlog_type_info));
 | |
|   for (uint i= 0; i <  m_table->s->fields; i++)
 | |
|     binlog_type_info_array[i]= m_table->field[i]->binlog_type_info();
 | |
| 
 | |
|   m_data_size=  TABLE_MAP_HEADER_LEN;
 | |
|   DBUG_EXECUTE_IF("old_row_based_repl_4_byte_map_id_master", m_data_size= 6;);
 | |
|   m_data_size+= m_dblen + 2;	// Include length and terminating \0
 | |
|   m_data_size+= m_tbllen + 2;	// Include length and terminating \0
 | |
|   cbuf_end= net_store_length(cbuf, (size_t) m_colcnt);
 | |
|   DBUG_ASSERT(static_cast<size_t>(cbuf_end - cbuf) <= sizeof(cbuf));
 | |
|   m_data_size+= (cbuf_end - cbuf) + m_colcnt;	// COLCNT and column types
 | |
| 
 | |
|   if (tbl->triggers)
 | |
|     m_flags|= TM_BIT_HAS_TRIGGERS_F;
 | |
| 
 | |
|   /* If malloc fails, caught in is_valid() */
 | |
|   if ((m_memory= (uchar*) my_malloc(PSI_INSTRUMENT_ME, m_colcnt, MYF(MY_WME))))
 | |
|   {
 | |
|     m_coltype= reinterpret_cast<uchar*>(m_memory);
 | |
|     for (unsigned int i= 0 ; i < m_table->s->fields ; ++i)
 | |
|       m_coltype[i]= binlog_type_info_array[i].m_type_code;
 | |
|     DBUG_EXECUTE_IF("inject_invalid_column_type", m_coltype[1]= 230;);
 | |
|   }
 | |
| 
 | |
|   /*
 | |
|     Calculate a bitmap for the results of maybe_null() for all columns.
 | |
|     The bitmap is used to determine when there is a column from the master
 | |
|     that is not on the slave and is null and thus not in the row data during
 | |
|     replication.
 | |
|   */
 | |
|   uint num_null_bytes= (m_table->s->fields + 7) / 8;
 | |
|   m_data_size+= num_null_bytes;
 | |
|   m_meta_memory= (uchar *)my_multi_malloc(PSI_INSTRUMENT_ME, MYF(MY_WME),
 | |
|                                  &m_null_bits, num_null_bytes,
 | |
|                                  &m_field_metadata, (m_colcnt * 2),
 | |
|                                  NULL);
 | |
| 
 | |
|   bzero(m_field_metadata, (m_colcnt * 2));
 | |
| 
 | |
|   /*
 | |
|     Create an array for the field metadata and store it.
 | |
|   */
 | |
|   m_field_metadata_size= save_field_metadata();
 | |
|   DBUG_ASSERT(m_field_metadata_size <= (m_colcnt * 2));
 | |
| 
 | |
|   /*
 | |
|     Now set the size of the data to the size of the field metadata array
 | |
|     plus one or three bytes (see pack.c:net_store_length) for number of 
 | |
|     elements in the field metadata array.
 | |
|   */
 | |
|   if (m_field_metadata_size < 251)
 | |
|     m_data_size+= m_field_metadata_size + 1; 
 | |
|   else
 | |
|     m_data_size+= m_field_metadata_size + 3; 
 | |
| 
 | |
|   bzero(m_null_bits, num_null_bytes);
 | |
|   for (unsigned int i= 0 ; i < m_table->s->fields ; ++i)
 | |
|     if (m_table->field[i]->maybe_null())
 | |
|       m_null_bits[(i / 8)]+= 1 << (i % 8);
 | |
| 
 | |
|   init_metadata_fields();
 | |
|   m_data_size+= m_metadata_buf.length();
 | |
| 
 | |
|   DBUG_VOID_RETURN;
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   Return value is an error code, one of:
 | |
| 
 | |
|       -1     Failure to open table   [from open_tables()]
 | |
|        0     Success
 | |
|        1     No room for more tables [from set_table()]
 | |
|        2     Out of memory           [from set_table()]
 | |
|        3     Wrong table definition
 | |
|        4     Daisy-chaining RBR with SBR not possible
 | |
|  */
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| enum enum_tbl_map_status
 | |
| {
 | |
|   /* no duplicate identifier found */
 | |
|   OK_TO_PROCESS= 0,
 | |
| 
 | |
|   /* this table map must be filtered out */
 | |
|   FILTERED_OUT= 1,
 | |
| 
 | |
|   /* identifier mapping table with different properties */
 | |
|   SAME_ID_MAPPING_DIFFERENT_TABLE= 2,
 | |
|   
 | |
|   /* a duplicate identifier was found mapping the same table */
 | |
|   SAME_ID_MAPPING_SAME_TABLE= 3
 | |
| };
 | |
| 
 | |
| /*
 | |
|   Checks if this table map event should be processed or not. First
 | |
|   it checks the filtering rules, and then looks for duplicate identifiers
 | |
|   in the existing list of rli->tables_to_lock.
 | |
| 
 | |
|   It checks that there hasn't been any corruption by verifying that there
 | |
|   are no duplicate entries with different properties.
 | |
| 
 | |
|   In some cases, some binary logs could get corrupted, showing several
 | |
|   tables mapped to the same table_id, 0 (see: BUG#56226). Thus we do this
 | |
|   early sanity check for such cases and avoid that the server crashes 
 | |
|   later.
 | |
| 
 | |
|   In some corner cases, the master logs duplicate table map events, i.e.,
 | |
|   same id, same database name, same table name (see: BUG#37137). This is
 | |
|   different from the above as it's the same table that is mapped again 
 | |
|   to the same identifier. Thus we cannot just check for same ids and 
 | |
|   assume that the event is corrupted we need to check every property. 
 | |
| 
 | |
|   NOTE: in the event that BUG#37137 ever gets fixed, this extra check 
 | |
|         will still be valid because we would need to support old binary 
 | |
|         logs anyway.
 | |
| 
 | |
|   @param rli The relay log info reference.
 | |
|   @param table_list A list element containing the table to check against.
 | |
|   @return OK_TO_PROCESS 
 | |
|             if there was no identifier already in rli->tables_to_lock 
 | |
|             
 | |
|           FILTERED_OUT
 | |
|             if the event is filtered according to the filtering rules
 | |
| 
 | |
|           SAME_ID_MAPPING_DIFFERENT_TABLE 
 | |
|             if the same identifier already maps a different table in 
 | |
|             rli->tables_to_lock
 | |
| 
 | |
|           SAME_ID_MAPPING_SAME_TABLE 
 | |
|             if the same identifier already maps the same table in 
 | |
|             rli->tables_to_lock.
 | |
| */
 | |
| static enum_tbl_map_status
 | |
| check_table_map(rpl_group_info *rgi, RPL_TABLE_LIST *table_list)
 | |
| {
 | |
|   DBUG_ENTER("check_table_map");
 | |
|   enum_tbl_map_status res= OK_TO_PROCESS;
 | |
|   Relay_log_info *rli= rgi->rli;
 | |
| 
 | |
|   if (rgi->thd->slave_thread /* filtering is for slave only */ &&
 | |
|       (!rli->mi->rpl_filter->db_ok(table_list->db.str) ||
 | |
|        (rli->mi->rpl_filter->is_on() && !rli->mi->rpl_filter->tables_ok("", table_list))))
 | |
|     res= FILTERED_OUT;
 | |
|   else
 | |
|   {
 | |
|     RPL_TABLE_LIST *ptr= static_cast<RPL_TABLE_LIST*>(rgi->tables_to_lock);
 | |
|     for(uint i=0 ; ptr && (i< rgi->tables_to_lock_count); 
 | |
|         ptr= static_cast<RPL_TABLE_LIST*>(ptr->next_local), i++)
 | |
|     {
 | |
|       if (ptr->table_id == table_list->table_id)
 | |
|       {
 | |
| 
 | |
|         if (cmp(&ptr->db, &table_list->db) ||
 | |
|             cmp(&ptr->alias, &table_list->table_name) ||
 | |
|             ptr->lock_type != TL_WRITE) // the ::do_apply_event always sets TL_WRITE
 | |
|           res= SAME_ID_MAPPING_DIFFERENT_TABLE;
 | |
|         else
 | |
|           res= SAME_ID_MAPPING_SAME_TABLE;
 | |
| 
 | |
|         break;
 | |
|       }
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   DBUG_PRINT("debug", ("check of table map ended up with: %u", res));
 | |
| 
 | |
|   DBUG_RETURN(res);
 | |
| }
 | |
| 
 | |
| int Table_map_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   RPL_TABLE_LIST *table_list;
 | |
|   char *db_mem, *tname_mem, *ptr;
 | |
|   size_t dummy_len, db_mem_length, tname_mem_length;
 | |
|   void *memory;
 | |
|   Rpl_filter *filter;
 | |
|   Relay_log_info const *rli= rgi->rli;
 | |
|   DBUG_ENTER("Table_map_log_event::do_apply_event(Relay_log_info*)");
 | |
| 
 | |
|   /* Step the query id to mark what columns that are actually used. */
 | |
|   thd->set_query_id(next_query_id());
 | |
| 
 | |
|   if (!(memory= my_multi_malloc(PSI_INSTRUMENT_ME, MYF(MY_WME),
 | |
|                                 &table_list, (uint) sizeof(RPL_TABLE_LIST),
 | |
|                                 &db_mem, (uint) NAME_LEN + 1,
 | |
|                                 &tname_mem, (uint) NAME_LEN + 1,
 | |
|                                 NullS)))
 | |
|     DBUG_RETURN(HA_ERR_OUT_OF_MEM);
 | |
| 
 | |
|   db_mem_length= strmov(db_mem, m_dbnam) - db_mem;
 | |
|   tname_mem_length= strmov(tname_mem, m_tblnam) - tname_mem;
 | |
|   if (lower_case_table_names)
 | |
|   {
 | |
|     my_casedn_str(files_charset_info, (char*)tname_mem);
 | |
|     my_casedn_str(files_charset_info, (char*)db_mem);
 | |
|   }
 | |
| 
 | |
|   /* call from mysql_client_binlog_statement() will not set rli->mi */
 | |
|   filter= rgi->thd->slave_thread ? rli->mi->rpl_filter : global_rpl_filter;
 | |
| 
 | |
|   /* rewrite rules changed the database */
 | |
|   if (((ptr= (char*) filter->get_rewrite_db(db_mem, &dummy_len)) != db_mem))
 | |
|     db_mem_length= strmov(db_mem, ptr) - db_mem;
 | |
| 
 | |
|   LEX_CSTRING tmp_db_name=  {db_mem, db_mem_length };
 | |
|   LEX_CSTRING tmp_tbl_name= {tname_mem, tname_mem_length };
 | |
| 
 | |
|   table_list->init_one_table(&tmp_db_name, &tmp_tbl_name, 0, TL_WRITE);
 | |
|   table_list->table_id= DBUG_EVALUATE_IF("inject_tblmap_same_id_maps_diff_table", 0, m_table_id);
 | |
|   table_list->updating= 1;
 | |
|   table_list->required_type= TABLE_TYPE_NORMAL;
 | |
| 
 | |
|   DBUG_PRINT("debug", ("table: %s is mapped to %llu",
 | |
|                        table_list->table_name.str,
 | |
|                        table_list->table_id));
 | |
|   table_list->master_had_triggers= ((m_flags & TM_BIT_HAS_TRIGGERS_F) ? 1 : 0);
 | |
|   DBUG_PRINT("debug", ("table->master_had_triggers=%d", 
 | |
|                        (int)table_list->master_had_triggers));
 | |
| 
 | |
|   enum_tbl_map_status tblmap_status= check_table_map(rgi, table_list);
 | |
|   if (tblmap_status == OK_TO_PROCESS)
 | |
|   {
 | |
|     DBUG_ASSERT(thd->lex->query_tables != table_list);
 | |
| 
 | |
|     /*
 | |
|       Use placement new to construct the table_def instance in the
 | |
|       memory allocated for it inside table_list.
 | |
| 
 | |
|       The memory allocated by the table_def structure (i.e., not the
 | |
|       memory allocated *for* the table_def structure) is released
 | |
|       inside Relay_log_info::clear_tables_to_lock() by calling the
 | |
|       table_def destructor explicitly.
 | |
|     */
 | |
|     new (&table_list->m_tabledef)
 | |
|       table_def(m_coltype, m_colcnt,
 | |
|                 m_field_metadata, m_field_metadata_size,
 | |
|                 m_null_bits, m_flags);
 | |
|     table_list->m_tabledef_valid= TRUE;
 | |
|     table_list->m_conv_table= NULL;
 | |
|     table_list->open_type= OT_BASE_ONLY;
 | |
| 
 | |
|     /*
 | |
|       We record in the slave's information that the table should be
 | |
|       locked by linking the table into the list of tables to lock.
 | |
|     */
 | |
|     table_list->next_global= table_list->next_local= rgi->tables_to_lock;
 | |
|     rgi->tables_to_lock= table_list;
 | |
|     rgi->tables_to_lock_count++;
 | |
|     /* 'memory' is freed in clear_tables_to_lock */
 | |
|   }
 | |
|   else  // FILTERED_OUT, SAME_ID_MAPPING_*
 | |
|   {
 | |
|     /*
 | |
|       If mapped already but with different properties, we raise an
 | |
|       error.
 | |
|       If mapped already but with same properties we skip the event.
 | |
|       If filtered out we skip the event.
 | |
| 
 | |
|       In all three cases, we need to free the memory previously 
 | |
|       allocated.
 | |
|      */
 | |
|     if (tblmap_status == SAME_ID_MAPPING_DIFFERENT_TABLE)
 | |
|     {
 | |
|       /*
 | |
|         Something bad has happened. We need to stop the slave as strange things
 | |
|         could happen if we proceed: slave crash, wrong table being updated, ...
 | |
|         As a consequence we push an error in this case.
 | |
|        */
 | |
| 
 | |
|       char buf[256];
 | |
| 
 | |
|       my_snprintf(buf, sizeof(buf), 
 | |
|                   "Found table map event mapping table id %llu which "
 | |
|                   "was already mapped but with different settings.",
 | |
|                   table_list->table_id);
 | |
| 
 | |
|       if (thd->slave_thread)
 | |
|         rli->report(ERROR_LEVEL, ER_SLAVE_FATAL_ERROR, rgi->gtid_info(),
 | |
|                     ER_THD(thd, ER_SLAVE_FATAL_ERROR), buf);
 | |
|       else
 | |
|         /* 
 | |
|           For the cases in which a 'BINLOG' statement is set to 
 | |
|           execute in a user session 
 | |
|          */
 | |
|         my_error(ER_SLAVE_FATAL_ERROR, MYF(0), buf);
 | |
|     } 
 | |
|     
 | |
|     my_free(memory);
 | |
|   }
 | |
| 
 | |
|   DBUG_RETURN(tblmap_status == SAME_ID_MAPPING_DIFFERENT_TABLE);
 | |
| }
 | |
| 
 | |
| Log_event::enum_skip_reason
 | |
| Table_map_log_event::do_shall_skip(rpl_group_info *rgi)
 | |
| {
 | |
|   /*
 | |
|     If the slave skip counter is 1, then we should not start executing
 | |
|     on the next event.
 | |
|   */
 | |
|   return continue_group(rgi);
 | |
| }
 | |
| 
 | |
| int Table_map_log_event::do_update_pos(rpl_group_info *rgi)
 | |
| {
 | |
|   rgi->inc_event_relay_log_pos();
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| #endif /* defined(HAVE_REPLICATION) */
 | |
| 
 | |
| bool Table_map_log_event::write_data_header()
 | |
| {
 | |
|   DBUG_ASSERT(m_table_id != UINT32_MAX);
 | |
|   uchar buf[TABLE_MAP_HEADER_LEN];
 | |
|   DBUG_EXECUTE_IF("old_row_based_repl_4_byte_map_id_master",
 | |
|                   {
 | |
|                     int4store(buf + 0, (ulong) m_table_id);
 | |
|                     int2store(buf + 4, m_flags);
 | |
|                     return (write_data(buf, 6));
 | |
|                   });
 | |
|   int6store(buf + TM_MAPID_OFFSET, m_table_id);
 | |
|   int2store(buf + TM_FLAGS_OFFSET, m_flags);
 | |
|   return write_data(buf, TABLE_MAP_HEADER_LEN);
 | |
| }
 | |
| 
 | |
| bool Table_map_log_event::write_data_body()
 | |
| {
 | |
|   DBUG_ASSERT(m_dbnam != NULL);
 | |
|   DBUG_ASSERT(m_tblnam != NULL);
 | |
|   /* We use only one byte per length for storage in event: */
 | |
|   DBUG_ASSERT(m_dblen <= MY_MIN(NAME_LEN, 255));
 | |
|   DBUG_ASSERT(m_tbllen <= MY_MIN(NAME_LEN, 255));
 | |
| 
 | |
|   uchar const dbuf[]= { (uchar) m_dblen };
 | |
|   uchar const tbuf[]= { (uchar) m_tbllen };
 | |
| 
 | |
|   uchar cbuf[MAX_INT_WIDTH];
 | |
|   uchar *const cbuf_end= net_store_length(cbuf, (size_t) m_colcnt);
 | |
|   DBUG_ASSERT(static_cast<size_t>(cbuf_end - cbuf) <= sizeof(cbuf));
 | |
| 
 | |
|   /*
 | |
|     Store the size of the field metadata.
 | |
|   */
 | |
|   uchar mbuf[MAX_INT_WIDTH];
 | |
|   uchar *const mbuf_end= net_store_length(mbuf, m_field_metadata_size);
 | |
| 
 | |
|   return write_data(dbuf,      sizeof(dbuf)) ||
 | |
|          write_data(m_dbnam,   m_dblen+1) ||
 | |
|          write_data(tbuf,      sizeof(tbuf)) ||
 | |
|          write_data(m_tblnam,  m_tbllen+1) ||
 | |
|          write_data(cbuf, (size_t) (cbuf_end - cbuf)) ||
 | |
|          write_data(m_coltype, m_colcnt) ||
 | |
|          write_data(mbuf, (size_t) (mbuf_end - mbuf)) ||
 | |
|          write_data(m_field_metadata, m_field_metadata_size),
 | |
|          write_data(m_null_bits, (m_colcnt + 7) / 8) ||
 | |
|          write_data((const uchar*) m_metadata_buf.ptr(),
 | |
|                                   m_metadata_buf.length());
 | |
|  }
 | |
| 
 | |
| /**
 | |
|    stores an integer into packed format.
 | |
| 
 | |
|    @param[out] str_buf  a buffer where the packed integer will be stored.
 | |
|    @param[in] length  the integer will be packed.
 | |
|  */
 | |
| static inline
 | |
| void store_compressed_length(String &str_buf, ulonglong length)
 | |
| {
 | |
|   // Store Type and packed length
 | |
|   uchar buf[4];
 | |
|   uchar *buf_ptr = net_store_length(buf, length);
 | |
| 
 | |
|   str_buf.append(reinterpret_cast<char *>(buf), buf_ptr-buf);
 | |
| }
 | |
| 
 | |
| /**
 | |
|   Write data into str_buf with Type|Length|Value(TLV) format.
 | |
| 
 | |
|   @param[out] str_buf a buffer where the field is stored.
 | |
|   @param[in] type  type of the field
 | |
|   @param[in] length  length of the field value
 | |
|   @param[in] value  value of the field
 | |
| */
 | |
| static inline
 | |
| bool write_tlv_field(String &str_buf,
 | |
|                      enum Table_map_log_event::Optional_metadata_field_type
 | |
|                      type, uint length, const uchar *value)
 | |
| {
 | |
|   /* type is stored in one byte, so it should never bigger than 255. */
 | |
|   DBUG_ASSERT(static_cast<int>(type) <= 255);
 | |
|   str_buf.append((char) type);
 | |
|   store_compressed_length(str_buf, length);
 | |
|   return str_buf.append(reinterpret_cast<const char *>(value), length);
 | |
| }
 | |
| 
 | |
| /**
 | |
|   Write data into str_buf with Type|Length|Value(TLV) format.
 | |
| 
 | |
|   @param[out] str_buf a buffer where the field is stored.
 | |
|   @param[in] type  type of the field
 | |
|   @param[in] value  value of the field
 | |
| */
 | |
| static inline
 | |
| bool write_tlv_field(String &str_buf,
 | |
|                      enum Table_map_log_event::Optional_metadata_field_type
 | |
|                      type, const String &value)
 | |
| {
 | |
|   return write_tlv_field(str_buf, type, value.length(),
 | |
|                          reinterpret_cast<const uchar *>(value.ptr()));
 | |
| }
 | |
| 
 | |
| static inline bool is_character_field(Binlog_type_info *info_array, Field *field)
 | |
| {
 | |
|   Binlog_type_info *info= info_array + field->field_index;
 | |
|   if (!info->m_cs)
 | |
|     return 0;
 | |
|   if (info->m_set_typelib || info->m_enum_typelib)
 | |
|     return 0;
 | |
|   return 1;
 | |
| }
 | |
| 
 | |
| static inline bool is_enum_or_set_field(Binlog_type_info *info_array, Field *field) {
 | |
|   Binlog_type_info *info= info_array + field->field_index;
 | |
|   if (info->m_set_typelib || info->m_enum_typelib)
 | |
|     return 1;
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| 
 | |
| void Table_map_log_event::init_metadata_fields()
 | |
| {
 | |
|   DBUG_ENTER("init_metadata_fields");
 | |
|   DBUG_EXECUTE_IF("simulate_no_optional_metadata", DBUG_VOID_RETURN;);
 | |
| 
 | |
|   if (binlog_row_metadata == BINLOG_ROW_METADATA_NO_LOG)
 | |
|     DBUG_VOID_RETURN;
 | |
|   if (init_signedness_field() ||
 | |
|       init_charset_field(&is_character_field, DEFAULT_CHARSET,
 | |
|                          COLUMN_CHARSET) ||
 | |
|       init_geometry_type_field())
 | |
|   {
 | |
|     m_metadata_buf.length(0);
 | |
|     DBUG_VOID_RETURN;
 | |
|   }
 | |
| 
 | |
|   if (binlog_row_metadata == BINLOG_ROW_METADATA_FULL)
 | |
|   {
 | |
|     if (DBUG_EVALUATE_IF("dont_log_column_name", 0, init_column_name_field()) ||
 | |
|         init_charset_field(&is_enum_or_set_field, ENUM_AND_SET_DEFAULT_CHARSET,
 | |
|                            ENUM_AND_SET_COLUMN_CHARSET) ||
 | |
|         init_set_str_value_field() ||
 | |
|         init_enum_str_value_field() ||
 | |
|         init_primary_key_field())
 | |
|       m_metadata_buf.length(0);
 | |
|   }
 | |
|   DBUG_VOID_RETURN;
 | |
| }
 | |
| 
 | |
| bool Table_map_log_event::init_signedness_field()
 | |
| {
 | |
|   /* use it to store signed flags, each numeric column take a bit. */
 | |
|   StringBuffer<128> buf;
 | |
|   unsigned char flag= 0;
 | |
|   unsigned char mask= 0x80;
 | |
|   Binlog_type_info *info;
 | |
| 
 | |
|   for (unsigned int i= 0 ; i < m_table->s->fields ; ++i)
 | |
|   {
 | |
|     info= binlog_type_info_array + i;
 | |
|     if (info->m_signedness != Binlog_type_info::SIGN_NOT_APPLICABLE)
 | |
|     {
 | |
|       if (info->m_signedness == Binlog_type_info::SIGN_UNSIGNED)
 | |
|         flag|= mask;
 | |
|       mask >>= 1;
 | |
| 
 | |
|       // 8 fields are tested, store the result and clear the flag.
 | |
|       if (mask == 0)
 | |
|       {
 | |
|         buf.append(flag);
 | |
|         flag= 0;
 | |
|         mask= 0x80;
 | |
|       }
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   // Stores the signedness flags of last few columns
 | |
|   if (mask != 0x80)
 | |
|     buf.append(flag);
 | |
| 
 | |
|   // The table has no numeric column, so don't log SIGNEDNESS field
 | |
|   if (buf.is_empty())
 | |
|     return false;
 | |
| 
 | |
|   return write_tlv_field(m_metadata_buf, SIGNEDNESS, buf);
 | |
| }
 | |
| 
 | |
| bool Table_map_log_event::init_charset_field(
 | |
|     bool (* include_type)(Binlog_type_info *, Field *),
 | |
|     Optional_metadata_field_type default_charset_type,
 | |
|     Optional_metadata_field_type column_charset_type)
 | |
| {
 | |
|   DBUG_EXECUTE_IF("simulate_init_charset_field_error", return true;);
 | |
| 
 | |
|   std::map<uint, uint> collation_map;
 | |
|   // For counting characters columns
 | |
|   uint char_col_cnt= 0;
 | |
| 
 | |
|   /* Find the collation number used by most fields */
 | |
|   for (unsigned int i= 0 ; i < m_table->s->fields ; ++i)
 | |
|   {
 | |
|     if ((*include_type)(binlog_type_info_array, m_table->field[i]))
 | |
|     {
 | |
|       collation_map[binlog_type_info_array[i].m_cs->number]++;
 | |
|       char_col_cnt++;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   if (char_col_cnt == 0)
 | |
|     return false;
 | |
| 
 | |
|   /* Find the most used collation */
 | |
|   uint most_used_collation= 0;
 | |
|   uint most_used_count= 0;
 | |
|   for (std::map<uint, uint>::iterator it= collation_map.begin();
 | |
|        it != collation_map.end(); it++)
 | |
|   {
 | |
|     if (it->second > most_used_count)
 | |
|     {
 | |
|       most_used_count= it->second;
 | |
|       most_used_collation= it->first;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   /*
 | |
|     Comparing length of COLUMN_CHARSET field and COLUMN_CHARSET_WITH_DEFAULT
 | |
|     field to decide which field should be logged.
 | |
| 
 | |
|     Length of COLUMN_CHARSET = character column count * collation id size.
 | |
|     Length of COLUMN_CHARSET_WITH_DEFAULT =
 | |
|      default collation_id size + count of columns not use default charset *
 | |
|      (column index size + collation id size)
 | |
| 
 | |
|     Assume column index just uses 1 byte and collation number also uses 1 byte.
 | |
|   */
 | |
|   if (char_col_cnt * 1 < (1 + (char_col_cnt - most_used_count) * 2))
 | |
|   {
 | |
|     StringBuffer<512> buf;
 | |
| 
 | |
|     /*
 | |
|       Stores character set information into COLUMN_CHARSET format,
 | |
|       character sets of all columns are stored one by one.
 | |
|       -----------------------------------------
 | |
|       | Charset number | .... |Charset number |
 | |
|       -----------------------------------------
 | |
|     */
 | |
|     for (unsigned int i= 0 ; i < m_table->s->fields ; ++i)
 | |
|     {
 | |
|       if (include_type(binlog_type_info_array, m_table->field[i]))
 | |
|         store_compressed_length(buf, binlog_type_info_array[i].m_cs->number);
 | |
|     }
 | |
|     return write_tlv_field(m_metadata_buf, column_charset_type, buf);
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     StringBuffer<512> buf;
 | |
|     uint char_column_index= 0;
 | |
|     uint default_collation= most_used_collation;
 | |
| 
 | |
|     /*
 | |
|       Stores character set information into DEFAULT_CHARSET format,
 | |
|       First stores the default character set, and then stores the character
 | |
|       sets different to default character with their column index one by one.
 | |
|       --------------------------------------------------------
 | |
|       | Default Charset | Col Index | Charset number | ...   |
 | |
|       --------------------------------------------------------
 | |
|     */
 | |
| 
 | |
|     // Store the default collation number
 | |
|     store_compressed_length(buf, default_collation);
 | |
| 
 | |
|     for (unsigned int i= 0 ; i < m_table->s->fields ; ++i)
 | |
|     {
 | |
|       if (include_type(binlog_type_info_array, m_table->field[i]))
 | |
|       {
 | |
|         CHARSET_INFO *cs= binlog_type_info_array[i].m_cs;
 | |
|         DBUG_ASSERT(cs);
 | |
|         if (cs->number != default_collation)
 | |
|         {
 | |
|           store_compressed_length(buf, char_column_index);
 | |
|           store_compressed_length(buf, cs->number);
 | |
|         }
 | |
|         char_column_index++;
 | |
|       }
 | |
|     }
 | |
|     return write_tlv_field(m_metadata_buf, default_charset_type, buf);
 | |
|   }
 | |
| }
 | |
| 
 | |
| bool Table_map_log_event::init_column_name_field()
 | |
| {
 | |
|   StringBuffer<2048> buf;
 | |
| 
 | |
|   for (unsigned int i= 0 ; i < m_table->s->fields ; ++i)
 | |
|   {
 | |
|     size_t len= m_table->field[i]->field_name.length;
 | |
| 
 | |
|     store_compressed_length(buf, len);
 | |
|     buf.append(m_table->field[i]->field_name.str, len);
 | |
|   }
 | |
|   return write_tlv_field(m_metadata_buf, COLUMN_NAME, buf);
 | |
| }
 | |
| 
 | |
| bool Table_map_log_event::init_set_str_value_field()
 | |
| {
 | |
|   StringBuffer<1024> buf;
 | |
|   TYPELIB *typelib;
 | |
| 
 | |
|   /*
 | |
|     SET string values are stored in the same format:
 | |
|     ----------------------------------------------
 | |
|     | Value number | value1 len | value 1|  .... |  // first SET column
 | |
|     ----------------------------------------------
 | |
|     | Value number | value1 len | value 1|  .... |  // second SET column
 | |
|     ----------------------------------------------
 | |
|    */
 | |
|   for (unsigned int i= 0 ; i < m_table->s->fields ; ++i)
 | |
|   {
 | |
|     if ((typelib= binlog_type_info_array[i].m_set_typelib))
 | |
|     {
 | |
|       store_compressed_length(buf, typelib->count);
 | |
|       for (unsigned int i= 0; i < typelib->count; i++)
 | |
|       {
 | |
|         store_compressed_length(buf, typelib->type_lengths[i]);
 | |
|         buf.append(typelib->type_names[i], typelib->type_lengths[i]);
 | |
|       }
 | |
|     }
 | |
|   }
 | |
|   if (buf.length() > 0)
 | |
|     return write_tlv_field(m_metadata_buf, SET_STR_VALUE, buf);
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| bool Table_map_log_event::init_enum_str_value_field()
 | |
| {
 | |
|   StringBuffer<1024> buf;
 | |
|   TYPELIB *typelib;
 | |
| 
 | |
|   /* ENUM is same to SET columns, see comment in init_set_str_value_field */
 | |
|   for (unsigned int i= 0 ; i < m_table->s->fields ; ++i)
 | |
|   {
 | |
|     if ((typelib= binlog_type_info_array[i].m_enum_typelib))
 | |
|     {
 | |
|       store_compressed_length(buf, typelib->count);
 | |
|       for (unsigned int i= 0; i < typelib->count; i++)
 | |
|       {
 | |
|         store_compressed_length(buf, typelib->type_lengths[i]);
 | |
|         buf.append(typelib->type_names[i], typelib->type_lengths[i]);
 | |
|       }
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   if (buf.length() > 0)
 | |
|     return write_tlv_field(m_metadata_buf, ENUM_STR_VALUE, buf);
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| bool Table_map_log_event::init_geometry_type_field()
 | |
| {
 | |
|   StringBuffer<256> buf;
 | |
|   uint geom_type;
 | |
| 
 | |
|   /* Geometry type of geometry columns is stored one by one as packed length */
 | |
|   for (unsigned int i= 0 ; i < m_table->s->fields ; ++i)
 | |
|   {
 | |
|     if (binlog_type_info_array[i].m_type_code == MYSQL_TYPE_GEOMETRY)
 | |
|     {
 | |
|       geom_type= binlog_type_info_array[i].m_geom_type;
 | |
|       DBUG_EXECUTE_IF("inject_invalid_geometry_type", geom_type= 100;);
 | |
|       store_compressed_length(buf, geom_type);
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   if (buf.length() > 0)
 | |
|     return write_tlv_field(m_metadata_buf, GEOMETRY_TYPE, buf);
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| bool Table_map_log_event::init_primary_key_field()
 | |
| {
 | |
|   DBUG_EXECUTE_IF("simulate_init_primary_key_field_error", return true;);
 | |
| 
 | |
|   if (unlikely(m_table->s->primary_key == MAX_KEY))
 | |
|     return false;
 | |
| 
 | |
|   // If any key column uses prefix like KEY(c1(10)) */
 | |
|   bool has_prefix= false;
 | |
|   KEY *pk= m_table->key_info + m_table->s->primary_key;
 | |
| 
 | |
|   DBUG_ASSERT(pk->user_defined_key_parts > 0);
 | |
| 
 | |
|   /* Check if any key column uses prefix */
 | |
|   for (uint i= 0; i < pk->user_defined_key_parts; i++)
 | |
|   {
 | |
|     KEY_PART_INFO *key_part= pk->key_part+i;
 | |
|     if (key_part->length != m_table->field[key_part->fieldnr-1]->key_length())
 | |
|     {
 | |
|       has_prefix= true;
 | |
|       break;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   StringBuffer<128> buf;
 | |
| 
 | |
|   if (!has_prefix)
 | |
|   {
 | |
|     /* Index of PK columns are stored one by one. */
 | |
|     for (uint i= 0; i < pk->user_defined_key_parts; i++)
 | |
|     {
 | |
|       KEY_PART_INFO *key_part= pk->key_part+i;
 | |
|       store_compressed_length(buf, key_part->fieldnr-1);
 | |
|     }
 | |
|     return write_tlv_field(m_metadata_buf, SIMPLE_PRIMARY_KEY, buf);
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     /* Index of PK columns are stored with a prefix length one by one. */
 | |
|     for (uint i= 0; i < pk->user_defined_key_parts; i++)
 | |
|     {
 | |
|       KEY_PART_INFO *key_part= pk->key_part+i;
 | |
|       size_t prefix= 0;
 | |
| 
 | |
|       store_compressed_length(buf, key_part->fieldnr-1);
 | |
| 
 | |
|       // Store character length but not octet length
 | |
|       if (key_part->length != m_table->field[key_part->fieldnr-1]->key_length())
 | |
|         prefix= key_part->length / key_part->field->charset()->mbmaxlen;
 | |
|       store_compressed_length(buf, prefix);
 | |
|     }
 | |
|     return write_tlv_field(m_metadata_buf, PRIMARY_KEY_WITH_PREFIX, buf);
 | |
|   }
 | |
| }
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| /*
 | |
|   Print some useful information for the SHOW BINARY LOG information
 | |
|   field.
 | |
|  */
 | |
| 
 | |
| void Table_map_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|     char buf[256];
 | |
|     size_t bytes= my_snprintf(buf, sizeof(buf),
 | |
|                               "table_id: %llu (%s.%s)",
 | |
|                               m_table_id, m_dbnam, m_tblnam);
 | |
|     protocol->store(buf, bytes, &my_charset_bin);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Write_rows_log_event member functions
 | |
| **************************************************************************/
 | |
| 
 | |
| /*
 | |
|   Constructor used to build an event for writing to the binary log.
 | |
|  */
 | |
| Write_rows_log_event::Write_rows_log_event(THD *thd_arg, TABLE *tbl_arg,
 | |
|                                            ulonglong tid_arg,
 | |
|                                            bool is_transactional)
 | |
|   :Rows_log_event(thd_arg, tbl_arg, tid_arg, tbl_arg->rpl_write_set,
 | |
|                   is_transactional, WRITE_ROWS_EVENT_V1)
 | |
| {
 | |
| }
 | |
| 
 | |
| Write_rows_compressed_log_event::Write_rows_compressed_log_event(
 | |
|                                            THD *thd_arg,
 | |
|                                            TABLE *tbl_arg,
 | |
|                                            ulonglong tid_arg,
 | |
|                                            bool is_transactional)
 | |
|   : Write_rows_log_event(thd_arg, tbl_arg, tid_arg, is_transactional)
 | |
| {
 | |
|   m_type = WRITE_ROWS_COMPRESSED_EVENT_V1;
 | |
| }
 | |
| 
 | |
| bool Write_rows_compressed_log_event::write()
 | |
| {
 | |
|   return Rows_log_event::write_compressed();
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| int 
 | |
| Write_rows_log_event::do_before_row_operations(const Slave_reporting_capability *const)
 | |
| {
 | |
|   int error= 0;
 | |
| 
 | |
|   /*
 | |
|     Increment the global status insert count variable
 | |
|   */
 | |
|   if (get_flags(STMT_END_F))
 | |
|     status_var_increment(thd->status_var.com_stat[SQLCOM_INSERT]);
 | |
| 
 | |
|   /**
 | |
|      todo: to introduce a property for the event (handler?) which forces
 | |
|      applying the event in the replace (idempotent) fashion.
 | |
|   */
 | |
|   if (slave_exec_mode == SLAVE_EXEC_MODE_IDEMPOTENT)
 | |
|   {
 | |
|     /*
 | |
|       We are using REPLACE semantics and not INSERT IGNORE semantics
 | |
|       when writing rows, that is: new rows replace old rows.  We need to
 | |
|       inform the storage engine that it should use this behaviour.
 | |
|     */
 | |
|     
 | |
|     /* Tell the storage engine that we are using REPLACE semantics. */
 | |
|     thd->lex->duplicates= DUP_REPLACE;
 | |
|     
 | |
|     /*
 | |
|       Pretend we're executing a REPLACE command: this is needed for
 | |
|       InnoDB since it is not (properly) checking the lex->duplicates flag.
 | |
|     */
 | |
|     thd->lex->sql_command= SQLCOM_REPLACE;
 | |
|     /* 
 | |
|        Do not raise the error flag in case of hitting to an unique attribute
 | |
|     */
 | |
|     m_table->file->extra(HA_EXTRA_IGNORE_DUP_KEY);
 | |
|     /* 
 | |
|        The following is needed in case if we have AFTER DELETE triggers.
 | |
|     */
 | |
|     m_table->file->extra(HA_EXTRA_WRITE_CAN_REPLACE);
 | |
|     m_table->file->extra(HA_EXTRA_IGNORE_NO_KEY);
 | |
|   }
 | |
|   if (m_table->triggers && do_invoke_trigger())
 | |
|     m_table->prepare_triggers_for_insert_stmt_or_event();
 | |
| 
 | |
|   /* Honor next number column if present */
 | |
|   m_table->next_number_field= m_table->found_next_number_field;
 | |
|   /*
 | |
|    * Fixed Bug#45999, In RBR, Store engine of Slave auto-generates new
 | |
|    * sequence numbers for auto_increment fields if the values of them are 0.
 | |
|    * If generateing a sequence number is decided by the values of
 | |
|    * table->auto_increment_field_not_null and SQL_MODE(if includes
 | |
|    * MODE_NO_AUTO_VALUE_ON_ZERO) in update_auto_increment function.
 | |
|    * SQL_MODE of slave sql thread is always consistency with master's.
 | |
|    * In RBR, auto_increment fields never are NULL, except if the auto_inc
 | |
|    * column exists only on the slave side (i.e., in an extra column
 | |
|    * on the slave's table).
 | |
|    */
 | |
|   if (!is_auto_inc_in_extra_columns())
 | |
|     m_table->auto_increment_field_not_null= TRUE;
 | |
|   else
 | |
|   {
 | |
|     /*
 | |
|       Here we have checked that there is an extra field
 | |
|       on this server's table that has an auto_inc column.
 | |
| 
 | |
|       Mark that the auto_increment field is null and mark
 | |
|       the read and write set bits.
 | |
| 
 | |
|       (There can only be one AUTO_INC column, it is always
 | |
|        indexed and it cannot have a DEFAULT value).
 | |
|     */
 | |
|     m_table->auto_increment_field_not_null= FALSE;
 | |
|     m_table->mark_auto_increment_column(true);
 | |
|   }
 | |
| 
 | |
|   return error;
 | |
| }
 | |
| 
 | |
| int 
 | |
| Write_rows_log_event::do_after_row_operations(const Slave_reporting_capability *const,
 | |
|                                               int error)
 | |
| {
 | |
|   int local_error= 0;
 | |
| 
 | |
|   /**
 | |
|     Clear the write_set bit for auto_inc field that only
 | |
|     existed on the destination table as an extra column.
 | |
|    */
 | |
|   if (is_auto_inc_in_extra_columns())
 | |
|   {
 | |
|     bitmap_clear_bit(m_table->rpl_write_set,
 | |
|                      m_table->next_number_field->field_index);
 | |
|     bitmap_clear_bit(m_table->read_set,
 | |
|                      m_table->next_number_field->field_index);
 | |
| 
 | |
|     if (get_flags(STMT_END_F))
 | |
|       m_table->file->ha_release_auto_increment();
 | |
|   }
 | |
|   m_table->next_number_field=0;
 | |
|   m_table->auto_increment_field_not_null= FALSE;
 | |
|   if (slave_exec_mode == SLAVE_EXEC_MODE_IDEMPOTENT)
 | |
|   {
 | |
|     m_table->file->extra(HA_EXTRA_NO_IGNORE_DUP_KEY);
 | |
|     m_table->file->extra(HA_EXTRA_WRITE_CANNOT_REPLACE);
 | |
|     /*
 | |
|       resetting the extra with 
 | |
|       table->file->extra(HA_EXTRA_NO_IGNORE_NO_KEY); 
 | |
|       fires bug#27077
 | |
|       explanation: file->reset() performs this duty
 | |
|       ultimately. Still todo: fix
 | |
|     */
 | |
|   }
 | |
|   if (unlikely((local_error= m_table->file->ha_end_bulk_insert())))
 | |
|   {
 | |
|     m_table->file->print_error(local_error, MYF(0));
 | |
|   }
 | |
|   return error? error : local_error;
 | |
| }
 | |
| 
 | |
| bool Rows_log_event::process_triggers(trg_event_type event,
 | |
|                                       trg_action_time_type time_type,
 | |
|                                       bool old_row_is_record1)
 | |
| {
 | |
|   bool result;
 | |
|   DBUG_ENTER("Rows_log_event::process_triggers");
 | |
|   m_table->triggers->mark_fields_used(event);
 | |
|   if (slave_run_triggers_for_rbr == SLAVE_RUN_TRIGGERS_FOR_RBR_YES)
 | |
|   {
 | |
|     result= m_table->triggers->process_triggers(thd, event,
 | |
|                                                 time_type,
 | |
|                                                 old_row_is_record1);
 | |
|   }
 | |
|   else
 | |
|     result= m_table->triggers->process_triggers(thd, event,
 | |
|                                                 time_type,
 | |
|                                                 old_row_is_record1);
 | |
| 
 | |
|   DBUG_RETURN(result);
 | |
| }
 | |
| /*
 | |
|   Check if there are more UNIQUE keys after the given key.
 | |
| */
 | |
| static int
 | |
| last_uniq_key(TABLE *table, uint keyno)
 | |
| {
 | |
|   while (++keyno < table->s->keys)
 | |
|     if (table->key_info[keyno].flags & HA_NOSAME)
 | |
|       return 0;
 | |
|   return 1;
 | |
| }
 | |
| 
 | |
| /**
 | |
|    Check if an error is a duplicate key error.
 | |
| 
 | |
|    This function is used to check if an error code is one of the
 | |
|    duplicate key error, i.e., and error code for which it is sensible
 | |
|    to do a <code>get_dup_key()</code> to retrieve the duplicate key.
 | |
| 
 | |
|    @param errcode The error code to check.
 | |
| 
 | |
|    @return <code>true</code> if the error code is such that
 | |
|    <code>get_dup_key()</code> will return true, <code>false</code>
 | |
|    otherwise.
 | |
|  */
 | |
| bool
 | |
| is_duplicate_key_error(int errcode)
 | |
| {
 | |
|   switch (errcode)
 | |
|   {
 | |
|   case HA_ERR_FOUND_DUPP_KEY:
 | |
|   case HA_ERR_FOUND_DUPP_UNIQUE:
 | |
|     return true;
 | |
|   }
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| /**
 | |
|   Write the current row into event's table.
 | |
| 
 | |
|   The row is located in the row buffer, pointed by @c m_curr_row member.
 | |
|   Number of columns of the row is stored in @c m_width member (it can be 
 | |
|   different from the number of columns in the table to which we insert). 
 | |
|   Bitmap @c m_cols indicates which columns are present in the row. It is assumed 
 | |
|   that event's table is already open and pointed by @c m_table.
 | |
| 
 | |
|   If the same record already exists in the table it can be either overwritten 
 | |
|   or an error is reported depending on the value of @c overwrite flag 
 | |
|   (error reporting not yet implemented). Note that the matching record can be
 | |
|   different from the row we insert if we use primary keys to identify records in
 | |
|   the table.
 | |
| 
 | |
|   The row to be inserted can contain values only for selected columns. The 
 | |
|   missing columns are filled with default values using @c prepare_record() 
 | |
|   function. If a matching record is found in the table and @c overwritte is
 | |
|   true, the missing columns are taken from it.
 | |
| 
 | |
|   @param  rli   Relay log info (needed for row unpacking).
 | |
|   @param  overwrite  
 | |
|                 Shall we overwrite if the row already exists or signal 
 | |
|                 error (currently ignored).
 | |
| 
 | |
|   @returns Error code on failure, 0 on success.
 | |
| 
 | |
|   This method, if successful, sets @c m_curr_row_end pointer to point at the
 | |
|   next row in the rows buffer. This is done when unpacking the row to be 
 | |
|   inserted.
 | |
| 
 | |
|   @note If a matching record is found, it is either updated using 
 | |
|   @c ha_update_row() or first deleted and then new record written.
 | |
| */ 
 | |
| 
 | |
| int
 | |
| Rows_log_event::write_row(rpl_group_info *rgi,
 | |
|                           const bool overwrite)
 | |
| {
 | |
|   DBUG_ENTER("write_row");
 | |
|   DBUG_ASSERT(m_table != NULL && thd != NULL);
 | |
| 
 | |
|   TABLE *table= m_table;  // pointer to event's table
 | |
|   int error;
 | |
|   int UNINIT_VAR(keynum);
 | |
|   const bool invoke_triggers= (m_table->triggers && do_invoke_trigger());
 | |
|   auto_afree_ptr<char> key(NULL);
 | |
| 
 | |
|   prepare_record(table, m_width, true);
 | |
| 
 | |
|   /* unpack row into table->record[0] */
 | |
|   if (unlikely((error= unpack_current_row(rgi))))
 | |
|   {
 | |
|     table->file->print_error(error, MYF(0));
 | |
|     DBUG_RETURN(error);
 | |
|   }
 | |
| 
 | |
|   if (m_curr_row == m_rows_buf && !invoke_triggers && !table->s->long_unique_table)
 | |
|   {
 | |
|     /*
 | |
|        This table has no triggers so we can do bulk insert.
 | |
| 
 | |
|        This is the first row to be inserted, we estimate the rows with
 | |
|        the size of the first row and use that value to initialize
 | |
|        storage engine for bulk insertion.
 | |
|     */
 | |
|     /* this is the first row to be inserted, we estimate the rows with
 | |
|        the size of the first row and use that value to initialize
 | |
|        storage engine for bulk insertion */
 | |
|     DBUG_ASSERT(!(m_curr_row > m_curr_row_end));
 | |
|     ha_rows estimated_rows= 0;
 | |
|     if (m_curr_row < m_curr_row_end)
 | |
|       estimated_rows= (m_rows_end - m_curr_row) / (m_curr_row_end - m_curr_row);
 | |
|     else if (m_curr_row == m_curr_row_end)
 | |
|       estimated_rows= 1;
 | |
| 
 | |
|     table->file->ha_start_bulk_insert(estimated_rows);
 | |
|   }
 | |
| 
 | |
|   /*
 | |
|     Explicitly set the auto_inc to null to make sure that
 | |
|     it gets an auto_generated value.
 | |
|   */
 | |
|   if (is_auto_inc_in_extra_columns())
 | |
|     m_table->next_number_field->set_null();
 | |
|   
 | |
|   DBUG_DUMP("record[0]", table->record[0], table->s->reclength);
 | |
|   DBUG_PRINT_BITSET("debug", "rpl_write_set: %s", table->rpl_write_set);
 | |
|   DBUG_PRINT_BITSET("debug", "read_set:      %s", table->read_set);
 | |
| 
 | |
|   if (table->s->long_unique_table)
 | |
|     table->update_virtual_fields(table->file, VCOL_UPDATE_FOR_WRITE);
 | |
| 
 | |
|   if (invoke_triggers &&
 | |
|       unlikely(process_triggers(TRG_EVENT_INSERT, TRG_ACTION_BEFORE, TRUE)))
 | |
|   {
 | |
|     DBUG_RETURN(HA_ERR_GENERIC); // in case if error is not set yet
 | |
|   }
 | |
| 
 | |
|   // Handle INSERT.
 | |
|   if (table->versioned(VERS_TIMESTAMP))
 | |
|   {
 | |
|     ulong sec_part;
 | |
|     bitmap_set_bit(table->read_set, table->vers_start_field()->field_index);
 | |
|     table->file->column_bitmaps_signal();
 | |
|     // Check whether a row came from unversioned table and fix vers fields.
 | |
|     if (table->vers_start_field()->get_timestamp(&sec_part) == 0 && sec_part == 0)
 | |
|       table->vers_update_fields();
 | |
|   }
 | |
| 
 | |
|   /* 
 | |
|     Try to write record. If a corresponding record already exists in the table,
 | |
|     we try to change it using ha_update_row() if possible. Otherwise we delete
 | |
|     it and repeat the whole process again. 
 | |
| 
 | |
|     TODO: Add safety measures against infinite looping. 
 | |
|    */
 | |
| 
 | |
|   DBUG_EXECUTE_IF("write_row_inject_sleep_before_ha_write_row",
 | |
|                   my_sleep(20000););
 | |
|   if (table->s->sequence)
 | |
|     error= update_sequence();
 | |
|   else while (unlikely(error= table->file->ha_write_row(table->record[0])))
 | |
|   {
 | |
|     if (error == HA_ERR_LOCK_DEADLOCK ||
 | |
|         error == HA_ERR_LOCK_WAIT_TIMEOUT ||
 | |
|         (keynum= table->file->get_dup_key(error)) < 0 ||
 | |
|         !overwrite)
 | |
|     {
 | |
|       DBUG_PRINT("info",("get_dup_key returns %d)", keynum));
 | |
|       /*
 | |
|         Deadlock, waiting for lock or just an error from the handler
 | |
|         such as HA_ERR_FOUND_DUPP_KEY when overwrite is false.
 | |
|         Retrieval of the duplicate key number may fail
 | |
|         - either because the error was not "duplicate key" error
 | |
|         - or because the information which key is not available
 | |
|       */
 | |
|       table->file->print_error(error, MYF(0));
 | |
|       DBUG_RETURN(error);
 | |
|     }
 | |
|     /*
 | |
|        We need to retrieve the old row into record[1] to be able to
 | |
|        either update or delete the offending record.  We either:
 | |
| 
 | |
|        - use rnd_pos() with a row-id (available as dupp_row) to the
 | |
|          offending row, if that is possible (MyISAM and Blackhole), or else
 | |
| 
 | |
|        - use index_read_idx() with the key that is duplicated, to
 | |
|          retrieve the offending row.
 | |
|      */
 | |
|     if (table->file->ha_table_flags() & HA_DUPLICATE_POS)
 | |
|     {
 | |
|       DBUG_PRINT("info",("Locating offending record using rnd_pos()"));
 | |
| 
 | |
|       if ((error= table->file->ha_rnd_init_with_error(0)))
 | |
|       {
 | |
|         DBUG_RETURN(error);
 | |
|       }
 | |
| 
 | |
|       error= table->file->ha_rnd_pos(table->record[1], table->file->dup_ref);
 | |
|       if (unlikely(error))
 | |
|       {
 | |
|         DBUG_PRINT("info",("rnd_pos() returns error %d",error));
 | |
|         table->file->print_error(error, MYF(0));
 | |
|         DBUG_RETURN(error);
 | |
|       }
 | |
|       table->file->ha_rnd_end();
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       DBUG_PRINT("info",("Locating offending record using index_read_idx()"));
 | |
| 
 | |
|       if (table->file->extra(HA_EXTRA_FLUSH_CACHE))
 | |
|       {
 | |
|         DBUG_PRINT("info",("Error when setting HA_EXTRA_FLUSH_CACHE"));
 | |
|         DBUG_RETURN(my_errno);
 | |
|       }
 | |
| 
 | |
|       if (key.get() == NULL)
 | |
|       {
 | |
|         key.assign(static_cast<char*>(my_alloca(table->s->max_unique_length)));
 | |
|         if (key.get() == NULL)
 | |
|         {
 | |
|           DBUG_PRINT("info",("Can't allocate key buffer"));
 | |
|           DBUG_RETURN(ENOMEM);
 | |
|         }
 | |
|       }
 | |
| 
 | |
|       key_copy((uchar*)key.get(), table->record[0], table->key_info + keynum,
 | |
|                0);
 | |
|       error= table->file->ha_index_read_idx_map(table->record[1], keynum,
 | |
|                                                 (const uchar*)key.get(),
 | |
|                                                 HA_WHOLE_KEY,
 | |
|                                                 HA_READ_KEY_EXACT);
 | |
|       if (unlikely(error))
 | |
|       {
 | |
|         DBUG_PRINT("info",("index_read_idx() returns %s", HA_ERR(error)));
 | |
|         table->file->print_error(error, MYF(0));
 | |
|         DBUG_RETURN(error);
 | |
|       }
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|        Now, record[1] should contain the offending row.  That
 | |
|        will enable us to update it or, alternatively, delete it (so
 | |
|        that we can insert the new row afterwards).
 | |
|     */
 | |
|     if (table->s->long_unique_table)
 | |
|     {
 | |
|       /* same as for REPLACE/ODKU */
 | |
|       table->move_fields(table->field, table->record[1], table->record[0]);
 | |
|       table->update_virtual_fields(table->file, VCOL_UPDATE_FOR_REPLACE);
 | |
|       table->move_fields(table->field, table->record[0], table->record[1]);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|       If row is incomplete we will use the record found to fill 
 | |
|       missing columns.  
 | |
|     */
 | |
|     if (!get_flags(COMPLETE_ROWS_F))
 | |
|     {
 | |
|       restore_record(table,record[1]);
 | |
|       error= unpack_current_row(rgi);
 | |
|       if (table->s->long_unique_table)
 | |
|         table->update_virtual_fields(table->file, VCOL_UPDATE_FOR_WRITE);
 | |
|     }
 | |
| 
 | |
|     DBUG_PRINT("debug",("preparing for update: before and after image"));
 | |
|     DBUG_DUMP("record[1] (before)", table->record[1], table->s->reclength);
 | |
|     DBUG_DUMP("record[0] (after)", table->record[0], table->s->reclength);
 | |
| 
 | |
|     /*
 | |
|        REPLACE is defined as either INSERT or DELETE + INSERT.  If
 | |
|        possible, we can replace it with an UPDATE, but that will not
 | |
|        work on InnoDB if FOREIGN KEY checks are necessary.
 | |
| 
 | |
|        I (Matz) am not sure of the reason for the last_uniq_key()
 | |
|        check as, but I'm guessing that it's something along the
 | |
|        following lines.
 | |
| 
 | |
|        Suppose that we got the duplicate key to be a key that is not
 | |
|        the last unique key for the table and we perform an update:
 | |
|        then there might be another key for which the unique check will
 | |
|        fail, so we're better off just deleting the row and inserting
 | |
|        the correct row.
 | |
| 
 | |
|        Additionally we don't use UPDATE if rbr triggers should be invoked -
 | |
|        when triggers are used we want a simple and predictable execution path.
 | |
|      */
 | |
|     if (last_uniq_key(table, keynum) && !invoke_triggers &&
 | |
|         !table->file->referenced_by_foreign_key())
 | |
|     {
 | |
|       DBUG_PRINT("info",("Updating row using ha_update_row()"));
 | |
|       error= table->file->ha_update_row(table->record[1],
 | |
|                                        table->record[0]);
 | |
|       switch (error) {
 | |
| 
 | |
|       case HA_ERR_RECORD_IS_THE_SAME:
 | |
|         DBUG_PRINT("info",("ignoring HA_ERR_RECORD_IS_THE_SAME error from"
 | |
|                            " ha_update_row()"));
 | |
|         error= 0;
 | |
| 
 | |
|       case 0:
 | |
|         break;
 | |
| 
 | |
|       default:
 | |
|         DBUG_PRINT("info",("ha_update_row() returns error %d",error));
 | |
|         table->file->print_error(error, MYF(0));
 | |
|       }
 | |
| 
 | |
|       DBUG_RETURN(error);
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       DBUG_PRINT("info",("Deleting offending row and trying to write new one again"));
 | |
|       if (invoke_triggers &&
 | |
|           unlikely(process_triggers(TRG_EVENT_DELETE, TRG_ACTION_BEFORE,
 | |
|                                     TRUE)))
 | |
|         error= HA_ERR_GENERIC; // in case if error is not set yet
 | |
|       else
 | |
|       {
 | |
|         if (unlikely((error= table->file->ha_delete_row(table->record[1]))))
 | |
|         {
 | |
|           DBUG_PRINT("info",("ha_delete_row() returns error %d",error));
 | |
|           table->file->print_error(error, MYF(0));
 | |
|           DBUG_RETURN(error);
 | |
|         }
 | |
|         if (invoke_triggers &&
 | |
|             unlikely(process_triggers(TRG_EVENT_DELETE, TRG_ACTION_AFTER,
 | |
|                                       TRUE)))
 | |
|           DBUG_RETURN(HA_ERR_GENERIC); // in case if error is not set yet
 | |
|       }
 | |
|       /* Will retry ha_write_row() with the offending row removed. */
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   if (invoke_triggers &&
 | |
|       unlikely(process_triggers(TRG_EVENT_INSERT, TRG_ACTION_AFTER, TRUE)))
 | |
|     error= HA_ERR_GENERIC; // in case if error is not set yet
 | |
| 
 | |
|   DBUG_RETURN(error);
 | |
| }
 | |
| 
 | |
| 
 | |
| int Rows_log_event::update_sequence()
 | |
| {
 | |
|   TABLE *table= m_table;  // pointer to event's table
 | |
|   bool old_master= false;
 | |
|   int err= 0;
 | |
| 
 | |
|   if (!bitmap_is_set(table->rpl_write_set, MIN_VALUE_FIELD_NO) ||
 | |
|       (
 | |
| #if defined(WITH_WSREP)
 | |
|        ! WSREP(thd) &&
 | |
| #endif
 | |
|        table->in_use->rgi_slave &&
 | |
|        !(table->in_use->rgi_slave->gtid_ev_flags2 & Gtid_log_event::FL_DDL) &&
 | |
|        !(old_master=
 | |
|          rpl_master_has_bug(thd->rgi_slave->rli,
 | |
|                             29621, FALSE, FALSE, FALSE, TRUE))))
 | |
|   {
 | |
|     /* This event come from a setval function executed on the master.
 | |
|        Update the sequence next_number and round, like we do with setval()
 | |
|     */
 | |
|     MY_BITMAP *old_map= dbug_tmp_use_all_columns(table,
 | |
|                                                  &table->read_set);
 | |
|     longlong nextval= table->field[NEXT_FIELD_NO]->val_int();
 | |
|     longlong round= table->field[ROUND_FIELD_NO]->val_int();
 | |
|     dbug_tmp_restore_column_map(&table->read_set, old_map);
 | |
| 
 | |
|     return table->s->sequence->set_value(table, nextval, round, 0) > 0;
 | |
|   }
 | |
|   if (old_master && !WSREP(thd) && thd->rgi_slave->is_parallel_exec)
 | |
|   {
 | |
|     DBUG_ASSERT(thd->rgi_slave->parallel_entry);
 | |
|     /*
 | |
|       With parallel replication enabled, we can't execute alongside any other
 | |
|       transaction in which we may depend, so we force retry to release
 | |
|       the server layer table lock for possible prior in binlog order
 | |
|       same table transactions.
 | |
|     */
 | |
|     if (thd->rgi_slave->parallel_entry->last_committed_sub_id <
 | |
|         thd->rgi_slave->wait_commit_sub_id)
 | |
|     {
 | |
|       err= ER_LOCK_DEADLOCK;
 | |
|       my_error(err, MYF(0));
 | |
|     }
 | |
|   }
 | |
|   /*
 | |
|     Update all fields in table and update the active sequence, like with
 | |
|     ALTER SEQUENCE
 | |
|   */
 | |
|   return err == 0 ? table->file->ha_write_row(table->record[0]) : err;
 | |
| }
 | |
| 
 | |
| 
 | |
| #endif
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| int
 | |
| Write_rows_log_event::do_exec_row(rpl_group_info *rgi)
 | |
| {
 | |
|   DBUG_ASSERT(m_table != NULL);
 | |
|   const char *tmp= thd->get_proc_info();
 | |
|   char *message, msg[128];
 | |
|   const LEX_CSTRING &table_name= m_table->s->table_name;
 | |
|   const char quote_char=
 | |
|     get_quote_char_for_identifier(thd, table_name.str, table_name.length);
 | |
|   my_snprintf(msg, sizeof msg,
 | |
|               "Write_rows_log_event::write_row() on table %c%.*s%c",
 | |
|               quote_char, int(table_name.length), table_name.str, quote_char);
 | |
|   message= msg;
 | |
|   int error;
 | |
| 
 | |
| #ifdef WSREP_PROC_INFO
 | |
|   my_snprintf(thd->wsrep_info, sizeof(thd->wsrep_info) - 1,
 | |
|               "Write_rows_log_event::write_row(%lld) on table %c%.*s%c",
 | |
|               (long long) wsrep_thd_trx_seqno(thd), quote_char,
 | |
|               int(table_name.length), table_name.str, quote_char);
 | |
|   message= thd->wsrep_info;
 | |
| #endif /* WSREP_PROC_INFO */
 | |
| 
 | |
|   thd_proc_info(thd, message);
 | |
|   error= write_row(rgi, slave_exec_mode == SLAVE_EXEC_MODE_IDEMPOTENT);
 | |
|   thd_proc_info(thd, tmp);
 | |
| 
 | |
|   if (unlikely(error) && unlikely(!thd->is_error()))
 | |
|   {
 | |
|     DBUG_ASSERT(0);
 | |
|     my_error(ER_UNKNOWN_ERROR, MYF(0));
 | |
|   }
 | |
| 
 | |
|   return error;
 | |
| }
 | |
| 
 | |
| #endif /* defined(HAVE_REPLICATION) */
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| uint8 Write_rows_log_event::get_trg_event_map()
 | |
| {
 | |
|   return trg2bit(TRG_EVENT_INSERT) | trg2bit(TRG_EVENT_UPDATE) |
 | |
|          trg2bit(TRG_EVENT_DELETE);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Delete_rows_log_event member functions
 | |
| **************************************************************************/
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| /*
 | |
|   Compares table->record[0] and table->record[1]
 | |
| 
 | |
|   Returns TRUE if different.
 | |
| */
 | |
| static bool record_compare(TABLE *table, bool vers_from_plain= false)
 | |
| {
 | |
|   bool result= FALSE;
 | |
|   /**
 | |
|     Compare full record only if:
 | |
|     - there are no blob fields (otherwise we would also need 
 | |
|       to compare blobs contents as well);
 | |
|     - there are no varchar fields (otherwise we would also need
 | |
|       to compare varchar contents as well);
 | |
|     - there are no null fields, otherwise NULLed fields 
 | |
|       contents (i.e., the don't care bytes) may show arbitrary 
 | |
|       values, depending on how each engine handles internally.
 | |
|     */
 | |
|   if ((table->s->blob_fields + 
 | |
|        table->s->varchar_fields + 
 | |
|        table->s->null_fields) == 0)
 | |
|   {
 | |
|     result= cmp_record(table,record[1]);
 | |
|     goto record_compare_exit;
 | |
|   }
 | |
| 
 | |
|   /* Compare null bits */
 | |
|   if (memcmp(table->null_flags,
 | |
| 	     table->null_flags+table->s->rec_buff_length,
 | |
| 	     table->s->null_bytes))
 | |
|   {
 | |
|     result= TRUE;				// Diff in NULL value
 | |
|     goto record_compare_exit;
 | |
|   }
 | |
| 
 | |
|   /* Compare fields */
 | |
|   for (Field **ptr=table->field ; *ptr ; ptr++)
 | |
|   {
 | |
|     /*
 | |
|       If the table is versioned, don't compare using the version if there is a
 | |
|       primary key. If there isn't a primary key, we need the version to
 | |
|       identify the correct record if there are duplicate rows in the data set.
 | |
|       However, if the primary server is unversioned (vers_from_plain is true),
 | |
|       then we implicitly use row_end as the primary key on our side. This is
 | |
|       because the implicit row_end value will be set to the maximum value for
 | |
|       the latest row update (which is what we care about).
 | |
|     */
 | |
|     if (table->versioned() && (*ptr)->vers_sys_field() &&
 | |
|         (table->s->primary_key < MAX_KEY ||
 | |
|          (vers_from_plain && table->vers_start_field() == (*ptr))))
 | |
|       continue;
 | |
|     /**
 | |
|       We only compare field contents that are not null.
 | |
|       NULL fields (i.e., their null bits) were compared 
 | |
|       earlier.
 | |
|     */
 | |
|     if (!(*(ptr))->is_null())
 | |
|     {
 | |
|       if ((*ptr)->cmp_binary_offset(table->s->rec_buff_length))
 | |
|       {
 | |
|         result= TRUE;
 | |
|         goto record_compare_exit;
 | |
|       }
 | |
|     }
 | |
|   }
 | |
| 
 | |
| record_compare_exit:
 | |
|   return result;
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|   Find the best key to use when locating the row in @c find_row().
 | |
| 
 | |
|   A primary key is preferred if it exists; otherwise a unique index is
 | |
|   preferred. Else we pick the index with the smalles rec_per_key value.
 | |
| 
 | |
|   If a suitable key is found, set @c m_key, @c m_key_nr and @c m_key_info
 | |
|   member fields appropriately.
 | |
| 
 | |
|   @returns Error code on failure, 0 on success.
 | |
| */
 | |
| int Rows_log_event::find_key()
 | |
| {
 | |
|   uint i, best_key_nr, last_part;
 | |
|   KEY *key, *UNINIT_VAR(best_key);
 | |
|   ulong UNINIT_VAR(best_rec_per_key), tmp;
 | |
|   DBUG_ENTER("Rows_log_event::find_key");
 | |
|   DBUG_ASSERT(m_table);
 | |
| 
 | |
|   best_key_nr= MAX_KEY;
 | |
| 
 | |
|   /*
 | |
|     Keys are sorted so that any primary key is first, followed by unique keys,
 | |
|     followed by any other. So we will automatically pick the primary key if
 | |
|     it exists.
 | |
|   */
 | |
|   for (i= 0, key= m_table->key_info; i < m_table->s->keys; i++, key++)
 | |
|   {
 | |
|     if (!m_table->s->keys_in_use.is_set(i))
 | |
|       continue;
 | |
|     /*
 | |
|       We cannot use a unique key with NULL-able columns to uniquely identify
 | |
|       a row (but we can still select it for range scan below if nothing better
 | |
|       is available).
 | |
|     */
 | |
|     if ((key->flags & (HA_NOSAME | HA_NULL_PART_KEY)) == HA_NOSAME)
 | |
|     {
 | |
|       best_key_nr= i;
 | |
|       best_key= key;
 | |
|       break;
 | |
|     }
 | |
|     /*
 | |
|       We can only use a non-unique key if it allows range scans (ie. skip
 | |
|       FULLTEXT indexes and such).
 | |
|     */
 | |
|     last_part= key->user_defined_key_parts - 1;
 | |
|     DBUG_PRINT("info", ("Index %s rec_per_key[%u]= %lu",
 | |
|                         key->name.str, last_part, key->rec_per_key[last_part]));
 | |
|     if (!(m_table->file->index_flags(i, last_part, 1) & HA_READ_NEXT))
 | |
|       continue;
 | |
| 
 | |
|     tmp= key->rec_per_key[last_part];
 | |
|     if (best_key_nr == MAX_KEY || (tmp > 0 && tmp < best_rec_per_key))
 | |
|     {
 | |
|       best_key_nr= i;
 | |
|       best_key= key;
 | |
|       best_rec_per_key= tmp;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   if (best_key_nr == MAX_KEY)
 | |
|   {
 | |
|     m_key_info= NULL;
 | |
|     DBUG_RETURN(0);
 | |
|   }
 | |
| 
 | |
|   // Allocate buffer for key searches
 | |
|   m_key= (uchar *) my_malloc(PSI_INSTRUMENT_ME, best_key->key_length, MYF(MY_WME));
 | |
|   if (m_key == NULL)
 | |
|     DBUG_RETURN(HA_ERR_OUT_OF_MEM);
 | |
|   m_key_info= best_key;
 | |
|   m_key_nr= best_key_nr;
 | |
| 
 | |
|   DBUG_RETURN(0);;
 | |
| }
 | |
| 
 | |
| 
 | |
| /* 
 | |
|   Check if we are already spending too much time on this statement.
 | |
|   if we are, warn user that it might be because table does not have
 | |
|   a PK, but only if the warning was not printed before for this STMT.
 | |
| 
 | |
|   @param type          The event type code.
 | |
|   @param table_name    The name of the table that the slave is 
 | |
|                        operating.
 | |
|   @param is_index_scan States whether the slave is doing an index scan 
 | |
|                        or not.
 | |
|   @param rli           The relay metadata info.
 | |
| */
 | |
| static inline 
 | |
| void issue_long_find_row_warning(Log_event_type type, 
 | |
|                                  const char *table_name,
 | |
|                                  bool is_index_scan,
 | |
|                                  rpl_group_info *rgi)
 | |
| {
 | |
|   if ((global_system_variables.log_warnings > 1 && 
 | |
|        !rgi->is_long_find_row_note_printed()))
 | |
|   {
 | |
|     ulonglong now= microsecond_interval_timer();
 | |
|     ulonglong stmt_ts= rgi->get_row_stmt_start_timestamp();
 | |
|     
 | |
|     DBUG_EXECUTE_IF("inject_long_find_row_note", 
 | |
|                     stmt_ts-=(LONG_FIND_ROW_THRESHOLD*2*HRTIME_RESOLUTION););
 | |
| 
 | |
|     longlong delta= (now - stmt_ts)/HRTIME_RESOLUTION;
 | |
| 
 | |
|     if (delta > LONG_FIND_ROW_THRESHOLD)
 | |
|     {
 | |
|       rgi->set_long_find_row_note_printed();
 | |
|       const char* evt_type= LOG_EVENT_IS_DELETE_ROW(type) ? " DELETE" : "n UPDATE";
 | |
|       const char* scan_type= is_index_scan ? "scanning an index" : "scanning the table";
 | |
| 
 | |
|       sql_print_information("The slave is applying a ROW event on behalf of a%s statement "
 | |
|                             "on table %s and is currently taking a considerable amount "
 | |
|                             "of time (%lld seconds). This is due to the fact that it is %s "
 | |
|                             "while looking up records to be processed. Consider adding a "
 | |
|                             "primary key (or unique key) to the table to improve "
 | |
|                             "performance.",
 | |
|                             evt_type, table_name, delta, scan_type);
 | |
|     }
 | |
|   }
 | |
| }
 | |
| 
 | |
| 
 | |
| /*
 | |
|   HA_ERR_KEY_NOT_FOUND is a fatal error normally, but it's an expected
 | |
|   error in speculate optimistic mode, so use something non-fatal instead
 | |
| */
 | |
| static int row_not_found_error(rpl_group_info *rgi)
 | |
| {
 | |
|   return rgi->speculation != rpl_group_info::SPECULATE_OPTIMISTIC
 | |
|          ? HA_ERR_KEY_NOT_FOUND : HA_ERR_RECORD_CHANGED;
 | |
| }
 | |
| 
 | |
| static int end_of_file_error(rpl_group_info *rgi)
 | |
| {
 | |
|   return rgi->speculation != rpl_group_info::SPECULATE_OPTIMISTIC
 | |
|          ? HA_ERR_END_OF_FILE : HA_ERR_RECORD_CHANGED;
 | |
| }
 | |
| 
 | |
| /**
 | |
|   Locate the current row in event's table.
 | |
| 
 | |
|   The current row is pointed by @c m_curr_row. Member @c m_width tells
 | |
|   how many columns are there in the row (this can be differnet from
 | |
|   the number of columns in the table). It is assumed that event's
 | |
|   table is already open and pointed by @c m_table.
 | |
| 
 | |
|   If a corresponding record is found in the table it is stored in 
 | |
|   @c m_table->record[0]. Note that when record is located based on a primary 
 | |
|   key, it is possible that the record found differs from the row being located.
 | |
| 
 | |
|   If no key is specified or table does not have keys, a table scan is used to 
 | |
|   find the row. In that case the row should be complete and contain values for
 | |
|   all columns. However, it can still be shorter than the table, i.e. the table 
 | |
|   can contain extra columns not present in the row. It is also possible that 
 | |
|   the table has fewer columns than the row being located. 
 | |
| 
 | |
|   @returns Error code on failure, 0 on success. 
 | |
|   
 | |
|   @post In case of success @c m_table->record[0] contains the record found. 
 | |
|   Also, the internal "cursor" of the table is positioned at the record found.
 | |
| 
 | |
|   @note If the engine allows random access of the records, a combination of
 | |
|   @c position() and @c rnd_pos() will be used. 
 | |
| 
 | |
|   Note that one MUST call ha_index_or_rnd_end() after this function if
 | |
|   it returns 0 as we must leave the row position in the handler intact
 | |
|   for any following update/delete command.
 | |
| */
 | |
| 
 | |
| int Rows_log_event::find_row(rpl_group_info *rgi)
 | |
| {
 | |
|   DBUG_ENTER("Rows_log_event::find_row");
 | |
| 
 | |
|   DBUG_ASSERT(m_table && m_table->in_use != NULL);
 | |
| 
 | |
|   TABLE *table= m_table;
 | |
|   int error= 0;
 | |
|   bool is_table_scan= false, is_index_scan= false;
 | |
| 
 | |
|   /*
 | |
|     rpl_row_tabledefs.test specifies that
 | |
|     if the extra field on the slave does not have a default value
 | |
|     and this is okay with Delete or Update events.
 | |
|     Todo: fix wl3228 hld that requires defauls for all types of events
 | |
|   */
 | |
|   
 | |
|   prepare_record(table, m_width, FALSE);
 | |
|   error= unpack_current_row(rgi);
 | |
| 
 | |
|   m_vers_from_plain= false;
 | |
|   if (table->versioned())
 | |
|   {
 | |
|     Field *row_end= table->vers_end_field();
 | |
|     DBUG_ASSERT(table->read_set);
 | |
|     bitmap_set_bit(table->read_set, row_end->field_index);
 | |
|     // check whether master table is unversioned
 | |
|     if (row_end->val_int() == 0)
 | |
|     {
 | |
|       bitmap_set_bit(table->write_set, row_end->field_index);
 | |
|       // Plain source table may have a PRIMARY KEY. And row_end is always
 | |
|       // a part of PRIMARY KEY. Set it to max value for engine to find it in
 | |
|       // index. Needed for an UPDATE/DELETE cases.
 | |
|       table->vers_end_field()->set_max();
 | |
|       m_vers_from_plain= true;
 | |
|     }
 | |
|     table->file->column_bitmaps_signal();
 | |
|   }
 | |
| 
 | |
|   DBUG_PRINT("info",("looking for the following record"));
 | |
|   DBUG_DUMP("record[0]", table->record[0], table->s->reclength);
 | |
| 
 | |
|   if ((table->file->ha_table_flags() & HA_PRIMARY_KEY_REQUIRED_FOR_POSITION) &&
 | |
|       table->s->primary_key < MAX_KEY)
 | |
|   {
 | |
|     /*
 | |
|       Use a more efficient method to fetch the record given by
 | |
|       table->record[0] if the engine allows it.  We first compute a
 | |
|       row reference using the position() member function (it will be
 | |
|       stored in table->file->ref) and the use rnd_pos() to position
 | |
|       the "cursor" (i.e., record[0] in this case) at the correct row.
 | |
| 
 | |
|       TODO: Add a check that the correct record has been fetched by
 | |
|       comparing with the original record. Take into account that the
 | |
|       record on the master and slave can be of different
 | |
|       length. Something along these lines should work:
 | |
| 
 | |
|       ADD>>>  store_record(table,record[1]);
 | |
|               int error= table->file->ha_rnd_pos(table->record[0],
 | |
|               table->file->ref);
 | |
|       ADD>>>  DBUG_ASSERT(memcmp(table->record[1], table->record[0],
 | |
|                                  table->s->reclength) == 0);
 | |
| 
 | |
|     */
 | |
|     int error;
 | |
|     DBUG_PRINT("info",("locating record using primary key (position)"));
 | |
| 
 | |
|     error= table->file->ha_rnd_pos_by_record(table->record[0]);
 | |
|     if (unlikely(error))
 | |
|     {
 | |
|       DBUG_PRINT("info",("rnd_pos returns error %d",error));
 | |
|       if (error == HA_ERR_KEY_NOT_FOUND)
 | |
|         error= row_not_found_error(rgi);
 | |
|       table->file->print_error(error, MYF(0));
 | |
|     }
 | |
|     DBUG_RETURN(error);
 | |
|   }
 | |
| 
 | |
|   // We can't use position() - try other methods.
 | |
|   
 | |
|   /* 
 | |
|     We need to retrieve all fields
 | |
|     TODO: Move this out from this function to main loop 
 | |
|    */
 | |
|   table->use_all_columns();
 | |
| 
 | |
|   /*
 | |
|     Save copy of the record in table->record[1]. It might be needed 
 | |
|     later if linear search is used to find exact match.
 | |
|    */ 
 | |
|   store_record(table,record[1]);    
 | |
| 
 | |
|   if (m_key_info)
 | |
|   {
 | |
|     DBUG_PRINT("info",("locating record using key #%u [%s] (index_read)",
 | |
|                        m_key_nr, m_key_info->name.str));
 | |
|     /* We use this to test that the correct key is used in test cases. */
 | |
|     DBUG_EXECUTE_IF("slave_crash_if_wrong_index",
 | |
|                     if(0 != strcmp(m_key_info->name.str,"expected_key")) abort(););
 | |
| 
 | |
|     /* The key is active: search the table using the index */
 | |
|     if (!table->file->inited &&
 | |
|         (error= table->file->ha_index_init(m_key_nr, FALSE)))
 | |
|     {
 | |
|       DBUG_PRINT("info",("ha_index_init returns error %d",error));
 | |
|       table->file->print_error(error, MYF(0));
 | |
|       goto end;
 | |
|     }
 | |
| 
 | |
|     /* Fill key data for the row */
 | |
| 
 | |
|     DBUG_ASSERT(m_key);
 | |
|     key_copy(m_key, table->record[0], m_key_info, 0);
 | |
| 
 | |
|     /*
 | |
|       Don't print debug messages when running valgrind since they can
 | |
|       trigger false warnings.
 | |
|      */
 | |
| #ifndef HAVE_valgrind
 | |
|     DBUG_DUMP("key data", m_key, m_key_info->key_length);
 | |
| #endif
 | |
| 
 | |
|     /*
 | |
|       We need to set the null bytes to ensure that the filler bit are
 | |
|       all set when returning.  There are storage engines that just set
 | |
|       the necessary bits on the bytes and don't set the filler bits
 | |
|       correctly.
 | |
|     */
 | |
|     if (table->s->null_bytes > 0)
 | |
|       table->record[0][table->s->null_bytes - 1]|=
 | |
|         256U - (1U << table->s->last_null_bit_pos);
 | |
| 
 | |
|     if (unlikely((error= table->file->ha_index_read_map(table->record[0],
 | |
|                                                         m_key,
 | |
|                                                         HA_WHOLE_KEY,
 | |
|                                                         HA_READ_KEY_EXACT))))
 | |
|     {
 | |
|       DBUG_PRINT("info",("no record matching the key found in the table"));
 | |
|       if (error == HA_ERR_KEY_NOT_FOUND)
 | |
|         error= row_not_found_error(rgi);
 | |
|       table->file->print_error(error, MYF(0));
 | |
|       table->file->ha_index_end();
 | |
|       goto end;
 | |
|     }
 | |
| 
 | |
|   /*
 | |
|     Don't print debug messages when running valgrind since they can
 | |
|     trigger false warnings.
 | |
|    */
 | |
| #ifndef HAVE_valgrind
 | |
|     DBUG_PRINT("info",("found first matching record")); 
 | |
|     DBUG_DUMP("record[0]", table->record[0], table->s->reclength);
 | |
| #endif
 | |
|     /*
 | |
|       Below is a minor "optimization".  If the key (i.e., key number
 | |
|       0) has the HA_NOSAME flag set, we know that we have found the
 | |
|       correct record (since there can be no duplicates); otherwise, we
 | |
|       have to compare the record with the one found to see if it is
 | |
|       the correct one.
 | |
| 
 | |
|       CAVEAT! This behaviour is essential for the replication of,
 | |
|       e.g., the mysql.proc table since the correct record *shall* be
 | |
|       found using the primary key *only*.  There shall be no
 | |
|       comparison of non-PK columns to decide if the correct record is
 | |
|       found.  I can see no scenario where it would be incorrect to
 | |
|       chose the row to change only using a PK or an UNNI.
 | |
|     */
 | |
|     if (table->key_info->flags & HA_NOSAME)
 | |
|     {
 | |
|       /* Unique does not have non nullable part */
 | |
|       if (!(table->key_info->flags & (HA_NULL_PART_KEY)))
 | |
|       {
 | |
|         error= 0;
 | |
|         goto end;
 | |
|       }
 | |
|       else
 | |
|       {
 | |
|         KEY *keyinfo= table->key_info;
 | |
|         /*
 | |
|           Unique has nullable part. We need to check if there is any
 | |
|           field in the BI image that is null and part of UNNI.
 | |
|         */
 | |
|         bool null_found= FALSE;
 | |
|         for (uint i=0; i < keyinfo->user_defined_key_parts && !null_found; i++)
 | |
|         {
 | |
|           uint fieldnr= keyinfo->key_part[i].fieldnr - 1;
 | |
|           Field **f= table->field+fieldnr;
 | |
|           null_found= (*f)->is_null();
 | |
|         }
 | |
| 
 | |
|         if (!null_found)
 | |
|         {
 | |
|           error= 0;
 | |
|           goto end;
 | |
|         }
 | |
| 
 | |
|         /* else fall through to index scan */
 | |
|       }
 | |
|     }
 | |
| 
 | |
|     is_index_scan=true;
 | |
| 
 | |
|     /*
 | |
|       In case key is not unique, we still have to iterate over records found
 | |
|       and find the one which is identical to the row given. A copy of the 
 | |
|       record we are looking for is stored in record[1].
 | |
|      */ 
 | |
|     DBUG_PRINT("info",("non-unique index, scanning it to find matching record")); 
 | |
|     /* We use this to test that the correct key is used in test cases. */
 | |
|     DBUG_EXECUTE_IF("slave_crash_if_index_scan", abort(););
 | |
| 
 | |
|     while (record_compare(table, m_vers_from_plain))
 | |
|     {
 | |
|       while ((error= table->file->ha_index_next(table->record[0])))
 | |
|       {
 | |
|         DBUG_PRINT("info",("no record matching the given row found"));
 | |
|         if (error == HA_ERR_END_OF_FILE)
 | |
|           error= end_of_file_error(rgi);
 | |
|         table->file->print_error(error, MYF(0));
 | |
|         table->file->ha_index_end();
 | |
|         goto end;
 | |
|       }
 | |
|     }
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     DBUG_PRINT("info",("locating record using table scan (rnd_next)"));
 | |
|     /* We use this to test that the correct key is used in test cases. */
 | |
|     DBUG_EXECUTE_IF("slave_crash_if_table_scan", abort(););
 | |
| 
 | |
|     /* We don't have a key: search the table using rnd_next() */
 | |
|     if (unlikely((error= table->file->ha_rnd_init_with_error(1))))
 | |
|     {
 | |
|       DBUG_PRINT("info",("error initializing table scan"
 | |
|                          " (ha_rnd_init returns %d)",error));
 | |
|       goto end;
 | |
|     }
 | |
| 
 | |
|     is_table_scan= true;
 | |
| 
 | |
|     /* Continue until we find the right record or have made a full loop */
 | |
|     do
 | |
|     {
 | |
|       error= table->file->ha_rnd_next(table->record[0]);
 | |
| 
 | |
|       if (unlikely(error))
 | |
|         DBUG_PRINT("info", ("error: %s", HA_ERR(error)));
 | |
|       switch (error) {
 | |
| 
 | |
|       case 0:
 | |
|         DBUG_DUMP("record found", table->record[0], table->s->reclength);
 | |
|         break;
 | |
| 
 | |
|       case HA_ERR_END_OF_FILE:
 | |
|         error= end_of_file_error(rgi);
 | |
|         DBUG_PRINT("info", ("Record not found"));
 | |
|         table->file->ha_rnd_end();
 | |
|         goto end;
 | |
| 
 | |
|       default:
 | |
|         DBUG_PRINT("info", ("Failed to get next record"
 | |
|                             " (rnd_next returns %d)",error));
 | |
|         table->file->print_error(error, MYF(0));
 | |
|         table->file->ha_rnd_end();
 | |
|         goto end;
 | |
|       }
 | |
|     }
 | |
|     while (record_compare(table, m_vers_from_plain));
 | |
|     
 | |
|     /* 
 | |
|       Note: above record_compare will take into accout all record fields 
 | |
|       which might be incorrect in case a partial row was given in the event
 | |
|      */
 | |
| 
 | |
|     DBUG_ASSERT(error == HA_ERR_END_OF_FILE || error == 0);
 | |
|   }
 | |
| 
 | |
| end:
 | |
|   if (is_table_scan || is_index_scan)
 | |
|     issue_long_find_row_warning(get_general_type_code(), m_table->alias.c_ptr(), 
 | |
|                                 is_index_scan, rgi);
 | |
|   DBUG_RETURN(error);
 | |
| }
 | |
| 
 | |
| #endif
 | |
| 
 | |
| /*
 | |
|   Constructor used to build an event for writing to the binary log.
 | |
|  */
 | |
| 
 | |
| Delete_rows_log_event::Delete_rows_log_event(THD *thd_arg, TABLE *tbl_arg,
 | |
|                                              ulonglong tid,
 | |
|                                              bool is_transactional)
 | |
|   : Rows_log_event(thd_arg, tbl_arg, tid, tbl_arg->read_set, is_transactional,
 | |
|                    DELETE_ROWS_EVENT_V1)
 | |
| {
 | |
| }
 | |
| 
 | |
| Delete_rows_compressed_log_event::Delete_rows_compressed_log_event(
 | |
|                                            THD *thd_arg, TABLE *tbl_arg,
 | |
|                                            ulonglong tid_arg,
 | |
|                                            bool is_transactional)
 | |
|   : Delete_rows_log_event(thd_arg, tbl_arg, tid_arg, is_transactional)
 | |
| {
 | |
|   m_type= DELETE_ROWS_COMPRESSED_EVENT_V1;
 | |
| }
 | |
| 
 | |
| bool Delete_rows_compressed_log_event::write()
 | |
| {
 | |
|   return Rows_log_event::write_compressed();    
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| int 
 | |
| Delete_rows_log_event::do_before_row_operations(const Slave_reporting_capability *const)
 | |
| {
 | |
|   /*
 | |
|     Increment the global status delete count variable
 | |
|    */
 | |
|   if (get_flags(STMT_END_F))
 | |
|     status_var_increment(thd->status_var.com_stat[SQLCOM_DELETE]);
 | |
| 
 | |
|   if ((m_table->file->ha_table_flags() & HA_PRIMARY_KEY_REQUIRED_FOR_POSITION) &&
 | |
|       m_table->s->primary_key < MAX_KEY)
 | |
|   {
 | |
|     /*
 | |
|       We don't need to allocate any memory for m_key since it is not used.
 | |
|     */
 | |
|     return 0;
 | |
|   }
 | |
|   if (do_invoke_trigger())
 | |
|     m_table->prepare_triggers_for_delete_stmt_or_event();
 | |
| 
 | |
|   return find_key();
 | |
| }
 | |
| 
 | |
| int 
 | |
| Delete_rows_log_event::do_after_row_operations(const Slave_reporting_capability *const, 
 | |
|                                                int error)
 | |
| {
 | |
|   m_table->file->ha_index_or_rnd_end();
 | |
|   my_free(m_key);
 | |
|   m_key= NULL;
 | |
|   m_key_info= NULL;
 | |
| 
 | |
|   return error;
 | |
| }
 | |
| 
 | |
| int Delete_rows_log_event::do_exec_row(rpl_group_info *rgi)
 | |
| {
 | |
|   int error;
 | |
|   const char *tmp= thd->get_proc_info();
 | |
|   char *message, msg[128];
 | |
|   const LEX_CSTRING &table_name= m_table->s->table_name;
 | |
|   const char quote_char=
 | |
|     get_quote_char_for_identifier(thd, table_name.str, table_name.length);
 | |
|   my_snprintf(msg, sizeof msg,
 | |
|               "Delete_rows_log_event::find_row() on table %c%.*s%c",
 | |
|               quote_char, int(table_name.length), table_name.str, quote_char);
 | |
|   message= msg;
 | |
|   const bool invoke_triggers= (m_table->triggers && do_invoke_trigger());
 | |
|   DBUG_ASSERT(m_table != NULL);
 | |
| 
 | |
| #ifdef WSREP_PROC_INFO
 | |
|   my_snprintf(thd->wsrep_info, sizeof(thd->wsrep_info) - 1,
 | |
|               "Delete_rows_log_event::find_row(%lld) on table %c%.*s%c",
 | |
|               (long long) wsrep_thd_trx_seqno(thd), quote_char,
 | |
|               int(table_name.length), table_name.str,
 | |
|               quote_char);
 | |
|   message= thd->wsrep_info;
 | |
| #endif /* WSREP_PROC_INFO */
 | |
| 
 | |
|   thd_proc_info(thd, message);
 | |
|   if (likely(!(error= find_row(rgi))))
 | |
|   {
 | |
|     /*
 | |
|       Delete the record found, located in record[0]
 | |
|     */
 | |
|     my_snprintf(msg, sizeof msg,
 | |
|                 "Delete_rows_log_event::ha_delete_row() on table %c%.*s%c",
 | |
|                 quote_char, int(table_name.length), table_name.str,
 | |
|                 quote_char);
 | |
|     message= msg;
 | |
| #ifdef WSREP_PROC_INFO
 | |
|     snprintf(thd->wsrep_info, sizeof(thd->wsrep_info) - 1,
 | |
|              "Delete_rows_log_event::ha_delete_row(%lld) on table %c%.*s%c",
 | |
|              (long long) wsrep_thd_trx_seqno(thd), quote_char,
 | |
|              int(table_name.length), table_name.str, quote_char);
 | |
|     message= thd->wsrep_info;
 | |
| #endif
 | |
|     thd_proc_info(thd, message);
 | |
| 
 | |
|     if (invoke_triggers &&
 | |
|         unlikely(process_triggers(TRG_EVENT_DELETE, TRG_ACTION_BEFORE, FALSE)))
 | |
|       error= HA_ERR_GENERIC; // in case if error is not set yet
 | |
|     if (likely(!error))
 | |
|     {
 | |
|       m_table->mark_columns_per_binlog_row_image();
 | |
|       if (m_vers_from_plain && m_table->versioned(VERS_TIMESTAMP))
 | |
|       {
 | |
|         Field *end= m_table->vers_end_field();
 | |
|         bitmap_set_bit(m_table->write_set, end->field_index);
 | |
|         store_record(m_table, record[1]);
 | |
|         end->set_time();
 | |
|         error= m_table->file->ha_update_row(m_table->record[1],
 | |
|                                             m_table->record[0]);
 | |
|       }
 | |
|       else
 | |
|       {
 | |
|         error= m_table->file->ha_delete_row(m_table->record[0]);
 | |
|       }
 | |
|       m_table->default_column_bitmaps();
 | |
|     }
 | |
|     if (invoke_triggers && likely(!error) &&
 | |
|         unlikely(process_triggers(TRG_EVENT_DELETE, TRG_ACTION_AFTER, FALSE)))
 | |
|       error= HA_ERR_GENERIC; // in case if error is not set yet
 | |
|     m_table->file->ha_index_or_rnd_end();
 | |
|   }
 | |
|   thd_proc_info(thd, tmp);
 | |
|   return error;
 | |
| }
 | |
| 
 | |
| #endif /* defined(HAVE_REPLICATION) */
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| uint8 Delete_rows_log_event::get_trg_event_map()
 | |
| {
 | |
|   return trg2bit(TRG_EVENT_DELETE);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| /**************************************************************************
 | |
| 	Update_rows_log_event member functions
 | |
| **************************************************************************/
 | |
| 
 | |
| /*
 | |
|   Constructor used to build an event for writing to the binary log.
 | |
|  */
 | |
| Update_rows_log_event::Update_rows_log_event(THD *thd_arg, TABLE *tbl_arg,
 | |
|                                              ulonglong tid,
 | |
|                                              bool is_transactional)
 | |
| : Rows_log_event(thd_arg, tbl_arg, tid, tbl_arg->read_set, is_transactional,
 | |
|                  UPDATE_ROWS_EVENT_V1)
 | |
| {
 | |
|   init(tbl_arg->rpl_write_set);
 | |
| }
 | |
| 
 | |
| Update_rows_compressed_log_event::
 | |
| Update_rows_compressed_log_event(THD *thd_arg, TABLE *tbl_arg,
 | |
|                                  ulonglong tid, bool is_transactional)
 | |
| : Update_rows_log_event(thd_arg, tbl_arg, tid, is_transactional)
 | |
| {
 | |
|   m_type = UPDATE_ROWS_COMPRESSED_EVENT_V1;
 | |
| }
 | |
| 
 | |
| bool Update_rows_compressed_log_event::write()
 | |
| {
 | |
|   return Rows_log_event::write_compressed();
 | |
| }
 | |
| 
 | |
| void Update_rows_log_event::init(MY_BITMAP const *cols)
 | |
| {
 | |
|   /* if my_bitmap_init fails, caught in is_valid() */
 | |
|   if (likely(!my_bitmap_init(&m_cols_ai,
 | |
|                           m_width <= sizeof(m_bitbuf_ai)*8 ? m_bitbuf_ai : NULL,
 | |
|                           m_width,
 | |
|                           false)))
 | |
|   {
 | |
|     /* Cols can be zero if this is a dummy binrows event */
 | |
|     if (likely(cols != NULL))
 | |
|       bitmap_copy(&m_cols_ai, cols);
 | |
|   }
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| 
 | |
| int 
 | |
| Update_rows_log_event::do_before_row_operations(const Slave_reporting_capability *const)
 | |
| {
 | |
|   /*
 | |
|     Increment the global status update count variable
 | |
|   */
 | |
|   if (get_flags(STMT_END_F))
 | |
|     status_var_increment(thd->status_var.com_stat[SQLCOM_UPDATE]);
 | |
| 
 | |
|   int err;
 | |
|   if ((err= find_key()))
 | |
|     return err;
 | |
| 
 | |
|   if (do_invoke_trigger())
 | |
|     m_table->prepare_triggers_for_update_stmt_or_event();
 | |
| 
 | |
|   return 0;
 | |
| }
 | |
| 
 | |
| int 
 | |
| Update_rows_log_event::do_after_row_operations(const Slave_reporting_capability *const, 
 | |
|                                                int error)
 | |
| {
 | |
|   /*error= ToDo:find out what this should really be, this triggers close_scan in nbd, returning error?*/
 | |
|   m_table->file->ha_index_or_rnd_end();
 | |
|   my_free(m_key); // Free for multi_malloc
 | |
|   m_key= NULL;
 | |
|   m_key_info= NULL;
 | |
| 
 | |
|   return error;
 | |
| }
 | |
| 
 | |
| int
 | |
| Update_rows_log_event::do_exec_row(rpl_group_info *rgi)
 | |
| {
 | |
|   const bool invoke_triggers= (m_table->triggers && do_invoke_trigger());
 | |
|   const char *tmp= thd->get_proc_info();
 | |
|   DBUG_ASSERT(m_table != NULL);
 | |
|   char *message, msg[128];
 | |
|   const LEX_CSTRING &table_name= m_table->s->table_name;
 | |
|   const char quote_char=
 | |
|     get_quote_char_for_identifier(thd, table_name.str, table_name.length);
 | |
|   my_snprintf(msg, sizeof msg,
 | |
|               "Update_rows_log_event::find_row() on table %c%.*s%c",
 | |
|               quote_char, int(table_name.length), table_name.str, quote_char);
 | |
|   message= msg;
 | |
| 
 | |
| #ifdef WSREP_PROC_INFO
 | |
|   my_snprintf(thd->wsrep_info, sizeof(thd->wsrep_info) - 1,
 | |
|               "Update_rows_log_event::find_row(%lld) on table %c%.*s%c",
 | |
|               (long long) wsrep_thd_trx_seqno(thd), quote_char,
 | |
|               int(table_name.length), table_name.str,
 | |
|               quote_char);
 | |
|   message= thd->wsrep_info;
 | |
| #endif /* WSREP_PROC_INFO */
 | |
| 
 | |
|   thd_proc_info(thd, message);
 | |
|   // Temporary fix to find out why it fails [/Matz]
 | |
|   memcpy(m_table->read_set->bitmap, m_cols.bitmap, (m_table->read_set->n_bits + 7) / 8);
 | |
|   memcpy(m_table->write_set->bitmap, m_cols_ai.bitmap, (m_table->write_set->n_bits + 7) / 8);
 | |
| 
 | |
|   m_table->mark_columns_per_binlog_row_image();
 | |
| 
 | |
|   int error= find_row(rgi);
 | |
|   if (unlikely(error))
 | |
|   {
 | |
|     /*
 | |
|       We need to read the second image in the event of error to be
 | |
|       able to skip to the next pair of updates
 | |
|     */
 | |
|     if ((m_curr_row= m_curr_row_end))
 | |
|       unpack_current_row(rgi, &m_cols_ai);
 | |
|     thd_proc_info(thd, tmp);
 | |
|     return error;
 | |
|   }
 | |
| 
 | |
|   const bool history_change= m_table->versioned() ?
 | |
|     !m_table->vers_end_field()->is_max() : false;
 | |
|   TABLE_LIST *tl= m_table->pos_in_table_list;
 | |
|   uint8 trg_event_map_save= tl->trg_event_map;
 | |
| 
 | |
|   /*
 | |
|     This is the situation after locating BI:
 | |
| 
 | |
|     ===|=== before image ====|=== after image ===|===
 | |
|        ^                     ^
 | |
|        m_curr_row            m_curr_row_end
 | |
| 
 | |
|     BI found in the table is stored in record[0]. We copy it to record[1]
 | |
|     and unpack AI to record[0].
 | |
|    */
 | |
| 
 | |
|   store_record(m_table,record[1]);
 | |
| 
 | |
|   m_curr_row= m_curr_row_end;
 | |
|   my_snprintf(msg, sizeof msg,
 | |
|               "Update_rows_log_event::unpack_current_row() on table %c%.*s%c",
 | |
|               quote_char, int(table_name.length), table_name.str, quote_char);
 | |
|   message= msg;
 | |
| #ifdef WSREP_PROC_INFO
 | |
|   my_snprintf(thd->wsrep_info, sizeof(thd->wsrep_info) - 1,
 | |
|               "Update_rows_log_event::unpack_current_row(%lld) on table %c%.*s%c",
 | |
|               (long long) wsrep_thd_trx_seqno(thd), quote_char,
 | |
|               int(table_name.length), table_name.str, quote_char);
 | |
|   message= thd->wsrep_info;
 | |
| #endif /* WSREP_PROC_INFO */
 | |
| 
 | |
|   /* this also updates m_curr_row_end */
 | |
|   thd_proc_info(thd, message);
 | |
|   if (unlikely((error= unpack_current_row(rgi, &m_cols_ai))))
 | |
|     goto err;
 | |
|   if (m_table->s->long_unique_table)
 | |
|     m_table->update_virtual_fields(m_table->file, VCOL_UPDATE_FOR_WRITE);
 | |
| 
 | |
|   /*
 | |
|     Now we have the right row to update.  The old row (the one we're
 | |
|     looking for) is in record[1] and the new row is in record[0].
 | |
|   */
 | |
| #ifndef HAVE_valgrind
 | |
|   /*
 | |
|     Don't print debug messages when running valgrind since they can
 | |
|     trigger false warnings.
 | |
|    */
 | |
|   DBUG_PRINT("info",("Updating row in table"));
 | |
|   DBUG_DUMP("old record", m_table->record[1], m_table->s->reclength);
 | |
|   DBUG_DUMP("new values", m_table->record[0], m_table->s->reclength);
 | |
| #endif
 | |
| 
 | |
|   my_snprintf(msg, sizeof msg,
 | |
|               "Update_rows_log_event::ha_update_row() on table %c%.*s%c",
 | |
|               quote_char, int(table_name.length), table_name.str, quote_char);
 | |
|   message= msg;
 | |
| #ifdef WSREP_PROC_INFO
 | |
|   my_snprintf(thd->wsrep_info, sizeof(thd->wsrep_info) - 1,
 | |
|               "Update_rows_log_event::ha_update_row(%lld) on table %c%.*s%c",
 | |
|               (long long) wsrep_thd_trx_seqno(thd), quote_char,
 | |
|               int(table_name.length), table_name.str, quote_char);
 | |
|   message= thd->wsrep_info;
 | |
| #endif /* WSREP_PROC_INFO */
 | |
| 
 | |
|   thd_proc_info(thd, message);
 | |
|   if (invoke_triggers &&
 | |
|       unlikely(process_triggers(TRG_EVENT_UPDATE, TRG_ACTION_BEFORE, TRUE)))
 | |
|   {
 | |
|     error= HA_ERR_GENERIC; // in case if error is not set yet
 | |
|     goto err;
 | |
|   }
 | |
| 
 | |
|   if (m_table->versioned())
 | |
|   {
 | |
|     if (m_vers_from_plain && m_table->versioned(VERS_TIMESTAMP))
 | |
|       m_table->vers_update_fields();
 | |
|     if (!history_change && !m_table->vers_end_field()->is_max())
 | |
|     {
 | |
|       tl->trg_event_map|= trg2bit(TRG_EVENT_DELETE);
 | |
|     }
 | |
|   }
 | |
|   error= m_table->file->ha_update_row(m_table->record[1], m_table->record[0]);
 | |
|   tl->trg_event_map= trg_event_map_save;
 | |
|   if (unlikely(error == HA_ERR_RECORD_IS_THE_SAME))
 | |
|     error= 0;
 | |
|   if (m_vers_from_plain && m_table->versioned(VERS_TIMESTAMP))
 | |
|   {
 | |
|     store_record(m_table, record[2]);
 | |
|     error= vers_insert_history_row(m_table);
 | |
|     restore_record(m_table, record[2]);
 | |
|   }
 | |
|   m_table->default_column_bitmaps();
 | |
| 
 | |
|   if (invoke_triggers && likely(!error) &&
 | |
|       unlikely(process_triggers(TRG_EVENT_UPDATE, TRG_ACTION_AFTER, TRUE)))
 | |
|     error= HA_ERR_GENERIC; // in case if error is not set yet
 | |
| 
 | |
| 
 | |
| err:
 | |
|   thd_proc_info(thd, tmp);
 | |
|   m_table->file->ha_index_or_rnd_end();
 | |
|   return error;
 | |
| }
 | |
| 
 | |
| #endif /* defined(HAVE_REPLICATION) */
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| uint8 Update_rows_log_event::get_trg_event_map()
 | |
| {
 | |
|   return trg2bit(TRG_EVENT_UPDATE);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| #if defined(MYSQL_SERVER) && defined(HAVE_REPLICATION)
 | |
| void Incident_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf[256];
 | |
|   size_t bytes;
 | |
|   if (m_message.length > 0)
 | |
|     bytes= my_snprintf(buf, sizeof(buf), "#%d (%s)",
 | |
|                        m_incident, description());
 | |
|   else
 | |
|     bytes= my_snprintf(buf, sizeof(buf), "#%d (%s): %s",
 | |
|                        m_incident, description(), m_message.str);
 | |
|   protocol->store(buf, bytes, &my_charset_bin);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| #if defined(WITH_WSREP)
 | |
| /*
 | |
|   read the first event from (*buf). The size of the (*buf) is (*buf_len).
 | |
|   At the end (*buf) is shitfed to point to the following event or NULL and
 | |
|   (*buf_len) will be changed to account just being read bytes of the 1st event.
 | |
| */
 | |
| #define WSREP_MAX_ALLOWED_PACKET 1024*1024*1024 // current protocol max
 | |
| 
 | |
| Log_event* wsrep_read_log_event(
 | |
|   char **arg_buf, size_t *arg_buf_len,
 | |
|   const Format_description_log_event *description_event)
 | |
| {
 | |
|   uchar *head= (uchar*) (*arg_buf);
 | |
|   uint data_len = uint4korr(head + EVENT_LEN_OFFSET);
 | |
|   const char *error= 0;
 | |
|   Log_event *res=  0;
 | |
|   DBUG_ENTER("wsrep_read_log_event");
 | |
| 
 | |
|   if (data_len > WSREP_MAX_ALLOWED_PACKET)
 | |
|   {
 | |
|     error = "Event too big";
 | |
|     goto err;
 | |
|   }
 | |
| 
 | |
|   res= Log_event::read_log_event(head, data_len, &error, description_event,
 | |
|                                  false);
 | |
| 
 | |
| err:
 | |
|   if (!res)
 | |
|   {
 | |
|     DBUG_ASSERT(error != 0);
 | |
|     sql_print_error("Error in Log_event::read_log_event(): "
 | |
|                     "'%s', data_len: %u, event_type: %d",
 | |
| 		    error, data_len, (int) head[EVENT_TYPE_OFFSET]);
 | |
|   }
 | |
|   (*arg_buf)+= data_len;
 | |
|   (*arg_buf_len)-= data_len;
 | |
|   DBUG_RETURN(res);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| int Incident_log_event::do_apply_event(rpl_group_info *rgi)
 | |
| {
 | |
|   Relay_log_info const *rli= rgi->rli;
 | |
|   DBUG_ENTER("Incident_log_event::do_apply_event");
 | |
| 
 | |
|   if (ignored_error_code(ER_SLAVE_INCIDENT))
 | |
|   {
 | |
|     DBUG_PRINT("info", ("Ignoring Incident"));
 | |
|     DBUG_RETURN(0);
 | |
|   }
 | |
| 
 | |
|   rli->report(ERROR_LEVEL, ER_SLAVE_INCIDENT, NULL,
 | |
|               ER_THD(rgi->thd, ER_SLAVE_INCIDENT),
 | |
|               description(),
 | |
|               m_message.length > 0 ? m_message.str : "<none>");
 | |
|   DBUG_RETURN(1);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| bool
 | |
| Incident_log_event::write_data_header()
 | |
| {
 | |
|   DBUG_ENTER("Incident_log_event::write_data_header");
 | |
|   DBUG_PRINT("enter", ("m_incident: %d", m_incident));
 | |
|   uchar buf[sizeof(int16)];
 | |
|   int2store(buf, (int16) m_incident);
 | |
|   DBUG_RETURN(write_data(buf, sizeof(buf)));
 | |
| }
 | |
| 
 | |
| bool
 | |
| Incident_log_event::write_data_body()
 | |
| {
 | |
|   uchar tmp[1];
 | |
|   DBUG_ENTER("Incident_log_event::write_data_body");
 | |
|   tmp[0]= (uchar) m_message.length;
 | |
|   DBUG_RETURN(write_data(tmp, sizeof(tmp)) ||
 | |
|               write_data(m_message.str, m_message.length));
 | |
| }
 | |
| 
 | |
| 
 | |
| #if defined(MYSQL_SERVER) && defined(HAVE_REPLICATION)
 | |
| /* Pack info for its unrecognized ignorable event */
 | |
| void Ignorable_log_event::pack_info(Protocol *protocol)
 | |
| {
 | |
|   char buf[256];
 | |
|   size_t bytes;
 | |
|   bytes= my_snprintf(buf, sizeof(buf), "# Ignorable event type %d (%s)",
 | |
|                      number, description);
 | |
|   protocol->store(buf, bytes, &my_charset_bin);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| #if defined(HAVE_REPLICATION)
 | |
| Heartbeat_log_event::Heartbeat_log_event(const uchar *buf, uint event_len,
 | |
|                     const Format_description_log_event* description_event)
 | |
|   :Log_event(buf, description_event)
 | |
| {
 | |
|   uint8 header_size= description_event->common_header_len;
 | |
|   if (log_pos == 0)
 | |
|   {
 | |
|     log_pos= uint8korr(buf + header_size);
 | |
|     log_ident= buf + header_size + HB_SUB_HEADER_LEN;
 | |
|     ident_len= event_len - (header_size + HB_SUB_HEADER_LEN);
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     log_ident= buf + header_size;
 | |
|     ident_len = event_len - header_size;
 | |
|   }
 | |
| }
 | |
| #endif
 | |
| 
 | |
| 
 | |
| /**
 | |
|    Check if we should write event to the relay log
 | |
| 
 | |
|    This is used to skip events that is only supported by MySQL
 | |
| 
 | |
|    Return:
 | |
|    0 ok
 | |
|    1 Don't write event
 | |
| */
 | |
| 
 | |
| bool event_that_should_be_ignored(const uchar *buf)
 | |
| {
 | |
|   uint event_type= buf[EVENT_TYPE_OFFSET];
 | |
|   if (event_type == GTID_LOG_EVENT ||
 | |
|       event_type == ANONYMOUS_GTID_LOG_EVENT ||
 | |
|       event_type == PREVIOUS_GTIDS_LOG_EVENT ||
 | |
|       event_type == TRANSACTION_CONTEXT_EVENT ||
 | |
|       event_type == VIEW_CHANGE_EVENT ||
 | |
|       (uint2korr(buf + FLAGS_OFFSET) & LOG_EVENT_IGNORABLE_F))
 | |
|     return 1;
 | |
|   return 0;
 | |
| }
 |