2014-02-26 19:11:54 +01:00
|
|
|
/*****************************************************************************
|
|
|
|
|
2017-01-06 19:48:54 +05:30
|
|
|
Copyright (c) 1997, 2017, Oracle and/or its affiliates. All Rights Reserved.
|
2014-02-26 19:11:54 +01:00
|
|
|
Copyright (c) 2012, Facebook Inc.
|
2018-01-10 13:18:02 +02:00
|
|
|
Copyright (c) 2013, 2018, MariaDB Corporation.
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify it under
|
|
|
|
the terms of the GNU General Public License as published by the Free Software
|
|
|
|
Foundation; version 2 of the License.
|
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful, but WITHOUT
|
|
|
|
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
|
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License along with
|
|
|
|
this program; if not, write to the Free Software Foundation, Inc.,
|
|
|
|
51 Franklin Street, Suite 500, Boston, MA 02110-1335 USA
|
|
|
|
|
|
|
|
*****************************************************************************/
|
|
|
|
|
|
|
|
/**************************************************//**
|
|
|
|
@file log/log0recv.cc
|
|
|
|
Recovery
|
|
|
|
|
|
|
|
Created 9/20/1997 Heikki Tuuri
|
|
|
|
*******************************************************/
|
|
|
|
|
2018-11-19 11:42:14 +02:00
|
|
|
#include "univ.i"
|
2014-05-05 18:20:28 +02:00
|
|
|
|
|
|
|
#include <vector>
|
2016-08-12 11:17:45 +03:00
|
|
|
#include <map>
|
|
|
|
#include <string>
|
2017-11-30 13:37:59 +11:00
|
|
|
#include <my_service_manager.h>
|
2016-08-12 11:17:45 +03:00
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
#include "log0recv.h"
|
|
|
|
|
2016-09-06 09:43:16 +03:00
|
|
|
#ifdef HAVE_MY_AES_H
|
|
|
|
#include <my_aes.h>
|
|
|
|
#endif
|
|
|
|
|
2015-08-07 15:21:20 +03:00
|
|
|
#include "log0crypt.h"
|
2014-02-26 19:11:54 +01:00
|
|
|
#include "mem0mem.h"
|
|
|
|
#include "buf0buf.h"
|
|
|
|
#include "buf0flu.h"
|
|
|
|
#include "mtr0mtr.h"
|
|
|
|
#include "mtr0log.h"
|
|
|
|
#include "page0cur.h"
|
|
|
|
#include "page0zip.h"
|
|
|
|
#include "btr0btr.h"
|
|
|
|
#include "btr0cur.h"
|
|
|
|
#include "ibuf0ibuf.h"
|
|
|
|
#include "trx0undo.h"
|
|
|
|
#include "trx0rec.h"
|
|
|
|
#include "fil0fil.h"
|
2016-09-06 09:43:16 +03:00
|
|
|
#include "row0trunc.h"
|
2016-12-30 15:04:10 +02:00
|
|
|
#include "buf0rea.h"
|
|
|
|
#include "srv0srv.h"
|
|
|
|
#include "srv0start.h"
|
|
|
|
#include "trx0roll.h"
|
|
|
|
#include "row0merge.h"
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/** Log records are stored in the hash table in chunks at most of this size;
|
|
|
|
this must be less than UNIV_PAGE_SIZE as it is stored in the buffer pool */
|
|
|
|
#define RECV_DATA_BLOCK_SIZE (MEM_MAX_ALLOC_IN_BUF - sizeof(recv_data_t))
|
|
|
|
|
|
|
|
/** Read-ahead area in applying log records to file pages */
|
|
|
|
#define RECV_READ_AHEAD_AREA 32
|
|
|
|
|
|
|
|
/** The recovery system */
|
2017-03-07 17:16:49 +02:00
|
|
|
recv_sys_t* recv_sys;
|
2014-02-26 19:11:54 +01:00
|
|
|
/** TRUE when applying redo log records during crash recovery; FALSE
|
|
|
|
otherwise. Note that this is FALSE while a background thread is
|
|
|
|
rolling back incomplete transactions. */
|
2016-08-12 11:17:45 +03:00
|
|
|
volatile bool recv_recovery_on;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/** TRUE when recv_init_crash_recovery() has been called. */
|
2016-08-12 11:17:45 +03:00
|
|
|
bool recv_needed_recovery;
|
2016-12-30 15:04:10 +02:00
|
|
|
#ifdef UNIV_DEBUG
|
2014-02-26 19:11:54 +01:00
|
|
|
/** TRUE if writing to the redo log (mtr_commit) is forbidden.
|
|
|
|
Protected by log_sys->mutex. */
|
2016-08-12 11:17:45 +03:00
|
|
|
bool recv_no_log_write = false;
|
2016-12-30 15:04:10 +02:00
|
|
|
#endif /* UNIV_DEBUG */
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/** TRUE if buf_page_is_corrupted() should check if the log sequence
|
|
|
|
number (FIL_PAGE_LSN) is in the future. Initially FALSE, and set by
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_recovery_from_checkpoint_start(). */
|
|
|
|
bool recv_lsn_checks_on;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/** If the following is TRUE, the buffer pool file pages must be invalidated
|
|
|
|
after recovery and no ibuf operations are allowed; this becomes TRUE if
|
|
|
|
the log record hash table becomes too full, and log records must be merged
|
|
|
|
to file pages already before the recovery is finished: in this case no
|
|
|
|
ibuf operations are allowed, as they could modify the pages read in the
|
|
|
|
buffer pool before the pages have been recovered to the up-to-date state.
|
|
|
|
|
|
|
|
TRUE means that recovery is running and no operations on the log files
|
|
|
|
are allowed yet: the variable name is misleading. */
|
2016-08-12 11:17:45 +03:00
|
|
|
bool recv_no_ibuf_operations;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/** The type of the previous parsed redo log record */
|
2016-08-12 11:17:45 +03:00
|
|
|
static mlog_id_t recv_previous_parsed_rec_type;
|
2014-02-26 19:11:54 +01:00
|
|
|
/** The offset of the previous parsed redo log record */
|
|
|
|
static ulint recv_previous_parsed_rec_offset;
|
|
|
|
/** The 'multi' flag of the previous parsed redo log record */
|
|
|
|
static ulint recv_previous_parsed_rec_is_multi;
|
|
|
|
|
|
|
|
/** This many frames must be left free in the buffer pool when we scan
|
|
|
|
the log and store the scanned log records in the buffer pool: we will
|
|
|
|
use these free frames to read in pages when we start applying the
|
|
|
|
log records to the database.
|
|
|
|
This is the default value. If the actual size of the buffer pool is
|
|
|
|
larger than 10 MB we'll set this value to 512. */
|
2016-08-12 11:17:45 +03:00
|
|
|
ulint recv_n_pool_free_frames;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/** The maximum lsn we see for a page during the recovery process. If this
|
|
|
|
is bigger than the lsn we are able to scan up to, that is an indication that
|
|
|
|
the recovery failed and the database may be corrupt. */
|
2015-05-27 14:34:45 +01:00
|
|
|
static lsn_t recv_max_page_lsn;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
#ifdef UNIV_PFS_THREAD
|
2016-08-12 11:17:45 +03:00
|
|
|
mysql_pfs_key_t trx_rollback_clean_thread_key;
|
|
|
|
mysql_pfs_key_t recv_writer_thread_key;
|
2016-12-30 15:04:10 +02:00
|
|
|
#endif /* UNIV_PFS_THREAD */
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-07-05 22:09:28 +03:00
|
|
|
/** Is recv_writer_thread active? */
|
|
|
|
bool recv_writer_thread_active;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
#ifndef DBUG_OFF
|
|
|
|
/** Return string name of the redo log record type.
|
|
|
|
@param[in] type record log record enum
|
|
|
|
@return string name of record log record */
|
MDEV-13564 Mariabackup does not work with TRUNCATE
Implement undo tablespace truncation via normal redo logging.
Implement TRUNCATE TABLE as a combination of RENAME to #sql-ib name,
CREATE, and DROP.
Note: Orphan #sql-ib*.ibd may be left behind if MariaDB Server 10.2
is killed before the DROP operation is committed. If MariaDB Server 10.2
is killed during TRUNCATE, it is also possible that the old table
was renamed to #sql-ib*.ibd but the data dictionary will refer to the
table using the original name.
In MariaDB Server 10.3, RENAME inside InnoDB is transactional,
and #sql-* tables will be dropped on startup. So, this new TRUNCATE
will be fully crash-safe in 10.3.
ha_mroonga::wrapper_truncate(): Pass table options to the underlying
storage engine, now that ha_innobase::truncate() will need them.
rpl_slave_state::truncate_state_table(): Before truncating
mysql.gtid_slave_pos, evict any cached table handles from
the table definition cache, so that there will be no stale
references to the old table after truncating.
== TRUNCATE TABLE ==
WL#6501 in MySQL 5.7 introduced separate log files for implementing
atomic and crash-safe TRUNCATE TABLE, instead of using the InnoDB
undo and redo log. Some convoluted logic was added to the InnoDB
crash recovery, and some extra synchronization (including a redo log
checkpoint) was introduced to make this work. This synchronization
has caused performance problems and race conditions, and the extra
log files cannot be copied or applied by external backup programs.
In order to support crash-upgrade from MariaDB 10.2, we will keep
the logic for parsing and applying the extra log files, but we will
no longer generate those files in TRUNCATE TABLE.
A prerequisite for crash-safe TRUNCATE is a crash-safe RENAME TABLE
(with full redo and undo logging and proper rollback). This will
be implemented in MDEV-14717.
ha_innobase::truncate(): Invoke RENAME, create(), delete_table().
Because RENAME cannot be fully rolled back before MariaDB 10.3
due to missing undo logging, add some explicit rename-back in
case the operation fails.
ha_innobase::delete(): Introduce a variant that takes sqlcom as
a parameter. In TRUNCATE TABLE, we do not want to touch any
FOREIGN KEY constraints.
ha_innobase::create(): Add the parameters file_per_table, trx.
In TRUNCATE, the new table must be created in the same transaction
that renames the old table.
create_table_info_t::create_table_info_t(): Add the parameters
file_per_table, trx.
row_drop_table_for_mysql(): Replace a bool parameter with sqlcom.
row_drop_table_after_create_fail(): New function, wrapping
row_drop_table_for_mysql().
dict_truncate_index_tree_in_mem(), fil_truncate_tablespace(),
fil_prepare_for_truncate(), fil_reinit_space_header_for_table(),
row_truncate_table_for_mysql(), TruncateLogger,
row_truncate_prepare(), row_truncate_rollback(),
row_truncate_complete(), row_truncate_fts(),
row_truncate_update_system_tables(),
row_truncate_foreign_key_checks(), row_truncate_sanity_checks():
Remove.
row_upd_check_references_constraints(): Remove a check for
TRUNCATE, now that the table is no longer truncated in place.
The new test innodb.truncate_foreign uses DEBUG_SYNC to cover some
race-condition like scenarios. The test innodb-innodb.truncate does
not use any synchronization.
We add a redo log subformat to indicate backup-friendly format.
MariaDB 10.4 will remove support for the old TRUNCATE logging,
so crash-upgrade from old 10.2 or 10.3 to 10.4 will involve
limitations.
== Undo tablespace truncation ==
MySQL 5.7 implements undo tablespace truncation. It is only
possible when innodb_undo_tablespaces is set to at least 2.
The logging is implemented similar to the WL#6501 TRUNCATE,
that is, using separate log files and a redo log checkpoint.
We can simply implement undo tablespace truncation within
a single mini-transaction that reinitializes the undo log
tablespace file. Unfortunately, due to the redo log format
of some operations, currently, the total redo log written by
undo tablespace truncation will be more than the combined size
of the truncated undo tablespace. It should be acceptable
to have a little more than 1 megabyte of log in a single
mini-transaction. This will be fixed in MDEV-17138 in
MariaDB Server 10.4.
recv_sys_t: Add truncated_undo_spaces[] to remember for which undo
tablespaces a MLOG_FILE_CREATE2 record was seen.
namespace undo: Remove some unnecessary declarations.
fil_space_t::is_being_truncated: Document that this flag now
only applies to undo tablespaces. Remove some references.
fil_space_t::is_stopping(): Do not refer to is_being_truncated.
This check is for tablespaces of tables. Potentially used
tablespaces are never truncated any more.
buf_dblwr_process(): Suppress the out-of-bounds warning
for undo tablespaces.
fil_truncate_log(): Write a MLOG_FILE_CREATE2 with a nonzero
page number (new size of the tablespace in pages) to inform
crash recovery that the undo tablespace size has been reduced.
fil_op_write_log(): Relax assertions, so that MLOG_FILE_CREATE2
can be written for undo tablespaces (without .ibd file suffix)
for a nonzero page number.
os_file_truncate(): Add the parameter allow_shrink=false
so that undo tablespaces can actually be shrunk using this function.
fil_name_parse(): For undo tablespace truncation,
buffer MLOG_FILE_CREATE2 in truncated_undo_spaces[].
recv_read_in_area(): Avoid reading pages for which no redo log
records remain buffered, after recv_addr_trim() removed them.
trx_rseg_header_create(): Add a FIXME comment that we could write
much less redo log.
trx_undo_truncate_tablespace(): Reinitialize the undo tablespace
in a single mini-transaction, which will be flushed to the redo log
before the file size is trimmed.
recv_addr_trim(): Discard any redo logs for pages that were
logged after the new end of a file, before the truncation LSN.
If the rec_list becomes empty, reduce n_addrs. After removing
any affected records, actually truncate the file.
recv_apply_hashed_log_recs(): Invoke recv_addr_trim() right before
applying any log records. The undo tablespace files must be open
at this point.
buf_flush_or_remove_pages(), buf_flush_dirty_pages(),
buf_LRU_flush_or_remove_pages(): Add a parameter for specifying
the number of the first page to flush or remove (default 0).
trx_purge_initiate_truncate(): Remove the log checkpoints, the
extra logging, and some unnecessary crash points. Merge the code
from trx_undo_truncate_tablespace(). First, flush all to-be-discarded
pages (beyond the new end of the file), then trim the space->size
to make the page allocation deterministic. At the only remaining
crash injection point, flush the redo log, so that the recovery
can be tested.
2018-08-28 13:43:06 +03:00
|
|
|
static const char* get_mlog_string(mlog_id_t type);
|
2016-08-12 11:17:45 +03:00
|
|
|
#endif /* !DBUG_OFF */
|
|
|
|
|
|
|
|
/** Tablespace item during recovery */
|
|
|
|
struct file_name_t {
|
|
|
|
/** Tablespace file name (MLOG_FILE_NAME) */
|
|
|
|
std::string name;
|
|
|
|
/** Tablespace object (NULL if not valid or not found) */
|
|
|
|
fil_space_t* space;
|
2018-03-27 13:47:56 +05:30
|
|
|
|
|
|
|
/** Tablespace status. */
|
|
|
|
enum fil_status {
|
|
|
|
/** Normal tablespace */
|
|
|
|
NORMAL,
|
|
|
|
/** Deleted tablespace */
|
|
|
|
DELETED,
|
|
|
|
/** Missing tablespace */
|
|
|
|
MISSING
|
|
|
|
};
|
|
|
|
|
|
|
|
/** Status of the tablespace */
|
|
|
|
fil_status status;
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
/** Constructor */
|
2018-03-27 13:47:56 +05:30
|
|
|
file_name_t(std::string name_, bool deleted) :
|
|
|
|
name(name_), space(NULL), status(deleted ? DELETED: NORMAL) {}
|
2016-08-12 11:17:45 +03:00
|
|
|
};
|
|
|
|
|
|
|
|
/** Map of dirty tablespaces during recovery */
|
|
|
|
typedef std::map<
|
|
|
|
ulint,
|
|
|
|
file_name_t,
|
|
|
|
std::less<ulint>,
|
|
|
|
ut_allocator<std::pair<const ulint, file_name_t> > > recv_spaces_t;
|
|
|
|
|
|
|
|
static recv_spaces_t recv_spaces;
|
|
|
|
|
2018-08-28 17:14:54 +03:00
|
|
|
/** States of recv_addr_t */
|
|
|
|
enum recv_addr_state {
|
|
|
|
/** not yet processed */
|
|
|
|
RECV_NOT_PROCESSED,
|
|
|
|
/** page is being read */
|
|
|
|
RECV_BEING_READ,
|
|
|
|
/** log records are being applied on the page */
|
|
|
|
RECV_BEING_PROCESSED,
|
|
|
|
/** log records have been applied on the page */
|
|
|
|
RECV_PROCESSED,
|
|
|
|
/** log records have been discarded because the tablespace
|
|
|
|
does not exist */
|
|
|
|
RECV_DISCARDED
|
|
|
|
};
|
|
|
|
|
|
|
|
/** Hashed page file address struct */
|
|
|
|
struct recv_addr_t{
|
|
|
|
/** recovery state of the page */
|
|
|
|
recv_addr_state state;
|
|
|
|
/** tablespace identifier */
|
|
|
|
unsigned space:32;
|
|
|
|
/** page number */
|
|
|
|
unsigned page_no:32;
|
|
|
|
/** list of log records for this page */
|
|
|
|
UT_LIST_BASE_NODE_T(recv_t) rec_list;
|
|
|
|
/** hash node in the hash bucket chain */
|
|
|
|
hash_node_t addr_hash;
|
|
|
|
};
|
|
|
|
|
2018-08-16 16:10:18 +03:00
|
|
|
/** Report optimized DDL operation (without redo log),
|
|
|
|
corresponding to MLOG_INDEX_LOAD.
|
2018-08-09 15:06:52 +01:00
|
|
|
@param[in] space_id tablespace identifier
|
|
|
|
*/
|
|
|
|
void (*log_optimized_ddl_op)(ulint space_id);
|
|
|
|
|
2018-08-16 16:10:18 +03:00
|
|
|
/** Report backup-unfriendly TRUNCATE operation (with separate log file),
|
|
|
|
corresponding to MLOG_TRUNCATE. */
|
|
|
|
void (*log_truncate)();
|
|
|
|
|
2018-08-09 15:06:52 +01:00
|
|
|
/** Report an operation to create, delete, or rename a file during backup.
|
|
|
|
@param[in] space_id tablespace identifier
|
|
|
|
@param[in] flags tablespace flags (NULL if not create)
|
|
|
|
@param[in] name file name (not NUL-terminated)
|
|
|
|
@param[in] len length of name, in bytes
|
|
|
|
@param[in] new_name new file name (NULL if not rename)
|
|
|
|
@param[in] new_len length of new_name, in bytes (0 if NULL) */
|
|
|
|
void (*log_file_op)(ulint space_id, const byte* flags,
|
|
|
|
const byte* name, ulint len,
|
|
|
|
const byte* new_name, ulint new_len);
|
2018-03-13 15:19:30 +05:30
|
|
|
|
MDEV-13564 Mariabackup does not work with TRUNCATE
Implement undo tablespace truncation via normal redo logging.
Implement TRUNCATE TABLE as a combination of RENAME to #sql-ib name,
CREATE, and DROP.
Note: Orphan #sql-ib*.ibd may be left behind if MariaDB Server 10.2
is killed before the DROP operation is committed. If MariaDB Server 10.2
is killed during TRUNCATE, it is also possible that the old table
was renamed to #sql-ib*.ibd but the data dictionary will refer to the
table using the original name.
In MariaDB Server 10.3, RENAME inside InnoDB is transactional,
and #sql-* tables will be dropped on startup. So, this new TRUNCATE
will be fully crash-safe in 10.3.
ha_mroonga::wrapper_truncate(): Pass table options to the underlying
storage engine, now that ha_innobase::truncate() will need them.
rpl_slave_state::truncate_state_table(): Before truncating
mysql.gtid_slave_pos, evict any cached table handles from
the table definition cache, so that there will be no stale
references to the old table after truncating.
== TRUNCATE TABLE ==
WL#6501 in MySQL 5.7 introduced separate log files for implementing
atomic and crash-safe TRUNCATE TABLE, instead of using the InnoDB
undo and redo log. Some convoluted logic was added to the InnoDB
crash recovery, and some extra synchronization (including a redo log
checkpoint) was introduced to make this work. This synchronization
has caused performance problems and race conditions, and the extra
log files cannot be copied or applied by external backup programs.
In order to support crash-upgrade from MariaDB 10.2, we will keep
the logic for parsing and applying the extra log files, but we will
no longer generate those files in TRUNCATE TABLE.
A prerequisite for crash-safe TRUNCATE is a crash-safe RENAME TABLE
(with full redo and undo logging and proper rollback). This will
be implemented in MDEV-14717.
ha_innobase::truncate(): Invoke RENAME, create(), delete_table().
Because RENAME cannot be fully rolled back before MariaDB 10.3
due to missing undo logging, add some explicit rename-back in
case the operation fails.
ha_innobase::delete(): Introduce a variant that takes sqlcom as
a parameter. In TRUNCATE TABLE, we do not want to touch any
FOREIGN KEY constraints.
ha_innobase::create(): Add the parameters file_per_table, trx.
In TRUNCATE, the new table must be created in the same transaction
that renames the old table.
create_table_info_t::create_table_info_t(): Add the parameters
file_per_table, trx.
row_drop_table_for_mysql(): Replace a bool parameter with sqlcom.
row_drop_table_after_create_fail(): New function, wrapping
row_drop_table_for_mysql().
dict_truncate_index_tree_in_mem(), fil_truncate_tablespace(),
fil_prepare_for_truncate(), fil_reinit_space_header_for_table(),
row_truncate_table_for_mysql(), TruncateLogger,
row_truncate_prepare(), row_truncate_rollback(),
row_truncate_complete(), row_truncate_fts(),
row_truncate_update_system_tables(),
row_truncate_foreign_key_checks(), row_truncate_sanity_checks():
Remove.
row_upd_check_references_constraints(): Remove a check for
TRUNCATE, now that the table is no longer truncated in place.
The new test innodb.truncate_foreign uses DEBUG_SYNC to cover some
race-condition like scenarios. The test innodb-innodb.truncate does
not use any synchronization.
We add a redo log subformat to indicate backup-friendly format.
MariaDB 10.4 will remove support for the old TRUNCATE logging,
so crash-upgrade from old 10.2 or 10.3 to 10.4 will involve
limitations.
== Undo tablespace truncation ==
MySQL 5.7 implements undo tablespace truncation. It is only
possible when innodb_undo_tablespaces is set to at least 2.
The logging is implemented similar to the WL#6501 TRUNCATE,
that is, using separate log files and a redo log checkpoint.
We can simply implement undo tablespace truncation within
a single mini-transaction that reinitializes the undo log
tablespace file. Unfortunately, due to the redo log format
of some operations, currently, the total redo log written by
undo tablespace truncation will be more than the combined size
of the truncated undo tablespace. It should be acceptable
to have a little more than 1 megabyte of log in a single
mini-transaction. This will be fixed in MDEV-17138 in
MariaDB Server 10.4.
recv_sys_t: Add truncated_undo_spaces[] to remember for which undo
tablespaces a MLOG_FILE_CREATE2 record was seen.
namespace undo: Remove some unnecessary declarations.
fil_space_t::is_being_truncated: Document that this flag now
only applies to undo tablespaces. Remove some references.
fil_space_t::is_stopping(): Do not refer to is_being_truncated.
This check is for tablespaces of tables. Potentially used
tablespaces are never truncated any more.
buf_dblwr_process(): Suppress the out-of-bounds warning
for undo tablespaces.
fil_truncate_log(): Write a MLOG_FILE_CREATE2 with a nonzero
page number (new size of the tablespace in pages) to inform
crash recovery that the undo tablespace size has been reduced.
fil_op_write_log(): Relax assertions, so that MLOG_FILE_CREATE2
can be written for undo tablespaces (without .ibd file suffix)
for a nonzero page number.
os_file_truncate(): Add the parameter allow_shrink=false
so that undo tablespaces can actually be shrunk using this function.
fil_name_parse(): For undo tablespace truncation,
buffer MLOG_FILE_CREATE2 in truncated_undo_spaces[].
recv_read_in_area(): Avoid reading pages for which no redo log
records remain buffered, after recv_addr_trim() removed them.
trx_rseg_header_create(): Add a FIXME comment that we could write
much less redo log.
trx_undo_truncate_tablespace(): Reinitialize the undo tablespace
in a single mini-transaction, which will be flushed to the redo log
before the file size is trimmed.
recv_addr_trim(): Discard any redo logs for pages that were
logged after the new end of a file, before the truncation LSN.
If the rec_list becomes empty, reduce n_addrs. After removing
any affected records, actually truncate the file.
recv_apply_hashed_log_recs(): Invoke recv_addr_trim() right before
applying any log records. The undo tablespace files must be open
at this point.
buf_flush_or_remove_pages(), buf_flush_dirty_pages(),
buf_LRU_flush_or_remove_pages(): Add a parameter for specifying
the number of the first page to flush or remove (default 0).
trx_purge_initiate_truncate(): Remove the log checkpoints, the
extra logging, and some unnecessary crash points. Merge the code
from trx_undo_truncate_tablespace(). First, flush all to-be-discarded
pages (beyond the new end of the file), then trim the space->size
to make the page allocation deterministic. At the only remaining
crash injection point, flush the redo log, so that the recovery
can be tested.
2018-08-28 13:43:06 +03:00
|
|
|
/** Process a MLOG_CREATE2 record that indicates that a tablespace
|
|
|
|
is being shrunk in size.
|
|
|
|
@param[in] space_id tablespace identifier
|
|
|
|
@param[in] pages trimmed size of the file, in pages
|
|
|
|
@param[in] lsn log sequence number of the operation */
|
|
|
|
static void recv_addr_trim(ulint space_id, unsigned pages, lsn_t lsn)
|
|
|
|
{
|
|
|
|
DBUG_ENTER("recv_addr_trim");
|
|
|
|
DBUG_LOG("ib_log",
|
|
|
|
"discarding log beyond end of tablespace "
|
|
|
|
<< page_id_t(space_id, pages) << " before LSN " << lsn);
|
|
|
|
ut_ad(mutex_own(&recv_sys->mutex));
|
|
|
|
for (ulint i = recv_sys->addr_hash->n_cells; i--; ) {
|
|
|
|
hash_cell_t* const cell = hash_get_nth_cell(
|
|
|
|
recv_sys->addr_hash, i);
|
|
|
|
for (recv_addr_t* addr = static_cast<recv_addr_t*>(cell->node),
|
2018-11-20 14:55:44 +02:00
|
|
|
*next;
|
|
|
|
addr; addr = next) {
|
MDEV-13564 Mariabackup does not work with TRUNCATE
Implement undo tablespace truncation via normal redo logging.
Implement TRUNCATE TABLE as a combination of RENAME to #sql-ib name,
CREATE, and DROP.
Note: Orphan #sql-ib*.ibd may be left behind if MariaDB Server 10.2
is killed before the DROP operation is committed. If MariaDB Server 10.2
is killed during TRUNCATE, it is also possible that the old table
was renamed to #sql-ib*.ibd but the data dictionary will refer to the
table using the original name.
In MariaDB Server 10.3, RENAME inside InnoDB is transactional,
and #sql-* tables will be dropped on startup. So, this new TRUNCATE
will be fully crash-safe in 10.3.
ha_mroonga::wrapper_truncate(): Pass table options to the underlying
storage engine, now that ha_innobase::truncate() will need them.
rpl_slave_state::truncate_state_table(): Before truncating
mysql.gtid_slave_pos, evict any cached table handles from
the table definition cache, so that there will be no stale
references to the old table after truncating.
== TRUNCATE TABLE ==
WL#6501 in MySQL 5.7 introduced separate log files for implementing
atomic and crash-safe TRUNCATE TABLE, instead of using the InnoDB
undo and redo log. Some convoluted logic was added to the InnoDB
crash recovery, and some extra synchronization (including a redo log
checkpoint) was introduced to make this work. This synchronization
has caused performance problems and race conditions, and the extra
log files cannot be copied or applied by external backup programs.
In order to support crash-upgrade from MariaDB 10.2, we will keep
the logic for parsing and applying the extra log files, but we will
no longer generate those files in TRUNCATE TABLE.
A prerequisite for crash-safe TRUNCATE is a crash-safe RENAME TABLE
(with full redo and undo logging and proper rollback). This will
be implemented in MDEV-14717.
ha_innobase::truncate(): Invoke RENAME, create(), delete_table().
Because RENAME cannot be fully rolled back before MariaDB 10.3
due to missing undo logging, add some explicit rename-back in
case the operation fails.
ha_innobase::delete(): Introduce a variant that takes sqlcom as
a parameter. In TRUNCATE TABLE, we do not want to touch any
FOREIGN KEY constraints.
ha_innobase::create(): Add the parameters file_per_table, trx.
In TRUNCATE, the new table must be created in the same transaction
that renames the old table.
create_table_info_t::create_table_info_t(): Add the parameters
file_per_table, trx.
row_drop_table_for_mysql(): Replace a bool parameter with sqlcom.
row_drop_table_after_create_fail(): New function, wrapping
row_drop_table_for_mysql().
dict_truncate_index_tree_in_mem(), fil_truncate_tablespace(),
fil_prepare_for_truncate(), fil_reinit_space_header_for_table(),
row_truncate_table_for_mysql(), TruncateLogger,
row_truncate_prepare(), row_truncate_rollback(),
row_truncate_complete(), row_truncate_fts(),
row_truncate_update_system_tables(),
row_truncate_foreign_key_checks(), row_truncate_sanity_checks():
Remove.
row_upd_check_references_constraints(): Remove a check for
TRUNCATE, now that the table is no longer truncated in place.
The new test innodb.truncate_foreign uses DEBUG_SYNC to cover some
race-condition like scenarios. The test innodb-innodb.truncate does
not use any synchronization.
We add a redo log subformat to indicate backup-friendly format.
MariaDB 10.4 will remove support for the old TRUNCATE logging,
so crash-upgrade from old 10.2 or 10.3 to 10.4 will involve
limitations.
== Undo tablespace truncation ==
MySQL 5.7 implements undo tablespace truncation. It is only
possible when innodb_undo_tablespaces is set to at least 2.
The logging is implemented similar to the WL#6501 TRUNCATE,
that is, using separate log files and a redo log checkpoint.
We can simply implement undo tablespace truncation within
a single mini-transaction that reinitializes the undo log
tablespace file. Unfortunately, due to the redo log format
of some operations, currently, the total redo log written by
undo tablespace truncation will be more than the combined size
of the truncated undo tablespace. It should be acceptable
to have a little more than 1 megabyte of log in a single
mini-transaction. This will be fixed in MDEV-17138 in
MariaDB Server 10.4.
recv_sys_t: Add truncated_undo_spaces[] to remember for which undo
tablespaces a MLOG_FILE_CREATE2 record was seen.
namespace undo: Remove some unnecessary declarations.
fil_space_t::is_being_truncated: Document that this flag now
only applies to undo tablespaces. Remove some references.
fil_space_t::is_stopping(): Do not refer to is_being_truncated.
This check is for tablespaces of tables. Potentially used
tablespaces are never truncated any more.
buf_dblwr_process(): Suppress the out-of-bounds warning
for undo tablespaces.
fil_truncate_log(): Write a MLOG_FILE_CREATE2 with a nonzero
page number (new size of the tablespace in pages) to inform
crash recovery that the undo tablespace size has been reduced.
fil_op_write_log(): Relax assertions, so that MLOG_FILE_CREATE2
can be written for undo tablespaces (without .ibd file suffix)
for a nonzero page number.
os_file_truncate(): Add the parameter allow_shrink=false
so that undo tablespaces can actually be shrunk using this function.
fil_name_parse(): For undo tablespace truncation,
buffer MLOG_FILE_CREATE2 in truncated_undo_spaces[].
recv_read_in_area(): Avoid reading pages for which no redo log
records remain buffered, after recv_addr_trim() removed them.
trx_rseg_header_create(): Add a FIXME comment that we could write
much less redo log.
trx_undo_truncate_tablespace(): Reinitialize the undo tablespace
in a single mini-transaction, which will be flushed to the redo log
before the file size is trimmed.
recv_addr_trim(): Discard any redo logs for pages that were
logged after the new end of a file, before the truncation LSN.
If the rec_list becomes empty, reduce n_addrs. After removing
any affected records, actually truncate the file.
recv_apply_hashed_log_recs(): Invoke recv_addr_trim() right before
applying any log records. The undo tablespace files must be open
at this point.
buf_flush_or_remove_pages(), buf_flush_dirty_pages(),
buf_LRU_flush_or_remove_pages(): Add a parameter for specifying
the number of the first page to flush or remove (default 0).
trx_purge_initiate_truncate(): Remove the log checkpoints, the
extra logging, and some unnecessary crash points. Merge the code
from trx_undo_truncate_tablespace(). First, flush all to-be-discarded
pages (beyond the new end of the file), then trim the space->size
to make the page allocation deterministic. At the only remaining
crash injection point, flush the redo log, so that the recovery
can be tested.
2018-08-28 13:43:06 +03:00
|
|
|
next = static_cast<recv_addr_t*>(addr->addr_hash);
|
|
|
|
|
|
|
|
if (addr->space != space_id || addr->page_no < pages) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (recv_t* recv = UT_LIST_GET_FIRST(addr->rec_list);
|
|
|
|
recv; ) {
|
|
|
|
recv_t* n = UT_LIST_GET_NEXT(rec_list, recv);
|
|
|
|
if (recv->start_lsn < lsn) {
|
|
|
|
DBUG_PRINT("ib_log",
|
|
|
|
("Discarding %s for"
|
|
|
|
" page %u:%u at " LSN_PF,
|
|
|
|
get_mlog_string(
|
|
|
|
recv->type),
|
|
|
|
addr->space, addr->page_no,
|
|
|
|
recv->start_lsn));
|
|
|
|
UT_LIST_REMOVE(addr->rec_list, recv);
|
|
|
|
}
|
|
|
|
recv = n;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (fil_space_t* space = fil_space_get(space_id)) {
|
|
|
|
ut_ad(UT_LIST_GET_LEN(space->chain) == 1);
|
|
|
|
fil_node_t* file = UT_LIST_GET_FIRST(space->chain);
|
|
|
|
ut_ad(file->is_open());
|
|
|
|
os_file_truncate(file->name, file->handle,
|
|
|
|
os_offset_t(pages) << srv_page_size_shift,
|
|
|
|
true);
|
|
|
|
}
|
|
|
|
DBUG_VOID_RETURN;
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Process a file name from a MLOG_FILE_* record.
|
|
|
|
@param[in,out] name file name
|
|
|
|
@param[in] len length of the file name
|
|
|
|
@param[in] space_id the tablespace ID
|
2018-08-23 17:02:50 +03:00
|
|
|
@param[in] deleted whether this is a MLOG_FILE_DELETE record */
|
2016-08-12 11:17:45 +03:00
|
|
|
static
|
2018-08-23 17:02:50 +03:00
|
|
|
void
|
2016-08-12 11:17:45 +03:00
|
|
|
fil_name_process(
|
|
|
|
char* name,
|
|
|
|
ulint len,
|
|
|
|
ulint space_id,
|
|
|
|
bool deleted)
|
|
|
|
{
|
2018-03-13 15:19:30 +05:30
|
|
|
if (srv_operation == SRV_OPERATION_BACKUP) {
|
2018-08-23 17:02:50 +03:00
|
|
|
return;
|
2018-03-13 15:19:30 +05:30
|
|
|
}
|
|
|
|
|
|
|
|
ut_ad(srv_operation == SRV_OPERATION_NORMAL
|
|
|
|
|| srv_operation == SRV_OPERATION_RESTORE
|
|
|
|
|| srv_operation == SRV_OPERATION_RESTORE_EXPORT);
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/* We will also insert space=NULL into the map, so that
|
|
|
|
further checks can ensure that a MLOG_FILE_NAME record was
|
|
|
|
scanned before applying any page records for the space_id. */
|
|
|
|
|
2016-09-06 09:43:16 +03:00
|
|
|
os_normalize_path(name);
|
2016-08-12 11:17:45 +03:00
|
|
|
file_name_t fname(std::string(name, len - 1), deleted);
|
|
|
|
std::pair<recv_spaces_t::iterator,bool> p = recv_spaces.insert(
|
|
|
|
std::make_pair(space_id, fname));
|
|
|
|
ut_ad(p.first->first == space_id);
|
|
|
|
|
|
|
|
file_name_t& f = p.first->second;
|
|
|
|
|
|
|
|
if (deleted) {
|
|
|
|
/* Got MLOG_FILE_DELETE */
|
|
|
|
|
2018-03-27 13:47:56 +05:30
|
|
|
if (!p.second && f.status != file_name_t::DELETED) {
|
|
|
|
f.status = file_name_t::DELETED;
|
2016-08-12 11:17:45 +03:00
|
|
|
if (f.space != NULL) {
|
|
|
|
fil_space_free(space_id, false);
|
|
|
|
f.space = NULL;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
ut_ad(f.space == NULL);
|
|
|
|
} else if (p.second // the first MLOG_FILE_NAME or MLOG_FILE_RENAME2
|
|
|
|
|| f.name != fname.name) {
|
|
|
|
fil_space_t* space;
|
|
|
|
|
|
|
|
/* Check if the tablespace file exists and contains
|
|
|
|
the space_id. If not, ignore the file after displaying
|
|
|
|
a note. Abort if there are multiple files with the
|
|
|
|
same space_id. */
|
|
|
|
switch (fil_ibd_load(space_id, name, space)) {
|
|
|
|
case FIL_LOAD_OK:
|
|
|
|
ut_ad(space != NULL);
|
|
|
|
|
|
|
|
if (f.space == NULL || f.space == space) {
|
|
|
|
f.name = fname.name;
|
|
|
|
f.space = space;
|
2018-03-27 13:47:56 +05:30
|
|
|
f.status = file_name_t::NORMAL;
|
2016-08-12 11:17:45 +03:00
|
|
|
} else {
|
|
|
|
ib::error() << "Tablespace " << space_id
|
|
|
|
<< " has been found in two places: '"
|
|
|
|
<< f.name << "' and '" << name << "'."
|
|
|
|
" You must delete one of them.";
|
|
|
|
recv_sys->found_corrupt_fs = true;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case FIL_LOAD_ID_CHANGED:
|
|
|
|
ut_ad(space == NULL);
|
|
|
|
break;
|
|
|
|
|
|
|
|
case FIL_LOAD_NOT_FOUND:
|
|
|
|
/* No matching tablespace was found; maybe it
|
|
|
|
was renamed, and we will find a subsequent
|
|
|
|
MLOG_FILE_* record. */
|
|
|
|
ut_ad(space == NULL);
|
|
|
|
|
|
|
|
if (srv_force_recovery) {
|
|
|
|
/* Without innodb_force_recovery,
|
|
|
|
missing tablespaces will only be
|
|
|
|
reported in
|
|
|
|
recv_init_crash_recovery_spaces().
|
|
|
|
Enable some more diagnostics when
|
|
|
|
forcing recovery. */
|
|
|
|
|
|
|
|
ib::info()
|
|
|
|
<< "At LSN: " << recv_sys->recovered_lsn
|
|
|
|
<< ": unable to open file " << name
|
|
|
|
<< " for tablespace " << space_id;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case FIL_LOAD_INVALID:
|
|
|
|
ut_ad(space == NULL);
|
|
|
|
if (srv_force_recovery == 0) {
|
|
|
|
ib::warn() << "We do not continue the crash"
|
|
|
|
" recovery, because the table may"
|
|
|
|
" become corrupt if we cannot apply"
|
|
|
|
" the log records in the InnoDB log to"
|
|
|
|
" it. To fix the problem and start"
|
|
|
|
" mysqld:";
|
|
|
|
ib::info() << "1) If there is a permission"
|
|
|
|
" problem in the file and mysqld"
|
|
|
|
" cannot open the file, you should"
|
|
|
|
" modify the permissions.";
|
|
|
|
ib::info() << "2) If the tablespace is not"
|
|
|
|
" needed, or you can restore an older"
|
|
|
|
" version from a backup, then you can"
|
|
|
|
" remove the .ibd file, and use"
|
|
|
|
" --innodb_force_recovery=1 to force"
|
|
|
|
" startup without this file.";
|
|
|
|
ib::info() << "3) If the file system or the"
|
|
|
|
" disk is broken, and you cannot"
|
|
|
|
" remove the .ibd file, you can set"
|
|
|
|
" --innodb_force_recovery.";
|
|
|
|
recv_sys->found_corrupt_fs = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
ib::info() << "innodb_force_recovery was set to "
|
|
|
|
<< srv_force_recovery << ". Continuing crash"
|
|
|
|
" recovery even though we cannot access the"
|
|
|
|
" files for tablespace " << space_id << ".";
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/** Parse or process a MLOG_FILE_* record.
|
|
|
|
@param[in] ptr redo log record
|
|
|
|
@param[in] end end of the redo log buffer
|
|
|
|
@param[in] space_id the tablespace ID
|
|
|
|
@param[in] first_page_no first page number in the file
|
|
|
|
@param[in] type MLOG_FILE_NAME or MLOG_FILE_DELETE
|
|
|
|
or MLOG_FILE_CREATE2 or MLOG_FILE_RENAME2
|
|
|
|
@param[in] apply whether to apply the record
|
|
|
|
@return pointer to next redo log record
|
|
|
|
@retval NULL if this log record was truncated */
|
|
|
|
static
|
|
|
|
byte*
|
|
|
|
fil_name_parse(
|
|
|
|
byte* ptr,
|
|
|
|
const byte* end,
|
|
|
|
ulint space_id,
|
|
|
|
ulint first_page_no,
|
|
|
|
mlog_id_t type,
|
|
|
|
bool apply)
|
|
|
|
{
|
|
|
|
if (type == MLOG_FILE_CREATE2) {
|
|
|
|
if (end < ptr + 4) {
|
|
|
|
return(NULL);
|
|
|
|
}
|
|
|
|
ptr += 4;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (end < ptr + 2) {
|
|
|
|
return(NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
ulint len = mach_read_from_2(ptr);
|
|
|
|
ptr += 2;
|
|
|
|
if (end < ptr + len) {
|
|
|
|
return(NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* MLOG_FILE_* records should only be written for
|
|
|
|
user-created tablespaces. The name must be long enough
|
|
|
|
and end in .ibd. */
|
|
|
|
bool corrupt = is_predefined_tablespace(space_id)
|
|
|
|
|| len < sizeof "/a.ibd\0"
|
MDEV-13564 Mariabackup does not work with TRUNCATE
Implement undo tablespace truncation via normal redo logging.
Implement TRUNCATE TABLE as a combination of RENAME to #sql-ib name,
CREATE, and DROP.
Note: Orphan #sql-ib*.ibd may be left behind if MariaDB Server 10.2
is killed before the DROP operation is committed. If MariaDB Server 10.2
is killed during TRUNCATE, it is also possible that the old table
was renamed to #sql-ib*.ibd but the data dictionary will refer to the
table using the original name.
In MariaDB Server 10.3, RENAME inside InnoDB is transactional,
and #sql-* tables will be dropped on startup. So, this new TRUNCATE
will be fully crash-safe in 10.3.
ha_mroonga::wrapper_truncate(): Pass table options to the underlying
storage engine, now that ha_innobase::truncate() will need them.
rpl_slave_state::truncate_state_table(): Before truncating
mysql.gtid_slave_pos, evict any cached table handles from
the table definition cache, so that there will be no stale
references to the old table after truncating.
== TRUNCATE TABLE ==
WL#6501 in MySQL 5.7 introduced separate log files for implementing
atomic and crash-safe TRUNCATE TABLE, instead of using the InnoDB
undo and redo log. Some convoluted logic was added to the InnoDB
crash recovery, and some extra synchronization (including a redo log
checkpoint) was introduced to make this work. This synchronization
has caused performance problems and race conditions, and the extra
log files cannot be copied or applied by external backup programs.
In order to support crash-upgrade from MariaDB 10.2, we will keep
the logic for parsing and applying the extra log files, but we will
no longer generate those files in TRUNCATE TABLE.
A prerequisite for crash-safe TRUNCATE is a crash-safe RENAME TABLE
(with full redo and undo logging and proper rollback). This will
be implemented in MDEV-14717.
ha_innobase::truncate(): Invoke RENAME, create(), delete_table().
Because RENAME cannot be fully rolled back before MariaDB 10.3
due to missing undo logging, add some explicit rename-back in
case the operation fails.
ha_innobase::delete(): Introduce a variant that takes sqlcom as
a parameter. In TRUNCATE TABLE, we do not want to touch any
FOREIGN KEY constraints.
ha_innobase::create(): Add the parameters file_per_table, trx.
In TRUNCATE, the new table must be created in the same transaction
that renames the old table.
create_table_info_t::create_table_info_t(): Add the parameters
file_per_table, trx.
row_drop_table_for_mysql(): Replace a bool parameter with sqlcom.
row_drop_table_after_create_fail(): New function, wrapping
row_drop_table_for_mysql().
dict_truncate_index_tree_in_mem(), fil_truncate_tablespace(),
fil_prepare_for_truncate(), fil_reinit_space_header_for_table(),
row_truncate_table_for_mysql(), TruncateLogger,
row_truncate_prepare(), row_truncate_rollback(),
row_truncate_complete(), row_truncate_fts(),
row_truncate_update_system_tables(),
row_truncate_foreign_key_checks(), row_truncate_sanity_checks():
Remove.
row_upd_check_references_constraints(): Remove a check for
TRUNCATE, now that the table is no longer truncated in place.
The new test innodb.truncate_foreign uses DEBUG_SYNC to cover some
race-condition like scenarios. The test innodb-innodb.truncate does
not use any synchronization.
We add a redo log subformat to indicate backup-friendly format.
MariaDB 10.4 will remove support for the old TRUNCATE logging,
so crash-upgrade from old 10.2 or 10.3 to 10.4 will involve
limitations.
== Undo tablespace truncation ==
MySQL 5.7 implements undo tablespace truncation. It is only
possible when innodb_undo_tablespaces is set to at least 2.
The logging is implemented similar to the WL#6501 TRUNCATE,
that is, using separate log files and a redo log checkpoint.
We can simply implement undo tablespace truncation within
a single mini-transaction that reinitializes the undo log
tablespace file. Unfortunately, due to the redo log format
of some operations, currently, the total redo log written by
undo tablespace truncation will be more than the combined size
of the truncated undo tablespace. It should be acceptable
to have a little more than 1 megabyte of log in a single
mini-transaction. This will be fixed in MDEV-17138 in
MariaDB Server 10.4.
recv_sys_t: Add truncated_undo_spaces[] to remember for which undo
tablespaces a MLOG_FILE_CREATE2 record was seen.
namespace undo: Remove some unnecessary declarations.
fil_space_t::is_being_truncated: Document that this flag now
only applies to undo tablespaces. Remove some references.
fil_space_t::is_stopping(): Do not refer to is_being_truncated.
This check is for tablespaces of tables. Potentially used
tablespaces are never truncated any more.
buf_dblwr_process(): Suppress the out-of-bounds warning
for undo tablespaces.
fil_truncate_log(): Write a MLOG_FILE_CREATE2 with a nonzero
page number (new size of the tablespace in pages) to inform
crash recovery that the undo tablespace size has been reduced.
fil_op_write_log(): Relax assertions, so that MLOG_FILE_CREATE2
can be written for undo tablespaces (without .ibd file suffix)
for a nonzero page number.
os_file_truncate(): Add the parameter allow_shrink=false
so that undo tablespaces can actually be shrunk using this function.
fil_name_parse(): For undo tablespace truncation,
buffer MLOG_FILE_CREATE2 in truncated_undo_spaces[].
recv_read_in_area(): Avoid reading pages for which no redo log
records remain buffered, after recv_addr_trim() removed them.
trx_rseg_header_create(): Add a FIXME comment that we could write
much less redo log.
trx_undo_truncate_tablespace(): Reinitialize the undo tablespace
in a single mini-transaction, which will be flushed to the redo log
before the file size is trimmed.
recv_addr_trim(): Discard any redo logs for pages that were
logged after the new end of a file, before the truncation LSN.
If the rec_list becomes empty, reduce n_addrs. After removing
any affected records, actually truncate the file.
recv_apply_hashed_log_recs(): Invoke recv_addr_trim() right before
applying any log records. The undo tablespace files must be open
at this point.
buf_flush_or_remove_pages(), buf_flush_dirty_pages(),
buf_LRU_flush_or_remove_pages(): Add a parameter for specifying
the number of the first page to flush or remove (default 0).
trx_purge_initiate_truncate(): Remove the log checkpoints, the
extra logging, and some unnecessary crash points. Merge the code
from trx_undo_truncate_tablespace(). First, flush all to-be-discarded
pages (beyond the new end of the file), then trim the space->size
to make the page allocation deterministic. At the only remaining
crash injection point, flush the redo log, so that the recovery
can be tested.
2018-08-28 13:43:06 +03:00
|
|
|
|| (!first_page_no != !memcmp(ptr + len - 5, DOT_IBD, 5))
|
2016-08-12 11:17:45 +03:00
|
|
|
|| memchr(ptr, OS_PATH_SEPARATOR, len) == NULL;
|
|
|
|
|
|
|
|
byte* end_ptr = ptr + len;
|
|
|
|
|
|
|
|
switch (type) {
|
|
|
|
default:
|
|
|
|
ut_ad(0); // the caller checked this
|
|
|
|
case MLOG_FILE_NAME:
|
|
|
|
if (corrupt) {
|
|
|
|
ib::error() << "MLOG_FILE_NAME incorrect:" << ptr;
|
|
|
|
recv_sys->found_corrupt_log = true;
|
|
|
|
break;
|
|
|
|
}
|
2016-09-06 09:43:16 +03:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
fil_name_process(
|
|
|
|
reinterpret_cast<char*>(ptr), len, space_id, false);
|
|
|
|
break;
|
|
|
|
case MLOG_FILE_DELETE:
|
|
|
|
if (corrupt) {
|
|
|
|
ib::error() << "MLOG_FILE_DELETE incorrect:" << ptr;
|
|
|
|
recv_sys->found_corrupt_log = true;
|
|
|
|
break;
|
|
|
|
}
|
2016-09-06 09:43:16 +03:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
fil_name_process(
|
|
|
|
reinterpret_cast<char*>(ptr), len, space_id, true);
|
2018-08-09 15:06:52 +01:00
|
|
|
/* fall through */
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_FILE_CREATE2:
|
MDEV-13564 Mariabackup does not work with TRUNCATE
Implement undo tablespace truncation via normal redo logging.
Implement TRUNCATE TABLE as a combination of RENAME to #sql-ib name,
CREATE, and DROP.
Note: Orphan #sql-ib*.ibd may be left behind if MariaDB Server 10.2
is killed before the DROP operation is committed. If MariaDB Server 10.2
is killed during TRUNCATE, it is also possible that the old table
was renamed to #sql-ib*.ibd but the data dictionary will refer to the
table using the original name.
In MariaDB Server 10.3, RENAME inside InnoDB is transactional,
and #sql-* tables will be dropped on startup. So, this new TRUNCATE
will be fully crash-safe in 10.3.
ha_mroonga::wrapper_truncate(): Pass table options to the underlying
storage engine, now that ha_innobase::truncate() will need them.
rpl_slave_state::truncate_state_table(): Before truncating
mysql.gtid_slave_pos, evict any cached table handles from
the table definition cache, so that there will be no stale
references to the old table after truncating.
== TRUNCATE TABLE ==
WL#6501 in MySQL 5.7 introduced separate log files for implementing
atomic and crash-safe TRUNCATE TABLE, instead of using the InnoDB
undo and redo log. Some convoluted logic was added to the InnoDB
crash recovery, and some extra synchronization (including a redo log
checkpoint) was introduced to make this work. This synchronization
has caused performance problems and race conditions, and the extra
log files cannot be copied or applied by external backup programs.
In order to support crash-upgrade from MariaDB 10.2, we will keep
the logic for parsing and applying the extra log files, but we will
no longer generate those files in TRUNCATE TABLE.
A prerequisite for crash-safe TRUNCATE is a crash-safe RENAME TABLE
(with full redo and undo logging and proper rollback). This will
be implemented in MDEV-14717.
ha_innobase::truncate(): Invoke RENAME, create(), delete_table().
Because RENAME cannot be fully rolled back before MariaDB 10.3
due to missing undo logging, add some explicit rename-back in
case the operation fails.
ha_innobase::delete(): Introduce a variant that takes sqlcom as
a parameter. In TRUNCATE TABLE, we do not want to touch any
FOREIGN KEY constraints.
ha_innobase::create(): Add the parameters file_per_table, trx.
In TRUNCATE, the new table must be created in the same transaction
that renames the old table.
create_table_info_t::create_table_info_t(): Add the parameters
file_per_table, trx.
row_drop_table_for_mysql(): Replace a bool parameter with sqlcom.
row_drop_table_after_create_fail(): New function, wrapping
row_drop_table_for_mysql().
dict_truncate_index_tree_in_mem(), fil_truncate_tablespace(),
fil_prepare_for_truncate(), fil_reinit_space_header_for_table(),
row_truncate_table_for_mysql(), TruncateLogger,
row_truncate_prepare(), row_truncate_rollback(),
row_truncate_complete(), row_truncate_fts(),
row_truncate_update_system_tables(),
row_truncate_foreign_key_checks(), row_truncate_sanity_checks():
Remove.
row_upd_check_references_constraints(): Remove a check for
TRUNCATE, now that the table is no longer truncated in place.
The new test innodb.truncate_foreign uses DEBUG_SYNC to cover some
race-condition like scenarios. The test innodb-innodb.truncate does
not use any synchronization.
We add a redo log subformat to indicate backup-friendly format.
MariaDB 10.4 will remove support for the old TRUNCATE logging,
so crash-upgrade from old 10.2 or 10.3 to 10.4 will involve
limitations.
== Undo tablespace truncation ==
MySQL 5.7 implements undo tablespace truncation. It is only
possible when innodb_undo_tablespaces is set to at least 2.
The logging is implemented similar to the WL#6501 TRUNCATE,
that is, using separate log files and a redo log checkpoint.
We can simply implement undo tablespace truncation within
a single mini-transaction that reinitializes the undo log
tablespace file. Unfortunately, due to the redo log format
of some operations, currently, the total redo log written by
undo tablespace truncation will be more than the combined size
of the truncated undo tablespace. It should be acceptable
to have a little more than 1 megabyte of log in a single
mini-transaction. This will be fixed in MDEV-17138 in
MariaDB Server 10.4.
recv_sys_t: Add truncated_undo_spaces[] to remember for which undo
tablespaces a MLOG_FILE_CREATE2 record was seen.
namespace undo: Remove some unnecessary declarations.
fil_space_t::is_being_truncated: Document that this flag now
only applies to undo tablespaces. Remove some references.
fil_space_t::is_stopping(): Do not refer to is_being_truncated.
This check is for tablespaces of tables. Potentially used
tablespaces are never truncated any more.
buf_dblwr_process(): Suppress the out-of-bounds warning
for undo tablespaces.
fil_truncate_log(): Write a MLOG_FILE_CREATE2 with a nonzero
page number (new size of the tablespace in pages) to inform
crash recovery that the undo tablespace size has been reduced.
fil_op_write_log(): Relax assertions, so that MLOG_FILE_CREATE2
can be written for undo tablespaces (without .ibd file suffix)
for a nonzero page number.
os_file_truncate(): Add the parameter allow_shrink=false
so that undo tablespaces can actually be shrunk using this function.
fil_name_parse(): For undo tablespace truncation,
buffer MLOG_FILE_CREATE2 in truncated_undo_spaces[].
recv_read_in_area(): Avoid reading pages for which no redo log
records remain buffered, after recv_addr_trim() removed them.
trx_rseg_header_create(): Add a FIXME comment that we could write
much less redo log.
trx_undo_truncate_tablespace(): Reinitialize the undo tablespace
in a single mini-transaction, which will be flushed to the redo log
before the file size is trimmed.
recv_addr_trim(): Discard any redo logs for pages that were
logged after the new end of a file, before the truncation LSN.
If the rec_list becomes empty, reduce n_addrs. After removing
any affected records, actually truncate the file.
recv_apply_hashed_log_recs(): Invoke recv_addr_trim() right before
applying any log records. The undo tablespace files must be open
at this point.
buf_flush_or_remove_pages(), buf_flush_dirty_pages(),
buf_LRU_flush_or_remove_pages(): Add a parameter for specifying
the number of the first page to flush or remove (default 0).
trx_purge_initiate_truncate(): Remove the log checkpoints, the
extra logging, and some unnecessary crash points. Merge the code
from trx_undo_truncate_tablespace(). First, flush all to-be-discarded
pages (beyond the new end of the file), then trim the space->size
to make the page allocation deterministic. At the only remaining
crash injection point, flush the redo log, so that the recovery
can be tested.
2018-08-28 13:43:06 +03:00
|
|
|
if (first_page_no) {
|
|
|
|
ut_ad(first_page_no
|
|
|
|
== SRV_UNDO_TABLESPACE_SIZE_IN_PAGES);
|
|
|
|
ut_a(srv_is_undo_tablespace(space_id));
|
|
|
|
compile_time_assert(
|
|
|
|
UT_ARR_SIZE(recv_sys->truncated_undo_spaces)
|
|
|
|
== TRX_SYS_MAX_UNDO_SPACES);
|
|
|
|
recv_sys_t::trunc& t = recv_sys->truncated_undo_spaces[
|
|
|
|
space_id - srv_undo_space_id_start];
|
|
|
|
t.lsn = recv_sys->recovered_lsn;
|
|
|
|
t.pages = uint32_t(first_page_no);
|
|
|
|
} else if (log_file_op) {
|
2018-08-09 15:06:52 +01:00
|
|
|
log_file_op(space_id,
|
|
|
|
type == MLOG_FILE_CREATE2 ? ptr - 4 : NULL,
|
|
|
|
ptr, len, NULL, 0);
|
|
|
|
}
|
2016-08-12 11:17:45 +03:00
|
|
|
break;
|
|
|
|
case MLOG_FILE_RENAME2:
|
|
|
|
if (corrupt) {
|
|
|
|
ib::error() << "MLOG_FILE_RENAME2 incorrect:" << ptr;
|
|
|
|
recv_sys->found_corrupt_log = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* The new name follows the old name. */
|
|
|
|
byte* new_name = end_ptr + 2;
|
|
|
|
if (end < new_name) {
|
|
|
|
return(NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
ulint new_len = mach_read_from_2(end_ptr);
|
|
|
|
|
|
|
|
if (end < end_ptr + 2 + new_len) {
|
|
|
|
return(NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
end_ptr += 2 + new_len;
|
|
|
|
|
|
|
|
corrupt = corrupt
|
|
|
|
|| new_len < sizeof "/a.ibd\0"
|
|
|
|
|| memcmp(new_name + new_len - 5, DOT_IBD, 5) != 0
|
|
|
|
|| !memchr(new_name, OS_PATH_SEPARATOR, new_len);
|
|
|
|
|
|
|
|
if (corrupt) {
|
2016-09-06 09:43:16 +03:00
|
|
|
ib::error() << "MLOG_FILE_RENAME2 new_name incorrect:" << ptr
|
|
|
|
<< " new_name: " << new_name;
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_sys->found_corrupt_log = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
fil_name_process(
|
|
|
|
reinterpret_cast<char*>(ptr), len,
|
|
|
|
space_id, false);
|
|
|
|
fil_name_process(
|
|
|
|
reinterpret_cast<char*>(new_name), new_len,
|
|
|
|
space_id, false);
|
|
|
|
|
2018-08-09 15:06:52 +01:00
|
|
|
if (log_file_op) {
|
|
|
|
log_file_op(space_id, NULL,
|
|
|
|
ptr, len, new_name, new_len);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (!apply) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
if (!fil_op_replay_rename(
|
|
|
|
space_id, first_page_no,
|
|
|
|
reinterpret_cast<const char*>(ptr),
|
|
|
|
reinterpret_cast<const char*>(new_name))) {
|
|
|
|
recv_sys->found_corrupt_fs = true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return(end_ptr);
|
|
|
|
}
|
|
|
|
|
2017-06-29 22:24:48 +03:00
|
|
|
/** Clean up after recv_sys_init() */
|
2014-02-26 19:11:54 +01:00
|
|
|
void
|
2017-06-29 22:24:48 +03:00
|
|
|
recv_sys_close()
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
|
|
|
if (recv_sys != NULL) {
|
2017-01-31 19:43:03 +02:00
|
|
|
recv_sys->dblwr.pages.clear();
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
if (recv_sys->addr_hash != NULL) {
|
|
|
|
hash_table_free(recv_sys->addr_hash);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (recv_sys->heap != NULL) {
|
|
|
|
mem_heap_free(recv_sys->heap);
|
|
|
|
}
|
2016-12-30 15:04:10 +02:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (recv_sys->flush_start != NULL) {
|
|
|
|
os_event_destroy(recv_sys->flush_start);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (recv_sys->flush_end != NULL) {
|
|
|
|
os_event_destroy(recv_sys->flush_end);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
2016-12-30 15:04:10 +02:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_free(recv_sys->buf);
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
ut_ad(!recv_writer_thread_active);
|
|
|
|
mutex_free(&recv_sys->writer_mutex);
|
|
|
|
|
|
|
|
mutex_free(&recv_sys->mutex);
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_free(recv_sys);
|
2014-02-26 19:11:54 +01:00
|
|
|
recv_sys = NULL;
|
|
|
|
}
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
recv_spaces.clear();
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
/************************************************************
|
|
|
|
Reset the state of the recovery system variables. */
|
|
|
|
void
|
|
|
|
recv_sys_var_init(void)
|
|
|
|
/*===================*/
|
|
|
|
{
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_recovery_on = false;
|
|
|
|
recv_needed_recovery = false;
|
|
|
|
recv_lsn_checks_on = false;
|
|
|
|
recv_no_ibuf_operations = false;
|
|
|
|
recv_previous_parsed_rec_type = MLOG_SINGLE_REC_FLAG;
|
2014-02-26 19:11:54 +01:00
|
|
|
recv_previous_parsed_rec_offset = 0;
|
|
|
|
recv_previous_parsed_rec_is_multi = 0;
|
|
|
|
recv_n_pool_free_frames = 256;
|
|
|
|
recv_max_page_lsn = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/******************************************************************//**
|
|
|
|
recv_writer thread tasked with flushing dirty pages from the buffer
|
|
|
|
pools.
|
|
|
|
@return a dummy parameter */
|
2016-08-12 11:17:45 +03:00
|
|
|
extern "C"
|
2014-02-26 19:11:54 +01:00
|
|
|
os_thread_ret_t
|
|
|
|
DECLARE_THREAD(recv_writer_thread)(
|
|
|
|
/*===============================*/
|
2016-06-21 14:21:03 +02:00
|
|
|
void* arg MY_ATTRIBUTE((unused)))
|
2014-02-26 19:11:54 +01:00
|
|
|
/*!< in: a dummy parameter required by
|
|
|
|
os_thread_create */
|
|
|
|
{
|
2017-01-06 19:48:54 +05:30
|
|
|
my_thread_init();
|
2014-02-26 19:11:54 +01:00
|
|
|
ut_ad(!srv_read_only_mode);
|
|
|
|
|
|
|
|
#ifdef UNIV_PFS_THREAD
|
2016-09-11 10:57:05 +02:00
|
|
|
pfs_register_thread(recv_writer_thread_key);
|
2014-02-26 19:11:54 +01:00
|
|
|
#endif /* UNIV_PFS_THREAD */
|
|
|
|
|
|
|
|
#ifdef UNIV_DEBUG_THREAD_CREATION
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::info() << "recv_writer thread running, id "
|
|
|
|
<< os_thread_pf(os_thread_get_curr_id());
|
2014-02-26 19:11:54 +01:00
|
|
|
#endif /* UNIV_DEBUG_THREAD_CREATION */
|
|
|
|
|
|
|
|
while (srv_shutdown_state == SRV_SHUTDOWN_NONE) {
|
|
|
|
|
2014-11-06 13:17:11 +02:00
|
|
|
/* Wait till we get a signal to clean the LRU list.
|
|
|
|
Bounded by max wait time of 100ms. */
|
2016-08-12 11:17:45 +03:00
|
|
|
ib_uint64_t sig_count = os_event_reset(buf_flush_event);
|
2014-11-06 13:17:11 +02:00
|
|
|
os_event_wait_time_low(buf_flush_event, 100000, sig_count);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
mutex_enter(&recv_sys->writer_mutex);
|
|
|
|
|
|
|
|
if (!recv_recovery_on) {
|
|
|
|
mutex_exit(&recv_sys->writer_mutex);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Flush pages from end of LRU if required */
|
2016-08-12 11:17:45 +03:00
|
|
|
os_event_reset(recv_sys->flush_end);
|
|
|
|
recv_sys->flush_type = BUF_FLUSH_LRU;
|
|
|
|
os_event_set(recv_sys->flush_start);
|
|
|
|
os_event_wait(recv_sys->flush_end);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
mutex_exit(&recv_sys->writer_mutex);
|
|
|
|
}
|
|
|
|
|
|
|
|
recv_writer_thread_active = false;
|
|
|
|
|
2017-01-06 19:48:54 +05:30
|
|
|
my_thread_end();
|
2014-02-26 19:11:54 +01:00
|
|
|
/* We count the number of threads in os_thread_exit().
|
|
|
|
A created thread should always use that to exit and not
|
|
|
|
use return() to exit. */
|
2016-09-06 09:43:16 +03:00
|
|
|
os_thread_exit();
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
OS_THREAD_DUMMY_RETURN;
|
|
|
|
}
|
|
|
|
|
2017-06-29 22:24:48 +03:00
|
|
|
/** Initialize the redo log recovery subsystem. */
|
2014-02-26 19:11:54 +01:00
|
|
|
void
|
2017-06-29 22:24:48 +03:00
|
|
|
recv_sys_init()
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
2017-06-29 22:24:48 +03:00
|
|
|
ut_ad(recv_sys == NULL);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-06-29 22:24:48 +03:00
|
|
|
recv_sys = static_cast<recv_sys_t*>(ut_zalloc_nokey(sizeof(*recv_sys)));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-06-29 22:24:48 +03:00
|
|
|
mutex_create(LATCH_ID_RECV_SYS, &recv_sys->mutex);
|
|
|
|
mutex_create(LATCH_ID_RECV_WRITER, &recv_sys->writer_mutex);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-06-29 22:24:48 +03:00
|
|
|
recv_sys->heap = mem_heap_create_typed(256, MEM_HEAP_FOR_RECV_SYS);
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
if (!srv_read_only_mode) {
|
|
|
|
recv_sys->flush_start = os_event_create(0);
|
|
|
|
recv_sys->flush_end = os_event_create(0);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-06-29 22:24:48 +03:00
|
|
|
ulint size = buf_pool_get_curr_size();
|
2014-02-26 19:11:54 +01:00
|
|
|
/* Set appropriate value of recv_n_pool_free_frames. */
|
2017-06-29 22:24:48 +03:00
|
|
|
if (size >= 10 << 20) {
|
2014-02-26 19:11:54 +01:00
|
|
|
/* Buffer pool of size greater than 10 MB. */
|
|
|
|
recv_n_pool_free_frames = 512;
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_sys->buf = static_cast<byte*>(
|
|
|
|
ut_malloc_nokey(RECV_PARSING_BUF_SIZE));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-06-29 22:24:48 +03:00
|
|
|
recv_sys->addr_hash = hash_create(size / 512);
|
2017-03-07 17:16:49 +02:00
|
|
|
recv_sys->progress_time = ut_time();
|
2014-02-26 19:11:54 +01:00
|
|
|
recv_max_page_lsn = 0;
|
|
|
|
|
2014-05-05 18:20:28 +02:00
|
|
|
/* Call the constructor for recv_sys_t::dblwr member */
|
|
|
|
new (&recv_sys->dblwr) recv_dblwr_t();
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
/** Empty a fully processed hash table. */
|
2014-02-26 19:11:54 +01:00
|
|
|
static
|
2016-09-06 09:43:16 +03:00
|
|
|
void
|
2017-03-07 17:16:49 +02:00
|
|
|
recv_sys_empty_hash()
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
|
|
|
ut_ad(mutex_own(&(recv_sys->mutex)));
|
2017-03-07 17:16:49 +02:00
|
|
|
ut_a(recv_sys->n_addrs == 0);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
hash_table_free(recv_sys->addr_hash);
|
|
|
|
mem_heap_empty(recv_sys->heap);
|
|
|
|
|
|
|
|
recv_sys->addr_hash = hash_create(buf_pool_get_curr_size() / 512);
|
|
|
|
}
|
|
|
|
|
|
|
|
/********************************************************//**
|
|
|
|
Frees the recovery system. */
|
|
|
|
void
|
|
|
|
recv_sys_debug_free(void)
|
|
|
|
/*=====================*/
|
|
|
|
{
|
|
|
|
mutex_enter(&(recv_sys->mutex));
|
|
|
|
|
|
|
|
hash_table_free(recv_sys->addr_hash);
|
|
|
|
mem_heap_free(recv_sys->heap);
|
|
|
|
ut_free(recv_sys->buf);
|
|
|
|
|
|
|
|
recv_sys->buf = NULL;
|
|
|
|
recv_sys->heap = NULL;
|
|
|
|
recv_sys->addr_hash = NULL;
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/* wake page cleaner up to progress */
|
|
|
|
if (!srv_read_only_mode) {
|
|
|
|
ut_ad(!recv_recovery_on);
|
|
|
|
ut_ad(!recv_writer_thread_active);
|
|
|
|
os_event_reset(buf_flush_event);
|
|
|
|
os_event_set(recv_sys->flush_start);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
mutex_exit(&(recv_sys->mutex));
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2017-02-10 12:11:42 +02:00
|
|
|
/** Read a log segment to a buffer.
|
|
|
|
@param[out] buf buffer
|
|
|
|
@param[in] group redo log files
|
2017-11-29 22:56:23 +00:00
|
|
|
@param[in, out] start_lsn in : read area start, out: the last read valid lsn
|
2017-02-10 12:11:42 +02:00
|
|
|
@param[in] end_lsn read area end
|
2017-11-29 22:56:23 +00:00
|
|
|
@param[out] invalid_block - invalid, (maybe incompletely written) block encountered
|
|
|
|
@return false, if invalid block encountered (e.g checksum mismatch), true otherwise */
|
|
|
|
bool
|
2017-02-10 12:11:42 +02:00
|
|
|
log_group_read_log_seg(
|
|
|
|
byte* buf,
|
|
|
|
const log_group_t* group,
|
2017-11-29 22:56:23 +00:00
|
|
|
lsn_t *start_lsn,
|
2017-02-10 12:11:42 +02:00
|
|
|
lsn_t end_lsn)
|
|
|
|
{
|
|
|
|
ulint len;
|
|
|
|
lsn_t source_offset;
|
2017-11-29 22:56:23 +00:00
|
|
|
bool success = true;
|
2017-02-10 12:11:42 +02:00
|
|
|
ut_ad(log_mutex_own());
|
2017-11-29 22:56:23 +00:00
|
|
|
ut_ad(!(*start_lsn % OS_FILE_LOG_BLOCK_SIZE));
|
2017-11-09 16:25:16 +00:00
|
|
|
ut_ad(!(end_lsn % OS_FILE_LOG_BLOCK_SIZE));
|
2017-02-10 12:11:42 +02:00
|
|
|
|
|
|
|
loop:
|
2017-11-29 22:56:23 +00:00
|
|
|
source_offset = log_group_calc_lsn_offset(*start_lsn, group);
|
2017-02-10 12:11:42 +02:00
|
|
|
|
2017-11-29 22:56:23 +00:00
|
|
|
ut_a(end_lsn - *start_lsn <= ULINT_MAX);
|
|
|
|
len = (ulint) (end_lsn - *start_lsn);
|
2017-02-10 12:11:42 +02:00
|
|
|
|
|
|
|
ut_ad(len != 0);
|
|
|
|
|
|
|
|
const bool at_eof = (source_offset % group->file_size) + len
|
|
|
|
> group->file_size;
|
|
|
|
if (at_eof) {
|
|
|
|
/* If the above condition is true then len (which is ulint)
|
|
|
|
is > the expression below, so the typecast is ok */
|
|
|
|
len = (ulint) (group->file_size -
|
|
|
|
(source_offset % group->file_size));
|
|
|
|
}
|
|
|
|
|
|
|
|
log_sys->n_log_ios++;
|
|
|
|
|
|
|
|
MONITOR_INC(MONITOR_LOG_IO);
|
|
|
|
|
|
|
|
ut_a(source_offset / UNIV_PAGE_SIZE <= ULINT_MAX);
|
|
|
|
|
|
|
|
const ulint page_no
|
|
|
|
= (ulint) (source_offset / univ_page_size.physical());
|
|
|
|
|
|
|
|
fil_io(IORequestLogRead, true,
|
2017-05-26 14:04:19 +03:00
|
|
|
page_id_t(SRV_LOG_SPACE_FIRST_ID, page_no),
|
2017-02-10 12:11:42 +02:00
|
|
|
univ_page_size,
|
|
|
|
(ulint) (source_offset % univ_page_size.physical()),
|
|
|
|
len, buf, NULL);
|
|
|
|
|
|
|
|
for (ulint l = 0; l < len; l += OS_FILE_LOG_BLOCK_SIZE,
|
|
|
|
buf += OS_FILE_LOG_BLOCK_SIZE,
|
2017-11-29 22:56:23 +00:00
|
|
|
(*start_lsn) += OS_FILE_LOG_BLOCK_SIZE) {
|
2017-02-10 12:11:42 +02:00
|
|
|
const ulint block_number = log_block_get_hdr_no(buf);
|
|
|
|
|
2017-11-29 22:56:23 +00:00
|
|
|
if (block_number != log_block_convert_lsn_to_no(*start_lsn)) {
|
2017-02-10 12:11:42 +02:00
|
|
|
/* Garbage or an incompletely written log block.
|
|
|
|
We will not report any error, because this can
|
|
|
|
happen when InnoDB was killed while it was
|
|
|
|
writing redo log. We simply treat this as an
|
|
|
|
abrupt end of the redo log. */
|
2017-11-29 22:56:23 +00:00
|
|
|
end_lsn = *start_lsn;
|
2017-03-07 17:16:49 +02:00
|
|
|
break;
|
2017-02-10 12:11:42 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
if (innodb_log_checksums || group->is_encrypted()) {
|
|
|
|
ulint crc = log_block_calc_checksum_crc32(buf);
|
|
|
|
ulint cksum = log_block_get_checksum(buf);
|
|
|
|
|
2017-11-29 22:56:23 +00:00
|
|
|
DBUG_EXECUTE_IF("log_intermittent_checksum_mismatch", {
|
|
|
|
static int block_counter;
|
|
|
|
if (block_counter++ == 0) {
|
|
|
|
cksum = crc + 1;
|
|
|
|
}
|
|
|
|
});
|
|
|
|
|
2017-02-10 12:11:42 +02:00
|
|
|
if (crc != cksum) {
|
|
|
|
ib::error() << "Invalid log block checksum."
|
|
|
|
<< " block: " << block_number
|
|
|
|
<< " checkpoint no: "
|
|
|
|
<< log_block_get_checkpoint_no(buf)
|
|
|
|
<< " expected: " << crc
|
|
|
|
<< " found: " << cksum;
|
2017-11-29 22:56:23 +00:00
|
|
|
end_lsn = *start_lsn;
|
|
|
|
success = false;
|
2017-03-07 17:16:49 +02:00
|
|
|
break;
|
2017-02-10 12:11:42 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
if (group->is_encrypted()) {
|
2017-11-29 22:56:23 +00:00
|
|
|
log_crypt(buf, *start_lsn,
|
2017-09-11 16:47:23 +03:00
|
|
|
OS_FILE_LOG_BLOCK_SIZE, true);
|
2017-02-10 12:11:42 +02:00
|
|
|
}
|
|
|
|
}
|
2018-08-09 19:42:46 +03:00
|
|
|
|
|
|
|
ulint dl = log_block_get_data_len(buf);
|
|
|
|
if (dl < LOG_BLOCK_HDR_SIZE
|
|
|
|
|| (dl > OS_FILE_LOG_BLOCK_SIZE - LOG_BLOCK_TRL_SIZE
|
|
|
|
&& dl != OS_FILE_LOG_BLOCK_SIZE)) {
|
|
|
|
recv_sys->found_corrupt_log = true;
|
|
|
|
end_lsn = *start_lsn;
|
|
|
|
break;
|
|
|
|
}
|
2017-02-10 12:11:42 +02:00
|
|
|
}
|
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
if (recv_sys->report(ut_time())) {
|
2017-11-29 22:56:23 +00:00
|
|
|
ib::info() << "Read redo log up to LSN=" << *start_lsn;
|
2018-04-10 17:43:18 +03:00
|
|
|
service_manager_extend_timeout(INNODB_EXTEND_TIMEOUT_INTERVAL,
|
|
|
|
"Read redo log up to LSN=" LSN_PF,
|
|
|
|
*start_lsn);
|
2017-03-07 17:16:49 +02:00
|
|
|
}
|
2017-02-10 12:11:42 +02:00
|
|
|
|
2017-11-29 22:56:23 +00:00
|
|
|
if (*start_lsn != end_lsn) {
|
2017-02-10 12:11:42 +02:00
|
|
|
goto loop;
|
|
|
|
}
|
|
|
|
|
2017-11-29 22:56:23 +00:00
|
|
|
return(success);
|
2017-02-10 12:11:42 +02:00
|
|
|
}
|
|
|
|
|
2017-11-29 22:56:23 +00:00
|
|
|
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
/********************************************************//**
|
|
|
|
Copies a log segment from the most up-to-date log group to the other log
|
|
|
|
groups, so that they all contain the latest log data. Also writes the info
|
|
|
|
about the latest checkpoint to the groups, and inits the fields in the group
|
|
|
|
memory structs to up-to-date values. */
|
|
|
|
static
|
|
|
|
void
|
2017-02-10 12:11:42 +02:00
|
|
|
recv_synchronize_groups()
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
2017-02-10 19:32:03 +02:00
|
|
|
const lsn_t recovered_lsn = recv_sys->recovered_lsn;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/* Read the last recovered log block to the recovery system buffer:
|
|
|
|
the block is always incomplete */
|
|
|
|
|
2017-11-29 22:56:23 +00:00
|
|
|
lsn_t start_lsn = ut_uint64_align_down(recovered_lsn,
|
2017-02-10 19:32:03 +02:00
|
|
|
OS_FILE_LOG_BLOCK_SIZE);
|
2017-05-26 14:04:19 +03:00
|
|
|
log_group_read_log_seg(log_sys->buf, &log_sys->log,
|
2017-11-29 22:56:23 +00:00
|
|
|
&start_lsn, start_lsn + OS_FILE_LOG_BLOCK_SIZE);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
/* Update the fields in the group struct to correspond to
|
|
|
|
recovered_lsn */
|
2017-02-10 19:32:03 +02:00
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
log_group_set_fields(&log_sys->log, recovered_lsn);
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
/* Copy the checkpoint info to the log; remember that we have
|
2014-02-26 19:11:54 +01:00
|
|
|
incremented checkpoint_no by one, and the info will not be written
|
|
|
|
over the max checkpoint info, thus making the preservation of max
|
|
|
|
checkpoint info on disk certain */
|
|
|
|
|
2017-02-10 12:11:42 +02:00
|
|
|
if (!srv_read_only_mode) {
|
2017-03-01 23:43:37 +02:00
|
|
|
log_write_checkpoint_info(true, 0);
|
2017-02-10 12:11:42 +02:00
|
|
|
log_mutex_enter();
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Check the consistency of a log header block.
|
|
|
|
@param[in] log header block
|
|
|
|
@return true if ok */
|
2014-02-26 19:11:54 +01:00
|
|
|
static
|
2016-08-12 11:17:45 +03:00
|
|
|
bool
|
|
|
|
recv_check_log_header_checksum(
|
|
|
|
const byte* buf)
|
|
|
|
{
|
|
|
|
return(log_block_get_checksum(buf)
|
|
|
|
== log_block_calc_checksum_crc32(buf));
|
|
|
|
}
|
|
|
|
|
|
|
|
/** Find the latest checkpoint in the format-0 log header.
|
|
|
|
@param[out] max_group log group, or NULL
|
|
|
|
@param[out] max_field LOG_CHECKPOINT_1 or LOG_CHECKPOINT_2
|
|
|
|
@return error code or DB_SUCCESS */
|
2016-09-06 09:43:16 +03:00
|
|
|
static MY_ATTRIBUTE((warn_unused_result))
|
2016-08-12 11:17:45 +03:00
|
|
|
dberr_t
|
2017-05-26 14:04:19 +03:00
|
|
|
recv_find_max_checkpoint_0(log_group_t** max_group, ulint* max_field)
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
2017-05-26 14:04:19 +03:00
|
|
|
log_group_t* group = &log_sys->log;
|
2016-08-12 11:17:45 +03:00
|
|
|
ib_uint64_t max_no = 0;
|
|
|
|
ib_uint64_t checkpoint_no;
|
|
|
|
byte* buf = log_sys->checkpoint_buf;
|
|
|
|
|
|
|
|
ut_ad(group->format == 0);
|
|
|
|
|
|
|
|
/** Offset of the first checkpoint checksum */
|
|
|
|
static const uint CHECKSUM_1 = 288;
|
|
|
|
/** Offset of the second checkpoint checksum */
|
|
|
|
static const uint CHECKSUM_2 = CHECKSUM_1 + 4;
|
|
|
|
/** Most significant bits of the checkpoint offset */
|
|
|
|
static const uint OFFSET_HIGH32 = CHECKSUM_2 + 12;
|
|
|
|
/** Least significant bits of the checkpoint offset */
|
|
|
|
static const uint OFFSET_LOW32 = 16;
|
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
*max_group = NULL;
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
for (ulint field = LOG_CHECKPOINT_1; field <= LOG_CHECKPOINT_2;
|
|
|
|
field += LOG_CHECKPOINT_2 - LOG_CHECKPOINT_1) {
|
|
|
|
log_group_header_read(group, field);
|
|
|
|
|
|
|
|
if (static_cast<uint32_t>(ut_fold_binary(buf, CHECKSUM_1))
|
|
|
|
!= mach_read_from_4(buf + CHECKSUM_1)
|
|
|
|
|| static_cast<uint32_t>(
|
|
|
|
ut_fold_binary(buf + LOG_CHECKPOINT_LSN,
|
|
|
|
CHECKSUM_2 - LOG_CHECKPOINT_LSN))
|
|
|
|
!= mach_read_from_4(buf + CHECKSUM_2)) {
|
2017-01-24 10:29:29 +02:00
|
|
|
DBUG_LOG("ib_log",
|
|
|
|
"invalid pre-10.2.2 checkpoint " << field);
|
2016-08-12 11:17:45 +03:00
|
|
|
continue;
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
checkpoint_no = mach_read_from_8(
|
|
|
|
buf + LOG_CHECKPOINT_NO);
|
|
|
|
|
2017-02-10 20:26:02 +02:00
|
|
|
if (!log_crypt_101_read_checkpoint(buf)) {
|
2017-02-10 12:11:42 +02:00
|
|
|
ib::error() << "Decrypting checkpoint failed";
|
2017-01-24 10:29:29 +02:00
|
|
|
continue;
|
2016-09-06 09:43:16 +03:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
DBUG_PRINT("ib_log",
|
2017-05-26 14:04:19 +03:00
|
|
|
("checkpoint " UINT64PF " at " LSN_PF " found",
|
2017-08-07 17:21:30 +03:00
|
|
|
checkpoint_no,
|
|
|
|
mach_read_from_8(buf + LOG_CHECKPOINT_LSN)));
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
if (checkpoint_no >= max_no) {
|
|
|
|
*max_group = group;
|
|
|
|
*max_field = field;
|
|
|
|
max_no = checkpoint_no;
|
2017-08-07 17:21:30 +03:00
|
|
|
|
|
|
|
group->state = LOG_GROUP_OK;
|
|
|
|
|
|
|
|
group->lsn = mach_read_from_8(
|
|
|
|
buf + LOG_CHECKPOINT_LSN);
|
|
|
|
group->lsn_offset = static_cast<ib_uint64_t>(
|
|
|
|
mach_read_from_4(buf + OFFSET_HIGH32)) << 32
|
|
|
|
| mach_read_from_4(buf + OFFSET_LOW32);
|
2016-08-12 11:17:45 +03:00
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (*max_group != NULL) {
|
|
|
|
return(DB_SUCCESS);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::error() << "Upgrade after a crash is not supported."
|
2017-01-24 10:29:29 +02:00
|
|
|
" This redo log was created before MariaDB 10.2.2,"
|
2016-08-12 11:17:45 +03:00
|
|
|
" and we did not find a valid checkpoint."
|
|
|
|
" Please follow the instructions at"
|
2018-01-10 13:53:44 +02:00
|
|
|
" https://mariadb.com/kb/en/library/upgrading/";
|
2016-08-12 11:17:45 +03:00
|
|
|
return(DB_ERROR);
|
|
|
|
}
|
|
|
|
|
2017-01-24 10:29:29 +02:00
|
|
|
/** Determine if a pre-MySQL 5.7.9/MariaDB 10.2.2 redo log is clean.
|
2016-08-12 11:17:45 +03:00
|
|
|
@param[in] lsn checkpoint LSN
|
2018-06-04 11:31:39 +03:00
|
|
|
@param[in] crypt whether the log might be encrypted
|
2016-08-12 11:17:45 +03:00
|
|
|
@return error code
|
|
|
|
@retval DB_SUCCESS if the redo log is clean
|
|
|
|
@retval DB_ERROR if the redo log is corrupted or dirty */
|
2018-06-04 11:31:39 +03:00
|
|
|
static dberr_t recv_log_format_0_recover(lsn_t lsn, bool crypt)
|
2016-08-12 11:17:45 +03:00
|
|
|
{
|
|
|
|
log_mutex_enter();
|
2017-05-26 14:04:19 +03:00
|
|
|
log_group_t* group = &log_sys->log;
|
2016-08-12 11:17:45 +03:00
|
|
|
const lsn_t source_offset
|
|
|
|
= log_group_calc_lsn_offset(lsn, group);
|
|
|
|
log_mutex_exit();
|
|
|
|
const ulint page_no
|
|
|
|
= (ulint) (source_offset / univ_page_size.physical());
|
|
|
|
byte* buf = log_sys->buf;
|
|
|
|
|
|
|
|
static const char* NO_UPGRADE_RECOVERY_MSG =
|
|
|
|
"Upgrade after a crash is not supported."
|
2017-01-24 10:29:29 +02:00
|
|
|
" This redo log was created before MariaDB 10.2.2";
|
2016-08-12 11:17:45 +03:00
|
|
|
static const char* NO_UPGRADE_RTFM_MSG =
|
|
|
|
". Please follow the instructions at "
|
2018-01-10 13:53:44 +02:00
|
|
|
"https://mariadb.com/kb/en/library/upgrading/";
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
fil_io(IORequestLogRead, true,
|
2017-05-26 14:04:19 +03:00
|
|
|
page_id_t(SRV_LOG_SPACE_FIRST_ID, page_no),
|
2016-08-12 11:17:45 +03:00
|
|
|
univ_page_size,
|
|
|
|
(ulint) ((source_offset & ~(OS_FILE_LOG_BLOCK_SIZE - 1))
|
|
|
|
% univ_page_size.physical()),
|
MDEV-11254: innodb-use-trim has no effect in 10.2
Problem was that implementation merged from 10.1 was incompatible
with InnoDB 5.7.
buf0buf.cc: Add functions to return should we punch hole and
how big.
buf0flu.cc: Add written page to IORequest
fil0fil.cc: Remove unneeded status call and add test is
sparse files and punch hole supported by file system when
tablespace is created. Add call to get file system
block size. Used file node is added to IORequest. Added
functions to check is punch hole supported and setting
punch hole.
ha_innodb.cc: Remove unneeded status variables (trim512-32768)
and trim_op_saved. Deprecate innodb_use_trim and
set it ON by default. Add function to set innodb-use-trim
dynamically.
dberr.h: Add error code DB_IO_NO_PUNCH_HOLE
if punch hole operation fails.
fil0fil.h: Add punch_hole variable to fil_space_t and
block size to fil_node_t.
os0api.h: Header to helper functions on buf0buf.cc and
fil0fil.cc for os0file.h
os0file.h: Remove unneeded m_block_size from IORequest
and add bpage to IORequest to know actual size of
the block and m_fil_node to know tablespace file
system block size and does it support punch hole.
os0file.cc: Add function punch_hole() to IORequest
to do punch_hole operation,
get the file system block size and determine
does file system support sparse files (for punch hole).
page0size.h: remove implicit copy disable and
use this implicit copy to implement copy_from()
function.
buf0dblwr.cc, buf0flu.cc, buf0rea.cc, fil0fil.cc, fil0fil.h,
os0file.h, os0file.cc, log0log.cc, log0recv.cc:
Remove unneeded write_size parameter from fil_io
calls.
srv0mon.h, srv0srv.h, srv0mon.cc: Remove unneeded
trim512-trim32678 status variables. Removed
these from monitor tests.
2017-01-24 14:40:58 +02:00
|
|
|
OS_FILE_LOG_BLOCK_SIZE, buf, NULL);
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
if (log_block_calc_checksum_format_0(buf)
|
2017-02-10 20:26:02 +02:00
|
|
|
!= log_block_get_checksum(buf)
|
|
|
|
&& !log_crypt_101_read_block(buf)) {
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::error() << NO_UPGRADE_RECOVERY_MSG
|
|
|
|
<< ", and it appears corrupted"
|
|
|
|
<< NO_UPGRADE_RTFM_MSG;
|
|
|
|
return(DB_CORRUPTION);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (log_block_get_data_len(buf)
|
2018-06-04 11:31:39 +03:00
|
|
|
== (source_offset & (OS_FILE_LOG_BLOCK_SIZE - 1))) {
|
|
|
|
} else if (crypt) {
|
|
|
|
ib::error() << "Cannot decrypt log for upgrading."
|
|
|
|
" The encrypted log was created before MariaDB 10.2.2"
|
|
|
|
<< NO_UPGRADE_RTFM_MSG;
|
|
|
|
return DB_ERROR;
|
|
|
|
} else {
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::error() << NO_UPGRADE_RECOVERY_MSG
|
|
|
|
<< NO_UPGRADE_RTFM_MSG;
|
|
|
|
return(DB_ERROR);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Mark the redo log for upgrading. */
|
|
|
|
srv_log_file_size = 0;
|
|
|
|
recv_sys->parse_start_lsn = recv_sys->recovered_lsn
|
|
|
|
= recv_sys->scanned_lsn
|
|
|
|
= recv_sys->mlog_checkpoint_lsn = lsn;
|
|
|
|
log_sys->last_checkpoint_lsn = log_sys->next_checkpoint_lsn
|
|
|
|
= log_sys->lsn = log_sys->write_lsn
|
|
|
|
= log_sys->current_flush_lsn = log_sys->flushed_to_disk_lsn
|
|
|
|
= lsn;
|
|
|
|
log_sys->next_checkpoint_no = 0;
|
|
|
|
return(DB_SUCCESS);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2018-01-10 13:18:02 +02:00
|
|
|
/** Determine if a redo log from MariaDB 10.3 is clean.
|
|
|
|
@return error code
|
|
|
|
@retval DB_SUCCESS if the redo log is clean
|
|
|
|
@retval DB_CORRUPTION if the redo log is corrupted
|
|
|
|
@retval DB_ERROR if the redo log is not empty */
|
|
|
|
static
|
|
|
|
dberr_t
|
|
|
|
recv_log_recover_10_3()
|
|
|
|
{
|
|
|
|
log_group_t* group = &log_sys->log;
|
|
|
|
const lsn_t lsn = group->lsn;
|
|
|
|
const lsn_t source_offset = log_group_calc_lsn_offset(lsn, group);
|
|
|
|
const ulint page_no
|
|
|
|
= (ulint) (source_offset / univ_page_size.physical());
|
|
|
|
byte* buf = log_sys->buf;
|
|
|
|
|
|
|
|
fil_io(IORequestLogRead, true,
|
|
|
|
page_id_t(SRV_LOG_SPACE_FIRST_ID, page_no),
|
|
|
|
univ_page_size,
|
|
|
|
(ulint) ((source_offset & ~(OS_FILE_LOG_BLOCK_SIZE - 1))
|
|
|
|
% univ_page_size.physical()),
|
|
|
|
OS_FILE_LOG_BLOCK_SIZE, buf, NULL);
|
|
|
|
|
|
|
|
if (log_block_calc_checksum(buf) != log_block_get_checksum(buf)) {
|
|
|
|
return(DB_CORRUPTION);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (group->is_encrypted()) {
|
|
|
|
log_crypt(buf, lsn, OS_FILE_LOG_BLOCK_SIZE, true);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* On a clean shutdown, the redo log will be logically empty
|
|
|
|
after the checkpoint lsn. */
|
|
|
|
|
|
|
|
if (log_block_get_data_len(buf)
|
|
|
|
!= (source_offset & (OS_FILE_LOG_BLOCK_SIZE - 1))) {
|
|
|
|
return(DB_ERROR);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Mark the redo log for downgrading. */
|
|
|
|
srv_log_file_size = 0;
|
|
|
|
recv_sys->parse_start_lsn = recv_sys->recovered_lsn
|
|
|
|
= recv_sys->scanned_lsn
|
|
|
|
= recv_sys->mlog_checkpoint_lsn = lsn;
|
|
|
|
log_sys->last_checkpoint_lsn = log_sys->next_checkpoint_lsn
|
|
|
|
= log_sys->lsn = log_sys->write_lsn
|
|
|
|
= log_sys->current_flush_lsn = log_sys->flushed_to_disk_lsn
|
|
|
|
= lsn;
|
|
|
|
log_sys->next_checkpoint_no = 0;
|
|
|
|
return(DB_SUCCESS);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Find the latest checkpoint in the log header.
|
|
|
|
@param[out] max_field LOG_CHECKPOINT_1 or LOG_CHECKPOINT_2
|
|
|
|
@return error code or DB_SUCCESS */
|
2014-02-26 19:11:54 +01:00
|
|
|
dberr_t
|
2017-05-26 14:04:19 +03:00
|
|
|
recv_find_max_checkpoint(ulint* max_field)
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
|
|
|
log_group_t* group;
|
|
|
|
ib_uint64_t max_no;
|
|
|
|
ib_uint64_t checkpoint_no;
|
|
|
|
ulint field;
|
|
|
|
byte* buf;
|
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
group = &log_sys->log;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
max_no = 0;
|
|
|
|
*max_field = 0;
|
|
|
|
|
|
|
|
buf = log_sys->checkpoint_buf;
|
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
group->state = LOG_GROUP_CORRUPTED;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
log_group_header_read(group, 0);
|
|
|
|
/* Check the header page checksum. There was no
|
|
|
|
checksum in the first redo log format (version 0). */
|
|
|
|
group->format = mach_read_from_4(buf + LOG_HEADER_FORMAT);
|
MDEV-14717: Prevent crash-downgrade to earlier MariaDB 10.2
A crash-downgrade of a RENAME (or TRUNCATE or table-rebuilding
ALTER TABLE or OPTIMIZE TABLE) operation to an earlier 10.2 version
would trigger a debug assertion failure during rollback,
in trx_roll_pop_top_rec_of_trx(). In a non-debug build, the
TRX_UNDO_RENAME_TABLE record would be misinterpreted as an
update_undo log record, and typically the file name would be
interpreted as DB_TRX_ID,DB_ROLL_PTR,PRIMARY KEY. If a matching
record would be found, row_undo_mod() would hit ut_error in
switch (node->rec_type). Typically, ut_a(table2 == NULL) would
fail when opening the table from SQL.
Because of this, we prevent a crash-downgrade to earlier MariaDB 10.2
versions by changing the InnoDB redo log format identifier to the
10.3 identifier, and by introducing a subformat identifier so that
10.2 can continue to refuse crash-downgrade from 10.3 or later.
After a clean shutdown, a downgrade to MariaDB 10.2.13 or later would
still be possible thanks to MDEV-14909. A downgrade to older 10.2
versions is only possible after removing the log files (not recommended).
LOG_HEADER_FORMAT_CURRENT: Change to 103 (originally the 10.3 format).
log_group_t: Add subformat. For 10.2, we will use subformat 1,
and will refuse crash recovery from any other subformat of the
10.3 format, that is, a genuine 10.3 redo log.
recv_find_max_checkpoint(): Allow startup after clean shutdown
from a future LOG_HEADER_FORMAT_10_4 (unencrypted only).
We cannot handle the encrypted 10.4 redo log block format,
which was introduced in MDEV-12041. Allow crash recovery from
the original 10.2 format as well as the new format.
In Mariabackup --backup, do not allow any startup from 10.3 or 10.4
redo logs.
recv_recovery_from_checkpoint_start(): Skip redo log apply for
clean 10.3 redo log, but not for the new 10.2 redo log
(10.3 format, subformat 1).
srv_prepare_to_delete_redo_log_files(): On format or subformat
mismatch, set srv_log_file_size = 0, so that we will display the
correct message.
innobase_start_or_create_for_mysql(): Check for format or subformat
mismatch.
xtrabackup_backup_func(): Remove debug assertions that were made
redundant by the code changes in recv_find_max_checkpoint().
2018-09-07 17:24:31 +03:00
|
|
|
group->subformat = group->format
|
|
|
|
? mach_read_from_4(buf + LOG_HEADER_SUBFORMAT)
|
|
|
|
: 0;
|
2017-05-26 14:04:19 +03:00
|
|
|
if (group->format != 0
|
|
|
|
&& !recv_check_log_header_checksum(buf)) {
|
|
|
|
ib::error() << "Invalid redo log header checksum.";
|
|
|
|
return(DB_CORRUPTION);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2018-01-10 13:18:02 +02:00
|
|
|
char creator[LOG_HEADER_CREATOR_END - LOG_HEADER_CREATOR + 1];
|
|
|
|
|
|
|
|
memcpy(creator, buf + LOG_HEADER_CREATOR, sizeof creator);
|
|
|
|
/* Ensure that the string is NUL-terminated. */
|
|
|
|
creator[LOG_HEADER_CREATOR_END - LOG_HEADER_CREATOR] = 0;
|
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
switch (group->format) {
|
|
|
|
case 0:
|
|
|
|
return(recv_find_max_checkpoint_0(&group, max_field));
|
MDEV-14717: Prevent crash-downgrade to earlier MariaDB 10.2
A crash-downgrade of a RENAME (or TRUNCATE or table-rebuilding
ALTER TABLE or OPTIMIZE TABLE) operation to an earlier 10.2 version
would trigger a debug assertion failure during rollback,
in trx_roll_pop_top_rec_of_trx(). In a non-debug build, the
TRX_UNDO_RENAME_TABLE record would be misinterpreted as an
update_undo log record, and typically the file name would be
interpreted as DB_TRX_ID,DB_ROLL_PTR,PRIMARY KEY. If a matching
record would be found, row_undo_mod() would hit ut_error in
switch (node->rec_type). Typically, ut_a(table2 == NULL) would
fail when opening the table from SQL.
Because of this, we prevent a crash-downgrade to earlier MariaDB 10.2
versions by changing the InnoDB redo log format identifier to the
10.3 identifier, and by introducing a subformat identifier so that
10.2 can continue to refuse crash-downgrade from 10.3 or later.
After a clean shutdown, a downgrade to MariaDB 10.2.13 or later would
still be possible thanks to MDEV-14909. A downgrade to older 10.2
versions is only possible after removing the log files (not recommended).
LOG_HEADER_FORMAT_CURRENT: Change to 103 (originally the 10.3 format).
log_group_t: Add subformat. For 10.2, we will use subformat 1,
and will refuse crash recovery from any other subformat of the
10.3 format, that is, a genuine 10.3 redo log.
recv_find_max_checkpoint(): Allow startup after clean shutdown
from a future LOG_HEADER_FORMAT_10_4 (unencrypted only).
We cannot handle the encrypted 10.4 redo log block format,
which was introduced in MDEV-12041. Allow crash recovery from
the original 10.2 format as well as the new format.
In Mariabackup --backup, do not allow any startup from 10.3 or 10.4
redo logs.
recv_recovery_from_checkpoint_start(): Skip redo log apply for
clean 10.3 redo log, but not for the new 10.2 redo log
(10.3 format, subformat 1).
srv_prepare_to_delete_redo_log_files(): On format or subformat
mismatch, set srv_log_file_size = 0, so that we will display the
correct message.
innobase_start_or_create_for_mysql(): Check for format or subformat
mismatch.
xtrabackup_backup_func(): Remove debug assertions that were made
redundant by the code changes in recv_find_max_checkpoint().
2018-09-07 17:24:31 +03:00
|
|
|
case LOG_HEADER_FORMAT_10_2:
|
|
|
|
case LOG_HEADER_FORMAT_10_2 | LOG_HEADER_FORMAT_ENCRYPTED:
|
MDEV-13564: Implement innodb_unsafe_truncate=ON for compatibility
While MariaDB Server 10.2 is not really guaranteed to be compatible
with Percona XtraBackup 2.4 (for example, the MySQL 5.7 undo log format
change that could be present in XtraBackup, but was reverted from
MariaDB in MDEV-12289), we do not want to disrupt users who have
deployed xtrabackup and MariaDB Server 10.2 in their environments.
With this change, MariaDB 10.2 will continue to use the backup-unsafe
TRUNCATE TABLE code, so that neither the undo log nor the redo log
formats will change in an incompatible way.
Undo tablespace truncation will keep using the redo log only. Recovery
or backup with old code will fail to shrink the undo tablespace files,
but the contents will be recovered just fine.
In the MariaDB Server 10.2 series only, we introduce the configuration
parameter innodb_unsafe_truncate and make it ON by default. To allow
MariaDB Backup (mariabackup) to work properly with TRUNCATE TABLE
operations, use loose_innodb_unsafe_truncate=OFF.
MariaDB Server 10.3.10 and later releases will always use the
backup-safe TRUNCATE TABLE, and this parameter will not be
added there.
recv_recovery_rollback_active(): Skip row_mysql_drop_garbage_tables()
unless innodb_unsafe_truncate=OFF. It is too unsafe to drop orphan
tables if RENAME operations are not transactional within InnoDB.
LOG_HEADER_FORMAT_10_3: Replaces LOG_HEADER_FORMAT_CURRENT.
log_init(), log_group_file_header_flush(),
srv_prepare_to_delete_redo_log_files(),
innobase_start_or_create_for_mysql(): Choose the redo log format
and subformat based on the value of innodb_unsafe_truncate.
2018-10-10 19:19:29 +03:00
|
|
|
case LOG_HEADER_FORMAT_10_3:
|
|
|
|
case LOG_HEADER_FORMAT_10_3 | LOG_HEADER_FORMAT_ENCRYPTED:
|
MDEV-14717: Prevent crash-downgrade to earlier MariaDB 10.2
A crash-downgrade of a RENAME (or TRUNCATE or table-rebuilding
ALTER TABLE or OPTIMIZE TABLE) operation to an earlier 10.2 version
would trigger a debug assertion failure during rollback,
in trx_roll_pop_top_rec_of_trx(). In a non-debug build, the
TRX_UNDO_RENAME_TABLE record would be misinterpreted as an
update_undo log record, and typically the file name would be
interpreted as DB_TRX_ID,DB_ROLL_PTR,PRIMARY KEY. If a matching
record would be found, row_undo_mod() would hit ut_error in
switch (node->rec_type). Typically, ut_a(table2 == NULL) would
fail when opening the table from SQL.
Because of this, we prevent a crash-downgrade to earlier MariaDB 10.2
versions by changing the InnoDB redo log format identifier to the
10.3 identifier, and by introducing a subformat identifier so that
10.2 can continue to refuse crash-downgrade from 10.3 or later.
After a clean shutdown, a downgrade to MariaDB 10.2.13 or later would
still be possible thanks to MDEV-14909. A downgrade to older 10.2
versions is only possible after removing the log files (not recommended).
LOG_HEADER_FORMAT_CURRENT: Change to 103 (originally the 10.3 format).
log_group_t: Add subformat. For 10.2, we will use subformat 1,
and will refuse crash recovery from any other subformat of the
10.3 format, that is, a genuine 10.3 redo log.
recv_find_max_checkpoint(): Allow startup after clean shutdown
from a future LOG_HEADER_FORMAT_10_4 (unencrypted only).
We cannot handle the encrypted 10.4 redo log block format,
which was introduced in MDEV-12041. Allow crash recovery from
the original 10.2 format as well as the new format.
In Mariabackup --backup, do not allow any startup from 10.3 or 10.4
redo logs.
recv_recovery_from_checkpoint_start(): Skip redo log apply for
clean 10.3 redo log, but not for the new 10.2 redo log
(10.3 format, subformat 1).
srv_prepare_to_delete_redo_log_files(): On format or subformat
mismatch, set srv_log_file_size = 0, so that we will display the
correct message.
innobase_start_or_create_for_mysql(): Check for format or subformat
mismatch.
xtrabackup_backup_func(): Remove debug assertions that were made
redundant by the code changes in recv_find_max_checkpoint().
2018-09-07 17:24:31 +03:00
|
|
|
case LOG_HEADER_FORMAT_10_4:
|
|
|
|
/* We can only parse the unencrypted LOG_HEADER_FORMAT_10_4.
|
|
|
|
The encrypted format uses a larger redo log block trailer. */
|
2017-05-26 14:04:19 +03:00
|
|
|
break;
|
|
|
|
default:
|
|
|
|
ib::error() << "Unsupported redo log format."
|
|
|
|
" The redo log was created"
|
2018-01-10 13:18:02 +02:00
|
|
|
" with " << creator <<
|
2017-05-26 14:04:19 +03:00
|
|
|
". Please follow the instructions at "
|
|
|
|
REFMAN "upgrading-downgrading.html";
|
|
|
|
/* Do not issue a message about a possibility
|
|
|
|
to cleanly shut down the newer server version
|
|
|
|
and to remove the redo logs, because the
|
|
|
|
format of the system data structures may
|
|
|
|
radically change after MySQL 5.7. */
|
|
|
|
return(DB_ERROR);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
for (field = LOG_CHECKPOINT_1; field <= LOG_CHECKPOINT_2;
|
|
|
|
field += LOG_CHECKPOINT_2 - LOG_CHECKPOINT_1) {
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
log_group_header_read(group, field);
|
2016-08-12 11:17:45 +03:00
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
const ulint crc32 = log_block_calc_checksum_crc32(buf);
|
|
|
|
const ulint cksum = log_block_get_checksum(buf);
|
2017-03-01 23:43:37 +02:00
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
if (crc32 != cksum) {
|
|
|
|
DBUG_PRINT("ib_log",
|
|
|
|
("invalid checkpoint,"
|
|
|
|
" at " ULINTPF
|
|
|
|
", checksum " ULINTPFx
|
|
|
|
" expected " ULINTPFx,
|
|
|
|
field, cksum, crc32));
|
|
|
|
continue;
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
if (group->is_encrypted()
|
|
|
|
&& !log_crypt_read_checkpoint_buf(buf)) {
|
|
|
|
ib::error() << "Reading checkpoint"
|
|
|
|
" encryption info failed.";
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
checkpoint_no = mach_read_from_8(
|
|
|
|
buf + LOG_CHECKPOINT_NO);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
DBUG_PRINT("ib_log",
|
2017-08-07 17:21:30 +03:00
|
|
|
("checkpoint " UINT64PF " at " LSN_PF " found",
|
|
|
|
checkpoint_no, mach_read_from_8(
|
|
|
|
buf + LOG_CHECKPOINT_LSN)));
|
2015-06-18 19:58:57 +03:00
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
if (checkpoint_no >= max_no) {
|
|
|
|
*max_field = field;
|
|
|
|
max_no = checkpoint_no;
|
2017-08-07 17:21:30 +03:00
|
|
|
group->state = LOG_GROUP_OK;
|
|
|
|
group->lsn = mach_read_from_8(
|
|
|
|
buf + LOG_CHECKPOINT_LSN);
|
|
|
|
group->lsn_offset = mach_read_from_8(
|
|
|
|
buf + LOG_CHECKPOINT_OFFSET);
|
2017-09-11 16:47:23 +03:00
|
|
|
log_sys->next_checkpoint_no = checkpoint_no;
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
if (*max_field == 0) {
|
2017-08-31 09:28:59 +03:00
|
|
|
/* Before 10.2.2, we could get here during database
|
2016-08-12 11:17:45 +03:00
|
|
|
initialization if we created an ib_logfile0 file that
|
|
|
|
was filled with zeroes, and were killed. After
|
2017-08-31 09:28:59 +03:00
|
|
|
10.2.2, we would reject such a file already earlier,
|
2016-08-12 11:17:45 +03:00
|
|
|
when checking the file header. */
|
|
|
|
ib::error() << "No valid checkpoint found"
|
|
|
|
" (corrupted redo log)."
|
|
|
|
" You can try --innodb-force-recovery=6"
|
|
|
|
" as a last resort.";
|
2014-02-26 19:11:54 +01:00
|
|
|
return(DB_ERROR);
|
|
|
|
}
|
|
|
|
|
2018-01-10 13:18:02 +02:00
|
|
|
switch (group->format) {
|
MDEV-13564: Implement innodb_unsafe_truncate=ON for compatibility
While MariaDB Server 10.2 is not really guaranteed to be compatible
with Percona XtraBackup 2.4 (for example, the MySQL 5.7 undo log format
change that could be present in XtraBackup, but was reverted from
MariaDB in MDEV-12289), we do not want to disrupt users who have
deployed xtrabackup and MariaDB Server 10.2 in their environments.
With this change, MariaDB 10.2 will continue to use the backup-unsafe
TRUNCATE TABLE code, so that neither the undo log nor the redo log
formats will change in an incompatible way.
Undo tablespace truncation will keep using the redo log only. Recovery
or backup with old code will fail to shrink the undo tablespace files,
but the contents will be recovered just fine.
In the MariaDB Server 10.2 series only, we introduce the configuration
parameter innodb_unsafe_truncate and make it ON by default. To allow
MariaDB Backup (mariabackup) to work properly with TRUNCATE TABLE
operations, use loose_innodb_unsafe_truncate=OFF.
MariaDB Server 10.3.10 and later releases will always use the
backup-safe TRUNCATE TABLE, and this parameter will not be
added there.
recv_recovery_rollback_active(): Skip row_mysql_drop_garbage_tables()
unless innodb_unsafe_truncate=OFF. It is too unsafe to drop orphan
tables if RENAME operations are not transactional within InnoDB.
LOG_HEADER_FORMAT_10_3: Replaces LOG_HEADER_FORMAT_CURRENT.
log_init(), log_group_file_header_flush(),
srv_prepare_to_delete_redo_log_files(),
innobase_start_or_create_for_mysql(): Choose the redo log format
and subformat based on the value of innodb_unsafe_truncate.
2018-10-10 19:19:29 +03:00
|
|
|
case LOG_HEADER_FORMAT_10_3:
|
|
|
|
case LOG_HEADER_FORMAT_10_3 | LOG_HEADER_FORMAT_ENCRYPTED:
|
MDEV-14717: Prevent crash-downgrade to earlier MariaDB 10.2
A crash-downgrade of a RENAME (or TRUNCATE or table-rebuilding
ALTER TABLE or OPTIMIZE TABLE) operation to an earlier 10.2 version
would trigger a debug assertion failure during rollback,
in trx_roll_pop_top_rec_of_trx(). In a non-debug build, the
TRX_UNDO_RENAME_TABLE record would be misinterpreted as an
update_undo log record, and typically the file name would be
interpreted as DB_TRX_ID,DB_ROLL_PTR,PRIMARY KEY. If a matching
record would be found, row_undo_mod() would hit ut_error in
switch (node->rec_type). Typically, ut_a(table2 == NULL) would
fail when opening the table from SQL.
Because of this, we prevent a crash-downgrade to earlier MariaDB 10.2
versions by changing the InnoDB redo log format identifier to the
10.3 identifier, and by introducing a subformat identifier so that
10.2 can continue to refuse crash-downgrade from 10.3 or later.
After a clean shutdown, a downgrade to MariaDB 10.2.13 or later would
still be possible thanks to MDEV-14909. A downgrade to older 10.2
versions is only possible after removing the log files (not recommended).
LOG_HEADER_FORMAT_CURRENT: Change to 103 (originally the 10.3 format).
log_group_t: Add subformat. For 10.2, we will use subformat 1,
and will refuse crash recovery from any other subformat of the
10.3 format, that is, a genuine 10.3 redo log.
recv_find_max_checkpoint(): Allow startup after clean shutdown
from a future LOG_HEADER_FORMAT_10_4 (unencrypted only).
We cannot handle the encrypted 10.4 redo log block format,
which was introduced in MDEV-12041. Allow crash recovery from
the original 10.2 format as well as the new format.
In Mariabackup --backup, do not allow any startup from 10.3 or 10.4
redo logs.
recv_recovery_from_checkpoint_start(): Skip redo log apply for
clean 10.3 redo log, but not for the new 10.2 redo log
(10.3 format, subformat 1).
srv_prepare_to_delete_redo_log_files(): On format or subformat
mismatch, set srv_log_file_size = 0, so that we will display the
correct message.
innobase_start_or_create_for_mysql(): Check for format or subformat
mismatch.
xtrabackup_backup_func(): Remove debug assertions that were made
redundant by the code changes in recv_find_max_checkpoint().
2018-09-07 17:24:31 +03:00
|
|
|
if (group->subformat == 1) {
|
|
|
|
/* 10.2 with new crash-safe TRUNCATE */
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
/* fall through */
|
|
|
|
case LOG_HEADER_FORMAT_10_4:
|
|
|
|
if (srv_operation == SRV_OPERATION_BACKUP) {
|
|
|
|
ib::error()
|
|
|
|
<< "Incompatible redo log format."
|
|
|
|
" The redo log was created with " << creator;
|
|
|
|
return DB_ERROR;
|
|
|
|
}
|
2018-01-10 13:18:02 +02:00
|
|
|
dberr_t err = recv_log_recover_10_3();
|
|
|
|
if (err != DB_SUCCESS) {
|
|
|
|
ib::error()
|
|
|
|
<< "Downgrade after a crash is not supported."
|
|
|
|
" The redo log was created with " << creator
|
|
|
|
<< (err == DB_ERROR
|
|
|
|
? "." : ", and it appears corrupted.");
|
|
|
|
}
|
|
|
|
return(err);
|
|
|
|
}
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
return(DB_SUCCESS);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Try to parse a single log record body and also applies it if
|
|
|
|
specified.
|
|
|
|
@param[in] type redo log entry type
|
|
|
|
@param[in] ptr redo log record body
|
|
|
|
@param[in] end_ptr end of buffer
|
|
|
|
@param[in] space_id tablespace identifier
|
|
|
|
@param[in] page_no page number
|
|
|
|
@param[in] apply whether to apply the record
|
|
|
|
@param[in,out] block buffer block, or NULL if
|
|
|
|
a page log record should not be applied
|
|
|
|
or if it is a MLOG_FILE_ operation
|
|
|
|
@param[in,out] mtr mini-transaction, or NULL if
|
|
|
|
a page log record should not be applied
|
|
|
|
@return log record end, NULL if not a complete record */
|
2014-02-26 19:11:54 +01:00
|
|
|
static
|
|
|
|
byte*
|
|
|
|
recv_parse_or_apply_log_rec_body(
|
2016-08-12 11:17:45 +03:00
|
|
|
mlog_id_t type,
|
|
|
|
byte* ptr,
|
|
|
|
byte* end_ptr,
|
|
|
|
ulint space_id,
|
|
|
|
ulint page_no,
|
|
|
|
bool apply,
|
|
|
|
buf_block_t* block,
|
|
|
|
mtr_t* mtr)
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!block == !mtr);
|
|
|
|
ut_ad(!apply || recv_sys->mlog_checkpoint_lsn != 0);
|
|
|
|
|
|
|
|
switch (type) {
|
|
|
|
case MLOG_FILE_NAME:
|
|
|
|
case MLOG_FILE_DELETE:
|
|
|
|
case MLOG_FILE_CREATE2:
|
|
|
|
case MLOG_FILE_RENAME2:
|
|
|
|
ut_ad(block == NULL);
|
|
|
|
/* Collect the file names when parsing the log,
|
|
|
|
before applying any log records. */
|
|
|
|
return(fil_name_parse(ptr, end_ptr, space_id, page_no, type,
|
|
|
|
apply));
|
|
|
|
case MLOG_INDEX_LOAD:
|
|
|
|
if (end_ptr < ptr + 8) {
|
|
|
|
return(NULL);
|
|
|
|
}
|
|
|
|
return(ptr + 8);
|
|
|
|
case MLOG_TRUNCATE:
|
2018-08-16 16:10:18 +03:00
|
|
|
if (log_truncate) {
|
|
|
|
ut_ad(srv_operation != SRV_OPERATION_NORMAL);
|
|
|
|
log_truncate();
|
|
|
|
recv_sys->found_corrupt_fs = true;
|
|
|
|
return NULL;
|
|
|
|
}
|
2016-08-12 11:17:45 +03:00
|
|
|
return(truncate_t::parse_redo_entry(ptr, end_ptr, space_id));
|
2016-09-06 09:43:16 +03:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
dict_index_t* index = NULL;
|
|
|
|
page_t* page;
|
|
|
|
page_zip_des_t* page_zip;
|
|
|
|
#ifdef UNIV_DEBUG
|
|
|
|
ulint page_type;
|
|
|
|
#endif /* UNIV_DEBUG */
|
|
|
|
|
|
|
|
if (block) {
|
2016-08-12 11:17:45 +03:00
|
|
|
/* Applying a page log record. */
|
|
|
|
ut_ad(apply);
|
2014-02-26 19:11:54 +01:00
|
|
|
page = block->frame;
|
|
|
|
page_zip = buf_block_get_page_zip(block);
|
|
|
|
ut_d(page_type = fil_page_get_type(page));
|
2016-08-12 11:17:45 +03:00
|
|
|
} else if (apply
|
|
|
|
&& !is_predefined_tablespace(space_id)
|
|
|
|
&& recv_spaces.find(space_id) == recv_spaces.end()) {
|
2017-03-01 23:43:37 +02:00
|
|
|
if (recv_sys->recovered_lsn < recv_sys->mlog_checkpoint_lsn) {
|
|
|
|
/* We have not seen all records between the
|
|
|
|
checkpoint and MLOG_CHECKPOINT. There should be
|
|
|
|
a MLOG_FILE_DELETE for this tablespace later. */
|
|
|
|
recv_spaces.insert(
|
|
|
|
std::make_pair(space_id,
|
|
|
|
file_name_t("", false)));
|
|
|
|
goto parse_log;
|
|
|
|
}
|
|
|
|
|
|
|
|
ib::error() << "Missing MLOG_FILE_NAME or MLOG_FILE_DELETE"
|
2016-08-12 11:17:45 +03:00
|
|
|
" for redo log record " << type << " (page "
|
2017-03-01 23:43:37 +02:00
|
|
|
<< space_id << ":" << page_no << ") at "
|
|
|
|
<< recv_sys->recovered_lsn << ".";
|
|
|
|
recv_sys->found_corrupt_log = true;
|
2016-08-12 11:17:45 +03:00
|
|
|
return(NULL);
|
2014-02-26 19:11:54 +01:00
|
|
|
} else {
|
2017-03-01 23:43:37 +02:00
|
|
|
parse_log:
|
2016-08-12 11:17:45 +03:00
|
|
|
/* Parsing a page log record. */
|
2014-02-26 19:11:54 +01:00
|
|
|
page = NULL;
|
|
|
|
page_zip = NULL;
|
|
|
|
ut_d(page_type = FIL_PAGE_TYPE_ALLOCATED);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
const byte* old_ptr = ptr;
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
switch (type) {
|
|
|
|
#ifdef UNIV_LOG_LSN_DEBUG
|
|
|
|
case MLOG_LSN:
|
|
|
|
/* The LSN is checked in recv_parse_log_rec(). */
|
|
|
|
break;
|
|
|
|
#endif /* UNIV_LOG_LSN_DEBUG */
|
|
|
|
case MLOG_1BYTE: case MLOG_2BYTES: case MLOG_4BYTES: case MLOG_8BYTES:
|
2016-09-06 09:43:16 +03:00
|
|
|
#ifdef UNIV_DEBUG
|
|
|
|
if (page && page_type == FIL_PAGE_TYPE_ALLOCATED
|
|
|
|
&& end_ptr >= ptr + 2) {
|
|
|
|
/* It is OK to set FIL_PAGE_TYPE and certain
|
|
|
|
list node fields on an empty page. Any other
|
|
|
|
write is not OK. */
|
|
|
|
|
|
|
|
/* NOTE: There may be bogus assertion failures for
|
|
|
|
dict_hdr_create(), trx_rseg_header_create(),
|
|
|
|
trx_sys_create_doublewrite_buf(), and
|
|
|
|
trx_sysf_create().
|
|
|
|
These are only called during database creation. */
|
|
|
|
ulint offs = mach_read_from_2(ptr);
|
|
|
|
|
|
|
|
switch (type) {
|
|
|
|
default:
|
|
|
|
ut_error;
|
|
|
|
case MLOG_2BYTES:
|
|
|
|
/* Note that this can fail when the
|
|
|
|
redo log been written with something
|
|
|
|
older than InnoDB Plugin 1.0.4. */
|
|
|
|
ut_ad(offs == FIL_PAGE_TYPE
|
2018-08-28 16:48:19 +03:00
|
|
|
|| srv_is_undo_tablespace(space_id)
|
2016-09-06 09:43:16 +03:00
|
|
|
|| offs == IBUF_TREE_SEG_HEADER
|
|
|
|
+ IBUF_HEADER + FSEG_HDR_OFFSET
|
|
|
|
|| offs == PAGE_BTR_IBUF_FREE_LIST
|
|
|
|
+ PAGE_HEADER + FIL_ADDR_BYTE
|
|
|
|
|| offs == PAGE_BTR_IBUF_FREE_LIST
|
|
|
|
+ PAGE_HEADER + FIL_ADDR_BYTE
|
|
|
|
+ FIL_ADDR_SIZE
|
|
|
|
|| offs == PAGE_BTR_SEG_LEAF
|
|
|
|
+ PAGE_HEADER + FSEG_HDR_OFFSET
|
|
|
|
|| offs == PAGE_BTR_SEG_TOP
|
|
|
|
+ PAGE_HEADER + FSEG_HDR_OFFSET
|
|
|
|
|| offs == PAGE_BTR_IBUF_FREE_LIST_NODE
|
|
|
|
+ PAGE_HEADER + FIL_ADDR_BYTE
|
|
|
|
+ 0 /*FLST_PREV*/
|
|
|
|
|| offs == PAGE_BTR_IBUF_FREE_LIST_NODE
|
|
|
|
+ PAGE_HEADER + FIL_ADDR_BYTE
|
|
|
|
+ FIL_ADDR_SIZE /*FLST_NEXT*/);
|
|
|
|
break;
|
|
|
|
case MLOG_4BYTES:
|
|
|
|
/* Note that this can fail when the
|
|
|
|
redo log been written with something
|
|
|
|
older than InnoDB Plugin 1.0.4. */
|
|
|
|
ut_ad(0
|
2018-01-08 12:58:25 +02:00
|
|
|
/* fil_crypt_rotate_page() writes this */
|
|
|
|
|| offs == FIL_PAGE_SPACE_ID
|
2018-08-28 16:48:19 +03:00
|
|
|
|| srv_is_undo_tablespace(space_id)
|
2016-09-06 09:43:16 +03:00
|
|
|
|| offs == IBUF_TREE_SEG_HEADER
|
|
|
|
+ IBUF_HEADER + FSEG_HDR_SPACE
|
|
|
|
|| offs == IBUF_TREE_SEG_HEADER
|
|
|
|
+ IBUF_HEADER + FSEG_HDR_PAGE_NO
|
|
|
|
|| offs == PAGE_BTR_IBUF_FREE_LIST
|
|
|
|
+ PAGE_HEADER/* flst_init */
|
|
|
|
|| offs == PAGE_BTR_IBUF_FREE_LIST
|
|
|
|
+ PAGE_HEADER + FIL_ADDR_PAGE
|
|
|
|
|| offs == PAGE_BTR_IBUF_FREE_LIST
|
|
|
|
+ PAGE_HEADER + FIL_ADDR_PAGE
|
|
|
|
+ FIL_ADDR_SIZE
|
|
|
|
|| offs == PAGE_BTR_SEG_LEAF
|
|
|
|
+ PAGE_HEADER + FSEG_HDR_PAGE_NO
|
|
|
|
|| offs == PAGE_BTR_SEG_LEAF
|
|
|
|
+ PAGE_HEADER + FSEG_HDR_SPACE
|
|
|
|
|| offs == PAGE_BTR_SEG_TOP
|
|
|
|
+ PAGE_HEADER + FSEG_HDR_PAGE_NO
|
|
|
|
|| offs == PAGE_BTR_SEG_TOP
|
|
|
|
+ PAGE_HEADER + FSEG_HDR_SPACE
|
|
|
|
|| offs == PAGE_BTR_IBUF_FREE_LIST_NODE
|
|
|
|
+ PAGE_HEADER + FIL_ADDR_PAGE
|
|
|
|
+ 0 /*FLST_PREV*/
|
|
|
|
|| offs == PAGE_BTR_IBUF_FREE_LIST_NODE
|
|
|
|
+ PAGE_HEADER + FIL_ADDR_PAGE
|
|
|
|
+ FIL_ADDR_SIZE /*FLST_NEXT*/);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
#endif /* UNIV_DEBUG */
|
2014-02-26 19:11:54 +01:00
|
|
|
ptr = mlog_parse_nbytes(type, ptr, end_ptr, page, page_zip);
|
2016-08-12 11:17:45 +03:00
|
|
|
if (ptr != NULL && page != NULL
|
|
|
|
&& page_no == 0 && type == MLOG_4BYTES) {
|
|
|
|
ulint offs = mach_read_from_2(old_ptr);
|
|
|
|
switch (offs) {
|
|
|
|
fil_space_t* space;
|
|
|
|
ulint val;
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
case FSP_HEADER_OFFSET + FSP_SPACE_FLAGS:
|
|
|
|
case FSP_HEADER_OFFSET + FSP_SIZE:
|
|
|
|
case FSP_HEADER_OFFSET + FSP_FREE_LIMIT:
|
|
|
|
case FSP_HEADER_OFFSET + FSP_FREE + FLST_LEN:
|
|
|
|
space = fil_space_get(space_id);
|
|
|
|
ut_a(space != NULL);
|
|
|
|
val = mach_read_from_4(page + offs);
|
|
|
|
|
|
|
|
switch (offs) {
|
|
|
|
case FSP_HEADER_OFFSET + FSP_SPACE_FLAGS:
|
|
|
|
space->flags = val;
|
|
|
|
break;
|
|
|
|
case FSP_HEADER_OFFSET + FSP_SIZE:
|
|
|
|
space->size_in_header = val;
|
|
|
|
break;
|
|
|
|
case FSP_HEADER_OFFSET + FSP_FREE_LIMIT:
|
|
|
|
space->free_limit = val;
|
|
|
|
break;
|
|
|
|
case FSP_HEADER_OFFSET + FSP_FREE + FLST_LEN:
|
|
|
|
space->free_len = val;
|
|
|
|
ut_ad(val == flst_get_len(
|
|
|
|
page + offs));
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
break;
|
|
|
|
case MLOG_REC_INSERT: case MLOG_COMP_REC_INSERT:
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!page || fil_page_type_is_index(page_type));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (NULL != (ptr = mlog_parse_index(
|
|
|
|
ptr, end_ptr,
|
|
|
|
type == MLOG_COMP_REC_INSERT,
|
|
|
|
&index))) {
|
|
|
|
ut_a(!page
|
|
|
|
|| (ibool)!!page_is_comp(page)
|
|
|
|
== dict_table_is_comp(index->table));
|
|
|
|
ptr = page_cur_parse_insert_rec(FALSE, ptr, end_ptr,
|
|
|
|
block, index, mtr);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case MLOG_REC_CLUST_DELETE_MARK: case MLOG_COMP_REC_CLUST_DELETE_MARK:
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!page || fil_page_type_is_index(page_type));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (NULL != (ptr = mlog_parse_index(
|
|
|
|
ptr, end_ptr,
|
|
|
|
type == MLOG_COMP_REC_CLUST_DELETE_MARK,
|
|
|
|
&index))) {
|
|
|
|
ut_a(!page
|
|
|
|
|| (ibool)!!page_is_comp(page)
|
|
|
|
== dict_table_is_comp(index->table));
|
|
|
|
ptr = btr_cur_parse_del_mark_set_clust_rec(
|
|
|
|
ptr, end_ptr, page, page_zip, index);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case MLOG_REC_SEC_DELETE_MARK:
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!page || fil_page_type_is_index(page_type));
|
2014-02-26 19:11:54 +01:00
|
|
|
ptr = btr_cur_parse_del_mark_set_sec_rec(ptr, end_ptr,
|
|
|
|
page, page_zip);
|
|
|
|
break;
|
|
|
|
case MLOG_REC_UPDATE_IN_PLACE: case MLOG_COMP_REC_UPDATE_IN_PLACE:
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!page || fil_page_type_is_index(page_type));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (NULL != (ptr = mlog_parse_index(
|
|
|
|
ptr, end_ptr,
|
|
|
|
type == MLOG_COMP_REC_UPDATE_IN_PLACE,
|
|
|
|
&index))) {
|
|
|
|
ut_a(!page
|
|
|
|
|| (ibool)!!page_is_comp(page)
|
|
|
|
== dict_table_is_comp(index->table));
|
|
|
|
ptr = btr_cur_parse_update_in_place(ptr, end_ptr, page,
|
|
|
|
page_zip, index);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case MLOG_LIST_END_DELETE: case MLOG_COMP_LIST_END_DELETE:
|
|
|
|
case MLOG_LIST_START_DELETE: case MLOG_COMP_LIST_START_DELETE:
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!page || fil_page_type_is_index(page_type));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (NULL != (ptr = mlog_parse_index(
|
|
|
|
ptr, end_ptr,
|
|
|
|
type == MLOG_COMP_LIST_END_DELETE
|
|
|
|
|| type == MLOG_COMP_LIST_START_DELETE,
|
|
|
|
&index))) {
|
|
|
|
ut_a(!page
|
|
|
|
|| (ibool)!!page_is_comp(page)
|
|
|
|
== dict_table_is_comp(index->table));
|
|
|
|
ptr = page_parse_delete_rec_list(type, ptr, end_ptr,
|
|
|
|
block, index, mtr);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case MLOG_LIST_END_COPY_CREATED: case MLOG_COMP_LIST_END_COPY_CREATED:
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!page || fil_page_type_is_index(page_type));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (NULL != (ptr = mlog_parse_index(
|
|
|
|
ptr, end_ptr,
|
|
|
|
type == MLOG_COMP_LIST_END_COPY_CREATED,
|
|
|
|
&index))) {
|
|
|
|
ut_a(!page
|
|
|
|
|| (ibool)!!page_is_comp(page)
|
|
|
|
== dict_table_is_comp(index->table));
|
|
|
|
ptr = page_parse_copy_rec_list_to_created_page(
|
|
|
|
ptr, end_ptr, block, index, mtr);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case MLOG_PAGE_REORGANIZE:
|
|
|
|
case MLOG_COMP_PAGE_REORGANIZE:
|
|
|
|
case MLOG_ZIP_PAGE_REORGANIZE:
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!page || fil_page_type_is_index(page_type));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (NULL != (ptr = mlog_parse_index(
|
|
|
|
ptr, end_ptr,
|
|
|
|
type != MLOG_PAGE_REORGANIZE,
|
|
|
|
&index))) {
|
|
|
|
ut_a(!page
|
|
|
|
|| (ibool)!!page_is_comp(page)
|
|
|
|
== dict_table_is_comp(index->table));
|
|
|
|
ptr = btr_parse_page_reorganize(
|
|
|
|
ptr, end_ptr, index,
|
|
|
|
type == MLOG_ZIP_PAGE_REORGANIZE,
|
|
|
|
block, mtr);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case MLOG_PAGE_CREATE: case MLOG_COMP_PAGE_CREATE:
|
|
|
|
/* Allow anything in page_type when creating a page. */
|
|
|
|
ut_a(!page_zip);
|
2016-08-12 11:17:45 +03:00
|
|
|
page_parse_create(block, type == MLOG_COMP_PAGE_CREATE, false);
|
|
|
|
break;
|
|
|
|
case MLOG_PAGE_CREATE_RTREE: case MLOG_COMP_PAGE_CREATE_RTREE:
|
|
|
|
page_parse_create(block, type == MLOG_COMP_PAGE_CREATE_RTREE,
|
|
|
|
true);
|
2014-02-26 19:11:54 +01:00
|
|
|
break;
|
|
|
|
case MLOG_UNDO_INSERT:
|
|
|
|
ut_ad(!page || page_type == FIL_PAGE_UNDO_LOG);
|
|
|
|
ptr = trx_undo_parse_add_undo_rec(ptr, end_ptr, page);
|
|
|
|
break;
|
|
|
|
case MLOG_UNDO_ERASE_END:
|
|
|
|
ut_ad(!page || page_type == FIL_PAGE_UNDO_LOG);
|
|
|
|
ptr = trx_undo_parse_erase_page_end(ptr, end_ptr, page, mtr);
|
|
|
|
break;
|
|
|
|
case MLOG_UNDO_INIT:
|
|
|
|
/* Allow anything in page_type when creating a page. */
|
|
|
|
ptr = trx_undo_parse_page_init(ptr, end_ptr, page, mtr);
|
|
|
|
break;
|
|
|
|
case MLOG_UNDO_HDR_CREATE:
|
|
|
|
case MLOG_UNDO_HDR_REUSE:
|
|
|
|
ut_ad(!page || page_type == FIL_PAGE_UNDO_LOG);
|
|
|
|
ptr = trx_undo_parse_page_header(type, ptr, end_ptr,
|
|
|
|
page, mtr);
|
|
|
|
break;
|
|
|
|
case MLOG_REC_MIN_MARK: case MLOG_COMP_REC_MIN_MARK:
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!page || fil_page_type_is_index(page_type));
|
2014-02-26 19:11:54 +01:00
|
|
|
/* On a compressed page, MLOG_COMP_REC_MIN_MARK
|
|
|
|
will be followed by MLOG_COMP_REC_DELETE
|
|
|
|
or MLOG_ZIP_WRITE_HEADER(FIL_PAGE_PREV, FIL_NULL)
|
|
|
|
in the same mini-transaction. */
|
|
|
|
ut_a(type == MLOG_COMP_REC_MIN_MARK || !page_zip);
|
|
|
|
ptr = btr_parse_set_min_rec_mark(
|
|
|
|
ptr, end_ptr, type == MLOG_COMP_REC_MIN_MARK,
|
|
|
|
page, mtr);
|
|
|
|
break;
|
|
|
|
case MLOG_REC_DELETE: case MLOG_COMP_REC_DELETE:
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!page || fil_page_type_is_index(page_type));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (NULL != (ptr = mlog_parse_index(
|
|
|
|
ptr, end_ptr,
|
|
|
|
type == MLOG_COMP_REC_DELETE,
|
|
|
|
&index))) {
|
|
|
|
ut_a(!page
|
|
|
|
|| (ibool)!!page_is_comp(page)
|
|
|
|
== dict_table_is_comp(index->table));
|
|
|
|
ptr = page_cur_parse_delete_rec(ptr, end_ptr,
|
|
|
|
block, index, mtr);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
case MLOG_IBUF_BITMAP_INIT:
|
|
|
|
/* Allow anything in page_type when creating a page. */
|
|
|
|
ptr = ibuf_parse_bitmap_init(ptr, end_ptr, block, mtr);
|
|
|
|
break;
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_INIT_FILE_PAGE2:
|
2014-02-26 19:11:54 +01:00
|
|
|
/* Allow anything in page_type when creating a page. */
|
|
|
|
ptr = fsp_parse_init_file_page(ptr, end_ptr, block);
|
|
|
|
break;
|
|
|
|
case MLOG_WRITE_STRING:
|
|
|
|
ptr = mlog_parse_string(ptr, end_ptr, page, page_zip);
|
|
|
|
break;
|
|
|
|
case MLOG_ZIP_WRITE_NODE_PTR:
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!page || fil_page_type_is_index(page_type));
|
2014-02-26 19:11:54 +01:00
|
|
|
ptr = page_zip_parse_write_node_ptr(ptr, end_ptr,
|
|
|
|
page, page_zip);
|
|
|
|
break;
|
|
|
|
case MLOG_ZIP_WRITE_BLOB_PTR:
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!page || fil_page_type_is_index(page_type));
|
2014-02-26 19:11:54 +01:00
|
|
|
ptr = page_zip_parse_write_blob_ptr(ptr, end_ptr,
|
|
|
|
page, page_zip);
|
|
|
|
break;
|
|
|
|
case MLOG_ZIP_WRITE_HEADER:
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!page || fil_page_type_is_index(page_type));
|
2014-02-26 19:11:54 +01:00
|
|
|
ptr = page_zip_parse_write_header(ptr, end_ptr,
|
|
|
|
page, page_zip);
|
|
|
|
break;
|
|
|
|
case MLOG_ZIP_PAGE_COMPRESS:
|
|
|
|
/* Allow anything in page_type when creating a page. */
|
|
|
|
ptr = page_zip_parse_compress(ptr, end_ptr,
|
|
|
|
page, page_zip);
|
|
|
|
break;
|
|
|
|
case MLOG_ZIP_PAGE_COMPRESS_NO_DATA:
|
|
|
|
if (NULL != (ptr = mlog_parse_index(
|
|
|
|
ptr, end_ptr, TRUE, &index))) {
|
|
|
|
|
|
|
|
ut_a(!page || ((ibool)!!page_is_comp(page)
|
|
|
|
== dict_table_is_comp(index->table)));
|
|
|
|
ptr = page_zip_parse_compress_no_data(
|
|
|
|
ptr, end_ptr, page, page_zip, index);
|
|
|
|
}
|
|
|
|
break;
|
2014-12-22 16:53:17 +02:00
|
|
|
case MLOG_FILE_WRITE_CRYPT_DATA:
|
MDEV-12253: Buffer pool blocks are accessed after they have been freed
Problem was that bpage was referenced after it was already freed
from LRU. Fixed by adding a new variable encrypted that is
passed down to buf_page_check_corrupt() and used in
buf_page_get_gen() to stop processing page read.
This patch should also address following test failures and
bugs:
MDEV-12419: IMPORT should not look up tablespace in
PageConverter::validate(). This is now removed.
MDEV-10099: encryption.innodb_onlinealter_encryption fails
sporadically in buildbot
MDEV-11420: encryption.innodb_encryption-page-compression
failed in buildbot
MDEV-11222: encryption.encrypt_and_grep failed in buildbot on P8
Removed dict_table_t::is_encrypted and dict_table_t::ibd_file_missing
and replaced these with dict_table_t::file_unreadable. Table
ibd file is missing if fil_get_space(space_id) returns NULL
and encrypted if not. Removed dict_table_t::is_corrupted field.
Ported FilSpace class from 10.2 and using that on buf_page_check_corrupt(),
buf_page_decrypt_after_read(), buf_page_encrypt_before_write(),
buf_dblwr_process(), buf_read_page(), dict_stats_save_defrag_stats().
Added test cases when enrypted page could be read while doing
redo log crash recovery. Also added test case for row compressed
blobs.
btr_cur_open_at_index_side_func(),
btr_cur_open_at_rnd_pos_func(): Avoid referencing block that is
NULL.
buf_page_get_zip(): Issue error if page read fails.
buf_page_get_gen(): Use dberr_t for error detection and
do not reference bpage after we hare freed it.
buf_mark_space_corrupt(): remove bpage from LRU also when
it is encrypted.
buf_page_check_corrupt(): @return DB_SUCCESS if page has
been read and is not corrupted,
DB_PAGE_CORRUPTED if page based on checksum check is corrupted,
DB_DECRYPTION_FAILED if page post encryption checksum matches but
after decryption normal page checksum does not match. In read
case only DB_SUCCESS is possible.
buf_page_io_complete(): use dberr_t for error handling.
buf_flush_write_block_low(),
buf_read_ahead_random(),
buf_read_page_async(),
buf_read_ahead_linear(),
buf_read_ibuf_merge_pages(),
buf_read_recv_pages(),
fil_aio_wait():
Issue error if page read fails.
btr_pcur_move_to_next_page(): Do not reference page if it is
NULL.
Introduced dict_table_t::is_readable() and dict_index_t::is_readable()
that will return true if tablespace exists and pages read from
tablespace are not corrupted or page decryption failed.
Removed buf_page_t::key_version. After page decryption the
key version is not removed from page frame. For unencrypted
pages, old key_version is removed at buf_page_encrypt_before_write()
dict_stats_update_transient_for_index(),
dict_stats_update_transient()
Do not continue if table decryption failed or table
is corrupted.
dict0stats.cc: Introduced a dict_stats_report_error function
to avoid code duplication.
fil_parse_write_crypt_data():
Check that key read from redo log entry is found from
encryption plugin and if it is not, refuse to start.
PageConverter::validate(): Removed access to fil_space_t as
tablespace is not available during import.
Fixed error code on innodb.innodb test.
Merged test cased innodb-bad-key-change5 and innodb-bad-key-shutdown
to innodb-bad-key-change2. Removed innodb-bad-key-change5 test.
Decreased unnecessary complexity on some long lasting tests.
Removed fil_inc_pending_ops(), fil_decr_pending_ops(),
fil_get_first_space(), fil_get_next_space(),
fil_get_first_space_safe(), fil_get_next_space_safe()
functions.
fil_space_verify_crypt_checksum(): Fixed bug found using ASAN
where FIL_PAGE_END_LSN_OLD_CHECKSUM field was incorrectly
accessed from row compressed tables. Fixed out of page frame
bug for row compressed tables in
fil_space_verify_crypt_checksum() found using ASAN. Incorrect
function was called for compressed table.
Added new tests for discard, rename table and drop (we should allow them
even when page decryption fails). Alter table rename is not allowed.
Added test for restart with innodb-force-recovery=1 when page read on
redo-recovery cant be decrypted. Added test for corrupted table where
both page data and FIL_PAGE_FILE_FLUSH_LSN_OR_KEY_VERSION is corrupted.
Adjusted the test case innodb_bug14147491 so that it does not anymore
expect crash. Instead table is just mostly not usable.
fil0fil.h: fil_space_acquire_low is not visible function
and fil_space_acquire and fil_space_acquire_silent are
inline functions. FilSpace class uses fil_space_acquire_low
directly.
recv_apply_hashed_log_recs() does not return anything.
2017-04-26 15:19:16 +03:00
|
|
|
dberr_t err;
|
|
|
|
ptr = const_cast<byte*>(fil_parse_write_crypt_data(ptr, end_ptr, block, &err));
|
|
|
|
|
|
|
|
if (err != DB_SUCCESS) {
|
|
|
|
recv_sys->found_corrupt_log = TRUE;
|
|
|
|
}
|
2014-12-22 16:53:17 +02:00
|
|
|
break;
|
2014-02-26 19:11:54 +01:00
|
|
|
default:
|
|
|
|
ptr = NULL;
|
2018-08-09 17:38:40 +03:00
|
|
|
ib::error() << "Incorrect log record type "
|
|
|
|
<< ib::hex(unsigned(type));
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
recv_sys->found_corrupt_log = true;
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
if (index) {
|
|
|
|
dict_table_t* table = index->table;
|
|
|
|
|
|
|
|
dict_mem_index_free(index);
|
|
|
|
dict_mem_table_free(table);
|
|
|
|
}
|
|
|
|
|
|
|
|
return(ptr);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*********************************************************************//**
|
|
|
|
Calculates the fold value of a page file address: used in inserting or
|
|
|
|
searching for a log record in the hash table.
|
2016-08-12 11:17:45 +03:00
|
|
|
@return folded value */
|
2014-02-26 19:11:54 +01:00
|
|
|
UNIV_INLINE
|
|
|
|
ulint
|
|
|
|
recv_fold(
|
|
|
|
/*======*/
|
|
|
|
ulint space, /*!< in: space */
|
|
|
|
ulint page_no)/*!< in: page number */
|
|
|
|
{
|
|
|
|
return(ut_fold_ulint_pair(space, page_no));
|
|
|
|
}
|
|
|
|
|
|
|
|
/*********************************************************************//**
|
|
|
|
Calculates the hash value of a page file address: used in inserting or
|
|
|
|
searching for a log record in the hash table.
|
2016-08-12 11:17:45 +03:00
|
|
|
@return folded value */
|
2014-02-26 19:11:54 +01:00
|
|
|
UNIV_INLINE
|
|
|
|
ulint
|
|
|
|
recv_hash(
|
|
|
|
/*======*/
|
|
|
|
ulint space, /*!< in: space */
|
|
|
|
ulint page_no)/*!< in: page number */
|
|
|
|
{
|
|
|
|
return(hash_calc_hash(recv_fold(space, page_no), recv_sys->addr_hash));
|
|
|
|
}
|
|
|
|
|
|
|
|
/*********************************************************************//**
|
|
|
|
Gets the hashed file address struct for a page.
|
2016-08-12 11:17:45 +03:00
|
|
|
@return file address struct, NULL if not found from the hash table */
|
2014-02-26 19:11:54 +01:00
|
|
|
static
|
|
|
|
recv_addr_t*
|
|
|
|
recv_get_fil_addr_struct(
|
|
|
|
/*=====================*/
|
|
|
|
ulint space, /*!< in: space id */
|
|
|
|
ulint page_no)/*!< in: page number */
|
|
|
|
{
|
|
|
|
recv_addr_t* recv_addr;
|
|
|
|
|
|
|
|
for (recv_addr = static_cast<recv_addr_t*>(
|
|
|
|
HASH_GET_FIRST(recv_sys->addr_hash,
|
|
|
|
recv_hash(space, page_no)));
|
|
|
|
recv_addr != 0;
|
|
|
|
recv_addr = static_cast<recv_addr_t*>(
|
|
|
|
HASH_GET_NEXT(addr_hash, recv_addr))) {
|
|
|
|
|
|
|
|
if (recv_addr->space == space
|
|
|
|
&& recv_addr->page_no == page_no) {
|
|
|
|
|
|
|
|
return(recv_addr);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return(NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*******************************************************************//**
|
|
|
|
Adds a new log record to the hash table of log records. */
|
|
|
|
static
|
|
|
|
void
|
|
|
|
recv_add_to_hash_table(
|
|
|
|
/*===================*/
|
2016-08-12 11:17:45 +03:00
|
|
|
mlog_id_t type, /*!< in: log record type */
|
|
|
|
ulint space, /*!< in: space id */
|
|
|
|
ulint page_no, /*!< in: page number */
|
|
|
|
byte* body, /*!< in: log record body */
|
|
|
|
byte* rec_end, /*!< in: log record end */
|
|
|
|
lsn_t start_lsn, /*!< in: start lsn of the mtr */
|
|
|
|
lsn_t end_lsn) /*!< in: end lsn of the mtr */
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
|
|
|
recv_t* recv;
|
|
|
|
ulint len;
|
|
|
|
recv_data_t* recv_data;
|
|
|
|
recv_data_t** prev_field;
|
|
|
|
recv_addr_t* recv_addr;
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(type != MLOG_FILE_DELETE);
|
|
|
|
ut_ad(type != MLOG_FILE_CREATE2);
|
|
|
|
ut_ad(type != MLOG_FILE_RENAME2);
|
|
|
|
ut_ad(type != MLOG_FILE_NAME);
|
|
|
|
ut_ad(type != MLOG_DUMMY_RECORD);
|
|
|
|
ut_ad(type != MLOG_CHECKPOINT);
|
|
|
|
ut_ad(type != MLOG_INDEX_LOAD);
|
|
|
|
ut_ad(type != MLOG_TRUNCATE);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
len = rec_end - body;
|
|
|
|
|
|
|
|
recv = static_cast<recv_t*>(
|
|
|
|
mem_heap_alloc(recv_sys->heap, sizeof(recv_t)));
|
|
|
|
|
|
|
|
recv->type = type;
|
|
|
|
recv->len = rec_end - body;
|
|
|
|
recv->start_lsn = start_lsn;
|
|
|
|
recv->end_lsn = end_lsn;
|
|
|
|
|
|
|
|
recv_addr = recv_get_fil_addr_struct(space, page_no);
|
|
|
|
|
|
|
|
if (recv_addr == NULL) {
|
|
|
|
recv_addr = static_cast<recv_addr_t*>(
|
|
|
|
mem_heap_alloc(recv_sys->heap, sizeof(recv_addr_t)));
|
|
|
|
|
|
|
|
recv_addr->space = space;
|
|
|
|
recv_addr->page_no = page_no;
|
|
|
|
recv_addr->state = RECV_NOT_PROCESSED;
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
UT_LIST_INIT(recv_addr->rec_list, &recv_t::rec_list);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
HASH_INSERT(recv_addr_t, addr_hash, recv_sys->addr_hash,
|
|
|
|
recv_fold(space, page_no), recv_addr);
|
|
|
|
recv_sys->n_addrs++;
|
|
|
|
#if 0
|
|
|
|
fprintf(stderr, "Inserting log rec for space %lu, page %lu\n",
|
|
|
|
space, page_no);
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
UT_LIST_ADD_LAST(recv_addr->rec_list, recv);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
prev_field = &(recv->data);
|
|
|
|
|
|
|
|
/* Store the log record body in chunks of less than UNIV_PAGE_SIZE:
|
|
|
|
recv_sys->heap grows into the buffer pool, and bigger chunks could not
|
|
|
|
be allocated */
|
|
|
|
|
|
|
|
while (rec_end > body) {
|
|
|
|
|
|
|
|
len = rec_end - body;
|
|
|
|
|
|
|
|
if (len > RECV_DATA_BLOCK_SIZE) {
|
|
|
|
len = RECV_DATA_BLOCK_SIZE;
|
|
|
|
}
|
|
|
|
|
|
|
|
recv_data = static_cast<recv_data_t*>(
|
|
|
|
mem_heap_alloc(recv_sys->heap,
|
|
|
|
sizeof(recv_data_t) + len));
|
|
|
|
|
|
|
|
*prev_field = recv_data;
|
|
|
|
|
|
|
|
memcpy(recv_data + 1, body, len);
|
|
|
|
|
|
|
|
prev_field = &(recv_data->next);
|
|
|
|
|
|
|
|
body += len;
|
|
|
|
}
|
|
|
|
|
|
|
|
*prev_field = NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*********************************************************************//**
|
|
|
|
Copies the log record body from recv to buf. */
|
|
|
|
static
|
|
|
|
void
|
|
|
|
recv_data_copy_to_buf(
|
|
|
|
/*==================*/
|
|
|
|
byte* buf, /*!< in: buffer of length at least recv->len */
|
|
|
|
recv_t* recv) /*!< in: log record */
|
|
|
|
{
|
|
|
|
recv_data_t* recv_data;
|
|
|
|
ulint part_len;
|
|
|
|
ulint len;
|
|
|
|
|
|
|
|
len = recv->len;
|
|
|
|
recv_data = recv->data;
|
|
|
|
|
|
|
|
while (len > 0) {
|
|
|
|
if (len > RECV_DATA_BLOCK_SIZE) {
|
|
|
|
part_len = RECV_DATA_BLOCK_SIZE;
|
|
|
|
} else {
|
|
|
|
part_len = len;
|
|
|
|
}
|
|
|
|
|
|
|
|
ut_memcpy(buf, ((byte*) recv_data) + sizeof(recv_data_t),
|
|
|
|
part_len);
|
|
|
|
buf += part_len;
|
|
|
|
len -= part_len;
|
|
|
|
|
|
|
|
recv_data = recv_data->next;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-12-30 15:04:10 +02:00
|
|
|
/** Apply the hashed log records to the page, if the page lsn is less than the
|
|
|
|
lsn of a log record.
|
|
|
|
@param just_read_in whether the page recently arrived to the I/O handler
|
|
|
|
@param block the page in the buffer pool */
|
2014-02-26 19:11:54 +01:00
|
|
|
void
|
2016-12-30 15:04:10 +02:00
|
|
|
recv_recover_page(bool just_read_in, buf_block_t* block)
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
|
|
|
page_t* page;
|
|
|
|
page_zip_des_t* page_zip;
|
|
|
|
recv_addr_t* recv_addr;
|
|
|
|
recv_t* recv;
|
|
|
|
byte* buf;
|
|
|
|
lsn_t start_lsn;
|
|
|
|
lsn_t end_lsn;
|
|
|
|
lsn_t page_lsn;
|
|
|
|
lsn_t page_newest_lsn;
|
|
|
|
ibool modification_to_page;
|
|
|
|
mtr_t mtr;
|
|
|
|
|
|
|
|
mutex_enter(&(recv_sys->mutex));
|
|
|
|
|
|
|
|
if (recv_sys->apply_log_recs == FALSE) {
|
|
|
|
|
|
|
|
/* Log records should not be applied now */
|
|
|
|
|
|
|
|
mutex_exit(&(recv_sys->mutex));
|
|
|
|
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_addr = recv_get_fil_addr_struct(block->page.id.space(),
|
|
|
|
block->page.id.page_no());
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if ((recv_addr == NULL)
|
|
|
|
|| (recv_addr->state == RECV_BEING_PROCESSED)
|
|
|
|
|| (recv_addr->state == RECV_PROCESSED)) {
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(recv_addr == NULL || recv_needed_recovery);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
mutex_exit(&(recv_sys->mutex));
|
|
|
|
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(recv_needed_recovery);
|
|
|
|
|
2018-06-15 14:09:15 +03:00
|
|
|
if (UNIV_UNLIKELY(srv_print_verbose_log == 2)) {
|
|
|
|
fprintf(stderr, "Applying log to page %u:%u\n",
|
|
|
|
recv_addr->space, recv_addr->page_no);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
DBUG_PRINT("ib_log",
|
|
|
|
("Applying log to page %u:%u",
|
|
|
|
recv_addr->space, recv_addr->page_no));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
recv_addr->state = RECV_BEING_PROCESSED;
|
|
|
|
|
|
|
|
mutex_exit(&(recv_sys->mutex));
|
|
|
|
|
|
|
|
mtr_start(&mtr);
|
|
|
|
mtr_set_log_mode(&mtr, MTR_LOG_NONE);
|
|
|
|
|
|
|
|
page = block->frame;
|
|
|
|
page_zip = buf_block_get_page_zip(block);
|
|
|
|
|
|
|
|
if (just_read_in) {
|
|
|
|
/* Move the ownership of the x-latch on the page to
|
|
|
|
this OS thread, so that we can acquire a second
|
|
|
|
x-latch on it. This is needed for the operations to
|
|
|
|
the page to pass the debug checks. */
|
|
|
|
|
|
|
|
rw_lock_x_lock_move_ownership(&block->lock);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ibool success = buf_page_get_known_nowait(
|
|
|
|
RW_X_LATCH, block, BUF_KEEP_OLD,
|
|
|
|
__FILE__, __LINE__, &mtr);
|
2014-02-26 19:11:54 +01:00
|
|
|
ut_a(success);
|
|
|
|
|
|
|
|
buf_block_dbg_add_level(block, SYNC_NO_ORDER_CHECK);
|
|
|
|
|
|
|
|
/* Read the newest modification lsn from the page */
|
|
|
|
page_lsn = mach_read_from_8(page + FIL_PAGE_LSN);
|
|
|
|
|
|
|
|
/* It may be that the page has been modified in the buffer
|
|
|
|
pool: read the newest modification lsn there */
|
|
|
|
|
|
|
|
page_newest_lsn = buf_page_get_newest_modification(&block->page);
|
|
|
|
|
|
|
|
if (page_newest_lsn) {
|
|
|
|
|
|
|
|
page_lsn = page_newest_lsn;
|
|
|
|
}
|
|
|
|
|
|
|
|
modification_to_page = FALSE;
|
|
|
|
start_lsn = end_lsn = 0;
|
|
|
|
|
|
|
|
recv = UT_LIST_GET_FIRST(recv_addr->rec_list);
|
|
|
|
|
|
|
|
while (recv) {
|
|
|
|
end_lsn = recv->end_lsn;
|
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
ut_ad(end_lsn <= log_sys->log.scanned_lsn);
|
2016-08-12 11:17:45 +03:00
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
if (recv->len > RECV_DATA_BLOCK_SIZE) {
|
|
|
|
/* We have to copy the record body to a separate
|
|
|
|
buffer */
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
buf = static_cast<byte*>(ut_malloc_nokey(recv->len));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
recv_data_copy_to_buf(buf, recv);
|
|
|
|
} else {
|
|
|
|
buf = ((byte*)(recv->data)) + sizeof(recv_data_t);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/* If per-table tablespace was truncated and there exist REDO
|
|
|
|
records before truncate that are to be applied as part of
|
|
|
|
recovery (checkpoint didn't happen since truncate was done)
|
|
|
|
skip such records using lsn check as they may not stand valid
|
|
|
|
post truncate.
|
|
|
|
LSN at start of truncate is recorded and any redo record
|
|
|
|
with LSN less than recorded LSN is skipped.
|
|
|
|
Note: We can't skip complete recv_addr as same page may have
|
|
|
|
valid REDO records post truncate those needs to be applied. */
|
|
|
|
bool skip_recv = false;
|
2016-09-06 09:43:16 +03:00
|
|
|
if (srv_was_tablespace_truncated(fil_space_get(recv_addr->space))) {
|
2016-08-12 11:17:45 +03:00
|
|
|
lsn_t init_lsn =
|
|
|
|
truncate_t::get_truncated_tablespace_init_lsn(
|
|
|
|
recv_addr->space);
|
|
|
|
skip_recv = (recv->start_lsn < init_lsn);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Ignore applying the redo logs for tablespace that is
|
|
|
|
truncated. Post recovery there is fixup action that will
|
|
|
|
restore the tablespace back to normal state.
|
|
|
|
Applying redo at this stage can result in error given that
|
|
|
|
redo will have action recorded on page before tablespace
|
|
|
|
was re-inited and that would lead to an error while applying
|
|
|
|
such action. */
|
|
|
|
if (recv->start_lsn >= page_lsn
|
|
|
|
&& !srv_is_tablespace_truncated(recv_addr->space)
|
|
|
|
&& !skip_recv) {
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
lsn_t end_lsn;
|
|
|
|
|
|
|
|
if (!modification_to_page) {
|
|
|
|
|
|
|
|
modification_to_page = TRUE;
|
|
|
|
start_lsn = recv->start_lsn;
|
|
|
|
}
|
|
|
|
|
2018-06-15 14:09:15 +03:00
|
|
|
if (UNIV_UNLIKELY(srv_print_verbose_log == 2)) {
|
|
|
|
fprintf(stderr, "apply " LSN_PF ":"
|
|
|
|
" %d len " ULINTPF " page %u:%u\n",
|
|
|
|
recv->start_lsn, recv->type, recv->len,
|
|
|
|
recv_addr->space, recv_addr->page_no);
|
|
|
|
}
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
DBUG_PRINT("ib_log",
|
2016-08-12 11:17:45 +03:00
|
|
|
("apply " LSN_PF ":"
|
|
|
|
" %s len " ULINTPF " page %u:%u",
|
|
|
|
recv->start_lsn,
|
|
|
|
get_mlog_string(recv->type), recv->len,
|
|
|
|
recv_addr->space,
|
|
|
|
recv_addr->page_no));
|
|
|
|
|
|
|
|
recv_parse_or_apply_log_rec_body(
|
|
|
|
recv->type, buf, buf + recv->len,
|
|
|
|
recv_addr->space, recv_addr->page_no,
|
|
|
|
true, block, &mtr);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
end_lsn = recv->start_lsn + recv->len;
|
|
|
|
mach_write_to_8(FIL_PAGE_LSN + page, end_lsn);
|
|
|
|
mach_write_to_8(UNIV_PAGE_SIZE
|
|
|
|
- FIL_PAGE_END_LSN_OLD_CHKSUM
|
|
|
|
+ page, end_lsn);
|
|
|
|
|
|
|
|
if (page_zip) {
|
|
|
|
mach_write_to_8(FIL_PAGE_LSN
|
|
|
|
+ page_zip->data, end_lsn);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (recv->len > RECV_DATA_BLOCK_SIZE) {
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_free(buf);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
recv = UT_LIST_GET_NEXT(rec_list, recv);
|
|
|
|
}
|
|
|
|
|
|
|
|
#ifdef UNIV_ZIP_DEBUG
|
2016-08-12 11:17:45 +03:00
|
|
|
if (fil_page_index_page_check(page)) {
|
2014-02-26 19:11:54 +01:00
|
|
|
page_zip_des_t* page_zip = buf_block_get_page_zip(block);
|
|
|
|
|
|
|
|
ut_a(!page_zip
|
|
|
|
|| page_zip_validate_low(page_zip, page, NULL, FALSE));
|
|
|
|
}
|
|
|
|
#endif /* UNIV_ZIP_DEBUG */
|
|
|
|
|
|
|
|
if (modification_to_page) {
|
|
|
|
ut_a(block);
|
|
|
|
|
|
|
|
log_flush_order_mutex_enter();
|
|
|
|
buf_flush_recv_note_modification(block, start_lsn, end_lsn);
|
|
|
|
log_flush_order_mutex_exit();
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Make sure that committing mtr does not change the modification
|
|
|
|
lsn values of page */
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
mtr.discard_modifications();
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
mtr_commit(&mtr);
|
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
ib_time_t time = ut_time();
|
|
|
|
|
2017-03-08 19:44:22 +02:00
|
|
|
mutex_enter(&recv_sys->mutex);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (recv_max_page_lsn < page_lsn) {
|
|
|
|
recv_max_page_lsn = page_lsn;
|
|
|
|
}
|
|
|
|
|
|
|
|
recv_addr->state = RECV_PROCESSED;
|
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
ut_a(recv_sys->n_addrs > 0);
|
|
|
|
if (ulint n = --recv_sys->n_addrs) {
|
|
|
|
if (recv_sys->report(time)) {
|
|
|
|
ib::info() << "To recover: " << n << " pages from log";
|
2017-11-30 13:37:59 +11:00
|
|
|
service_manager_extend_timeout(
|
|
|
|
INNODB_EXTEND_TIMEOUT_INTERVAL, "To recover: " ULINTPF " pages from log", n);
|
2017-03-07 17:16:49 +02:00
|
|
|
}
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
mutex_exit(&recv_sys->mutex);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Reads in pages which have hashed log records, from an area around a given
|
2014-02-26 19:11:54 +01:00
|
|
|
page number.
|
2016-08-12 11:17:45 +03:00
|
|
|
@param[in] page_id page id
|
|
|
|
@return number of pages found */
|
2018-10-18 18:23:12 +03:00
|
|
|
static ulint recv_read_in_area(const page_id_t page_id)
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
|
|
|
recv_addr_t* recv_addr;
|
|
|
|
ulint page_nos[RECV_READ_AHEAD_AREA];
|
|
|
|
ulint low_limit;
|
|
|
|
ulint n;
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
low_limit = page_id.page_no()
|
|
|
|
- (page_id.page_no() % RECV_READ_AHEAD_AREA);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
n = 0;
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
for (ulint page_no = low_limit;
|
|
|
|
page_no < low_limit + RECV_READ_AHEAD_AREA;
|
2014-02-26 19:11:54 +01:00
|
|
|
page_no++) {
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_addr = recv_get_fil_addr_struct(page_id.space(), page_no);
|
|
|
|
|
|
|
|
const page_id_t cur_page_id(page_id.space(), page_no);
|
|
|
|
|
|
|
|
if (recv_addr && !buf_page_peek(cur_page_id)) {
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
mutex_enter(&(recv_sys->mutex));
|
|
|
|
|
|
|
|
if (recv_addr->state == RECV_NOT_PROCESSED) {
|
|
|
|
recv_addr->state = RECV_BEING_READ;
|
|
|
|
|
|
|
|
page_nos[n] = page_no;
|
|
|
|
|
|
|
|
n++;
|
|
|
|
}
|
|
|
|
|
|
|
|
mutex_exit(&(recv_sys->mutex));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
buf_read_recv_pages(FALSE, page_id.space(), page_nos, n);
|
2014-02-26 19:11:54 +01:00
|
|
|
return(n);
|
|
|
|
}
|
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
/** Apply the hash table of stored log records to persistent data pages.
|
|
|
|
@param[in] last_batch whether the change buffer merge will be
|
|
|
|
performed as part of the operation */
|
2018-11-20 14:55:44 +02:00
|
|
|
void recv_apply_hashed_log_recs(bool last_batch)
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
MDEV-12548 Initial implementation of Mariabackup for MariaDB 10.2
InnoDB I/O and buffer pool interfaces and the redo log format
have been changed between MariaDB 10.1 and 10.2, and the backup
code has to be adjusted accordingly.
The code has been simplified, and many memory leaks have been fixed.
Instead of the file name xtrabackup_logfile, the file name ib_logfile0
is being used for the copy of the redo log. Unnecessary InnoDB startup and
shutdown and some unnecessary threads have been removed.
Some help was provided by Vladislav Vaintroub.
Parameters have been cleaned up and aligned with those of MariaDB 10.2.
The --dbug option has been added, so that in debug builds,
--dbug=d,ib_log can be specified to enable diagnostic messages
for processing redo log entries.
By default, innodb_doublewrite=OFF, so that --prepare works faster.
If more crash-safety for --prepare is needed, double buffering
can be enabled.
The parameter innodb_log_checksums=OFF can be used to ignore redo log
checksums in --backup.
Some messages have been cleaned up.
Unless --export is specified, Mariabackup will not deal with undo log.
The InnoDB mini-transaction redo log is not only about user-level
transactions; it is actually about mini-transactions. To avoid confusion,
call it the redo log, not transaction log.
We disable any undo log processing in --prepare.
Because MariaDB 10.2 supports indexed virtual columns, the
undo log processing would need to be able to evaluate virtual column
expressions. To reduce the amount of code dependencies, we will not
process any undo log in prepare.
This means that the --export option must be disabled for now.
This also means that the following options are redundant
and have been removed:
xtrabackup --apply-log-only
innobackupex --redo-only
In addition to disabling any undo log processing, we will disable any
further changes to data pages during --prepare, including the change
buffer merge. This means that restoring incremental backups should
reliably work even when change buffering is being used on the server.
Because of this, preparing a backup will not generate any further
redo log, and the redo log file can be safely deleted. (If the
--export option is enabled in the future, it must generate redo log
when processing undo logs and buffered changes.)
In --prepare, we cannot easily know if a partial backup was used,
especially when restoring a series of incremental backups. So, we
simply warn about any missing files, and ignore the redo log for them.
FIXME: Enable the --export option.
FIXME: Improve the handling of the MLOG_INDEX_LOAD record, and write
a test that initiates a backup while an ALGORITHM=INPLACE operation
is creating indexes or rebuilding a table. An error should be detected
when preparing the backup.
FIXME: In --incremental --prepare, xtrabackup_apply_delta() should
ensure that if FSP_SIZE is modified, the file size will be adjusted
accordingly.
2017-06-30 10:49:37 +03:00
|
|
|
ut_ad(srv_operation == SRV_OPERATION_NORMAL
|
2017-10-10 10:28:54 +03:00
|
|
|
|| srv_operation == SRV_OPERATION_RESTORE
|
|
|
|
|| srv_operation == SRV_OPERATION_RESTORE_EXPORT);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
MDEV-12548 Initial implementation of Mariabackup for MariaDB 10.2
InnoDB I/O and buffer pool interfaces and the redo log format
have been changed between MariaDB 10.1 and 10.2, and the backup
code has to be adjusted accordingly.
The code has been simplified, and many memory leaks have been fixed.
Instead of the file name xtrabackup_logfile, the file name ib_logfile0
is being used for the copy of the redo log. Unnecessary InnoDB startup and
shutdown and some unnecessary threads have been removed.
Some help was provided by Vladislav Vaintroub.
Parameters have been cleaned up and aligned with those of MariaDB 10.2.
The --dbug option has been added, so that in debug builds,
--dbug=d,ib_log can be specified to enable diagnostic messages
for processing redo log entries.
By default, innodb_doublewrite=OFF, so that --prepare works faster.
If more crash-safety for --prepare is needed, double buffering
can be enabled.
The parameter innodb_log_checksums=OFF can be used to ignore redo log
checksums in --backup.
Some messages have been cleaned up.
Unless --export is specified, Mariabackup will not deal with undo log.
The InnoDB mini-transaction redo log is not only about user-level
transactions; it is actually about mini-transactions. To avoid confusion,
call it the redo log, not transaction log.
We disable any undo log processing in --prepare.
Because MariaDB 10.2 supports indexed virtual columns, the
undo log processing would need to be able to evaluate virtual column
expressions. To reduce the amount of code dependencies, we will not
process any undo log in prepare.
This means that the --export option must be disabled for now.
This also means that the following options are redundant
and have been removed:
xtrabackup --apply-log-only
innobackupex --redo-only
In addition to disabling any undo log processing, we will disable any
further changes to data pages during --prepare, including the change
buffer merge. This means that restoring incremental backups should
reliably work even when change buffering is being used on the server.
Because of this, preparing a backup will not generate any further
redo log, and the redo log file can be safely deleted. (If the
--export option is enabled in the future, it must generate redo log
when processing undo logs and buffered changes.)
In --prepare, we cannot easily know if a partial backup was used,
especially when restoring a series of incremental backups. So, we
simply warn about any missing files, and ignore the redo log for them.
FIXME: Enable the --export option.
FIXME: Improve the handling of the MLOG_INDEX_LOAD record, and write
a test that initiates a backup while an ALGORITHM=INPLACE operation
is creating indexes or rebuilding a table. An error should be detected
when preparing the backup.
FIXME: In --incremental --prepare, xtrabackup_apply_delta() should
ensure that if FSP_SIZE is modified, the file size will be adjusted
accordingly.
2017-06-30 10:49:37 +03:00
|
|
|
mutex_enter(&recv_sys->mutex);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
MDEV-12548 Initial implementation of Mariabackup for MariaDB 10.2
InnoDB I/O and buffer pool interfaces and the redo log format
have been changed between MariaDB 10.1 and 10.2, and the backup
code has to be adjusted accordingly.
The code has been simplified, and many memory leaks have been fixed.
Instead of the file name xtrabackup_logfile, the file name ib_logfile0
is being used for the copy of the redo log. Unnecessary InnoDB startup and
shutdown and some unnecessary threads have been removed.
Some help was provided by Vladislav Vaintroub.
Parameters have been cleaned up and aligned with those of MariaDB 10.2.
The --dbug option has been added, so that in debug builds,
--dbug=d,ib_log can be specified to enable diagnostic messages
for processing redo log entries.
By default, innodb_doublewrite=OFF, so that --prepare works faster.
If more crash-safety for --prepare is needed, double buffering
can be enabled.
The parameter innodb_log_checksums=OFF can be used to ignore redo log
checksums in --backup.
Some messages have been cleaned up.
Unless --export is specified, Mariabackup will not deal with undo log.
The InnoDB mini-transaction redo log is not only about user-level
transactions; it is actually about mini-transactions. To avoid confusion,
call it the redo log, not transaction log.
We disable any undo log processing in --prepare.
Because MariaDB 10.2 supports indexed virtual columns, the
undo log processing would need to be able to evaluate virtual column
expressions. To reduce the amount of code dependencies, we will not
process any undo log in prepare.
This means that the --export option must be disabled for now.
This also means that the following options are redundant
and have been removed:
xtrabackup --apply-log-only
innobackupex --redo-only
In addition to disabling any undo log processing, we will disable any
further changes to data pages during --prepare, including the change
buffer merge. This means that restoring incremental backups should
reliably work even when change buffering is being used on the server.
Because of this, preparing a backup will not generate any further
redo log, and the redo log file can be safely deleted. (If the
--export option is enabled in the future, it must generate redo log
when processing undo logs and buffered changes.)
In --prepare, we cannot easily know if a partial backup was used,
especially when restoring a series of incremental backups. So, we
simply warn about any missing files, and ignore the redo log for them.
FIXME: Enable the --export option.
FIXME: Improve the handling of the MLOG_INDEX_LOAD record, and write
a test that initiates a backup while an ALGORITHM=INPLACE operation
is creating indexes or rebuilding a table. An error should be detected
when preparing the backup.
FIXME: In --incremental --prepare, xtrabackup_apply_delta() should
ensure that if FSP_SIZE is modified, the file size will be adjusted
accordingly.
2017-06-30 10:49:37 +03:00
|
|
|
while (recv_sys->apply_batch_on) {
|
|
|
|
bool abort = recv_sys->found_corrupt_log;
|
|
|
|
mutex_exit(&recv_sys->mutex);
|
|
|
|
|
|
|
|
if (abort) {
|
MDEV-12253: Buffer pool blocks are accessed after they have been freed
Problem was that bpage was referenced after it was already freed
from LRU. Fixed by adding a new variable encrypted that is
passed down to buf_page_check_corrupt() and used in
buf_page_get_gen() to stop processing page read.
This patch should also address following test failures and
bugs:
MDEV-12419: IMPORT should not look up tablespace in
PageConverter::validate(). This is now removed.
MDEV-10099: encryption.innodb_onlinealter_encryption fails
sporadically in buildbot
MDEV-11420: encryption.innodb_encryption-page-compression
failed in buildbot
MDEV-11222: encryption.encrypt_and_grep failed in buildbot on P8
Removed dict_table_t::is_encrypted and dict_table_t::ibd_file_missing
and replaced these with dict_table_t::file_unreadable. Table
ibd file is missing if fil_get_space(space_id) returns NULL
and encrypted if not. Removed dict_table_t::is_corrupted field.
Ported FilSpace class from 10.2 and using that on buf_page_check_corrupt(),
buf_page_decrypt_after_read(), buf_page_encrypt_before_write(),
buf_dblwr_process(), buf_read_page(), dict_stats_save_defrag_stats().
Added test cases when enrypted page could be read while doing
redo log crash recovery. Also added test case for row compressed
blobs.
btr_cur_open_at_index_side_func(),
btr_cur_open_at_rnd_pos_func(): Avoid referencing block that is
NULL.
buf_page_get_zip(): Issue error if page read fails.
buf_page_get_gen(): Use dberr_t for error detection and
do not reference bpage after we hare freed it.
buf_mark_space_corrupt(): remove bpage from LRU also when
it is encrypted.
buf_page_check_corrupt(): @return DB_SUCCESS if page has
been read and is not corrupted,
DB_PAGE_CORRUPTED if page based on checksum check is corrupted,
DB_DECRYPTION_FAILED if page post encryption checksum matches but
after decryption normal page checksum does not match. In read
case only DB_SUCCESS is possible.
buf_page_io_complete(): use dberr_t for error handling.
buf_flush_write_block_low(),
buf_read_ahead_random(),
buf_read_page_async(),
buf_read_ahead_linear(),
buf_read_ibuf_merge_pages(),
buf_read_recv_pages(),
fil_aio_wait():
Issue error if page read fails.
btr_pcur_move_to_next_page(): Do not reference page if it is
NULL.
Introduced dict_table_t::is_readable() and dict_index_t::is_readable()
that will return true if tablespace exists and pages read from
tablespace are not corrupted or page decryption failed.
Removed buf_page_t::key_version. After page decryption the
key version is not removed from page frame. For unencrypted
pages, old key_version is removed at buf_page_encrypt_before_write()
dict_stats_update_transient_for_index(),
dict_stats_update_transient()
Do not continue if table decryption failed or table
is corrupted.
dict0stats.cc: Introduced a dict_stats_report_error function
to avoid code duplication.
fil_parse_write_crypt_data():
Check that key read from redo log entry is found from
encryption plugin and if it is not, refuse to start.
PageConverter::validate(): Removed access to fil_space_t as
tablespace is not available during import.
Fixed error code on innodb.innodb test.
Merged test cased innodb-bad-key-change5 and innodb-bad-key-shutdown
to innodb-bad-key-change2. Removed innodb-bad-key-change5 test.
Decreased unnecessary complexity on some long lasting tests.
Removed fil_inc_pending_ops(), fil_decr_pending_ops(),
fil_get_first_space(), fil_get_next_space(),
fil_get_first_space_safe(), fil_get_next_space_safe()
functions.
fil_space_verify_crypt_checksum(): Fixed bug found using ASAN
where FIL_PAGE_END_LSN_OLD_CHECKSUM field was incorrectly
accessed from row compressed tables. Fixed out of page frame
bug for row compressed tables in
fil_space_verify_crypt_checksum() found using ASAN. Incorrect
function was called for compressed table.
Added new tests for discard, rename table and drop (we should allow them
even when page decryption fails). Alter table rename is not allowed.
Added test for restart with innodb-force-recovery=1 when page read on
redo-recovery cant be decrypted. Added test for corrupted table where
both page data and FIL_PAGE_FILE_FLUSH_LSN_OR_KEY_VERSION is corrupted.
Adjusted the test case innodb_bug14147491 so that it does not anymore
expect crash. Instead table is just mostly not usable.
fil0fil.h: fil_space_acquire_low is not visible function
and fil_space_acquire and fil_space_acquire_silent are
inline functions. FilSpace class uses fil_space_acquire_low
directly.
recv_apply_hashed_log_recs() does not return anything.
2017-04-26 15:19:16 +03:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
os_thread_sleep(500000);
|
MDEV-12548 Initial implementation of Mariabackup for MariaDB 10.2
InnoDB I/O and buffer pool interfaces and the redo log format
have been changed between MariaDB 10.1 and 10.2, and the backup
code has to be adjusted accordingly.
The code has been simplified, and many memory leaks have been fixed.
Instead of the file name xtrabackup_logfile, the file name ib_logfile0
is being used for the copy of the redo log. Unnecessary InnoDB startup and
shutdown and some unnecessary threads have been removed.
Some help was provided by Vladislav Vaintroub.
Parameters have been cleaned up and aligned with those of MariaDB 10.2.
The --dbug option has been added, so that in debug builds,
--dbug=d,ib_log can be specified to enable diagnostic messages
for processing redo log entries.
By default, innodb_doublewrite=OFF, so that --prepare works faster.
If more crash-safety for --prepare is needed, double buffering
can be enabled.
The parameter innodb_log_checksums=OFF can be used to ignore redo log
checksums in --backup.
Some messages have been cleaned up.
Unless --export is specified, Mariabackup will not deal with undo log.
The InnoDB mini-transaction redo log is not only about user-level
transactions; it is actually about mini-transactions. To avoid confusion,
call it the redo log, not transaction log.
We disable any undo log processing in --prepare.
Because MariaDB 10.2 supports indexed virtual columns, the
undo log processing would need to be able to evaluate virtual column
expressions. To reduce the amount of code dependencies, we will not
process any undo log in prepare.
This means that the --export option must be disabled for now.
This also means that the following options are redundant
and have been removed:
xtrabackup --apply-log-only
innobackupex --redo-only
In addition to disabling any undo log processing, we will disable any
further changes to data pages during --prepare, including the change
buffer merge. This means that restoring incremental backups should
reliably work even when change buffering is being used on the server.
Because of this, preparing a backup will not generate any further
redo log, and the redo log file can be safely deleted. (If the
--export option is enabled in the future, it must generate redo log
when processing undo logs and buffered changes.)
In --prepare, we cannot easily know if a partial backup was used,
especially when restoring a series of incremental backups. So, we
simply warn about any missing files, and ignore the redo log for them.
FIXME: Enable the --export option.
FIXME: Improve the handling of the MLOG_INDEX_LOAD record, and write
a test that initiates a backup while an ALGORITHM=INPLACE operation
is creating indexes or rebuilding a table. An error should be detected
when preparing the backup.
FIXME: In --incremental --prepare, xtrabackup_apply_delta() should
ensure that if FSP_SIZE is modified, the file size will be adjusted
accordingly.
2017-06-30 10:49:37 +03:00
|
|
|
mutex_enter(&recv_sys->mutex);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
ut_ad(!last_batch == log_mutex_own());
|
2014-02-26 19:11:54 +01:00
|
|
|
|
MDEV-12548 Initial implementation of Mariabackup for MariaDB 10.2
InnoDB I/O and buffer pool interfaces and the redo log format
have been changed between MariaDB 10.1 and 10.2, and the backup
code has to be adjusted accordingly.
The code has been simplified, and many memory leaks have been fixed.
Instead of the file name xtrabackup_logfile, the file name ib_logfile0
is being used for the copy of the redo log. Unnecessary InnoDB startup and
shutdown and some unnecessary threads have been removed.
Some help was provided by Vladislav Vaintroub.
Parameters have been cleaned up and aligned with those of MariaDB 10.2.
The --dbug option has been added, so that in debug builds,
--dbug=d,ib_log can be specified to enable diagnostic messages
for processing redo log entries.
By default, innodb_doublewrite=OFF, so that --prepare works faster.
If more crash-safety for --prepare is needed, double buffering
can be enabled.
The parameter innodb_log_checksums=OFF can be used to ignore redo log
checksums in --backup.
Some messages have been cleaned up.
Unless --export is specified, Mariabackup will not deal with undo log.
The InnoDB mini-transaction redo log is not only about user-level
transactions; it is actually about mini-transactions. To avoid confusion,
call it the redo log, not transaction log.
We disable any undo log processing in --prepare.
Because MariaDB 10.2 supports indexed virtual columns, the
undo log processing would need to be able to evaluate virtual column
expressions. To reduce the amount of code dependencies, we will not
process any undo log in prepare.
This means that the --export option must be disabled for now.
This also means that the following options are redundant
and have been removed:
xtrabackup --apply-log-only
innobackupex --redo-only
In addition to disabling any undo log processing, we will disable any
further changes to data pages during --prepare, including the change
buffer merge. This means that restoring incremental backups should
reliably work even when change buffering is being used on the server.
Because of this, preparing a backup will not generate any further
redo log, and the redo log file can be safely deleted. (If the
--export option is enabled in the future, it must generate redo log
when processing undo logs and buffered changes.)
In --prepare, we cannot easily know if a partial backup was used,
especially when restoring a series of incremental backups. So, we
simply warn about any missing files, and ignore the redo log for them.
FIXME: Enable the --export option.
FIXME: Improve the handling of the MLOG_INDEX_LOAD record, and write
a test that initiates a backup while an ALGORITHM=INPLACE operation
is creating indexes or rebuilding a table. An error should be detected
when preparing the backup.
FIXME: In --incremental --prepare, xtrabackup_apply_delta() should
ensure that if FSP_SIZE is modified, the file size will be adjusted
accordingly.
2017-06-30 10:49:37 +03:00
|
|
|
recv_no_ibuf_operations = !last_batch
|
2017-10-10 10:28:54 +03:00
|
|
|
|| srv_operation == SRV_OPERATION_RESTORE
|
|
|
|
|| srv_operation == SRV_OPERATION_RESTORE_EXPORT;
|
MDEV-12548 Initial implementation of Mariabackup for MariaDB 10.2
InnoDB I/O and buffer pool interfaces and the redo log format
have been changed between MariaDB 10.1 and 10.2, and the backup
code has to be adjusted accordingly.
The code has been simplified, and many memory leaks have been fixed.
Instead of the file name xtrabackup_logfile, the file name ib_logfile0
is being used for the copy of the redo log. Unnecessary InnoDB startup and
shutdown and some unnecessary threads have been removed.
Some help was provided by Vladislav Vaintroub.
Parameters have been cleaned up and aligned with those of MariaDB 10.2.
The --dbug option has been added, so that in debug builds,
--dbug=d,ib_log can be specified to enable diagnostic messages
for processing redo log entries.
By default, innodb_doublewrite=OFF, so that --prepare works faster.
If more crash-safety for --prepare is needed, double buffering
can be enabled.
The parameter innodb_log_checksums=OFF can be used to ignore redo log
checksums in --backup.
Some messages have been cleaned up.
Unless --export is specified, Mariabackup will not deal with undo log.
The InnoDB mini-transaction redo log is not only about user-level
transactions; it is actually about mini-transactions. To avoid confusion,
call it the redo log, not transaction log.
We disable any undo log processing in --prepare.
Because MariaDB 10.2 supports indexed virtual columns, the
undo log processing would need to be able to evaluate virtual column
expressions. To reduce the amount of code dependencies, we will not
process any undo log in prepare.
This means that the --export option must be disabled for now.
This also means that the following options are redundant
and have been removed:
xtrabackup --apply-log-only
innobackupex --redo-only
In addition to disabling any undo log processing, we will disable any
further changes to data pages during --prepare, including the change
buffer merge. This means that restoring incremental backups should
reliably work even when change buffering is being used on the server.
Because of this, preparing a backup will not generate any further
redo log, and the redo log file can be safely deleted. (If the
--export option is enabled in the future, it must generate redo log
when processing undo logs and buffered changes.)
In --prepare, we cannot easily know if a partial backup was used,
especially when restoring a series of incremental backups. So, we
simply warn about any missing files, and ignore the redo log for them.
FIXME: Enable the --export option.
FIXME: Improve the handling of the MLOG_INDEX_LOAD record, and write
a test that initiates a backup while an ALGORITHM=INPLACE operation
is creating indexes or rebuilding a table. An error should be detected
when preparing the backup.
FIXME: In --incremental --prepare, xtrabackup_apply_delta() should
ensure that if FSP_SIZE is modified, the file size will be adjusted
accordingly.
2017-06-30 10:49:37 +03:00
|
|
|
|
|
|
|
ut_d(recv_no_log_write = recv_no_ibuf_operations);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
if (ulint n = recv_sys->n_addrs) {
|
|
|
|
const char* msg = last_batch
|
|
|
|
? "Starting final batch to recover "
|
|
|
|
: "Starting a batch to recover ";
|
|
|
|
ib::info() << msg << n << " pages from redo log.";
|
|
|
|
sd_notifyf(0, "STATUS=%s" ULINTPF " pages from redo log",
|
|
|
|
msg, n);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
recv_sys->apply_log_recs = TRUE;
|
|
|
|
recv_sys->apply_batch_on = TRUE;
|
|
|
|
|
MDEV-13564 Mariabackup does not work with TRUNCATE
Implement undo tablespace truncation via normal redo logging.
Implement TRUNCATE TABLE as a combination of RENAME to #sql-ib name,
CREATE, and DROP.
Note: Orphan #sql-ib*.ibd may be left behind if MariaDB Server 10.2
is killed before the DROP operation is committed. If MariaDB Server 10.2
is killed during TRUNCATE, it is also possible that the old table
was renamed to #sql-ib*.ibd but the data dictionary will refer to the
table using the original name.
In MariaDB Server 10.3, RENAME inside InnoDB is transactional,
and #sql-* tables will be dropped on startup. So, this new TRUNCATE
will be fully crash-safe in 10.3.
ha_mroonga::wrapper_truncate(): Pass table options to the underlying
storage engine, now that ha_innobase::truncate() will need them.
rpl_slave_state::truncate_state_table(): Before truncating
mysql.gtid_slave_pos, evict any cached table handles from
the table definition cache, so that there will be no stale
references to the old table after truncating.
== TRUNCATE TABLE ==
WL#6501 in MySQL 5.7 introduced separate log files for implementing
atomic and crash-safe TRUNCATE TABLE, instead of using the InnoDB
undo and redo log. Some convoluted logic was added to the InnoDB
crash recovery, and some extra synchronization (including a redo log
checkpoint) was introduced to make this work. This synchronization
has caused performance problems and race conditions, and the extra
log files cannot be copied or applied by external backup programs.
In order to support crash-upgrade from MariaDB 10.2, we will keep
the logic for parsing and applying the extra log files, but we will
no longer generate those files in TRUNCATE TABLE.
A prerequisite for crash-safe TRUNCATE is a crash-safe RENAME TABLE
(with full redo and undo logging and proper rollback). This will
be implemented in MDEV-14717.
ha_innobase::truncate(): Invoke RENAME, create(), delete_table().
Because RENAME cannot be fully rolled back before MariaDB 10.3
due to missing undo logging, add some explicit rename-back in
case the operation fails.
ha_innobase::delete(): Introduce a variant that takes sqlcom as
a parameter. In TRUNCATE TABLE, we do not want to touch any
FOREIGN KEY constraints.
ha_innobase::create(): Add the parameters file_per_table, trx.
In TRUNCATE, the new table must be created in the same transaction
that renames the old table.
create_table_info_t::create_table_info_t(): Add the parameters
file_per_table, trx.
row_drop_table_for_mysql(): Replace a bool parameter with sqlcom.
row_drop_table_after_create_fail(): New function, wrapping
row_drop_table_for_mysql().
dict_truncate_index_tree_in_mem(), fil_truncate_tablespace(),
fil_prepare_for_truncate(), fil_reinit_space_header_for_table(),
row_truncate_table_for_mysql(), TruncateLogger,
row_truncate_prepare(), row_truncate_rollback(),
row_truncate_complete(), row_truncate_fts(),
row_truncate_update_system_tables(),
row_truncate_foreign_key_checks(), row_truncate_sanity_checks():
Remove.
row_upd_check_references_constraints(): Remove a check for
TRUNCATE, now that the table is no longer truncated in place.
The new test innodb.truncate_foreign uses DEBUG_SYNC to cover some
race-condition like scenarios. The test innodb-innodb.truncate does
not use any synchronization.
We add a redo log subformat to indicate backup-friendly format.
MariaDB 10.4 will remove support for the old TRUNCATE logging,
so crash-upgrade from old 10.2 or 10.3 to 10.4 will involve
limitations.
== Undo tablespace truncation ==
MySQL 5.7 implements undo tablespace truncation. It is only
possible when innodb_undo_tablespaces is set to at least 2.
The logging is implemented similar to the WL#6501 TRUNCATE,
that is, using separate log files and a redo log checkpoint.
We can simply implement undo tablespace truncation within
a single mini-transaction that reinitializes the undo log
tablespace file. Unfortunately, due to the redo log format
of some operations, currently, the total redo log written by
undo tablespace truncation will be more than the combined size
of the truncated undo tablespace. It should be acceptable
to have a little more than 1 megabyte of log in a single
mini-transaction. This will be fixed in MDEV-17138 in
MariaDB Server 10.4.
recv_sys_t: Add truncated_undo_spaces[] to remember for which undo
tablespaces a MLOG_FILE_CREATE2 record was seen.
namespace undo: Remove some unnecessary declarations.
fil_space_t::is_being_truncated: Document that this flag now
only applies to undo tablespaces. Remove some references.
fil_space_t::is_stopping(): Do not refer to is_being_truncated.
This check is for tablespaces of tables. Potentially used
tablespaces are never truncated any more.
buf_dblwr_process(): Suppress the out-of-bounds warning
for undo tablespaces.
fil_truncate_log(): Write a MLOG_FILE_CREATE2 with a nonzero
page number (new size of the tablespace in pages) to inform
crash recovery that the undo tablespace size has been reduced.
fil_op_write_log(): Relax assertions, so that MLOG_FILE_CREATE2
can be written for undo tablespaces (without .ibd file suffix)
for a nonzero page number.
os_file_truncate(): Add the parameter allow_shrink=false
so that undo tablespaces can actually be shrunk using this function.
fil_name_parse(): For undo tablespace truncation,
buffer MLOG_FILE_CREATE2 in truncated_undo_spaces[].
recv_read_in_area(): Avoid reading pages for which no redo log
records remain buffered, after recv_addr_trim() removed them.
trx_rseg_header_create(): Add a FIXME comment that we could write
much less redo log.
trx_undo_truncate_tablespace(): Reinitialize the undo tablespace
in a single mini-transaction, which will be flushed to the redo log
before the file size is trimmed.
recv_addr_trim(): Discard any redo logs for pages that were
logged after the new end of a file, before the truncation LSN.
If the rec_list becomes empty, reduce n_addrs. After removing
any affected records, actually truncate the file.
recv_apply_hashed_log_recs(): Invoke recv_addr_trim() right before
applying any log records. The undo tablespace files must be open
at this point.
buf_flush_or_remove_pages(), buf_flush_dirty_pages(),
buf_LRU_flush_or_remove_pages(): Add a parameter for specifying
the number of the first page to flush or remove (default 0).
trx_purge_initiate_truncate(): Remove the log checkpoints, the
extra logging, and some unnecessary crash points. Merge the code
from trx_undo_truncate_tablespace(). First, flush all to-be-discarded
pages (beyond the new end of the file), then trim the space->size
to make the page allocation deterministic. At the only remaining
crash injection point, flush the redo log, so that the recovery
can be tested.
2018-08-28 13:43:06 +03:00
|
|
|
for (ulint id = srv_undo_tablespaces_open; id--; ) {
|
|
|
|
recv_sys_t::trunc& t = recv_sys->truncated_undo_spaces[id];
|
|
|
|
if (t.lsn) {
|
|
|
|
recv_addr_trim(id + srv_undo_space_id_start, t.pages,
|
|
|
|
t.lsn);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
for (ulint i = 0; i < hash_get_n_cells(recv_sys->addr_hash); i++) {
|
|
|
|
for (recv_addr_t* recv_addr = static_cast<recv_addr_t*>(
|
2017-03-08 11:40:43 +02:00
|
|
|
HASH_GET_FIRST(recv_sys->addr_hash, i));
|
2017-03-07 17:16:49 +02:00
|
|
|
recv_addr;
|
2014-02-26 19:11:54 +01:00
|
|
|
recv_addr = static_cast<recv_addr_t*>(
|
|
|
|
HASH_GET_NEXT(addr_hash, recv_addr))) {
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (srv_is_tablespace_truncated(recv_addr->space)) {
|
|
|
|
/* Avoid applying REDO log for the tablespace
|
|
|
|
that is schedule for TRUNCATE. */
|
|
|
|
ut_a(recv_sys->n_addrs);
|
|
|
|
recv_addr->state = RECV_DISCARDED;
|
|
|
|
recv_sys->n_addrs--;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2018-11-20 14:55:44 +02:00
|
|
|
if (recv_addr->state == RECV_DISCARDED
|
|
|
|
|| !UT_LIST_GET_LEN(recv_addr->rec_list)) {
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_a(recv_sys->n_addrs);
|
|
|
|
recv_sys->n_addrs--;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
const page_id_t page_id(recv_addr->space,
|
|
|
|
recv_addr->page_no);
|
|
|
|
bool found;
|
|
|
|
const page_size_t& page_size
|
|
|
|
= fil_space_get_page_size(recv_addr->space,
|
|
|
|
&found);
|
|
|
|
|
|
|
|
ut_ad(found);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (recv_addr->state == RECV_NOT_PROCESSED) {
|
2017-03-07 17:16:49 +02:00
|
|
|
mutex_exit(&recv_sys->mutex);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (buf_page_peek(page_id)) {
|
2017-03-07 17:16:49 +02:00
|
|
|
mtr_t mtr;
|
|
|
|
mtr.start();
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
buf_block_t* block = buf_page_get(
|
2016-08-12 11:17:45 +03:00
|
|
|
page_id, page_size,
|
2014-02-26 19:11:54 +01:00
|
|
|
RW_X_LATCH, &mtr);
|
2016-08-12 11:17:45 +03:00
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
buf_block_dbg_add_level(
|
|
|
|
block, SYNC_NO_ORDER_CHECK);
|
|
|
|
|
|
|
|
recv_recover_page(FALSE, block);
|
2017-03-07 17:16:49 +02:00
|
|
|
mtr.commit();
|
2014-02-26 19:11:54 +01:00
|
|
|
} else {
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_read_in_area(page_id);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2017-03-08 11:40:43 +02:00
|
|
|
mutex_enter(&recv_sys->mutex);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Wait until all the pages have been processed */
|
|
|
|
|
|
|
|
while (recv_sys->n_addrs != 0) {
|
MDEV-12548 Initial implementation of Mariabackup for MariaDB 10.2
InnoDB I/O and buffer pool interfaces and the redo log format
have been changed between MariaDB 10.1 and 10.2, and the backup
code has to be adjusted accordingly.
The code has been simplified, and many memory leaks have been fixed.
Instead of the file name xtrabackup_logfile, the file name ib_logfile0
is being used for the copy of the redo log. Unnecessary InnoDB startup and
shutdown and some unnecessary threads have been removed.
Some help was provided by Vladislav Vaintroub.
Parameters have been cleaned up and aligned with those of MariaDB 10.2.
The --dbug option has been added, so that in debug builds,
--dbug=d,ib_log can be specified to enable diagnostic messages
for processing redo log entries.
By default, innodb_doublewrite=OFF, so that --prepare works faster.
If more crash-safety for --prepare is needed, double buffering
can be enabled.
The parameter innodb_log_checksums=OFF can be used to ignore redo log
checksums in --backup.
Some messages have been cleaned up.
Unless --export is specified, Mariabackup will not deal with undo log.
The InnoDB mini-transaction redo log is not only about user-level
transactions; it is actually about mini-transactions. To avoid confusion,
call it the redo log, not transaction log.
We disable any undo log processing in --prepare.
Because MariaDB 10.2 supports indexed virtual columns, the
undo log processing would need to be able to evaluate virtual column
expressions. To reduce the amount of code dependencies, we will not
process any undo log in prepare.
This means that the --export option must be disabled for now.
This also means that the following options are redundant
and have been removed:
xtrabackup --apply-log-only
innobackupex --redo-only
In addition to disabling any undo log processing, we will disable any
further changes to data pages during --prepare, including the change
buffer merge. This means that restoring incremental backups should
reliably work even when change buffering is being used on the server.
Because of this, preparing a backup will not generate any further
redo log, and the redo log file can be safely deleted. (If the
--export option is enabled in the future, it must generate redo log
when processing undo logs and buffered changes.)
In --prepare, we cannot easily know if a partial backup was used,
especially when restoring a series of incremental backups. So, we
simply warn about any missing files, and ignore the redo log for them.
FIXME: Enable the --export option.
FIXME: Improve the handling of the MLOG_INDEX_LOAD record, and write
a test that initiates a backup while an ALGORITHM=INPLACE operation
is creating indexes or rebuilding a table. An error should be detected
when preparing the backup.
FIXME: In --incremental --prepare, xtrabackup_apply_delta() should
ensure that if FSP_SIZE is modified, the file size will be adjusted
accordingly.
2017-06-30 10:49:37 +03:00
|
|
|
bool abort = recv_sys->found_corrupt_log;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
mutex_exit(&(recv_sys->mutex));
|
|
|
|
|
MDEV-12548 Initial implementation of Mariabackup for MariaDB 10.2
InnoDB I/O and buffer pool interfaces and the redo log format
have been changed between MariaDB 10.1 and 10.2, and the backup
code has to be adjusted accordingly.
The code has been simplified, and many memory leaks have been fixed.
Instead of the file name xtrabackup_logfile, the file name ib_logfile0
is being used for the copy of the redo log. Unnecessary InnoDB startup and
shutdown and some unnecessary threads have been removed.
Some help was provided by Vladislav Vaintroub.
Parameters have been cleaned up and aligned with those of MariaDB 10.2.
The --dbug option has been added, so that in debug builds,
--dbug=d,ib_log can be specified to enable diagnostic messages
for processing redo log entries.
By default, innodb_doublewrite=OFF, so that --prepare works faster.
If more crash-safety for --prepare is needed, double buffering
can be enabled.
The parameter innodb_log_checksums=OFF can be used to ignore redo log
checksums in --backup.
Some messages have been cleaned up.
Unless --export is specified, Mariabackup will not deal with undo log.
The InnoDB mini-transaction redo log is not only about user-level
transactions; it is actually about mini-transactions. To avoid confusion,
call it the redo log, not transaction log.
We disable any undo log processing in --prepare.
Because MariaDB 10.2 supports indexed virtual columns, the
undo log processing would need to be able to evaluate virtual column
expressions. To reduce the amount of code dependencies, we will not
process any undo log in prepare.
This means that the --export option must be disabled for now.
This also means that the following options are redundant
and have been removed:
xtrabackup --apply-log-only
innobackupex --redo-only
In addition to disabling any undo log processing, we will disable any
further changes to data pages during --prepare, including the change
buffer merge. This means that restoring incremental backups should
reliably work even when change buffering is being used on the server.
Because of this, preparing a backup will not generate any further
redo log, and the redo log file can be safely deleted. (If the
--export option is enabled in the future, it must generate redo log
when processing undo logs and buffered changes.)
In --prepare, we cannot easily know if a partial backup was used,
especially when restoring a series of incremental backups. So, we
simply warn about any missing files, and ignore the redo log for them.
FIXME: Enable the --export option.
FIXME: Improve the handling of the MLOG_INDEX_LOAD record, and write
a test that initiates a backup while an ALGORITHM=INPLACE operation
is creating indexes or rebuilding a table. An error should be detected
when preparing the backup.
FIXME: In --incremental --prepare, xtrabackup_apply_delta() should
ensure that if FSP_SIZE is modified, the file size will be adjusted
accordingly.
2017-06-30 10:49:37 +03:00
|
|
|
if (abort) {
|
MDEV-12253: Buffer pool blocks are accessed after they have been freed
Problem was that bpage was referenced after it was already freed
from LRU. Fixed by adding a new variable encrypted that is
passed down to buf_page_check_corrupt() and used in
buf_page_get_gen() to stop processing page read.
This patch should also address following test failures and
bugs:
MDEV-12419: IMPORT should not look up tablespace in
PageConverter::validate(). This is now removed.
MDEV-10099: encryption.innodb_onlinealter_encryption fails
sporadically in buildbot
MDEV-11420: encryption.innodb_encryption-page-compression
failed in buildbot
MDEV-11222: encryption.encrypt_and_grep failed in buildbot on P8
Removed dict_table_t::is_encrypted and dict_table_t::ibd_file_missing
and replaced these with dict_table_t::file_unreadable. Table
ibd file is missing if fil_get_space(space_id) returns NULL
and encrypted if not. Removed dict_table_t::is_corrupted field.
Ported FilSpace class from 10.2 and using that on buf_page_check_corrupt(),
buf_page_decrypt_after_read(), buf_page_encrypt_before_write(),
buf_dblwr_process(), buf_read_page(), dict_stats_save_defrag_stats().
Added test cases when enrypted page could be read while doing
redo log crash recovery. Also added test case for row compressed
blobs.
btr_cur_open_at_index_side_func(),
btr_cur_open_at_rnd_pos_func(): Avoid referencing block that is
NULL.
buf_page_get_zip(): Issue error if page read fails.
buf_page_get_gen(): Use dberr_t for error detection and
do not reference bpage after we hare freed it.
buf_mark_space_corrupt(): remove bpage from LRU also when
it is encrypted.
buf_page_check_corrupt(): @return DB_SUCCESS if page has
been read and is not corrupted,
DB_PAGE_CORRUPTED if page based on checksum check is corrupted,
DB_DECRYPTION_FAILED if page post encryption checksum matches but
after decryption normal page checksum does not match. In read
case only DB_SUCCESS is possible.
buf_page_io_complete(): use dberr_t for error handling.
buf_flush_write_block_low(),
buf_read_ahead_random(),
buf_read_page_async(),
buf_read_ahead_linear(),
buf_read_ibuf_merge_pages(),
buf_read_recv_pages(),
fil_aio_wait():
Issue error if page read fails.
btr_pcur_move_to_next_page(): Do not reference page if it is
NULL.
Introduced dict_table_t::is_readable() and dict_index_t::is_readable()
that will return true if tablespace exists and pages read from
tablespace are not corrupted or page decryption failed.
Removed buf_page_t::key_version. After page decryption the
key version is not removed from page frame. For unencrypted
pages, old key_version is removed at buf_page_encrypt_before_write()
dict_stats_update_transient_for_index(),
dict_stats_update_transient()
Do not continue if table decryption failed or table
is corrupted.
dict0stats.cc: Introduced a dict_stats_report_error function
to avoid code duplication.
fil_parse_write_crypt_data():
Check that key read from redo log entry is found from
encryption plugin and if it is not, refuse to start.
PageConverter::validate(): Removed access to fil_space_t as
tablespace is not available during import.
Fixed error code on innodb.innodb test.
Merged test cased innodb-bad-key-change5 and innodb-bad-key-shutdown
to innodb-bad-key-change2. Removed innodb-bad-key-change5 test.
Decreased unnecessary complexity on some long lasting tests.
Removed fil_inc_pending_ops(), fil_decr_pending_ops(),
fil_get_first_space(), fil_get_next_space(),
fil_get_first_space_safe(), fil_get_next_space_safe()
functions.
fil_space_verify_crypt_checksum(): Fixed bug found using ASAN
where FIL_PAGE_END_LSN_OLD_CHECKSUM field was incorrectly
accessed from row compressed tables. Fixed out of page frame
bug for row compressed tables in
fil_space_verify_crypt_checksum() found using ASAN. Incorrect
function was called for compressed table.
Added new tests for discard, rename table and drop (we should allow them
even when page decryption fails). Alter table rename is not allowed.
Added test for restart with innodb-force-recovery=1 when page read on
redo-recovery cant be decrypted. Added test for corrupted table where
both page data and FIL_PAGE_FILE_FLUSH_LSN_OR_KEY_VERSION is corrupted.
Adjusted the test case innodb_bug14147491 so that it does not anymore
expect crash. Instead table is just mostly not usable.
fil0fil.h: fil_space_acquire_low is not visible function
and fil_space_acquire and fil_space_acquire_silent are
inline functions. FilSpace class uses fil_space_acquire_low
directly.
recv_apply_hashed_log_recs() does not return anything.
2017-04-26 15:19:16 +03:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
os_thread_sleep(500000);
|
|
|
|
|
|
|
|
mutex_enter(&(recv_sys->mutex));
|
|
|
|
}
|
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
if (!last_batch) {
|
2014-02-26 19:11:54 +01:00
|
|
|
/* Flush all the file pages to disk and invalidate them in
|
|
|
|
the buffer pool */
|
|
|
|
|
|
|
|
mutex_exit(&(recv_sys->mutex));
|
2016-08-12 11:17:45 +03:00
|
|
|
log_mutex_exit();
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/* Stop the recv_writer thread from issuing any LRU
|
|
|
|
flush batches. */
|
|
|
|
mutex_enter(&recv_sys->writer_mutex);
|
|
|
|
|
|
|
|
/* Wait for any currently run batch to end. */
|
|
|
|
buf_flush_wait_LRU_batch_end();
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
os_event_reset(recv_sys->flush_end);
|
|
|
|
recv_sys->flush_type = BUF_FLUSH_LIST;
|
|
|
|
os_event_set(recv_sys->flush_start);
|
|
|
|
os_event_wait(recv_sys->flush_end);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
buf_pool_invalidate();
|
|
|
|
|
|
|
|
/* Allow batches from recv_writer thread. */
|
|
|
|
mutex_exit(&recv_sys->writer_mutex);
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
log_mutex_enter();
|
2014-02-26 19:11:54 +01:00
|
|
|
mutex_enter(&(recv_sys->mutex));
|
|
|
|
}
|
|
|
|
|
|
|
|
recv_sys->apply_log_recs = FALSE;
|
|
|
|
recv_sys->apply_batch_on = FALSE;
|
|
|
|
|
2016-09-06 09:43:16 +03:00
|
|
|
recv_sys_empty_hash();
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
mutex_exit(&recv_sys->mutex);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Tries to parse a single log record.
|
|
|
|
@param[out] type log record type
|
|
|
|
@param[in] ptr pointer to a buffer
|
|
|
|
@param[in] end_ptr end of the buffer
|
|
|
|
@param[out] space_id tablespace identifier
|
|
|
|
@param[out] page_no page number
|
|
|
|
@param[in] apply whether to apply MLOG_FILE_* records
|
|
|
|
@param[out] body start of log record body
|
|
|
|
@return length of the record, or 0 if the record was not complete */
|
2014-02-26 19:11:54 +01:00
|
|
|
static
|
|
|
|
ulint
|
|
|
|
recv_parse_log_rec(
|
2016-08-12 11:17:45 +03:00
|
|
|
mlog_id_t* type,
|
|
|
|
byte* ptr,
|
|
|
|
byte* end_ptr,
|
|
|
|
ulint* space,
|
|
|
|
ulint* page_no,
|
|
|
|
bool apply,
|
|
|
|
byte** body)
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
|
|
|
byte* new_ptr;
|
|
|
|
|
|
|
|
*body = NULL;
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
UNIV_MEM_INVALID(type, sizeof *type);
|
|
|
|
UNIV_MEM_INVALID(space, sizeof *space);
|
|
|
|
UNIV_MEM_INVALID(page_no, sizeof *page_no);
|
|
|
|
UNIV_MEM_INVALID(body, sizeof *body);
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
if (ptr == end_ptr) {
|
|
|
|
|
|
|
|
return(0);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
switch (*ptr) {
|
|
|
|
#ifdef UNIV_LOG_LSN_DEBUG
|
|
|
|
case MLOG_LSN | MLOG_SINGLE_REC_FLAG:
|
|
|
|
case MLOG_LSN:
|
|
|
|
new_ptr = mlog_parse_initial_log_record(
|
|
|
|
ptr, end_ptr, type, space, page_no);
|
|
|
|
if (new_ptr != NULL) {
|
|
|
|
const lsn_t lsn = static_cast<lsn_t>(
|
|
|
|
*space) << 32 | *page_no;
|
|
|
|
ut_a(lsn == recv_sys->recovered_lsn);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
*type = MLOG_LSN;
|
|
|
|
return(new_ptr - ptr);
|
|
|
|
#endif /* UNIV_LOG_LSN_DEBUG */
|
|
|
|
case MLOG_MULTI_REC_END:
|
|
|
|
case MLOG_DUMMY_RECORD:
|
|
|
|
*type = static_cast<mlog_id_t>(*ptr);
|
2014-02-26 19:11:54 +01:00
|
|
|
return(1);
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_CHECKPOINT:
|
|
|
|
if (end_ptr < ptr + SIZE_OF_MLOG_CHECKPOINT) {
|
|
|
|
return(0);
|
|
|
|
}
|
|
|
|
*type = static_cast<mlog_id_t>(*ptr);
|
|
|
|
return(SIZE_OF_MLOG_CHECKPOINT);
|
|
|
|
case MLOG_MULTI_REC_END | MLOG_SINGLE_REC_FLAG:
|
|
|
|
case MLOG_DUMMY_RECORD | MLOG_SINGLE_REC_FLAG:
|
|
|
|
case MLOG_CHECKPOINT | MLOG_SINGLE_REC_FLAG:
|
2018-08-16 06:35:28 +03:00
|
|
|
ib::error() << "Incorrect log record type "
|
|
|
|
<< ib::hex(unsigned(*ptr));
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_sys->found_corrupt_log = true;
|
|
|
|
return(0);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
new_ptr = mlog_parse_initial_log_record(ptr, end_ptr, type, space,
|
|
|
|
page_no);
|
|
|
|
*body = new_ptr;
|
|
|
|
|
|
|
|
if (UNIV_UNLIKELY(!new_ptr)) {
|
|
|
|
|
|
|
|
return(0);
|
|
|
|
}
|
|
|
|
|
2016-12-30 13:48:22 +02:00
|
|
|
const byte* old_ptr = new_ptr;
|
2016-08-12 11:17:45 +03:00
|
|
|
new_ptr = recv_parse_or_apply_log_rec_body(
|
|
|
|
*type, new_ptr, end_ptr, *space, *page_no, apply, NULL, NULL);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (UNIV_UNLIKELY(new_ptr == NULL)) {
|
|
|
|
return(0);
|
|
|
|
}
|
|
|
|
|
MDEV-11556 InnoDB redo log apply fails to adjust data file sizes
fil_space_t::recv_size: New member: recovered tablespace size in pages;
0 if no size change was read from the redo log,
or if the size change was implemented.
fil_space_set_recv_size(): New function for setting space->recv_size.
innodb_data_file_size_debug: A debug parameter for setting the system
tablespace size in recovery even when the redo log does not contain
any size changes. It is hard to write a small test case that would
cause the system tablespace to be extended at the critical moment.
recv_parse_log_rec(): Note those tablespaces whose size is being changed
by the redo log, by invoking fil_space_set_recv_size().
innobase_init(): Correct an error message, and do not require a larger
innodb_buffer_pool_size when starting up with a smaller innodb_page_size.
innobase_start_or_create_for_mysql(): Allow startup with any initial
size of the ibdata1 file if the autoextend attribute is set. Require
the minimum size of fixed-size system tablespaces to be 640 pages,
not 10 megabytes. Implement innodb_data_file_size_debug.
open_or_create_data_files(): Round the system tablespace size down
to pages, not to full megabytes, (Our test truncates the system
tablespace to more than 800 pages with innodb_page_size=4k.
InnoDB should not imagine that it was truncated to 768 pages
and then overwrite good pages in the tablespace.)
fil_flush_low(): Refactored from fil_flush().
fil_space_extend_must_retry(): Refactored from
fil_extend_space_to_desired_size().
fil_mutex_enter_and_prepare_for_io(): Extend the tablespace if
fil_space_set_recv_size() was called.
The test case has been successfully run with all the
innodb_page_size values 4k, 8k, 16k, 32k, 64k.
2016-12-28 12:05:43 +02:00
|
|
|
if (*page_no == 0 && *type == MLOG_4BYTES
|
|
|
|
&& mach_read_from_2(old_ptr) == FSP_HEADER_OFFSET + FSP_SIZE) {
|
2016-12-30 13:48:22 +02:00
|
|
|
old_ptr += 2;
|
|
|
|
fil_space_set_recv_size(*space,
|
|
|
|
mach_parse_compressed(&old_ptr,
|
|
|
|
end_ptr));
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
return(new_ptr - ptr);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*******************************************************//**
|
|
|
|
Calculates the new value for lsn when more data is added to the log. */
|
|
|
|
static
|
|
|
|
lsn_t
|
|
|
|
recv_calc_lsn_on_data_add(
|
|
|
|
/*======================*/
|
|
|
|
lsn_t lsn, /*!< in: old lsn */
|
|
|
|
ib_uint64_t len) /*!< in: this many bytes of data is
|
|
|
|
added, log block headers not included */
|
|
|
|
{
|
|
|
|
ulint frag_len;
|
|
|
|
ib_uint64_t lsn_len;
|
|
|
|
|
|
|
|
frag_len = (lsn % OS_FILE_LOG_BLOCK_SIZE) - LOG_BLOCK_HDR_SIZE;
|
|
|
|
ut_ad(frag_len < OS_FILE_LOG_BLOCK_SIZE - LOG_BLOCK_HDR_SIZE
|
|
|
|
- LOG_BLOCK_TRL_SIZE);
|
|
|
|
lsn_len = len;
|
|
|
|
lsn_len += (lsn_len + frag_len)
|
|
|
|
/ (OS_FILE_LOG_BLOCK_SIZE - LOG_BLOCK_HDR_SIZE
|
|
|
|
- LOG_BLOCK_TRL_SIZE)
|
|
|
|
* (LOG_BLOCK_HDR_SIZE + LOG_BLOCK_TRL_SIZE);
|
|
|
|
|
|
|
|
return(lsn + lsn_len);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Prints diagnostic info of corrupt log.
|
|
|
|
@param[in] ptr pointer to corrupt log record
|
|
|
|
@param[in] type type of the log record (could be garbage)
|
|
|
|
@param[in] space tablespace ID (could be garbage)
|
|
|
|
@param[in] page_no page number (could be garbage)
|
|
|
|
@return whether processing should continue */
|
2014-02-26 19:11:54 +01:00
|
|
|
static
|
2016-08-12 11:17:45 +03:00
|
|
|
bool
|
2014-02-26 19:11:54 +01:00
|
|
|
recv_report_corrupt_log(
|
2016-08-12 11:17:45 +03:00
|
|
|
const byte* ptr,
|
|
|
|
int type,
|
|
|
|
ulint space,
|
|
|
|
ulint page_no)
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::error() <<
|
|
|
|
"############### CORRUPT LOG RECORD FOUND ##################";
|
|
|
|
|
2018-08-10 10:00:47 +03:00
|
|
|
const ulint ptr_offset = ulint(ptr - recv_sys->buf);
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::info() << "Log record type " << type << ", page " << space << ":"
|
|
|
|
<< page_no << ". Log parsing proceeded successfully up to "
|
|
|
|
<< recv_sys->recovered_lsn << ". Previous log record type "
|
|
|
|
<< recv_previous_parsed_rec_type << ", is multi "
|
|
|
|
<< recv_previous_parsed_rec_is_multi << " Recv offset "
|
2018-08-10 10:00:47 +03:00
|
|
|
<< ptr_offset << ", prev "
|
2016-08-12 11:17:45 +03:00
|
|
|
<< recv_previous_parsed_rec_offset;
|
|
|
|
|
|
|
|
ut_ad(ptr <= recv_sys->buf + recv_sys->len);
|
|
|
|
|
|
|
|
const ulint limit = 100;
|
2018-08-10 10:00:47 +03:00
|
|
|
const ulint prev_offset = std::min(recv_previous_parsed_rec_offset,
|
|
|
|
ptr_offset);
|
|
|
|
const ulint before = std::min(prev_offset, limit);
|
|
|
|
const ulint after = std::min(recv_sys->len - ptr_offset, limit);
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
ib::info() << "Hex dump starting " << before << " bytes before and"
|
|
|
|
" ending " << after << " bytes after the corrupted record:";
|
|
|
|
|
2018-08-10 10:00:47 +03:00
|
|
|
const byte* start = recv_sys->buf + prev_offset - before;
|
|
|
|
|
|
|
|
ut_print_buf(stderr, start, ulint(ptr - start) + after);
|
2016-08-12 11:17:45 +03:00
|
|
|
putc('\n', stderr);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (!srv_force_recovery) {
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::info() << "Set innodb_force_recovery to ignore this error.";
|
|
|
|
return(false);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::warn() << "The log file may have been corrupt and it is possible"
|
|
|
|
" that the log scan did not proceed far enough in recovery!"
|
|
|
|
" Please run CHECK TABLE on your InnoDB tables to check"
|
|
|
|
" that they are ok! If mysqld crashes after this recovery; "
|
|
|
|
<< FORCE_RECOVERY_MSG;
|
|
|
|
return(true);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Parse log records from a buffer and optionally store them to a
|
|
|
|
hash table to wait merging to file pages.
|
|
|
|
@param[in] checkpoint_lsn the LSN of the latest checkpoint
|
|
|
|
@param[in] store whether to store page operations
|
|
|
|
@param[in] apply whether to apply the records
|
|
|
|
@return whether MLOG_CHECKPOINT record was seen the first time,
|
|
|
|
or corruption was noticed */
|
2018-03-13 15:19:30 +05:30
|
|
|
bool recv_parse_log_recs(lsn_t checkpoint_lsn, store_t store, bool apply)
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
2016-08-12 11:17:45 +03:00
|
|
|
byte* ptr;
|
|
|
|
byte* end_ptr;
|
|
|
|
bool single_rec;
|
|
|
|
ulint len;
|
|
|
|
lsn_t new_recovered_lsn;
|
|
|
|
lsn_t old_lsn;
|
|
|
|
mlog_id_t type;
|
|
|
|
ulint space;
|
|
|
|
ulint page_no;
|
|
|
|
byte* body;
|
|
|
|
|
|
|
|
ut_ad(log_mutex_own());
|
2014-02-26 19:11:54 +01:00
|
|
|
ut_ad(recv_sys->parse_start_lsn != 0);
|
|
|
|
loop:
|
|
|
|
ptr = recv_sys->buf + recv_sys->recovered_offset;
|
|
|
|
|
|
|
|
end_ptr = recv_sys->buf + recv_sys->len;
|
|
|
|
|
|
|
|
if (ptr == end_ptr) {
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
return(false);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
switch (*ptr) {
|
|
|
|
case MLOG_CHECKPOINT:
|
|
|
|
#ifdef UNIV_LOG_LSN_DEBUG
|
|
|
|
case MLOG_LSN:
|
|
|
|
#endif /* UNIV_LOG_LSN_DEBUG */
|
|
|
|
case MLOG_DUMMY_RECORD:
|
|
|
|
single_rec = true;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
single_rec = !!(*ptr & MLOG_SINGLE_REC_FLAG);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (single_rec) {
|
|
|
|
/* The mtr did not modify multiple pages */
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
old_lsn = recv_sys->recovered_lsn;
|
|
|
|
|
|
|
|
/* Try to parse a log record, fetching its type, space id,
|
|
|
|
page no, and a pointer to the body of the log record */
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
len = recv_parse_log_rec(&type, ptr, end_ptr, &space,
|
|
|
|
&page_no, apply, &body);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (recv_sys->found_corrupt_log) {
|
2018-08-10 13:02:01 +03:00
|
|
|
recv_report_corrupt_log(ptr, type, space, page_no);
|
2016-08-12 11:17:45 +03:00
|
|
|
return(true);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (recv_sys->found_corrupt_fs) {
|
|
|
|
return(true);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2018-08-16 06:35:28 +03:00
|
|
|
if (len == 0) {
|
|
|
|
return(false);
|
|
|
|
}
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
new_recovered_lsn = recv_calc_lsn_on_data_add(old_lsn, len);
|
|
|
|
|
|
|
|
if (new_recovered_lsn > recv_sys->scanned_lsn) {
|
|
|
|
/* The log record filled a log block, and we require
|
|
|
|
that also the next log block should have been scanned
|
|
|
|
in */
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
return(false);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_previous_parsed_rec_type = type;
|
2014-02-26 19:11:54 +01:00
|
|
|
recv_previous_parsed_rec_offset = recv_sys->recovered_offset;
|
|
|
|
recv_previous_parsed_rec_is_multi = 0;
|
|
|
|
|
|
|
|
recv_sys->recovered_offset += len;
|
|
|
|
recv_sys->recovered_lsn = new_recovered_lsn;
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
switch (type) {
|
|
|
|
lsn_t lsn;
|
|
|
|
case MLOG_DUMMY_RECORD:
|
2014-02-26 19:11:54 +01:00
|
|
|
/* Do nothing */
|
2016-08-12 11:17:45 +03:00
|
|
|
break;
|
|
|
|
case MLOG_CHECKPOINT:
|
|
|
|
#if SIZE_OF_MLOG_CHECKPOINT != 1 + 8
|
|
|
|
# error SIZE_OF_MLOG_CHECKPOINT != 1 + 8
|
|
|
|
#endif
|
|
|
|
lsn = mach_read_from_8(ptr + 1);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2018-06-15 14:09:15 +03:00
|
|
|
if (UNIV_UNLIKELY(srv_print_verbose_log == 2)) {
|
|
|
|
fprintf(stderr,
|
|
|
|
"MLOG_CHECKPOINT(" LSN_PF ") %s at "
|
|
|
|
LSN_PF "\n", lsn,
|
|
|
|
lsn != checkpoint_lsn ? "ignored"
|
|
|
|
: recv_sys->mlog_checkpoint_lsn
|
|
|
|
? "reread" : "read",
|
|
|
|
recv_sys->recovered_lsn);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
DBUG_PRINT("ib_log",
|
|
|
|
("MLOG_CHECKPOINT(" LSN_PF ") %s at "
|
|
|
|
LSN_PF,
|
|
|
|
lsn,
|
|
|
|
lsn != checkpoint_lsn ? "ignored"
|
|
|
|
: recv_sys->mlog_checkpoint_lsn
|
|
|
|
? "reread" : "read",
|
|
|
|
recv_sys->recovered_lsn));
|
|
|
|
|
|
|
|
if (lsn == checkpoint_lsn) {
|
|
|
|
if (recv_sys->mlog_checkpoint_lsn) {
|
|
|
|
/* At recv_reset_logs() we may
|
|
|
|
write a duplicate MLOG_CHECKPOINT
|
|
|
|
for the same checkpoint LSN. Thus
|
|
|
|
recv_sys->mlog_checkpoint_lsn
|
|
|
|
can differ from the current LSN. */
|
|
|
|
ut_ad(recv_sys->mlog_checkpoint_lsn
|
|
|
|
<= recv_sys->recovered_lsn);
|
|
|
|
break;
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_sys->mlog_checkpoint_lsn
|
|
|
|
= recv_sys->recovered_lsn;
|
|
|
|
return(true);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
2016-08-12 11:17:45 +03:00
|
|
|
break;
|
2014-02-26 19:11:54 +01:00
|
|
|
#ifdef UNIV_LOG_LSN_DEBUG
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_LSN:
|
2014-02-26 19:11:54 +01:00
|
|
|
/* Do not add these records to the hash table.
|
|
|
|
The page number and space id fields are misused
|
|
|
|
for something else. */
|
2016-08-12 11:17:45 +03:00
|
|
|
break;
|
2014-02-26 19:11:54 +01:00
|
|
|
#endif /* UNIV_LOG_LSN_DEBUG */
|
2016-08-12 11:17:45 +03:00
|
|
|
default:
|
|
|
|
switch (store) {
|
|
|
|
case STORE_NO:
|
|
|
|
break;
|
|
|
|
case STORE_IF_EXISTS:
|
|
|
|
if (fil_space_get_flags(space)
|
|
|
|
== ULINT_UNDEFINED) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
/* fall through */
|
|
|
|
case STORE_YES:
|
|
|
|
recv_add_to_hash_table(
|
|
|
|
type, space, page_no, body,
|
|
|
|
ptr + len, old_lsn,
|
|
|
|
recv_sys->recovered_lsn);
|
|
|
|
}
|
|
|
|
/* fall through */
|
MDEV-12548 Initial implementation of Mariabackup for MariaDB 10.2
InnoDB I/O and buffer pool interfaces and the redo log format
have been changed between MariaDB 10.1 and 10.2, and the backup
code has to be adjusted accordingly.
The code has been simplified, and many memory leaks have been fixed.
Instead of the file name xtrabackup_logfile, the file name ib_logfile0
is being used for the copy of the redo log. Unnecessary InnoDB startup and
shutdown and some unnecessary threads have been removed.
Some help was provided by Vladislav Vaintroub.
Parameters have been cleaned up and aligned with those of MariaDB 10.2.
The --dbug option has been added, so that in debug builds,
--dbug=d,ib_log can be specified to enable diagnostic messages
for processing redo log entries.
By default, innodb_doublewrite=OFF, so that --prepare works faster.
If more crash-safety for --prepare is needed, double buffering
can be enabled.
The parameter innodb_log_checksums=OFF can be used to ignore redo log
checksums in --backup.
Some messages have been cleaned up.
Unless --export is specified, Mariabackup will not deal with undo log.
The InnoDB mini-transaction redo log is not only about user-level
transactions; it is actually about mini-transactions. To avoid confusion,
call it the redo log, not transaction log.
We disable any undo log processing in --prepare.
Because MariaDB 10.2 supports indexed virtual columns, the
undo log processing would need to be able to evaluate virtual column
expressions. To reduce the amount of code dependencies, we will not
process any undo log in prepare.
This means that the --export option must be disabled for now.
This also means that the following options are redundant
and have been removed:
xtrabackup --apply-log-only
innobackupex --redo-only
In addition to disabling any undo log processing, we will disable any
further changes to data pages during --prepare, including the change
buffer merge. This means that restoring incremental backups should
reliably work even when change buffering is being used on the server.
Because of this, preparing a backup will not generate any further
redo log, and the redo log file can be safely deleted. (If the
--export option is enabled in the future, it must generate redo log
when processing undo logs and buffered changes.)
In --prepare, we cannot easily know if a partial backup was used,
especially when restoring a series of incremental backups. So, we
simply warn about any missing files, and ignore the redo log for them.
FIXME: Enable the --export option.
FIXME: Improve the handling of the MLOG_INDEX_LOAD record, and write
a test that initiates a backup while an ALGORITHM=INPLACE operation
is creating indexes or rebuilding a table. An error should be detected
when preparing the backup.
FIXME: In --incremental --prepare, xtrabackup_apply_delta() should
ensure that if FSP_SIZE is modified, the file size will be adjusted
accordingly.
2017-06-30 10:49:37 +03:00
|
|
|
case MLOG_INDEX_LOAD:
|
2018-03-13 15:19:30 +05:30
|
|
|
if (type == MLOG_INDEX_LOAD) {
|
2018-08-09 15:06:52 +01:00
|
|
|
if (log_optimized_ddl_op) {
|
|
|
|
log_optimized_ddl_op(space);
|
2018-03-13 15:19:30 +05:30
|
|
|
}
|
|
|
|
}
|
MDEV-12548 Initial implementation of Mariabackup for MariaDB 10.2
InnoDB I/O and buffer pool interfaces and the redo log format
have been changed between MariaDB 10.1 and 10.2, and the backup
code has to be adjusted accordingly.
The code has been simplified, and many memory leaks have been fixed.
Instead of the file name xtrabackup_logfile, the file name ib_logfile0
is being used for the copy of the redo log. Unnecessary InnoDB startup and
shutdown and some unnecessary threads have been removed.
Some help was provided by Vladislav Vaintroub.
Parameters have been cleaned up and aligned with those of MariaDB 10.2.
The --dbug option has been added, so that in debug builds,
--dbug=d,ib_log can be specified to enable diagnostic messages
for processing redo log entries.
By default, innodb_doublewrite=OFF, so that --prepare works faster.
If more crash-safety for --prepare is needed, double buffering
can be enabled.
The parameter innodb_log_checksums=OFF can be used to ignore redo log
checksums in --backup.
Some messages have been cleaned up.
Unless --export is specified, Mariabackup will not deal with undo log.
The InnoDB mini-transaction redo log is not only about user-level
transactions; it is actually about mini-transactions. To avoid confusion,
call it the redo log, not transaction log.
We disable any undo log processing in --prepare.
Because MariaDB 10.2 supports indexed virtual columns, the
undo log processing would need to be able to evaluate virtual column
expressions. To reduce the amount of code dependencies, we will not
process any undo log in prepare.
This means that the --export option must be disabled for now.
This also means that the following options are redundant
and have been removed:
xtrabackup --apply-log-only
innobackupex --redo-only
In addition to disabling any undo log processing, we will disable any
further changes to data pages during --prepare, including the change
buffer merge. This means that restoring incremental backups should
reliably work even when change buffering is being used on the server.
Because of this, preparing a backup will not generate any further
redo log, and the redo log file can be safely deleted. (If the
--export option is enabled in the future, it must generate redo log
when processing undo logs and buffered changes.)
In --prepare, we cannot easily know if a partial backup was used,
especially when restoring a series of incremental backups. So, we
simply warn about any missing files, and ignore the redo log for them.
FIXME: Enable the --export option.
FIXME: Improve the handling of the MLOG_INDEX_LOAD record, and write
a test that initiates a backup while an ALGORITHM=INPLACE operation
is creating indexes or rebuilding a table. An error should be detected
when preparing the backup.
FIXME: In --incremental --prepare, xtrabackup_apply_delta() should
ensure that if FSP_SIZE is modified, the file size will be adjusted
accordingly.
2017-06-30 10:49:37 +03:00
|
|
|
/* fall through */
|
2017-03-01 23:43:37 +02:00
|
|
|
case MLOG_FILE_NAME:
|
|
|
|
case MLOG_FILE_DELETE:
|
|
|
|
case MLOG_FILE_CREATE2:
|
|
|
|
case MLOG_FILE_RENAME2:
|
|
|
|
case MLOG_TRUNCATE:
|
|
|
|
/* These were already handled by
|
|
|
|
recv_parse_log_rec() and
|
|
|
|
recv_parse_or_apply_log_rec_body(). */
|
2016-08-12 11:17:45 +03:00
|
|
|
DBUG_PRINT("ib_log",
|
2016-09-06 09:43:16 +03:00
|
|
|
("scan " LSN_PF ": log rec %s"
|
|
|
|
" len " ULINTPF
|
|
|
|
" page " ULINTPF ":" ULINTPF,
|
|
|
|
old_lsn, get_mlog_string(type),
|
|
|
|
len, space, page_no));
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
/* Check that all the records associated with the single mtr
|
|
|
|
are included within the buffer */
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ulint total_len = 0;
|
|
|
|
ulint n_recs = 0;
|
2017-01-10 10:48:56 +05:30
|
|
|
bool only_mlog_file = true;
|
|
|
|
ulint mlog_rec_len = 0;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
for (;;) {
|
2016-08-12 11:17:45 +03:00
|
|
|
len = recv_parse_log_rec(
|
|
|
|
&type, ptr, end_ptr, &space, &page_no,
|
|
|
|
false, &body);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (recv_sys->found_corrupt_log
|
|
|
|
|| type == MLOG_CHECKPOINT
|
2018-08-16 06:35:28 +03:00
|
|
|
|| (ptr != end_ptr
|
|
|
|
&& (*ptr & MLOG_SINGLE_REC_FLAG))) {
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_sys->found_corrupt_log = true;
|
|
|
|
recv_report_corrupt_log(
|
|
|
|
ptr, type, space, page_no);
|
|
|
|
return(true);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (recv_sys->found_corrupt_fs) {
|
|
|
|
return(true);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2018-08-16 06:35:28 +03:00
|
|
|
if (len == 0) {
|
|
|
|
return(false);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_previous_parsed_rec_type = type;
|
2014-02-26 19:11:54 +01:00
|
|
|
recv_previous_parsed_rec_offset
|
|
|
|
= recv_sys->recovered_offset + total_len;
|
|
|
|
recv_previous_parsed_rec_is_multi = 1;
|
|
|
|
|
2017-01-10 10:48:56 +05:30
|
|
|
/* MLOG_FILE_NAME redo log records doesn't make changes
|
|
|
|
to persistent data. If only MLOG_FILE_NAME redo
|
|
|
|
log record exists then reset the parsing buffer pointer
|
|
|
|
by changing recovered_lsn and recovered_offset. */
|
|
|
|
if (type != MLOG_FILE_NAME && only_mlog_file == true) {
|
|
|
|
only_mlog_file = false;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (only_mlog_file) {
|
|
|
|
new_recovered_lsn = recv_calc_lsn_on_data_add(
|
|
|
|
recv_sys->recovered_lsn, len);
|
|
|
|
mlog_rec_len += len;
|
|
|
|
recv_sys->recovered_offset += len;
|
|
|
|
recv_sys->recovered_lsn = new_recovered_lsn;
|
|
|
|
}
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
total_len += len;
|
|
|
|
n_recs++;
|
|
|
|
|
|
|
|
ptr += len;
|
|
|
|
|
|
|
|
if (type == MLOG_MULTI_REC_END) {
|
2016-08-12 11:17:45 +03:00
|
|
|
DBUG_PRINT("ib_log",
|
|
|
|
("scan " LSN_PF
|
|
|
|
": multi-log end"
|
|
|
|
" total_len " ULINTPF
|
|
|
|
" n=" ULINTPF,
|
|
|
|
recv_sys->recovered_lsn,
|
|
|
|
total_len, n_recs));
|
2017-01-10 10:48:56 +05:30
|
|
|
total_len -= mlog_rec_len;
|
2014-02-26 19:11:54 +01:00
|
|
|
break;
|
|
|
|
}
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
DBUG_PRINT("ib_log",
|
|
|
|
("scan " LSN_PF ": multi-log rec %s"
|
|
|
|
" len " ULINTPF
|
|
|
|
" page " ULINTPF ":" ULINTPF,
|
|
|
|
recv_sys->recovered_lsn,
|
|
|
|
get_mlog_string(type), len, space, page_no));
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
new_recovered_lsn = recv_calc_lsn_on_data_add(
|
|
|
|
recv_sys->recovered_lsn, total_len);
|
|
|
|
|
|
|
|
if (new_recovered_lsn > recv_sys->scanned_lsn) {
|
|
|
|
/* The log record filled a log block, and we require
|
|
|
|
that also the next log block should have been scanned
|
|
|
|
in */
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
return(false);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Add all the records to the hash table */
|
|
|
|
|
|
|
|
ptr = recv_sys->buf + recv_sys->recovered_offset;
|
|
|
|
|
|
|
|
for (;;) {
|
|
|
|
old_lsn = recv_sys->recovered_lsn;
|
2016-08-12 11:17:45 +03:00
|
|
|
/* This will apply MLOG_FILE_ records. We
|
|
|
|
had to skip them in the first scan, because we
|
|
|
|
did not know if the mini-transaction was
|
|
|
|
completely recovered (until MLOG_MULTI_REC_END). */
|
|
|
|
len = recv_parse_log_rec(
|
|
|
|
&type, ptr, end_ptr, &space, &page_no,
|
|
|
|
apply, &body);
|
|
|
|
|
|
|
|
if (recv_sys->found_corrupt_log
|
|
|
|
&& !recv_report_corrupt_log(
|
|
|
|
ptr, type, space, page_no)) {
|
|
|
|
return(true);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (recv_sys->found_corrupt_fs) {
|
|
|
|
return(true);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
ut_a(len != 0);
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_a(!(*ptr & MLOG_SINGLE_REC_FLAG));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
recv_sys->recovered_offset += len;
|
|
|
|
recv_sys->recovered_lsn
|
|
|
|
= recv_calc_lsn_on_data_add(old_lsn, len);
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
switch (type) {
|
|
|
|
case MLOG_MULTI_REC_END:
|
2014-02-26 19:11:54 +01:00
|
|
|
/* Found the end mark for the records */
|
2016-08-12 11:17:45 +03:00
|
|
|
goto loop;
|
2014-02-26 19:11:54 +01:00
|
|
|
#ifdef UNIV_LOG_LSN_DEBUG
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_LSN:
|
|
|
|
/* Do not add these records to the hash table.
|
|
|
|
The page number and space id fields are misused
|
|
|
|
for something else. */
|
|
|
|
break;
|
2014-02-26 19:11:54 +01:00
|
|
|
#endif /* UNIV_LOG_LSN_DEBUG */
|
MDEV-12548 Initial implementation of Mariabackup for MariaDB 10.2
InnoDB I/O and buffer pool interfaces and the redo log format
have been changed between MariaDB 10.1 and 10.2, and the backup
code has to be adjusted accordingly.
The code has been simplified, and many memory leaks have been fixed.
Instead of the file name xtrabackup_logfile, the file name ib_logfile0
is being used for the copy of the redo log. Unnecessary InnoDB startup and
shutdown and some unnecessary threads have been removed.
Some help was provided by Vladislav Vaintroub.
Parameters have been cleaned up and aligned with those of MariaDB 10.2.
The --dbug option has been added, so that in debug builds,
--dbug=d,ib_log can be specified to enable diagnostic messages
for processing redo log entries.
By default, innodb_doublewrite=OFF, so that --prepare works faster.
If more crash-safety for --prepare is needed, double buffering
can be enabled.
The parameter innodb_log_checksums=OFF can be used to ignore redo log
checksums in --backup.
Some messages have been cleaned up.
Unless --export is specified, Mariabackup will not deal with undo log.
The InnoDB mini-transaction redo log is not only about user-level
transactions; it is actually about mini-transactions. To avoid confusion,
call it the redo log, not transaction log.
We disable any undo log processing in --prepare.
Because MariaDB 10.2 supports indexed virtual columns, the
undo log processing would need to be able to evaluate virtual column
expressions. To reduce the amount of code dependencies, we will not
process any undo log in prepare.
This means that the --export option must be disabled for now.
This also means that the following options are redundant
and have been removed:
xtrabackup --apply-log-only
innobackupex --redo-only
In addition to disabling any undo log processing, we will disable any
further changes to data pages during --prepare, including the change
buffer merge. This means that restoring incremental backups should
reliably work even when change buffering is being used on the server.
Because of this, preparing a backup will not generate any further
redo log, and the redo log file can be safely deleted. (If the
--export option is enabled in the future, it must generate redo log
when processing undo logs and buffered changes.)
In --prepare, we cannot easily know if a partial backup was used,
especially when restoring a series of incremental backups. So, we
simply warn about any missing files, and ignore the redo log for them.
FIXME: Enable the --export option.
FIXME: Improve the handling of the MLOG_INDEX_LOAD record, and write
a test that initiates a backup while an ALGORITHM=INPLACE operation
is creating indexes or rebuilding a table. An error should be detected
when preparing the backup.
FIXME: In --incremental --prepare, xtrabackup_apply_delta() should
ensure that if FSP_SIZE is modified, the file size will be adjusted
accordingly.
2017-06-30 10:49:37 +03:00
|
|
|
case MLOG_INDEX_LOAD:
|
|
|
|
/* Mariabackup FIXME: Report an error
|
|
|
|
when encountering MLOG_INDEX_LOAD on
|
|
|
|
--prepare or already on --backup. */
|
|
|
|
ut_a(srv_operation == SRV_OPERATION_NORMAL);
|
|
|
|
break;
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_FILE_NAME:
|
|
|
|
case MLOG_FILE_DELETE:
|
|
|
|
case MLOG_FILE_CREATE2:
|
|
|
|
case MLOG_FILE_RENAME2:
|
|
|
|
case MLOG_TRUNCATE:
|
|
|
|
/* These were already handled by
|
|
|
|
recv_parse_log_rec() and
|
|
|
|
recv_parse_or_apply_log_rec_body(). */
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
switch (store) {
|
|
|
|
case STORE_NO:
|
|
|
|
break;
|
|
|
|
case STORE_IF_EXISTS:
|
|
|
|
if (fil_space_get_flags(space)
|
|
|
|
== ULINT_UNDEFINED) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
/* fall through */
|
|
|
|
case STORE_YES:
|
|
|
|
recv_add_to_hash_table(
|
|
|
|
type, space, page_no,
|
|
|
|
body, ptr + len,
|
|
|
|
old_lsn,
|
|
|
|
new_recovered_lsn);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
ptr += len;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
goto loop;
|
|
|
|
}
|
|
|
|
|
2018-03-13 15:19:30 +05:30
|
|
|
/** Adds data from a new log block to the parsing buffer of recv_sys if
|
2014-02-26 19:11:54 +01:00
|
|
|
recv_sys->parse_start_lsn is non-zero.
|
2018-03-13 15:19:30 +05:30
|
|
|
@param[in] log_block log block to add
|
|
|
|
@param[in] scanned_lsn lsn of how far we were able to find
|
|
|
|
data in this log block
|
2016-08-12 11:17:45 +03:00
|
|
|
@return true if more data added */
|
2018-03-13 15:19:30 +05:30
|
|
|
bool recv_sys_add_to_parsing_buf(const byte* log_block, lsn_t scanned_lsn)
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
|
|
|
ulint more_len;
|
|
|
|
ulint data_len;
|
|
|
|
ulint start_offset;
|
|
|
|
ulint end_offset;
|
|
|
|
|
|
|
|
ut_ad(scanned_lsn >= recv_sys->scanned_lsn);
|
|
|
|
|
|
|
|
if (!recv_sys->parse_start_lsn) {
|
|
|
|
/* Cannot start parsing yet because no start point for
|
|
|
|
it found */
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
return(false);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
data_len = log_block_get_data_len(log_block);
|
|
|
|
|
|
|
|
if (recv_sys->parse_start_lsn >= scanned_lsn) {
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
return(false);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
} else if (recv_sys->scanned_lsn >= scanned_lsn) {
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
return(false);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
} else if (recv_sys->parse_start_lsn > recv_sys->scanned_lsn) {
|
|
|
|
more_len = (ulint) (scanned_lsn - recv_sys->parse_start_lsn);
|
|
|
|
} else {
|
|
|
|
more_len = (ulint) (scanned_lsn - recv_sys->scanned_lsn);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (more_len == 0) {
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
return(false);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
ut_ad(data_len >= more_len);
|
|
|
|
|
|
|
|
start_offset = data_len - more_len;
|
|
|
|
|
|
|
|
if (start_offset < LOG_BLOCK_HDR_SIZE) {
|
|
|
|
start_offset = LOG_BLOCK_HDR_SIZE;
|
|
|
|
}
|
|
|
|
|
|
|
|
end_offset = data_len;
|
|
|
|
|
|
|
|
if (end_offset > OS_FILE_LOG_BLOCK_SIZE - LOG_BLOCK_TRL_SIZE) {
|
|
|
|
end_offset = OS_FILE_LOG_BLOCK_SIZE - LOG_BLOCK_TRL_SIZE;
|
|
|
|
}
|
|
|
|
|
|
|
|
ut_ad(start_offset <= end_offset);
|
|
|
|
|
|
|
|
if (start_offset < end_offset) {
|
|
|
|
ut_memcpy(recv_sys->buf + recv_sys->len,
|
|
|
|
log_block + start_offset, end_offset - start_offset);
|
|
|
|
|
|
|
|
recv_sys->len += end_offset - start_offset;
|
|
|
|
|
|
|
|
ut_a(recv_sys->len <= RECV_PARSING_BUF_SIZE);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
return(true);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2018-03-13 15:19:30 +05:30
|
|
|
/** Moves the parsing buffer data left to the buffer start. */
|
|
|
|
void recv_sys_justify_left_parsing_buf()
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
|
|
|
ut_memmove(recv_sys->buf, recv_sys->buf + recv_sys->recovered_offset,
|
|
|
|
recv_sys->len - recv_sys->recovered_offset);
|
|
|
|
|
|
|
|
recv_sys->len -= recv_sys->recovered_offset;
|
|
|
|
|
|
|
|
recv_sys->recovered_offset = 0;
|
|
|
|
}
|
|
|
|
|
2016-12-30 15:04:10 +02:00
|
|
|
/** Scan redo log from a buffer and stores new log data to the parsing buffer.
|
|
|
|
Parse and hash the log records if new data found.
|
|
|
|
Apply log records automatically when the hash table becomes full.
|
2016-08-12 11:17:45 +03:00
|
|
|
@return true if not able to scan any more in this log group */
|
|
|
|
static
|
|
|
|
bool
|
2014-02-26 19:11:54 +01:00
|
|
|
recv_scan_log_recs(
|
|
|
|
/*===============*/
|
|
|
|
ulint available_memory,/*!< in: we let the hash table of recs
|
|
|
|
to grow to this size, at the maximum */
|
2016-08-12 11:17:45 +03:00
|
|
|
store_t* store_to_hash, /*!< in,out: whether the records should be
|
|
|
|
stored to the hash table; this is reset
|
|
|
|
if just debug checking is needed, or
|
|
|
|
when the available_memory runs out */
|
2017-03-11 15:20:33 +02:00
|
|
|
const byte* log_block, /*!< in: log segment */
|
2016-08-12 11:17:45 +03:00
|
|
|
lsn_t checkpoint_lsn, /*!< in: latest checkpoint LSN */
|
2017-03-11 15:20:33 +02:00
|
|
|
lsn_t start_lsn, /*!< in: buffer start LSN */
|
|
|
|
lsn_t end_lsn, /*!< in: buffer end LSN */
|
2014-02-26 19:11:54 +01:00
|
|
|
lsn_t* contiguous_lsn, /*!< in/out: it is known that all log
|
|
|
|
groups contain contiguous log data up
|
|
|
|
to this lsn */
|
2017-02-10 12:11:42 +02:00
|
|
|
lsn_t* group_scanned_lsn)/*!< out: scanning succeeded up to
|
2014-02-26 19:11:54 +01:00
|
|
|
this lsn */
|
|
|
|
{
|
2016-08-12 11:17:45 +03:00
|
|
|
lsn_t scanned_lsn = start_lsn;
|
|
|
|
bool finished = false;
|
2014-02-26 19:11:54 +01:00
|
|
|
ulint data_len;
|
2016-08-12 11:17:45 +03:00
|
|
|
bool more_data = false;
|
|
|
|
bool apply = recv_sys->mlog_checkpoint_lsn != 0;
|
2017-01-10 10:48:56 +05:30
|
|
|
ulint recv_parsing_buf_size = RECV_PARSING_BUF_SIZE;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
ut_ad(start_lsn % OS_FILE_LOG_BLOCK_SIZE == 0);
|
2017-03-11 15:20:33 +02:00
|
|
|
ut_ad(end_lsn % OS_FILE_LOG_BLOCK_SIZE == 0);
|
|
|
|
ut_ad(end_lsn >= start_lsn + OS_FILE_LOG_BLOCK_SIZE);
|
|
|
|
|
|
|
|
const byte* const log_end = log_block
|
|
|
|
+ ulint(end_lsn - start_lsn);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
do {
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(!finished);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (log_block_get_flush_bit(log_block)) {
|
|
|
|
/* This block was a start of a log flush operation:
|
|
|
|
we know that the previous flush operation must have
|
|
|
|
been completed for all log groups before this block
|
|
|
|
can have been flushed to any of the groups. Therefore,
|
|
|
|
we know that log data is contiguous up to scanned_lsn
|
|
|
|
in all non-corrupt log groups. */
|
|
|
|
|
|
|
|
if (scanned_lsn > *contiguous_lsn) {
|
|
|
|
*contiguous_lsn = scanned_lsn;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
data_len = log_block_get_data_len(log_block);
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (scanned_lsn + data_len > recv_sys->scanned_lsn
|
|
|
|
&& log_block_get_checkpoint_no(log_block)
|
|
|
|
< recv_sys->scanned_checkpoint_no
|
2014-02-26 19:11:54 +01:00
|
|
|
&& (recv_sys->scanned_checkpoint_no
|
|
|
|
- log_block_get_checkpoint_no(log_block)
|
|
|
|
> 0x80000000UL)) {
|
|
|
|
|
|
|
|
/* Garbage from a log buffer flush which was made
|
|
|
|
before the most recent database recovery */
|
2016-08-12 11:17:45 +03:00
|
|
|
finished = true;
|
2014-02-26 19:11:54 +01:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!recv_sys->parse_start_lsn
|
|
|
|
&& (log_block_get_first_rec_group(log_block) > 0)) {
|
|
|
|
|
|
|
|
/* We found a point from which to start the parsing
|
|
|
|
of log records */
|
|
|
|
|
|
|
|
recv_sys->parse_start_lsn = scanned_lsn
|
|
|
|
+ log_block_get_first_rec_group(log_block);
|
|
|
|
recv_sys->scanned_lsn = recv_sys->parse_start_lsn;
|
|
|
|
recv_sys->recovered_lsn = recv_sys->parse_start_lsn;
|
|
|
|
}
|
|
|
|
|
|
|
|
scanned_lsn += data_len;
|
|
|
|
|
2017-06-28 11:58:43 +03:00
|
|
|
if (data_len == LOG_BLOCK_HDR_SIZE + SIZE_OF_MLOG_CHECKPOINT
|
|
|
|
&& scanned_lsn == checkpoint_lsn + SIZE_OF_MLOG_CHECKPOINT
|
|
|
|
&& log_block[LOG_BLOCK_HDR_SIZE] == MLOG_CHECKPOINT
|
|
|
|
&& checkpoint_lsn == mach_read_from_8(LOG_BLOCK_HDR_SIZE
|
|
|
|
+ 1 + log_block)) {
|
|
|
|
/* The redo log is logically empty. */
|
|
|
|
ut_ad(recv_sys->mlog_checkpoint_lsn == 0
|
|
|
|
|| recv_sys->mlog_checkpoint_lsn
|
|
|
|
== checkpoint_lsn);
|
|
|
|
recv_sys->mlog_checkpoint_lsn = checkpoint_lsn;
|
|
|
|
DBUG_PRINT("ib_log", ("found empty log; LSN=" LSN_PF,
|
|
|
|
scanned_lsn));
|
|
|
|
finished = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
if (scanned_lsn > recv_sys->scanned_lsn) {
|
2017-06-28 11:58:43 +03:00
|
|
|
ut_ad(!srv_log_files_created);
|
2016-08-12 11:17:45 +03:00
|
|
|
if (!recv_needed_recovery) {
|
2017-03-01 23:43:37 +02:00
|
|
|
recv_needed_recovery = true;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-03-01 23:43:37 +02:00
|
|
|
if (srv_read_only_mode) {
|
2017-01-25 15:11:46 +02:00
|
|
|
ib::warn() << "innodb_read_only"
|
|
|
|
" prevents crash recovery";
|
2016-08-12 11:17:45 +03:00
|
|
|
return(true);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
2017-03-01 23:43:37 +02:00
|
|
|
|
2017-03-07 17:16:49 +02:00
|
|
|
ib::info() << "Starting crash recovery from"
|
|
|
|
" checkpoint LSN="
|
2017-03-01 23:43:37 +02:00
|
|
|
<< recv_sys->scanned_lsn;
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
/* We were able to find more log data: add it to the
|
|
|
|
parsing buffer if parse_start_lsn is already
|
|
|
|
non-zero */
|
|
|
|
|
2017-01-10 10:48:56 +05:30
|
|
|
DBUG_EXECUTE_IF(
|
|
|
|
"reduce_recv_parsing_buf",
|
|
|
|
recv_parsing_buf_size
|
|
|
|
= (70 * 1024);
|
|
|
|
);
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
if (recv_sys->len + 4 * OS_FILE_LOG_BLOCK_SIZE
|
2017-01-10 10:48:56 +05:30
|
|
|
>= recv_parsing_buf_size) {
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::error() << "Log parsing buffer overflow."
|
|
|
|
" Recovery may have failed!";
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_sys->found_corrupt_log = true;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (!srv_force_recovery) {
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::error()
|
|
|
|
<< "Set innodb_force_recovery"
|
|
|
|
" to ignore this error.";
|
2016-09-06 09:43:16 +03:00
|
|
|
return(true);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
} else if (!recv_sys->found_corrupt_log) {
|
|
|
|
more_data = recv_sys_add_to_parsing_buf(
|
|
|
|
log_block, scanned_lsn);
|
|
|
|
}
|
|
|
|
|
|
|
|
recv_sys->scanned_lsn = scanned_lsn;
|
|
|
|
recv_sys->scanned_checkpoint_no
|
|
|
|
= log_block_get_checkpoint_no(log_block);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (data_len < OS_FILE_LOG_BLOCK_SIZE) {
|
|
|
|
/* Log data for this group ends here */
|
2016-08-12 11:17:45 +03:00
|
|
|
finished = true;
|
2014-02-26 19:11:54 +01:00
|
|
|
break;
|
|
|
|
} else {
|
|
|
|
log_block += OS_FILE_LOG_BLOCK_SIZE;
|
|
|
|
}
|
2017-03-11 15:20:33 +02:00
|
|
|
} while (log_block < log_end);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
*group_scanned_lsn = scanned_lsn;
|
|
|
|
|
|
|
|
if (more_data && !recv_sys->found_corrupt_log) {
|
|
|
|
/* Try to parse more log records */
|
|
|
|
|
2017-02-10 12:11:42 +02:00
|
|
|
if (recv_parse_log_recs(checkpoint_lsn,
|
|
|
|
*store_to_hash, apply)) {
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(recv_sys->found_corrupt_log
|
|
|
|
|| recv_sys->found_corrupt_fs
|
|
|
|
|| recv_sys->mlog_checkpoint_lsn
|
|
|
|
== recv_sys->recovered_lsn);
|
|
|
|
return(true);
|
|
|
|
}
|
2015-09-29 15:15:28 +03:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (*store_to_hash != STORE_NO
|
|
|
|
&& mem_heap_get_size(recv_sys->heap) > available_memory) {
|
2018-03-27 13:47:56 +05:30
|
|
|
|
|
|
|
DBUG_PRINT("ib_log", ("Ran out of memory and last "
|
|
|
|
"stored lsn " LSN_PF,
|
|
|
|
recv_sys->recovered_lsn));
|
|
|
|
|
|
|
|
recv_sys->last_stored_lsn = recv_sys->recovered_lsn;
|
2016-08-12 11:17:45 +03:00
|
|
|
*store_to_hash = STORE_NO;
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2017-01-10 10:48:56 +05:30
|
|
|
if (recv_sys->recovered_offset > recv_parsing_buf_size / 4) {
|
2014-02-26 19:11:54 +01:00
|
|
|
/* Move parsing buffer data to the buffer start */
|
|
|
|
|
|
|
|
recv_sys_justify_left_parsing_buf();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return(finished);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Scans log from a buffer and stores new log data to the parsing buffer.
|
|
|
|
Parses and hashes the log records if new data found.
|
|
|
|
@param[in,out] group log group
|
2017-03-01 23:43:37 +02:00
|
|
|
@param[in] checkpoint_lsn latest checkpoint log sequence number
|
2016-08-12 11:17:45 +03:00
|
|
|
@param[in,out] contiguous_lsn log sequence number
|
|
|
|
until which all redo log has been scanned
|
|
|
|
@param[in] last_phase whether changes
|
|
|
|
can be applied to the tablespaces
|
|
|
|
@return whether rescan is needed (not everything was stored) */
|
2014-02-26 19:11:54 +01:00
|
|
|
static
|
2016-08-12 11:17:45 +03:00
|
|
|
bool
|
2014-02-26 19:11:54 +01:00
|
|
|
recv_group_scan_log_recs(
|
2016-08-12 11:17:45 +03:00
|
|
|
log_group_t* group,
|
2017-03-01 23:43:37 +02:00
|
|
|
lsn_t checkpoint_lsn,
|
2016-08-12 11:17:45 +03:00
|
|
|
lsn_t* contiguous_lsn,
|
2017-02-10 12:11:42 +02:00
|
|
|
bool last_phase)
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
2016-08-12 11:17:45 +03:00
|
|
|
DBUG_ENTER("recv_group_scan_log_recs");
|
|
|
|
DBUG_ASSERT(!last_phase || recv_sys->mlog_checkpoint_lsn > 0);
|
|
|
|
|
|
|
|
mutex_enter(&recv_sys->mutex);
|
|
|
|
recv_sys->len = 0;
|
|
|
|
recv_sys->recovered_offset = 0;
|
|
|
|
recv_sys->n_addrs = 0;
|
|
|
|
recv_sys_empty_hash();
|
|
|
|
srv_start_lsn = *contiguous_lsn;
|
|
|
|
recv_sys->parse_start_lsn = *contiguous_lsn;
|
|
|
|
recv_sys->scanned_lsn = *contiguous_lsn;
|
|
|
|
recv_sys->recovered_lsn = *contiguous_lsn;
|
|
|
|
recv_sys->scanned_checkpoint_no = 0;
|
|
|
|
recv_previous_parsed_rec_type = MLOG_SINGLE_REC_FLAG;
|
|
|
|
recv_previous_parsed_rec_offset = 0;
|
|
|
|
recv_previous_parsed_rec_is_multi = 0;
|
|
|
|
ut_ad(recv_max_page_lsn == 0);
|
|
|
|
ut_ad(last_phase || !recv_writer_thread_active);
|
|
|
|
mutex_exit(&recv_sys->mutex);
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
lsn_t start_lsn;
|
|
|
|
lsn_t end_lsn;
|
2016-08-12 11:17:45 +03:00
|
|
|
store_t store_to_hash = recv_sys->mlog_checkpoint_lsn == 0
|
|
|
|
? STORE_NO : (last_phase ? STORE_IF_EXISTS : STORE_YES);
|
|
|
|
ulint available_mem = UNIV_PAGE_SIZE
|
|
|
|
* (buf_pool_get_n_pages()
|
|
|
|
- (recv_n_pool_free_frames * srv_buf_pool_instances));
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-02-10 12:11:42 +02:00
|
|
|
group->scanned_lsn = end_lsn = *contiguous_lsn = ut_uint64_align_down(
|
2016-08-12 11:17:45 +03:00
|
|
|
*contiguous_lsn, OS_FILE_LOG_BLOCK_SIZE);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
do {
|
|
|
|
if (last_phase && store_to_hash == STORE_NO) {
|
|
|
|
store_to_hash = STORE_IF_EXISTS;
|
|
|
|
/* We must not allow change buffer
|
|
|
|
merge here, because it would generate
|
|
|
|
redo log records before we have
|
|
|
|
finished the redo log scan. */
|
2017-03-07 17:16:49 +02:00
|
|
|
recv_apply_hashed_log_recs(false);
|
2015-08-07 15:21:20 +03:00
|
|
|
}
|
|
|
|
|
2017-11-09 16:25:16 +00:00
|
|
|
start_lsn = ut_uint64_align_down(end_lsn,
|
|
|
|
OS_FILE_LOG_BLOCK_SIZE);
|
2017-11-29 22:56:23 +00:00
|
|
|
end_lsn = start_lsn;
|
|
|
|
log_group_read_log_seg(
|
|
|
|
log_sys->buf, group, &end_lsn,
|
2017-02-10 12:11:42 +02:00
|
|
|
start_lsn + RECV_SCAN_SIZE);
|
|
|
|
} while (end_lsn != start_lsn
|
|
|
|
&& !recv_scan_log_recs(
|
2016-08-12 11:17:45 +03:00
|
|
|
available_mem, &store_to_hash, log_sys->buf,
|
|
|
|
checkpoint_lsn,
|
2017-03-11 15:20:33 +02:00
|
|
|
start_lsn, end_lsn,
|
|
|
|
contiguous_lsn, &group->scanned_lsn));
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
if (recv_sys->found_corrupt_log || recv_sys->found_corrupt_fs) {
|
|
|
|
DBUG_RETURN(false);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
DBUG_PRINT("ib_log", ("%s " LSN_PF " completed",
|
2016-08-12 11:17:45 +03:00
|
|
|
last_phase ? "rescan" : "scan",
|
2017-05-26 14:04:19 +03:00
|
|
|
group->scanned_lsn));
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
DBUG_RETURN(store_to_hash == STORE_NO);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Report a missing tablespace for which page-redo log exists.
|
|
|
|
@param[in] err previous error code
|
|
|
|
@param[in] i tablespace descriptor
|
|
|
|
@return new error code */
|
|
|
|
static
|
2014-02-26 19:11:54 +01:00
|
|
|
dberr_t
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_init_missing_space(dberr_t err, const recv_spaces_t::const_iterator& i)
|
|
|
|
{
|
2017-10-10 10:28:54 +03:00
|
|
|
if (srv_operation == SRV_OPERATION_RESTORE
|
|
|
|
|| srv_operation == SRV_OPERATION_RESTORE_EXPORT) {
|
MDEV-12548 Initial implementation of Mariabackup for MariaDB 10.2
InnoDB I/O and buffer pool interfaces and the redo log format
have been changed between MariaDB 10.1 and 10.2, and the backup
code has to be adjusted accordingly.
The code has been simplified, and many memory leaks have been fixed.
Instead of the file name xtrabackup_logfile, the file name ib_logfile0
is being used for the copy of the redo log. Unnecessary InnoDB startup and
shutdown and some unnecessary threads have been removed.
Some help was provided by Vladislav Vaintroub.
Parameters have been cleaned up and aligned with those of MariaDB 10.2.
The --dbug option has been added, so that in debug builds,
--dbug=d,ib_log can be specified to enable diagnostic messages
for processing redo log entries.
By default, innodb_doublewrite=OFF, so that --prepare works faster.
If more crash-safety for --prepare is needed, double buffering
can be enabled.
The parameter innodb_log_checksums=OFF can be used to ignore redo log
checksums in --backup.
Some messages have been cleaned up.
Unless --export is specified, Mariabackup will not deal with undo log.
The InnoDB mini-transaction redo log is not only about user-level
transactions; it is actually about mini-transactions. To avoid confusion,
call it the redo log, not transaction log.
We disable any undo log processing in --prepare.
Because MariaDB 10.2 supports indexed virtual columns, the
undo log processing would need to be able to evaluate virtual column
expressions. To reduce the amount of code dependencies, we will not
process any undo log in prepare.
This means that the --export option must be disabled for now.
This also means that the following options are redundant
and have been removed:
xtrabackup --apply-log-only
innobackupex --redo-only
In addition to disabling any undo log processing, we will disable any
further changes to data pages during --prepare, including the change
buffer merge. This means that restoring incremental backups should
reliably work even when change buffering is being used on the server.
Because of this, preparing a backup will not generate any further
redo log, and the redo log file can be safely deleted. (If the
--export option is enabled in the future, it must generate redo log
when processing undo logs and buffered changes.)
In --prepare, we cannot easily know if a partial backup was used,
especially when restoring a series of incremental backups. So, we
simply warn about any missing files, and ignore the redo log for them.
FIXME: Enable the --export option.
FIXME: Improve the handling of the MLOG_INDEX_LOAD record, and write
a test that initiates a backup while an ALGORITHM=INPLACE operation
is creating indexes or rebuilding a table. An error should be detected
when preparing the backup.
FIXME: In --incremental --prepare, xtrabackup_apply_delta() should
ensure that if FSP_SIZE is modified, the file size will be adjusted
accordingly.
2017-06-30 10:49:37 +03:00
|
|
|
ib::warn() << "Tablespace " << i->first << " was not"
|
|
|
|
" found at " << i->second.name << " when"
|
|
|
|
" restoring a (partial?) backup. All redo log"
|
|
|
|
" for this file will be ignored!";
|
|
|
|
return(err);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (srv_force_recovery == 0) {
|
|
|
|
ib::error() << "Tablespace " << i->first << " was not"
|
|
|
|
" found at " << i->second.name << ".";
|
|
|
|
|
|
|
|
if (err == DB_SUCCESS) {
|
|
|
|
ib::error() << "Set innodb_force_recovery=1 to"
|
|
|
|
" ignore this and to permanently lose"
|
|
|
|
" all changes to the tablespace.";
|
|
|
|
err = DB_TABLESPACE_NOT_FOUND;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
ib::warn() << "Tablespace " << i->first << " was not"
|
|
|
|
" found at " << i->second.name << ", and"
|
|
|
|
" innodb_force_recovery was set. All redo log"
|
|
|
|
" for this tablespace will be ignored!";
|
|
|
|
}
|
|
|
|
|
|
|
|
return(err);
|
|
|
|
}
|
|
|
|
|
2018-03-27 13:47:56 +05:30
|
|
|
/** Report the missing tablespace and discard the redo logs for the deleted
|
|
|
|
tablespace.
|
|
|
|
@param[in] rescan rescan of redo logs is needed
|
|
|
|
if hash table ran out of memory
|
|
|
|
@param[out] missing_tablespace missing tablespace exists or not
|
|
|
|
@return error code or DB_SUCCESS. */
|
|
|
|
static MY_ATTRIBUTE((warn_unused_result))
|
|
|
|
dberr_t
|
|
|
|
recv_validate_tablespace(bool rescan, bool& missing_tablespace)
|
|
|
|
{
|
|
|
|
dberr_t err = DB_SUCCESS;
|
|
|
|
|
|
|
|
for (ulint h = 0; h < hash_get_n_cells(recv_sys->addr_hash); h++) {
|
|
|
|
for (recv_addr_t* recv_addr = static_cast<recv_addr_t*>(
|
2018-03-28 20:40:09 +03:00
|
|
|
HASH_GET_FIRST(recv_sys->addr_hash, h));
|
|
|
|
recv_addr != 0;
|
|
|
|
recv_addr = static_cast<recv_addr_t*>(
|
|
|
|
HASH_GET_NEXT(addr_hash, recv_addr))) {
|
2018-03-27 13:47:56 +05:30
|
|
|
|
|
|
|
const ulint space = recv_addr->space;
|
|
|
|
|
|
|
|
if (is_predefined_tablespace(space)) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2018-03-28 20:40:09 +03:00
|
|
|
recv_spaces_t::iterator i = recv_spaces.find(space);
|
2018-03-27 13:47:56 +05:30
|
|
|
ut_ad(i != recv_spaces.end());
|
|
|
|
|
2018-03-28 20:40:09 +03:00
|
|
|
switch (i->second.status) {
|
2018-03-27 13:47:56 +05:30
|
|
|
case file_name_t::MISSING:
|
|
|
|
err = recv_init_missing_space(err, i);
|
|
|
|
i->second.status = file_name_t::DELETED;
|
2018-03-28 20:40:09 +03:00
|
|
|
/* fall through */
|
2018-03-27 13:47:56 +05:30
|
|
|
case file_name_t::DELETED:
|
|
|
|
recv_addr->state = RECV_DISCARDED;
|
2018-03-28 20:40:09 +03:00
|
|
|
/* fall through */
|
2018-03-27 13:47:56 +05:30
|
|
|
case file_name_t::NORMAL:
|
2018-03-28 20:40:09 +03:00
|
|
|
continue;
|
2018-03-27 13:47:56 +05:30
|
|
|
}
|
2018-03-28 20:40:09 +03:00
|
|
|
ut_ad(0);
|
2018-03-27 13:47:56 +05:30
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (err != DB_SUCCESS) {
|
|
|
|
return(err);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* When rescan is not needed then recv_sys->addr_hash will have
|
|
|
|
all space id belongs to redo log. If rescan is needed and
|
|
|
|
innodb_force_recovery > 0 then InnoDB can ignore missing tablespace. */
|
|
|
|
for (recv_spaces_t::iterator i = recv_spaces.begin();
|
|
|
|
i != recv_spaces.end(); i++) {
|
|
|
|
|
|
|
|
if (i->second.status != file_name_t::MISSING) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
missing_tablespace = true;
|
|
|
|
|
|
|
|
if (srv_force_recovery > 0) {
|
|
|
|
ib::warn() << "Tablespace " << i->first
|
|
|
|
<<" was not found at " << i->second.name
|
|
|
|
<<", and innodb_force_recovery was set."
|
|
|
|
<<" All redo log for this tablespace"
|
|
|
|
<<" will be ignored!";
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!rescan) {
|
|
|
|
ib::info() << "Tablespace " << i->first
|
|
|
|
<< " was not found at '"
|
|
|
|
<< i->second.name << "', but there"
|
|
|
|
<<" were no modifications either.";
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!rescan || srv_force_recovery > 0) {
|
|
|
|
missing_tablespace = false;
|
|
|
|
}
|
|
|
|
|
|
|
|
return DB_SUCCESS;
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Check if all tablespaces were found for crash recovery.
|
2018-03-27 13:47:56 +05:30
|
|
|
@param[in] rescan rescan of redo logs is needed
|
|
|
|
@param[out] missing_tablespace missing table exists
|
2016-08-12 11:17:45 +03:00
|
|
|
@return error code or DB_SUCCESS */
|
2016-09-06 09:43:16 +03:00
|
|
|
static MY_ATTRIBUTE((warn_unused_result))
|
2016-08-12 11:17:45 +03:00
|
|
|
dberr_t
|
2018-03-27 13:47:56 +05:30
|
|
|
recv_init_crash_recovery_spaces(bool rescan, bool& missing_tablespace)
|
2016-08-12 11:17:45 +03:00
|
|
|
{
|
|
|
|
bool flag_deleted = false;
|
|
|
|
|
|
|
|
ut_ad(!srv_read_only_mode);
|
|
|
|
ut_ad(recv_needed_recovery);
|
|
|
|
|
|
|
|
for (recv_spaces_t::iterator i = recv_spaces.begin();
|
|
|
|
i != recv_spaces.end(); i++) {
|
|
|
|
ut_ad(!is_predefined_tablespace(i->first));
|
2018-03-27 13:47:56 +05:30
|
|
|
ut_ad(i->second.status != file_name_t::DELETED || !i->second.space);
|
2016-08-12 11:17:45 +03:00
|
|
|
|
2018-03-27 13:47:56 +05:30
|
|
|
if (i->second.status == file_name_t::DELETED) {
|
2016-08-12 11:17:45 +03:00
|
|
|
/* The tablespace was deleted,
|
|
|
|
so we can ignore any redo log for it. */
|
|
|
|
flag_deleted = true;
|
|
|
|
} else if (i->second.space != NULL) {
|
|
|
|
/* The tablespace was found, and there
|
|
|
|
are some redo log records for it. */
|
|
|
|
fil_names_dirty(i->second.space);
|
2017-03-01 23:43:37 +02:00
|
|
|
} else if (i->second.name == "") {
|
|
|
|
ib::error() << "Missing MLOG_FILE_NAME"
|
|
|
|
" or MLOG_FILE_DELETE"
|
|
|
|
" before MLOG_CHECKPOINT for tablespace "
|
|
|
|
<< i->first;
|
|
|
|
recv_sys->found_corrupt_log = true;
|
|
|
|
return(DB_CORRUPTION);
|
2016-08-12 11:17:45 +03:00
|
|
|
} else {
|
2018-03-27 13:47:56 +05:30
|
|
|
i->second.status = file_name_t::MISSING;
|
2016-08-12 11:17:45 +03:00
|
|
|
flag_deleted = true;
|
|
|
|
}
|
2017-03-03 14:43:45 +02:00
|
|
|
|
2018-03-27 13:47:56 +05:30
|
|
|
ut_ad(i->second.status == file_name_t::DELETED || i->second.name != "");
|
2016-08-12 11:17:45 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
if (flag_deleted) {
|
2018-03-27 13:47:56 +05:30
|
|
|
return recv_validate_tablespace(rescan, missing_tablespace);
|
2016-08-12 11:17:45 +03:00
|
|
|
}
|
|
|
|
|
2018-03-27 13:47:56 +05:30
|
|
|
return DB_SUCCESS;
|
2016-08-12 11:17:45 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
/** Start recovering from a redo log checkpoint.
|
|
|
|
@see recv_recovery_from_checkpoint_finish
|
|
|
|
@param[in] flush_lsn FIL_PAGE_FILE_FLUSH_LSN
|
|
|
|
of first system tablespace page
|
|
|
|
@return error code or DB_SUCCESS */
|
|
|
|
dberr_t
|
2017-05-26 14:04:19 +03:00
|
|
|
recv_recovery_from_checkpoint_start(lsn_t flush_lsn)
|
2014-02-26 19:11:54 +01:00
|
|
|
{
|
|
|
|
ulint max_cp_field;
|
|
|
|
lsn_t checkpoint_lsn;
|
2016-08-12 11:17:45 +03:00
|
|
|
bool rescan;
|
2014-02-26 19:11:54 +01:00
|
|
|
ib_uint64_t checkpoint_no;
|
|
|
|
lsn_t contiguous_lsn;
|
|
|
|
byte* buf;
|
2016-08-12 11:17:45 +03:00
|
|
|
dberr_t err = DB_SUCCESS;
|
|
|
|
|
2017-07-07 18:29:31 +03:00
|
|
|
ut_ad(srv_operation == SRV_OPERATION_NORMAL
|
2017-10-10 10:28:54 +03:00
|
|
|
|| srv_operation == SRV_OPERATION_RESTORE
|
|
|
|
|| srv_operation == SRV_OPERATION_RESTORE_EXPORT);
|
2017-07-07 18:29:31 +03:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/* Initialize red-black tree for fast insertions into the
|
|
|
|
flush_list during recovery process. */
|
|
|
|
buf_flush_init_flush_rbt();
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
if (srv_force_recovery >= SRV_FORCE_NO_LOG_REDO) {
|
|
|
|
|
2017-02-10 12:11:42 +02:00
|
|
|
ib::info() << "innodb_force_recovery=6 skips redo log apply";
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
return(DB_SUCCESS);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_recovery_on = true;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
log_mutex_enter();
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/* Look for the latest checkpoint from any of the log groups */
|
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
err = recv_find_max_checkpoint(&max_cp_field);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
MDEV-14717: Prevent crash-downgrade to earlier MariaDB 10.2
A crash-downgrade of a RENAME (or TRUNCATE or table-rebuilding
ALTER TABLE or OPTIMIZE TABLE) operation to an earlier 10.2 version
would trigger a debug assertion failure during rollback,
in trx_roll_pop_top_rec_of_trx(). In a non-debug build, the
TRX_UNDO_RENAME_TABLE record would be misinterpreted as an
update_undo log record, and typically the file name would be
interpreted as DB_TRX_ID,DB_ROLL_PTR,PRIMARY KEY. If a matching
record would be found, row_undo_mod() would hit ut_error in
switch (node->rec_type). Typically, ut_a(table2 == NULL) would
fail when opening the table from SQL.
Because of this, we prevent a crash-downgrade to earlier MariaDB 10.2
versions by changing the InnoDB redo log format identifier to the
10.3 identifier, and by introducing a subformat identifier so that
10.2 can continue to refuse crash-downgrade from 10.3 or later.
After a clean shutdown, a downgrade to MariaDB 10.2.13 or later would
still be possible thanks to MDEV-14909. A downgrade to older 10.2
versions is only possible after removing the log files (not recommended).
LOG_HEADER_FORMAT_CURRENT: Change to 103 (originally the 10.3 format).
log_group_t: Add subformat. For 10.2, we will use subformat 1,
and will refuse crash recovery from any other subformat of the
10.3 format, that is, a genuine 10.3 redo log.
recv_find_max_checkpoint(): Allow startup after clean shutdown
from a future LOG_HEADER_FORMAT_10_4 (unencrypted only).
We cannot handle the encrypted 10.4 redo log block format,
which was introduced in MDEV-12041. Allow crash recovery from
the original 10.2 format as well as the new format.
In Mariabackup --backup, do not allow any startup from 10.3 or 10.4
redo logs.
recv_recovery_from_checkpoint_start(): Skip redo log apply for
clean 10.3 redo log, but not for the new 10.2 redo log
(10.3 format, subformat 1).
srv_prepare_to_delete_redo_log_files(): On format or subformat
mismatch, set srv_log_file_size = 0, so that we will display the
correct message.
innobase_start_or_create_for_mysql(): Check for format or subformat
mismatch.
xtrabackup_backup_func(): Remove debug assertions that were made
redundant by the code changes in recv_find_max_checkpoint().
2018-09-07 17:24:31 +03:00
|
|
|
if (err != DB_SUCCESS) {
|
|
|
|
skip_apply:
|
2016-08-12 11:17:45 +03:00
|
|
|
log_mutex_exit();
|
2014-02-26 19:11:54 +01:00
|
|
|
return(err);
|
|
|
|
}
|
|
|
|
|
MDEV-14717: Prevent crash-downgrade to earlier MariaDB 10.2
A crash-downgrade of a RENAME (or TRUNCATE or table-rebuilding
ALTER TABLE or OPTIMIZE TABLE) operation to an earlier 10.2 version
would trigger a debug assertion failure during rollback,
in trx_roll_pop_top_rec_of_trx(). In a non-debug build, the
TRX_UNDO_RENAME_TABLE record would be misinterpreted as an
update_undo log record, and typically the file name would be
interpreted as DB_TRX_ID,DB_ROLL_PTR,PRIMARY KEY. If a matching
record would be found, row_undo_mod() would hit ut_error in
switch (node->rec_type). Typically, ut_a(table2 == NULL) would
fail when opening the table from SQL.
Because of this, we prevent a crash-downgrade to earlier MariaDB 10.2
versions by changing the InnoDB redo log format identifier to the
10.3 identifier, and by introducing a subformat identifier so that
10.2 can continue to refuse crash-downgrade from 10.3 or later.
After a clean shutdown, a downgrade to MariaDB 10.2.13 or later would
still be possible thanks to MDEV-14909. A downgrade to older 10.2
versions is only possible after removing the log files (not recommended).
LOG_HEADER_FORMAT_CURRENT: Change to 103 (originally the 10.3 format).
log_group_t: Add subformat. For 10.2, we will use subformat 1,
and will refuse crash recovery from any other subformat of the
10.3 format, that is, a genuine 10.3 redo log.
recv_find_max_checkpoint(): Allow startup after clean shutdown
from a future LOG_HEADER_FORMAT_10_4 (unencrypted only).
We cannot handle the encrypted 10.4 redo log block format,
which was introduced in MDEV-12041. Allow crash recovery from
the original 10.2 format as well as the new format.
In Mariabackup --backup, do not allow any startup from 10.3 or 10.4
redo logs.
recv_recovery_from_checkpoint_start(): Skip redo log apply for
clean 10.3 redo log, but not for the new 10.2 redo log
(10.3 format, subformat 1).
srv_prepare_to_delete_redo_log_files(): On format or subformat
mismatch, set srv_log_file_size = 0, so that we will display the
correct message.
innobase_start_or_create_for_mysql(): Check for format or subformat
mismatch.
xtrabackup_backup_func(): Remove debug assertions that were made
redundant by the code changes in recv_find_max_checkpoint().
2018-09-07 17:24:31 +03:00
|
|
|
switch (log_sys->log.format) {
|
|
|
|
case 0:
|
|
|
|
break;
|
|
|
|
case LOG_HEADER_FORMAT_10_2:
|
|
|
|
case LOG_HEADER_FORMAT_10_2 | LOG_HEADER_FORMAT_ENCRYPTED:
|
|
|
|
break;
|
MDEV-13564: Implement innodb_unsafe_truncate=ON for compatibility
While MariaDB Server 10.2 is not really guaranteed to be compatible
with Percona XtraBackup 2.4 (for example, the MySQL 5.7 undo log format
change that could be present in XtraBackup, but was reverted from
MariaDB in MDEV-12289), we do not want to disrupt users who have
deployed xtrabackup and MariaDB Server 10.2 in their environments.
With this change, MariaDB 10.2 will continue to use the backup-unsafe
TRUNCATE TABLE code, so that neither the undo log nor the redo log
formats will change in an incompatible way.
Undo tablespace truncation will keep using the redo log only. Recovery
or backup with old code will fail to shrink the undo tablespace files,
but the contents will be recovered just fine.
In the MariaDB Server 10.2 series only, we introduce the configuration
parameter innodb_unsafe_truncate and make it ON by default. To allow
MariaDB Backup (mariabackup) to work properly with TRUNCATE TABLE
operations, use loose_innodb_unsafe_truncate=OFF.
MariaDB Server 10.3.10 and later releases will always use the
backup-safe TRUNCATE TABLE, and this parameter will not be
added there.
recv_recovery_rollback_active(): Skip row_mysql_drop_garbage_tables()
unless innodb_unsafe_truncate=OFF. It is too unsafe to drop orphan
tables if RENAME operations are not transactional within InnoDB.
LOG_HEADER_FORMAT_10_3: Replaces LOG_HEADER_FORMAT_CURRENT.
log_init(), log_group_file_header_flush(),
srv_prepare_to_delete_redo_log_files(),
innobase_start_or_create_for_mysql(): Choose the redo log format
and subformat based on the value of innodb_unsafe_truncate.
2018-10-10 19:19:29 +03:00
|
|
|
case LOG_HEADER_FORMAT_10_3:
|
|
|
|
case LOG_HEADER_FORMAT_10_3 | LOG_HEADER_FORMAT_ENCRYPTED:
|
MDEV-14717: Prevent crash-downgrade to earlier MariaDB 10.2
A crash-downgrade of a RENAME (or TRUNCATE or table-rebuilding
ALTER TABLE or OPTIMIZE TABLE) operation to an earlier 10.2 version
would trigger a debug assertion failure during rollback,
in trx_roll_pop_top_rec_of_trx(). In a non-debug build, the
TRX_UNDO_RENAME_TABLE record would be misinterpreted as an
update_undo log record, and typically the file name would be
interpreted as DB_TRX_ID,DB_ROLL_PTR,PRIMARY KEY. If a matching
record would be found, row_undo_mod() would hit ut_error in
switch (node->rec_type). Typically, ut_a(table2 == NULL) would
fail when opening the table from SQL.
Because of this, we prevent a crash-downgrade to earlier MariaDB 10.2
versions by changing the InnoDB redo log format identifier to the
10.3 identifier, and by introducing a subformat identifier so that
10.2 can continue to refuse crash-downgrade from 10.3 or later.
After a clean shutdown, a downgrade to MariaDB 10.2.13 or later would
still be possible thanks to MDEV-14909. A downgrade to older 10.2
versions is only possible after removing the log files (not recommended).
LOG_HEADER_FORMAT_CURRENT: Change to 103 (originally the 10.3 format).
log_group_t: Add subformat. For 10.2, we will use subformat 1,
and will refuse crash recovery from any other subformat of the
10.3 format, that is, a genuine 10.3 redo log.
recv_find_max_checkpoint(): Allow startup after clean shutdown
from a future LOG_HEADER_FORMAT_10_4 (unencrypted only).
We cannot handle the encrypted 10.4 redo log block format,
which was introduced in MDEV-12041. Allow crash recovery from
the original 10.2 format as well as the new format.
In Mariabackup --backup, do not allow any startup from 10.3 or 10.4
redo logs.
recv_recovery_from_checkpoint_start(): Skip redo log apply for
clean 10.3 redo log, but not for the new 10.2 redo log
(10.3 format, subformat 1).
srv_prepare_to_delete_redo_log_files(): On format or subformat
mismatch, set srv_log_file_size = 0, so that we will display the
correct message.
innobase_start_or_create_for_mysql(): Check for format or subformat
mismatch.
xtrabackup_backup_func(): Remove debug assertions that were made
redundant by the code changes in recv_find_max_checkpoint().
2018-09-07 17:24:31 +03:00
|
|
|
if (log_sys->log.subformat == 1) {
|
|
|
|
/* 10.2 with new crash-safe TRUNCATE */
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
/* fall through */
|
|
|
|
default:
|
|
|
|
/* This must be a clean log from a newer version. */
|
|
|
|
goto skip_apply;
|
|
|
|
}
|
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
log_group_header_read(&log_sys->log, max_cp_field);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
buf = log_sys->checkpoint_buf;
|
|
|
|
|
|
|
|
checkpoint_lsn = mach_read_from_8(buf + LOG_CHECKPOINT_LSN);
|
|
|
|
checkpoint_no = mach_read_from_8(buf + LOG_CHECKPOINT_NO);
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/* Start reading the log groups from the checkpoint lsn up. The
|
|
|
|
variable contiguous_lsn contains an lsn up to which the log is
|
|
|
|
known to be contiguously written to all log groups. */
|
2016-09-06 09:43:16 +03:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_sys->mlog_checkpoint_lsn = 0;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(RECV_SCAN_SIZE <= log_sys->buf_size);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-03-01 23:43:37 +02:00
|
|
|
const lsn_t end_lsn = mach_read_from_8(
|
|
|
|
buf + LOG_CHECKPOINT_END_LSN);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(recv_sys->n_addrs == 0);
|
|
|
|
contiguous_lsn = checkpoint_lsn;
|
MDEV-14717: Prevent crash-downgrade to earlier MariaDB 10.2
A crash-downgrade of a RENAME (or TRUNCATE or table-rebuilding
ALTER TABLE or OPTIMIZE TABLE) operation to an earlier 10.2 version
would trigger a debug assertion failure during rollback,
in trx_roll_pop_top_rec_of_trx(). In a non-debug build, the
TRX_UNDO_RENAME_TABLE record would be misinterpreted as an
update_undo log record, and typically the file name would be
interpreted as DB_TRX_ID,DB_ROLL_PTR,PRIMARY KEY. If a matching
record would be found, row_undo_mod() would hit ut_error in
switch (node->rec_type). Typically, ut_a(table2 == NULL) would
fail when opening the table from SQL.
Because of this, we prevent a crash-downgrade to earlier MariaDB 10.2
versions by changing the InnoDB redo log format identifier to the
10.3 identifier, and by introducing a subformat identifier so that
10.2 can continue to refuse crash-downgrade from 10.3 or later.
After a clean shutdown, a downgrade to MariaDB 10.2.13 or later would
still be possible thanks to MDEV-14909. A downgrade to older 10.2
versions is only possible after removing the log files (not recommended).
LOG_HEADER_FORMAT_CURRENT: Change to 103 (originally the 10.3 format).
log_group_t: Add subformat. For 10.2, we will use subformat 1,
and will refuse crash recovery from any other subformat of the
10.3 format, that is, a genuine 10.3 redo log.
recv_find_max_checkpoint(): Allow startup after clean shutdown
from a future LOG_HEADER_FORMAT_10_4 (unencrypted only).
We cannot handle the encrypted 10.4 redo log block format,
which was introduced in MDEV-12041. Allow crash recovery from
the original 10.2 format as well as the new format.
In Mariabackup --backup, do not allow any startup from 10.3 or 10.4
redo logs.
recv_recovery_from_checkpoint_start(): Skip redo log apply for
clean 10.3 redo log, but not for the new 10.2 redo log
(10.3 format, subformat 1).
srv_prepare_to_delete_redo_log_files(): On format or subformat
mismatch, set srv_log_file_size = 0, so that we will display the
correct message.
innobase_start_or_create_for_mysql(): Check for format or subformat
mismatch.
xtrabackup_backup_func(): Remove debug assertions that were made
redundant by the code changes in recv_find_max_checkpoint().
2018-09-07 17:24:31 +03:00
|
|
|
switch (log_sys->log.format) {
|
2016-08-12 11:17:45 +03:00
|
|
|
case 0:
|
|
|
|
log_mutex_exit();
|
2018-06-04 11:31:39 +03:00
|
|
|
return recv_log_format_0_recover(checkpoint_lsn,
|
|
|
|
buf[20 + 32 * 9] == 2);
|
2017-08-07 17:21:30 +03:00
|
|
|
default:
|
2017-03-01 23:43:37 +02:00
|
|
|
if (end_lsn == 0) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
if (end_lsn >= checkpoint_lsn) {
|
|
|
|
contiguous_lsn = end_lsn;
|
|
|
|
break;
|
|
|
|
}
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_sys->found_corrupt_log = true;
|
|
|
|
log_mutex_exit();
|
|
|
|
return(DB_ERROR);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/* Look for MLOG_CHECKPOINT. */
|
MDEV-14717: Prevent crash-downgrade to earlier MariaDB 10.2
A crash-downgrade of a RENAME (or TRUNCATE or table-rebuilding
ALTER TABLE or OPTIMIZE TABLE) operation to an earlier 10.2 version
would trigger a debug assertion failure during rollback,
in trx_roll_pop_top_rec_of_trx(). In a non-debug build, the
TRX_UNDO_RENAME_TABLE record would be misinterpreted as an
update_undo log record, and typically the file name would be
interpreted as DB_TRX_ID,DB_ROLL_PTR,PRIMARY KEY. If a matching
record would be found, row_undo_mod() would hit ut_error in
switch (node->rec_type). Typically, ut_a(table2 == NULL) would
fail when opening the table from SQL.
Because of this, we prevent a crash-downgrade to earlier MariaDB 10.2
versions by changing the InnoDB redo log format identifier to the
10.3 identifier, and by introducing a subformat identifier so that
10.2 can continue to refuse crash-downgrade from 10.3 or later.
After a clean shutdown, a downgrade to MariaDB 10.2.13 or later would
still be possible thanks to MDEV-14909. A downgrade to older 10.2
versions is only possible after removing the log files (not recommended).
LOG_HEADER_FORMAT_CURRENT: Change to 103 (originally the 10.3 format).
log_group_t: Add subformat. For 10.2, we will use subformat 1,
and will refuse crash recovery from any other subformat of the
10.3 format, that is, a genuine 10.3 redo log.
recv_find_max_checkpoint(): Allow startup after clean shutdown
from a future LOG_HEADER_FORMAT_10_4 (unencrypted only).
We cannot handle the encrypted 10.4 redo log block format,
which was introduced in MDEV-12041. Allow crash recovery from
the original 10.2 format as well as the new format.
In Mariabackup --backup, do not allow any startup from 10.3 or 10.4
redo logs.
recv_recovery_from_checkpoint_start(): Skip redo log apply for
clean 10.3 redo log, but not for the new 10.2 redo log
(10.3 format, subformat 1).
srv_prepare_to_delete_redo_log_files(): On format or subformat
mismatch, set srv_log_file_size = 0, so that we will display the
correct message.
innobase_start_or_create_for_mysql(): Check for format or subformat
mismatch.
xtrabackup_backup_func(): Remove debug assertions that were made
redundant by the code changes in recv_find_max_checkpoint().
2018-09-07 17:24:31 +03:00
|
|
|
log_group_t* group = &log_sys->log;
|
2017-03-01 23:43:37 +02:00
|
|
|
recv_group_scan_log_recs(group, checkpoint_lsn, &contiguous_lsn,
|
|
|
|
false);
|
2016-08-12 11:17:45 +03:00
|
|
|
/* The first scan should not have stored or applied any records. */
|
|
|
|
ut_ad(recv_sys->n_addrs == 0);
|
|
|
|
ut_ad(!recv_sys->found_corrupt_fs);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-01-25 15:11:46 +02:00
|
|
|
if (srv_read_only_mode && recv_needed_recovery) {
|
2017-01-31 19:43:03 +02:00
|
|
|
log_mutex_exit();
|
2017-01-25 15:11:46 +02:00
|
|
|
return(DB_READ_ONLY);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (recv_sys->found_corrupt_log && !srv_force_recovery) {
|
|
|
|
log_mutex_exit();
|
2017-02-10 12:11:42 +02:00
|
|
|
ib::warn() << "Log scan aborted at LSN " << contiguous_lsn;
|
2016-08-12 11:17:45 +03:00
|
|
|
return(DB_ERROR);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (recv_sys->mlog_checkpoint_lsn == 0) {
|
2017-03-07 17:16:49 +02:00
|
|
|
lsn_t scan_lsn = group->scanned_lsn;
|
|
|
|
if (!srv_read_only_mode && scan_lsn != checkpoint_lsn) {
|
2017-02-10 12:11:42 +02:00
|
|
|
log_mutex_exit();
|
2017-03-01 23:43:37 +02:00
|
|
|
ib::error err;
|
|
|
|
err << "Missing MLOG_CHECKPOINT";
|
|
|
|
if (end_lsn) {
|
|
|
|
err << " at " << end_lsn;
|
|
|
|
}
|
|
|
|
err << " between the checkpoint " << checkpoint_lsn
|
|
|
|
<< " and the end " << scan_lsn << ".";
|
2017-02-10 12:11:42 +02:00
|
|
|
return(DB_ERROR);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
group->scanned_lsn = checkpoint_lsn;
|
|
|
|
rescan = false;
|
|
|
|
} else {
|
|
|
|
contiguous_lsn = checkpoint_lsn;
|
|
|
|
rescan = recv_group_scan_log_recs(
|
2017-03-01 23:43:37 +02:00
|
|
|
group, checkpoint_lsn, &contiguous_lsn, false);
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
if ((recv_sys->found_corrupt_log && !srv_force_recovery)
|
|
|
|
|| recv_sys->found_corrupt_fs) {
|
|
|
|
log_mutex_exit();
|
2014-02-26 19:11:54 +01:00
|
|
|
return(DB_ERROR);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/* NOTE: we always do a 'recovery' at startup, but only if
|
|
|
|
there is something wrong we will print a message to the
|
|
|
|
user about recovery: */
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-06-28 11:58:43 +03:00
|
|
|
if (flush_lsn == checkpoint_lsn + SIZE_OF_MLOG_CHECKPOINT
|
|
|
|
&& recv_sys->mlog_checkpoint_lsn == checkpoint_lsn) {
|
|
|
|
/* The redo log is logically empty. */
|
|
|
|
} else if (checkpoint_lsn != flush_lsn) {
|
|
|
|
ut_ad(!srv_log_files_created);
|
2015-08-07 15:21:20 +03:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (checkpoint_lsn + SIZE_OF_MLOG_CHECKPOINT < flush_lsn) {
|
2017-07-05 10:16:36 +03:00
|
|
|
ib::warn() << "Are you sure you are using the"
|
2016-08-12 11:17:45 +03:00
|
|
|
" right ib_logfiles to start up the database?"
|
|
|
|
" Log sequence number in the ib_logfiles is "
|
|
|
|
<< checkpoint_lsn << ", less than the"
|
|
|
|
" log sequence number in the first system"
|
|
|
|
" tablespace file header, " << flush_lsn << ".";
|
2015-08-07 15:21:20 +03:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (!recv_needed_recovery) {
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::info() << "The log sequence number " << flush_lsn
|
|
|
|
<< " in the system tablespace does not match"
|
|
|
|
" the log sequence number " << checkpoint_lsn
|
|
|
|
<< " in the ib_logfiles!";
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (srv_read_only_mode) {
|
2017-03-01 23:43:37 +02:00
|
|
|
ib::error() << "innodb_read_only"
|
|
|
|
" prevents crash recovery";
|
2016-08-12 11:17:45 +03:00
|
|
|
log_mutex_exit();
|
|
|
|
return(DB_READ_ONLY);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2017-03-01 23:43:37 +02:00
|
|
|
recv_needed_recovery = true;
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
}
|
2016-09-06 09:43:16 +03:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
log_sys->lsn = recv_sys->recovered_lsn;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (recv_needed_recovery) {
|
2018-03-27 13:47:56 +05:30
|
|
|
bool missing_tablespace = false;
|
|
|
|
|
|
|
|
err = recv_init_crash_recovery_spaces(
|
|
|
|
rescan, missing_tablespace);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (err != DB_SUCCESS) {
|
|
|
|
log_mutex_exit();
|
|
|
|
return(err);
|
|
|
|
}
|
|
|
|
|
2018-03-27 13:47:56 +05:30
|
|
|
/* If there is any missing tablespace and rescan is needed
|
|
|
|
then there is a possiblity that hash table will not contain
|
|
|
|
all space ids redo logs. Rescan the remaining unstored
|
|
|
|
redo logs for the validation of missing tablespace. */
|
2018-10-05 16:44:51 +05:30
|
|
|
ut_ad(rescan || !missing_tablespace);
|
|
|
|
|
2018-03-27 13:47:56 +05:30
|
|
|
while (missing_tablespace) {
|
|
|
|
DBUG_PRINT("ib_log", ("Rescan of redo log to validate "
|
|
|
|
"the missing tablespace. Scan "
|
|
|
|
"from last stored LSN " LSN_PF,
|
|
|
|
recv_sys->last_stored_lsn));
|
|
|
|
|
|
|
|
lsn_t recent_stored_lsn = recv_sys->last_stored_lsn;
|
|
|
|
rescan = recv_group_scan_log_recs(
|
|
|
|
group, checkpoint_lsn,
|
|
|
|
&recent_stored_lsn, false);
|
|
|
|
|
|
|
|
ut_ad(!recv_sys->found_corrupt_fs);
|
|
|
|
|
|
|
|
missing_tablespace = false;
|
|
|
|
|
|
|
|
err = recv_sys->found_corrupt_log
|
|
|
|
? DB_ERROR
|
|
|
|
: recv_validate_tablespace(
|
|
|
|
rescan, missing_tablespace);
|
|
|
|
|
|
|
|
if (err != DB_SUCCESS) {
|
|
|
|
log_mutex_exit();
|
|
|
|
return err;
|
|
|
|
}
|
2018-10-05 16:44:51 +05:30
|
|
|
|
|
|
|
rescan = true;
|
2018-03-27 13:47:56 +05:30
|
|
|
}
|
|
|
|
|
|
|
|
if (srv_operation == SRV_OPERATION_NORMAL) {
|
|
|
|
buf_dblwr_process();
|
|
|
|
}
|
|
|
|
|
|
|
|
ut_ad(srv_force_recovery <= SRV_FORCE_NO_UNDO_LOG_SCAN);
|
|
|
|
|
|
|
|
/* Spawn the background thread to flush dirty pages
|
|
|
|
from the buffer pools. */
|
|
|
|
recv_writer_thread_active = true;
|
|
|
|
os_thread_create(recv_writer_thread, 0, 0);
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (rescan) {
|
|
|
|
contiguous_lsn = checkpoint_lsn;
|
2016-09-06 09:43:16 +03:00
|
|
|
|
2017-03-01 23:43:37 +02:00
|
|
|
recv_group_scan_log_recs(group, checkpoint_lsn,
|
|
|
|
&contiguous_lsn, true);
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
if ((recv_sys->found_corrupt_log
|
|
|
|
&& !srv_force_recovery)
|
|
|
|
|| recv_sys->found_corrupt_fs) {
|
|
|
|
log_mutex_exit();
|
|
|
|
return(DB_ERROR);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
}
|
2016-08-12 11:17:45 +03:00
|
|
|
} else {
|
|
|
|
ut_ad(!rescan || recv_sys->n_addrs == 0);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
/* We currently have only one log group */
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (group->scanned_lsn < checkpoint_lsn
|
|
|
|
|| group->scanned_lsn < recv_max_page_lsn) {
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::error() << "We scanned the log up to " << group->scanned_lsn
|
|
|
|
<< ". A checkpoint was at " << checkpoint_lsn << " and"
|
|
|
|
" the maximum LSN on a database page was "
|
|
|
|
<< recv_max_page_lsn << ". It is possible that the"
|
|
|
|
" database is now corrupt!";
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (recv_sys->recovered_lsn < checkpoint_lsn) {
|
|
|
|
log_mutex_exit();
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-09-06 09:43:16 +03:00
|
|
|
ib::error() << "Recovered only to lsn:"
|
|
|
|
<< recv_sys->recovered_lsn << " checkpoint_lsn: " << checkpoint_lsn;
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
return(DB_ERROR);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Synchronize the uncorrupted log groups to the most up-to-date log
|
|
|
|
group; we also copy checkpoint info to groups */
|
|
|
|
|
|
|
|
log_sys->next_checkpoint_lsn = checkpoint_lsn;
|
|
|
|
log_sys->next_checkpoint_no = checkpoint_no + 1;
|
2016-09-06 09:43:16 +03:00
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
recv_synchronize_groups();
|
|
|
|
|
|
|
|
if (!recv_needed_recovery) {
|
|
|
|
ut_a(checkpoint_lsn == recv_sys->recovered_lsn);
|
|
|
|
} else {
|
|
|
|
srv_start_lsn = recv_sys->recovered_lsn;
|
|
|
|
}
|
|
|
|
|
|
|
|
log_sys->buf_free = (ulint) log_sys->lsn % OS_FILE_LOG_BLOCK_SIZE;
|
|
|
|
log_sys->buf_next_to_write = log_sys->buf_free;
|
2016-08-12 11:17:45 +03:00
|
|
|
log_sys->write_lsn = log_sys->lsn;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
log_sys->last_checkpoint_lsn = checkpoint_lsn;
|
|
|
|
|
2017-07-07 18:29:31 +03:00
|
|
|
if (!srv_read_only_mode && srv_operation == SRV_OPERATION_NORMAL) {
|
2016-08-12 11:17:45 +03:00
|
|
|
/* Write a MLOG_CHECKPOINT marker as the first thing,
|
2017-07-07 18:29:31 +03:00
|
|
|
before generating any other redo log. This ensures
|
|
|
|
that subsequent crash recovery will be possible even
|
|
|
|
if the server were killed soon after this. */
|
2016-08-12 11:17:45 +03:00
|
|
|
fil_names_clear(log_sys->last_checkpoint_lsn, true);
|
|
|
|
}
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
MONITOR_SET(MONITOR_LSN_CHECKPOINT_AGE,
|
|
|
|
log_sys->lsn - log_sys->last_checkpoint_lsn);
|
|
|
|
|
2017-02-10 12:11:42 +02:00
|
|
|
log_sys->next_checkpoint_no = ++checkpoint_no;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
mutex_enter(&recv_sys->mutex);
|
|
|
|
|
|
|
|
recv_sys->apply_log_recs = TRUE;
|
|
|
|
|
|
|
|
mutex_exit(&recv_sys->mutex);
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
log_mutex_exit();
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_lsn_checks_on = true;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/* The database is now ready to start almost normal processing of user
|
|
|
|
transactions: transaction rollbacks and the application of the log
|
|
|
|
records in the hash table can be run in background. */
|
|
|
|
|
|
|
|
return(DB_SUCCESS);
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Complete recovery from a checkpoint. */
|
2014-02-26 19:11:54 +01:00
|
|
|
void
|
|
|
|
recv_recovery_from_checkpoint_finish(void)
|
|
|
|
{
|
|
|
|
/* Make sure that the recv_writer thread is done. This is
|
|
|
|
required because it grabs various mutexes and we want to
|
|
|
|
ensure that when we enable sync_order_checks there is no
|
|
|
|
mutex currently held by any thread. */
|
|
|
|
mutex_enter(&recv_sys->writer_mutex);
|
|
|
|
|
|
|
|
/* Free the resources of the recovery system */
|
2016-08-12 11:17:45 +03:00
|
|
|
recv_recovery_on = false;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/* By acquring the mutex we ensure that the recv_writer thread
|
2016-08-12 11:17:45 +03:00
|
|
|
won't trigger any more LRU batches. Now wait for currently
|
2014-02-26 19:11:54 +01:00
|
|
|
in progress batches to finish. */
|
|
|
|
buf_flush_wait_LRU_batch_end();
|
|
|
|
|
|
|
|
mutex_exit(&recv_sys->writer_mutex);
|
|
|
|
|
|
|
|
ulint count = 0;
|
|
|
|
while (recv_writer_thread_active) {
|
|
|
|
++count;
|
|
|
|
os_thread_sleep(100000);
|
|
|
|
if (srv_print_verbose_log && count > 600) {
|
2016-08-12 11:17:45 +03:00
|
|
|
ib::info() << "Waiting for recv_writer to"
|
|
|
|
" finish flushing of buffer pool";
|
2014-02-26 19:11:54 +01:00
|
|
|
count = 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
recv_sys_debug_free();
|
2016-08-12 11:17:45 +03:00
|
|
|
|
|
|
|
/* Free up the flush_rbt. */
|
|
|
|
buf_flush_free_flush_rbt();
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
/********************************************************//**
|
|
|
|
Initiates the rollback of active transactions. */
|
|
|
|
void
|
|
|
|
recv_recovery_rollback_active(void)
|
|
|
|
/*===============================*/
|
|
|
|
{
|
|
|
|
ut_ad(!recv_writer_thread_active);
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/* Switch latching order checks on in sync0debug.cc, if
|
|
|
|
--innodb-sync-debug=true (default) */
|
|
|
|
ut_d(sync_check_enable());
|
|
|
|
|
2014-02-26 19:11:54 +01:00
|
|
|
/* We can't start any (DDL) transactions if UNDO logging
|
|
|
|
has been disabled, additionally disable ROLLBACK of recovered
|
|
|
|
user transactions. */
|
|
|
|
if (srv_force_recovery < SRV_FORCE_NO_TRX_UNDO
|
|
|
|
&& !srv_read_only_mode) {
|
|
|
|
|
|
|
|
/* Drop partially created indexes. */
|
|
|
|
row_merge_drop_temp_indexes();
|
Follow-up to MDEV-13407 innodb.drop_table_background failed in buildbot with "Tablespace for table exists"
This is a backport of commit 88aff5f471d3d9ae8ecc2f909bcf5bd0ddd6aa7c.
The InnoDB background DROP TABLE queue is something that we should
really remove, but are unable to until we remove dict_operation_lock
so that DDL and DML operations can be combined in a single transaction.
Because the queue is not persistent, it is not crash-safe. We should
in some way ensure that the deferred-dropped tables will be dropped
after server restart.
The existence of two separate transactions complicates the error handling
of CREATE TABLE...SELECT. We should really not break locks in DROP TABLE.
Our solution to these problems is to rename the table to a temporary
name, and to drop such-named tables on InnoDB startup. Also, the
queue will use table IDs instead of names from now on.
check-testcase.test: Ignore #sql-ib*.ibd files, because tables may enter
the background DROP TABLE queue shortly before the test finishes.
innodb.drop_table_background: Test CREATE...SELECT and the creation of
tables whose file name starts with #sql-ib.
innodb.alter_crash: Adjust the recovery, now that the #sql-ib tables
will be dropped on InnoDB startup.
row_mysql_drop_garbage_tables(): New function, to drop all #sql-ib tables
on InnoDB startup.
row_drop_table_for_mysql_in_background(): Remove an unnecessary and
misplaced call to log_buffer_flush_to_disk(). (The call should have been
after the transaction commit. We do not care about flushing the redo log
here, because the table would be dropped again at server startup.)
Remove the entry from the list after the table no longer exists.
If server shutdown has been initiated, empty the list without actually
dropping any tables. They will be dropped again on startup.
row_drop_table_for_mysql(): Do not call lock_remove_all_on_table().
Instead, if locks exist, defer the DROP TABLE until they do not exist.
If the table name does not start with #sql-ib, rename it to that prefix
before adding it to the background DROP TABLE queue.
2018-09-06 11:47:54 +03:00
|
|
|
/* Drop garbage tables. */
|
2018-10-11 15:10:13 +03:00
|
|
|
if (srv_safe_truncate)
|
Follow-up to MDEV-13407 innodb.drop_table_background failed in buildbot with "Tablespace for table exists"
This is a backport of commit 88aff5f471d3d9ae8ecc2f909bcf5bd0ddd6aa7c.
The InnoDB background DROP TABLE queue is something that we should
really remove, but are unable to until we remove dict_operation_lock
so that DDL and DML operations can be combined in a single transaction.
Because the queue is not persistent, it is not crash-safe. We should
in some way ensure that the deferred-dropped tables will be dropped
after server restart.
The existence of two separate transactions complicates the error handling
of CREATE TABLE...SELECT. We should really not break locks in DROP TABLE.
Our solution to these problems is to rename the table to a temporary
name, and to drop such-named tables on InnoDB startup. Also, the
queue will use table IDs instead of names from now on.
check-testcase.test: Ignore #sql-ib*.ibd files, because tables may enter
the background DROP TABLE queue shortly before the test finishes.
innodb.drop_table_background: Test CREATE...SELECT and the creation of
tables whose file name starts with #sql-ib.
innodb.alter_crash: Adjust the recovery, now that the #sql-ib tables
will be dropped on InnoDB startup.
row_mysql_drop_garbage_tables(): New function, to drop all #sql-ib tables
on InnoDB startup.
row_drop_table_for_mysql_in_background(): Remove an unnecessary and
misplaced call to log_buffer_flush_to_disk(). (The call should have been
after the transaction commit. We do not care about flushing the redo log
here, because the table would be dropped again at server startup.)
Remove the entry from the list after the table no longer exists.
If server shutdown has been initiated, empty the list without actually
dropping any tables. They will be dropped again on startup.
row_drop_table_for_mysql(): Do not call lock_remove_all_on_table().
Instead, if locks exist, defer the DROP TABLE until they do not exist.
If the table name does not start with #sql-ib, rename it to that prefix
before adding it to the background DROP TABLE queue.
2018-09-06 11:47:54 +03:00
|
|
|
row_mysql_drop_garbage_tables();
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/* Drop any auxiliary tables that were not dropped when the
|
|
|
|
parent table was dropped. This can happen if the parent table
|
|
|
|
was dropped but the server crashed before the auxiliary tables
|
|
|
|
were dropped. */
|
|
|
|
fts_drop_orphaned_tables();
|
|
|
|
|
|
|
|
/* Rollback the uncommitted transactions which have no user
|
|
|
|
session */
|
|
|
|
|
2015-02-18 16:20:46 +01:00
|
|
|
trx_rollback_or_clean_is_active = true;
|
2014-02-26 19:11:54 +01:00
|
|
|
os_thread_create(trx_rollback_or_clean_all_recovered, 0, 0);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/******************************************************//**
|
|
|
|
Resets the logs. The contents of log files will be lost! */
|
|
|
|
void
|
|
|
|
recv_reset_logs(
|
|
|
|
/*============*/
|
|
|
|
lsn_t lsn) /*!< in: reset to this lsn
|
|
|
|
rounded up to be divisible by
|
|
|
|
OS_FILE_LOG_BLOCK_SIZE, after
|
|
|
|
which we add
|
|
|
|
LOG_BLOCK_HDR_SIZE */
|
|
|
|
{
|
2016-08-12 11:17:45 +03:00
|
|
|
ut_ad(log_mutex_own());
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
log_sys->lsn = ut_uint64_align_up(lsn, OS_FILE_LOG_BLOCK_SIZE);
|
|
|
|
|
2017-05-26 14:04:19 +03:00
|
|
|
log_sys->log.lsn = log_sys->lsn;
|
|
|
|
log_sys->log.lsn_offset = LOG_FILE_HDR_SIZE;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
log_sys->buf_next_to_write = 0;
|
2016-08-12 11:17:45 +03:00
|
|
|
log_sys->write_lsn = log_sys->lsn;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
log_sys->next_checkpoint_no = 0;
|
|
|
|
log_sys->last_checkpoint_lsn = 0;
|
|
|
|
|
2017-09-07 12:01:07 +03:00
|
|
|
memset(log_sys->buf, 0, log_sys->buf_size);
|
2014-02-26 19:11:54 +01:00
|
|
|
log_block_init(log_sys->buf, log_sys->lsn);
|
|
|
|
log_block_set_first_rec_group(log_sys->buf, LOG_BLOCK_HDR_SIZE);
|
|
|
|
|
|
|
|
log_sys->buf_free = LOG_BLOCK_HDR_SIZE;
|
|
|
|
log_sys->lsn += LOG_BLOCK_HDR_SIZE;
|
|
|
|
|
|
|
|
MONITOR_SET(MONITOR_LSN_CHECKPOINT_AGE,
|
|
|
|
(log_sys->lsn - log_sys->last_checkpoint_lsn));
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
log_mutex_exit();
|
2014-02-26 19:11:54 +01:00
|
|
|
|
|
|
|
/* Reset the checkpoint fields in logs */
|
|
|
|
|
|
|
|
log_make_checkpoint_at(LSN_MAX, TRUE);
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
log_mutex_enter();
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
/** Find a doublewrite copy of a page.
|
|
|
|
@param[in] space_id tablespace identifier
|
|
|
|
@param[in] page_no page number
|
|
|
|
@return page frame
|
|
|
|
@retval NULL if no page was found */
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
const byte*
|
|
|
|
recv_dblwr_t::find_page(ulint space_id, ulint page_no)
|
|
|
|
{
|
|
|
|
typedef std::vector<const byte*, ut_allocator<const byte*> >
|
|
|
|
matches_t;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
matches_t matches;
|
|
|
|
const byte* result = 0;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
for (list::iterator i = pages.begin(); i != pages.end(); ++i) {
|
|
|
|
if (page_get_space_id(*i) == space_id
|
|
|
|
&& page_get_page_no(*i) == page_no) {
|
|
|
|
matches.push_back(*i);
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (matches.size() == 1) {
|
|
|
|
result = matches[0];
|
|
|
|
} else if (matches.size() > 1) {
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
lsn_t max_lsn = 0;
|
|
|
|
lsn_t page_lsn = 0;
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
for (matches_t::iterator i = matches.begin();
|
|
|
|
i != matches.end();
|
|
|
|
++i) {
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
page_lsn = mach_read_from_8(*i + FIL_PAGE_LSN);
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
if (page_lsn > max_lsn) {
|
|
|
|
max_lsn = page_lsn;
|
|
|
|
result = *i;
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
return(result);
|
|
|
|
}
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
#ifndef DBUG_OFF
|
|
|
|
/** Return string name of the redo log record type.
|
|
|
|
@param[in] type record log record enum
|
|
|
|
@return string name of record log record */
|
MDEV-13564 Mariabackup does not work with TRUNCATE
Implement undo tablespace truncation via normal redo logging.
Implement TRUNCATE TABLE as a combination of RENAME to #sql-ib name,
CREATE, and DROP.
Note: Orphan #sql-ib*.ibd may be left behind if MariaDB Server 10.2
is killed before the DROP operation is committed. If MariaDB Server 10.2
is killed during TRUNCATE, it is also possible that the old table
was renamed to #sql-ib*.ibd but the data dictionary will refer to the
table using the original name.
In MariaDB Server 10.3, RENAME inside InnoDB is transactional,
and #sql-* tables will be dropped on startup. So, this new TRUNCATE
will be fully crash-safe in 10.3.
ha_mroonga::wrapper_truncate(): Pass table options to the underlying
storage engine, now that ha_innobase::truncate() will need them.
rpl_slave_state::truncate_state_table(): Before truncating
mysql.gtid_slave_pos, evict any cached table handles from
the table definition cache, so that there will be no stale
references to the old table after truncating.
== TRUNCATE TABLE ==
WL#6501 in MySQL 5.7 introduced separate log files for implementing
atomic and crash-safe TRUNCATE TABLE, instead of using the InnoDB
undo and redo log. Some convoluted logic was added to the InnoDB
crash recovery, and some extra synchronization (including a redo log
checkpoint) was introduced to make this work. This synchronization
has caused performance problems and race conditions, and the extra
log files cannot be copied or applied by external backup programs.
In order to support crash-upgrade from MariaDB 10.2, we will keep
the logic for parsing and applying the extra log files, but we will
no longer generate those files in TRUNCATE TABLE.
A prerequisite for crash-safe TRUNCATE is a crash-safe RENAME TABLE
(with full redo and undo logging and proper rollback). This will
be implemented in MDEV-14717.
ha_innobase::truncate(): Invoke RENAME, create(), delete_table().
Because RENAME cannot be fully rolled back before MariaDB 10.3
due to missing undo logging, add some explicit rename-back in
case the operation fails.
ha_innobase::delete(): Introduce a variant that takes sqlcom as
a parameter. In TRUNCATE TABLE, we do not want to touch any
FOREIGN KEY constraints.
ha_innobase::create(): Add the parameters file_per_table, trx.
In TRUNCATE, the new table must be created in the same transaction
that renames the old table.
create_table_info_t::create_table_info_t(): Add the parameters
file_per_table, trx.
row_drop_table_for_mysql(): Replace a bool parameter with sqlcom.
row_drop_table_after_create_fail(): New function, wrapping
row_drop_table_for_mysql().
dict_truncate_index_tree_in_mem(), fil_truncate_tablespace(),
fil_prepare_for_truncate(), fil_reinit_space_header_for_table(),
row_truncate_table_for_mysql(), TruncateLogger,
row_truncate_prepare(), row_truncate_rollback(),
row_truncate_complete(), row_truncate_fts(),
row_truncate_update_system_tables(),
row_truncate_foreign_key_checks(), row_truncate_sanity_checks():
Remove.
row_upd_check_references_constraints(): Remove a check for
TRUNCATE, now that the table is no longer truncated in place.
The new test innodb.truncate_foreign uses DEBUG_SYNC to cover some
race-condition like scenarios. The test innodb-innodb.truncate does
not use any synchronization.
We add a redo log subformat to indicate backup-friendly format.
MariaDB 10.4 will remove support for the old TRUNCATE logging,
so crash-upgrade from old 10.2 or 10.3 to 10.4 will involve
limitations.
== Undo tablespace truncation ==
MySQL 5.7 implements undo tablespace truncation. It is only
possible when innodb_undo_tablespaces is set to at least 2.
The logging is implemented similar to the WL#6501 TRUNCATE,
that is, using separate log files and a redo log checkpoint.
We can simply implement undo tablespace truncation within
a single mini-transaction that reinitializes the undo log
tablespace file. Unfortunately, due to the redo log format
of some operations, currently, the total redo log written by
undo tablespace truncation will be more than the combined size
of the truncated undo tablespace. It should be acceptable
to have a little more than 1 megabyte of log in a single
mini-transaction. This will be fixed in MDEV-17138 in
MariaDB Server 10.4.
recv_sys_t: Add truncated_undo_spaces[] to remember for which undo
tablespaces a MLOG_FILE_CREATE2 record was seen.
namespace undo: Remove some unnecessary declarations.
fil_space_t::is_being_truncated: Document that this flag now
only applies to undo tablespaces. Remove some references.
fil_space_t::is_stopping(): Do not refer to is_being_truncated.
This check is for tablespaces of tables. Potentially used
tablespaces are never truncated any more.
buf_dblwr_process(): Suppress the out-of-bounds warning
for undo tablespaces.
fil_truncate_log(): Write a MLOG_FILE_CREATE2 with a nonzero
page number (new size of the tablespace in pages) to inform
crash recovery that the undo tablespace size has been reduced.
fil_op_write_log(): Relax assertions, so that MLOG_FILE_CREATE2
can be written for undo tablespaces (without .ibd file suffix)
for a nonzero page number.
os_file_truncate(): Add the parameter allow_shrink=false
so that undo tablespaces can actually be shrunk using this function.
fil_name_parse(): For undo tablespace truncation,
buffer MLOG_FILE_CREATE2 in truncated_undo_spaces[].
recv_read_in_area(): Avoid reading pages for which no redo log
records remain buffered, after recv_addr_trim() removed them.
trx_rseg_header_create(): Add a FIXME comment that we could write
much less redo log.
trx_undo_truncate_tablespace(): Reinitialize the undo tablespace
in a single mini-transaction, which will be flushed to the redo log
before the file size is trimmed.
recv_addr_trim(): Discard any redo logs for pages that were
logged after the new end of a file, before the truncation LSN.
If the rec_list becomes empty, reduce n_addrs. After removing
any affected records, actually truncate the file.
recv_apply_hashed_log_recs(): Invoke recv_addr_trim() right before
applying any log records. The undo tablespace files must be open
at this point.
buf_flush_or_remove_pages(), buf_flush_dirty_pages(),
buf_LRU_flush_or_remove_pages(): Add a parameter for specifying
the number of the first page to flush or remove (default 0).
trx_purge_initiate_truncate(): Remove the log checkpoints, the
extra logging, and some unnecessary crash points. Merge the code
from trx_undo_truncate_tablespace(). First, flush all to-be-discarded
pages (beyond the new end of the file), then trim the space->size
to make the page allocation deterministic. At the only remaining
crash injection point, flush the redo log, so that the recovery
can be tested.
2018-08-28 13:43:06 +03:00
|
|
|
static const char* get_mlog_string(mlog_id_t type)
|
2016-08-12 11:17:45 +03:00
|
|
|
{
|
|
|
|
switch (type) {
|
|
|
|
case MLOG_SINGLE_REC_FLAG:
|
|
|
|
return("MLOG_SINGLE_REC_FLAG");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_1BYTE:
|
|
|
|
return("MLOG_1BYTE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_2BYTES:
|
|
|
|
return("MLOG_2BYTES");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_4BYTES:
|
|
|
|
return("MLOG_4BYTES");
|
2015-08-07 15:21:20 +03:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_8BYTES:
|
|
|
|
return("MLOG_8BYTES");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_REC_INSERT:
|
|
|
|
return("MLOG_REC_INSERT");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_REC_CLUST_DELETE_MARK:
|
|
|
|
return("MLOG_REC_CLUST_DELETE_MARK");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_REC_SEC_DELETE_MARK:
|
|
|
|
return("MLOG_REC_SEC_DELETE_MARK");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_REC_UPDATE_IN_PLACE:
|
|
|
|
return("MLOG_REC_UPDATE_IN_PLACE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_REC_DELETE:
|
|
|
|
return("MLOG_REC_DELETE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_LIST_END_DELETE:
|
|
|
|
return("MLOG_LIST_END_DELETE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_LIST_START_DELETE:
|
|
|
|
return("MLOG_LIST_START_DELETE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_LIST_END_COPY_CREATED:
|
|
|
|
return("MLOG_LIST_END_COPY_CREATED");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_PAGE_REORGANIZE:
|
|
|
|
return("MLOG_PAGE_REORGANIZE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_PAGE_CREATE:
|
|
|
|
return("MLOG_PAGE_CREATE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_UNDO_INSERT:
|
|
|
|
return("MLOG_UNDO_INSERT");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_UNDO_ERASE_END:
|
|
|
|
return("MLOG_UNDO_ERASE_END");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_UNDO_INIT:
|
|
|
|
return("MLOG_UNDO_INIT");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_UNDO_HDR_REUSE:
|
|
|
|
return("MLOG_UNDO_HDR_REUSE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_UNDO_HDR_CREATE:
|
|
|
|
return("MLOG_UNDO_HDR_CREATE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_REC_MIN_MARK:
|
|
|
|
return("MLOG_REC_MIN_MARK");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_IBUF_BITMAP_INIT:
|
|
|
|
return("MLOG_IBUF_BITMAP_INIT");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
#ifdef UNIV_LOG_LSN_DEBUG
|
|
|
|
case MLOG_LSN:
|
|
|
|
return("MLOG_LSN");
|
|
|
|
#endif /* UNIV_LOG_LSN_DEBUG */
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_WRITE_STRING:
|
|
|
|
return("MLOG_WRITE_STRING");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_MULTI_REC_END:
|
|
|
|
return("MLOG_MULTI_REC_END");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_DUMMY_RECORD:
|
|
|
|
return("MLOG_DUMMY_RECORD");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_FILE_DELETE:
|
|
|
|
return("MLOG_FILE_DELETE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_COMP_REC_MIN_MARK:
|
|
|
|
return("MLOG_COMP_REC_MIN_MARK");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_COMP_PAGE_CREATE:
|
|
|
|
return("MLOG_COMP_PAGE_CREATE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_COMP_REC_INSERT:
|
|
|
|
return("MLOG_COMP_REC_INSERT");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_COMP_REC_CLUST_DELETE_MARK:
|
|
|
|
return("MLOG_COMP_REC_CLUST_DELETE_MARK");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_COMP_REC_UPDATE_IN_PLACE:
|
|
|
|
return("MLOG_COMP_REC_UPDATE_IN_PLACE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_COMP_REC_DELETE:
|
|
|
|
return("MLOG_COMP_REC_DELETE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_COMP_LIST_END_DELETE:
|
|
|
|
return("MLOG_COMP_LIST_END_DELETE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_COMP_LIST_START_DELETE:
|
|
|
|
return("MLOG_COMP_LIST_START_DELETE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_COMP_LIST_END_COPY_CREATED:
|
|
|
|
return("MLOG_COMP_LIST_END_COPY_CREATED");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_COMP_PAGE_REORGANIZE:
|
|
|
|
return("MLOG_COMP_PAGE_REORGANIZE");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_FILE_CREATE2:
|
|
|
|
return("MLOG_FILE_CREATE2");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_ZIP_WRITE_NODE_PTR:
|
|
|
|
return("MLOG_ZIP_WRITE_NODE_PTR");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_ZIP_WRITE_BLOB_PTR:
|
|
|
|
return("MLOG_ZIP_WRITE_BLOB_PTR");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_ZIP_WRITE_HEADER:
|
|
|
|
return("MLOG_ZIP_WRITE_HEADER");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_ZIP_PAGE_COMPRESS:
|
|
|
|
return("MLOG_ZIP_PAGE_COMPRESS");
|
2014-02-26 19:11:54 +01:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_ZIP_PAGE_COMPRESS_NO_DATA:
|
|
|
|
return("MLOG_ZIP_PAGE_COMPRESS_NO_DATA");
|
2014-05-05 18:20:28 +02:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_ZIP_PAGE_REORGANIZE:
|
|
|
|
return("MLOG_ZIP_PAGE_REORGANIZE");
|
2014-05-05 18:20:28 +02:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_FILE_RENAME2:
|
|
|
|
return("MLOG_FILE_RENAME2");
|
2014-05-05 18:20:28 +02:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_FILE_NAME:
|
|
|
|
return("MLOG_FILE_NAME");
|
2014-05-05 18:20:28 +02:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_CHECKPOINT:
|
|
|
|
return("MLOG_CHECKPOINT");
|
2014-05-05 18:20:28 +02:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_PAGE_CREATE_RTREE:
|
|
|
|
return("MLOG_PAGE_CREATE_RTREE");
|
2014-05-05 18:20:28 +02:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_COMP_PAGE_CREATE_RTREE:
|
|
|
|
return("MLOG_COMP_PAGE_CREATE_RTREE");
|
2014-05-05 18:20:28 +02:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_INIT_FILE_PAGE2:
|
|
|
|
return("MLOG_INIT_FILE_PAGE2");
|
2014-05-05 18:20:28 +02:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_INDEX_LOAD:
|
|
|
|
return("MLOG_INDEX_LOAD");
|
2014-05-05 18:20:28 +02:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_TRUNCATE:
|
|
|
|
return("MLOG_TRUNCATE");
|
2014-05-05 18:20:28 +02:00
|
|
|
|
2016-08-12 11:17:45 +03:00
|
|
|
case MLOG_FILE_WRITE_CRYPT_DATA:
|
|
|
|
return("MLOG_FILE_WRITE_CRYPT_DATA");
|
2014-05-05 18:20:28 +02:00
|
|
|
}
|
2016-08-12 11:17:45 +03:00
|
|
|
DBUG_ASSERT(0);
|
|
|
|
return(NULL);
|
2014-05-05 18:20:28 +02:00
|
|
|
}
|
2016-08-12 11:17:45 +03:00
|
|
|
#endif /* !DBUG_OFF */
|