2009-03-26 07:11:11 +01:00
|
|
|
/*****************************************************************************
|
|
|
|
|
2016-08-10 19:24:58 +02:00
|
|
|
Copyright (c) 1997, 2016, Oracle and/or its affiliates. All Rights Reserved.
|
2017-05-16 19:08:47 +02:00
|
|
|
Copyright (c) 2017, MariaDB Corporation.
|
2009-03-26 07:11:11 +01:00
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify it under
|
|
|
|
the terms of the GNU General Public License as published by the Free Software
|
|
|
|
Foundation; version 2 of the License.
|
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful, but WITHOUT
|
|
|
|
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
|
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License along with
|
2011-12-14 14:58:22 +01:00
|
|
|
this program; if not, write to the Free Software Foundation, Inc.,
|
|
|
|
51 Franklin Street, Suite 500, Boston, MA 02110-1335 USA
|
2009-03-26 07:11:11 +01:00
|
|
|
|
|
|
|
*****************************************************************************/
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/**************************************************//**
|
2013-12-16 15:38:05 +01:00
|
|
|
@file row/row0purge.cc
|
2008-12-01 07:10:29 +01:00
|
|
|
Purge obsolete records
|
|
|
|
|
|
|
|
Created 3/14/1997 Heikki Tuuri
|
|
|
|
*******************************************************/
|
|
|
|
|
|
|
|
#include "row0purge.h"
|
|
|
|
|
|
|
|
#ifdef UNIV_NONINL
|
|
|
|
#include "row0purge.ic"
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include "fsp0fsp.h"
|
|
|
|
#include "mach0data.h"
|
|
|
|
#include "trx0rseg.h"
|
|
|
|
#include "trx0trx.h"
|
|
|
|
#include "trx0roll.h"
|
|
|
|
#include "trx0undo.h"
|
|
|
|
#include "trx0purge.h"
|
|
|
|
#include "trx0rec.h"
|
|
|
|
#include "que0que.h"
|
|
|
|
#include "row0row.h"
|
|
|
|
#include "row0upd.h"
|
|
|
|
#include "row0vers.h"
|
|
|
|
#include "row0mysql.h"
|
2013-12-16 15:38:05 +01:00
|
|
|
#include "row0log.h"
|
2008-12-01 07:10:29 +01:00
|
|
|
#include "log0log.h"
|
2013-12-16 15:38:05 +01:00
|
|
|
#include "srv0mon.h"
|
|
|
|
#include "srv0start.h"
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2010-09-03 17:41:57 +02:00
|
|
|
/*************************************************************************
|
|
|
|
IMPORTANT NOTE: Any operation that generates redo MUST check that there
|
|
|
|
is enough space in the redo log before for that operation. This is
|
|
|
|
done by calling log_free_check(). The reason for checking the
|
|
|
|
availability of the redo log space before the start of the operation is
|
|
|
|
that we MUST not hold any synchonization objects when performing the
|
|
|
|
check.
|
|
|
|
If you make a change in this module make sure that no codepath is
|
|
|
|
introduced where a call to log_free_check() is bypassed. */
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/********************************************************************//**
|
|
|
|
Creates a purge node to a query graph.
|
|
|
|
@return own: purge node */
|
2008-12-01 07:10:29 +01:00
|
|
|
UNIV_INTERN
|
|
|
|
purge_node_t*
|
|
|
|
row_purge_node_create(
|
|
|
|
/*==================*/
|
2013-12-16 15:38:05 +01:00
|
|
|
que_thr_t* parent, /*!< in: parent node */
|
|
|
|
mem_heap_t* heap) /*!< in: memory heap where created */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
|
|
|
purge_node_t* node;
|
|
|
|
|
2016-08-10 19:24:58 +02:00
|
|
|
ut_ad(parent != NULL);
|
|
|
|
ut_ad(heap != NULL);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
node = static_cast<purge_node_t*>(
|
|
|
|
mem_heap_zalloc(heap, sizeof(*node)));
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
node->common.type = QUE_NODE_PURGE;
|
|
|
|
node->common.parent = parent;
|
2013-12-16 15:38:05 +01:00
|
|
|
node->done = TRUE;
|
2008-12-01 07:10:29 +01:00
|
|
|
node->heap = mem_heap_create(256);
|
|
|
|
|
|
|
|
return(node);
|
|
|
|
}
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***********************************************************//**
|
2008-12-01 07:10:29 +01:00
|
|
|
Repositions the pcur in the purge node on the clustered index record,
|
2015-10-09 17:20:49 +02:00
|
|
|
if found. If the record is not found, close pcur.
|
2009-09-07 12:22:53 +02:00
|
|
|
@return TRUE if the record was found */
|
2008-12-01 07:10:29 +01:00
|
|
|
static
|
|
|
|
ibool
|
|
|
|
row_purge_reposition_pcur(
|
|
|
|
/*======================*/
|
2009-09-07 12:22:53 +02:00
|
|
|
ulint mode, /*!< in: latching mode */
|
|
|
|
purge_node_t* node, /*!< in: row purge node */
|
|
|
|
mtr_t* mtr) /*!< in: mtr */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
|
|
|
if (node->found_clust) {
|
2015-10-09 17:20:49 +02:00
|
|
|
ut_ad(node->validate_pcur());
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2015-10-09 17:20:49 +02:00
|
|
|
node->found_clust = btr_pcur_restore_position(mode, &node->pcur, mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
} else {
|
|
|
|
node->found_clust = row_search_on_row_ref(
|
|
|
|
&node->pcur, mode, node->table, node->ref, mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (node->found_clust) {
|
|
|
|
btr_pcur_store_position(&node->pcur, mtr);
|
|
|
|
}
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2015-10-09 17:20:49 +02:00
|
|
|
/* Close the current cursor if we fail to position it correctly. */
|
|
|
|
if (!node->found_clust) {
|
|
|
|
btr_pcur_close(&node->pcur);
|
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
return(node->found_clust);
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***********************************************************//**
|
|
|
|
Removes a delete marked clustered index record if possible.
|
2013-12-16 15:38:05 +01:00
|
|
|
@retval true if the row was not found, or it was successfully removed
|
|
|
|
@retval false if the row was modified after the delete marking */
|
2016-08-10 19:24:58 +02:00
|
|
|
static MY_ATTRIBUTE((nonnull, warn_unused_result))
|
2013-12-16 15:38:05 +01:00
|
|
|
bool
|
2008-12-01 07:10:29 +01:00
|
|
|
row_purge_remove_clust_if_poss_low(
|
|
|
|
/*===============================*/
|
2013-12-16 15:38:05 +01:00
|
|
|
purge_node_t* node, /*!< in/out: row purge node */
|
2009-09-07 12:22:53 +02:00
|
|
|
ulint mode) /*!< in: BTR_MODIFY_LEAF or BTR_MODIFY_TREE */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
2013-12-16 15:38:05 +01:00
|
|
|
dict_index_t* index;
|
|
|
|
bool success = true;
|
|
|
|
mtr_t mtr;
|
|
|
|
rec_t* rec;
|
|
|
|
mem_heap_t* heap = NULL;
|
|
|
|
ulint* offsets;
|
|
|
|
ulint offsets_[REC_OFFS_NORMAL_SIZE];
|
2008-12-01 07:10:29 +01:00
|
|
|
rec_offs_init(offsets_);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
#ifdef UNIV_SYNC_DEBUG
|
|
|
|
ut_ad(rw_lock_own(&dict_operation_lock, RW_LOCK_SHARED));
|
|
|
|
#endif /* UNIV_SYNC_DEBUG */
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
index = dict_table_get_first_index(node->table);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2010-09-03 17:41:57 +02:00
|
|
|
log_free_check();
|
2008-12-01 07:10:29 +01:00
|
|
|
mtr_start(&mtr);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (!row_purge_reposition_pcur(mode, node, &mtr)) {
|
|
|
|
/* The record was already removed. */
|
|
|
|
goto func_exit;
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
rec = btr_pcur_get_rec(&node->pcur);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
offsets = rec_get_offsets(
|
|
|
|
rec, index, offsets_, ULINT_UNDEFINED, &heap);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (node->roll_ptr != row_get_rec_roll_ptr(rec, index, offsets)) {
|
|
|
|
/* Someone else has modified the record later: do not remove */
|
|
|
|
goto func_exit;
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
if (mode == BTR_MODIFY_LEAF) {
|
2013-12-16 15:38:05 +01:00
|
|
|
success = btr_cur_optimistic_delete(
|
|
|
|
btr_pcur_get_btr_cur(&node->pcur), 0, &mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
} else {
|
2013-12-16 15:38:05 +01:00
|
|
|
dberr_t err;
|
2008-12-01 07:10:29 +01:00
|
|
|
ut_ad(mode == BTR_MODIFY_TREE);
|
2013-12-16 15:38:05 +01:00
|
|
|
btr_cur_pessimistic_delete(
|
|
|
|
&err, FALSE, btr_pcur_get_btr_cur(&node->pcur), 0,
|
|
|
|
RB_NONE, &mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
switch (err) {
|
|
|
|
case DB_SUCCESS:
|
|
|
|
break;
|
|
|
|
case DB_OUT_OF_FILE_SPACE:
|
|
|
|
success = false;
|
|
|
|
break;
|
|
|
|
default:
|
2008-12-01 07:10:29 +01:00
|
|
|
ut_error;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
func_exit:
|
|
|
|
if (heap) {
|
|
|
|
mem_heap_free(heap);
|
|
|
|
}
|
|
|
|
|
2015-10-09 17:20:49 +02:00
|
|
|
/* Persistent cursor is closed if reposition fails. */
|
|
|
|
if (node->found_clust) {
|
|
|
|
btr_pcur_commit_specify_mtr(&node->pcur, &mtr);
|
|
|
|
} else {
|
|
|
|
mtr_commit(&mtr);
|
|
|
|
}
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
return(success);
|
|
|
|
}
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***********************************************************//**
|
2008-12-01 07:10:29 +01:00
|
|
|
Removes a clustered index record if it has not been modified after the delete
|
2013-12-16 15:38:05 +01:00
|
|
|
marking.
|
|
|
|
@retval true if the row was not found, or it was successfully removed
|
|
|
|
@retval false the purge needs to be suspended because of running out
|
|
|
|
of file space. */
|
2016-08-10 19:24:58 +02:00
|
|
|
static MY_ATTRIBUTE((nonnull, warn_unused_result))
|
2013-12-16 15:38:05 +01:00
|
|
|
bool
|
2008-12-01 07:10:29 +01:00
|
|
|
row_purge_remove_clust_if_poss(
|
|
|
|
/*===========================*/
|
2013-12-16 15:38:05 +01:00
|
|
|
purge_node_t* node) /*!< in/out: row purge node */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
2013-12-16 15:38:05 +01:00
|
|
|
if (row_purge_remove_clust_if_poss_low(node, BTR_MODIFY_LEAF)) {
|
|
|
|
return(true);
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
for (ulint n_tries = 0;
|
|
|
|
n_tries < BTR_CUR_RETRY_DELETE_N_TIMES;
|
|
|
|
n_tries++) {
|
|
|
|
if (row_purge_remove_clust_if_poss_low(
|
|
|
|
node, BTR_MODIFY_TREE)) {
|
|
|
|
return(true);
|
|
|
|
}
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
os_thread_sleep(BTR_CUR_RETRY_SLEEP_TIME);
|
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
return(false);
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***********************************************************//**
|
2011-07-14 21:22:41 +02:00
|
|
|
Determines if it is possible to remove a secondary index entry.
|
|
|
|
Removal is possible if the secondary index entry does not refer to any
|
|
|
|
not delete marked version of a clustered index record where DB_TRX_ID
|
|
|
|
is newer than the purge view.
|
|
|
|
|
|
|
|
NOTE: This function should only be called by the purge thread, only
|
|
|
|
while holding a latch on the leaf page of the secondary index entry
|
|
|
|
(or keeping the buffer pool watch on the page). It is possible that
|
2013-12-16 15:38:05 +01:00
|
|
|
this function first returns true and then false, if a user transaction
|
2011-07-14 21:22:41 +02:00
|
|
|
inserts a record that the secondary index entry would refer to.
|
|
|
|
However, in that case, the user transaction would also re-insert the
|
|
|
|
secondary index entry after purge has removed it and released the leaf
|
|
|
|
page latch.
|
2013-12-16 15:38:05 +01:00
|
|
|
@return true if the secondary index record can be purged */
|
2011-07-14 21:22:41 +02:00
|
|
|
UNIV_INTERN
|
2013-12-16 15:38:05 +01:00
|
|
|
bool
|
2011-07-14 21:22:41 +02:00
|
|
|
row_purge_poss_sec(
|
|
|
|
/*===============*/
|
|
|
|
purge_node_t* node, /*!< in/out: row purge node */
|
|
|
|
dict_index_t* index, /*!< in: secondary index */
|
|
|
|
const dtuple_t* entry) /*!< in: secondary index entry */
|
|
|
|
{
|
2013-12-16 15:38:05 +01:00
|
|
|
bool can_delete;
|
2011-07-14 21:22:41 +02:00
|
|
|
mtr_t mtr;
|
|
|
|
|
|
|
|
ut_ad(!dict_index_is_clust(index));
|
|
|
|
mtr_start(&mtr);
|
|
|
|
|
|
|
|
can_delete = !row_purge_reposition_pcur(BTR_SEARCH_LEAF, node, &mtr)
|
|
|
|
|| !row_vers_old_has_index_entry(TRUE,
|
|
|
|
btr_pcur_get_rec(&node->pcur),
|
|
|
|
&mtr, index, entry);
|
|
|
|
|
2015-10-09 17:20:49 +02:00
|
|
|
/* Persistent cursor is closed if reposition fails. */
|
|
|
|
if (node->found_clust) {
|
|
|
|
btr_pcur_commit_specify_mtr(&node->pcur, &mtr);
|
|
|
|
} else {
|
|
|
|
mtr_commit(&mtr);
|
|
|
|
}
|
2011-07-14 21:22:41 +02:00
|
|
|
|
|
|
|
return(can_delete);
|
|
|
|
}
|
|
|
|
|
|
|
|
/***************************************************************
|
|
|
|
Removes a secondary index entry if possible, by modifying the
|
|
|
|
index tree. Does not try to buffer the delete.
|
2009-09-07 12:22:53 +02:00
|
|
|
@return TRUE if success or if not found */
|
2016-08-10 19:24:58 +02:00
|
|
|
static MY_ATTRIBUTE((nonnull, warn_unused_result))
|
2008-12-01 07:10:29 +01:00
|
|
|
ibool
|
2011-07-14 21:22:41 +02:00
|
|
|
row_purge_remove_sec_if_poss_tree(
|
|
|
|
/*==============================*/
|
2009-09-07 12:22:53 +02:00
|
|
|
purge_node_t* node, /*!< in: row purge node */
|
|
|
|
dict_index_t* index, /*!< in: index */
|
2011-07-14 21:22:41 +02:00
|
|
|
const dtuple_t* entry) /*!< in: index entry */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
2011-07-14 21:22:41 +02:00
|
|
|
btr_pcur_t pcur;
|
|
|
|
btr_cur_t* btr_cur;
|
|
|
|
ibool success = TRUE;
|
2013-12-16 15:38:05 +01:00
|
|
|
dberr_t err;
|
2011-07-14 21:22:41 +02:00
|
|
|
mtr_t mtr;
|
|
|
|
enum row_search_result search_result;
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
log_free_check();
|
|
|
|
mtr_start(&mtr);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (*index->name == TEMP_INDEX_PREFIX) {
|
|
|
|
/* The index->online_status may change if the
|
|
|
|
index->name starts with TEMP_INDEX_PREFIX (meaning
|
|
|
|
that the index is or was being created online). It is
|
|
|
|
protected by index->lock. */
|
|
|
|
mtr_x_lock(dict_index_get_lock(index), &mtr);
|
|
|
|
|
|
|
|
if (dict_index_is_online_ddl(index)) {
|
|
|
|
/* Online secondary index creation will not
|
|
|
|
copy any delete-marked records. Therefore
|
|
|
|
there is nothing to be purged. We must also
|
|
|
|
skip the purge when a completed index is
|
|
|
|
dropped by rollback_inplace_alter_table(). */
|
|
|
|
goto func_exit_no_pcur;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
/* For secondary indexes,
|
|
|
|
index->online_status==ONLINE_INDEX_CREATION unless
|
|
|
|
index->name starts with TEMP_INDEX_PREFIX. */
|
|
|
|
ut_ad(!dict_index_is_online_ddl(index));
|
|
|
|
}
|
|
|
|
|
2011-07-14 21:22:41 +02:00
|
|
|
search_result = row_search_index_entry(index, entry, BTR_MODIFY_TREE,
|
|
|
|
&pcur, &mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2011-07-14 21:22:41 +02:00
|
|
|
switch (search_result) {
|
|
|
|
case ROW_NOT_FOUND:
|
2009-03-26 07:11:11 +01:00
|
|
|
/* Not found. This is a legitimate condition. In a
|
|
|
|
rollback, InnoDB will remove secondary recs that would
|
|
|
|
be purged anyway. Then the actual purge will not find
|
|
|
|
the secondary index record. Also, the purge itself is
|
|
|
|
eager: if it comes to consider a secondary index
|
|
|
|
record, and notices it does not need to exist in the
|
|
|
|
index, it will remove it. Then if/when the purge
|
|
|
|
comes to consider the secondary index record a second
|
|
|
|
time, it will not exist any more in the index. */
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
/* fputs("PURGE:........sec entry not found\n", stderr); */
|
|
|
|
/* dtuple_print(stderr, entry); */
|
2011-07-14 21:22:41 +02:00
|
|
|
goto func_exit;
|
|
|
|
case ROW_FOUND:
|
|
|
|
break;
|
|
|
|
case ROW_BUFFERED:
|
|
|
|
case ROW_NOT_DELETED_REF:
|
|
|
|
/* These are invalid outcomes, because the mode passed
|
|
|
|
to row_search_index_entry() did not include any of the
|
|
|
|
flags BTR_INSERT, BTR_DELETE, or BTR_DELETE_MARK. */
|
|
|
|
ut_error;
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
btr_cur = btr_pcur_get_btr_cur(&pcur);
|
|
|
|
|
|
|
|
/* We should remove the index record if no later version of the row,
|
|
|
|
which cannot be purged yet, requires its existence. If some requires,
|
|
|
|
we should do nothing. */
|
|
|
|
|
2011-07-14 21:22:41 +02:00
|
|
|
if (row_purge_poss_sec(node, index, entry)) {
|
|
|
|
/* Remove the index record, which should have been
|
|
|
|
marked for deletion. */
|
2014-11-18 18:11:15 +01:00
|
|
|
if (!rec_get_deleted_flag(btr_cur_get_rec(btr_cur),
|
|
|
|
dict_table_is_comp(index->table))) {
|
|
|
|
fputs("InnoDB: tried to purge sec index entry not"
|
|
|
|
" marked for deletion in\n"
|
|
|
|
"InnoDB: ", stderr);
|
|
|
|
dict_index_name_print(stderr, NULL, index);
|
|
|
|
fputs("\n"
|
|
|
|
"InnoDB: tuple ", stderr);
|
|
|
|
dtuple_print(stderr, entry);
|
|
|
|
fputs("\n"
|
|
|
|
"InnoDB: record ", stderr);
|
|
|
|
rec_print(stderr, btr_cur_get_rec(btr_cur), index);
|
|
|
|
putc('\n', stderr);
|
|
|
|
|
|
|
|
ut_ad(0);
|
|
|
|
|
|
|
|
goto func_exit;
|
|
|
|
}
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
btr_cur_pessimistic_delete(&err, FALSE, btr_cur, 0,
|
2011-07-14 21:22:41 +02:00
|
|
|
RB_NONE, &mtr);
|
|
|
|
switch (UNIV_EXPECT(err, DB_SUCCESS)) {
|
|
|
|
case DB_SUCCESS:
|
|
|
|
break;
|
|
|
|
case DB_OUT_OF_FILE_SPACE:
|
|
|
|
success = FALSE;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
ut_error;
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-07-14 21:22:41 +02:00
|
|
|
func_exit:
|
2008-12-01 07:10:29 +01:00
|
|
|
btr_pcur_close(&pcur);
|
2013-12-16 15:38:05 +01:00
|
|
|
func_exit_no_pcur:
|
2008-12-01 07:10:29 +01:00
|
|
|
mtr_commit(&mtr);
|
|
|
|
|
|
|
|
return(success);
|
|
|
|
}
|
|
|
|
|
2011-07-14 21:22:41 +02:00
|
|
|
/***************************************************************
|
|
|
|
Removes a secondary index entry without modifying the index tree,
|
|
|
|
if possible.
|
2013-12-16 15:38:05 +01:00
|
|
|
@retval true if success or if not found
|
|
|
|
@retval false if row_purge_remove_sec_if_poss_tree() should be invoked */
|
2016-08-10 19:24:58 +02:00
|
|
|
static MY_ATTRIBUTE((nonnull, warn_unused_result))
|
2013-12-16 15:38:05 +01:00
|
|
|
bool
|
2011-07-14 21:22:41 +02:00
|
|
|
row_purge_remove_sec_if_poss_leaf(
|
|
|
|
/*==============================*/
|
|
|
|
purge_node_t* node, /*!< in: row purge node */
|
|
|
|
dict_index_t* index, /*!< in: index */
|
|
|
|
const dtuple_t* entry) /*!< in: index entry */
|
|
|
|
{
|
|
|
|
mtr_t mtr;
|
|
|
|
btr_pcur_t pcur;
|
2013-12-16 15:38:05 +01:00
|
|
|
ulint mode;
|
2011-07-14 21:22:41 +02:00
|
|
|
enum row_search_result search_result;
|
2013-12-16 15:38:05 +01:00
|
|
|
bool success = true;
|
2011-07-14 21:22:41 +02:00
|
|
|
|
|
|
|
log_free_check();
|
|
|
|
|
|
|
|
mtr_start(&mtr);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (*index->name == TEMP_INDEX_PREFIX) {
|
|
|
|
/* The index->online_status may change if the
|
|
|
|
index->name starts with TEMP_INDEX_PREFIX (meaning
|
|
|
|
that the index is or was being created online). It is
|
|
|
|
protected by index->lock. */
|
|
|
|
mtr_s_lock(dict_index_get_lock(index), &mtr);
|
|
|
|
|
|
|
|
if (dict_index_is_online_ddl(index)) {
|
|
|
|
/* Online secondary index creation will not
|
|
|
|
copy any delete-marked records. Therefore
|
|
|
|
there is nothing to be purged. We must also
|
|
|
|
skip the purge when a completed index is
|
|
|
|
dropped by rollback_inplace_alter_table(). */
|
|
|
|
goto func_exit_no_pcur;
|
|
|
|
}
|
|
|
|
|
|
|
|
mode = BTR_MODIFY_LEAF | BTR_ALREADY_S_LATCHED | BTR_DELETE;
|
|
|
|
} else {
|
|
|
|
/* For secondary indexes,
|
|
|
|
index->online_status==ONLINE_INDEX_CREATION unless
|
|
|
|
index->name starts with TEMP_INDEX_PREFIX. */
|
|
|
|
ut_ad(!dict_index_is_online_ddl(index));
|
|
|
|
|
|
|
|
mode = BTR_MODIFY_LEAF | BTR_DELETE;
|
|
|
|
}
|
|
|
|
|
2011-07-14 21:22:41 +02:00
|
|
|
/* Set the purge node for the call to row_purge_poss_sec(). */
|
|
|
|
pcur.btr_cur.purge_node = node;
|
|
|
|
/* Set the query thread, so that ibuf_insert_low() will be
|
|
|
|
able to invoke thd_get_trx(). */
|
2013-12-16 15:38:05 +01:00
|
|
|
pcur.btr_cur.thr = static_cast<que_thr_t*>(que_node_get_parent(node));
|
2011-07-14 21:22:41 +02:00
|
|
|
|
|
|
|
search_result = row_search_index_entry(
|
2013-12-16 15:38:05 +01:00
|
|
|
index, entry, mode, &pcur, &mtr);
|
2011-07-14 21:22:41 +02:00
|
|
|
|
|
|
|
switch (search_result) {
|
|
|
|
case ROW_FOUND:
|
|
|
|
/* Before attempting to purge a record, check
|
|
|
|
if it is safe to do so. */
|
|
|
|
if (row_purge_poss_sec(node, index, entry)) {
|
|
|
|
btr_cur_t* btr_cur = btr_pcur_get_btr_cur(&pcur);
|
|
|
|
|
|
|
|
/* Only delete-marked records should be purged. */
|
2014-11-18 18:11:15 +01:00
|
|
|
if (!rec_get_deleted_flag(
|
|
|
|
btr_cur_get_rec(btr_cur),
|
|
|
|
dict_table_is_comp(index->table))) {
|
|
|
|
|
|
|
|
fputs("InnoDB: tried to purge sec index"
|
|
|
|
" entry not marked for deletion in\n"
|
|
|
|
"InnoDB: ", stderr);
|
|
|
|
dict_index_name_print(stderr, NULL, index);
|
|
|
|
fputs("\n"
|
|
|
|
"InnoDB: tuple ", stderr);
|
|
|
|
dtuple_print(stderr, entry);
|
|
|
|
fputs("\n"
|
|
|
|
"InnoDB: record ", stderr);
|
|
|
|
rec_print(stderr, btr_cur_get_rec(btr_cur),
|
|
|
|
index);
|
|
|
|
putc('\n', stderr);
|
|
|
|
|
|
|
|
ut_ad(0);
|
|
|
|
|
|
|
|
btr_pcur_close(&pcur);
|
|
|
|
|
|
|
|
goto func_exit_no_pcur;
|
|
|
|
}
|
2011-07-14 21:22:41 +02:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (!btr_cur_optimistic_delete(btr_cur, 0, &mtr)) {
|
2011-07-14 21:22:41 +02:00
|
|
|
|
|
|
|
/* The index entry could not be deleted. */
|
2013-12-16 15:38:05 +01:00
|
|
|
success = false;
|
2011-07-14 21:22:41 +02:00
|
|
|
}
|
|
|
|
}
|
2017-05-16 19:08:47 +02:00
|
|
|
/* (The index entry is still needed,
|
2011-07-14 21:22:41 +02:00
|
|
|
or the deletion succeeded) */
|
2017-05-16 19:08:47 +02:00
|
|
|
/* fall through */
|
2011-07-14 21:22:41 +02:00
|
|
|
case ROW_NOT_DELETED_REF:
|
|
|
|
/* The index entry is still needed. */
|
|
|
|
case ROW_BUFFERED:
|
|
|
|
/* The deletion was buffered. */
|
|
|
|
case ROW_NOT_FOUND:
|
|
|
|
/* The index entry does not exist, nothing to do. */
|
|
|
|
btr_pcur_close(&pcur);
|
2013-12-16 15:38:05 +01:00
|
|
|
func_exit_no_pcur:
|
2011-07-14 21:22:41 +02:00
|
|
|
mtr_commit(&mtr);
|
|
|
|
return(success);
|
|
|
|
}
|
|
|
|
|
|
|
|
ut_error;
|
|
|
|
return(FALSE);
|
|
|
|
}
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***********************************************************//**
|
2008-12-01 07:10:29 +01:00
|
|
|
Removes a secondary index entry if possible. */
|
2016-08-10 19:24:58 +02:00
|
|
|
UNIV_INLINE MY_ATTRIBUTE((nonnull(1,2)))
|
2008-12-01 07:10:29 +01:00
|
|
|
void
|
|
|
|
row_purge_remove_sec_if_poss(
|
|
|
|
/*=========================*/
|
2009-09-07 12:22:53 +02:00
|
|
|
purge_node_t* node, /*!< in: row purge node */
|
|
|
|
dict_index_t* index, /*!< in: index */
|
2013-12-16 15:38:05 +01:00
|
|
|
const dtuple_t* entry) /*!< in: index entry */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
|
|
|
ibool success;
|
|
|
|
ulint n_tries = 0;
|
|
|
|
|
|
|
|
/* fputs("Purge: Removing secondary record\n", stderr); */
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (!entry) {
|
|
|
|
/* The node->row must have lacked some fields of this
|
|
|
|
index. This is possible when the undo log record was
|
|
|
|
written before this index was created. */
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2011-07-14 21:22:41 +02:00
|
|
|
if (row_purge_remove_sec_if_poss_leaf(node, index, entry)) {
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
retry:
|
2011-07-14 21:22:41 +02:00
|
|
|
success = row_purge_remove_sec_if_poss_tree(node, index, entry);
|
2008-12-01 07:10:29 +01:00
|
|
|
/* The delete operation may fail if we have little
|
|
|
|
file space left: TODO: easiest to crash the database
|
|
|
|
and restart with more file space */
|
|
|
|
|
|
|
|
if (!success && n_tries < BTR_CUR_RETRY_DELETE_N_TIMES) {
|
|
|
|
|
|
|
|
n_tries++;
|
|
|
|
|
|
|
|
os_thread_sleep(BTR_CUR_RETRY_SLEEP_TIME);
|
|
|
|
|
|
|
|
goto retry;
|
|
|
|
}
|
|
|
|
|
|
|
|
ut_a(success);
|
|
|
|
}
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***********************************************************//**
|
2013-12-16 15:38:05 +01:00
|
|
|
Purges a delete marking of a record.
|
|
|
|
@retval true if the row was not found, or it was successfully removed
|
|
|
|
@retval false the purge needs to be suspended because of
|
|
|
|
running out of file space */
|
2016-08-10 19:24:58 +02:00
|
|
|
static MY_ATTRIBUTE((nonnull, warn_unused_result))
|
2013-12-16 15:38:05 +01:00
|
|
|
bool
|
2008-12-01 07:10:29 +01:00
|
|
|
row_purge_del_mark(
|
|
|
|
/*===============*/
|
2013-12-16 15:38:05 +01:00
|
|
|
purge_node_t* node) /*!< in/out: row purge node */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
|
|
|
mem_heap_t* heap;
|
|
|
|
|
|
|
|
heap = mem_heap_create(1024);
|
|
|
|
|
|
|
|
while (node->index != NULL) {
|
2011-12-14 14:58:22 +01:00
|
|
|
/* skip corrupted secondary index */
|
|
|
|
dict_table_skip_corrupt_index(node->index);
|
|
|
|
|
|
|
|
if (!node->index) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (node->index->type != DICT_FTS) {
|
|
|
|
dtuple_t* entry = row_build_index_entry_low(
|
|
|
|
node->row, NULL, node->index, heap);
|
|
|
|
row_purge_remove_sec_if_poss(node, node->index, entry);
|
|
|
|
mem_heap_empty(heap);
|
|
|
|
}
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
node->index = dict_table_get_next_index(node->index);
|
|
|
|
}
|
|
|
|
|
|
|
|
mem_heap_free(heap);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
return(row_purge_remove_clust_if_poss(node));
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***********************************************************//**
|
2008-12-01 07:10:29 +01:00
|
|
|
Purges an update of an existing record. Also purges an update of a delete
|
|
|
|
marked record if that record contained an externally stored field. */
|
|
|
|
static
|
|
|
|
void
|
2011-04-29 14:49:04 +02:00
|
|
|
row_purge_upd_exist_or_extern_func(
|
|
|
|
/*===============================*/
|
|
|
|
#ifdef UNIV_DEBUG
|
2013-12-16 15:38:05 +01:00
|
|
|
const que_thr_t*thr, /*!< in: query thread */
|
2011-04-29 14:49:04 +02:00
|
|
|
#endif /* UNIV_DEBUG */
|
2013-12-16 15:38:05 +01:00
|
|
|
purge_node_t* node, /*!< in: row purge node */
|
|
|
|
trx_undo_rec_t* undo_rec) /*!< in: record to purge */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
|
|
|
mem_heap_t* heap;
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
#ifdef UNIV_SYNC_DEBUG
|
|
|
|
ut_ad(rw_lock_own(&dict_operation_lock, RW_LOCK_SHARED));
|
|
|
|
#endif /* UNIV_SYNC_DEBUG */
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2011-12-14 14:58:22 +01:00
|
|
|
if (node->rec_type == TRX_UNDO_UPD_DEL_REC
|
|
|
|
|| (node->cmpl_info & UPD_NODE_NO_ORD_CHANGE)) {
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
goto skip_secondaries;
|
|
|
|
}
|
|
|
|
|
|
|
|
heap = mem_heap_create(1024);
|
|
|
|
|
|
|
|
while (node->index != NULL) {
|
2011-12-14 14:58:22 +01:00
|
|
|
dict_table_skip_corrupt_index(node->index);
|
|
|
|
|
|
|
|
if (!node->index) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2011-04-29 14:49:04 +02:00
|
|
|
if (row_upd_changes_ord_field_binary(node->index, node->update,
|
|
|
|
thr, NULL, NULL)) {
|
2008-12-01 07:10:29 +01:00
|
|
|
/* Build the older version of the index entry */
|
2013-12-16 15:38:05 +01:00
|
|
|
dtuple_t* entry = row_build_index_entry_low(
|
|
|
|
node->row, NULL, node->index, heap);
|
|
|
|
row_purge_remove_sec_if_poss(node, node->index, entry);
|
|
|
|
mem_heap_empty(heap);
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
node->index = dict_table_get_next_index(node->index);
|
|
|
|
}
|
|
|
|
|
|
|
|
mem_heap_free(heap);
|
|
|
|
|
|
|
|
skip_secondaries:
|
|
|
|
/* Free possible externally stored fields */
|
2013-12-16 15:38:05 +01:00
|
|
|
for (ulint i = 0; i < upd_get_n_fields(node->update); i++) {
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
const upd_field_t* ufield
|
|
|
|
= upd_get_nth_field(node->update, i);
|
|
|
|
|
|
|
|
if (dfield_is_ext(&ufield->new_val)) {
|
2013-12-16 15:38:05 +01:00
|
|
|
trx_rseg_t* rseg;
|
2008-12-01 07:10:29 +01:00
|
|
|
buf_block_t* block;
|
|
|
|
ulint internal_offset;
|
|
|
|
byte* data_field;
|
2013-12-16 15:38:05 +01:00
|
|
|
dict_index_t* index;
|
|
|
|
ibool is_insert;
|
|
|
|
ulint rseg_id;
|
|
|
|
ulint page_no;
|
|
|
|
ulint offset;
|
|
|
|
mtr_t mtr;
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
/* We use the fact that new_val points to
|
2013-12-16 15:38:05 +01:00
|
|
|
undo_rec and get thus the offset of
|
2008-12-01 07:10:29 +01:00
|
|
|
dfield data inside the undo record. Then we
|
|
|
|
can calculate from node->roll_ptr the file
|
|
|
|
address of the new_val data */
|
|
|
|
|
|
|
|
internal_offset
|
|
|
|
= ((const byte*)
|
|
|
|
dfield_get_data(&ufield->new_val))
|
2013-12-16 15:38:05 +01:00
|
|
|
- undo_rec;
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
ut_a(internal_offset < UNIV_PAGE_SIZE);
|
|
|
|
|
|
|
|
trx_undo_decode_roll_ptr(node->roll_ptr,
|
|
|
|
&is_insert, &rseg_id,
|
|
|
|
&page_no, &offset);
|
2013-12-16 15:38:05 +01:00
|
|
|
|
|
|
|
rseg = trx_sys_get_nth_rseg(trx_sys, rseg_id);
|
|
|
|
ut_a(rseg != NULL);
|
|
|
|
ut_a(rseg->id == rseg_id);
|
|
|
|
|
2008-12-01 07:10:29 +01:00
|
|
|
mtr_start(&mtr);
|
|
|
|
|
|
|
|
/* We have to acquire an X-latch to the clustered
|
|
|
|
index tree */
|
|
|
|
|
|
|
|
index = dict_table_get_first_index(node->table);
|
|
|
|
mtr_x_lock(dict_index_get_lock(index), &mtr);
|
|
|
|
|
|
|
|
/* NOTE: we must also acquire an X-latch to the
|
|
|
|
root page of the tree. We will need it when we
|
|
|
|
free pages from the tree. If the tree is of height 1,
|
|
|
|
the tree X-latch does NOT protect the root page,
|
|
|
|
because it is also a leaf page. Since we will have a
|
|
|
|
latch on an undo log page, we would break the
|
|
|
|
latching order if we would only later latch the
|
|
|
|
root page of such a tree! */
|
|
|
|
|
|
|
|
btr_root_get(index, &mtr);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
block = buf_page_get(
|
|
|
|
rseg->space, 0, page_no, RW_X_LATCH, &mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
buf_block_dbg_add_level(block, SYNC_TRX_UNDO_PAGE);
|
2008-12-03 06:06:00 +01:00
|
|
|
|
2008-12-01 07:10:29 +01:00
|
|
|
data_field = buf_block_get_frame(block)
|
|
|
|
+ offset + internal_offset;
|
|
|
|
|
|
|
|
ut_a(dfield_get_len(&ufield->new_val)
|
|
|
|
>= BTR_EXTERN_FIELD_REF_SIZE);
|
|
|
|
btr_free_externally_stored_field(
|
|
|
|
index,
|
|
|
|
data_field + dfield_get_len(&ufield->new_val)
|
|
|
|
- BTR_EXTERN_FIELD_REF_SIZE,
|
2008-12-03 06:06:00 +01:00
|
|
|
NULL, NULL, NULL, 0, RB_NONE, &mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
mtr_commit(&mtr);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-04-29 14:49:04 +02:00
|
|
|
#ifdef UNIV_DEBUG
|
2013-12-16 15:38:05 +01:00
|
|
|
# define row_purge_upd_exist_or_extern(thr,node,undo_rec) \
|
|
|
|
row_purge_upd_exist_or_extern_func(thr,node,undo_rec)
|
2011-04-29 14:49:04 +02:00
|
|
|
#else /* UNIV_DEBUG */
|
2013-12-16 15:38:05 +01:00
|
|
|
# define row_purge_upd_exist_or_extern(thr,node,undo_rec) \
|
|
|
|
row_purge_upd_exist_or_extern_func(node,undo_rec)
|
2011-04-29 14:49:04 +02:00
|
|
|
#endif /* UNIV_DEBUG */
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***********************************************************//**
|
|
|
|
Parses the row reference and other info in a modify undo log record.
|
2013-12-16 15:38:05 +01:00
|
|
|
@return true if purge operation required */
|
2008-12-01 07:10:29 +01:00
|
|
|
static
|
2013-12-16 15:38:05 +01:00
|
|
|
bool
|
2008-12-01 07:10:29 +01:00
|
|
|
row_purge_parse_undo_rec(
|
|
|
|
/*=====================*/
|
2013-12-16 15:38:05 +01:00
|
|
|
purge_node_t* node, /*!< in: row undo node */
|
|
|
|
trx_undo_rec_t* undo_rec, /*!< in: record to purge */
|
|
|
|
bool* updated_extern, /*!< out: true if an externally
|
|
|
|
stored field was updated */
|
|
|
|
que_thr_t* thr) /*!< in: query thread */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
|
|
|
dict_index_t* clust_index;
|
|
|
|
byte* ptr;
|
|
|
|
trx_t* trx;
|
2009-09-07 12:22:53 +02:00
|
|
|
undo_no_t undo_no;
|
2011-07-14 21:22:41 +02:00
|
|
|
table_id_t table_id;
|
2009-09-07 12:22:53 +02:00
|
|
|
trx_id_t trx_id;
|
|
|
|
roll_ptr_t roll_ptr;
|
2008-12-01 07:10:29 +01:00
|
|
|
ulint info_bits;
|
|
|
|
ulint type;
|
|
|
|
|
2016-08-10 19:24:58 +02:00
|
|
|
ut_ad(node != NULL);
|
|
|
|
ut_ad(thr != NULL);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2011-12-14 14:58:22 +01:00
|
|
|
ptr = trx_undo_rec_get_pars(
|
2013-12-16 15:38:05 +01:00
|
|
|
undo_rec, &type, &node->cmpl_info,
|
2011-12-14 14:58:22 +01:00
|
|
|
updated_extern, &undo_no, &table_id);
|
2013-12-16 15:38:05 +01:00
|
|
|
|
2008-12-01 07:10:29 +01:00
|
|
|
node->rec_type = type;
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (type == TRX_UNDO_UPD_DEL_REC && !*updated_extern) {
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
return(false);
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
ptr = trx_undo_update_rec_get_sys_cols(ptr, &trx_id, &roll_ptr,
|
|
|
|
&info_bits);
|
|
|
|
node->table = NULL;
|
|
|
|
|
|
|
|
/* Prevent DROP TABLE etc. from running when we are doing the purge
|
|
|
|
for this row */
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
rw_lock_s_lock_inline(&dict_operation_lock, 0, __FILE__, __LINE__);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
node->table = dict_table_open_on_id(
|
|
|
|
table_id, FALSE, DICT_TABLE_OP_NORMAL);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
if (node->table == NULL) {
|
|
|
|
/* The table has been dropped: no need to do purge */
|
2013-12-16 15:38:05 +01:00
|
|
|
goto err_exit;
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
MDEV-12253: Buffer pool blocks are accessed after they have been freed
Problem was that bpage was referenced after it was already freed
from LRU. Fixed by adding a new variable encrypted that is
passed down to buf_page_check_corrupt() and used in
buf_page_get_gen() to stop processing page read.
This patch should also address following test failures and
bugs:
MDEV-12419: IMPORT should not look up tablespace in
PageConverter::validate(). This is now removed.
MDEV-10099: encryption.innodb_onlinealter_encryption fails
sporadically in buildbot
MDEV-11420: encryption.innodb_encryption-page-compression
failed in buildbot
MDEV-11222: encryption.encrypt_and_grep failed in buildbot on P8
Removed dict_table_t::is_encrypted and dict_table_t::ibd_file_missing
and replaced these with dict_table_t::file_unreadable. Table
ibd file is missing if fil_get_space(space_id) returns NULL
and encrypted if not. Removed dict_table_t::is_corrupted field.
Ported FilSpace class from 10.2 and using that on buf_page_check_corrupt(),
buf_page_decrypt_after_read(), buf_page_encrypt_before_write(),
buf_dblwr_process(), buf_read_page(), dict_stats_save_defrag_stats().
Added test cases when enrypted page could be read while doing
redo log crash recovery. Also added test case for row compressed
blobs.
btr_cur_open_at_index_side_func(),
btr_cur_open_at_rnd_pos_func(): Avoid referencing block that is
NULL.
buf_page_get_zip(): Issue error if page read fails.
buf_page_get_gen(): Use dberr_t for error detection and
do not reference bpage after we hare freed it.
buf_mark_space_corrupt(): remove bpage from LRU also when
it is encrypted.
buf_page_check_corrupt(): @return DB_SUCCESS if page has
been read and is not corrupted,
DB_PAGE_CORRUPTED if page based on checksum check is corrupted,
DB_DECRYPTION_FAILED if page post encryption checksum matches but
after decryption normal page checksum does not match. In read
case only DB_SUCCESS is possible.
buf_page_io_complete(): use dberr_t for error handling.
buf_flush_write_block_low(),
buf_read_ahead_random(),
buf_read_page_async(),
buf_read_ahead_linear(),
buf_read_ibuf_merge_pages(),
buf_read_recv_pages(),
fil_aio_wait():
Issue error if page read fails.
btr_pcur_move_to_next_page(): Do not reference page if it is
NULL.
Introduced dict_table_t::is_readable() and dict_index_t::is_readable()
that will return true if tablespace exists and pages read from
tablespace are not corrupted or page decryption failed.
Removed buf_page_t::key_version. After page decryption the
key version is not removed from page frame. For unencrypted
pages, old key_version is removed at buf_page_encrypt_before_write()
dict_stats_update_transient_for_index(),
dict_stats_update_transient()
Do not continue if table decryption failed or table
is corrupted.
dict0stats.cc: Introduced a dict_stats_report_error function
to avoid code duplication.
fil_parse_write_crypt_data():
Check that key read from redo log entry is found from
encryption plugin and if it is not, refuse to start.
PageConverter::validate(): Removed access to fil_space_t as
tablespace is not available during import.
Fixed error code on innodb.innodb test.
Merged test cased innodb-bad-key-change5 and innodb-bad-key-shutdown
to innodb-bad-key-change2. Removed innodb-bad-key-change5 test.
Decreased unnecessary complexity on some long lasting tests.
Removed fil_inc_pending_ops(), fil_decr_pending_ops(),
fil_get_first_space(), fil_get_next_space(),
fil_get_first_space_safe(), fil_get_next_space_safe()
functions.
fil_space_verify_crypt_checksum(): Fixed bug found using ASAN
where FIL_PAGE_END_LSN_OLD_CHECKSUM field was incorrectly
accessed from row compressed tables. Fixed out of page frame
bug for row compressed tables in
fil_space_verify_crypt_checksum() found using ASAN. Incorrect
function was called for compressed table.
Added new tests for discard, rename table and drop (we should allow them
even when page decryption fails). Alter table rename is not allowed.
Added test for restart with innodb-force-recovery=1 when page read on
redo-recovery cant be decrypted. Added test for corrupted table where
both page data and FIL_PAGE_FILE_FLUSH_LSN_OR_KEY_VERSION is corrupted.
Adjusted the test case innodb_bug14147491 so that it does not anymore
expect crash. Instead table is just mostly not usable.
fil0fil.h: fil_space_acquire_low is not visible function
and fil_space_acquire and fil_space_acquire_silent are
inline functions. FilSpace class uses fil_space_acquire_low
directly.
recv_apply_hashed_log_recs() does not return anything.
2017-04-26 14:19:16 +02:00
|
|
|
if (node->table->file_unreadable) {
|
2008-12-01 07:10:29 +01:00
|
|
|
/* We skip purge of missing .ibd files */
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
dict_table_close(node->table, FALSE, FALSE);
|
|
|
|
|
2008-12-01 07:10:29 +01:00
|
|
|
node->table = NULL;
|
|
|
|
|
|
|
|
goto err_exit;
|
|
|
|
}
|
|
|
|
|
|
|
|
clust_index = dict_table_get_first_index(node->table);
|
|
|
|
|
|
|
|
if (clust_index == NULL) {
|
2013-12-16 15:38:05 +01:00
|
|
|
/* The table was corrupt in the data dictionary.
|
|
|
|
dict_set_corrupted() works on an index, and
|
|
|
|
we do not have an index to call it with. */
|
|
|
|
close_exit:
|
|
|
|
dict_table_close(node->table, FALSE, FALSE);
|
|
|
|
err_exit:
|
|
|
|
rw_lock_s_unlock(&dict_operation_lock);
|
|
|
|
return(false);
|
|
|
|
}
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (type == TRX_UNDO_UPD_EXIST_REC
|
|
|
|
&& (node->cmpl_info & UPD_NODE_NO_ORD_CHANGE)
|
|
|
|
&& !*updated_extern) {
|
|
|
|
|
|
|
|
/* Purge requires no changes to indexes: we may return */
|
|
|
|
goto close_exit;
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
ptr = trx_undo_rec_get_row_ref(ptr, clust_index, &(node->ref),
|
|
|
|
node->heap);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
trx = thr_get_trx(thr);
|
|
|
|
|
2008-12-01 07:10:29 +01:00
|
|
|
ptr = trx_undo_update_rec_get_update(ptr, clust_index, type, trx_id,
|
|
|
|
roll_ptr, info_bits, trx,
|
|
|
|
node->heap, &(node->update));
|
|
|
|
|
|
|
|
/* Read to the partial row the fields that occur in indexes */
|
|
|
|
|
2011-12-14 14:58:22 +01:00
|
|
|
if (!(node->cmpl_info & UPD_NODE_NO_ORD_CHANGE)) {
|
2008-12-03 06:06:00 +01:00
|
|
|
ptr = trx_undo_rec_get_partial_row(
|
|
|
|
ptr, clust_index, &node->row,
|
|
|
|
type == TRX_UNDO_UPD_DEL_REC,
|
|
|
|
node->heap);
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
return(true);
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
/***********************************************************//**
|
|
|
|
Purges the parsed record.
|
|
|
|
@return true if purged, false if skipped */
|
2016-08-10 19:24:58 +02:00
|
|
|
static MY_ATTRIBUTE((nonnull, warn_unused_result))
|
2013-12-16 15:38:05 +01:00
|
|
|
bool
|
|
|
|
row_purge_record_func(
|
|
|
|
/*==================*/
|
|
|
|
purge_node_t* node, /*!< in: row purge node */
|
|
|
|
trx_undo_rec_t* undo_rec, /*!< in: record to purge */
|
|
|
|
#ifdef UNIV_DEBUG
|
|
|
|
const que_thr_t*thr, /*!< in: query thread */
|
|
|
|
#endif /* UNIV_DEBUG */
|
|
|
|
bool updated_extern) /*!< in: whether external columns
|
|
|
|
were updated */
|
|
|
|
{
|
|
|
|
dict_index_t* clust_index;
|
|
|
|
bool purged = true;
|
|
|
|
|
2015-10-09 17:20:49 +02:00
|
|
|
ut_ad(!node->found_clust);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
clust_index = dict_table_get_first_index(node->table);
|
|
|
|
|
|
|
|
node->index = dict_table_get_next_index(clust_index);
|
|
|
|
|
|
|
|
switch (node->rec_type) {
|
|
|
|
case TRX_UNDO_DEL_MARK_REC:
|
|
|
|
purged = row_purge_del_mark(node);
|
|
|
|
if (!purged) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
MONITOR_INC(MONITOR_N_DEL_ROW_PURGE);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
if (!updated_extern) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
/* fall through */
|
|
|
|
case TRX_UNDO_UPD_EXIST_REC:
|
|
|
|
row_purge_upd_exist_or_extern(thr, node, undo_rec);
|
|
|
|
MONITOR_INC(MONITOR_N_UPD_EXIST_EXTERN);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (node->found_clust) {
|
|
|
|
btr_pcur_close(&node->pcur);
|
|
|
|
node->found_clust = FALSE;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (node->table != NULL) {
|
|
|
|
dict_table_close(node->table, FALSE, FALSE);
|
|
|
|
node->table = NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
return(purged);
|
|
|
|
}
|
|
|
|
|
|
|
|
#ifdef UNIV_DEBUG
|
|
|
|
# define row_purge_record(node,undo_rec,thr,updated_extern) \
|
|
|
|
row_purge_record_func(node,undo_rec,thr,updated_extern)
|
|
|
|
#else /* UNIV_DEBUG */
|
|
|
|
# define row_purge_record(node,undo_rec,thr,updated_extern) \
|
|
|
|
row_purge_record_func(node,undo_rec,updated_extern)
|
|
|
|
#endif /* UNIV_DEBUG */
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***********************************************************//**
|
2008-12-01 07:10:29 +01:00
|
|
|
Fetches an undo log record and does the purge for the recorded operation.
|
|
|
|
If none left, or the current purge completed, returns the control to the
|
2011-04-29 14:49:04 +02:00
|
|
|
parent node, which is always a query thread node. */
|
2017-03-04 19:49:14 +01:00
|
|
|
static
|
2011-04-29 14:49:04 +02:00
|
|
|
void
|
2008-12-01 07:10:29 +01:00
|
|
|
row_purge(
|
|
|
|
/*======*/
|
2013-12-16 15:38:05 +01:00
|
|
|
purge_node_t* node, /*!< in: row purge node */
|
|
|
|
trx_undo_rec_t* undo_rec, /*!< in: record to purge */
|
|
|
|
que_thr_t* thr) /*!< in: query thread */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
2013-12-16 15:38:05 +01:00
|
|
|
if (undo_rec != &trx_purge_dummy_rec) {
|
|
|
|
bool updated_extern;
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
while (row_purge_parse_undo_rec(
|
|
|
|
node, undo_rec, &updated_extern, thr)) {
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
bool purged = row_purge_record(
|
|
|
|
node, undo_rec, thr, updated_extern);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
rw_lock_s_unlock(&dict_operation_lock);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (purged
|
|
|
|
|| srv_shutdown_state != SRV_SHUTDOWN_NONE) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Retry the purge in a second. */
|
|
|
|
os_thread_sleep(1000000);
|
|
|
|
}
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
2013-12-16 15:38:05 +01:00
|
|
|
}
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
/***********************************************************//**
|
|
|
|
Reset the purge query thread. */
|
|
|
|
UNIV_INLINE
|
|
|
|
void
|
|
|
|
row_purge_end(
|
|
|
|
/*==========*/
|
|
|
|
que_thr_t* thr) /*!< in: query thread */
|
|
|
|
{
|
|
|
|
purge_node_t* node;
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
ut_ad(thr);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
node = static_cast<purge_node_t*>(thr->run_node);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
ut_ad(que_node_get_type(node) == QUE_NODE_PURGE);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
thr->run_node = que_node_get_parent(node);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
node->undo_recs = NULL;
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
node->done = TRUE;
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
ut_a(thr->run_node != NULL);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
mem_heap_empty(node->heap);
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***********************************************************//**
|
2008-12-01 07:10:29 +01:00
|
|
|
Does the purge operation for a single undo log record. This is a high-level
|
2009-09-07 12:22:53 +02:00
|
|
|
function used in an SQL execution graph.
|
|
|
|
@return query thread to run next or NULL */
|
2008-12-01 07:10:29 +01:00
|
|
|
UNIV_INTERN
|
|
|
|
que_thr_t*
|
|
|
|
row_purge_step(
|
|
|
|
/*===========*/
|
2009-09-07 12:22:53 +02:00
|
|
|
que_thr_t* thr) /*!< in: query thread */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
|
|
|
purge_node_t* node;
|
|
|
|
|
|
|
|
ut_ad(thr);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
node = static_cast<purge_node_t*>(thr->run_node);
|
|
|
|
|
|
|
|
node->table = NULL;
|
|
|
|
node->row = NULL;
|
|
|
|
node->ref = NULL;
|
|
|
|
node->index = NULL;
|
|
|
|
node->update = NULL;
|
|
|
|
node->found_clust = FALSE;
|
|
|
|
node->rec_type = ULINT_UNDEFINED;
|
|
|
|
node->cmpl_info = ULINT_UNDEFINED;
|
|
|
|
|
|
|
|
ut_a(!node->done);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
ut_ad(que_node_get_type(node) == QUE_NODE_PURGE);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (!(node->undo_recs == NULL || ib_vector_is_empty(node->undo_recs))) {
|
|
|
|
trx_purge_rec_t*purge_rec;
|
|
|
|
|
|
|
|
purge_rec = static_cast<trx_purge_rec_t*>(
|
|
|
|
ib_vector_pop(node->undo_recs));
|
|
|
|
|
|
|
|
node->roll_ptr = purge_rec->roll_ptr;
|
|
|
|
|
|
|
|
row_purge(node, purge_rec->undo_rec, thr);
|
|
|
|
|
|
|
|
if (ib_vector_is_empty(node->undo_recs)) {
|
|
|
|
row_purge_end(thr);
|
|
|
|
} else {
|
|
|
|
thr->run_node = node;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
row_purge_end(thr);
|
|
|
|
}
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
return(thr);
|
|
|
|
}
|
2015-10-09 17:20:49 +02:00
|
|
|
|
|
|
|
#ifdef UNIV_DEBUG
|
|
|
|
/***********************************************************//**
|
|
|
|
Validate the persisent cursor. The purge node has two references
|
|
|
|
to the clustered index record - one via the ref member, and the
|
|
|
|
other via the persistent cursor. These two references must match
|
|
|
|
each other if the found_clust flag is set.
|
|
|
|
@return true if the stored copy of persistent cursor is consistent
|
|
|
|
with the ref member.*/
|
|
|
|
bool
|
|
|
|
purge_node_t::validate_pcur()
|
|
|
|
{
|
|
|
|
if (!found_clust) {
|
|
|
|
return(true);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (index == NULL) {
|
|
|
|
return(true);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (index->type == DICT_FTS) {
|
|
|
|
return(true);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (pcur.old_stored != BTR_PCUR_OLD_STORED) {
|
|
|
|
return(true);
|
|
|
|
}
|
|
|
|
|
|
|
|
dict_index_t* clust_index = pcur.btr_cur.index;
|
|
|
|
|
|
|
|
ulint* offsets = rec_get_offsets(
|
|
|
|
pcur.old_rec, clust_index, NULL, pcur.old_n_fields, &heap);
|
|
|
|
|
|
|
|
/* Here we are comparing the purge ref record and the stored initial
|
|
|
|
part in persistent cursor. Both cases we store n_uniq fields of the
|
|
|
|
cluster index and so it is fine to do the comparison. We note this
|
|
|
|
dependency here as pcur and ref belong to different modules. */
|
|
|
|
int st = cmp_dtuple_rec(ref, pcur.old_rec, offsets);
|
|
|
|
|
|
|
|
if (st != 0) {
|
|
|
|
fprintf(stderr, "Purge node pcur validation failed\n");
|
|
|
|
dtuple_print(stderr, ref);
|
|
|
|
rec_print(stderr, pcur.old_rec, clust_index);
|
|
|
|
return(false);
|
|
|
|
}
|
|
|
|
|
|
|
|
return(true);
|
|
|
|
}
|
|
|
|
#endif /* UNIV_DEBUG */
|