2009-03-26 07:11:11 +01:00
|
|
|
/*****************************************************************************
|
|
|
|
|
2016-08-10 19:24:58 +02:00
|
|
|
Copyright (c) 1997, 2016, Oracle and/or its affiliates. All Rights Reserved.
|
2017-08-24 14:38:05 +02:00
|
|
|
Copyright (c) 2017, MariaDB Corporation.
|
2009-03-26 07:11:11 +01:00
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify it under
|
|
|
|
the terms of the GNU General Public License as published by the Free Software
|
|
|
|
Foundation; version 2 of the License.
|
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful, but WITHOUT
|
|
|
|
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
|
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License along with
|
2013-12-16 15:38:05 +01:00
|
|
|
this program; if not, write to the Free Software Foundation, Inc.,
|
2019-05-11 18:25:02 +02:00
|
|
|
51 Franklin Street, Fifth Floor, Boston, MA 02110-1335 USA
|
2009-03-26 07:11:11 +01:00
|
|
|
|
|
|
|
*****************************************************************************/
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/**************************************************//**
|
2013-12-16 15:38:05 +01:00
|
|
|
@file row/row0uins.cc
|
2008-12-01 07:10:29 +01:00
|
|
|
Fresh insert undo
|
|
|
|
|
|
|
|
Created 2/25/1997 Heikki Tuuri
|
|
|
|
*******************************************************/
|
|
|
|
|
|
|
|
#include "row0uins.h"
|
|
|
|
|
|
|
|
#ifdef UNIV_NONINL
|
|
|
|
#include "row0uins.ic"
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include "dict0dict.h"
|
|
|
|
#include "dict0boot.h"
|
|
|
|
#include "dict0crea.h"
|
|
|
|
#include "trx0undo.h"
|
|
|
|
#include "trx0roll.h"
|
|
|
|
#include "btr0btr.h"
|
|
|
|
#include "mach0data.h"
|
|
|
|
#include "row0undo.h"
|
|
|
|
#include "row0vers.h"
|
2013-12-16 15:38:05 +01:00
|
|
|
#include "row0log.h"
|
2008-12-01 07:10:29 +01:00
|
|
|
#include "trx0trx.h"
|
|
|
|
#include "trx0rec.h"
|
|
|
|
#include "row0row.h"
|
|
|
|
#include "row0upd.h"
|
|
|
|
#include "que0que.h"
|
|
|
|
#include "ibuf0ibuf.h"
|
|
|
|
#include "log0log.h"
|
|
|
|
|
2010-09-03 17:41:57 +02:00
|
|
|
/*************************************************************************
|
|
|
|
IMPORTANT NOTE: Any operation that generates redo MUST check that there
|
|
|
|
is enough space in the redo log before for that operation. This is
|
|
|
|
done by calling log_free_check(). The reason for checking the
|
|
|
|
availability of the redo log space before the start of the operation is
|
|
|
|
that we MUST not hold any synchonization objects when performing the
|
|
|
|
check.
|
|
|
|
If you make a change in this module make sure that no codepath is
|
|
|
|
introduced where a call to log_free_check() is bypassed. */
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***************************************************************//**
|
2008-12-01 07:10:29 +01:00
|
|
|
Removes a clustered index record. The pcur in node was positioned on the
|
2009-09-07 12:22:53 +02:00
|
|
|
record, now it is detached.
|
|
|
|
@return DB_SUCCESS or DB_OUT_OF_FILE_SPACE */
|
2016-08-10 19:24:58 +02:00
|
|
|
static MY_ATTRIBUTE((nonnull, warn_unused_result))
|
2013-12-16 15:38:05 +01:00
|
|
|
dberr_t
|
2008-12-01 07:10:29 +01:00
|
|
|
row_undo_ins_remove_clust_rec(
|
|
|
|
/*==========================*/
|
2009-09-07 12:22:53 +02:00
|
|
|
undo_node_t* node) /*!< in: undo node */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
|
|
|
btr_cur_t* btr_cur;
|
|
|
|
ibool success;
|
2013-12-16 15:38:05 +01:00
|
|
|
dberr_t err;
|
|
|
|
ulint n_tries = 0;
|
2008-12-01 07:10:29 +01:00
|
|
|
mtr_t mtr;
|
2013-12-16 15:38:05 +01:00
|
|
|
dict_index_t* index = node->pcur.btr_cur.index;
|
|
|
|
bool online;
|
|
|
|
|
|
|
|
ut_ad(dict_index_is_clust(index));
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
mtr_start(&mtr);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
/* This is similar to row_undo_mod_clust(). The DDL thread may
|
|
|
|
already have copied this row from the log to the new table.
|
|
|
|
We must log the removal, so that the row will be correctly
|
|
|
|
purged. However, we can log the removal out of sync with the
|
|
|
|
B-tree modification. */
|
|
|
|
|
|
|
|
online = dict_index_is_online_ddl(index);
|
|
|
|
if (online) {
|
|
|
|
ut_ad(node->trx->dict_operation_lock_mode
|
|
|
|
!= RW_X_LATCH);
|
|
|
|
ut_ad(node->table->id != DICT_INDEXES_ID);
|
|
|
|
mtr_s_lock(dict_index_get_lock(index), &mtr);
|
|
|
|
}
|
|
|
|
|
|
|
|
success = btr_pcur_restore_position(
|
|
|
|
online
|
|
|
|
? BTR_MODIFY_LEAF | BTR_ALREADY_S_LATCHED
|
|
|
|
: BTR_MODIFY_LEAF, &node->pcur, &mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
ut_a(success);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
btr_cur = btr_pcur_get_btr_cur(&node->pcur);
|
|
|
|
|
|
|
|
ut_ad(rec_get_trx_id(btr_cur_get_rec(btr_cur), btr_cur->index)
|
|
|
|
== node->trx->id);
|
|
|
|
|
|
|
|
if (online && dict_index_is_online_ddl(index)) {
|
|
|
|
const rec_t* rec = btr_cur_get_rec(btr_cur);
|
|
|
|
mem_heap_t* heap = NULL;
|
|
|
|
const ulint* offsets = rec_get_offsets(
|
|
|
|
rec, index, NULL, ULINT_UNDEFINED, &heap);
|
2014-05-06 21:18:00 +02:00
|
|
|
row_log_table_delete(rec, index, offsets, NULL);
|
2013-12-16 15:38:05 +01:00
|
|
|
mem_heap_free(heap);
|
|
|
|
}
|
|
|
|
|
2011-07-14 21:22:41 +02:00
|
|
|
if (node->table->id == DICT_INDEXES_ID) {
|
2013-12-16 15:38:05 +01:00
|
|
|
ut_ad(!online);
|
2008-12-01 07:10:29 +01:00
|
|
|
ut_ad(node->trx->dict_operation_lock_mode == RW_X_LATCH);
|
|
|
|
|
|
|
|
/* Drop the index tree associated with the row in
|
|
|
|
SYS_INDEXES table: */
|
|
|
|
|
|
|
|
dict_drop_index_tree(btr_pcur_get_rec(&(node->pcur)), &mtr);
|
|
|
|
|
|
|
|
mtr_commit(&mtr);
|
|
|
|
|
|
|
|
mtr_start(&mtr);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
success = btr_pcur_restore_position(
|
|
|
|
BTR_MODIFY_LEAF, &node->pcur, &mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
ut_a(success);
|
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (btr_cur_optimistic_delete(btr_cur, 0, &mtr)) {
|
|
|
|
err = DB_SUCCESS;
|
|
|
|
goto func_exit;
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
2013-12-16 15:38:05 +01:00
|
|
|
|
|
|
|
btr_pcur_commit_specify_mtr(&node->pcur, &mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
retry:
|
|
|
|
/* If did not succeed, try pessimistic descent to tree */
|
|
|
|
mtr_start(&mtr);
|
|
|
|
|
|
|
|
success = btr_pcur_restore_position(BTR_MODIFY_TREE,
|
|
|
|
&(node->pcur), &mtr);
|
|
|
|
ut_a(success);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
btr_cur_pessimistic_delete(&err, FALSE, btr_cur, 0,
|
2008-12-03 06:06:00 +01:00
|
|
|
trx_is_recv(node->trx)
|
|
|
|
? RB_RECOVERY
|
|
|
|
: RB_NORMAL, &mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
/* The delete operation may fail if we have little
|
|
|
|
file space left: TODO: easiest to crash the database
|
|
|
|
and restart with more file space */
|
|
|
|
|
|
|
|
if (err == DB_OUT_OF_FILE_SPACE
|
|
|
|
&& n_tries < BTR_CUR_RETRY_DELETE_N_TIMES) {
|
|
|
|
|
|
|
|
btr_pcur_commit_specify_mtr(&(node->pcur), &mtr);
|
|
|
|
|
|
|
|
n_tries++;
|
|
|
|
|
|
|
|
os_thread_sleep(BTR_CUR_RETRY_SLEEP_TIME);
|
|
|
|
|
|
|
|
goto retry;
|
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
func_exit:
|
|
|
|
btr_pcur_commit_specify_mtr(&node->pcur, &mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
trx_undo_rec_release(node->trx, node->undo_no);
|
|
|
|
|
|
|
|
return(err);
|
|
|
|
}
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***************************************************************//**
|
|
|
|
Removes a secondary index entry if found.
|
|
|
|
@return DB_SUCCESS, DB_FAIL, or DB_OUT_OF_FILE_SPACE */
|
2016-08-10 19:24:58 +02:00
|
|
|
static MY_ATTRIBUTE((nonnull, warn_unused_result))
|
2013-12-16 15:38:05 +01:00
|
|
|
dberr_t
|
2008-12-01 07:10:29 +01:00
|
|
|
row_undo_ins_remove_sec_low(
|
|
|
|
/*========================*/
|
2009-09-07 12:22:53 +02:00
|
|
|
ulint mode, /*!< in: BTR_MODIFY_LEAF or BTR_MODIFY_TREE,
|
2008-12-01 07:10:29 +01:00
|
|
|
depending on whether we wish optimistic or
|
|
|
|
pessimistic descent down the index tree */
|
2009-09-07 12:22:53 +02:00
|
|
|
dict_index_t* index, /*!< in: index */
|
|
|
|
dtuple_t* entry) /*!< in: index entry to remove */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
2011-07-14 21:22:41 +02:00
|
|
|
btr_pcur_t pcur;
|
|
|
|
btr_cur_t* btr_cur;
|
2013-12-16 15:38:05 +01:00
|
|
|
dberr_t err = DB_SUCCESS;
|
2011-07-14 21:22:41 +02:00
|
|
|
mtr_t mtr;
|
|
|
|
enum row_search_result search_result;
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
log_free_check();
|
|
|
|
|
2008-12-01 07:10:29 +01:00
|
|
|
mtr_start(&mtr);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (mode == BTR_MODIFY_LEAF) {
|
|
|
|
mode = BTR_MODIFY_LEAF | BTR_ALREADY_S_LATCHED;
|
|
|
|
mtr_s_lock(dict_index_get_lock(index), &mtr);
|
|
|
|
} else {
|
|
|
|
ut_ad(mode == BTR_MODIFY_TREE);
|
2017-08-24 14:38:05 +02:00
|
|
|
if (index->space == IBUF_SPACE_ID
|
|
|
|
&& !dict_index_is_unique(index)) {
|
|
|
|
ibuf_free_excess_pages();
|
|
|
|
}
|
2013-12-16 15:38:05 +01:00
|
|
|
mtr_x_lock(dict_index_get_lock(index), &mtr);
|
|
|
|
}
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (row_log_online_op_try(index, entry, 0)) {
|
|
|
|
goto func_exit_no_pcur;
|
|
|
|
}
|
2011-07-14 21:22:41 +02:00
|
|
|
|
|
|
|
search_result = row_search_index_entry(index, entry, mode,
|
|
|
|
&pcur, &mtr);
|
|
|
|
|
|
|
|
switch (search_result) {
|
|
|
|
case ROW_NOT_FOUND:
|
|
|
|
goto func_exit;
|
|
|
|
case ROW_FOUND:
|
|
|
|
break;
|
|
|
|
case ROW_BUFFERED:
|
|
|
|
case ROW_NOT_DELETED_REF:
|
|
|
|
/* These are invalid outcomes, because the mode passed
|
|
|
|
to row_search_index_entry() did not include any of the
|
|
|
|
flags BTR_INSERT, BTR_DELETE, or BTR_DELETE_MARK. */
|
|
|
|
ut_error;
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
btr_cur = btr_pcur_get_btr_cur(&pcur);
|
|
|
|
|
|
|
|
if (mode != BTR_MODIFY_TREE) {
|
|
|
|
err = btr_cur_optimistic_delete(btr_cur, 0, &mtr)
|
2011-07-14 21:22:41 +02:00
|
|
|
? DB_SUCCESS : DB_FAIL;
|
2008-12-01 07:10:29 +01:00
|
|
|
} else {
|
2008-12-03 06:06:00 +01:00
|
|
|
/* No need to distinguish RB_RECOVERY here, because we
|
|
|
|
are deleting a secondary index record: the distinction
|
|
|
|
between RB_NORMAL and RB_RECOVERY only matters when
|
|
|
|
deleting a record that contains externally stored
|
|
|
|
columns. */
|
|
|
|
ut_ad(!dict_index_is_clust(index));
|
2013-12-16 15:38:05 +01:00
|
|
|
btr_cur_pessimistic_delete(&err, FALSE, btr_cur, 0,
|
2008-12-03 06:06:00 +01:00
|
|
|
RB_NORMAL, &mtr);
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
2011-07-14 21:22:41 +02:00
|
|
|
func_exit:
|
2008-12-01 07:10:29 +01:00
|
|
|
btr_pcur_close(&pcur);
|
2013-12-16 15:38:05 +01:00
|
|
|
func_exit_no_pcur:
|
2008-12-01 07:10:29 +01:00
|
|
|
mtr_commit(&mtr);
|
|
|
|
|
|
|
|
return(err);
|
|
|
|
}
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***************************************************************//**
|
2008-12-01 07:10:29 +01:00
|
|
|
Removes a secondary index entry from the index if found. Tries first
|
2009-09-07 12:22:53 +02:00
|
|
|
optimistic, then pessimistic descent down the tree.
|
|
|
|
@return DB_SUCCESS or DB_OUT_OF_FILE_SPACE */
|
2016-08-10 19:24:58 +02:00
|
|
|
static MY_ATTRIBUTE((nonnull, warn_unused_result))
|
2013-12-16 15:38:05 +01:00
|
|
|
dberr_t
|
2008-12-01 07:10:29 +01:00
|
|
|
row_undo_ins_remove_sec(
|
|
|
|
/*====================*/
|
2009-09-07 12:22:53 +02:00
|
|
|
dict_index_t* index, /*!< in: index */
|
|
|
|
dtuple_t* entry) /*!< in: index entry to insert */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
2013-12-16 15:38:05 +01:00
|
|
|
dberr_t err;
|
2008-12-01 07:10:29 +01:00
|
|
|
ulint n_tries = 0;
|
|
|
|
|
|
|
|
/* Try first optimistic descent to the B-tree */
|
|
|
|
|
|
|
|
err = row_undo_ins_remove_sec_low(BTR_MODIFY_LEAF, index, entry);
|
|
|
|
|
|
|
|
if (err == DB_SUCCESS) {
|
|
|
|
|
|
|
|
return(err);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Try then pessimistic descent to the B-tree */
|
|
|
|
retry:
|
|
|
|
err = row_undo_ins_remove_sec_low(BTR_MODIFY_TREE, index, entry);
|
|
|
|
|
|
|
|
/* The delete operation may fail if we have little
|
|
|
|
file space left: TODO: easiest to crash the database
|
|
|
|
and restart with more file space */
|
|
|
|
|
|
|
|
if (err != DB_SUCCESS && n_tries < BTR_CUR_RETRY_DELETE_N_TIMES) {
|
|
|
|
|
|
|
|
n_tries++;
|
|
|
|
|
|
|
|
os_thread_sleep(BTR_CUR_RETRY_SLEEP_TIME);
|
|
|
|
|
|
|
|
goto retry;
|
|
|
|
}
|
|
|
|
|
|
|
|
return(err);
|
|
|
|
}
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***********************************************************//**
|
2008-12-01 07:10:29 +01:00
|
|
|
Parses the row reference and other info in a fresh insert undo record. */
|
|
|
|
static
|
|
|
|
void
|
|
|
|
row_undo_ins_parse_undo_rec(
|
|
|
|
/*========================*/
|
2013-12-16 15:38:05 +01:00
|
|
|
undo_node_t* node, /*!< in/out: row undo node */
|
|
|
|
ibool dict_locked) /*!< in: TRUE if own dict_sys->mutex */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
|
|
|
dict_index_t* clust_index;
|
|
|
|
byte* ptr;
|
2009-09-07 12:22:53 +02:00
|
|
|
undo_no_t undo_no;
|
2011-07-14 21:22:41 +02:00
|
|
|
table_id_t table_id;
|
2008-12-01 07:10:29 +01:00
|
|
|
ulint type;
|
|
|
|
ulint dummy;
|
2013-12-16 15:38:05 +01:00
|
|
|
bool dummy_extern;
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
ut_ad(node);
|
|
|
|
|
|
|
|
ptr = trx_undo_rec_get_pars(node->undo_rec, &type, &dummy,
|
|
|
|
&dummy_extern, &undo_no, &table_id);
|
|
|
|
ut_ad(type == TRX_UNDO_INSERT_REC);
|
|
|
|
node->rec_type = type;
|
|
|
|
|
|
|
|
node->update = NULL;
|
2013-12-16 15:38:05 +01:00
|
|
|
node->table = dict_table_open_on_id(
|
|
|
|
table_id, dict_locked, DICT_TABLE_OP_NORMAL);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
|
|
|
/* Skip the UNDO if we can't find the table or the .ibd file. */
|
|
|
|
if (UNIV_UNLIKELY(node->table == NULL)) {
|
MDEV-12253: Buffer pool blocks are accessed after they have been freed
Problem was that bpage was referenced after it was already freed
from LRU. Fixed by adding a new variable encrypted that is
passed down to buf_page_check_corrupt() and used in
buf_page_get_gen() to stop processing page read.
This patch should also address following test failures and
bugs:
MDEV-12419: IMPORT should not look up tablespace in
PageConverter::validate(). This is now removed.
MDEV-10099: encryption.innodb_onlinealter_encryption fails
sporadically in buildbot
MDEV-11420: encryption.innodb_encryption-page-compression
failed in buildbot
MDEV-11222: encryption.encrypt_and_grep failed in buildbot on P8
Removed dict_table_t::is_encrypted and dict_table_t::ibd_file_missing
and replaced these with dict_table_t::file_unreadable. Table
ibd file is missing if fil_get_space(space_id) returns NULL
and encrypted if not. Removed dict_table_t::is_corrupted field.
Ported FilSpace class from 10.2 and using that on buf_page_check_corrupt(),
buf_page_decrypt_after_read(), buf_page_encrypt_before_write(),
buf_dblwr_process(), buf_read_page(), dict_stats_save_defrag_stats().
Added test cases when enrypted page could be read while doing
redo log crash recovery. Also added test case for row compressed
blobs.
btr_cur_open_at_index_side_func(),
btr_cur_open_at_rnd_pos_func(): Avoid referencing block that is
NULL.
buf_page_get_zip(): Issue error if page read fails.
buf_page_get_gen(): Use dberr_t for error detection and
do not reference bpage after we hare freed it.
buf_mark_space_corrupt(): remove bpage from LRU also when
it is encrypted.
buf_page_check_corrupt(): @return DB_SUCCESS if page has
been read and is not corrupted,
DB_PAGE_CORRUPTED if page based on checksum check is corrupted,
DB_DECRYPTION_FAILED if page post encryption checksum matches but
after decryption normal page checksum does not match. In read
case only DB_SUCCESS is possible.
buf_page_io_complete(): use dberr_t for error handling.
buf_flush_write_block_low(),
buf_read_ahead_random(),
buf_read_page_async(),
buf_read_ahead_linear(),
buf_read_ibuf_merge_pages(),
buf_read_recv_pages(),
fil_aio_wait():
Issue error if page read fails.
btr_pcur_move_to_next_page(): Do not reference page if it is
NULL.
Introduced dict_table_t::is_readable() and dict_index_t::is_readable()
that will return true if tablespace exists and pages read from
tablespace are not corrupted or page decryption failed.
Removed buf_page_t::key_version. After page decryption the
key version is not removed from page frame. For unencrypted
pages, old key_version is removed at buf_page_encrypt_before_write()
dict_stats_update_transient_for_index(),
dict_stats_update_transient()
Do not continue if table decryption failed or table
is corrupted.
dict0stats.cc: Introduced a dict_stats_report_error function
to avoid code duplication.
fil_parse_write_crypt_data():
Check that key read from redo log entry is found from
encryption plugin and if it is not, refuse to start.
PageConverter::validate(): Removed access to fil_space_t as
tablespace is not available during import.
Fixed error code on innodb.innodb test.
Merged test cased innodb-bad-key-change5 and innodb-bad-key-shutdown
to innodb-bad-key-change2. Removed innodb-bad-key-change5 test.
Decreased unnecessary complexity on some long lasting tests.
Removed fil_inc_pending_ops(), fil_decr_pending_ops(),
fil_get_first_space(), fil_get_next_space(),
fil_get_first_space_safe(), fil_get_next_space_safe()
functions.
fil_space_verify_crypt_checksum(): Fixed bug found using ASAN
where FIL_PAGE_END_LSN_OLD_CHECKSUM field was incorrectly
accessed from row compressed tables. Fixed out of page frame
bug for row compressed tables in
fil_space_verify_crypt_checksum() found using ASAN. Incorrect
function was called for compressed table.
Added new tests for discard, rename table and drop (we should allow them
even when page decryption fails). Alter table rename is not allowed.
Added test for restart with innodb-force-recovery=1 when page read on
redo-recovery cant be decrypted. Added test for corrupted table where
both page data and FIL_PAGE_FILE_FLUSH_LSN_OR_KEY_VERSION is corrupted.
Adjusted the test case innodb_bug14147491 so that it does not anymore
expect crash. Instead table is just mostly not usable.
fil0fil.h: fil_space_acquire_low is not visible function
and fil_space_acquire and fil_space_acquire_silent are
inline functions. FilSpace class uses fil_space_acquire_low
directly.
recv_apply_hashed_log_recs() does not return anything.
2017-04-26 14:19:16 +02:00
|
|
|
} else if (UNIV_UNLIKELY(node->table->file_unreadable)) {
|
2013-12-16 15:38:05 +01:00
|
|
|
close_table:
|
|
|
|
dict_table_close(node->table, dict_locked, FALSE);
|
2008-12-01 07:10:29 +01:00
|
|
|
node->table = NULL;
|
|
|
|
} else {
|
|
|
|
clust_index = dict_table_get_first_index(node->table);
|
|
|
|
|
2008-12-03 06:06:00 +01:00
|
|
|
if (clust_index != NULL) {
|
2013-12-16 15:38:05 +01:00
|
|
|
trx_undo_rec_get_row_ref(
|
2008-12-03 06:06:00 +01:00
|
|
|
ptr, clust_index, &node->ref, node->heap);
|
2013-12-16 15:38:05 +01:00
|
|
|
|
|
|
|
if (!row_undo_search_clust_to_pcur(node)) {
|
|
|
|
goto close_table;
|
|
|
|
}
|
|
|
|
|
2008-12-03 06:06:00 +01:00
|
|
|
} else {
|
|
|
|
ut_print_timestamp(stderr);
|
|
|
|
fprintf(stderr, " InnoDB: table ");
|
|
|
|
ut_print_name(stderr, node->trx, TRUE,
|
|
|
|
node->table->name);
|
|
|
|
fprintf(stderr, " has no indexes, "
|
|
|
|
"ignoring the table\n");
|
2013-12-16 15:38:05 +01:00
|
|
|
goto close_table;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/***************************************************************//**
|
|
|
|
Removes secondary index records.
|
|
|
|
@return DB_SUCCESS or DB_OUT_OF_FILE_SPACE */
|
2016-08-10 19:24:58 +02:00
|
|
|
static MY_ATTRIBUTE((nonnull, warn_unused_result))
|
2013-12-16 15:38:05 +01:00
|
|
|
dberr_t
|
|
|
|
row_undo_ins_remove_sec_rec(
|
|
|
|
/*========================*/
|
|
|
|
undo_node_t* node) /*!< in/out: row undo node */
|
|
|
|
{
|
|
|
|
dberr_t err = DB_SUCCESS;
|
|
|
|
dict_index_t* index = node->index;
|
|
|
|
mem_heap_t* heap;
|
2008-12-03 06:06:00 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
heap = mem_heap_create(1024);
|
|
|
|
|
|
|
|
while (index != NULL) {
|
|
|
|
dtuple_t* entry;
|
|
|
|
|
|
|
|
if (index->type & DICT_FTS) {
|
|
|
|
dict_table_next_uncorrupted_index(index);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* An insert undo record TRX_UNDO_INSERT_REC will
|
|
|
|
always contain all fields of the index. It does not
|
|
|
|
matter if any indexes were created afterwards; all
|
|
|
|
index entries can be reconstructed from the row. */
|
|
|
|
entry = row_build_index_entry(
|
|
|
|
node->row, node->ext, index, heap);
|
|
|
|
if (UNIV_UNLIKELY(!entry)) {
|
|
|
|
/* The database must have crashed after
|
|
|
|
inserting a clustered index record but before
|
|
|
|
writing all the externally stored columns of
|
|
|
|
that record, or a statement is being rolled
|
|
|
|
back because an error occurred while storing
|
|
|
|
off-page columns.
|
|
|
|
|
|
|
|
Because secondary index entries are inserted
|
|
|
|
after the clustered index record, we may
|
|
|
|
assume that the secondary index record does
|
|
|
|
not exist. */
|
|
|
|
} else {
|
|
|
|
err = row_undo_ins_remove_sec(index, entry);
|
|
|
|
|
|
|
|
if (UNIV_UNLIKELY(err != DB_SUCCESS)) {
|
|
|
|
goto func_exit;
|
|
|
|
}
|
2008-12-03 06:06:00 +01:00
|
|
|
}
|
2013-12-16 15:38:05 +01:00
|
|
|
|
|
|
|
mem_heap_empty(heap);
|
|
|
|
dict_table_next_uncorrupted_index(index);
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
2013-12-16 15:38:05 +01:00
|
|
|
|
|
|
|
func_exit:
|
|
|
|
node->index = index;
|
|
|
|
mem_heap_free(heap);
|
|
|
|
return(err);
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2009-09-07 12:22:53 +02:00
|
|
|
/***********************************************************//**
|
2008-12-01 07:10:29 +01:00
|
|
|
Undoes a fresh insert of a row to a table. A fresh insert means that
|
|
|
|
the same clustered index unique key did not have any record, even delete
|
2009-03-26 07:11:11 +01:00
|
|
|
marked, at the time of the insert. InnoDB is eager in a rollback:
|
|
|
|
if it figures out that an index record will be removed in the purge
|
2009-09-07 12:22:53 +02:00
|
|
|
anyway, it will remove it in the rollback.
|
|
|
|
@return DB_SUCCESS or DB_OUT_OF_FILE_SPACE */
|
2008-12-01 07:10:29 +01:00
|
|
|
UNIV_INTERN
|
2013-12-16 15:38:05 +01:00
|
|
|
dberr_t
|
2008-12-01 07:10:29 +01:00
|
|
|
row_undo_ins(
|
|
|
|
/*=========*/
|
2009-09-07 12:22:53 +02:00
|
|
|
undo_node_t* node) /*!< in: row undo node */
|
2008-12-01 07:10:29 +01:00
|
|
|
{
|
2013-12-16 15:38:05 +01:00
|
|
|
dberr_t err;
|
|
|
|
ibool dict_locked;
|
|
|
|
|
2008-12-01 07:10:29 +01:00
|
|
|
ut_ad(node->state == UNDO_NODE_INSERT);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
dict_locked = node->trx->dict_operation_lock_mode == RW_X_LATCH;
|
|
|
|
|
|
|
|
row_undo_ins_parse_undo_rec(node, dict_locked);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (node->table == NULL) {
|
2008-12-01 07:10:29 +01:00
|
|
|
trx_undo_rec_release(node->trx, node->undo_no);
|
|
|
|
|
|
|
|
return(DB_SUCCESS);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Iterate over all the indexes and undo the insert.*/
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
node->index = dict_table_get_first_index(node->table);
|
|
|
|
ut_ad(dict_index_is_clust(node->index));
|
2008-12-01 07:10:29 +01:00
|
|
|
/* Skip the clustered index (the first index) */
|
2013-12-16 15:38:05 +01:00
|
|
|
node->index = dict_table_get_next_index(node->index);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2011-12-14 14:58:22 +01:00
|
|
|
dict_table_skip_corrupt_index(node->index);
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
err = row_undo_ins_remove_sec_rec(node);
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (err == DB_SUCCESS) {
|
2013-11-07 21:44:46 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
log_free_check();
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (node->table->id == DICT_INDEXES_ID) {
|
2008-12-01 07:10:29 +01:00
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
if (!dict_locked) {
|
|
|
|
mutex_enter(&dict_sys->mutex);
|
2008-12-03 06:06:00 +01:00
|
|
|
}
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
// FIXME: We need to update the dict_index_t::space and
|
|
|
|
// page number fields too.
|
|
|
|
err = row_undo_ins_remove_clust_rec(node);
|
|
|
|
|
|
|
|
if (node->table->id == DICT_INDEXES_ID
|
|
|
|
&& !dict_locked) {
|
|
|
|
|
|
|
|
mutex_exit(&dict_sys->mutex);
|
|
|
|
}
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|
|
|
|
|
2013-12-16 15:38:05 +01:00
|
|
|
dict_table_close(node->table, dict_locked, FALSE);
|
|
|
|
|
|
|
|
node->table = NULL;
|
|
|
|
|
|
|
|
return(err);
|
2008-12-01 07:10:29 +01:00
|
|
|
}
|