/*****************************************************************************

Copyright (c) 2012, 2016, Oracle and/or its affiliates. All Rights Reserved.
Copyright (c) 2015, 2019, MariaDB Corporation.

This program is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free Software
Foundation; version 2 of the License.

This program is distributed in the hope that it will be useful, but WITHOUT
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.

You should have received a copy of the GNU General Public License along with
this program; if not, write to the Free Software Foundation, Inc.,
51 Franklin Street, Fifth Floor, Boston, MA 02110-1335 USA

*****************************************************************************/

/**************************************************//**
@file row/row0import.cc
Import a tablespace to a running instance.

Created 2012-02-08 by Sunny Bains.
*******************************************************/

#include "row0import.h"
#include "btr0pcur.h"
#include "que0que.h"
#include "dict0boot.h"
#include "dict0load.h"
#include "ibuf0ibuf.h"
#include "pars0pars.h"
#include "row0sel.h"
#include "row0mysql.h"
#include "srv0start.h"
#include "row0quiesce.h"
#include "fil0pagecompress.h"
#include "trx0undo.h"
#ifdef HAVE_LZO
#include "lzo/lzo1x.h"
#endif
#ifdef HAVE_SNAPPY
#include "snappy-c.h"
#endif

#include <vector>

#ifdef HAVE_MY_AES_H
#include <my_aes.h>
#endif

/** The size of the buffer to use for IO.
@param n physical page size
@return number of pages */
#define IO_BUFFER_SIZE(n)	((1024 * 1024) / n)

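/* Worked example (informational comment only, not used by the code):
with the default 16 KiB physical page size, IO_BUFFER_SIZE(16384)
evaluates to (1024 * 1024) / 16384 = 64, i.e. one 1 MiB I/O batch
holds 64 pages. For an 8 KiB ROW_FORMAT=COMPRESSED tablespace the
same buffer would hold 128 pages. */
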
/** For gathering stats on records during phase I */
struct row_stats_t {
	ulint	m_n_deleted;		/*!< Number of deleted records
					found in the index */

	ulint	m_n_purged;		/*!< Number of records purged
					optimistically */

	ulint	m_n_rows;		/*!< Number of rows */

	ulint	m_n_purge_failed;	/*!< Number of deleted rows
					that could not be purged */
};

/** Index information required by IMPORT. */
struct row_index_t {
	index_id_t	m_id;		/*!< Index id of the table
					in the exporting server */
	byte*		m_name;		/*!< Index name */

	ulint		m_space;	/*!< Space where it is placed */

	ulint		m_page_no;	/*!< Root page number */

	ulint		m_type;		/*!< Index type */

	ulint		m_trx_id_offset;	/*!< Relevant only for clustered
					indexes, offset of transaction
					id system column */

	ulint		m_n_user_defined_cols;	/*!< User defined columns */

	ulint		m_n_uniq;	/*!< Number of columns that can
					uniquely identify the row */

	ulint		m_n_nullable;	/*!< Number of nullable
					columns */

	ulint		m_n_fields;	/*!< Total number of fields */

	dict_field_t*	m_fields;	/*!< Index fields */

	const dict_index_t*
			m_srv_index;	/*!< Index instance in the
					importing server */

	row_stats_t	m_stats;	/*!< Statistics gathered during
					the import phase */
};

/** Meta data required by IMPORT. */
struct row_import {
	row_import() UNIV_NOTHROW
		:
		m_table(NULL),
		m_version(0),
		m_hostname(NULL),
		m_table_name(NULL),
		m_autoinc(0),
		m_page_size(0, 0, false),
		m_flags(0),
		m_n_cols(0),
		m_cols(NULL),
		m_col_names(NULL),
		m_n_indexes(0),
		m_indexes(NULL),
		m_missing(true) { }

	~row_import() UNIV_NOTHROW;

	/** Find the index entry in the indexes array.
	@param name index name
	@return instance if found else 0. */
	row_index_t* get_index(const char* name) const UNIV_NOTHROW;

	/** Get the number of rows in the index.
	@param name index name
	@return number of rows (doesn't include delete marked rows). */
	ulint get_n_rows(const char* name) const UNIV_NOTHROW;

	/** Find the ordinal value of the column name in the cfg table columns.
	@param name of column to look for.
	@return ULINT_UNDEFINED if not found. */
	ulint find_col(const char* name) const UNIV_NOTHROW;

	/** Get the number of rows for which purge failed during the
	convert phase.
	@param name index name
	@return number of rows for which purge failed. */
	ulint get_n_purge_failed(const char* name) const UNIV_NOTHROW;

	/** Check if the index is clean, i.e. has no delete-marked records.
	@param name index name
	@return true if index needs to be purged. */
	bool requires_purge(const char* name) const UNIV_NOTHROW
	{
		return(get_n_purge_failed(name) > 0);
	}

	/** Set the index root <space, pageno> using the index name */
	void set_root_by_name() UNIV_NOTHROW;

	/** Set the index root <space, pageno> using a heuristic
	@return DB_SUCCESS or error code */
	dberr_t set_root_by_heuristic() UNIV_NOTHROW;

	/** Check if the index schema that was read from the .cfg file
	matches the in memory index definition.
	Note: It will update row_import_t::m_srv_index to map the meta-data
	read from the .cfg file to the server index instance.
	@return DB_SUCCESS or error code. */
	dberr_t match_index_columns(
		THD*			thd,
		const dict_index_t*	index) UNIV_NOTHROW;

	/** Check if the table schema that was read from the .cfg file
	matches the in memory table definition.
	@param thd MySQL session variable
	@return DB_SUCCESS or error code. */
	dberr_t match_table_columns(
		THD*			thd) UNIV_NOTHROW;

	/** Check if the table (and index) schema that was read from the
	.cfg file matches the in memory table definition.
	@param thd MySQL session variable
	@return DB_SUCCESS or error code. */
	dberr_t match_schema(
		THD*			thd) UNIV_NOTHROW;

	dict_table_t*	m_table;	/*!< Table instance */

	ulint		m_version;	/*!< Version of config file */

	byte*		m_hostname;	/*!< Hostname where the
					tablespace was exported */
	byte*		m_table_name;	/*!< Exporting instance table
					name */

	ib_uint64_t	m_autoinc;	/*!< Next autoinc value */

	page_size_t	m_page_size;	/*!< Tablespace page size */

	ulint		m_flags;	/*!< Table flags */

	ulint		m_n_cols;	/*!< Number of columns in the
					meta-data file */

	dict_col_t*	m_cols;		/*!< Column data */

	byte**		m_col_names;	/*!< Column names, we store the
					column names separately because
					there is no field to store the
					value in dict_col_t */

	ulint		m_n_indexes;	/*!< Number of indexes,
					including clustered index */

	row_index_t*	m_indexes;	/*!< Index meta data */

	bool		m_missing;	/*!< true if the .cfg file was
					missing or could not be read */
};

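/* Illustrative sketch (not part of this translation unit): the import
path is expected to use a row_import roughly as follows, depending on
whether the .cfg meta-data file could be read. Names and error handling
are simplified for illustration only.

	row_import	cfg;
	...
	if (!cfg.m_missing) {
		// .cfg was read: verify the schema, then use its root pages.
		err = cfg.match_schema(thd);
		if (err == DB_SUCCESS) {
			cfg.set_root_by_name();
		}
	} else {
		// No .cfg: guess the root pages from the tablespace itself.
		err = cfg.set_root_by_heuristic();
	}
*/
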
/** Use the page cursor to iterate over records in a block. */
class RecIterator {
public:
	/** Default constructor */
	RecIterator() UNIV_NOTHROW
	{
		memset(&m_cur, 0x0, sizeof(m_cur));
	}

	/** Position the cursor on the first user record. */
	void	open(buf_block_t* block) UNIV_NOTHROW
	{
		page_cur_set_before_first(block, &m_cur);

		if (!end()) {
			next();
		}
	}

	/** Move to the next record. */
	void	next() UNIV_NOTHROW
	{
		page_cur_move_to_next(&m_cur);
	}

	/**
	@return the current record */
	rec_t*	current() UNIV_NOTHROW
	{
		ut_ad(!end());
		return(page_cur_get_rec(&m_cur));
	}

	/**
	@return true if cursor is at the end */
	bool	end() UNIV_NOTHROW
	{
		return(page_cur_is_after_last(&m_cur) == TRUE);
	}

	/** Remove the current record
	@return true on success */
	bool	remove(
		const dict_index_t*	index,
		page_zip_des_t*		page_zip,
		ulint*			offsets) UNIV_NOTHROW
	{
		/* We can't end up with an empty page unless it is root. */
		if (page_get_n_recs(m_cur.block->frame) <= 1) {
			return(false);
		}

		return(page_delete_rec(index, &m_cur, page_zip, offsets));
	}

private:
	page_cur_t	m_cur;
};

/** Class that purges delete marked records from indexes, both secondary
and clustered. It does a pessimistic delete. This should only be done if we
couldn't purge the delete marked records during Phase I. */
class IndexPurge {
public:
	/** Constructor
	@param trx the user transaction covering the import tablespace
	@param index to be imported */
	IndexPurge(
		trx_t*		trx,
		dict_index_t*	index) UNIV_NOTHROW
		:
		m_trx(trx),
		m_index(index),
		m_n_rows(0)
	{
		ib::info() << "Phase II - Purge records from index "
			<< index->name;
	}

	/** Destructor */
	~IndexPurge() UNIV_NOTHROW { }

	/** Purge delete marked records.
	@return DB_SUCCESS or error code. */
	dberr_t	garbage_collect() UNIV_NOTHROW;

	/** The number of records that are not delete marked.
	@return total records in the index after purge */
	ulint	get_n_rows() const UNIV_NOTHROW
	{
		return(m_n_rows);
	}

private:
	/** Begin import, position the cursor on the first record. */
	void	open() UNIV_NOTHROW;

	/** Close the persistent cursor and commit the mini-transaction. */
	void	close() UNIV_NOTHROW;

	/** Position the cursor on the next record.
	@return DB_SUCCESS or error code */
	dberr_t	next() UNIV_NOTHROW;

	/** Store the persistent cursor position and reopen the
	B-tree cursor in BTR_MODIFY_TREE mode, because the
	tree structure may be changed during a pessimistic delete. */
	void	purge_pessimistic_delete() UNIV_NOTHROW;

	/** Purge delete-marked records.
	@param offsets current row offsets. */
	void	purge() UNIV_NOTHROW;

protected:
	// Disable copying
	IndexPurge();
	IndexPurge(const IndexPurge&);
	IndexPurge &operator=(const IndexPurge&);

private:
	trx_t*		m_trx;		/*!< User transaction */
	mtr_t		m_mtr;		/*!< Mini-transaction */
	btr_pcur_t	m_pcur;		/*!< Persistent cursor */
	dict_index_t*	m_index;	/*!< Index to be processed */
	ulint		m_n_rows;	/*!< Records in index */
};

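/* Illustrative sketch (simplified, for illustration only): Phase II is
expected to run one IndexPurge per index that still contains delete-marked
records which could not be removed optimistically in Phase I, e.g.:

	if (cfg.requires_purge(index->name)) {
		IndexPurge	purge(trx, index);

		err = purge.garbage_collect();

		if (err == DB_SUCCESS) {
			// purge.get_n_rows() now reflects the surviving rows.
			n_rows_in_index = purge.get_n_rows();
		}
	}
*/
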
/** Functor that is called for each physical page that is read from the
tablespace file. */
class AbstractCallback
{
public:
	/** Constructor
	@param trx covering transaction */
	AbstractCallback(trx_t* trx, ulint space_id)
		:
		m_page_size(0, 0, false),
		m_trx(trx),
		m_space(space_id),
		m_xdes(),
		m_xdes_page_no(ULINT_UNDEFINED),
		m_space_flags(ULINT_UNDEFINED) UNIV_NOTHROW { }

	/** Free any extent descriptor instance */
	virtual ~AbstractCallback()
	{
		UT_DELETE_ARRAY(m_xdes);
	}

	/** Determine the page size to use for traversing the tablespace
	@param file_size size of the tablespace file in bytes
	@param block contents of the first page in the tablespace file.
	@retval DB_SUCCESS or error code. */
	virtual dberr_t init(
		os_offset_t		file_size,
		const buf_block_t*	block) UNIV_NOTHROW;

	/** @return true if compressed table. */
	bool is_compressed_table() const UNIV_NOTHROW
	{
		return(get_page_size().is_compressed());
	}

	/** @return the tablespace flags */
	ulint get_space_flags() const
	{
		return(m_space_flags);
	}

	/**
	Set the name of the physical file and the file handle that is used
	to open it for the file that is being iterated over.
	@param filename the physical name of the tablespace file
	@param file OS file handle */
	void set_file(const char* filename, pfs_os_file_t file) UNIV_NOTHROW
	{
		m_file = file;
		m_filepath = filename;
	}

	const page_size_t& get_page_size() const { return m_page_size; }

	const char* filename() const { return m_filepath; }

	/**
	Called for every page in the tablespace. If the page was not
	updated then its state must be set to BUF_PAGE_NOT_USED. For
	compressed tables the page descriptor memory will be at offset:
	block->frame + srv_page_size;
	@param block block read from file, note it is not from the buffer pool
	@retval DB_SUCCESS or error code. */
	virtual dberr_t operator()(buf_block_t* block) UNIV_NOTHROW = 0;

	/** @return the tablespace identifier */
	ulint get_space_id() const { return m_space; }

	bool is_interrupted() const { return trx_is_interrupted(m_trx); }

	/**
	Get the data page depending on the table type, compressed or not.
	@param block - block read from disk
	@retval the buffer frame */
	static byte* get_frame(const buf_block_t* block)
	{
		return block->page.zip.data
			? block->page.zip.data : block->frame;
	}

protected:
	/** Get the physical offset of the extent descriptor within the page.
	@param page_no page number of the extent descriptor
	@param page contents of the page containing the extent descriptor.
	@return the start of the xdes array in a page */
	const xdes_t* xdes(
		ulint		page_no,
		const page_t*	page) const UNIV_NOTHROW
	{
		ulint	offset;

		offset = xdes_calc_descriptor_index(get_page_size(), page_no);

		return(page + XDES_ARR_OFFSET + XDES_SIZE * offset);
	}

	/** Set the current page directory (xdes). If the extent descriptor is
	marked as free then free the current extent descriptor and set it to
	0. This implies that all pages that are covered by this extent
	descriptor are also freed.

	@param page_no offset of page within the file
	@param page page contents
	@return DB_SUCCESS or error code. */
	dberr_t	set_current_xdes(
		ulint		page_no,
		const page_t*	page) UNIV_NOTHROW
	{
		m_xdes_page_no = page_no;

		UT_DELETE_ARRAY(m_xdes);
		m_xdes = NULL;

		ulint		state;
		const xdes_t*	xdesc = page + XDES_ARR_OFFSET;

		state = mach_read_ulint(xdesc + XDES_STATE, MLOG_4BYTES);

		if (state != XDES_FREE) {

			m_xdes = UT_NEW_ARRAY_NOKEY(xdes_t,
						    m_page_size.physical());

			/* Trigger OOM */
			DBUG_EXECUTE_IF(
				"ib_import_OOM_13",
				UT_DELETE_ARRAY(m_xdes);
				m_xdes = NULL;
			);

			if (m_xdes == NULL) {
				return(DB_OUT_OF_MEMORY);
			}

			memcpy(m_xdes, page, m_page_size.physical());
		}

		return(DB_SUCCESS);
	}

	/** Check if the page is marked as free in the extent descriptor.
	@param page_no page number to check in the extent descriptor.
	@return true if the page is marked as free */
	bool is_free(ulint page_no) const UNIV_NOTHROW
	{
		ut_a(xdes_calc_descriptor_page(get_page_size(), page_no)
		     == m_xdes_page_no);

		if (m_xdes != 0) {
			const xdes_t*	xdesc = xdes(page_no, m_xdes);
			ulint		pos = page_no % FSP_EXTENT_SIZE;

			return(xdes_get_bit(xdesc, XDES_FREE_BIT, pos));
		}

		/* If the current xdes was free, the page must be free. */
		return(true);
	}

protected:
	/** The tablespace page size. */
	page_size_t		m_page_size;

	/** File handle to the tablespace */
	pfs_os_file_t		m_file;

	/** Physical file path. */
	const char*		m_filepath;

	/** Covering transaction. */
	trx_t*			m_trx;

	/** Space id of the file being iterated over. */
	ulint			m_space;

	/** Minimum page number for which the free list has not been
	initialized: the pages >= this limit are, by definition, free;
	note that in a single-table tablespace where size < 64 pages,
	this number is 64, i.e., we have initialized the space about
	the first extent, but have not physically allocated those pages
	to the file. @see FSP_LIMIT. */
	ulint			m_free_limit;

	/** Current size of the space in pages */
	ulint			m_size;

	/** Current extent descriptor page */
	xdes_t*			m_xdes;

	/** Physical page offset in the file of the extent descriptor */
	ulint			m_xdes_page_no;

	/** Flags value read from the header page */
	ulint			m_space_flags;
};

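/* Illustrative sketch (simplified): callers are expected to drive an
AbstractCallback over the data file page by page, along the lines of the
loop below. The real iteration lives elsewhere and also deals with page
compression and encryption, so this is for illustration only.

	callback.set_file(filepath, file);
	err = callback.init(file_size, first_block);

	for (ulint page_no = 0;
	     err == DB_SUCCESS && page_no < n_pages;
	     ++page_no) {
		// ... read page page_no from the file into block ...
		err = callback(block);
	}
*/
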
/** Determine the page size to use for traversing the tablespace
@param file_size size of the tablespace file in bytes
@param block contents of the first page in the tablespace file.
@retval DB_SUCCESS or error code. */
dberr_t
AbstractCallback::init(
	os_offset_t		file_size,
	const buf_block_t*	block) UNIV_NOTHROW
{
	const page_t*		page = block->frame;

	m_space_flags = fsp_header_get_flags(page);
	if (!fsp_flags_is_valid(m_space_flags, true)) {
		ulint cflags = fsp_flags_convert_from_101(m_space_flags);
		if (cflags == ULINT_UNDEFINED) {
			ib::error() << "Invalid FSP_SPACE_FLAGS="
				<< ib::hex(m_space_flags);
			return(DB_CORRUPTION);
		}
		m_space_flags = cflags;
	}

	/* Clear the DATA_DIR flag, which is basically garbage. */
	m_space_flags &= ~(1U << FSP_FLAGS_POS_RESERVED);
	m_page_size.copy_from(page_size_t(m_space_flags));

	if (!is_compressed_table() && !m_page_size.equals_to(univ_page_size)) {

		ib::error() << "Page size " << m_page_size.physical()
			<< " of ibd file is not the same as the server page"
			" size " << srv_page_size;

		return(DB_CORRUPTION);

	} else if (file_size % m_page_size.physical() != 0) {

		ib::error() << "File size " << file_size << " is not a"
			" multiple of the page size "
			<< m_page_size.physical();

		return(DB_CORRUPTION);
	}

	m_size = mach_read_from_4(page + FSP_SIZE);
	m_free_limit = mach_read_from_4(page + FSP_FREE_LIMIT);
	if (m_space == ULINT_UNDEFINED) {
		m_space = mach_read_from_4(FSP_HEADER_OFFSET + FSP_SPACE_ID
					   + page);
	}

	return set_current_xdes(0, page);
}

/**
Try and determine the index root pages by checking if the next/prev
pointers are both FIL_NULL. We need to ensure that we skip deleted pages. */
struct FetchIndexRootPages : public AbstractCallback {

	/** Index information gathered from the .ibd file. */
	struct Index {

		Index(index_id_t id, ulint page_no)
			:
			m_id(id),
			m_page_no(page_no) { }

		index_id_t	m_id;		/*!< Index id */
		ulint		m_page_no;	/*!< Root page number */
	};

	typedef std::vector<Index, ut_allocator<Index> >	Indexes;

	/** Constructor
	@param trx covering (user) transaction
	@param table table definition in server .*/
	FetchIndexRootPages(const dict_table_t* table, trx_t* trx)
		:
		AbstractCallback(trx, ULINT_UNDEFINED),
		m_table(table) UNIV_NOTHROW { }

	/** Destructor */
	virtual ~FetchIndexRootPages() UNIV_NOTHROW { }

	/** Called for each block as it is read from the file.
	@param block block to convert, it is not from the buffer pool.
	@retval DB_SUCCESS or error code. */
	dberr_t operator()(buf_block_t* block) UNIV_NOTHROW;

	/** Update the import configuration that will be used to import
	the tablespace. */
	dberr_t build_row_import(row_import* cfg) const UNIV_NOTHROW;

	/** Table definition in server. */
	const dict_table_t*	m_table;

	/** Index information */
	Indexes			m_indexes;
};

/** Called for each block as it is read from the file. Check index pages to
determine the exact row format. We can't get that from the tablespace
header flags alone.

@param block block to convert, it is not from the buffer pool.
@retval DB_SUCCESS or error code. */
dberr_t FetchIndexRootPages::operator()(buf_block_t* block) UNIV_NOTHROW
{
	if (is_interrupted()) return DB_INTERRUPTED;

	const page_t*	page = get_frame(block);

	ulint page_type = fil_page_get_type(page);

	if (page_type == FIL_PAGE_TYPE_XDES) {
		return set_current_xdes(block->page.id.page_no(), page);
	} else if (fil_page_index_page_check(page)
		   && !is_free(block->page.id.page_no())
		   && !page_has_siblings(page)) {

		index_id_t	id = btr_page_get_index_id(page);

		m_indexes.push_back(Index(id, block->page.id.page_no()));

		if (m_indexes.size() == 1) {
			/* Check that the tablespace flags match the table flags. */
			ulint expected = dict_tf_to_fsp_flags(m_table->flags);
			if (!fsp_flags_match(expected, m_space_flags)) {
				ib_errf(m_trx->mysql_thd, IB_LOG_LEVEL_ERROR,
					ER_TABLE_SCHEMA_MISMATCH,
					"Expected FSP_SPACE_FLAGS=0x%x, .ibd "
					"file contains 0x%x.",
					unsigned(expected),
					unsigned(m_space_flags));
				return(DB_CORRUPTION);
			}
		}
	}

	return DB_SUCCESS;
}

/**
Update the import configuration that will be used to import the tablespace.
@return error code or DB_SUCCESS */
dberr_t
FetchIndexRootPages::build_row_import(row_import* cfg) const UNIV_NOTHROW
{
	Indexes::const_iterator end = m_indexes.end();

	ut_a(cfg->m_table == m_table);
	cfg->m_page_size.copy_from(m_page_size);
	cfg->m_n_indexes = m_indexes.size();

	if (cfg->m_n_indexes == 0) {

		ib::error() << "No B+Tree found in tablespace";

		return(DB_CORRUPTION);
	}

	cfg->m_indexes = UT_NEW_ARRAY_NOKEY(row_index_t, cfg->m_n_indexes);

	/* Trigger OOM */
	DBUG_EXECUTE_IF(
		"ib_import_OOM_11",
		UT_DELETE_ARRAY(cfg->m_indexes);
		cfg->m_indexes = NULL;
	);

	if (cfg->m_indexes == NULL) {
		return(DB_OUT_OF_MEMORY);
	}

	memset(cfg->m_indexes, 0x0, sizeof(*cfg->m_indexes) * cfg->m_n_indexes);

	row_index_t*	cfg_index = cfg->m_indexes;

	for (Indexes::const_iterator it = m_indexes.begin();
	     it != end;
	     ++it, ++cfg_index) {

		char	name[BUFSIZ];

		snprintf(name, sizeof(name), "index" IB_ID_FMT, it->m_id);

		ulint	len = strlen(name) + 1;

		cfg_index->m_name = UT_NEW_ARRAY_NOKEY(byte, len);

		/* Trigger OOM */
		DBUG_EXECUTE_IF(
			"ib_import_OOM_12",
			UT_DELETE_ARRAY(cfg_index->m_name);
			cfg_index->m_name = NULL;
		);

		if (cfg_index->m_name == NULL) {
			return(DB_OUT_OF_MEMORY);
		}

		memcpy(cfg_index->m_name, name, len);

		cfg_index->m_id = it->m_id;

		cfg_index->m_space = m_space;

		cfg_index->m_page_no = it->m_page_no;
	}

	return(DB_SUCCESS);
}

/* Functor that is called for each physical page that is read from the
tablespace file.

  1. Check each page for corruption.

  2. Update the space id and LSN on every page
     * For the header page
       - Validate the flags
       - Update the LSN

  3. On Btree pages
     * Set the index id
     * Update the max trx id
     * In a clustered index, update the system columns
     * In a clustered index, update the BLOB ptr, set the space id
     * Purge delete marked records, but only if they can be easily
       removed from the page
     * Keep a counter of number of rows, ie. non-delete-marked rows
     * Keep a counter of number of delete marked rows
     * Keep a counter of number of purge failures
     * If a page is stamped with an index id that isn't in the .cfg file
       we assume it is deleted and the page can be ignored.

   4. Set the page state to dirty so that it will be written to disk.
*/
class PageConverter : public AbstractCallback {
public:
	/** Constructor
	@param cfg config of table being imported.
	@param space_id tablespace identifier
	@param trx transaction covering the import */
	PageConverter(row_import* cfg, ulint space_id, trx_t* trx)
		:
		AbstractCallback(trx, space_id),
		m_cfg(cfg),
		m_index(cfg->m_indexes),
		m_current_lsn(log_get_lsn()),
		m_page_zip_ptr(0),
		m_rec_iter(),
		m_offsets_(), m_offsets(m_offsets_),
		m_heap(0),
		m_cluster_index(dict_table_get_first_index(cfg->m_table))
	{
		ut_ad(m_current_lsn);
		rec_offs_init(m_offsets_);
	}

	virtual ~PageConverter() UNIV_NOTHROW
	{
		if (m_heap != 0) {
			mem_heap_free(m_heap);
		}
	}

	/** Called for each block as it is read from the file.
	@param block block to convert, it is not from the buffer pool.
	@retval DB_SUCCESS or error code. */
	dberr_t operator()(buf_block_t* block) UNIV_NOTHROW;

private:
	/** Update the page, set the space id, max trx id and index id.
	@param block block read from file
	@param page_type type of the page
	@retval DB_SUCCESS or error code */
	dberr_t update_page(
		buf_block_t*	block,
		ulint&		page_type) UNIV_NOTHROW;

	/** Update the space, index id, trx id.
	@param block block to convert
	@return DB_SUCCESS or error code */
	dberr_t	update_index_page(buf_block_t* block) UNIV_NOTHROW;

	/** Update the BLOB references and write UNDO log entries for
	rows that can't be purged optimistically.
	@param block block to update
	@retval DB_SUCCESS or error code */
	dberr_t	update_records(buf_block_t* block) UNIV_NOTHROW;

	/** Validate the space flags and update tablespace header page.
	@param block block read from file, not from the buffer pool.
	@retval DB_SUCCESS or error code */
	dberr_t	update_header(buf_block_t* block) UNIV_NOTHROW;

	/** Adjust the BLOB reference for a single column that is externally stored
	@param rec record to update
	@param offsets column offsets for the record
	@param i column ordinal value
	@return DB_SUCCESS or error code */
	dberr_t	adjust_cluster_index_blob_column(
		rec_t*		rec,
		const ulint*	offsets,
		ulint		i) UNIV_NOTHROW;

	/** Adjusts the BLOB reference in the clustered index row for all
	externally stored columns.
	@param rec record to update
	@param offsets column offsets for the record
	@return DB_SUCCESS or error code */
	dberr_t	adjust_cluster_index_blob_columns(
		rec_t*		rec,
		const ulint*	offsets) UNIV_NOTHROW;

	/** In the clustered index, adjust the BLOB pointers as needed.
	Also update the BLOB reference, write the new space id.
	@param rec record to update
	@param offsets column offsets for the record
	@return DB_SUCCESS or error code */
	dberr_t	adjust_cluster_index_blob_ref(
		rec_t*		rec,
		const ulint*	offsets) UNIV_NOTHROW;

	/** Purge delete-marked records, only if it is possible to do
	so without re-organising the B+tree.
	@retval true if purged */
	bool purge() UNIV_NOTHROW;

	/** Adjust the BLOB references and sys fields for the current record.
	@param rec record to update
	@param offsets column offsets for the record
	@return DB_SUCCESS or error code. */
	dberr_t	adjust_cluster_record(
		rec_t*		rec,
		const ulint*	offsets) UNIV_NOTHROW;

	/** Find an index with the matching id.
	@return row_index_t* instance or 0 */
	row_index_t* find_index(index_id_t id) UNIV_NOTHROW
	{
		row_index_t*	index = &m_cfg->m_indexes[0];

		for (ulint i = 0; i < m_cfg->m_n_indexes; ++i, ++index) {
			if (id == index->m_id) {
				return(index);
			}
		}

		return(0);
	}

private:
	/** Config for table that is being imported. */
	row_import*		m_cfg;

	/** Current index whose pages are being imported */
	row_index_t*		m_index;

	/** Current system LSN */
	lsn_t			m_current_lsn;

	/** Alias for m_page_zip, only set for compressed pages. */
	page_zip_des_t*		m_page_zip_ptr;

	/** Iterator over records in a block */
	RecIterator		m_rec_iter;

	/** Record offsets */
	ulint			m_offsets_[REC_OFFS_NORMAL_SIZE];

	/** Pointer to m_offsets_ */
	ulint*			m_offsets;

	/** Memory heap for the record offsets */
	mem_heap_t*		m_heap;

	/** Cluster index instance */
	dict_index_t*		m_cluster_index;
};

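/* Illustrative sketch (simplified): the import path is expected to run
this converter over every page of the data file via the tablespace
iterator, roughly as follows. Error handling is omitted and the exact
call site differs; this is for illustration only.

	PageConverter	converter(&cfg, space_id, trx);

	err = fil_tablespace_iterate(
		table, IO_BUFFER_SIZE(cfg.m_page_size.physical()),
		converter);
*/
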
/**
row_import destructor. */
row_import::~row_import() UNIV_NOTHROW
{
	for (ulint i = 0; m_indexes != 0 && i < m_n_indexes; ++i) {
		UT_DELETE_ARRAY(m_indexes[i].m_name);

		if (m_indexes[i].m_fields == NULL) {
			continue;
		}

		dict_field_t*	fields = m_indexes[i].m_fields;
		ulint		n_fields = m_indexes[i].m_n_fields;

		for (ulint j = 0; j < n_fields; ++j) {
			UT_DELETE_ARRAY(const_cast<char*>(fields[j].name()));
		}

		UT_DELETE_ARRAY(fields);
	}

	for (ulint i = 0; m_col_names != 0 && i < m_n_cols; ++i) {
		UT_DELETE_ARRAY(m_col_names[i]);
	}

	UT_DELETE_ARRAY(m_cols);
	UT_DELETE_ARRAY(m_indexes);
	UT_DELETE_ARRAY(m_col_names);
	UT_DELETE_ARRAY(m_table_name);
	UT_DELETE_ARRAY(m_hostname);
}

/** Find the index entry in the indexes array.
@param name index name
@return instance if found else 0. */
row_index_t*
row_import::get_index(
	const char*	name) const UNIV_NOTHROW
{
	for (ulint i = 0; i < m_n_indexes; ++i) {
		const char*	index_name;
		row_index_t*	index = &m_indexes[i];

		index_name = reinterpret_cast<const char*>(index->m_name);

		if (strcmp(index_name, name) == 0) {

			return(index);
		}
	}

	return(0);
}

/** Get the number of rows in the index.
@param name index name
@return number of rows (doesn't include delete marked rows). */
ulint
row_import::get_n_rows(
	const char*	name) const UNIV_NOTHROW
{
	const row_index_t*	index = get_index(name);

	ut_a(name != 0);

	return(index->m_stats.m_n_rows);
}

/** Get the number of rows for which purge failed during the convert phase.
@param name index name
@return number of rows for which purge failed. */
ulint
row_import::get_n_purge_failed(
	const char*	name) const UNIV_NOTHROW
{
	const row_index_t*	index = get_index(name);

	ut_a(name != 0);

	return(index->m_stats.m_n_purge_failed);
}

/** Find the ordinal value of the column name in the cfg table columns.
@param name of column to look for.
@return ULINT_UNDEFINED if not found. */
ulint
row_import::find_col(
	const char*	name) const UNIV_NOTHROW
{
	for (ulint i = 0; i < m_n_cols; ++i) {
		const char*	col_name;

		col_name = reinterpret_cast<const char*>(m_col_names[i]);

		if (strcmp(col_name, name) == 0) {
			return(i);
		}
	}

	return(ULINT_UNDEFINED);
}

/**
Check if the index schema that was read from the .cfg file matches the
in memory index definition.
@return DB_SUCCESS or error code. */
dberr_t
row_import::match_index_columns(
	THD*			thd,
	const dict_index_t*	index) UNIV_NOTHROW
{
	row_index_t*	cfg_index;
	dberr_t		err = DB_SUCCESS;

	cfg_index = get_index(index->name);

	if (cfg_index == 0) {
		ib_errf(thd, IB_LOG_LEVEL_ERROR,
			ER_TABLE_SCHEMA_MISMATCH,
			"Index %s not found in tablespace meta-data file.",
			index->name());

		return(DB_ERROR);
	}

	if (cfg_index->m_n_fields != index->n_fields) {

		ib_errf(thd, IB_LOG_LEVEL_ERROR,
			ER_TABLE_SCHEMA_MISMATCH,
			"Index field count %u doesn't match"
			" tablespace metadata file value " ULINTPF,
			index->n_fields, cfg_index->m_n_fields);

		return(DB_ERROR);
	}

	cfg_index->m_srv_index = index;

	const dict_field_t*	field = index->fields;
	const dict_field_t*	cfg_field = cfg_index->m_fields;

	for (ulint i = 0; i < index->n_fields; ++i, ++field, ++cfg_field) {

		if (strcmp(field->name(), cfg_field->name()) != 0) {
			ib_errf(thd, IB_LOG_LEVEL_ERROR,
				ER_TABLE_SCHEMA_MISMATCH,
				"Index field name %s doesn't match"
				" tablespace metadata field name %s"
				" for field position " ULINTPF,
				field->name(), cfg_field->name(), i);

			err = DB_ERROR;
		}

		if (cfg_field->prefix_len != field->prefix_len) {
			ib_errf(thd, IB_LOG_LEVEL_ERROR,
				ER_TABLE_SCHEMA_MISMATCH,
				"Index %s field %s prefix len %u"
				" doesn't match metadata file value %u",
				index->name(), field->name(),
				field->prefix_len, cfg_field->prefix_len);

			err = DB_ERROR;
		}

		if (cfg_field->fixed_len != field->fixed_len) {
			ib_errf(thd, IB_LOG_LEVEL_ERROR,
				ER_TABLE_SCHEMA_MISMATCH,
				"Index %s field %s fixed len %u"
				" doesn't match metadata file value %u",
				index->name(), field->name(),
				field->fixed_len,
				cfg_field->fixed_len);

			err = DB_ERROR;
		}
	}

	return(err);
}

/** Check if the table schema that was read from the .cfg file matches the
in memory table definition.
@param thd MySQL session variable
@return DB_SUCCESS or error code. */
dberr_t
row_import::match_table_columns(
	THD*	thd) UNIV_NOTHROW
{
	dberr_t			err = DB_SUCCESS;
	const dict_col_t*	col = m_table->cols;

	for (ulint i = 0; i < m_table->n_cols; ++i, ++col) {

		const char*	col_name;
		ulint		cfg_col_index;

		col_name = dict_table_get_col_name(
			m_table, dict_col_get_no(col));

		cfg_col_index = find_col(col_name);

		if (cfg_col_index == ULINT_UNDEFINED) {

			ib_errf(thd, IB_LOG_LEVEL_ERROR,
				ER_TABLE_SCHEMA_MISMATCH,
				"Column %s not found in tablespace.",
				col_name);

			err = DB_ERROR;
		} else if (cfg_col_index != col->ind) {

			ib_errf(thd, IB_LOG_LEVEL_ERROR,
				ER_TABLE_SCHEMA_MISMATCH,
				"Column %s ordinal value mismatch, it's at %u"
				" in the table and " ULINTPF
				" in the tablespace meta-data file",
				col_name, col->ind, cfg_col_index);

			err = DB_ERROR;
		} else {
			const dict_col_t*	cfg_col;

			cfg_col = &m_cols[cfg_col_index];
			ut_a(cfg_col->ind == cfg_col_index);

			if (cfg_col->prtype != col->prtype) {
				ib_errf(thd,
					IB_LOG_LEVEL_ERROR,
					ER_TABLE_SCHEMA_MISMATCH,
					"Column %s precise type mismatch.",
					col_name);
				err = DB_ERROR;
			}

			if (cfg_col->mtype != col->mtype) {
				ib_errf(thd,
					IB_LOG_LEVEL_ERROR,
					ER_TABLE_SCHEMA_MISMATCH,
					"Column %s main type mismatch.",
					col_name);
				err = DB_ERROR;
			}

			if (cfg_col->len != col->len) {
				ib_errf(thd,
					IB_LOG_LEVEL_ERROR,
					ER_TABLE_SCHEMA_MISMATCH,
					"Column %s length mismatch.",
					col_name);
				err = DB_ERROR;
			}

			if (cfg_col->mbminlen != col->mbminlen
			    || cfg_col->mbmaxlen != col->mbmaxlen) {
				ib_errf(thd,
					IB_LOG_LEVEL_ERROR,
					ER_TABLE_SCHEMA_MISMATCH,
					"Column %s multi-byte len mismatch.",
					col_name);
				err = DB_ERROR;
			}

			if (cfg_col->ind != col->ind) {
				err = DB_ERROR;
			}

			if (cfg_col->ord_part != col->ord_part) {
				ib_errf(thd,
					IB_LOG_LEVEL_ERROR,
					ER_TABLE_SCHEMA_MISMATCH,
					"Column %s ordering mismatch.",
					col_name);
				err = DB_ERROR;
			}

			if (cfg_col->max_prefix != col->max_prefix) {
				ib_errf(thd,
					IB_LOG_LEVEL_ERROR,
					ER_TABLE_SCHEMA_MISMATCH,
					"Column %s max prefix mismatch.",
					col_name);
				err = DB_ERROR;
			}
		}
	}

	return(err);
}

/** Check if the table (and index) schema that was read from the .cfg file
matches the in memory table definition.
@param thd MySQL session variable
@return DB_SUCCESS or error code. */
dberr_t
row_import::match_schema(
	THD*	thd) UNIV_NOTHROW
{
	/* Do some simple checks. */

	if (ulint mismatch = (m_table->flags ^ m_flags)
	    & ~DICT_TF_MASK_DATA_DIR) {
		const char* msg;
		if (mismatch & DICT_TF_MASK_ZIP_SSIZE) {
			if ((m_table->flags & DICT_TF_MASK_ZIP_SSIZE)
			    && (m_flags & DICT_TF_MASK_ZIP_SSIZE)) {
				switch (m_flags & DICT_TF_MASK_ZIP_SSIZE) {
				case 0U << DICT_TF_POS_ZIP_SSIZE:
					goto uncompressed;
				case 1U << DICT_TF_POS_ZIP_SSIZE:
					msg = "ROW_FORMAT=COMPRESSED"
						" KEY_BLOCK_SIZE=1";
					break;
				case 2U << DICT_TF_POS_ZIP_SSIZE:
					msg = "ROW_FORMAT=COMPRESSED"
						" KEY_BLOCK_SIZE=2";
					break;
				case 3U << DICT_TF_POS_ZIP_SSIZE:
					msg = "ROW_FORMAT=COMPRESSED"
						" KEY_BLOCK_SIZE=4";
					break;
				case 4U << DICT_TF_POS_ZIP_SSIZE:
					msg = "ROW_FORMAT=COMPRESSED"
						" KEY_BLOCK_SIZE=8";
					break;
				case 5U << DICT_TF_POS_ZIP_SSIZE:
					msg = "ROW_FORMAT=COMPRESSED"
						" KEY_BLOCK_SIZE=16";
					break;
				default:
					msg = "strange KEY_BLOCK_SIZE";
				}
			} else if (m_flags & DICT_TF_MASK_ZIP_SSIZE) {
				msg = "ROW_FORMAT=COMPRESSED";
			} else {
				goto uncompressed;
			}
		} else {
uncompressed:
			msg = (m_flags & DICT_TF_MASK_ATOMIC_BLOBS)
				? "ROW_FORMAT=DYNAMIC"
				: (m_flags & DICT_TF_MASK_COMPACT)
				? "ROW_FORMAT=COMPACT"
				: "ROW_FORMAT=REDUNDANT";
		}

		ib_errf(thd, IB_LOG_LEVEL_ERROR, ER_TABLE_SCHEMA_MISMATCH,
			"Table flags don't match, server table has 0x%x"
			" and the meta-data file has 0x" ULINTPFx ";"
			" .cfg file uses %s",
			m_table->flags, m_flags, msg);

		return(DB_ERROR);
	} else if (m_table->n_cols != m_n_cols) {
		ib_errf(thd, IB_LOG_LEVEL_ERROR, ER_TABLE_SCHEMA_MISMATCH,
			"Number of columns don't match, table has %u "
			"columns but the tablespace meta-data file has "
			ULINTPF " columns",
			m_table->n_cols, m_n_cols);

		return(DB_ERROR);
	} else if (UT_LIST_GET_LEN(m_table->indexes) != m_n_indexes) {

		/* If the number of indexes doesn't match, it is better
		to abort the IMPORT. It is easy for the user to create a
		table matching the IMPORT definition. */

		ib_errf(thd, IB_LOG_LEVEL_ERROR, ER_TABLE_SCHEMA_MISMATCH,
			"Number of indexes don't match, table has " ULINTPF
			" indexes but the tablespace meta-data file has "
			ULINTPF " indexes",
			UT_LIST_GET_LEN(m_table->indexes), m_n_indexes);

		return(DB_ERROR);
	}

	dberr_t	err = match_table_columns(thd);

	if (err != DB_SUCCESS) {
		return(err);
	}

	/* Check if the index definitions match. */

	const dict_index_t*	index;

	for (index = UT_LIST_GET_FIRST(m_table->indexes);
	     index != 0;
	     index = UT_LIST_GET_NEXT(indexes, index)) {

		dberr_t	index_err;

		index_err = match_index_columns(thd, index);

		if (index_err != DB_SUCCESS) {
			err = index_err;
		}
	}

	return(err);
}

/**
Set the index root <space, pageno>, using index name. */
void
row_import::set_root_by_name() UNIV_NOTHROW
{
	row_index_t*	cfg_index = m_indexes;

	for (ulint i = 0; i < m_n_indexes; ++i, ++cfg_index) {
		dict_index_t*	index;

		const char*	index_name;

		index_name = reinterpret_cast<const char*>(cfg_index->m_name);

		index = dict_table_get_index_on_name(m_table, index_name);

		/* We've already checked that it exists. */
		ut_a(index != 0);

		index->page = cfg_index->m_page_no;
	}
}

/**
Set the index root <space, pageno>, using a heuristic.
@return DB_SUCCESS or error code */
dberr_t
row_import::set_root_by_heuristic() UNIV_NOTHROW
{
	row_index_t*	cfg_index = m_indexes;

	ut_a(m_n_indexes > 0);

	// TODO: For now use brute force, based on ordinality

	if (UT_LIST_GET_LEN(m_table->indexes) != m_n_indexes) {

		ib::warn() << "Table " << m_table->name << " should have "
			<< UT_LIST_GET_LEN(m_table->indexes) << " indexes but"
			" the tablespace has " << m_n_indexes << " indexes";
	}

	dict_mutex_enter_for_mysql();

	ulint	i = 0;
	dberr_t	err = DB_SUCCESS;

	for (dict_index_t* index = UT_LIST_GET_FIRST(m_table->indexes);
	     index != 0;
	     index = UT_LIST_GET_NEXT(indexes, index)) {

		if (index->type & DICT_FTS) {
			index->type |= DICT_CORRUPT;
			ib::warn() << "Skipping FTS index: " << index->name;
		} else if (i < m_n_indexes) {

			UT_DELETE_ARRAY(cfg_index[i].m_name);

			ulint	len = strlen(index->name) + 1;

			cfg_index[i].m_name = UT_NEW_ARRAY_NOKEY(byte, len);

			/* Trigger OOM */
			DBUG_EXECUTE_IF(
				"ib_import_OOM_14",
				UT_DELETE_ARRAY(cfg_index[i].m_name);
				cfg_index[i].m_name = NULL;
			);

			if (cfg_index[i].m_name == NULL) {
				err = DB_OUT_OF_MEMORY;
				break;
			}

			memcpy(cfg_index[i].m_name, index->name, len);

			cfg_index[i].m_srv_index = index;

			index->page = cfg_index[i].m_page_no;

			++i;
		}
	}

	dict_mutex_exit_for_mysql();

	return(err);
}

/**
Purge delete marked records.
@return DB_SUCCESS or error code. */
dberr_t
IndexPurge::garbage_collect() UNIV_NOTHROW
{
	dberr_t	err;
	ibool	comp = dict_table_is_comp(m_index->table);

	/* Open the persistent cursor and start the mini-transaction. */

	open();

	while ((err = next()) == DB_SUCCESS) {

		rec_t*	rec = btr_pcur_get_rec(&m_pcur);
		ibool	deleted = rec_get_deleted_flag(rec, comp);

		if (!deleted) {
			++m_n_rows;
		} else {
			purge();
		}
	}

	/* Close the persistent cursor and commit the mini-transaction. */

	close();

	return(err == DB_END_OF_INDEX ? DB_SUCCESS : err);
}

/**
Begin import, position the cursor on the first record. */
void
IndexPurge::open() UNIV_NOTHROW
{
	mtr_start(&m_mtr);

	mtr_set_log_mode(&m_mtr, MTR_LOG_NO_REDO);

	btr_pcur_open_at_index_side(
		true, m_index, BTR_MODIFY_LEAF, &m_pcur, true, 0, &m_mtr);
	btr_pcur_move_to_next_user_rec(&m_pcur, &m_mtr);
	if (rec_is_metadata(btr_pcur_get_rec(&m_pcur), m_index)) {
		ut_ad(btr_pcur_is_on_user_rec(&m_pcur));
		/* Skip the metadata pseudo-record. */
	} else {
		btr_pcur_move_to_prev_on_page(&m_pcur);
	}
}

/**
Close the persistent cursor and commit the mini-transaction. */
void
IndexPurge::close() UNIV_NOTHROW
{
	btr_pcur_close(&m_pcur);
	mtr_commit(&m_mtr);
}

/**
Position the cursor on the next record.
@return DB_SUCCESS or error code */
dberr_t
IndexPurge::next() UNIV_NOTHROW
{
	btr_pcur_move_to_next_on_page(&m_pcur);

	/* When switching pages, commit the mini-transaction
	in order to release the latch on the old page. */

	if (!btr_pcur_is_after_last_on_page(&m_pcur)) {
		return(DB_SUCCESS);
	} else if (trx_is_interrupted(m_trx)) {
		/* Check after every page because the check
		is expensive. */
		return(DB_INTERRUPTED);
	}

	btr_pcur_store_position(&m_pcur, &m_mtr);

	mtr_commit(&m_mtr);

	mtr_start(&m_mtr);

	mtr_set_log_mode(&m_mtr, MTR_LOG_NO_REDO);

	btr_pcur_restore_position(BTR_MODIFY_LEAF, &m_pcur, &m_mtr);

	if (!btr_pcur_move_to_next_user_rec(&m_pcur, &m_mtr)) {

		return(DB_END_OF_INDEX);
	}

	return(DB_SUCCESS);
}

/**
Store the persistent cursor position and reopen the
B-tree cursor in BTR_MODIFY_TREE mode, because the
tree structure may be changed during a pessimistic delete. */
void
IndexPurge::purge_pessimistic_delete() UNIV_NOTHROW
{
	dberr_t	err;

	btr_pcur_restore_position(BTR_MODIFY_TREE | BTR_LATCH_FOR_DELETE,
				  &m_pcur, &m_mtr);

	ut_ad(rec_get_deleted_flag(
		      btr_pcur_get_rec(&m_pcur),
		      dict_table_is_comp(m_index->table)));

	btr_cur_pessimistic_delete(
		&err, FALSE, btr_pcur_get_btr_cur(&m_pcur), 0, false, &m_mtr);

	ut_a(err == DB_SUCCESS);

	/* Reopen the B-tree cursor in BTR_MODIFY_LEAF mode */
	mtr_commit(&m_mtr);
}

/**
Purge delete-marked records. */
void
IndexPurge::purge() UNIV_NOTHROW
{
	btr_pcur_store_position(&m_pcur, &m_mtr);

	purge_pessimistic_delete();

	mtr_start(&m_mtr);

	mtr_set_log_mode(&m_mtr, MTR_LOG_NO_REDO);

	btr_pcur_restore_position(BTR_MODIFY_LEAF, &m_pcur, &m_mtr);
}

/** Adjust the BLOB reference for a single column that is externally stored
@param rec record to update
@param offsets column offsets for the record
@param i column ordinal value
@return DB_SUCCESS or error code */
inline
dberr_t
PageConverter::adjust_cluster_index_blob_column(
	rec_t*		rec,
	const ulint*	offsets,
	ulint		i) UNIV_NOTHROW
{
	ulint	len;
	byte*	field;

	field = rec_get_nth_field(rec, offsets, i, &len);

	DBUG_EXECUTE_IF("ib_import_trigger_corruption_2",
			len = BTR_EXTERN_FIELD_REF_SIZE - 1;);

	if (len < BTR_EXTERN_FIELD_REF_SIZE) {

		ib_errf(m_trx->mysql_thd, IB_LOG_LEVEL_ERROR,
			ER_INNODB_INDEX_CORRUPT,
			"Externally stored column(" ULINTPF
			") has a reference length of " ULINTPF
			" in the cluster index %s",
			i, len, m_cluster_index->name());

		return(DB_CORRUPTION);
	}

	field += len - (BTR_EXTERN_FIELD_REF_SIZE - BTR_EXTERN_SPACE_ID);

	mach_write_to_4(field, get_space_id());

	if (m_page_zip_ptr) {
		page_zip_write_blob_ptr(
			m_page_zip_ptr, rec, m_cluster_index, offsets, i, 0);
	}

	return(DB_SUCCESS);
}

/** Adjusts the BLOB reference in the clustered index row for all externally
stored columns.
@param rec record to update
@param offsets column offsets for the record
@return DB_SUCCESS or error code */
inline
dberr_t
PageConverter::adjust_cluster_index_blob_columns(
	rec_t*		rec,
	const ulint*	offsets) UNIV_NOTHROW
{
	ut_ad(rec_offs_any_extern(offsets));

	/* Adjust the space_id in the BLOB pointers. */

	for (ulint i = 0; i < rec_offs_n_fields(offsets); ++i) {

		/* Only if the column is stored "externally". */

		if (rec_offs_nth_extern(offsets, i)) {
			dberr_t	err;

			err = adjust_cluster_index_blob_column(rec, offsets, i);

			if (err != DB_SUCCESS) {
				return(err);
			}
		}
	}

	return(DB_SUCCESS);
}

/** In the clustered index, adjust BLOB pointers as needed. Also update the
BLOB reference, write the new space id.
@param rec record to update
@param offsets column offsets for the record
@return DB_SUCCESS or error code */
inline
dberr_t
PageConverter::adjust_cluster_index_blob_ref(
	rec_t*		rec,
	const ulint*	offsets) UNIV_NOTHROW
{
	if (rec_offs_any_extern(offsets)) {
		dberr_t	err;

		err = adjust_cluster_index_blob_columns(rec, offsets);

		if (err != DB_SUCCESS) {
			return(err);
		}
	}

	return(DB_SUCCESS);
}

/** Purge delete-marked records, only if it is possible to do so without
re-organising the B+tree.
@return true if purge succeeded */
inline bool PageConverter::purge() UNIV_NOTHROW
{
	const dict_index_t*	index = m_index->m_srv_index;

	/* We can't have a page that is empty and not root. */
	if (m_rec_iter.remove(index, m_page_zip_ptr, m_offsets)) {

		++m_index->m_stats.m_n_purged;

		return(true);
	} else {
		++m_index->m_stats.m_n_purge_failed;
	}

	return(false);
}

/** Adjust the BLOB references and sys fields for the current record.
@param rec record to update
@param offsets column offsets for the record
@return DB_SUCCESS or error code. */
inline
dberr_t
PageConverter::adjust_cluster_record(
	rec_t*		rec,
	const ulint*	offsets) UNIV_NOTHROW
{
	dberr_t	err;

	if ((err = adjust_cluster_index_blob_ref(rec, offsets)) == DB_SUCCESS) {

		/* Reset DB_TRX_ID and DB_ROLL_PTR. Normally, these fields
		are only written in conjunction with other changes to the
		record. */
		ulint	trx_id_pos = m_cluster_index->n_uniq
			? m_cluster_index->n_uniq : 1;
		if (m_page_zip_ptr) {
			page_zip_write_trx_id_and_roll_ptr(
				m_page_zip_ptr, rec, m_offsets, trx_id_pos,
				0, roll_ptr_t(1) << ROLL_PTR_INSERT_FLAG_POS,
				NULL);
		} else {
			ulint	len;
			byte*	ptr = rec_get_nth_field(
				rec, m_offsets, trx_id_pos, &len);
			ut_ad(len == DATA_TRX_ID_LEN);
			memcpy(ptr, reset_trx_id, sizeof reset_trx_id);
		}
	}

	return(err);
}

/** Update the BLOB references and write UNDO log entries for
rows that can't be purged optimistically.
@param block block to update
@retval DB_SUCCESS or error code */
inline
dberr_t
PageConverter::update_records(
	buf_block_t*	block) UNIV_NOTHROW
{
	ibool	comp = dict_table_is_comp(m_cfg->m_table);
	bool	clust_index = m_index->m_srv_index == m_cluster_index;

	/* This will also position the cursor on the first user record. */

	m_rec_iter.open(block);

	while (!m_rec_iter.end()) {
		rec_t*	rec = m_rec_iter.current();
		ibool	deleted = rec_get_deleted_flag(rec, comp);

		/* For the clustered index we have to adjust the BLOB
		reference and the system fields irrespective of the
		delete marked flag. The adjustment of delete marked
		cluster records is required for purge to work later. */

		if (deleted || clust_index) {
			m_offsets = rec_get_offsets(
				rec, m_index->m_srv_index, m_offsets, true,
				ULINT_UNDEFINED, &m_heap);
		}

		if (clust_index) {

			dberr_t err = adjust_cluster_record(rec, m_offsets);

			if (err != DB_SUCCESS) {
				return(err);
			}
		}

		/* If it is a delete marked record then try an
		optimistic delete. */

		if (deleted) {
			/* A successful purge will move the cursor to the
			next record. */

			if (!purge()) {
				m_rec_iter.next();
			}

			++m_index->m_stats.m_n_deleted;
		} else {
			++m_index->m_stats.m_n_rows;
			m_rec_iter.next();
		}
	}

	return(DB_SUCCESS);
}

/** Update the space, index id, trx id.
@return DB_SUCCESS or error code */
inline
dberr_t
PageConverter::update_index_page(
	buf_block_t*	block) UNIV_NOTHROW
{
	index_id_t	id;
	buf_frame_t*	page = block->frame;

	if (is_free(block->page.id.page_no())) {
		return(DB_SUCCESS);
	} else if ((id = btr_page_get_index_id(page)) != m_index->m_id) {

		row_index_t*	index = find_index(id);

		if (index == 0) {
			ib::error() << "Page for tablespace " << m_space
				<< " is index page with id " << id
				<< " but that index is not found from"
				<< " configuration file. Current index name "
				<< m_index->m_name << " and id " << m_index->m_id;
			m_index = 0;
			return(DB_CORRUPTION);
		}

		/* Update current index */
		m_index = index;
	}

	/* If the .cfg file is missing and there is an index mismatch
	then ignore the error. */
	if (m_cfg->m_missing && (m_index == 0 || m_index->m_srv_index == 0)) {
		return(DB_SUCCESS);
	}

#ifdef UNIV_ZIP_DEBUG
	ut_a(!is_compressed_table()
	     || page_zip_validate(m_page_zip_ptr, page, m_index->m_srv_index));
#endif /* UNIV_ZIP_DEBUG */

	/* This has to be written to uncompressed index header. Set it to
	the current index id. */
	btr_page_set_index_id(
		page, m_page_zip_ptr, m_index->m_srv_index->id, 0);

	if (dict_index_is_clust(m_index->m_srv_index)) {
		dict_index_t* index = const_cast<dict_index_t*>(
			m_index->m_srv_index);
		if (block->page.id.page_no() == index->page) {
			/* Preserve the PAGE_ROOT_AUTO_INC. */
			if (index->table->supports_instant()) {
				if (btr_cur_instant_root_init(index, page)) {
					return(DB_CORRUPTION);
				}

				/* Provisionally set all instantly
				added columns to be DEFAULT NULL. */
				for (unsigned i = index->n_core_fields;
				     i < index->n_fields; i++) {
					dict_col_t* col = index->fields[i].col;
					col->def_val.len = UNIV_SQL_NULL;
					col->def_val.data = NULL;
				}
			}
		} else {
			/* Clear PAGE_MAX_TRX_ID so that it can be
			used for other purposes in the future. IMPORT
			in MySQL 5.6, 5.7 and MariaDB 10.0 and 10.1
			would set the field to the transaction ID even
			on clustered index pages. */
			page_set_max_trx_id(block, m_page_zip_ptr, 0, NULL);
		}
	} else {
		/* Set PAGE_MAX_TRX_ID on secondary index leaf pages,
		and clear it on non-leaf pages. */
		page_set_max_trx_id(block, m_page_zip_ptr,
				    page_is_leaf(page) ? m_trx->id : 0, NULL);
	}

	if (page_is_empty(page)) {

		/* Only a root page can be empty. */
		if (page_has_siblings(page)) {
			// TODO: We should relax this and skip secondary
			// indexes. Mark them as corrupt because they can
			// always be rebuilt.
			return(DB_CORRUPTION);
		}

		return(DB_SUCCESS);
	}

	return page_is_leaf(block->frame) ? update_records(block) : DB_SUCCESS;
}

/** Validate the space flags and update tablespace header page.
@param block block read from file, not from the buffer pool.
@retval DB_SUCCESS or error code */
inline
dberr_t
PageConverter::update_header(
	buf_block_t*	block) UNIV_NOTHROW
{
	/* Check for valid header */
	switch (fsp_header_get_space_id(get_frame(block))) {
	case 0:
		return(DB_CORRUPTION);
	case ULINT_UNDEFINED:
		ib::warn() << "Space id check in the header failed: ignored";
	}

	mach_write_to_8(
		get_frame(block) + FIL_PAGE_FILE_FLUSH_LSN_OR_KEY_VERSION,
		m_current_lsn);

	/* Write back the adjusted flags. */
	mach_write_to_4(FSP_HEADER_OFFSET + FSP_SPACE_FLAGS
			+ get_frame(block), m_space_flags);

	/* Write space_id to the tablespace header, page 0. */
	mach_write_to_4(
		get_frame(block) + FSP_HEADER_OFFSET + FSP_SPACE_ID,
		get_space_id());

	/* This is on every page in the tablespace. */
	mach_write_to_4(
		get_frame(block) + FIL_PAGE_ARCH_LOG_NO_OR_SPACE_ID,
		get_space_id());

	return(DB_SUCCESS);
}

/** Update the page, set the space id, max trx id and index id.
@param block block read from file
@retval DB_SUCCESS or error code */
inline
dberr_t
PageConverter::update_page(
	buf_block_t*	block,
	ulint&		page_type) UNIV_NOTHROW
{
	dberr_t		err = DB_SUCCESS;

	ut_ad(!block->page.zip.data == !is_compressed_table());

	if (block->page.zip.data) {
		m_page_zip_ptr = &block->page.zip;
	} else {
		ut_ad(!m_page_zip_ptr);
	}

	switch (page_type = fil_page_get_type(get_frame(block))) {
	case FIL_PAGE_TYPE_FSP_HDR:
		ut_a(block->page.id.page_no() == 0);
		/* Work directly on the uncompressed page headers. */
		return(update_header(block));

	case FIL_PAGE_INDEX:
	case FIL_PAGE_RTREE:
		/* We need to decompress the contents into block->frame
		before we can do anything with Btree pages. */

		if (is_compressed_table() && !buf_zip_decompress(block, TRUE)) {
			return(DB_CORRUPTION);
		}

		/* fall through */
	case FIL_PAGE_TYPE_INSTANT:
		/* This is on every page in the tablespace. */
		mach_write_to_4(
			get_frame(block)
			+ FIL_PAGE_ARCH_LOG_NO_OR_SPACE_ID, get_space_id());

		/* Only update the Btree nodes. */
		return(update_index_page(block));

	case FIL_PAGE_TYPE_SYS:
		/* This is page 0 in the system tablespace. */
		return(DB_CORRUPTION);

	case FIL_PAGE_TYPE_XDES:
		err = set_current_xdes(
			block->page.id.page_no(), get_frame(block));
		/* fall through */
	case FIL_PAGE_INODE:
	case FIL_PAGE_TYPE_TRX_SYS:
	case FIL_PAGE_IBUF_FREE_LIST:
	case FIL_PAGE_TYPE_ALLOCATED:
	case FIL_PAGE_IBUF_BITMAP:
	case FIL_PAGE_TYPE_BLOB:
	case FIL_PAGE_TYPE_ZBLOB:
	case FIL_PAGE_TYPE_ZBLOB2:

		/* Work directly on the uncompressed page headers. */
		/* This is on every page in the tablespace. */
		mach_write_to_4(
			get_frame(block)
			+ FIL_PAGE_ARCH_LOG_NO_OR_SPACE_ID, get_space_id());

		return(err);
	}

	ib::warn() << "Unknown page type (" << page_type << ")";

	return(DB_CORRUPTION);
}

/** Called for every page in the tablespace. If the page was not
updated then its state must be set to BUF_PAGE_NOT_USED.
@param block block read from file, note it is not from the buffer pool
@retval DB_SUCCESS or error code. */
dberr_t PageConverter::operator()(buf_block_t* block) UNIV_NOTHROW
{
	/* If we already had an old page with matching number
	in the buffer pool, evict it now, because
	we no longer evict the pages on DISCARD TABLESPACE. */
	buf_page_get_gen(block->page.id, get_page_size(),
			 RW_NO_LATCH, NULL, BUF_EVICT_IF_IN_POOL,
			 __FILE__, __LINE__, NULL, NULL);

	ulint		page_type;

	dberr_t err = update_page(block, page_type);
	if (err != DB_SUCCESS) return err;

	if (!block->page.zip.data) {
		buf_flush_init_for_writing(
			NULL, block->frame, NULL, m_current_lsn);
	} else if (fil_page_type_is_index(page_type)) {
		buf_flush_init_for_writing(
			NULL, block->page.zip.data, &block->page.zip,
			m_current_lsn);
	} else {
		/* Calculate and update the checksum of non-index
		pages for ROW_FORMAT=COMPRESSED tables. */
		buf_flush_update_zip_checksum(
			block->page.zip.data, get_page_size().physical(),
			m_current_lsn);
	}

	return DB_SUCCESS;
}

/*****************************************************************//**
Clean up after import tablespace failure; this function will acquire
the dictionary latches on behalf of the transaction if the transaction
hasn't already acquired them. */
static MY_ATTRIBUTE((nonnull))
void
row_import_discard_changes(
/*=======================*/
row_prebuilt_t* prebuilt, /*!< in/out: prebuilt from handler */
trx_t* trx, /*!< in/out: transaction for import */
dberr_t err) /*!< in: error code */
{
dict_table_t* table = prebuilt->table;

ut_a(err != DB_SUCCESS);

prebuilt->trx->error_info = NULL;

ib::info() << "Discarding tablespace of table "
<< prebuilt->table->name
<< ": " << ut_strerr(err);

if (trx->dict_operation_lock_mode != RW_X_LATCH) {
ut_a(trx->dict_operation_lock_mode == 0);
row_mysql_lock_data_dictionary(trx);
}

ut_a(trx->dict_operation_lock_mode == RW_X_LATCH);

/* Since we only update the index root page numbers on disk after
a successful import, the table will not be loadable at this point.
However, we need to ensure that the in-memory root page numbers
are reset to "NULL". */

for (dict_index_t* index = UT_LIST_GET_FIRST(table->indexes);
index != 0;
index = UT_LIST_GET_NEXT(indexes, index)) {

index->page = FIL_NULL;
}

table->file_unreadable = true;
if (table->space) {
fil_close_tablespace(trx, table->space_id);
table->space = NULL;
}
}

/*****************************************************************//**
Clean up after import tablespace. */
static MY_ATTRIBUTE((nonnull, warn_unused_result))
dberr_t
row_import_cleanup(
/*===============*/
row_prebuilt_t* prebuilt, /*!< in/out: prebuilt from handler */
trx_t* trx, /*!< in/out: transaction for import */
dberr_t err) /*!< in: error code */
{
ut_a(prebuilt->trx != trx);

if (err != DB_SUCCESS) {
row_import_discard_changes(prebuilt, trx, err);
}

ut_a(trx->dict_operation_lock_mode == RW_X_LATCH);

DBUG_EXECUTE_IF("ib_import_before_commit_crash", DBUG_SUICIDE(););

trx_commit_for_mysql(trx);

row_mysql_unlock_data_dictionary(trx);

trx_free(trx);

prebuilt->trx->op_info = "";

DBUG_EXECUTE_IF("ib_import_before_checkpoint_crash", DBUG_SUICIDE(););

log_make_checkpoint_at(LSN_MAX);

return(err);
}

/*****************************************************************//**
Report error during tablespace import. */
static MY_ATTRIBUTE((nonnull, warn_unused_result))
dberr_t
row_import_error(
/*=============*/
row_prebuilt_t* prebuilt, /*!< in/out: prebuilt from handler */
trx_t* trx, /*!< in/out: transaction for import */
dberr_t err) /*!< in: error code */
{
if (!trx_is_interrupted(trx)) {
char table_name[MAX_FULL_NAME_LEN + 1];

innobase_format_name(
table_name, sizeof(table_name),
prebuilt->table->name.m_name);

ib_senderrf(
trx->mysql_thd, IB_LOG_LEVEL_WARN,
ER_INNODB_IMPORT_ERROR,
table_name, (ulong) err, ut_strerr(err));
}

return(row_import_cleanup(prebuilt, trx, err));
}

/*****************************************************************//**
For all the table's secondary indexes, adjust the root page index node
and leaf node segment headers and update them with the new space id.
@return error code */
static MY_ATTRIBUTE((nonnull, warn_unused_result))
dberr_t
row_import_adjust_root_pages_of_secondary_indexes(
/*==============================================*/
trx_t* trx, /*!< in: transaction used for
the import */
dict_table_t* table, /*!< in: table the indexes
belong to */
const row_import& cfg) /*!< Import context */
{
dict_index_t* index;
ulint n_rows_in_table;
dberr_t err = DB_SUCCESS;

/* Skip the clustered index. */
index = dict_table_get_first_index(table);

n_rows_in_table = cfg.get_n_rows(index->name);

DBUG_EXECUTE_IF("ib_import_sec_rec_count_mismatch_failure",
n_rows_in_table++;);

/* Adjust the root pages of the secondary indexes only. */
while ((index = dict_table_get_next_index(index)) != NULL) {
ut_a(!dict_index_is_clust(index));

if (!(index->type & DICT_CORRUPT)
&& index->page != FIL_NULL) {

/* Update the Btree segment headers for index node and
leaf nodes in the root page. Set the new space id. */

err = btr_root_adjust_on_import(index);
} else {
ib::warn() << "Skip adjustment of root pages for"
" index " << index->name << ".";

err = DB_CORRUPTION;
}

if (err != DB_SUCCESS) {

if (index->type & DICT_CLUSTERED) {
break;
}

ib_errf(trx->mysql_thd,
IB_LOG_LEVEL_WARN,
ER_INNODB_INDEX_CORRUPT,
"Index %s not found or corrupt,"
" you should recreate this index.",
index->name());

/* Do not bail out, so that the data
can be recovered. */

err = DB_SUCCESS;
index->type |= DICT_CORRUPT;
continue;
}

/* If we failed to purge any records in the index then
do it the hard way.

TODO: We can do this in the first pass by generating UNDO log
records for the failed rows. */

if (!cfg.requires_purge(index->name)) {
continue;
}

IndexPurge purge(trx, index);

trx->op_info = "secondary: purge delete marked records";

err = purge.garbage_collect();

trx->op_info = "";

if (err != DB_SUCCESS) {
break;
} else if (purge.get_n_rows() != n_rows_in_table) {

ib_errf(trx->mysql_thd,
IB_LOG_LEVEL_WARN,
ER_INNODB_INDEX_CORRUPT,
"Index '%s' contains " ULINTPF " entries, "
"should be " ULINTPF ", you should recreate "
"this index.", index->name(),
purge.get_n_rows(), n_rows_in_table);

index->type |= DICT_CORRUPT;

/* Do not bail out, so that the data
can be recovered. */

err = DB_SUCCESS;
}
}

return(err);
}

/*****************************************************************//**
Ensure that dict_sys->row_id exceeds SELECT MAX(DB_ROW_ID).
@return error code */
static MY_ATTRIBUTE((nonnull, warn_unused_result))
dberr_t
row_import_set_sys_max_row_id(
/*==========================*/
row_prebuilt_t* prebuilt, /*!< in/out: prebuilt from
handler */
const dict_table_t* table) /*!< in: table to import */
{
dberr_t err;
const rec_t* rec;
mtr_t mtr;
btr_pcur_t pcur;
row_id_t row_id = 0;
dict_index_t* index;

index = dict_table_get_first_index(table);
ut_a(dict_index_is_clust(index));

mtr_start(&mtr);

mtr_set_log_mode(&mtr, MTR_LOG_NO_REDO);

btr_pcur_open_at_index_side(
false, // High end
index,
BTR_SEARCH_LEAF,
&pcur,
true, // Init cursor
0, // Leaf level
&mtr);

btr_pcur_move_to_prev_on_page(&pcur);
rec = btr_pcur_get_rec(&pcur);

/* Check for empty table. */
if (page_rec_is_infimum(rec)) {
/* The table is empty. */
err = DB_SUCCESS;
} else if (rec_is_metadata(rec, index)) {
/* The clustered index contains the metadata record only,
that is, the table is empty. */
err = DB_SUCCESS;
} else {
ulint len;
const byte* field;
mem_heap_t* heap = NULL;
ulint offsets_[1 + REC_OFFS_HEADER_SIZE];
ulint* offsets;

rec_offs_init(offsets_);

offsets = rec_get_offsets(
rec, index, offsets_, true, ULINT_UNDEFINED, &heap);

field = rec_get_nth_field(
rec, offsets,
dict_index_get_sys_col_pos(index, DATA_ROW_ID),
&len);

if (len == DATA_ROW_ID_LEN) {
row_id = mach_read_from_6(field);
err = DB_SUCCESS;
} else {
err = DB_CORRUPTION;
}

if (heap != NULL) {
mem_heap_free(heap);
}
}

btr_pcur_close(&pcur);
mtr_commit(&mtr);

DBUG_EXECUTE_IF("ib_import_set_max_rowid_failure",
err = DB_CORRUPTION;);

if (err != DB_SUCCESS) {
ib_errf(prebuilt->trx->mysql_thd,
IB_LOG_LEVEL_WARN,
ER_INNODB_INDEX_CORRUPT,
"Index `%s` corruption detected, invalid DB_ROW_ID"
" in index.", index->name());

return(err);

} else if (row_id > 0) {

/* Update the system row id if the imported index row id is
greater than the max system row id. */

mutex_enter(&dict_sys->mutex);

if (row_id >= dict_sys->row_id) {
dict_sys->row_id = row_id + 1;
dict_hdr_flush_row_id();
}

mutex_exit(&dict_sys->mutex);
}

return(DB_SUCCESS);
}

/*****************************************************************//**
Read a string from the meta data file.
@return DB_SUCCESS or error code. */
static
dberr_t
row_import_cfg_read_string(
/*=======================*/
FILE* file, /*!< in/out: File to read from */
byte* ptr, /*!< out: string to read */
ulint max_len) /*!< in: maximum length of the output
buffer in bytes */
{
DBUG_EXECUTE_IF("ib_import_string_read_error",
errno = EINVAL; return(DB_IO_ERROR););

ulint len = 0;

while (!feof(file)) {
int ch = fgetc(file);

if (ch == EOF) {
break;
} else if (ch != 0) {
if (len < max_len) {
ptr[len++] = ch;
} else {
break;
}
/* max_len includes the NUL byte */
} else if (len != max_len - 1) {
break;
} else {
ptr[len] = 0;
return(DB_SUCCESS);
}
}

errno = EINVAL;

return(DB_IO_ERROR);
}

/*********************************************************************//**
Read the meta data (index user fields) from the config file.
@return DB_SUCCESS or error code. */
static MY_ATTRIBUTE((nonnull, warn_unused_result))
dberr_t
row_import_cfg_read_index_fields(
/*=============================*/
FILE* file, /*!< in: file to read from */
THD* thd, /*!< in/out: session */
row_index_t* index) /*!< Index being read in */
{
byte row[sizeof(ib_uint32_t) * 3];
ulint n_fields = index->m_n_fields;

index->m_fields = UT_NEW_ARRAY_NOKEY(dict_field_t, n_fields);

/* Trigger OOM */
DBUG_EXECUTE_IF(
"ib_import_OOM_4",
UT_DELETE_ARRAY(index->m_fields);
index->m_fields = NULL;
);

if (index->m_fields == NULL) {
return(DB_OUT_OF_MEMORY);
}

dict_field_t* field = index->m_fields;

for (ulint i = 0; i < n_fields; ++i, ++field) {
byte* ptr = row;

/* Trigger EOF */
DBUG_EXECUTE_IF("ib_import_io_read_error_1",
(void) fseek(file, 0L, SEEK_END););

if (fread(row, 1, sizeof(row), file) != sizeof(row)) {

ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while reading index fields.");

return(DB_IO_ERROR);
}

new (field) dict_field_t();

field->prefix_len = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

field->fixed_len = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

/* Include the NUL byte in the length. */
ulint len = mach_read_from_4(ptr);

byte* name = UT_NEW_ARRAY_NOKEY(byte, len);

/* Trigger OOM */
DBUG_EXECUTE_IF(
"ib_import_OOM_5",
UT_DELETE_ARRAY(name);
name = NULL;
);

if (name == NULL) {
return(DB_OUT_OF_MEMORY);
}

field->name = reinterpret_cast<const char*>(name);

dberr_t err = row_import_cfg_read_string(file, name, len);

if (err != DB_SUCCESS) {

ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while parsing table name.");

return(err);
}
}

return(DB_SUCCESS);
}

/*****************************************************************//**
Read the index names and root page numbers of the indexes and set the values.
Row format [root_page_no, len of str, str ... ]
@return DB_SUCCESS or error code. */
static MY_ATTRIBUTE((nonnull, warn_unused_result))
dberr_t
row_import_read_index_data(
/*=======================*/
FILE* file, /*!< in: File to read from */
THD* thd, /*!< in: session */
row_import* cfg) /*!< in/out: meta-data read */
{
byte* ptr;
row_index_t* cfg_index;
byte row[sizeof(index_id_t) + sizeof(ib_uint32_t) * 9];

/* FIXME: What is the max value? */
ut_a(cfg->m_n_indexes > 0);
ut_a(cfg->m_n_indexes < 1024);

cfg->m_indexes = UT_NEW_ARRAY_NOKEY(row_index_t, cfg->m_n_indexes);

/* Trigger OOM */
DBUG_EXECUTE_IF(
"ib_import_OOM_6",
UT_DELETE_ARRAY(cfg->m_indexes);
cfg->m_indexes = NULL;
);

if (cfg->m_indexes == NULL) {
return(DB_OUT_OF_MEMORY);
}

memset(cfg->m_indexes, 0x0, sizeof(*cfg->m_indexes) * cfg->m_n_indexes);

cfg_index = cfg->m_indexes;

for (ulint i = 0; i < cfg->m_n_indexes; ++i, ++cfg_index) {
/* Trigger EOF */
DBUG_EXECUTE_IF("ib_import_io_read_error_2",
(void) fseek(file, 0L, SEEK_END););

/* Read the index data. */
size_t n_bytes = fread(row, 1, sizeof(row), file);

/* Trigger EOF */
DBUG_EXECUTE_IF("ib_import_io_read_error",
(void) fseek(file, 0L, SEEK_END););

if (n_bytes != sizeof(row)) {
char msg[BUFSIZ];

snprintf(msg, sizeof(msg),
"while reading index meta-data, expected "
"to read " ULINTPF
" bytes but read only " ULINTPF " bytes",
sizeof(row), n_bytes);

ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno), msg);

ib::error() << "IO Error: " << msg;

return(DB_IO_ERROR);
}

ptr = row;

cfg_index->m_id = mach_read_from_8(ptr);
ptr += sizeof(index_id_t);

cfg_index->m_space = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

cfg_index->m_page_no = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

cfg_index->m_type = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

cfg_index->m_trx_id_offset = mach_read_from_4(ptr);
if (cfg_index->m_trx_id_offset != mach_read_from_4(ptr)) {
ut_ad(0);
/* Overflow. Pretend that the clustered index
has a variable-length PRIMARY KEY. */
cfg_index->m_trx_id_offset = 0;
}
ptr += sizeof(ib_uint32_t);

cfg_index->m_n_user_defined_cols = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

cfg_index->m_n_uniq = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

cfg_index->m_n_nullable = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

cfg_index->m_n_fields = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

/* The NUL byte is included in the name length. */
ulint len = mach_read_from_4(ptr);

if (len > OS_FILE_MAX_PATH) {
ib_errf(thd, IB_LOG_LEVEL_ERROR,
ER_INNODB_INDEX_CORRUPT,
"Index name length (" ULINTPF ") is too long, "
"the meta-data is corrupt", len);

return(DB_CORRUPTION);
}

cfg_index->m_name = UT_NEW_ARRAY_NOKEY(byte, len);

/* Trigger OOM */
DBUG_EXECUTE_IF(
"ib_import_OOM_7",
UT_DELETE_ARRAY(cfg_index->m_name);
cfg_index->m_name = NULL;
);

if (cfg_index->m_name == NULL) {
return(DB_OUT_OF_MEMORY);
}

dberr_t err;

err = row_import_cfg_read_string(file, cfg_index->m_name, len);

if (err != DB_SUCCESS) {

ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while parsing index name.");

return(err);
}

err = row_import_cfg_read_index_fields(file, thd, cfg_index);

if (err != DB_SUCCESS) {
return(err);
}

}

return(DB_SUCCESS);
}

/*****************************************************************//**
Set the index root page number for v1 format.
@return DB_SUCCESS or error code. */
static
dberr_t
row_import_read_indexes(
/*====================*/
FILE* file, /*!< in: File to read from */
THD* thd, /*!< in: session */
row_import* cfg) /*!< in/out: meta-data read */
{
byte row[sizeof(ib_uint32_t)];

/* Trigger EOF */
DBUG_EXECUTE_IF("ib_import_io_read_error_3",
(void) fseek(file, 0L, SEEK_END););

/* Read the number of indexes. */
if (fread(row, 1, sizeof(row), file) != sizeof(row)) {
ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while reading number of indexes.");

return(DB_IO_ERROR);
}

cfg->m_n_indexes = mach_read_from_4(row);

if (cfg->m_n_indexes == 0) {
ib_errf(thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
"Number of indexes in meta-data file is 0");

return(DB_CORRUPTION);

} else if (cfg->m_n_indexes > 1024) {
/* FIXME: What is the upper limit? */
ib_errf(thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
"Number of indexes in meta-data file is too high: "
ULINTPF, cfg->m_n_indexes);
cfg->m_n_indexes = 0;

return(DB_CORRUPTION);
}

return(row_import_read_index_data(file, thd, cfg));
}

/*********************************************************************//**
Read the meta data (table columns) from the config file. Deserialise the
contents of dict_col_t structure, along with the column name. */
static MY_ATTRIBUTE((nonnull, warn_unused_result))
dberr_t
row_import_read_columns(
/*====================*/
FILE* file, /*!< in: file to read from */
THD* thd, /*!< in/out: session */
row_import* cfg) /*!< in/out: meta-data read */
{
dict_col_t* col;
byte row[sizeof(ib_uint32_t) * 8];

/* FIXME: What should the upper limit be? */
ut_a(cfg->m_n_cols > 0);
ut_a(cfg->m_n_cols < 1024);

cfg->m_cols = UT_NEW_ARRAY_NOKEY(dict_col_t, cfg->m_n_cols);

/* Trigger OOM */
DBUG_EXECUTE_IF(
"ib_import_OOM_8",
UT_DELETE_ARRAY(cfg->m_cols);
cfg->m_cols = NULL;
);

if (cfg->m_cols == NULL) {
return(DB_OUT_OF_MEMORY);
}

cfg->m_col_names = UT_NEW_ARRAY_NOKEY(byte*, cfg->m_n_cols);

/* Trigger OOM */
DBUG_EXECUTE_IF(
"ib_import_OOM_9",
UT_DELETE_ARRAY(cfg->m_col_names);
cfg->m_col_names = NULL;
);

if (cfg->m_col_names == NULL) {
return(DB_OUT_OF_MEMORY);
}

memset(cfg->m_cols, 0x0, sizeof(*cfg->m_cols) * cfg->m_n_cols);
memset(cfg->m_col_names, 0x0, sizeof(*cfg->m_col_names) * cfg->m_n_cols);

col = cfg->m_cols;

for (ulint i = 0; i < cfg->m_n_cols; ++i, ++col) {
byte* ptr = row;

/* Trigger EOF */
DBUG_EXECUTE_IF("ib_import_io_read_error_4",
(void) fseek(file, 0L, SEEK_END););

if (fread(row, 1, sizeof(row), file) != sizeof(row)) {
ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while reading table column meta-data.");

return(DB_IO_ERROR);
}

col->prtype = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

col->mtype = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

col->len = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

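/* Editorial note: the next four bytes appear to pack the character-set
length limits as mbmaxlen * 5 + mbminlen, which is why they are decoded
below with / 5 and % 5. */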
ulint mbminmaxlen = mach_read_from_4(ptr);
col->mbmaxlen = mbminmaxlen / 5;
col->mbminlen = mbminmaxlen % 5;
ptr += sizeof(ib_uint32_t);

col->ind = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

col->ord_part = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

col->max_prefix = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

/* Read in the column name as [len, byte array]. The len
includes the NUL byte. */

ulint len = mach_read_from_4(ptr);

/* FIXME: What is the maximum column name length? */
if (len == 0 || len > 128) {
ib_errf(thd, IB_LOG_LEVEL_ERROR,
ER_IO_READ_ERROR,
"Column name length " ULINTPF ", is invalid",
len);

return(DB_CORRUPTION);
}

cfg->m_col_names[i] = UT_NEW_ARRAY_NOKEY(byte, len);

/* Trigger OOM */
DBUG_EXECUTE_IF(
"ib_import_OOM_10",
UT_DELETE_ARRAY(cfg->m_col_names[i]);
cfg->m_col_names[i] = NULL;
);

if (cfg->m_col_names[i] == NULL) {
return(DB_OUT_OF_MEMORY);
}

dberr_t err;

err = row_import_cfg_read_string(
file, cfg->m_col_names[i], len);

if (err != DB_SUCCESS) {

ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while parsing table column name.");

return(err);
}
}

return(DB_SUCCESS);
}

/*****************************************************************//**
Read the contents of the <tablespace>.cfg file.
@return DB_SUCCESS or error code. */
static MY_ATTRIBUTE((nonnull, warn_unused_result))
dberr_t
row_import_read_v1(
/*===============*/
FILE* file, /*!< in: File to read from */
THD* thd, /*!< in: session */
row_import* cfg) /*!< out: meta data */
{
byte value[sizeof(ib_uint32_t)];

/* Trigger EOF */
DBUG_EXECUTE_IF("ib_import_io_read_error_5",
(void) fseek(file, 0L, SEEK_END););

/* Read the hostname where the tablespace was exported. */
if (fread(value, 1, sizeof(value), file) != sizeof(value)) {
ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while reading meta-data export hostname length.");

return(DB_IO_ERROR);
}

ulint len = mach_read_from_4(value);

/* NUL byte is part of name length. */
cfg->m_hostname = UT_NEW_ARRAY_NOKEY(byte, len);

/* Trigger OOM */
DBUG_EXECUTE_IF(
"ib_import_OOM_1",
UT_DELETE_ARRAY(cfg->m_hostname);
cfg->m_hostname = NULL;
);

if (cfg->m_hostname == NULL) {
return(DB_OUT_OF_MEMORY);
}

dberr_t err = row_import_cfg_read_string(file, cfg->m_hostname, len);

if (err != DB_SUCCESS) {

ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while parsing export hostname.");

return(err);
}

/* Trigger EOF */
DBUG_EXECUTE_IF("ib_import_io_read_error_6",
(void) fseek(file, 0L, SEEK_END););

/* Read the table name of tablespace that was exported. */
if (fread(value, 1, sizeof(value), file) != sizeof(value)) {
ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while reading meta-data table name length.");

return(DB_IO_ERROR);
}

len = mach_read_from_4(value);

/* NUL byte is part of name length. */
cfg->m_table_name = UT_NEW_ARRAY_NOKEY(byte, len);

/* Trigger OOM */
DBUG_EXECUTE_IF(
"ib_import_OOM_2",
UT_DELETE_ARRAY(cfg->m_table_name);
cfg->m_table_name = NULL;
);

if (cfg->m_table_name == NULL) {
return(DB_OUT_OF_MEMORY);
}

err = row_import_cfg_read_string(file, cfg->m_table_name, len);

if (err != DB_SUCCESS) {
ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while parsing table name.");

return(err);
}

ib::info() << "Importing tablespace for table '" << cfg->m_table_name
<< "' that was exported from host '" << cfg->m_hostname << "'";

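/* Editorial note: judging from the reads below, the remainder of the v1
header appears to consist of the 64-bit autoinc value followed by three
32-bit fields: the logical page size, the table flags and the number of
columns. */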
byte row[sizeof(ib_uint32_t) * 3];

/* Trigger EOF */
DBUG_EXECUTE_IF("ib_import_io_read_error_7",
(void) fseek(file, 0L, SEEK_END););

/* Read the autoinc value. */
if (fread(row, 1, sizeof(ib_uint64_t), file) != sizeof(ib_uint64_t)) {
ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while reading autoinc value.");

return(DB_IO_ERROR);
}

cfg->m_autoinc = mach_read_from_8(row);

/* Trigger EOF */
DBUG_EXECUTE_IF("ib_import_io_read_error_8",
(void) fseek(file, 0L, SEEK_END););

/* Read the tablespace page size. */
if (fread(row, 1, sizeof(row), file) != sizeof(row)) {
ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while reading meta-data header.");

return(DB_IO_ERROR);
}

byte* ptr = row;

const ulint logical_page_size = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

if (logical_page_size != srv_page_size) {

ib_errf(thd, IB_LOG_LEVEL_ERROR, ER_TABLE_SCHEMA_MISMATCH,
"Tablespace to be imported has a different"
" page size than this server. Server page size"
" is %lu, whereas tablespace page size"
" is " ULINTPF,
srv_page_size,
logical_page_size);

return(DB_ERROR);
}

cfg->m_flags = mach_read_from_4(ptr);
ptr += sizeof(ib_uint32_t);

cfg->m_page_size.copy_from(dict_tf_get_page_size(cfg->m_flags));

ut_a(logical_page_size == cfg->m_page_size.logical());

cfg->m_n_cols = mach_read_from_4(ptr);

if (!dict_tf_is_valid(cfg->m_flags)) {
ib_errf(thd, IB_LOG_LEVEL_ERROR,
ER_TABLE_SCHEMA_MISMATCH,
"Invalid table flags: " ULINTPF, cfg->m_flags);

return(DB_CORRUPTION);
}

err = row_import_read_columns(file, thd, cfg);

if (err == DB_SUCCESS) {
err = row_import_read_indexes(file, thd, cfg);
}

return(err);
}

/**
Read the contents of the <tablespace>.cfg file.
@return DB_SUCCESS or error code. */
static MY_ATTRIBUTE((nonnull, warn_unused_result))
dberr_t
row_import_read_meta_data(
/*======================*/
FILE* file, /*!< in: File to read from */
THD* thd, /*!< in: session */
row_import& cfg) /*!< out: contents of the .cfg file */
{
byte row[sizeof(ib_uint32_t)];

/* Trigger EOF */
DBUG_EXECUTE_IF("ib_import_io_read_error_9",
(void) fseek(file, 0L, SEEK_END););

if (fread(&row, 1, sizeof(row), file) != sizeof(row)) {
ib_senderrf(
thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno),
"while reading meta-data version.");

return(DB_IO_ERROR);
}

cfg.m_version = mach_read_from_4(row);

/* Check the version number. */
switch (cfg.m_version) {
case IB_EXPORT_CFG_VERSION_V1:

return(row_import_read_v1(file, thd, &cfg));
default:
ib_errf(thd, IB_LOG_LEVEL_ERROR, ER_IO_READ_ERROR,
"Unsupported meta-data version number (" ULINTPF "), "
"file ignored", cfg.m_version);
}

return(DB_ERROR);
}

/**
Read the contents of the <tablename>.cfg file.
@return DB_SUCCESS or error code. */
static MY_ATTRIBUTE((nonnull, warn_unused_result))
dberr_t
row_import_read_cfg(
/*================*/
dict_table_t* table, /*!< in: table */
THD* thd, /*!< in: session */
row_import& cfg) /*!< out: contents of the .cfg file */
{
dberr_t err;
char name[OS_FILE_MAX_PATH];

cfg.m_table = table;

srv_get_meta_data_filename(table, name, sizeof(name));

FILE* file = fopen(name, "rb");

if (file == NULL) {
char msg[BUFSIZ];

snprintf(msg, sizeof(msg),
"Error opening '%s', will attempt to import"
" without schema verification", name);

ib_senderrf(
thd, IB_LOG_LEVEL_WARN, ER_IO_READ_ERROR,
(ulong) errno, strerror(errno), msg);

cfg.m_missing = true;

err = DB_FAIL;
} else {

cfg.m_missing = false;

err = row_import_read_meta_data(file, thd, cfg);
fclose(file);
}

return(err);
}

/** Update the root page numbers and tablespace ID of a table.
@param[in,out] trx dictionary transaction
@param[in,out] table persistent table
@param[in] reset whether to reset the fields to FIL_NULL
@return DB_SUCCESS or error code */
dberr_t
row_import_update_index_root(trx_t* trx, dict_table_t* table, bool reset)
{
const dict_index_t* index;
que_t* graph = 0;
dberr_t err = DB_SUCCESS;

ut_ad(reset || table->space->id == table->space_id);

static const char sql[] = {
"PROCEDURE UPDATE_INDEX_ROOT() IS\n"
"BEGIN\n"
"UPDATE SYS_INDEXES\n"
"SET SPACE = :space,\n"
" PAGE_NO = :page,\n"
" TYPE = :type\n"
"WHERE TABLE_ID = :table_id AND ID = :index_id;\n"
"END;\n"};

table->def_trx_id = trx->id;

for (index = dict_table_get_first_index(table);
index != 0;
index = dict_table_get_next_index(index)) {

pars_info_t* info;
ib_uint32_t page;
ib_uint32_t space;
ib_uint32_t type;
index_id_t index_id;
table_id_t table_id;

info = (graph != 0) ? graph->info : pars_info_create();

mach_write_to_4(
reinterpret_cast<byte*>(&type),
index->type);

mach_write_to_4(
reinterpret_cast<byte*>(&page),
reset ? FIL_NULL : index->page);

mach_write_to_4(
reinterpret_cast<byte*>(&space),
reset ? FIL_NULL : index->table->space_id);

mach_write_to_8(
reinterpret_cast<byte*>(&index_id),
index->id);

mach_write_to_8(
reinterpret_cast<byte*>(&table_id),
table->id);

/* If we set the corrupt bit during the IMPORT phase then
we need to update the system tables. */
pars_info_bind_int4_literal(info, "type", &type);
pars_info_bind_int4_literal(info, "space", &space);
pars_info_bind_int4_literal(info, "page", &page);
pars_info_bind_ull_literal(info, "index_id", &index_id);
pars_info_bind_ull_literal(info, "table_id", &table_id);

if (graph == 0) {
graph = pars_sql(info, sql);
ut_a(graph);
graph->trx = trx;
}

que_thr_t* thr;

graph->fork_type = QUE_FORK_MYSQL_INTERFACE;

ut_a(thr = que_fork_start_command(graph));

que_run_threads(thr);

DBUG_EXECUTE_IF("ib_import_internal_error",
trx->error_state = DB_ERROR;);

err = trx->error_state;

if (err != DB_SUCCESS) {
ib_errf(trx->mysql_thd, IB_LOG_LEVEL_ERROR,
ER_INTERNAL_ERROR,
"While updating the <space, root page"
" number> of index %s - %s",
index->name(), ut_strerr(err));

break;
}
}

que_graph_free(graph);

return(err);
}

/** Callback arg for row_import_set_discarded. */
struct discard_t {
ib_uint32_t flags2; /*!< Value read from column */
bool state; /*!< New state of the flag */
ulint n_recs; /*!< Number of recs processed */
};

/******************************************************************//**
Fetch callback that sets or unsets the DISCARDED tablespace flag in
SYS_TABLES. The flag is stored in the MIX_LEN column.
@return FALSE if all OK */
static
ibool
row_import_set_discarded(
/*=====================*/
void* row, /*!< in: sel_node_t* */
void* user_arg) /*!< in: bool set/unset flag */
{
sel_node_t* node = static_cast<sel_node_t*>(row);
discard_t* discard = static_cast<discard_t*>(user_arg);
dfield_t* dfield = que_node_get_val(node->select_list);
dtype_t* type = dfield_get_type(dfield);
ulint len = dfield_get_len(dfield);

ut_a(dtype_get_mtype(type) == DATA_INT);
ut_a(len == sizeof(ib_uint32_t));

ulint flags2 = mach_read_from_4(
static_cast<byte*>(dfield_get_data(dfield)));

if (discard->state) {
flags2 |= DICT_TF2_DISCARDED;
} else {
flags2 &= ~DICT_TF2_DISCARDED;
}

mach_write_to_4(reinterpret_cast<byte*>(&discard->flags2), flags2);

++discard->n_recs;

/* There should be at most one matching record. */
ut_a(discard->n_recs == 1);

return(FALSE);
}

/** Update the DICT_TF2_DISCARDED flag in SYS_TABLES.MIX_LEN.
@param[in,out] trx dictionary transaction
@param[in] table_id table identifier
@param[in] discarded whether to set or clear the flag
@return DB_SUCCESS or error code */
dberr_t row_import_update_discarded_flag(trx_t* trx, table_id_t table_id,
bool discarded)
{
pars_info_t* info;
discard_t discard;

static const char sql[] =
"PROCEDURE UPDATE_DISCARDED_FLAG() IS\n"
"DECLARE FUNCTION my_func;\n"
"DECLARE CURSOR c IS\n"
" SELECT MIX_LEN"
" FROM SYS_TABLES"
" WHERE ID = :table_id FOR UPDATE;"
"\n"
"BEGIN\n"
"OPEN c;\n"
"WHILE 1 = 1 LOOP\n"
" FETCH c INTO my_func();\n"
" IF c % NOTFOUND THEN\n"
" EXIT;\n"
" END IF;\n"
"END LOOP;\n"
"UPDATE SYS_TABLES"
" SET MIX_LEN = :flags2"
" WHERE ID = :table_id;\n"
"CLOSE c;\n"
"END;\n";

discard.n_recs = 0;
discard.state = discarded;
discard.flags2 = ULINT32_UNDEFINED;

info = pars_info_create();

pars_info_add_ull_literal(info, "table_id", table_id);
pars_info_bind_int4_literal(info, "flags2", &discard.flags2);

pars_info_bind_function(
info, "my_func", row_import_set_discarded, &discard);

dberr_t err = que_eval_sql(info, sql, false, trx);

ut_a(discard.n_recs == 1);
ut_a(discard.flags2 != ULINT32_UNDEFINED);

return(err);
}

struct fil_iterator_t {
pfs_os_file_t file; /*!< File handle */
const char* filepath; /*!< File path name */
os_offset_t start; /*!< From where to start */
os_offset_t end; /*!< Where to stop */
os_offset_t file_size; /*!< File size in bytes */
ulint n_io_buffers; /*!< Number of pages to use
for IO */
byte* io_buffer; /*!< Buffer to use for IO */
fil_space_crypt_t *crypt_data; /*!< Crypt data (if encrypted) */
byte* crypt_io_buffer; /*!< IO buffer when encrypted */
};

/********************************************************************//**
TODO: This can be made parallel trivially by chunking up the file and creating
a callback per thread. Main benefit will be to use multiple CPUs for
checksums and compressed tables. We have to do compressed tables block by
block right now. Secondly we need to decompress/compress and copy too much
data. These are CPU intensive.

Iterate over all the pages in the tablespace.
@param iter - Tablespace iterator
@param block - block to use for IO
@param callback - Callback to inspect and update page contents
@retval DB_SUCCESS or error code */
static
dberr_t
fil_iterate(
/*========*/
const fil_iterator_t& iter,
buf_block_t* block,
AbstractCallback& callback)
{
os_offset_t offset;
const ulint size = callback.get_page_size().physical();
ulint n_bytes = iter.n_io_buffers * size;

const ulint buf_size = srv_page_size
#ifdef HAVE_LZO
+ LZO1X_1_15_MEM_COMPRESS
#elif defined HAVE_SNAPPY
+ snappy_max_compressed_length(srv_page_size)
#endif
;
byte* page_compress_buf = static_cast<byte*>(malloc(buf_size));
ut_ad(!srv_read_only_mode);

if (!page_compress_buf) {
return DB_OUT_OF_MEMORY;
}

/* TODO: For ROW_FORMAT=COMPRESSED tables we do a lot of useless
copying for non-index pages. Unfortunately, it is
required by buf_zip_decompress() */
dberr_t err = DB_SUCCESS;

for (offset = iter.start; offset < iter.end; offset += n_bytes) {
if (callback.is_interrupted()) {
err = DB_INTERRUPTED;
goto func_exit;
}

byte* io_buffer = iter.io_buffer;
block->frame = io_buffer;

if (block->page.zip.data) {
/* Zip IO is done in the compressed page buffer. */
io_buffer = block->page.zip.data;
}

/* We have to read the exact number of bytes. Otherwise the
InnoDB IO functions croak on failed reads. */

n_bytes = ulint(ut_min(os_offset_t(n_bytes),
iter.end - offset));

ut_ad(n_bytes > 0);
ut_ad(!(n_bytes % size));

const bool encrypted = iter.crypt_data != NULL
&& iter.crypt_data->should_encrypt();
/* Use additional crypt io buffer if tablespace is encrypted */
byte* const readptr = encrypted
? iter.crypt_io_buffer : io_buffer;
byte* const writeptr = readptr;

IORequest read_request(IORequest::READ);
read_request.disable_partial_io_warnings();

err = os_file_read_no_error_handling(
read_request, iter.file, readptr, offset, n_bytes, 0);
if (err != DB_SUCCESS) {
ib::error() << iter.filepath
<< ": os_file_read() failed";
goto func_exit;
}

bool updated = false;
os_offset_t page_off = offset;
ulint n_pages_read = n_bytes / size;
block->page.id.set_page_no(ulint(page_off / size));

for (ulint i = 0; i < n_pages_read;
block->page.id.set_page_no(block->page.id.page_no() + 1),
++i, page_off += size, block->frame += size) {
byte* src = readptr + i * size;
const ulint page_no = page_get_page_no(src);
if (!page_no && block->page.id.page_no()) {
const ulint* b = reinterpret_cast<const ulint*>
(src);
const ulint* const e = b + size / sizeof *b;
do {
if (*b++) {
goto page_corrupted;
}
} while (b != e);

/* Proceed to the next page,
because this one is all zero. */
continue;
}

if (page_no != block->page.id.page_no()) {
page_corrupted:
ib::warn() << callback.filename()
<< ": Page " << (offset / size)
<< " at offset " << offset
<< " looks corrupted.";
err = DB_CORRUPTION;
goto func_exit;
}

const bool page_compressed
= fil_page_is_compressed_encrypted(src)
|| fil_page_is_compressed(src);

if (page_compressed && block->page.zip.data) {
goto page_corrupted;
}

bool decrypted = false;
byte* dst = io_buffer + i * size;
bool frame_changed = false;

if (!encrypted) {
} else if (!mach_read_from_4(
FIL_PAGE_FILE_FLUSH_LSN_OR_KEY_VERSION
+ src)) {
not_encrypted:
if (block->page.id.page_no() == 0
&& block->page.zip.data) {
block->page.zip.data = src;
frame_changed = true;
} else if (!page_compressed
&& !block->page.zip.data) {
block->frame = src;
frame_changed = true;
} else {
ut_ad(dst != src);
memcpy(dst, src, size);
}
} else {
if (!fil_space_verify_crypt_checksum(
src, callback.get_page_size())) {
goto page_corrupted;
}

decrypted = fil_space_decrypt(
iter.crypt_data, dst,
callback.get_page_size(), src, &err);

if (err != DB_SUCCESS) {
goto func_exit;
}

if (!decrypted) {
goto not_encrypted;
}

updated = true;
}

/* If the original page is page_compressed, we need
to decompress it before adjusting further. */
if (page_compressed) {
ulint compress_length = fil_page_decompress(
page_compress_buf, dst);
ut_ad(compress_length != srv_page_size);
if (compress_length == 0) {
goto page_corrupted;
}
updated = true;
} else if (buf_page_is_corrupted(
false,
encrypted && !frame_changed
? dst : src,
callback.get_page_size(), NULL)) {
goto page_corrupted;
}

if ((err = callback(block)) != DB_SUCCESS) {
goto func_exit;
} else if (!updated) {
updated = buf_block_get_state(block)
== BUF_BLOCK_FILE_PAGE;
}

/* If tablespace is encrypted we use additional
temporary scratch area where pages are read
for decrypting readptr == crypt_io_buffer != io_buffer.

Destination for decryption is a buffer pool block
block->frame == dst == io_buffer that is updated.
Pages that did not require decryption even when
tablespace is marked as encrypted are not copied
instead block->frame is set to src == readptr.

For encryption we again use temporary scratch area
writeptr != io_buffer == dst
that is then written to the tablespace

(1) For normal tables io_buffer == dst == writeptr
(2) For only page compressed tables
io_buffer == dst == writeptr
(3) For encrypted (and page compressed)
readptr != io_buffer == dst != writeptr
*/

ut_ad(!encrypted && !page_compressed ?
src == dst && dst == writeptr + (i * size):1);
ut_ad(page_compressed && !encrypted ?
src == dst && dst == writeptr + (i * size):1);
ut_ad(encrypted ?
src != dst && dst != writeptr + (i * size):1);

/* When tablespace is encrypted or compressed its
first page (i.e. page 0) is not encrypted or
compressed and there is no need to copy frame. */
if (encrypted && block->page.id.page_no() != 0) {
byte *local_frame = callback.get_frame(block);
ut_ad((writeptr + (i * size)) != local_frame);
memcpy((writeptr + (i * size)), local_frame, size);
}

if (frame_changed) {
if (block->page.zip.data) {
block->page.zip.data = dst;
} else {
block->frame = dst;
}
}

src = io_buffer + (i * size);

if (page_compressed) {
updated = true;
if (ulint len = fil_page_compress(
src,
page_compress_buf,
0,/* FIXME: compression level */
512,/* FIXME: proper block size */
encrypted)) {
/* FIXME: remove memcpy() */
memcpy(src, page_compress_buf, len);
memset(src + len, 0,
srv_page_size - len);
}
}

/* Encrypt the page if encryption was used. */
if (encrypted && decrypted) {
byte *dest = writeptr + i * size;
byte* tmp = fil_encrypt_buf(
iter.crypt_data,
block->page.id.space(),
block->page.id.page_no(),
mach_read_from_8(src + FIL_PAGE_LSN),
src, callback.get_page_size(), dest);

if (tmp == src) {
/* TODO: remove unnecessary memcpy's */
ut_ad(dest != src);
memcpy(dest, src, size);
}

updated = true;
}
}

/* A page was updated in the set, write back to disk. */
if (updated) {
IORequest write_request(IORequest::WRITE);

err = os_file_write(write_request,
iter.filepath, iter.file,
writeptr, offset, n_bytes);

if (err != DB_SUCCESS) {
goto func_exit;
}
}
}

func_exit:
free(page_compress_buf);
return err;
}

/********************************************************************//**
Iterate over all the pages in the tablespace.
@param table - the table definition in the server
@param n_io_buffers - number of blocks to read and write together
@param callback - functor that will do the page updates
@return DB_SUCCESS or error code */
static
dberr_t
fil_tablespace_iterate(
/*===================*/
dict_table_t* table,
ulint n_io_buffers,
AbstractCallback& callback)
{
dberr_t err;
pfs_os_file_t file;
char* filepath;

ut_a(n_io_buffers > 0);
ut_ad(!srv_read_only_mode);

DBUG_EXECUTE_IF("ib_import_trigger_corruption_1",
return(DB_CORRUPTION););

/* Make sure the data_dir_path is set. */
dict_get_and_save_data_dir_path(table, false);

if (DICT_TF_HAS_DATA_DIR(table->flags)) {
ut_a(table->data_dir_path);

filepath = fil_make_filepath(
table->data_dir_path, table->name.m_name, IBD, true);
} else {
filepath = fil_make_filepath(
NULL, table->name.m_name, IBD, false);
}

if (!filepath) {
return(DB_OUT_OF_MEMORY);
} else {
bool success;

file = os_file_create_simple_no_error_handling(
innodb_data_file_key, filepath,
OS_FILE_OPEN, OS_FILE_READ_WRITE, false, &success);

if (!success) {
/* The following call prints an error message */
os_file_get_last_error(true);
ib::error() << "Trying to import a tablespace,"
" but could not open the tablespace file "
<< filepath;
ut_free(filepath);
return DB_TABLESPACE_NOT_FOUND;
} else {
err = DB_SUCCESS;
}
}

callback.set_file(filepath, file);

os_offset_t file_size = os_file_get_size(file);
ut_a(file_size != (os_offset_t) -1);

/* Allocate a page to read in the tablespace header, so that we
can determine the page size and zip_size (if it is compressed).
We allocate an extra page in case it is a compressed table. One
page is to ensure alignment. */

void* page_ptr = ut_malloc_nokey(3U << srv_page_size_shift);
byte* page = static_cast<byte*>(ut_align(page_ptr, srv_page_size));

buf_block_t* block = reinterpret_cast<buf_block_t*>
(ut_zalloc_nokey(sizeof *block));
block->frame = page;
block->page.id = page_id_t(0, 0);
block->page.io_fix = BUF_IO_NONE;
block->page.buf_fix_count = 1;
block->page.state = BUF_BLOCK_FILE_PAGE;

/* Read the first page and determine the page and zip size. */

IORequest request(IORequest::READ);
request.disable_partial_io_warnings();

err = os_file_read_no_error_handling(request, file, page, 0,
srv_page_size, 0);

if (err == DB_SUCCESS) {
err = callback.init(file_size, block);
}

if (err == DB_SUCCESS) {
block->page.id = page_id_t(callback.get_space_id(), 0);
block->page.size.copy_from(callback.get_page_size());
if (block->page.size.is_compressed()) {
page_zip_set_size(&block->page.zip,
callback.get_page_size().physical());
/* ROW_FORMAT=COMPRESSED is not optimised for block IO
for now. We do the IMPORT page by page. */
n_io_buffers = 1;
}

fil_iterator_t iter;

/* read (optional) crypt data */
iter.crypt_data = fil_space_read_crypt_data(
callback.get_page_size(), page);

/* If tablespace is encrypted, it needs extra buffers */
if (iter.crypt_data && n_io_buffers > 1) {
/* decrease io buffers so that memory
consumption will not double */
n_io_buffers /= 2;
}

iter.file = file;
iter.start = 0;
iter.end = file_size;
iter.filepath = filepath;
iter.file_size = file_size;
iter.n_io_buffers = n_io_buffers;

/* Add an extra page for compressed page scratch area. */
void* io_buffer = ut_malloc_nokey(
(2 + iter.n_io_buffers) << srv_page_size_shift);

iter.io_buffer = static_cast<byte*>(
ut_align(io_buffer, srv_page_size));

void* crypt_io_buffer = NULL;
if (iter.crypt_data) {
crypt_io_buffer = ut_malloc_nokey(
(2 + iter.n_io_buffers)
<< srv_page_size_shift);
iter.crypt_io_buffer = static_cast<byte*>(
ut_align(crypt_io_buffer, srv_page_size));
}

if (block->page.zip.ssize) {
ut_ad(iter.n_io_buffers == 1);
block->frame = iter.io_buffer;
block->page.zip.data = block->frame + srv_page_size;
}

err = fil_iterate(iter, block, callback);

if (iter.crypt_data) {
fil_space_destroy_crypt_data(&iter.crypt_data);
}

ut_free(crypt_io_buffer);
ut_free(io_buffer);
}

if (err == DB_SUCCESS) {
ib::info() << "Sync to disk";

if (!os_file_flush(file)) {
ib::info() << "os_file_flush() failed!";
err = DB_IO_ERROR;
} else {
ib::info() << "Sync to disk - done!";
}
}

os_file_close(file);

ut_free(page_ptr);
ut_free(filepath);
ut_free(block);

return(err);
}

/*****************************************************************//**
Imports a tablespace. The space id in the .ibd file must match the space id
of the table in the data dictionary.
@return error code or DB_SUCCESS */
dberr_t
row_import_for_mysql(
/*=================*/
dict_table_t* table, /*!< in/out: table */
row_prebuilt_t* prebuilt) /*!< in: prebuilt struct in MySQL */
{
dberr_t err;
trx_t* trx;
ib_uint64_t autoinc = 0;
char* filepath = NULL;
ulint space_flags MY_ATTRIBUTE((unused));

/* The caller assured that this is not read_only_mode and that no
temporary tablespace is being imported. */
ut_ad(!srv_read_only_mode);
ut_ad(!table->is_temporary());

ut_ad(table->space_id);
ut_ad(table->space_id < SRV_LOG_SPACE_FIRST_ID);
ut_ad(prebuilt->trx);
ut_ad(!table->is_readable());

ibuf_delete_for_discarded_space(table->space_id);

trx_start_if_not_started(prebuilt->trx, true);

trx = trx_create();

/* So that the table is not DROPped during recovery. */
trx_set_dict_operation(trx, TRX_DICT_OP_INDEX);

trx_start_if_not_started(trx, true);

/* So that we can send error messages to the user. */
trx->mysql_thd = prebuilt->trx->mysql_thd;

/* Ensure that the table will be dropped by trx_rollback_active()
in case of a crash. */

trx->table_id = table->id;

/* Assign an undo segment for the transaction, so that the
transaction will be recovered after a crash. */

/* TODO: Do not write any undo log for the IMPORT cleanup. */
{
mtr_t mtr;
mtr.start();
trx_undo_assign(trx, &err, &mtr);
mtr.commit();
}

DBUG_EXECUTE_IF("ib_import_undo_assign_failure",
err = DB_TOO_MANY_CONCURRENT_TRXS;);

if (err != DB_SUCCESS) {

return(row_import_cleanup(prebuilt, trx, err));

} else if (trx->rsegs.m_redo.undo == 0) {

err = DB_TOO_MANY_CONCURRENT_TRXS;
return(row_import_cleanup(prebuilt, trx, err));
}

prebuilt->trx->op_info = "read meta-data file";

/* Prevent DDL operations while we are checking. */

rw_lock_s_lock_func(&dict_operation_lock, 0, __FILE__, __LINE__);

row_import cfg;

err = row_import_read_cfg(table, trx->mysql_thd, cfg);

/* Check if the table column definitions match the contents
of the config file. */

if (err == DB_SUCCESS) {

/* We have a schema file, try and match it with our
data dictionary. */

err = cfg.match_schema(trx->mysql_thd);

/* Update index->page and SYS_INDEXES.PAGE_NO to match the
B-tree root page numbers in the tablespace. Use the index
name from the .cfg file to find a match. */

if (err == DB_SUCCESS) {
cfg.set_root_by_name();
autoinc = cfg.m_autoinc;
}

rw_lock_s_unlock_gen(&dict_operation_lock, 0);

DBUG_EXECUTE_IF("ib_import_set_index_root_failure",
err = DB_TOO_MANY_CONCURRENT_TRXS;);

} else if (cfg.m_missing) {

rw_lock_s_unlock_gen(&dict_operation_lock, 0);

/* We don't have a schema file, we will have to discover
the index root pages from the .ibd file and skip the schema
matching step. */

ut_a(err == DB_FAIL);

cfg.m_page_size.copy_from(univ_page_size);

FetchIndexRootPages fetchIndexRootPages(table, trx);

err = fil_tablespace_iterate(
table, IO_BUFFER_SIZE(cfg.m_page_size.physical()),
fetchIndexRootPages);

if (err == DB_SUCCESS) {

err = fetchIndexRootPages.build_row_import(&cfg);

/* Update index->page and SYS_INDEXES.PAGE_NO
to match the B-tree root page numbers in the
tablespace. */

if (err == DB_SUCCESS) {
err = cfg.set_root_by_heuristic();
}
}

space_flags = fetchIndexRootPages.get_space_flags();

} else {
rw_lock_s_unlock_gen(&dict_operation_lock, 0);
}

if (err != DB_SUCCESS) {
return(row_import_error(prebuilt, trx, err));
}

prebuilt->trx->op_info = "importing tablespace";

ib::info() << "Phase I - Update all pages";

/* Iterate over all the pages and do the sanity checking and
the conversion required to import the tablespace. */

PageConverter converter(&cfg, table->space_id, trx);

/* Set the IO buffer size in pages. */

err = fil_tablespace_iterate(
table, IO_BUFFER_SIZE(cfg.m_page_size.physical()), converter);

DBUG_EXECUTE_IF("ib_import_reset_space_and_lsn_failure",
err = DB_TOO_MANY_CONCURRENT_TRXS;);
#ifdef BTR_CUR_HASH_ADAPT
/* On DISCARD TABLESPACE, we did not drop any adaptive hash
index entries. If we replaced the discarded tablespace with a
smaller one here, there could still be some adaptive hash
index entries that point to cached garbage pages in the buffer
pool, because PageConverter::operator() only evicted those
pages that were replaced by the imported pages. We must
discard all remaining adaptive hash index entries, because the
adaptive hash index must be a subset of the table contents;
false positives are not tolerated. */
while (buf_LRU_drop_page_hash_for_tablespace(table)) {
if (trx_is_interrupted(trx)
|| srv_shutdown_state != SRV_SHUTDOWN_NONE) {
err = DB_INTERRUPTED;
break;
}
}
#endif /* BTR_CUR_HASH_ADAPT */

if (err != DB_SUCCESS) {
char table_name[MAX_FULL_NAME_LEN + 1];

innobase_format_name(
table_name, sizeof(table_name),
table->name.m_name);

if (err != DB_DECRYPTION_FAILED) {

ib_errf(trx->mysql_thd, IB_LOG_LEVEL_ERROR,
ER_INTERNAL_ERROR,
"Cannot reset LSNs in table %s : %s",
table_name, ut_strerr(err));
}

return(row_import_cleanup(prebuilt, trx, err));
}

row_mysql_lock_data_dictionary(trx);

/* If the table is stored in a remote tablespace, we need to
determine that filepath from the link file and system tables.
Find the space ID in SYS_TABLES since this is an ALTER TABLE. */
dict_get_and_save_data_dir_path(table, true);

if (DICT_TF_HAS_DATA_DIR(table->flags)) {
ut_a(table->data_dir_path);

filepath = fil_make_filepath(
table->data_dir_path, table->name.m_name, IBD, true);
} else {
filepath = fil_make_filepath(
NULL, table->name.m_name, IBD, false);
}

DBUG_EXECUTE_IF(
"ib_import_OOM_15",
ut_free(filepath);
filepath = NULL;
);

if (filepath == NULL) {
row_mysql_unlock_data_dictionary(trx);
return(row_import_cleanup(prebuilt, trx, DB_OUT_OF_MEMORY));
}

/* Open the tablespace so that we can access via the buffer pool.
We set the 2nd param (fix_dict = true) here because we already
have an x-lock on dict_operation_lock and dict_sys->mutex.
The tablespace is initially opened as a temporary one, because
we will not be writing any redo log for it before we have invoked
fil_space_t::set_imported() to declare it a persistent tablespace. */

ulint fsp_flags = dict_tf_to_fsp_flags(table->flags);

table->space = fil_ibd_open(
true, true, FIL_TYPE_IMPORT, table->space_id,
fsp_flags, table->name, filepath, &err);

ut_ad((table->space == NULL) == (err != DB_SUCCESS));
DBUG_EXECUTE_IF("ib_import_open_tablespace_failure",
err = DB_TABLESPACE_NOT_FOUND; table->space = NULL;);

if (!table->space) {
row_mysql_unlock_data_dictionary(trx);

ib_senderrf(trx->mysql_thd, IB_LOG_LEVEL_ERROR,
ER_GET_ERRMSG,
err, ut_strerr(err), filepath);

ut_free(filepath);

return(row_import_cleanup(prebuilt, trx, err));
}

row_mysql_unlock_data_dictionary(trx);

ut_free(filepath);

err = ibuf_check_bitmap_on_import(trx, table->space);

DBUG_EXECUTE_IF("ib_import_check_bitmap_failure", err = DB_CORRUPTION;);

if (err != DB_SUCCESS) {
return(row_import_cleanup(prebuilt, trx, err));
}

/* The first index must always be the clustered index. */

dict_index_t* index = dict_table_get_first_index(table);

if (!dict_index_is_clust(index)) {
return(row_import_error(prebuilt, trx, DB_CORRUPTION));
}

/* Update the Btree segment headers for index node and
leaf nodes in the root page. Set the new space id. */

err = btr_root_adjust_on_import(index);

DBUG_EXECUTE_IF("ib_import_cluster_root_adjust_failure",
err = DB_CORRUPTION;);

if (err != DB_SUCCESS) {
return(row_import_error(prebuilt, trx, err));
} else if (cfg.requires_purge(index->name)) {

/* Purge any delete-marked records that couldn't be
purged during the page conversion phase from the
cluster index. */

IndexPurge purge(trx, index);

trx->op_info = "cluster: purging delete marked records";

err = purge.garbage_collect();

trx->op_info = "";
}

DBUG_EXECUTE_IF("ib_import_cluster_failure", err = DB_CORRUPTION;);

if (err != DB_SUCCESS) {
return(row_import_error(prebuilt, trx, err));
}

/* For secondary indexes, purge any records that couldn't be purged
during the page conversion phase. */

err = row_import_adjust_root_pages_of_secondary_indexes(
trx, table, cfg);

DBUG_EXECUTE_IF("ib_import_sec_root_adjust_failure",
err = DB_CORRUPTION;);

if (err != DB_SUCCESS) {
return(row_import_error(prebuilt, trx, err));
}

/* Ensure that the next available DB_ROW_ID is not smaller than
any DB_ROW_ID stored in the table. */

if (prebuilt->clust_index_was_generated) {

err = row_import_set_sys_max_row_id(prebuilt, table);

if (err != DB_SUCCESS) {
return(row_import_error(prebuilt, trx, err));
}
}

ib::info() << "Phase III - Flush changes to disk";

/* Ensure that all pages dirtied during the IMPORT make it to disk.
The only dirty pages generated should be from the pessimistic purge
of delete marked records that couldn't be purged in Phase I. */

{
FlushObserver observer(prebuilt->table->space, trx, NULL);
buf_LRU_flush_or_remove_pages(prebuilt->table->space_id,
&observer);

if (observer.is_interrupted()) {
ib::info() << "Phase III - Flush interrupted";
return(row_import_error(prebuilt, trx,
DB_INTERRUPTED));
}
}

ib::info() << "Phase IV - Flush complete";
prebuilt->table->space->set_imported();

/* The dictionary latches will be released in row_import_cleanup()
after the transaction commit, for both success and error. */

row_mysql_lock_data_dictionary(trx);

/* Update the root pages of the table's indexes. */
err = row_import_update_index_root(trx, table, false);

if (err != DB_SUCCESS) {
return(row_import_error(prebuilt, trx, err));
}

err = row_import_update_discarded_flag(trx, table->id, false);

if (err != DB_SUCCESS) {
return(row_import_error(prebuilt, trx, err));
}

table->file_unreadable = false;
table->flags2 &= ~DICT_TF2_DISCARDED;

/* Set autoinc value read from .cfg file, if one was specified.
Otherwise, keep the PAGE_ROOT_AUTO_INC as is. */
if (autoinc) {
ib::info() << table->name << " autoinc value set to "
<< autoinc;

table->autoinc = autoinc--;
btr_write_autoinc(dict_table_get_first_index(table), autoinc);
}

return(row_import_cleanup(prebuilt, trx, err));
}