mirror of
https://github.com/MariaDB/server.git
synced 2025-02-05 13:22:17 +01:00
1018 lines
26 KiB
C++
1018 lines
26 KiB
C++
/*****************************************************************************
|
|
|
|
Copyright (c) 2013, 2016, Oracle and/or its affiliates. All Rights Reserved.
|
|
Copyright (c) 2017, 2022, MariaDB Corporation.
|
|
|
|
This program is free software; you can redistribute it and/or modify it under
|
|
the terms of the GNU General Public License as published by the Free Software
|
|
Foundation; version 2 of the License.
|
|
|
|
This program is distributed in the hope that it will be useful, but WITHOUT
|
|
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License along with
|
|
this program; if not, write to the Free Software Foundation, Inc.,
|
|
51 Franklin Street, Fifth Floor, Boston, MA 02110-1335 USA
|
|
|
|
*****************************************************************************/
|
|
|
|
/**************************************************//**
|
|
@file fsp/fsp0file.cc
|
|
Tablespace data file implementation
|
|
|
|
Created 2013-7-26 by Kevin Lewis
|
|
*******************************************************/
|
|
|
|
#include "fil0fil.h"
|
|
#include "fsp0types.h"
|
|
#include "os0file.h"
|
|
#include "page0page.h"
|
|
#include "srv0start.h"
|
|
#include "log.h"
|
|
|
|
/** Release the resources. */
|
|
void
|
|
Datafile::shutdown()
|
|
{
|
|
close();
|
|
|
|
free_filepath();
|
|
free_first_page();
|
|
}
|
|
|
|
/** Create/open a data file.
|
|
@param[in] read_only_mode if true, then readonly mode checks are enforced.
|
|
@return DB_SUCCESS or error code */
|
|
dberr_t
|
|
Datafile::open_or_create(bool read_only_mode)
|
|
{
|
|
bool success;
|
|
ut_a(m_filepath != NULL);
|
|
ut_ad(m_handle == OS_FILE_CLOSED);
|
|
|
|
m_handle = os_file_create(
|
|
innodb_data_file_key, m_filepath, m_open_flags,
|
|
OS_DATA_FILE, read_only_mode, &success);
|
|
|
|
if (!success) {
|
|
m_last_os_error = os_file_get_last_error(true);
|
|
ib::error() << "Cannot open datafile '" << m_filepath << "'";
|
|
return(DB_CANNOT_OPEN_FILE);
|
|
}
|
|
|
|
return(DB_SUCCESS);
|
|
}
|
|
|
|
/** Open a data file in read-only mode to check if it exists so that it
|
|
can be validated.
|
|
@param[in] strict whether to issue error messages
|
|
@return DB_SUCCESS or error code */
|
|
dberr_t
|
|
Datafile::open_read_only(bool strict)
|
|
{
|
|
bool success = false;
|
|
ut_ad(m_handle == OS_FILE_CLOSED);
|
|
|
|
/* This function can be called for file objects that do not need
|
|
to be opened, which is the case when the m_filepath is NULL */
|
|
if (m_filepath == NULL) {
|
|
return(DB_ERROR);
|
|
}
|
|
|
|
set_open_flags(OS_FILE_OPEN);
|
|
m_handle = os_file_create_simple_no_error_handling(
|
|
innodb_data_file_key, m_filepath, m_open_flags,
|
|
OS_FILE_READ_ONLY, true, &success);
|
|
|
|
if (success) {
|
|
m_exists = true;
|
|
init_file_info();
|
|
|
|
return(DB_SUCCESS);
|
|
}
|
|
|
|
if (strict) {
|
|
m_last_os_error = os_file_get_last_error(true);
|
|
ib::error() << "Cannot open datafile for read-only: '"
|
|
<< m_filepath << "' OS error: " << m_last_os_error;
|
|
}
|
|
|
|
return(DB_CANNOT_OPEN_FILE);
|
|
}
|
|
|
|
/** Open a data file in read-write mode during start-up so that
|
|
doublewrite pages can be restored and then it can be validated.*
|
|
@return DB_SUCCESS or error code */
|
|
inline dberr_t Datafile::open_read_write()
|
|
{
|
|
bool success = false;
|
|
ut_ad(m_handle == OS_FILE_CLOSED);
|
|
ut_ad(!srv_read_only_mode);
|
|
|
|
/* This function can be called for file objects that do not need
|
|
to be opened, which is the case when the m_filepath is NULL */
|
|
if (m_filepath == NULL) {
|
|
return(DB_ERROR);
|
|
}
|
|
|
|
set_open_flags(OS_FILE_OPEN);
|
|
m_handle = os_file_create_simple_no_error_handling(
|
|
innodb_data_file_key, m_filepath, m_open_flags,
|
|
OS_FILE_READ_WRITE, false, &success);
|
|
|
|
if (!success) {
|
|
m_last_os_error = os_file_get_last_error(true);
|
|
ib::error() << "Cannot open datafile for read-write: '"
|
|
<< m_filepath << "'";
|
|
return(DB_CANNOT_OPEN_FILE);
|
|
}
|
|
|
|
m_exists = true;
|
|
|
|
init_file_info();
|
|
|
|
return(DB_SUCCESS);
|
|
}
|
|
|
|
/** Initialize OS specific file info. */
|
|
void
|
|
Datafile::init_file_info()
|
|
{
|
|
#ifdef _WIN32
|
|
GetFileInformationByHandle((os_file_t)m_handle, &m_file_info);
|
|
#else
|
|
fstat(m_handle, &m_file_info);
|
|
#endif /* WIN32 */
|
|
}
|
|
|
|
/** Close a data file.
|
|
@return DB_SUCCESS or error code */
|
|
dberr_t
|
|
Datafile::close()
|
|
{
|
|
if (m_handle != OS_FILE_CLOSED) {
|
|
ibool success = os_file_close(m_handle);
|
|
ut_a(success);
|
|
|
|
m_handle = OS_FILE_CLOSED;
|
|
}
|
|
|
|
return(DB_SUCCESS);
|
|
}
|
|
|
|
/** Make a full filepath from a directory path and a filename.
|
|
Prepend the dirpath to filename using the extension given.
|
|
If dirpath is NULL, prepend the default datadir to filepath.
|
|
Store the result in m_filepath.
|
|
@param dirpath directory path
|
|
@param name tablespace (table) name
|
|
@param ext filename extension */
|
|
void Datafile::make_filepath(const char *dirpath, fil_space_t::name_type name,
|
|
ib_extention ext)
|
|
{
|
|
ut_ad(dirpath || name.size());
|
|
free_filepath();
|
|
m_filepath= fil_make_filepath(dirpath, name, ext, false);
|
|
ut_ad(m_filepath);
|
|
set_filename();
|
|
}
|
|
|
|
/** Set the filepath by duplicating the filepath sent in. This is the
|
|
name of the file with its extension and absolute or relative path.
|
|
@param[in] filepath filepath to set */
|
|
void
|
|
Datafile::set_filepath(const char* filepath)
|
|
{
|
|
free_filepath();
|
|
m_filepath = static_cast<char*>(ut_malloc_nokey(strlen(filepath) + 1));
|
|
::strcpy(m_filepath, filepath);
|
|
set_filename();
|
|
}
|
|
|
|
/** Free the filepath buffer. */
|
|
void
|
|
Datafile::free_filepath()
|
|
{
|
|
if (m_filepath != NULL) {
|
|
ut_free(m_filepath);
|
|
m_filepath = NULL;
|
|
m_filename = NULL;
|
|
}
|
|
}
|
|
|
|
/** Do a quick test if the filepath provided looks the same as this filepath
|
|
byte by byte. If they are two different looking paths to the same file,
|
|
same_as() will be used to show that after the files are opened.
|
|
@param[in] other filepath to compare with
|
|
@retval true if it is the same filename by byte comparison
|
|
@retval false if it looks different */
|
|
bool
|
|
Datafile::same_filepath_as(
|
|
const char* other) const
|
|
{
|
|
return(0 == strcmp(m_filepath, other));
|
|
}
|
|
|
|
/** Test if another opened datafile is the same file as this object.
|
|
@param[in] other Datafile to compare with
|
|
@return true if it is the same file, else false */
|
|
bool
|
|
Datafile::same_as(
|
|
const Datafile& other) const
|
|
{
|
|
#ifdef _WIN32
|
|
return(m_file_info.dwVolumeSerialNumber
|
|
== other.m_file_info.dwVolumeSerialNumber
|
|
&& m_file_info.nFileIndexHigh
|
|
== other.m_file_info.nFileIndexHigh
|
|
&& m_file_info.nFileIndexLow
|
|
== other.m_file_info.nFileIndexLow);
|
|
#else
|
|
return(m_file_info.st_ino == other.m_file_info.st_ino
|
|
&& m_file_info.st_dev == other.m_file_info.st_dev);
|
|
#endif /* WIN32 */
|
|
}
|
|
|
|
dberr_t Datafile::read_first_page_flags(const page_t *page) noexcept
|
|
{
|
|
ut_ad(m_order == 0);
|
|
|
|
if (memcmp_aligned<2>(FIL_PAGE_SPACE_ID + page,
|
|
FSP_HEADER_OFFSET + FSP_SPACE_ID + page, 4))
|
|
{
|
|
sql_print_error("InnoDB: Inconsistent tablespace ID in %s", m_filepath);
|
|
return DB_CORRUPTION;
|
|
}
|
|
|
|
m_space_id= mach_read_from_4(FIL_PAGE_SPACE_ID + page);
|
|
m_flags= fsp_header_get_flags(page);
|
|
if (!fil_space_t::is_valid_flags(m_flags, m_space_id))
|
|
{
|
|
uint32_t cflags= fsp_flags_convert_from_101(m_flags);
|
|
if (cflags == UINT32_MAX)
|
|
switch (fsp_flags_is_incompatible_mysql(m_flags)) {
|
|
case 0:
|
|
sql_print_error("InnoDB: Invalid flags 0x%" PRIx32 " in %s",
|
|
m_flags, m_filepath);
|
|
return DB_CORRUPTION;
|
|
case 3:
|
|
case 2:
|
|
sql_print_error("InnoDB: MySQL-8.0 tablespace in %s", m_filepath);
|
|
goto unsupported;
|
|
case 1:
|
|
sql_print_error("InnoDB: MySQL Encrypted tablespace in %s",
|
|
m_filepath);
|
|
unsupported:
|
|
sql_print_error("InnoDB: Restart in MySQL for migration/recovery.");
|
|
return DB_UNSUPPORTED;
|
|
}
|
|
else
|
|
m_flags= cflags;
|
|
}
|
|
|
|
return DB_SUCCESS;
|
|
}
|
|
|
|
/** Reads a few significant fields from the first page of the first
|
|
datafile. The Datafile must already be open.
|
|
@param[in] read_only_mode If true, then readonly mode checks are enforced.
|
|
@return DB_SUCCESS or DB_IO_ERROR if page cannot be read */
|
|
dberr_t
|
|
Datafile::read_first_page(bool read_only_mode)
|
|
{
|
|
if (m_handle == OS_FILE_CLOSED) {
|
|
|
|
dberr_t err = open_or_create(read_only_mode);
|
|
|
|
if (err != DB_SUCCESS) {
|
|
return(err);
|
|
}
|
|
}
|
|
|
|
/* Align the memory for a possible read from a raw device */
|
|
|
|
m_first_page = static_cast<byte*>(
|
|
aligned_malloc(UNIV_PAGE_SIZE_MAX, srv_page_size));
|
|
|
|
dberr_t err = DB_ERROR;
|
|
size_t page_size = UNIV_PAGE_SIZE_MAX;
|
|
|
|
/* Don't want unnecessary complaints about partial reads. */
|
|
|
|
while (page_size >= UNIV_PAGE_SIZE_MIN) {
|
|
|
|
ulint n_read = 0;
|
|
|
|
err = os_file_read(
|
|
IORequestReadPartial, m_handle, m_first_page, 0,
|
|
page_size, &n_read);
|
|
|
|
if (err == DB_SUCCESS) {
|
|
break;
|
|
}
|
|
|
|
if (err == DB_IO_ERROR && n_read == 0) {
|
|
break;
|
|
}
|
|
if (err == DB_IO_ERROR && n_read >= UNIV_PAGE_SIZE_MIN) {
|
|
page_size >>= 1;
|
|
} else if (srv_operation == SRV_OPERATION_BACKUP) {
|
|
break;
|
|
} else {
|
|
ib::info() << "Cannot read first page of '"
|
|
<< m_filepath << "': " << err;
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (err == DB_SUCCESS && m_order == 0) {
|
|
err = read_first_page_flags(m_first_page);
|
|
}
|
|
|
|
if (err == DB_SUCCESS
|
|
&& fil_space_t::physical_size(m_flags) > page_size) {
|
|
ib::error() << "File " << m_filepath
|
|
<< " should be longer than "
|
|
<< page_size << " bytes";
|
|
err = DB_CORRUPTION;
|
|
}
|
|
|
|
return(err);
|
|
}
|
|
|
|
/** Free the first page from memory when it is no longer needed. */
|
|
void Datafile::free_first_page()
|
|
{
|
|
aligned_free(m_first_page);
|
|
m_first_page= nullptr;
|
|
}
|
|
|
|
/** Validates the datafile and checks that it conforms with the expected
|
|
space ID and flags. The file should exist and be successfully opened
|
|
in order for this function to validate it.
|
|
@param[in] space_id The expected tablespace ID.
|
|
@param[in] flags The expected tablespace flags.
|
|
@retval DB_SUCCESS if tablespace is valid, DB_ERROR if not.
|
|
m_is_valid is also set true on success, else false. */
|
|
dberr_t Datafile::validate_to_dd(uint32_t space_id, uint32_t flags)
|
|
{
|
|
dberr_t err;
|
|
|
|
if (!is_open()) {
|
|
return DB_ERROR;
|
|
}
|
|
|
|
/* Validate this single-table-tablespace with the data dictionary,
|
|
but do not compare the DATA_DIR flag, in case the tablespace was
|
|
remotely located. */
|
|
err = validate_first_page(m_first_page);
|
|
if (err != DB_SUCCESS) {
|
|
return(err);
|
|
}
|
|
|
|
flags &= ~FSP_FLAGS_MEM_MASK;
|
|
|
|
/* Make sure the datafile we found matched the space ID.
|
|
If the datafile is a file-per-table tablespace then also match
|
|
the row format and zip page size. */
|
|
if (m_space_id == space_id
|
|
&& (fil_space_t::is_flags_equal(flags, m_flags)
|
|
|| fil_space_t::is_flags_equal(m_flags, flags))) {
|
|
/* Datafile matches the tablespace expected. */
|
|
return(DB_SUCCESS);
|
|
}
|
|
|
|
/* else do not use this tablespace. */
|
|
m_is_valid = false;
|
|
|
|
ib::error() << "Refusing to load '" << m_filepath << "' (id="
|
|
<< m_space_id << ", flags=" << ib::hex(m_flags)
|
|
<< "); dictionary contains id="
|
|
<< space_id << ", flags=" << ib::hex(flags);
|
|
|
|
return(DB_ERROR);
|
|
}
|
|
|
|
inline
|
|
uint32_t recv_dblwr_t::find_first_page(const char *name, pfs_os_file_t file)
|
|
const noexcept
|
|
{
|
|
os_offset_t file_size= os_file_get_size(file);
|
|
if (file_size != (os_offset_t) -1)
|
|
{
|
|
for (const page_t *page : pages)
|
|
{
|
|
uint32_t space_id= page_get_space_id(page);
|
|
byte *read_page= nullptr;
|
|
if (page_get_page_no(page) > 0 || space_id == 0)
|
|
{
|
|
next_page:
|
|
aligned_free(read_page);
|
|
continue;
|
|
}
|
|
uint32_t flags= mach_read_from_4(FSP_HEADER_OFFSET + FSP_SPACE_FLAGS +
|
|
page);
|
|
size_t page_size= fil_space_t::physical_size(flags);
|
|
if (file_size < 4 * page_size)
|
|
goto next_page;
|
|
read_page=
|
|
static_cast<byte*>(aligned_malloc(3 * page_size, page_size));
|
|
/* Read 3 pages from the file and match the space id
|
|
with the space id which is stored in
|
|
doublewrite buffer page. */
|
|
if (os_file_read(IORequestRead, file, read_page, page_size,
|
|
3 * page_size, nullptr) != DB_SUCCESS)
|
|
goto next_page;
|
|
for (ulint j= 0; j <= 2; j++)
|
|
{
|
|
byte *cur_page= read_page + j * page_size;
|
|
if (buf_is_zeroes(span<const byte>(cur_page, page_size)))
|
|
{
|
|
aligned_free(read_page);
|
|
return 0;
|
|
}
|
|
if (mach_read_from_4(cur_page + FIL_PAGE_OFFSET) != j + 1 ||
|
|
memcmp(cur_page + FIL_PAGE_SPACE_ID,
|
|
page + FIL_PAGE_SPACE_ID, 4) ||
|
|
buf_page_is_corrupted(false, cur_page, flags))
|
|
goto next_page;
|
|
}
|
|
|
|
aligned_free(read_page);
|
|
page= find_page(page_id_t{space_id, 0}, LSN_MAX);
|
|
|
|
if (!page)
|
|
{
|
|
/* If the first page of the given user tablespace is not there
|
|
in the doublewrite buffer, then the recovery is going to fail
|
|
now. Report error only when doublewrite buffer is not empty */
|
|
sql_print_error("InnoDB: Corrupted page "
|
|
"[page id: space=" UINT32PF ", page number=0]"
|
|
" of datafile '%s' could not be found"
|
|
" in the doublewrite buffer", space_id, name);
|
|
break;
|
|
}
|
|
|
|
return space_id;
|
|
}
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
/** Validates this datafile for the purpose of recovery. The file should
|
|
exist and be successfully opened. We initially open it in read-only mode
|
|
because we just want to read the SpaceID. However, if the first page is
|
|
corrupt and needs to be restored from the doublewrite buffer, we will
|
|
reopen it in write mode and ry to restore that page.
|
|
@retval DB_SUCCESS if tablespace is valid, DB_ERROR if not.
|
|
m_is_valid is also set true on success, else false. */
|
|
dberr_t
|
|
Datafile::validate_for_recovery()
|
|
{
|
|
dberr_t err;
|
|
|
|
ut_ad(is_open());
|
|
ut_ad(!srv_read_only_mode);
|
|
|
|
err = validate_first_page(m_first_page);
|
|
|
|
switch (err) {
|
|
case DB_TABLESPACE_EXISTS:
|
|
break;
|
|
case DB_SUCCESS:
|
|
if (!m_defer || !m_space_id) {
|
|
break;
|
|
}
|
|
/* InnoDB should check whether the deferred
|
|
tablespace page0 can be recovered from
|
|
double write buffer. InnoDB should try
|
|
to recover only if m_space_id exists because
|
|
dblwr pages can be searched via {space_id, 0}.
|
|
m_space_id is set in read_first_page(). */
|
|
/* fall through */
|
|
default:
|
|
const page_t *first_page = nullptr;
|
|
|
|
if (!m_space_id) {
|
|
m_space_id = recv_sys.dblwr.find_first_page(
|
|
m_filepath, m_handle);
|
|
if (m_space_id) {
|
|
m_defer= false;
|
|
goto free_first_page;
|
|
} else return err;
|
|
}
|
|
|
|
if (!m_defer) {
|
|
err = find_space_id();
|
|
if (err != DB_SUCCESS || m_space_id == 0) {
|
|
sql_print_error(
|
|
"InnoDB: Datafile '%s' is corrupted."
|
|
" Cannot determine the space ID from"
|
|
" the first 64 pages.", m_filepath);
|
|
return(err);
|
|
}
|
|
}
|
|
|
|
if (m_space_id == UINT32_MAX) {
|
|
return DB_SUCCESS; /* empty file */
|
|
}
|
|
|
|
first_page = recv_sys.dblwr.find_page(
|
|
page_id_t(m_space_id, 0), LSN_MAX);
|
|
|
|
if (!first_page) {
|
|
return m_defer ? err : DB_CORRUPTION;
|
|
}
|
|
free_first_page:
|
|
/* Free the previously read first page and then re-validate. */
|
|
free_first_page();
|
|
m_defer = false;
|
|
err = validate_first_page(first_page);
|
|
}
|
|
|
|
return(err);
|
|
}
|
|
|
|
/** Check the consistency of the first page of a datafile when the
|
|
tablespace is opened. This occurs before the fil_space_t is created
|
|
so the Space ID found here must not already be open.
|
|
m_is_valid is set true on success, else false.
|
|
@param[in] first_page the contents of the first page
|
|
@retval DB_SUCCESS on if the datafile is valid
|
|
@retval DB_CORRUPTION if the datafile is not readable
|
|
@retval DB_TABLESPACE_EXISTS if there is a duplicate space_id */
|
|
dberr_t Datafile::validate_first_page(const page_t *first_page) noexcept
|
|
{
|
|
const char* error_txt = NULL;
|
|
|
|
m_is_valid = true;
|
|
ut_ad(first_page || !m_first_page);
|
|
|
|
if (first_page) {
|
|
if (dberr_t err = read_first_page_flags(first_page)) {
|
|
m_is_valid = false;
|
|
return err;
|
|
}
|
|
} else if (read_first_page(srv_read_only_mode) != DB_SUCCESS) {
|
|
error_txt = "Cannot read first page";
|
|
err_exit:
|
|
free_first_page();
|
|
|
|
if (recv_recovery_is_on()
|
|
|| srv_operation == SRV_OPERATION_BACKUP) {
|
|
m_defer= true;
|
|
return DB_SUCCESS;
|
|
}
|
|
|
|
sql_print_information(
|
|
"InnoDB: %s in datafile: %s, Space ID: " UINT32PF
|
|
", " "Flags: " UINT32PF,
|
|
error_txt, m_filepath, m_space_id, m_flags);
|
|
m_is_valid = false;
|
|
return DB_CORRUPTION;
|
|
} else {
|
|
first_page = m_first_page;
|
|
ut_ad(first_page);
|
|
}
|
|
|
|
/* Check if the whole page is blank. */
|
|
if (!m_space_id && !m_flags) {
|
|
const byte* b = first_page;
|
|
ulint nonzero_bytes = srv_page_size;
|
|
|
|
while (*b == '\0' && --nonzero_bytes != 0) {
|
|
|
|
b++;
|
|
}
|
|
|
|
if (nonzero_bytes == 0) {
|
|
error_txt = "Header page consists of zero bytes";
|
|
goto err_exit;
|
|
}
|
|
}
|
|
|
|
if (!fil_space_t::is_valid_flags(m_flags, m_space_id)) {
|
|
/* Tablespace flags must be valid. */
|
|
error_txt = "Tablespace flags are invalid";
|
|
goto err_exit;
|
|
}
|
|
|
|
ulint logical_size = fil_space_t::logical_size(m_flags);
|
|
|
|
if (srv_page_size != logical_size) {
|
|
free_first_page();
|
|
if (recv_recovery_is_on()
|
|
|| srv_operation == SRV_OPERATION_BACKUP) {
|
|
m_defer= true;
|
|
return DB_SUCCESS;
|
|
}
|
|
/* Logical size must be innodb_page_size. */
|
|
ib::error()
|
|
<< "Data file '" << m_filepath << "' uses page size "
|
|
<< logical_size << ", but the innodb_page_size"
|
|
" start-up parameter is "
|
|
<< srv_page_size;
|
|
return(DB_ERROR);
|
|
}
|
|
|
|
if (page_get_page_no(first_page) != 0) {
|
|
/* First page must be number 0 */
|
|
error_txt = "Header page contains inconsistent data";
|
|
goto err_exit;
|
|
}
|
|
|
|
if (m_space_id >= SRV_SPACE_ID_UPPER_BOUND) {
|
|
error_txt = "A bad Space ID was found";
|
|
goto err_exit;
|
|
}
|
|
|
|
switch (buf_page_is_corrupted(false, first_page, m_flags)) {
|
|
case NOT_CORRUPTED:
|
|
break;
|
|
case CORRUPTED_FUTURE_LSN:
|
|
error_txt = "LSN is in the future";
|
|
goto err_exit;
|
|
case CORRUPTED_OTHER:
|
|
error_txt = "Checksum mismatch";
|
|
goto err_exit;
|
|
}
|
|
|
|
mysql_mutex_lock(&fil_system.mutex);
|
|
|
|
fil_space_t* space = fil_space_get_by_id(m_space_id);
|
|
|
|
if (space) {
|
|
fil_node_t* node = UT_LIST_GET_FIRST(space->chain);
|
|
|
|
if (node && !strcmp(m_filepath, node->name)) {
|
|
ok_exit:
|
|
mysql_mutex_unlock(&fil_system.mutex);
|
|
return DB_SUCCESS;
|
|
}
|
|
|
|
if (!m_space_id
|
|
&& (recv_recovery_is_on()
|
|
|| srv_operation == SRV_OPERATION_BACKUP)) {
|
|
m_defer= true;
|
|
goto ok_exit;
|
|
}
|
|
|
|
/* Make sure the space_id has not already been opened. */
|
|
ib::error() << "Attempted to open a previously opened"
|
|
" tablespace. Previous tablespace: "
|
|
<< (node ? node->name : "(unknown)")
|
|
<< " uses space ID: " << m_space_id
|
|
<< ". Cannot open filepath: " << m_filepath
|
|
<< " which uses the same space ID.";
|
|
}
|
|
|
|
mysql_mutex_unlock(&fil_system.mutex);
|
|
|
|
if (space) {
|
|
m_is_valid = false;
|
|
|
|
free_first_page();
|
|
|
|
return(is_predefined_tablespace(m_space_id)
|
|
? DB_CORRUPTION
|
|
: DB_TABLESPACE_EXISTS);
|
|
}
|
|
|
|
return(DB_SUCCESS);
|
|
}
|
|
|
|
/** Determine the space id of the given file descriptor by reading a few
|
|
pages from the beginning of the .ibd file.
|
|
@return DB_SUCCESS if space id was successfully identified, else DB_ERROR. */
|
|
dberr_t
|
|
Datafile::find_space_id()
|
|
{
|
|
os_offset_t file_size;
|
|
|
|
ut_ad(m_handle != OS_FILE_CLOSED);
|
|
|
|
file_size = os_file_get_size(m_handle);
|
|
|
|
if (!file_size) {
|
|
return DB_SUCCESS;
|
|
}
|
|
|
|
if (file_size == (os_offset_t) -1) {
|
|
ib::error() << "Could not get file size of datafile '"
|
|
<< m_filepath << "'";
|
|
return(DB_CORRUPTION);
|
|
}
|
|
|
|
/* Assuming a page size, read the space_id from each page and store it
|
|
in a map. Find out which space_id is agreed on by majority of the
|
|
pages. Choose that space_id. */
|
|
for (ulint page_size = UNIV_ZIP_SIZE_MIN;
|
|
page_size <= UNIV_PAGE_SIZE_MAX;
|
|
page_size <<= 1) {
|
|
/* map[space_id] = count of pages */
|
|
typedef std::map<
|
|
uint32_t,
|
|
uint32_t,
|
|
std::less<uint32_t>,
|
|
ut_allocator<std::pair<const uint32_t, uint32_t> > >
|
|
Pages;
|
|
|
|
Pages verify;
|
|
uint32_t page_count = 64;
|
|
uint32_t valid_pages = 0;
|
|
|
|
/* Adjust the number of pages to analyze based on file size */
|
|
while ((page_count * page_size) > file_size) {
|
|
--page_count;
|
|
}
|
|
|
|
ib::info()
|
|
<< "Page size:" << page_size
|
|
<< ". Pages to analyze:" << page_count;
|
|
|
|
byte* page = static_cast<byte*>(
|
|
aligned_malloc(page_size, page_size));
|
|
|
|
uint32_t fsp_flags;
|
|
/* provide dummy value if the first os_file_read() fails */
|
|
switch (srv_checksum_algorithm) {
|
|
case SRV_CHECKSUM_ALGORITHM_STRICT_FULL_CRC32:
|
|
case SRV_CHECKSUM_ALGORITHM_FULL_CRC32:
|
|
fsp_flags = 1U << FSP_FLAGS_FCRC32_POS_MARKER
|
|
| FSP_FLAGS_FCRC32_PAGE_SSIZE()
|
|
| uint(innodb_compression_algorithm)
|
|
<< FSP_FLAGS_FCRC32_POS_COMPRESSED_ALGO;
|
|
break;
|
|
default:
|
|
fsp_flags = 0;
|
|
}
|
|
|
|
for (ulint j = 0; j < page_count; ++j) {
|
|
if (os_file_read(IORequestRead, m_handle, page,
|
|
j * page_size, page_size, nullptr)) {
|
|
ib::info()
|
|
<< "READ FAIL: page_no:" << j;
|
|
continue;
|
|
}
|
|
|
|
if (j == 0) {
|
|
fsp_flags = mach_read_from_4(
|
|
page + FSP_HEADER_OFFSET + FSP_SPACE_FLAGS);
|
|
}
|
|
|
|
bool noncompressed_ok = false;
|
|
|
|
/* For noncompressed pages, the page size must be
|
|
equal to srv_page_size. */
|
|
if (page_size == srv_page_size
|
|
&& !fil_space_t::zip_size(fsp_flags)) {
|
|
noncompressed_ok = !buf_page_is_corrupted(
|
|
false, page, fsp_flags);
|
|
}
|
|
|
|
bool compressed_ok = false;
|
|
|
|
if (srv_page_size <= UNIV_PAGE_SIZE_DEF
|
|
&& page_size == fil_space_t::zip_size(fsp_flags)) {
|
|
compressed_ok = !buf_page_is_corrupted(
|
|
false, page, fsp_flags);
|
|
}
|
|
|
|
if (noncompressed_ok || compressed_ok) {
|
|
|
|
uint32_t space_id = mach_read_from_4(page
|
|
+ FIL_PAGE_SPACE_ID);
|
|
|
|
if (space_id > 0) {
|
|
|
|
ib::info()
|
|
<< "VALID: space:"
|
|
<< space_id << " page_no:" << j
|
|
<< " page_size:" << page_size;
|
|
|
|
++valid_pages;
|
|
|
|
++verify[space_id];
|
|
}
|
|
}
|
|
}
|
|
|
|
aligned_free(page);
|
|
|
|
ib::info()
|
|
<< "Page size: " << page_size
|
|
<< ". Possible space_id count:" << verify.size();
|
|
|
|
const ulint pages_corrupted = 3;
|
|
|
|
for (ulint missed = 0; missed <= pages_corrupted; ++missed) {
|
|
|
|
for (Pages::const_iterator it = verify.begin();
|
|
it != verify.end();
|
|
++it) {
|
|
|
|
ib::info() << "space_id:" << it->first
|
|
<< ", Number of pages matched: "
|
|
<< it->second << "/" << valid_pages
|
|
<< " (" << page_size << ")";
|
|
|
|
if (it->second == (valid_pages - missed)) {
|
|
ib::info() << "Chosen space:"
|
|
<< it->first;
|
|
|
|
m_space_id = it->first;
|
|
return(DB_SUCCESS);
|
|
}
|
|
}
|
|
|
|
}
|
|
}
|
|
|
|
return(DB_CORRUPTION);
|
|
}
|
|
|
|
/** Read an InnoDB Symbolic Link (ISL) file by name.
|
|
@param link_filepath filepath of the ISL file
|
|
@return data file name (must be freed by the caller)
|
|
@retval nullptr on error */
|
|
static char *read_link_file(const char *link_filepath)
|
|
{
|
|
if (FILE* file= fopen(link_filepath, "r+b" STR_O_CLOEXEC))
|
|
{
|
|
char *filepath= static_cast<char*>(ut_malloc_nokey(OS_FILE_MAX_PATH));
|
|
|
|
os_file_read_string(file, filepath, OS_FILE_MAX_PATH);
|
|
fclose(file);
|
|
|
|
if (size_t len= strlen(filepath))
|
|
{
|
|
/* Trim whitespace from end of filepath */
|
|
len--;
|
|
while (static_cast<byte>(filepath[len]) <= 0x20)
|
|
{
|
|
if (!len)
|
|
return nullptr;
|
|
filepath[len--]= 0;
|
|
}
|
|
/* Ensure that the last 2 path separators are forward slashes,
|
|
because elsewhere we are assuming that tablespace file names end
|
|
in "/databasename/tablename.ibd". */
|
|
unsigned trailing_slashes= 0;
|
|
for (; len; len--)
|
|
{
|
|
switch (filepath[len]) {
|
|
#ifdef _WIN32
|
|
case '\\':
|
|
filepath[len]= '/';
|
|
/* fall through */
|
|
#endif
|
|
case '/':
|
|
if (++trailing_slashes >= 2)
|
|
return filepath;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
return nullptr;
|
|
}
|
|
|
|
/** Create a link filename,
|
|
open that file, and read the contents into m_filepath.
|
|
@param name table name
|
|
@return filepath()
|
|
@retval nullptr if the .isl file does not exist or cannot be read */
|
|
const char *RemoteDatafile::open_link_file(const fil_space_t::name_type name)
|
|
{
|
|
if (!m_link_filepath)
|
|
m_link_filepath= fil_make_filepath(nullptr, name, ISL, false);
|
|
m_filepath= read_link_file(m_link_filepath);
|
|
return m_filepath;
|
|
}
|
|
|
|
/** Release the resources. */
|
|
void
|
|
RemoteDatafile::shutdown()
|
|
{
|
|
Datafile::shutdown();
|
|
|
|
if (m_link_filepath != 0) {
|
|
ut_free(m_link_filepath);
|
|
m_link_filepath = 0;
|
|
}
|
|
}
|
|
|
|
/** Create InnoDB Symbolic Link (ISL) file.
|
|
@param name tablespace name
|
|
@param filepath full file name
|
|
@return DB_SUCCESS or error code */
|
|
dberr_t RemoteDatafile::create_link_file(fil_space_t::name_type name,
|
|
const char *filepath)
|
|
{
|
|
bool success;
|
|
dberr_t err = DB_SUCCESS;
|
|
char* link_filepath = NULL;
|
|
char* prev_filepath = NULL;
|
|
|
|
ut_ad(!srv_read_only_mode);
|
|
|
|
link_filepath = fil_make_filepath(NULL, name, ISL, false);
|
|
|
|
if (link_filepath == NULL) {
|
|
return(DB_ERROR);
|
|
}
|
|
|
|
prev_filepath = read_link_file(link_filepath);
|
|
if (prev_filepath) {
|
|
/* Truncate (starting with MySQL 5.6, probably no
|
|
longer since MariaDB Server 10.2.19) used to call this
|
|
with an existing link file which contains the same filepath. */
|
|
bool same = !strncmp(prev_filepath, name.data(), name.size())
|
|
&& !strcmp(prev_filepath + name.size(), DOT_IBD);
|
|
ut_free(prev_filepath);
|
|
if (same) {
|
|
ut_free(link_filepath);
|
|
return(DB_SUCCESS);
|
|
}
|
|
}
|
|
|
|
/** Check if the file already exists. */
|
|
FILE* file = NULL;
|
|
bool exists;
|
|
os_file_type_t ftype;
|
|
|
|
success = os_file_status(link_filepath, &exists, &ftype);
|
|
ulint error = 0;
|
|
|
|
if (success && !exists) {
|
|
|
|
file = fopen(link_filepath, "w");
|
|
if (file == NULL) {
|
|
/* This call will print its own error message */
|
|
error = os_file_get_last_error(true);
|
|
}
|
|
} else {
|
|
error = OS_FILE_ALREADY_EXISTS;
|
|
}
|
|
|
|
if (error != 0) {
|
|
|
|
ib::error() << "Cannot create file " << link_filepath << ".";
|
|
|
|
if (error == OS_FILE_ALREADY_EXISTS) {
|
|
ib::error() << "The link file: " << link_filepath
|
|
<< " already exists.";
|
|
err = DB_TABLESPACE_EXISTS;
|
|
|
|
} else if (error == OS_FILE_DISK_FULL) {
|
|
err = DB_OUT_OF_FILE_SPACE;
|
|
|
|
} else {
|
|
err = DB_ERROR;
|
|
}
|
|
|
|
/* file is not open, no need to close it. */
|
|
ut_free(link_filepath);
|
|
return(err);
|
|
}
|
|
|
|
const size_t len = strlen(filepath);
|
|
if (fwrite(filepath, 1, len, file) != len) {
|
|
error = os_file_get_last_error(true);
|
|
ib::error() <<
|
|
"Cannot write link file: "
|
|
<< link_filepath << " filepath: " << filepath;
|
|
err = DB_ERROR;
|
|
}
|
|
|
|
/* Close the file, we only need it at startup */
|
|
fclose(file);
|
|
|
|
ut_free(link_filepath);
|
|
|
|
return(err);
|
|
}
|
|
|
|
/** Delete an InnoDB Symbolic Link (ISL) file. */
|
|
void
|
|
RemoteDatafile::delete_link_file(void)
|
|
{
|
|
ut_ad(m_link_filepath != NULL);
|
|
|
|
if (m_link_filepath != NULL) {
|
|
os_file_delete_if_exists(innodb_data_file_key,
|
|
m_link_filepath, NULL);
|
|
}
|
|
}
|
|
|
|
/** Delete an InnoDB Symbolic Link (ISL) file by name.
|
|
@param name tablespace name */
|
|
void RemoteDatafile::delete_link_file(fil_space_t::name_type name)
|
|
{
|
|
if (char *link_filepath= fil_make_filepath(NULL, name, ISL, false))
|
|
{
|
|
os_file_delete_if_exists(innodb_data_file_key, link_filepath, nullptr);
|
|
ut_free(link_filepath);
|
|
}
|
|
}
|