mirror of
https://github.com/MariaDB/server.git
synced 2025-01-22 14:54:20 +01:00
1052 lines
24 KiB
C++
1052 lines
24 KiB
C++
/*****************************************************************************
|
|
|
|
Copyright (c) 2013, 2016, Oracle and/or its affiliates. All Rights Reserved.
|
|
|
|
This program is free software; you can redistribute it and/or modify it under
|
|
the terms of the GNU General Public License as published by the Free Software
|
|
Foundation; version 2 of the License.
|
|
|
|
This program is distributed in the hope that it will be useful, but WITHOUT
|
|
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License along with
|
|
this program; if not, write to the Free Software Foundation, Inc.,
|
|
51 Franklin Street, Suite 500, Boston, MA 02110-1335 USA
|
|
|
|
*****************************************************************************/
|
|
|
|
/**************************************************//**
|
|
@file fsp/fsp0space.cc
|
|
Multi file, shared, system tablespace implementation.
|
|
|
|
Created 2012-11-16 by Sunny Bains as srv/srv0space.cc
|
|
Refactored 2013-7-26 by Kevin Lewis
|
|
*******************************************************/
|
|
|
|
#include "ha_prototypes.h"
|
|
|
|
#include "fsp0sysspace.h"
|
|
#include "srv0start.h"
|
|
#include "trx0sys.h"
|
|
#ifndef UNIV_HOTBACKUP
|
|
#include "dict0load.h"
|
|
#include "mem0mem.h"
|
|
#include "os0file.h"
|
|
#include "row0mysql.h"
|
|
#include "ut0new.h"
|
|
|
|
/** The server header file is included to access opt_initialize global variable.
|
|
If server passes the option for create/open DB to SE, we should remove such
|
|
direct reference to server header and global variable */
|
|
#include "mysqld.h"
|
|
#else
|
|
my_bool opt_initialize = 0;
|
|
#endif /* !UNIV_HOTBACKUP */
|
|
|
|
/** The control info of the system tablespace. */
|
|
SysTablespace srv_sys_space;
|
|
|
|
/** The control info of a temporary table shared tablespace. */
|
|
SysTablespace srv_tmp_space;
|
|
|
|
/** If the last data file is auto-extended, we add this many pages to it
|
|
at a time. We have to make this public because it is a config variable. */
|
|
ulong sys_tablespace_auto_extend_increment;
|
|
|
|
#ifdef UNIV_DEBUG
|
|
/** Control if extra debug checks need to be done for temporary tablespace.
|
|
Default = true that is disable such checks.
|
|
This variable is not exposed to end-user but still kept as variable for
|
|
developer to enable it during debug. */
|
|
bool srv_skip_temp_table_checks_debug = true;
|
|
#endif /* UNIV_DEBUG */
|
|
|
|
/** Convert a numeric string that optionally ends in G or M or K,
|
|
to a number containing megabytes.
|
|
@param[in] str String with a quantity in bytes
|
|
@param[out] megs The number in megabytes
|
|
@return next character in string */
|
|
char*
|
|
SysTablespace::parse_units(
|
|
char* ptr,
|
|
ulint* megs)
|
|
{
|
|
char* endp;
|
|
|
|
*megs = strtoul(ptr, &endp, 10);
|
|
|
|
ptr = endp;
|
|
|
|
switch (*ptr) {
|
|
case 'G': case 'g':
|
|
*megs *= 1024;
|
|
/* fall through */
|
|
case 'M': case 'm':
|
|
++ptr;
|
|
break;
|
|
case 'K': case 'k':
|
|
*megs /= 1024;
|
|
++ptr;
|
|
break;
|
|
default:
|
|
*megs /= 1024 * 1024;
|
|
break;
|
|
}
|
|
|
|
return(ptr);
|
|
}
|
|
|
|
/** Parse the input params and populate member variables.
|
|
@param[in] filepath path to data files
|
|
@param[in] supports_raw true if the tablespace supports raw devices
|
|
@return true on success parse */
|
|
bool
|
|
SysTablespace::parse_params(
|
|
const char* filepath_spec,
|
|
bool supports_raw)
|
|
{
|
|
char* filepath;
|
|
ulint size;
|
|
char* input_str;
|
|
ulint n_files = 0;
|
|
|
|
ut_ad(m_last_file_size_max == 0);
|
|
ut_ad(!m_auto_extend_last_file);
|
|
|
|
char* new_str = mem_strdup(filepath_spec);
|
|
char* str = new_str;
|
|
|
|
input_str = str;
|
|
|
|
/*---------------------- PASS 1 ---------------------------*/
|
|
/* First calculate the number of data files and check syntax:
|
|
filepath:size[K |M | G];filepath:size[K |M | G]... .
|
|
Note that a Windows path may contain a drive name and a ':'. */
|
|
while (*str != '\0') {
|
|
filepath = str;
|
|
|
|
while ((*str != ':' && *str != '\0')
|
|
|| (*str == ':'
|
|
&& (*(str + 1) == '\\' || *(str + 1) == '/'
|
|
|| *(str + 1) == ':'))) {
|
|
str++;
|
|
}
|
|
|
|
if (*str == '\0') {
|
|
ut_free(new_str);
|
|
|
|
ib::error()
|
|
<< "syntax error in file path or size"
|
|
" specified is less than 1 megabyte";
|
|
return(false);
|
|
}
|
|
|
|
str++;
|
|
|
|
str = parse_units(str, &size);
|
|
|
|
if (0 == strncmp(str, ":autoextend",
|
|
(sizeof ":autoextend") - 1)) {
|
|
|
|
str += (sizeof ":autoextend") - 1;
|
|
|
|
if (0 == strncmp(str, ":max:",
|
|
(sizeof ":max:") - 1)) {
|
|
|
|
str += (sizeof ":max:") - 1;
|
|
|
|
str = parse_units(str, &size);
|
|
}
|
|
|
|
if (*str != '\0') {
|
|
ut_free(new_str);
|
|
ib::error()
|
|
<< "syntax error in file path or"
|
|
<< " size specified is less than"
|
|
<< " 1 megabyte";
|
|
return(false);
|
|
}
|
|
}
|
|
|
|
if (::strlen(str) >= 6
|
|
&& *str == 'n'
|
|
&& *(str + 1) == 'e'
|
|
&& *(str + 2) == 'w') {
|
|
|
|
if (!supports_raw) {
|
|
ib::error()
|
|
<< "Tablespace doesn't support raw"
|
|
" devices";
|
|
ut_free(new_str);
|
|
return(false);
|
|
}
|
|
|
|
str += 3;
|
|
}
|
|
|
|
if (*str == 'r' && *(str + 1) == 'a' && *(str + 2) == 'w') {
|
|
str += 3;
|
|
|
|
if (!supports_raw) {
|
|
ib::error()
|
|
<< "Tablespace doesn't support raw"
|
|
" devices";
|
|
ut_free(new_str);
|
|
return(false);
|
|
}
|
|
}
|
|
|
|
if (size == 0) {
|
|
|
|
ut_free(new_str);
|
|
|
|
ib::error()
|
|
<< "syntax error in file path or size"
|
|
" specified is less than 1 megabyte";
|
|
|
|
return(false);
|
|
}
|
|
|
|
++n_files;
|
|
|
|
if (*str == ';') {
|
|
str++;
|
|
} else if (*str != '\0') {
|
|
ut_free(new_str);
|
|
|
|
ib::error()
|
|
<< "syntax error in file path or size"
|
|
" specified is less than 1 megabyte";
|
|
return(false);
|
|
}
|
|
}
|
|
|
|
if (n_files == 0) {
|
|
|
|
/* filepath_spec must contain at least one data file
|
|
definition */
|
|
|
|
ut_free(new_str);
|
|
|
|
ib::error()
|
|
<< "syntax error in file path or size specified"
|
|
" is less than 1 megabyte";
|
|
|
|
return(false);
|
|
}
|
|
|
|
/*---------------------- PASS 2 ---------------------------*/
|
|
/* Then store the actual values to our arrays */
|
|
str = input_str;
|
|
ulint order = 0;
|
|
|
|
while (*str != '\0') {
|
|
filepath = str;
|
|
|
|
/* Note that we must step over the ':' in a Windows filepath;
|
|
a Windows path normally looks like C:\ibdata\ibdata1:1G, but
|
|
a Windows raw partition may have a specification like
|
|
\\.\C::1Gnewraw or \\.\PHYSICALDRIVE2:1Gnewraw */
|
|
|
|
while ((*str != ':' && *str != '\0')
|
|
|| (*str == ':'
|
|
&& (*(str + 1) == '\\' || *(str + 1) == '/'
|
|
|| *(str + 1) == ':'))) {
|
|
str++;
|
|
}
|
|
|
|
if (*str == ':') {
|
|
/* Make filepath a null-terminated string */
|
|
*str = '\0';
|
|
str++;
|
|
}
|
|
|
|
str = parse_units(str, &size);
|
|
|
|
if (0 == strncmp(str, ":autoextend",
|
|
(sizeof ":autoextend") - 1)) {
|
|
|
|
m_auto_extend_last_file = true;
|
|
|
|
str += (sizeof ":autoextend") - 1;
|
|
|
|
if (0 == strncmp(str, ":max:",
|
|
(sizeof ":max:") - 1)) {
|
|
|
|
str += (sizeof ":max:") - 1;
|
|
|
|
str = parse_units(str, &m_last_file_size_max);
|
|
}
|
|
|
|
if (*str != '\0') {
|
|
ut_free(new_str);
|
|
ib::error() << "syntax error in file path or"
|
|
" size specified is less than 1"
|
|
" megabyte";
|
|
return(false);
|
|
}
|
|
}
|
|
|
|
m_files.push_back(Datafile(filepath, flags(), size, order));
|
|
Datafile* datafile = &m_files.back();
|
|
datafile->make_filepath(path(), filepath, NO_EXT);
|
|
|
|
if (::strlen(str) >= 6
|
|
&& *str == 'n'
|
|
&& *(str + 1) == 'e'
|
|
&& *(str + 2) == 'w') {
|
|
|
|
ut_a(supports_raw);
|
|
|
|
str += 3;
|
|
|
|
/* Initialize new raw device only during initialize */
|
|
/* JAN: TODO: MySQL 5.7 used opt_initialize */
|
|
m_files.back().m_type =
|
|
opt_bootstrap ? SRV_NEW_RAW : SRV_OLD_RAW;
|
|
}
|
|
|
|
if (*str == 'r' && *(str + 1) == 'a' && *(str + 2) == 'w') {
|
|
|
|
ut_a(supports_raw);
|
|
|
|
str += 3;
|
|
|
|
/* Initialize new raw device only during initialize */
|
|
if (m_files.back().m_type == SRV_NOT_RAW) {
|
|
/* JAN: TODO: MySQL 5.7 used opt_initialize */
|
|
m_files.back().m_type =
|
|
opt_bootstrap ? SRV_NEW_RAW : SRV_OLD_RAW;
|
|
}
|
|
}
|
|
|
|
if (*str == ';') {
|
|
++str;
|
|
}
|
|
order++;
|
|
}
|
|
|
|
ut_ad(n_files == ulint(m_files.size()));
|
|
|
|
ut_free(new_str);
|
|
|
|
return(true);
|
|
}
|
|
|
|
/** Frees the memory allocated by the parse method. */
|
|
void
|
|
SysTablespace::shutdown()
|
|
{
|
|
Tablespace::shutdown();
|
|
|
|
m_auto_extend_last_file = 0;
|
|
m_last_file_size_max = 0;
|
|
m_created_new_raw = 0;
|
|
m_is_tablespace_full = false;
|
|
m_sanity_checks_done = false;
|
|
}
|
|
|
|
/** Verify the size of the physical file.
|
|
@param[in] file data file object
|
|
@return DB_SUCCESS if OK else error code. */
|
|
dberr_t
|
|
SysTablespace::check_size(
|
|
Datafile& file)
|
|
{
|
|
os_offset_t size = os_file_get_size(file.m_handle);
|
|
ut_a(size != (os_offset_t) -1);
|
|
|
|
/* Under some error conditions like disk full scenarios
|
|
or file size reaching filesystem limit the data file
|
|
could contain an incomplete extent at the end. When we
|
|
extend a data file and if some failure happens, then
|
|
also the data file could contain an incomplete extent.
|
|
So we need to round the size downward to a megabyte.*/
|
|
|
|
const ulint rounded_size_pages = static_cast<ulint>(
|
|
size >> UNIV_PAGE_SIZE_SHIFT);
|
|
|
|
/* If last file */
|
|
if (&file == &m_files.back() && m_auto_extend_last_file) {
|
|
|
|
if (file.m_size > rounded_size_pages
|
|
|| (m_last_file_size_max > 0
|
|
&& m_last_file_size_max < rounded_size_pages)) {
|
|
ib::error() << "The Auto-extending " << name()
|
|
<< " data file '" << file.filepath() << "' is"
|
|
" of a different size " << rounded_size_pages
|
|
<< " pages than specified"
|
|
" in the .cnf file: initial " << file.m_size
|
|
<< " pages, max " << m_last_file_size_max
|
|
<< " (relevant if non-zero) pages!";
|
|
return(DB_ERROR);
|
|
}
|
|
|
|
file.m_size = rounded_size_pages;
|
|
}
|
|
|
|
if (rounded_size_pages != file.m_size) {
|
|
ib::error() << "The " << name() << " data file '"
|
|
<< file.filepath() << "' is of a different size "
|
|
<< rounded_size_pages << " pages"
|
|
" than the " << file.m_size << " pages specified in"
|
|
" the .cnf file!";
|
|
return(DB_ERROR);
|
|
}
|
|
|
|
return(DB_SUCCESS);
|
|
}
|
|
|
|
/** Set the size of the file.
|
|
@param[in] file data file object
|
|
@return DB_SUCCESS or error code */
|
|
dberr_t
|
|
SysTablespace::set_size(
|
|
Datafile& file)
|
|
{
|
|
ut_a(!srv_read_only_mode || m_ignore_read_only);
|
|
|
|
/* We created the data file and now write it full of zeros */
|
|
ib::info() << "Setting file '" << file.filepath() << "' size to "
|
|
<< (file.m_size >> (20 - UNIV_PAGE_SIZE_SHIFT)) << " MB."
|
|
" Physically writing the file full; Please wait ...";
|
|
|
|
bool success = os_file_set_size(
|
|
file.m_filepath, file.m_handle,
|
|
static_cast<os_offset_t>(file.m_size << UNIV_PAGE_SIZE_SHIFT),
|
|
m_ignore_read_only ? false : srv_read_only_mode);
|
|
|
|
if (success) {
|
|
ib::info() << "File '" << file.filepath() << "' size is now "
|
|
<< (file.m_size >> (20 - UNIV_PAGE_SIZE_SHIFT))
|
|
<< " MB.";
|
|
} else {
|
|
ib::error() << "Could not set the file size of '"
|
|
<< file.filepath() << "'. Probably out of disk space";
|
|
|
|
return(DB_ERROR);
|
|
}
|
|
|
|
return(DB_SUCCESS);
|
|
}
|
|
|
|
/** Create a data file.
|
|
@param[in] file data file object
|
|
@return DB_SUCCESS or error code */
|
|
dberr_t
|
|
SysTablespace::create_file(
|
|
Datafile& file)
|
|
{
|
|
dberr_t err = DB_SUCCESS;
|
|
|
|
ut_a(!file.m_exists);
|
|
ut_a(!srv_read_only_mode || m_ignore_read_only);
|
|
|
|
switch (file.m_type) {
|
|
case SRV_NEW_RAW:
|
|
|
|
/* The partition is opened, not created; then it is
|
|
written over */
|
|
m_created_new_raw = true;
|
|
|
|
/* Fall through. */
|
|
|
|
case SRV_OLD_RAW:
|
|
|
|
srv_start_raw_disk_in_use = TRUE;
|
|
|
|
/* Fall through. */
|
|
|
|
case SRV_NOT_RAW:
|
|
err = file.open_or_create(
|
|
m_ignore_read_only ? false : srv_read_only_mode);
|
|
break;
|
|
}
|
|
|
|
|
|
if (err == DB_SUCCESS && file.m_type != SRV_OLD_RAW) {
|
|
err = set_size(file);
|
|
}
|
|
|
|
return(err);
|
|
}
|
|
|
|
/** Open a data file.
|
|
@param[in] file data file object
|
|
@return DB_SUCCESS or error code */
|
|
dberr_t
|
|
SysTablespace::open_file(
|
|
Datafile& file)
|
|
{
|
|
dberr_t err = DB_SUCCESS;
|
|
|
|
ut_a(file.m_exists);
|
|
|
|
switch (file.m_type) {
|
|
case SRV_NEW_RAW:
|
|
/* The partition is opened, not created; then it is
|
|
written over */
|
|
m_created_new_raw = true;
|
|
|
|
/* Fall through */
|
|
|
|
case SRV_OLD_RAW:
|
|
srv_start_raw_disk_in_use = TRUE;
|
|
|
|
if (srv_read_only_mode && !m_ignore_read_only) {
|
|
ib::error() << "Can't open a raw device '"
|
|
<< file.m_filepath << "' when"
|
|
" --innodb-read-only is set";
|
|
|
|
return(DB_ERROR);
|
|
}
|
|
|
|
/* Fall through */
|
|
|
|
case SRV_NOT_RAW:
|
|
err = file.open_or_create(
|
|
m_ignore_read_only ? false : srv_read_only_mode);
|
|
|
|
if (err != DB_SUCCESS) {
|
|
return(err);
|
|
}
|
|
break;
|
|
}
|
|
|
|
switch (file.m_type) {
|
|
case SRV_NEW_RAW:
|
|
/* Set file size for new raw device. */
|
|
err = set_size(file);
|
|
break;
|
|
|
|
case SRV_NOT_RAW:
|
|
/* Check file size for existing file. */
|
|
err = check_size(file);
|
|
break;
|
|
|
|
case SRV_OLD_RAW:
|
|
err = DB_SUCCESS;
|
|
break;
|
|
|
|
}
|
|
|
|
if (err != DB_SUCCESS) {
|
|
file.close();
|
|
}
|
|
|
|
return(err);
|
|
}
|
|
|
|
#ifndef UNIV_HOTBACKUP
|
|
/** Check the tablespace header for this tablespace.
|
|
@param[out] flushed_lsn the value of FIL_PAGE_FILE_FLUSH_LSN
|
|
@return DB_SUCCESS or error code */
|
|
dberr_t
|
|
SysTablespace::read_lsn_and_check_flags(lsn_t* flushed_lsn)
|
|
{
|
|
dberr_t err;
|
|
|
|
/* Only relevant for the system tablespace. */
|
|
ut_ad(space_id() == TRX_SYS_SPACE);
|
|
|
|
files_t::iterator it = m_files.begin();
|
|
|
|
ut_a(it->m_exists);
|
|
|
|
if (it->m_handle == OS_FILE_CLOSED) {
|
|
|
|
err = it->open_or_create(
|
|
m_ignore_read_only ? false : srv_read_only_mode);
|
|
|
|
if (err != DB_SUCCESS) {
|
|
return(err);
|
|
}
|
|
}
|
|
|
|
err = it->read_first_page(
|
|
m_ignore_read_only ? false : srv_read_only_mode);
|
|
|
|
m_crypt_info = it->m_crypt_info;
|
|
|
|
if (err != DB_SUCCESS) {
|
|
return(err);
|
|
}
|
|
|
|
ut_a(it->order() == 0);
|
|
|
|
|
|
buf_dblwr_init_or_load_pages(it->handle(), it->filepath());
|
|
|
|
/* Check the contents of the first page of the
|
|
first datafile. */
|
|
for (int retry = 0; retry < 2; ++retry) {
|
|
|
|
err = it->validate_first_page(flushed_lsn, false);
|
|
|
|
if (err != DB_SUCCESS
|
|
&& (retry == 1
|
|
|| it->restore_from_doublewrite(0) != DB_SUCCESS)) {
|
|
|
|
it->close();
|
|
|
|
return(err);
|
|
}
|
|
}
|
|
|
|
/* Make sure the tablespace space ID matches the
|
|
space ID on the first page of the first datafile. */
|
|
if (space_id() != it->m_space_id) {
|
|
|
|
ib::error()
|
|
<< "The " << name() << " data file '" << it->name()
|
|
<< "' has the wrong space ID. It should be "
|
|
<< space_id() << ", but " << it->m_space_id
|
|
<< " was found";
|
|
|
|
it->close();
|
|
|
|
return(err);
|
|
}
|
|
|
|
it->close();
|
|
|
|
return(DB_SUCCESS);
|
|
}
|
|
#endif /* !UNIV_HOTBACKUP */
|
|
/** Check if a file can be opened in the correct mode.
|
|
@param[in] file data file object
|
|
@param[out] reason exact reason if file_status check failed.
|
|
@return DB_SUCCESS or error code. */
|
|
dberr_t
|
|
SysTablespace::check_file_status(
|
|
const Datafile& file,
|
|
file_status_t& reason)
|
|
{
|
|
os_file_stat_t stat;
|
|
|
|
memset(&stat, 0x0, sizeof(stat));
|
|
|
|
dberr_t err = os_file_get_status(
|
|
file.m_filepath, &stat, true,
|
|
m_ignore_read_only ? false : srv_read_only_mode);
|
|
|
|
reason = FILE_STATUS_VOID;
|
|
/* File exists but we can't read the rw-permission settings. */
|
|
switch (err) {
|
|
case DB_FAIL:
|
|
ib::error() << "os_file_get_status() failed on '"
|
|
<< file.filepath()
|
|
<< "'. Can't determine file permissions";
|
|
err = DB_ERROR;
|
|
reason = FILE_STATUS_RW_PERMISSION_ERROR;
|
|
break;
|
|
|
|
case DB_SUCCESS:
|
|
|
|
/* Note: stat.rw_perm is only valid for "regular" files */
|
|
|
|
if (stat.type == OS_FILE_TYPE_FILE) {
|
|
|
|
if (!stat.rw_perm) {
|
|
const char *p = (!srv_read_only_mode
|
|
|| m_ignore_read_only)
|
|
? "writable"
|
|
: "readable";
|
|
|
|
ib::error() << "The " << name() << " data file"
|
|
<< " '" << file.name() << "' must be "
|
|
<< p;
|
|
|
|
err = DB_ERROR;
|
|
reason = FILE_STATUS_READ_WRITE_ERROR;
|
|
}
|
|
|
|
} else {
|
|
/* Not a regular file, bail out. */
|
|
ib::error() << "The " << name() << " data file '"
|
|
<< file.name() << "' is not a regular"
|
|
" InnoDB data file.";
|
|
|
|
err = DB_ERROR;
|
|
reason = FILE_STATUS_NOT_REGULAR_FILE_ERROR;
|
|
}
|
|
break;
|
|
|
|
case DB_NOT_FOUND:
|
|
break;
|
|
|
|
default:
|
|
ut_ad(0);
|
|
}
|
|
|
|
return(err);
|
|
}
|
|
|
|
/** Note that the data file was not found.
|
|
@param[in] file data file object
|
|
@param[out] create_new_db true if a new instance to be created
|
|
@return DB_SUCESS or error code */
|
|
dberr_t
|
|
SysTablespace::file_not_found(
|
|
Datafile& file,
|
|
bool* create_new_db)
|
|
{
|
|
file.m_exists = false;
|
|
|
|
if (srv_read_only_mode && !m_ignore_read_only) {
|
|
ib::error() << "Can't create file '" << file.filepath()
|
|
<< "' when --innodb-read-only is set";
|
|
|
|
return(DB_ERROR);
|
|
|
|
} else if (&file == &m_files.front()) {
|
|
|
|
/* First data file. */
|
|
ut_a(!*create_new_db);
|
|
*create_new_db = TRUE;
|
|
|
|
if (space_id() == TRX_SYS_SPACE) {
|
|
ib::info() << "The first " << name() << " data file '"
|
|
<< file.name() << "' did not exist."
|
|
" A new tablespace will be created!";
|
|
}
|
|
|
|
} else {
|
|
ib::info() << "Need to create a new " << name()
|
|
<< " data file '" << file.name() << "'.";
|
|
}
|
|
|
|
/* Set the file create mode. */
|
|
switch (file.m_type) {
|
|
case SRV_NOT_RAW:
|
|
file.set_open_flags(OS_FILE_CREATE);
|
|
break;
|
|
|
|
case SRV_NEW_RAW:
|
|
case SRV_OLD_RAW:
|
|
file.set_open_flags(OS_FILE_OPEN_RAW);
|
|
break;
|
|
}
|
|
|
|
return(DB_SUCCESS);
|
|
}
|
|
|
|
/** Note that the data file was found.
|
|
@param[in,out] file data file object
|
|
@return true if a new instance to be created */
|
|
bool
|
|
SysTablespace::file_found(
|
|
Datafile& file)
|
|
{
|
|
/* Note that the file exists and can be opened
|
|
in the appropriate mode. */
|
|
file.m_exists = true;
|
|
|
|
/* Set the file open mode */
|
|
switch (file.m_type) {
|
|
case SRV_NOT_RAW:
|
|
file.set_open_flags(
|
|
&file == &m_files.front()
|
|
? OS_FILE_OPEN_RETRY : OS_FILE_OPEN);
|
|
break;
|
|
|
|
case SRV_NEW_RAW:
|
|
case SRV_OLD_RAW:
|
|
file.set_open_flags(OS_FILE_OPEN_RAW);
|
|
break;
|
|
}
|
|
|
|
/* Need to create the system tablespace for new raw device. */
|
|
return(file.m_type == SRV_NEW_RAW);
|
|
}
|
|
#ifndef UNIV_HOTBACKUP
|
|
/** Check the data file specification.
|
|
@param[out] create_new_db true if a new database is to be created
|
|
@param[in] min_expected_size Minimum expected tablespace size in bytes
|
|
@return DB_SUCCESS if all OK else error code */
|
|
dberr_t
|
|
SysTablespace::check_file_spec(
|
|
bool* create_new_db,
|
|
ulint min_expected_size)
|
|
{
|
|
*create_new_db = FALSE;
|
|
|
|
if (m_files.size() >= 1000) {
|
|
ib::error() << "There must be < 1000 data files in "
|
|
<< name() << " but " << m_files.size() << " have been"
|
|
" defined.";
|
|
|
|
return(DB_ERROR);
|
|
}
|
|
|
|
if (!m_auto_extend_last_file
|
|
&& get_sum_of_sizes() < min_expected_size / UNIV_PAGE_SIZE) {
|
|
|
|
ib::error() << "Tablespace size must be at least "
|
|
<< min_expected_size / (1024 * 1024) << " MB";
|
|
|
|
return(DB_ERROR);
|
|
}
|
|
|
|
dberr_t err = DB_SUCCESS;
|
|
|
|
ut_a(!m_files.empty());
|
|
|
|
/* If there is more than one data file and the last data file
|
|
doesn't exist, that is OK. We allow adding of new data files. */
|
|
|
|
files_t::iterator begin = m_files.begin();
|
|
files_t::iterator end = m_files.end();
|
|
|
|
for (files_t::iterator it = begin; it != end; ++it) {
|
|
|
|
file_status_t reason_if_failed;
|
|
err = check_file_status(*it, reason_if_failed);
|
|
|
|
if (err == DB_NOT_FOUND) {
|
|
|
|
err = file_not_found(*it, create_new_db);
|
|
|
|
if (err != DB_SUCCESS) {
|
|
break;
|
|
}
|
|
|
|
} else if (err != DB_SUCCESS) {
|
|
if (reason_if_failed == FILE_STATUS_READ_WRITE_ERROR) {
|
|
const char* p = (!srv_read_only_mode
|
|
|| m_ignore_read_only)
|
|
? "writable" : "readable";
|
|
ib::error() << "The " << name() << " data file"
|
|
<< " '" << it->name() << "' must be "
|
|
<< p;
|
|
}
|
|
|
|
ut_a(err != DB_FAIL);
|
|
break;
|
|
|
|
} else if (*create_new_db) {
|
|
ib::error() << "The " << name() << " data file '"
|
|
<< begin->m_name << "' was not found but"
|
|
" one of the other data files '" << it->m_name
|
|
<< "' exists.";
|
|
|
|
err = DB_ERROR;
|
|
break;
|
|
|
|
} else {
|
|
*create_new_db = file_found(*it);
|
|
}
|
|
}
|
|
|
|
/* We assume doublewirte blocks in the first data file. */
|
|
if (err == DB_SUCCESS && *create_new_db
|
|
&& begin->m_size < TRX_SYS_DOUBLEWRITE_BLOCK_SIZE * 3) {
|
|
ib::error() << "The " << name() << " data file "
|
|
<< "'" << begin->name() << "' must be at least "
|
|
<< TRX_SYS_DOUBLEWRITE_BLOCK_SIZE * 3 * UNIV_PAGE_SIZE
|
|
/ (1024 * 1024) << " MB";
|
|
|
|
err = DB_ERROR;
|
|
}
|
|
|
|
return(err);
|
|
}
|
|
|
|
/** Open or create the data files
|
|
@param[in] is_temp whether this is a temporary tablespace
|
|
@param[in] create_new_db whether we are creating a new database
|
|
@param[out] sum_new_sizes sum of sizes of the new files added
|
|
@param[out] flush_lsn FIL_PAGE_FILE_FLUSH_LSN of first file
|
|
@return DB_SUCCESS or error code */
|
|
dberr_t
|
|
SysTablespace::open_or_create(
|
|
bool is_temp,
|
|
bool create_new_db,
|
|
ulint* sum_new_sizes,
|
|
lsn_t* flush_lsn)
|
|
{
|
|
dberr_t err = DB_SUCCESS;
|
|
fil_space_t* space = NULL;
|
|
|
|
ut_ad(!m_files.empty());
|
|
|
|
if (sum_new_sizes) {
|
|
*sum_new_sizes = 0;
|
|
}
|
|
|
|
files_t::iterator begin = m_files.begin();
|
|
files_t::iterator end = m_files.end();
|
|
|
|
ut_ad(begin->order() == 0);
|
|
|
|
for (files_t::iterator it = begin; it != end; ++it) {
|
|
|
|
if (it->m_exists) {
|
|
err = open_file(*it);
|
|
|
|
/* For new raw device increment new size. */
|
|
if (sum_new_sizes && it->m_type == SRV_NEW_RAW) {
|
|
|
|
*sum_new_sizes += it->m_size;
|
|
}
|
|
|
|
} else {
|
|
err = create_file(*it);
|
|
|
|
if (sum_new_sizes) {
|
|
*sum_new_sizes += it->m_size;
|
|
}
|
|
|
|
/* Set the correct open flags now that we have
|
|
successfully created the file. */
|
|
if (err == DB_SUCCESS) {
|
|
/* We ignore new_db OUT parameter here
|
|
as the information is known at this stage */
|
|
file_found(*it);
|
|
}
|
|
}
|
|
|
|
if (err != DB_SUCCESS) {
|
|
return(err);
|
|
}
|
|
|
|
#ifdef UNIV_LINUX
|
|
/* Note: This should really be per node and not per
|
|
tablespace because a tablespace can contain multiple
|
|
files (nodes). The implication is that all files of
|
|
the tablespace should be on the same medium. */
|
|
|
|
it->m_atomic_write
|
|
= fil_fusionio_enable_atomic_write(it->m_handle);
|
|
|
|
if (it->m_atomic_write && srv_use_doublewrite_buf) {
|
|
ib::info() << "FusionIO atomic IO enabled,"
|
|
" disabling the double write buffer";
|
|
|
|
srv_use_doublewrite_buf = false;
|
|
}
|
|
#else
|
|
it->m_atomic_write = false;
|
|
#endif
|
|
}
|
|
|
|
if (!create_new_db && flush_lsn) {
|
|
/* Validate the header page in the first datafile
|
|
and read LSNs fom the others. */
|
|
err = read_lsn_and_check_flags(flush_lsn);
|
|
if (err != DB_SUCCESS) {
|
|
return(err);
|
|
}
|
|
}
|
|
|
|
/* Close the curent handles, add space and file info to the
|
|
fil_system cache and the Data Dictionary, and re-open them
|
|
in file_system cache so that they stay open until shutdown. */
|
|
ulint node_counter = 0;
|
|
for (files_t::iterator it = begin; it != end; ++it) {
|
|
it->close();
|
|
it->m_exists = true;
|
|
|
|
if (it == begin) {
|
|
/* First data file. */
|
|
|
|
/* Create the tablespace entry for the multi-file
|
|
tablespace in the tablespace manager. */
|
|
|
|
if (!m_crypt_info) {
|
|
/* Create default crypt info for system
|
|
tablespace if it does not yet exists. */
|
|
m_crypt_info = fil_space_create_crypt_data(
|
|
FIL_SPACE_ENCRYPTION_DEFAULT,
|
|
FIL_DEFAULT_ENCRYPTION_KEY);
|
|
}
|
|
|
|
space = fil_space_create(
|
|
name(), space_id(), flags(), is_temp
|
|
? FIL_TYPE_TEMPORARY : FIL_TYPE_TABLESPACE, m_crypt_info,
|
|
false);
|
|
}
|
|
|
|
ut_a(fil_validate());
|
|
|
|
ulint max_size = (++node_counter == m_files.size()
|
|
? (m_last_file_size_max == 0
|
|
? ULINT_MAX
|
|
: m_last_file_size_max)
|
|
: it->m_size);
|
|
|
|
/* Add the datafile to the fil_system cache. */
|
|
if (!fil_node_create(
|
|
it->m_filepath, it->m_size,
|
|
space, it->m_type != SRV_NOT_RAW,
|
|
it->m_atomic_write, max_size)) {
|
|
|
|
err = DB_ERROR;
|
|
break;
|
|
}
|
|
}
|
|
|
|
return(err);
|
|
}
|
|
#endif /* UNIV_HOTBACKUP */
|
|
/** Normalize the file size, convert from megabytes to number of pages. */
|
|
void
|
|
SysTablespace::normalize()
|
|
{
|
|
files_t::iterator end = m_files.end();
|
|
|
|
for (files_t::iterator it = m_files.begin(); it != end; ++it) {
|
|
|
|
it->m_size *= (1024 * 1024) / UNIV_PAGE_SIZE;
|
|
}
|
|
|
|
m_last_file_size_max *= (1024 * 1024) / UNIV_PAGE_SIZE;
|
|
}
|
|
|
|
|
|
/**
|
|
@return next increment size */
|
|
ulint
|
|
SysTablespace::get_increment() const
|
|
{
|
|
ulint increment;
|
|
|
|
if (m_last_file_size_max == 0) {
|
|
increment = get_autoextend_increment();
|
|
} else {
|
|
|
|
if (!is_valid_size()) {
|
|
ib::error() << "The last data file in " << name()
|
|
<< " has a size of " << last_file_size()
|
|
<< " but the max size allowed is "
|
|
<< m_last_file_size_max;
|
|
}
|
|
|
|
increment = m_last_file_size_max - last_file_size();
|
|
}
|
|
|
|
if (increment > get_autoextend_increment()) {
|
|
increment = get_autoextend_increment();
|
|
}
|
|
|
|
return(increment);
|
|
}
|
|
|
|
|
|
/**
|
|
@return true if configured to use raw devices */
|
|
bool
|
|
SysTablespace::has_raw_device()
|
|
{
|
|
files_t::iterator end = m_files.end();
|
|
|
|
for (files_t::iterator it = m_files.begin(); it != end; ++it) {
|
|
|
|
if (it->is_raw_device()) {
|
|
return(true);
|
|
}
|
|
}
|
|
|
|
return(false);
|
|
}
|