2012-08-01 16:27:34 +02:00
|
|
|
/*****************************************************************************
|
|
|
|
|
2017-01-06 15:18:54 +01:00
|
|
|
Copyright (c) 2011, 2017, Oracle and/or its affiliates. All Rights Reserved.
|
|
|
|
Copyright (c) 2017, MariaDB Corporation.
|
2012-08-01 16:27:34 +02:00
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify it under
|
|
|
|
the terms of the GNU General Public License as published by the Free Software
|
|
|
|
Foundation; version 2 of the License.
|
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful, but WITHOUT
|
|
|
|
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
|
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License along with
|
|
|
|
this program; if not, write to the Free Software Foundation, Inc.,
|
|
|
|
51 Franklin Street, Suite 500, Boston, MA 02110-1335 USA
|
|
|
|
|
|
|
|
*****************************************************************************/
|
|
|
|
|
|
|
|
/**************************************************//**
|
|
|
|
@file buf/buf0dump.cc
|
|
|
|
Implements a buffer pool dump/load.
|
|
|
|
|
|
|
|
Created April 08, 2011 Vasil Dimov
|
|
|
|
*******************************************************/
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
#include "my_global.h"
|
|
|
|
#include "my_sys.h"
|
|
|
|
|
|
|
|
#include "mysql/psi/mysql_stage.h"
|
|
|
|
#include "mysql/psi/psi.h"
|
2013-03-25 23:03:13 +01:00
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
#include "univ.i"
|
2012-08-01 16:27:34 +02:00
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
#include "buf0buf.h"
|
2012-08-01 16:27:34 +02:00
|
|
|
#include "buf0dump.h"
|
2016-08-12 10:17:45 +02:00
|
|
|
#include "dict0dict.h"
|
|
|
|
#include "os0file.h"
|
|
|
|
#include "os0thread.h"
|
|
|
|
#include "srv0srv.h"
|
|
|
|
#include "srv0start.h"
|
|
|
|
#include "sync0rw.h"
|
|
|
|
#include "ut0byte.h"
|
|
|
|
|
|
|
|
#include <algorithm>
|
2012-08-01 16:27:34 +02:00
|
|
|
|
2017-08-31 07:27:59 +02:00
|
|
|
#include "mysql/service_wsrep.h" /* wsrep_recovery */
|
2012-08-01 16:27:34 +02:00
|
|
|
|
|
|
|
/** Severity attached to a dump/load status message; selects the log stream
used by buf_dump_status() and buf_load_status(). */
enum status_severity {
	STATUS_INFO,	/*!< reported through ib::info() */
	STATUS_ERR	/*!< reported through ib::error() */
};
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
/** Evaluates to true once srv_shutdown_state is anything other than
SRV_SHUTDOWN_NONE. */
#define SHUTTING_DOWN() (srv_shutdown_state != SRV_SHUTDOWN_NONE)
|
2012-08-01 16:27:34 +02:00
|
|
|
|
|
|
|
/* Flags that tell the buffer pool dump/load thread which action should it
|
|
|
|
take after being waked up. */
|
2017-02-17 09:32:21 +01:00
|
|
|
static volatile bool buf_dump_should_start;
|
|
|
|
static volatile bool buf_load_should_start;
|
2012-08-01 16:27:34 +02:00
|
|
|
|
|
|
|
static ibool buf_load_abort_flag = FALSE;
|
|
|
|
|
|
|
|
/* Used to temporary store dump info in order to avoid IO while holding
|
|
|
|
buffer pool mutex during dump and also to sort the contents of the dump
|
|
|
|
before reading the pages from disk during load.
|
|
|
|
We store the space id in the high 32 bits and page no in low 32 bits. */
|
|
|
|
typedef ib_uint64_t buf_dump_t;
|
|
|
|
|
|
|
|
/* Aux macros to create buf_dump_t and to extract space and page from it */
|
|
|
|
#define BUF_DUMP_CREATE(space, page) ut_ull_create(space, page)
|
|
|
|
#define BUF_DUMP_SPACE(a) ((ulint) ((a) >> 32))
|
|
|
|
#define BUF_DUMP_PAGE(a) ((ulint) ((a) & 0xFFFFFFFFUL))
|
|
|
|
|
|
|
|
/*****************************************************************//**
|
|
|
|
Wakes up the buffer pool dump/load thread and instructs it to start
|
|
|
|
a dump. This function is called by MySQL code via buffer_pool_dump_now()
|
|
|
|
and it should return immediately because the whole MySQL is frozen during
|
|
|
|
its execution. */
|
|
|
|
void
|
|
|
|
buf_dump_start()
|
|
|
|
/*============*/
|
|
|
|
{
|
2017-02-17 09:32:21 +01:00
|
|
|
buf_dump_should_start = true;
|
2012-08-01 16:27:34 +02:00
|
|
|
os_event_set(srv_buf_dump_event);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*****************************************************************//**
|
|
|
|
Wakes up the buffer pool dump/load thread and instructs it to start
|
|
|
|
a load. This function is called by MySQL code via buffer_pool_load_now()
|
|
|
|
and it should return immediately because the whole MySQL is frozen during
|
|
|
|
its execution. */
|
|
|
|
void
|
|
|
|
buf_load_start()
|
|
|
|
/*============*/
|
|
|
|
{
|
2017-02-17 09:32:21 +01:00
|
|
|
buf_load_should_start = true;
|
2012-08-01 16:27:34 +02:00
|
|
|
os_event_set(srv_buf_dump_event);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*****************************************************************//**
|
|
|
|
Sets the global variable that feeds MySQL's innodb_buffer_pool_dump_status
|
|
|
|
to the specified string. The format and the following parameters are the
|
|
|
|
same as the ones used for printf(3). The value of this variable can be
|
|
|
|
retrieved by:
|
|
|
|
SELECT variable_value FROM information_schema.global_status WHERE
|
|
|
|
variable_name = 'INNODB_BUFFER_POOL_DUMP_STATUS';
|
|
|
|
or by:
|
|
|
|
SHOW STATUS LIKE 'innodb_buffer_pool_dump_status'; */
|
2016-06-21 14:21:03 +02:00
|
|
|
static MY_ATTRIBUTE((nonnull, format(printf, 2, 3)))
|
2012-08-01 16:27:34 +02:00
|
|
|
void
|
|
|
|
buf_dump_status(
|
|
|
|
/*============*/
|
|
|
|
enum status_severity severity,/*!< in: status severity */
|
|
|
|
const char* fmt, /*!< in: format */
|
|
|
|
...) /*!< in: extra parameters according
|
|
|
|
to fmt */
|
|
|
|
{
|
|
|
|
va_list ap;
|
|
|
|
|
|
|
|
va_start(ap, fmt);
|
|
|
|
|
2017-11-13 03:32:56 +01:00
|
|
|
vsnprintf(
|
2012-08-01 16:27:34 +02:00
|
|
|
export_vars.innodb_buffer_pool_dump_status,
|
|
|
|
sizeof(export_vars.innodb_buffer_pool_dump_status),
|
|
|
|
fmt, ap);
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
switch (severity) {
|
|
|
|
case STATUS_INFO:
|
|
|
|
ib::info() << export_vars.innodb_buffer_pool_dump_status;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case STATUS_ERR:
|
|
|
|
ib::error() << export_vars.innodb_buffer_pool_dump_status;
|
|
|
|
break;
|
|
|
|
}
|
2012-08-01 16:27:34 +02:00
|
|
|
|
|
|
|
va_end(ap);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*****************************************************************//**
|
|
|
|
Sets the global variable that feeds MySQL's innodb_buffer_pool_load_status
|
|
|
|
to the specified string. The format and the following parameters are the
|
|
|
|
same as the ones used for printf(3). The value of this variable can be
|
|
|
|
retrieved by:
|
|
|
|
SELECT variable_value FROM information_schema.global_status WHERE
|
|
|
|
variable_name = 'INNODB_BUFFER_POOL_LOAD_STATUS';
|
|
|
|
or by:
|
|
|
|
SHOW STATUS LIKE 'innodb_buffer_pool_load_status'; */
|
2016-06-21 14:21:03 +02:00
|
|
|
static MY_ATTRIBUTE((nonnull, format(printf, 2, 3)))
|
2012-08-01 16:27:34 +02:00
|
|
|
void
|
|
|
|
buf_load_status(
|
|
|
|
/*============*/
|
|
|
|
enum status_severity severity,/*!< in: status severity */
|
|
|
|
const char* fmt, /*!< in: format */
|
|
|
|
...) /*!< in: extra parameters according to fmt */
|
|
|
|
{
|
|
|
|
va_list ap;
|
|
|
|
|
|
|
|
va_start(ap, fmt);
|
|
|
|
|
2017-11-13 03:32:56 +01:00
|
|
|
vsnprintf(
|
2012-08-01 16:27:34 +02:00
|
|
|
export_vars.innodb_buffer_pool_load_status,
|
|
|
|
sizeof(export_vars.innodb_buffer_pool_load_status),
|
|
|
|
fmt, ap);
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
switch (severity) {
|
|
|
|
case STATUS_INFO:
|
|
|
|
ib::info() << export_vars.innodb_buffer_pool_load_status;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case STATUS_ERR:
|
|
|
|
ib::error() << export_vars.innodb_buffer_pool_load_status;
|
|
|
|
break;
|
2012-08-01 16:27:34 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
va_end(ap);
|
|
|
|
}
|
|
|
|
|
2016-09-06 08:43:16 +02:00
|
|
|
/** Returns the directory path where the buffer pool dump file will be created.
|
|
|
|
@return directory path */
|
|
|
|
static
|
|
|
|
const char*
|
|
|
|
get_buf_dump_dir()
|
|
|
|
{
|
|
|
|
const char* dump_dir;
|
|
|
|
|
|
|
|
/* The dump file should be created in the default data directory if
|
|
|
|
innodb_data_home_dir is set as an empty string. */
|
|
|
|
if (strcmp(srv_data_home, "") == 0) {
|
|
|
|
dump_dir = fil_path_to_mysql_datadir;
|
|
|
|
} else {
|
|
|
|
dump_dir = srv_data_home;
|
|
|
|
}
|
|
|
|
|
|
|
|
return(dump_dir);
|
|
|
|
}
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
/** Generate the path to the buffer pool dump/load file.
|
|
|
|
@param[out] path generated path
|
|
|
|
@param[in] path_size size of 'path', used as in snprintf(3). */
|
2016-02-16 12:07:18 +01:00
|
|
|
static
|
2016-08-12 10:17:45 +02:00
|
|
|
void
|
|
|
|
buf_dump_generate_path(
|
|
|
|
char* path,
|
|
|
|
size_t path_size)
|
2016-02-16 12:07:18 +01:00
|
|
|
{
|
2016-08-12 10:17:45 +02:00
|
|
|
char buf[FN_REFLEN];
|
|
|
|
|
2017-11-11 22:07:24 +01:00
|
|
|
snprintf(buf, sizeof(buf), "%s%c%s", get_buf_dump_dir(),
|
|
|
|
OS_PATH_SEPARATOR, srv_buf_dump_filename);
|
2016-08-12 10:17:45 +02:00
|
|
|
|
|
|
|
os_file_type_t type;
|
|
|
|
bool exists = false;
|
|
|
|
bool ret;
|
|
|
|
|
|
|
|
ret = os_file_status(buf, &exists, &type);
|
|
|
|
|
|
|
|
/* For realpath() to succeed the file must exist. */
|
|
|
|
|
|
|
|
if (ret && exists) {
|
|
|
|
/* my_realpath() assumes the destination buffer is big enough
|
|
|
|
to hold FN_REFLEN bytes. */
|
|
|
|
ut_a(path_size >= FN_REFLEN);
|
2016-02-16 12:07:18 +01:00
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
my_realpath(path, buf, 0);
|
2016-02-16 12:07:18 +01:00
|
|
|
} else {
|
2016-08-12 10:17:45 +02:00
|
|
|
/* If it does not exist, then resolve only srv_data_home
|
|
|
|
and append srv_buf_dump_filename to it. */
|
|
|
|
char srv_data_home_full[FN_REFLEN];
|
|
|
|
|
2016-09-06 08:43:16 +02:00
|
|
|
my_realpath(srv_data_home_full, get_buf_dump_dir(), 0);
|
2016-02-16 12:07:18 +01:00
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
if (srv_data_home_full[strlen(srv_data_home_full) - 1]
|
|
|
|
== OS_PATH_SEPARATOR) {
|
|
|
|
|
2017-11-11 22:07:24 +01:00
|
|
|
snprintf(path, path_size, "%s%s",
|
|
|
|
srv_data_home_full,
|
|
|
|
srv_buf_dump_filename);
|
2016-08-12 10:17:45 +02:00
|
|
|
} else {
|
2017-11-11 22:07:24 +01:00
|
|
|
snprintf(path, path_size, "%s%c%s",
|
|
|
|
srv_data_home_full,
|
|
|
|
OS_PATH_SEPARATOR,
|
|
|
|
srv_buf_dump_filename);
|
2016-08-12 10:17:45 +02:00
|
|
|
}
|
|
|
|
}
|
2016-02-16 12:07:18 +01:00
|
|
|
}
|
|
|
|
|
2012-08-01 16:27:34 +02:00
|
|
|
/*****************************************************************//**
|
|
|
|
Perform a buffer pool dump into the file specified by
|
|
|
|
innodb_buffer_pool_filename. If any errors occur then the value of
|
|
|
|
innodb_buffer_pool_dump_status will be set accordingly, see buf_dump_status().
|
|
|
|
The dump filename can be specified by (relative to srv_data_home):
|
|
|
|
SET GLOBAL innodb_buffer_pool_filename='filename'; */
|
|
|
|
static
|
|
|
|
void
|
|
|
|
buf_dump(
|
|
|
|
/*=====*/
|
|
|
|
ibool obey_shutdown) /*!< in: quit if we are in a shutting down
|
|
|
|
state */
|
|
|
|
{
|
|
|
|
#define SHOULD_QUIT() (SHUTTING_DOWN() && obey_shutdown)
|
|
|
|
|
|
|
|
char full_filename[OS_FILE_MAX_PATH];
|
|
|
|
char tmp_filename[OS_FILE_MAX_PATH];
|
|
|
|
char now[32];
|
|
|
|
FILE* f;
|
|
|
|
ulint i;
|
|
|
|
int ret;
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
buf_dump_generate_path(full_filename, sizeof(full_filename));
|
2012-08-01 16:27:34 +02:00
|
|
|
|
2017-11-11 22:07:24 +01:00
|
|
|
snprintf(tmp_filename, sizeof(tmp_filename),
|
|
|
|
"%s.incomplete", full_filename);
|
2012-08-01 16:27:34 +02:00
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
buf_dump_status(STATUS_INFO, "Dumping buffer pool(s) to %s",
|
2012-08-01 16:27:34 +02:00
|
|
|
full_filename);
|
|
|
|
|
|
|
|
f = fopen(tmp_filename, "w");
|
|
|
|
if (f == NULL) {
|
|
|
|
buf_dump_status(STATUS_ERR,
|
|
|
|
"Cannot open '%s' for writing: %s",
|
|
|
|
tmp_filename, strerror(errno));
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
/* else */
|
|
|
|
|
|
|
|
/* walk through each buffer pool */
|
|
|
|
for (i = 0; i < srv_buf_pool_instances && !SHOULD_QUIT(); i++) {
|
|
|
|
buf_pool_t* buf_pool;
|
|
|
|
const buf_page_t* bpage;
|
|
|
|
buf_dump_t* dump;
|
|
|
|
ulint n_pages;
|
|
|
|
ulint j;
|
|
|
|
|
|
|
|
buf_pool = buf_pool_from_array(i);
|
|
|
|
|
|
|
|
/* obtain buf_pool mutex before allocate, since
|
|
|
|
UT_LIST_GET_LEN(buf_pool->LRU) could change */
|
|
|
|
buf_pool_mutex_enter(buf_pool);
|
|
|
|
|
|
|
|
n_pages = UT_LIST_GET_LEN(buf_pool->LRU);
|
|
|
|
|
|
|
|
/* skip empty buffer pools */
|
|
|
|
if (n_pages == 0) {
|
|
|
|
buf_pool_mutex_exit(buf_pool);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2015-11-29 08:08:42 +01:00
|
|
|
if (srv_buf_pool_dump_pct != 100) {
|
2016-10-06 07:47:49 +02:00
|
|
|
ulint t_pages;
|
|
|
|
|
2015-11-29 08:08:42 +01:00
|
|
|
ut_ad(srv_buf_pool_dump_pct < 100);
|
|
|
|
|
2016-10-06 07:47:49 +02:00
|
|
|
/* limit the number of total pages dumped to X% of the
|
|
|
|
* total number of pages */
|
|
|
|
t_pages = buf_pool->curr_size
|
|
|
|
* srv_buf_pool_dump_pct / 100;
|
|
|
|
if (n_pages > t_pages) {
|
2016-12-05 07:21:31 +01:00
|
|
|
buf_dump_status(STATUS_INFO,
|
2017-02-24 21:08:09 +01:00
|
|
|
"Instance " ULINTPF
|
|
|
|
", restricted to " ULINTPF
|
|
|
|
" pages due to "
|
|
|
|
"innodb_buf_pool_dump_pct=%lu",
|
|
|
|
i, t_pages,
|
|
|
|
srv_buf_pool_dump_pct);
|
2016-10-06 07:47:49 +02:00
|
|
|
n_pages = t_pages;
|
|
|
|
}
|
2015-11-29 08:08:42 +01:00
|
|
|
|
|
|
|
if (n_pages == 0) {
|
|
|
|
n_pages = 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
dump = static_cast<buf_dump_t*>(ut_malloc_nokey(
|
|
|
|
n_pages * sizeof(*dump)));
|
2012-08-01 16:27:34 +02:00
|
|
|
|
|
|
|
if (dump == NULL) {
|
|
|
|
buf_pool_mutex_exit(buf_pool);
|
|
|
|
fclose(f);
|
|
|
|
buf_dump_status(STATUS_ERR,
|
|
|
|
"Cannot allocate " ULINTPF " bytes: %s",
|
|
|
|
(ulint) (n_pages * sizeof(*dump)),
|
|
|
|
strerror(errno));
|
|
|
|
/* leave tmp_filename to exist */
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2015-11-29 08:08:42 +01:00
|
|
|
for (bpage = UT_LIST_GET_FIRST(buf_pool->LRU), j = 0;
|
|
|
|
bpage != NULL && j < n_pages;
|
|
|
|
bpage = UT_LIST_GET_NEXT(LRU, bpage), j++) {
|
2012-08-01 16:27:34 +02:00
|
|
|
|
|
|
|
ut_a(buf_page_in_file(bpage));
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
dump[j] = BUF_DUMP_CREATE(bpage->id.space(),
|
|
|
|
bpage->id.page_no());
|
2012-08-01 16:27:34 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
ut_a(j == n_pages);
|
|
|
|
|
|
|
|
buf_pool_mutex_exit(buf_pool);
|
|
|
|
|
|
|
|
for (j = 0; j < n_pages && !SHOULD_QUIT(); j++) {
|
|
|
|
ret = fprintf(f, ULINTPF "," ULINTPF "\n",
|
|
|
|
BUF_DUMP_SPACE(dump[j]),
|
|
|
|
BUF_DUMP_PAGE(dump[j]));
|
|
|
|
if (ret < 0) {
|
|
|
|
ut_free(dump);
|
|
|
|
fclose(f);
|
|
|
|
buf_dump_status(STATUS_ERR,
|
|
|
|
"Cannot write to '%s': %s",
|
|
|
|
tmp_filename, strerror(errno));
|
|
|
|
/* leave tmp_filename to exist */
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
ut_free(dump);
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = fclose(f);
|
|
|
|
if (ret != 0) {
|
|
|
|
buf_dump_status(STATUS_ERR,
|
|
|
|
"Cannot close '%s': %s",
|
|
|
|
tmp_filename, strerror(errno));
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
/* else */
|
|
|
|
|
|
|
|
ret = unlink(full_filename);
|
|
|
|
if (ret != 0 && errno != ENOENT) {
|
|
|
|
buf_dump_status(STATUS_ERR,
|
|
|
|
"Cannot delete '%s': %s",
|
|
|
|
full_filename, strerror(errno));
|
|
|
|
/* leave tmp_filename to exist */
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
/* else */
|
|
|
|
|
|
|
|
ret = rename(tmp_filename, full_filename);
|
|
|
|
if (ret != 0) {
|
|
|
|
buf_dump_status(STATUS_ERR,
|
|
|
|
"Cannot rename '%s' to '%s': %s",
|
|
|
|
tmp_filename, full_filename,
|
|
|
|
strerror(errno));
|
|
|
|
/* leave tmp_filename to exist */
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
/* else */
|
|
|
|
|
|
|
|
/* success */
|
|
|
|
|
|
|
|
ut_sprintf_timestamp(now);
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
buf_dump_status(STATUS_INFO,
|
2012-08-01 16:27:34 +02:00
|
|
|
"Buffer pool(s) dump completed at %s", now);
|
|
|
|
}
|
|
|
|
|
2015-11-29 08:08:42 +01:00
|
|
|
/*****************************************************************//**
|
|
|
|
Artificially delay the buffer pool loading if necessary. The idea of
|
|
|
|
this function is to prevent hogging the server with IO and slowing down
|
|
|
|
too much normal client queries. */
|
|
|
|
UNIV_INLINE
|
|
|
|
void
|
|
|
|
buf_load_throttle_if_needed(
|
|
|
|
/*========================*/
|
2016-08-12 10:17:45 +02:00
|
|
|
ulint* last_check_time, /*!< in/out: milliseconds since epoch
|
2015-11-29 08:08:42 +01:00
|
|
|
of the last time we did check if
|
|
|
|
throttling is needed, we do the check
|
|
|
|
every srv_io_capacity IO ops. */
|
|
|
|
ulint* last_activity_count,
|
|
|
|
ulint n_io) /*!< in: number of IO ops done since
|
|
|
|
buffer pool load has started */
|
|
|
|
{
|
|
|
|
if (n_io % srv_io_capacity < srv_io_capacity - 1) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (*last_check_time == 0 || *last_activity_count == 0) {
|
|
|
|
*last_check_time = ut_time_ms();
|
|
|
|
*last_activity_count = srv_get_activity_count();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* srv_io_capacity IO operations have been performed by buffer pool
|
|
|
|
load since the last time we were here. */
|
|
|
|
|
|
|
|
/* If no other activity, then keep going without any delay. */
|
|
|
|
if (srv_get_activity_count() == *last_activity_count) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* There has been other activity, throttle. */
|
|
|
|
|
|
|
|
ulint now = ut_time_ms();
|
|
|
|
ulint elapsed_time = now - *last_check_time;
|
|
|
|
|
|
|
|
/* Notice that elapsed_time is not the time for the last
|
|
|
|
srv_io_capacity IO operations performed by BP load. It is the
|
|
|
|
time elapsed since the last time we detected that there has been
|
|
|
|
other activity. This has a small and acceptable deficiency, e.g.:
|
|
|
|
1. BP load runs and there is no other activity.
|
|
|
|
2. Other activity occurs, we run N IO operations after that and
|
|
|
|
enter here (where 0 <= N < srv_io_capacity).
|
|
|
|
3. last_check_time is very old and we do not sleep at this time, but
|
|
|
|
only update last_check_time and last_activity_count.
|
|
|
|
4. We run srv_io_capacity more IO operations and call this function
|
|
|
|
again.
|
|
|
|
5. There has been more other activity and thus we enter here.
|
|
|
|
6. Now last_check_time is recent and we sleep if necessary to prevent
|
|
|
|
more than srv_io_capacity IO operations per second.
|
|
|
|
The deficiency is that we could have slept at 3., but for this we
|
|
|
|
would have to update last_check_time before the
|
|
|
|
"cur_activity_count == *last_activity_count" check and calling
|
|
|
|
ut_time_ms() that often may turn out to be too expensive. */
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
if (elapsed_time < 1000 /* 1 sec (1000 milli secs) */) {
|
2015-11-29 08:08:42 +01:00
|
|
|
os_thread_sleep((1000 - elapsed_time) * 1000 /* micro secs */);
|
|
|
|
}
|
|
|
|
|
|
|
|
*last_check_time = ut_time_ms();
|
|
|
|
*last_activity_count = srv_get_activity_count();
|
|
|
|
}
|
|
|
|
|
2012-08-01 16:27:34 +02:00
|
|
|
/*****************************************************************//**
|
|
|
|
Perform a buffer pool load from the file specified by
|
|
|
|
innodb_buffer_pool_filename. If any errors occur then the value of
|
|
|
|
innodb_buffer_pool_load_status will be set accordingly, see buf_load_status().
|
|
|
|
The dump filename can be specified by (relative to srv_data_home):
|
|
|
|
SET GLOBAL innodb_buffer_pool_filename='filename'; */
|
|
|
|
static
|
|
|
|
void
|
|
|
|
buf_load()
|
|
|
|
/*======*/
|
|
|
|
{
|
|
|
|
char full_filename[OS_FILE_MAX_PATH];
|
|
|
|
char now[32];
|
|
|
|
FILE* f;
|
|
|
|
buf_dump_t* dump;
|
|
|
|
ulint dump_n;
|
|
|
|
ulint total_buffer_pools_pages;
|
|
|
|
ulint i;
|
|
|
|
ulint space_id;
|
|
|
|
ulint page_no;
|
|
|
|
int fscanf_ret;
|
|
|
|
|
|
|
|
/* Ignore any leftovers from before */
|
|
|
|
buf_load_abort_flag = FALSE;
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
buf_dump_generate_path(full_filename, sizeof(full_filename));
|
2012-08-01 16:27:34 +02:00
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
buf_load_status(STATUS_INFO,
|
2012-08-01 16:27:34 +02:00
|
|
|
"Loading buffer pool(s) from %s", full_filename);
|
|
|
|
|
|
|
|
f = fopen(full_filename, "r");
|
|
|
|
if (f == NULL) {
|
2017-04-04 11:19:42 +02:00
|
|
|
buf_load_status(STATUS_INFO,
|
2012-08-01 16:27:34 +02:00
|
|
|
"Cannot open '%s' for reading: %s",
|
|
|
|
full_filename, strerror(errno));
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
/* else */
|
|
|
|
|
|
|
|
/* First scan the file to estimate how many entries are in it.
|
|
|
|
This file is tiny (approx 500KB per 1GB buffer pool), reading it
|
|
|
|
two times is fine. */
|
|
|
|
dump_n = 0;
|
|
|
|
while (fscanf(f, ULINTPF "," ULINTPF, &space_id, &page_no) == 2
|
|
|
|
&& !SHUTTING_DOWN()) {
|
|
|
|
dump_n++;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!SHUTTING_DOWN() && !feof(f)) {
|
|
|
|
/* fscanf() returned != 2 */
|
|
|
|
const char* what;
|
|
|
|
if (ferror(f)) {
|
|
|
|
what = "reading";
|
|
|
|
} else {
|
|
|
|
what = "parsing";
|
|
|
|
}
|
|
|
|
fclose(f);
|
2016-08-12 10:17:45 +02:00
|
|
|
buf_load_status(STATUS_ERR, "Error %s '%s',"
|
|
|
|
" unable to load buffer pool (stage 1)",
|
2012-08-01 16:27:34 +02:00
|
|
|
what, full_filename);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* If dump is larger than the buffer pool(s), then we ignore the
|
|
|
|
extra trailing. This could happen if a dump is made, then buffer
|
2016-08-12 10:17:45 +02:00
|
|
|
pool is shrunk and then load is attempted. */
|
2012-08-01 16:27:34 +02:00
|
|
|
total_buffer_pools_pages = buf_pool_get_n_pages()
|
|
|
|
* srv_buf_pool_instances;
|
|
|
|
if (dump_n > total_buffer_pools_pages) {
|
|
|
|
dump_n = total_buffer_pools_pages;
|
|
|
|
}
|
|
|
|
|
2016-09-06 08:43:16 +02:00
|
|
|
if(dump_n != 0) {
|
|
|
|
dump = static_cast<buf_dump_t*>(ut_malloc_nokey(
|
|
|
|
dump_n * sizeof(*dump)));
|
|
|
|
} else {
|
|
|
|
fclose(f);
|
|
|
|
ut_sprintf_timestamp(now);
|
|
|
|
buf_load_status(STATUS_INFO,
|
|
|
|
"Buffer pool(s) load completed at %s"
|
|
|
|
" (%s was empty)", now, full_filename);
|
|
|
|
return;
|
|
|
|
}
|
2012-08-01 16:27:34 +02:00
|
|
|
|
|
|
|
if (dump == NULL) {
|
|
|
|
fclose(f);
|
|
|
|
buf_load_status(STATUS_ERR,
|
2017-06-06 10:50:42 +02:00
|
|
|
"Cannot allocate " ULINTPF " bytes: %s",
|
|
|
|
dump_n * sizeof(*dump),
|
2012-08-01 16:27:34 +02:00
|
|
|
strerror(errno));
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
rewind(f);
|
|
|
|
|
|
|
|
for (i = 0; i < dump_n && !SHUTTING_DOWN(); i++) {
|
|
|
|
fscanf_ret = fscanf(f, ULINTPF "," ULINTPF,
|
|
|
|
&space_id, &page_no);
|
|
|
|
|
|
|
|
if (fscanf_ret != 2) {
|
|
|
|
if (feof(f)) {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
/* else */
|
|
|
|
|
|
|
|
ut_free(dump);
|
|
|
|
fclose(f);
|
|
|
|
buf_load_status(STATUS_ERR,
|
2016-08-12 10:17:45 +02:00
|
|
|
"Error parsing '%s', unable"
|
|
|
|
" to load buffer pool (stage 2)",
|
2012-08-01 16:27:34 +02:00
|
|
|
full_filename);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (space_id > ULINT32_MASK || page_no > ULINT32_MASK) {
|
|
|
|
ut_free(dump);
|
|
|
|
fclose(f);
|
|
|
|
buf_load_status(STATUS_ERR,
|
2016-08-12 10:17:45 +02:00
|
|
|
"Error parsing '%s': bogus"
|
|
|
|
" space,page " ULINTPF "," ULINTPF
|
|
|
|
" at line " ULINTPF ","
|
|
|
|
" unable to load buffer pool",
|
2012-08-01 16:27:34 +02:00
|
|
|
full_filename,
|
|
|
|
space_id, page_no,
|
|
|
|
i);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
dump[i] = BUF_DUMP_CREATE(space_id, page_no);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Set dump_n to the actual number of initialized elements,
|
|
|
|
i could be smaller than dump_n here if the file got truncated after
|
|
|
|
we read it the first time. */
|
|
|
|
dump_n = i;
|
|
|
|
|
|
|
|
fclose(f);
|
|
|
|
|
|
|
|
if (dump_n == 0) {
|
|
|
|
ut_free(dump);
|
|
|
|
ut_sprintf_timestamp(now);
|
2016-08-12 10:17:45 +02:00
|
|
|
buf_load_status(STATUS_INFO,
|
|
|
|
"Buffer pool(s) load completed at %s"
|
|
|
|
" (%s was empty)", now, full_filename);
|
2012-08-01 16:27:34 +02:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!SHUTTING_DOWN()) {
|
2016-08-12 10:17:45 +02:00
|
|
|
std::sort(dump, dump + dump_n);
|
2012-08-01 16:27:34 +02:00
|
|
|
}
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
ulint last_check_time = 0;
|
|
|
|
ulint last_activity_cnt = 0;
|
|
|
|
|
|
|
|
/* Avoid calling the expensive fil_space_acquire_silent() for each
|
|
|
|
page within the same tablespace. dump[] is sorted by (space, page),
|
|
|
|
so all pages from a given tablespace are consecutive. */
|
|
|
|
ulint cur_space_id = BUF_DUMP_SPACE(dump[0]);
|
|
|
|
fil_space_t* space = fil_space_acquire_silent(cur_space_id);
|
|
|
|
page_size_t page_size(space ? space->flags : 0);
|
|
|
|
|
|
|
|
/* JAN: TODO: MySQL 5.7 PSI
|
|
|
|
#ifdef HAVE_PSI_STAGE_INTERFACE
|
|
|
|
PSI_stage_progress* pfs_stage_progress
|
|
|
|
= mysql_set_stage(srv_stage_buffer_pool_load.m_key);
|
|
|
|
#endif*/ /* HAVE_PSI_STAGE_INTERFACE */
|
|
|
|
/*
|
|
|
|
mysql_stage_set_work_estimated(pfs_stage_progress, dump_n);
|
|
|
|
mysql_stage_set_work_completed(pfs_stage_progress, 0);
|
|
|
|
*/
|
2015-11-29 08:08:42 +01:00
|
|
|
|
2012-08-01 16:27:34 +02:00
|
|
|
for (i = 0; i < dump_n && !SHUTTING_DOWN(); i++) {
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
/* space_id for this iteration of the loop */
|
|
|
|
const ulint this_space_id = BUF_DUMP_SPACE(dump[i]);
|
|
|
|
|
|
|
|
if (this_space_id != cur_space_id) {
|
|
|
|
if (space != NULL) {
|
|
|
|
fil_space_release(space);
|
|
|
|
}
|
|
|
|
|
|
|
|
cur_space_id = this_space_id;
|
|
|
|
space = fil_space_acquire_silent(cur_space_id);
|
|
|
|
|
|
|
|
if (space != NULL) {
|
|
|
|
const page_size_t cur_page_size(
|
|
|
|
space->flags);
|
|
|
|
page_size.copy_from(cur_page_size);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* JAN: TODO: As we use background page read below,
|
|
|
|
if tablespace is encrypted we cant use it. */
|
|
|
|
if (space == NULL ||
|
|
|
|
(space && space->crypt_data &&
|
2017-03-30 12:48:42 +02:00
|
|
|
space->crypt_data->encryption != FIL_ENCRYPTION_OFF &&
|
2016-08-12 10:17:45 +02:00
|
|
|
space->crypt_data->type != CRYPT_SCHEME_UNENCRYPTED)) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
buf_read_page_background(
|
|
|
|
page_id_t(this_space_id, BUF_DUMP_PAGE(dump[i])),
|
|
|
|
page_size, true);
|
2012-08-01 16:27:34 +02:00
|
|
|
|
|
|
|
if (i % 64 == 63) {
|
|
|
|
os_aio_simulated_wake_handler_threads();
|
|
|
|
}
|
|
|
|
|
|
|
|
if (buf_load_abort_flag) {
|
2016-08-12 10:17:45 +02:00
|
|
|
if (space != NULL) {
|
|
|
|
fil_space_release(space);
|
|
|
|
}
|
2012-08-01 16:27:34 +02:00
|
|
|
buf_load_abort_flag = FALSE;
|
|
|
|
ut_free(dump);
|
|
|
|
buf_load_status(
|
2016-08-12 10:17:45 +02:00
|
|
|
STATUS_INFO,
|
2012-08-01 16:27:34 +02:00
|
|
|
"Buffer pool(s) load aborted on request");
|
2016-08-12 10:17:45 +02:00
|
|
|
/* Premature end, set estimated = completed = i and
|
|
|
|
end the current stage event. */
|
|
|
|
/*
|
|
|
|
mysql_stage_set_work_estimated(pfs_stage_progress, i);
|
|
|
|
mysql_stage_set_work_completed(pfs_stage_progress,
|
|
|
|
i);
|
|
|
|
*/
|
|
|
|
#ifdef HAVE_PSI_STAGE_INTERFACE
|
|
|
|
/* mysql_end_stage(); */
|
|
|
|
#endif /* HAVE_PSI_STAGE_INTERFACE */
|
2012-08-01 16:27:34 +02:00
|
|
|
return;
|
|
|
|
}
|
2015-11-29 08:08:42 +01:00
|
|
|
|
|
|
|
buf_load_throttle_if_needed(
|
|
|
|
&last_check_time, &last_activity_cnt, i);
|
2012-08-01 16:27:34 +02:00
|
|
|
}
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
if (space != NULL) {
|
|
|
|
fil_space_release(space);
|
|
|
|
}
|
|
|
|
|
2012-08-01 16:27:34 +02:00
|
|
|
ut_free(dump);
|
|
|
|
|
|
|
|
ut_sprintf_timestamp(now);
|
|
|
|
|
2016-08-12 10:17:45 +02:00
|
|
|
buf_load_status(STATUS_INFO,
|
2012-08-01 16:27:34 +02:00
|
|
|
"Buffer pool(s) load completed at %s", now);
|
2016-08-12 10:17:45 +02:00
|
|
|
|
|
|
|
/* Make sure that estimated = completed when we end. */
|
|
|
|
/* mysql_stage_set_work_completed(pfs_stage_progress, dump_n); */
|
|
|
|
/* End the stage progress event. */
|
|
|
|
#ifdef HAVE_PSI_STAGE_INTERFACE
|
|
|
|
/* mysql_end_stage(); */
|
|
|
|
#endif /* HAVE_PSI_STAGE_INTERFACE */
|
2012-08-01 16:27:34 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
/*****************************************************************//**
|
|
|
|
Aborts a currently running buffer pool load. This function is called by
|
|
|
|
MySQL code via buffer_pool_load_abort() and it should return immediately
|
|
|
|
because the whole MySQL is frozen during its execution. */
|
|
|
|
void
|
|
|
|
buf_load_abort()
|
|
|
|
/*============*/
|
|
|
|
{
|
|
|
|
buf_load_abort_flag = TRUE;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*****************************************************************//**
|
|
|
|
This is the main thread for buffer pool dump/load. It waits for an
|
|
|
|
event and when waked up either performs a dump or load and sleeps
|
|
|
|
again.
|
|
|
|
@return this function does not return, it calls os_thread_exit() */
|
2016-08-12 10:17:45 +02:00
|
|
|
extern "C"
|
2012-08-01 16:27:34 +02:00
|
|
|
os_thread_ret_t
|
MDEV-11638 Encryption causes race conditions in InnoDB shutdown
InnoDB shutdown failed to properly take fil_crypt_thread() into account.
The encryption threads were signalled to shut down together with other
non-critical tasks. This could be much too early in case of slow shutdown,
which could need minutes to complete the purge. Furthermore, InnoDB
failed to wait for the fil_crypt_thread() to actually exit before
proceeding to the final steps of shutdown, causing the race conditions.
Furthermore, the log_scrub_thread() was shut down way too early.
Also it should remain until the SRV_SHUTDOWN_FLUSH_PHASE.
fil_crypt_threads_end(): Remove. This would cause the threads to
be terminated way too early.
srv_buf_dump_thread_active, srv_dict_stats_thread_active,
lock_sys->timeout_thread_active, log_scrub_thread_active,
srv_monitor_active, srv_error_monitor_active: Remove a race condition
between startup and shutdown, by setting these in the startup thread
that creates threads, not in each created thread. In this way, once the
flag is cleared, it will remain cleared during shutdown.
srv_n_fil_crypt_threads_started, fil_crypt_threads_event: Declare in
global rather than static scope.
log_scrub_event, srv_log_scrub_thread_active, log_scrub_thread():
Declare in static rather than global scope. Let these be created by
log_init() and freed by log_shutdown().
rotate_thread_t::should_shutdown(): Do not shut down before the
SRV_SHUTDOWN_FLUSH_PHASE.
srv_any_background_threads_are_active(): Remove. These checks now
exist in logs_empty_and_mark_files_at_shutdown().
logs_empty_and_mark_files_at_shutdown(): Shut down the threads in
the proper order. Keep fil_crypt_thread() and log_scrub_thread() alive
until SRV_SHUTDOWN_FLUSH_PHASE, and check that they actually terminate.
2017-01-04 17:43:32 +01:00
|
|
|
DECLARE_THREAD(buf_dump_thread)(void*)
|
2012-08-01 16:27:34 +02:00
|
|
|
{
|
2017-01-06 15:18:54 +01:00
|
|
|
my_thread_init();
|
2013-03-25 23:03:13 +01:00
|
|
|
ut_ad(!srv_read_only_mode);
|
2016-08-12 10:17:45 +02:00
|
|
|
/* JAN: TODO: MySQL 5.7 PSI
|
|
|
|
#ifdef UNIV_PFS_THREAD
|
|
|
|
pfs_register_thread(buf_dump_thread_key);
|
|
|
|
#endif */ /* UNIV_PFS_THREAD */
|
2013-03-25 23:03:13 +01:00
|
|
|
|
2012-08-01 16:27:34 +02:00
|
|
|
if (srv_buffer_pool_load_at_startup) {
|
2017-08-31 07:27:59 +02:00
|
|
|
|
2017-03-02 17:53:16 +01:00
|
|
|
#ifdef WITH_WSREP
|
|
|
|
if (!wsrep_recovery) {
|
|
|
|
#endif /* WITH_WSREP */
|
2017-08-31 07:27:59 +02:00
|
|
|
buf_load();
|
2017-03-02 17:53:16 +01:00
|
|
|
#ifdef WITH_WSREP
|
2017-08-31 07:27:59 +02:00
|
|
|
}
|
2017-03-02 17:53:16 +01:00
|
|
|
#endif /* WITH_WSREP */
|
2012-08-01 16:27:34 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
while (!SHUTTING_DOWN()) {
|
|
|
|
|
|
|
|
os_event_wait(srv_buf_dump_event);
|
|
|
|
|
|
|
|
if (buf_dump_should_start) {
|
2017-02-17 09:32:21 +01:00
|
|
|
buf_dump_should_start = false;
|
2012-08-01 16:27:34 +02:00
|
|
|
buf_dump(TRUE /* quit on shutdown */);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (buf_load_should_start) {
|
2017-02-17 09:32:21 +01:00
|
|
|
buf_load_should_start = false;
|
2012-08-01 16:27:34 +02:00
|
|
|
buf_load();
|
|
|
|
}
|
|
|
|
|
2017-02-17 09:32:21 +01:00
|
|
|
if (buf_dump_should_start || buf_load_should_start) {
|
|
|
|
continue;
|
|
|
|
}
|
2012-08-01 16:27:34 +02:00
|
|
|
os_event_reset(srv_buf_dump_event);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (srv_buffer_pool_dump_at_shutdown && srv_fast_shutdown != 2) {
|
2017-03-02 17:53:16 +01:00
|
|
|
#ifdef WITH_WSREP
|
|
|
|
if (!wsrep_recovery) {
|
|
|
|
#endif /* WITH_WSREP */
|
2017-08-31 07:27:59 +02:00
|
|
|
|
2012-08-01 16:27:34 +02:00
|
|
|
buf_dump(FALSE /* ignore shutdown down flag,
|
|
|
|
keep going even if we are in a shutdown state */);
|
2017-03-02 17:53:16 +01:00
|
|
|
#ifdef WITH_WSREP
|
|
|
|
}
|
|
|
|
#endif /* WITH_WSREP */
|
2012-08-01 16:27:34 +02:00
|
|
|
}
|
|
|
|
|
MDEV-11638 Encryption causes race conditions in InnoDB shutdown
InnoDB shutdown failed to properly take fil_crypt_thread() into account.
The encryption threads were signalled to shut down together with other
non-critical tasks. This could be much too early in case of slow shutdown,
which could need minutes to complete the purge. Furthermore, InnoDB
failed to wait for the fil_crypt_thread() to actually exit before
proceeding to the final steps of shutdown, causing the race conditions.
Furthermore, the log_scrub_thread() was shut down way too early.
Also it should remain until the SRV_SHUTDOWN_FLUSH_PHASE.
fil_crypt_threads_end(): Remove. This would cause the threads to
be terminated way too early.
srv_buf_dump_thread_active, srv_dict_stats_thread_active,
lock_sys->timeout_thread_active, log_scrub_thread_active,
srv_monitor_active, srv_error_monitor_active: Remove a race condition
between startup and shutdown, by setting these in the startup thread
that creates threads, not in each created thread. In this way, once the
flag is cleared, it will remain cleared during shutdown.
srv_n_fil_crypt_threads_started, fil_crypt_threads_event: Declare in
global rather than static scope.
log_scrub_event, srv_log_scrub_thread_active, log_scrub_thread():
Declare in static rather than global scope. Let these be created by
log_init() and freed by log_shutdown().
rotate_thread_t::should_shutdown(): Do not shut down before the
SRV_SHUTDOWN_FLUSH_PHASE.
srv_any_background_threads_are_active(): Remove. These checks now
exist in logs_empty_and_mark_files_at_shutdown().
logs_empty_and_mark_files_at_shutdown(): Shut down the threads in
the proper order. Keep fil_crypt_thread() and log_scrub_thread() alive
until SRV_SHUTDOWN_FLUSH_PHASE, and check that they actually terminate.
2017-01-04 17:43:32 +01:00
|
|
|
srv_buf_dump_thread_active = false;
|
2012-08-01 16:27:34 +02:00
|
|
|
|
2017-01-06 15:18:54 +01:00
|
|
|
my_thread_end();
|
2012-08-01 16:27:34 +02:00
|
|
|
/* We count the number of threads in os_thread_exit(). A created
|
|
|
|
thread should always use that to exit and not use return() to exit. */
|
2016-09-06 08:43:16 +02:00
|
|
|
os_thread_exit();
|
2012-08-01 16:27:34 +02:00
|
|
|
|
|
|
|
OS_THREAD_DUMMY_RETURN;
|
|
|
|
}
|