mirror of
https://github.com/MariaDB/server.git
synced 2025-10-24 16:38:14 +02:00
417 lines
13 KiB
C++
417 lines
13 KiB
C++
/*****************************************************************************
|
|
|
|
Copyright (c) 2012, 2017, Oracle and/or its affiliates. All Rights Reserved.
|
|
Copyright (c) 2017, 2022, MariaDB Corporation.
|
|
|
|
This program is free software; you can redistribute it and/or modify it under
|
|
the terms of the GNU General Public License as published by the Free Software
|
|
Foundation; version 2 of the License.
|
|
|
|
This program is distributed in the hope that it will be useful, but WITHOUT
|
|
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License along with
|
|
this program; if not, write to the Free Software Foundation, Inc.,
|
|
51 Franklin Street, Fifth Floor, Boston, MA 02110-1335 USA
|
|
|
|
*****************************************************************************/
|
|
|
|
/**************************************************//**
|
|
@file dict/dict0stats_bg.cc
|
|
Code used for background table and index stats gathering.
|
|
|
|
Created Apr 25, 2012 Vasil Dimov
|
|
*******************************************************/
|
|
|
|
#include "dict0dict.h"
|
|
#include "dict0stats.h"
|
|
#include "dict0stats_bg.h"
|
|
#include "row0mysql.h"
|
|
#include "srv0start.h"
|
|
#include "fil0fil.h"
|
|
#include "mysqld.h"
|
|
#ifdef WITH_WSREP
|
|
# include "trx0trx.h"
|
|
# include "mysql/service_wsrep.h"
|
|
# include "wsrep.h"
|
|
# include "log.h"
|
|
#endif
|
|
|
|
#include <vector>
|
|
|
|
/** Minimum time interval between stats recalc for a given table */
|
|
#define MIN_RECALC_INTERVAL 10 /* seconds */
|
|
static void dict_stats_schedule(int ms);
|
|
|
|
/** Protects recalc_pool */
|
|
static mysql_mutex_t recalc_pool_mutex;
|
|
|
|
/** for signaling recalc::state */
|
|
static pthread_cond_t recalc_pool_cond;
|
|
|
|
/** Work item of the recalc_pool; protected by recalc_pool_mutex */
|
|
struct recalc
|
|
{
|
|
/** identifies a table with persistent statistics */
|
|
table_id_t id;
|
|
/** state of the entry */
|
|
enum { IDLE, IN_PROGRESS, IN_PROGRESS_DELETING, DELETING} state;
|
|
};
|
|
|
|
/** The multitude of tables whose stats are to be automatically recalculated */
|
|
typedef std::vector<recalc, ut_allocator<recalc>> recalc_pool_t;
|
|
|
|
/** Pool where we store information on which tables are to be processed
|
|
by background statistics gathering. */
|
|
static recalc_pool_t recalc_pool;
|
|
/** Whether the global data structures have been initialized */
|
|
static bool stats_initialised;
|
|
|
|
static THD *dict_stats_thd;
|
|
|
|
/*****************************************************************//**
|
|
Free the resources occupied by the recalc pool, called once during
|
|
thread de-initialization. */
|
|
static void dict_stats_recalc_pool_deinit()
|
|
{
|
|
ut_ad(!srv_read_only_mode);
|
|
|
|
recalc_pool.clear();
|
|
/*
|
|
recalc_pool may still have its buffer allocated. It will free it when
|
|
its destructor is called.
|
|
The problem is, memory leak detector is run before the recalc_pool's
|
|
destructor is invoked, and will report recalc_pool's buffer as leaked
|
|
memory. To avoid that, we force recalc_pool to surrender its buffer
|
|
to empty_pool object, which will free it when leaving this function:
|
|
*/
|
|
recalc_pool_t recalc_empty_pool;
|
|
recalc_pool.swap(recalc_empty_pool);
|
|
|
|
if (dict_stats_thd)
|
|
destroy_background_thd(dict_stats_thd);
|
|
}
|
|
|
|
/*****************************************************************//**
|
|
Add a table to the recalc pool, which is processed by the
|
|
background stats gathering thread. Only the table id is added to the
|
|
list, so the table can be closed after being enqueued and it will be
|
|
opened when needed. If the table does not exist later (has been DROPped),
|
|
then it will be removed from the pool and skipped. */
|
|
static void dict_stats_recalc_pool_add(table_id_t id)
|
|
{
|
|
ut_ad(!srv_read_only_mode);
|
|
ut_ad(id);
|
|
bool schedule = false;
|
|
mysql_mutex_lock(&recalc_pool_mutex);
|
|
|
|
const auto begin= recalc_pool.begin(), end= recalc_pool.end();
|
|
if (end == std::find_if(begin, end, [&](const recalc &r){return r.id == id;}))
|
|
{
|
|
recalc_pool.emplace_back(recalc{id, recalc::IDLE});
|
|
schedule = true;
|
|
}
|
|
|
|
mysql_mutex_unlock(&recalc_pool_mutex);
|
|
if (schedule)
|
|
dict_stats_schedule_now();
|
|
}
|
|
|
|
#ifdef WITH_WSREP
|
|
/** Update the table modification counter and if necessary,
|
|
schedule new estimates for table and index statistics to be calculated.
|
|
@param[in,out] table persistent or temporary table
|
|
@param[in] thd current session */
|
|
void dict_stats_update_if_needed(dict_table_t *table, const trx_t &trx)
|
|
#else
|
|
/** Update the table modification counter and if necessary,
|
|
schedule new estimates for table and index statistics to be calculated.
|
|
@param[in,out] table persistent or temporary table */
|
|
void dict_stats_update_if_needed_func(dict_table_t *table)
|
|
#endif
|
|
{
|
|
uint32_t stat{table->stat};
|
|
|
|
if (UNIV_UNLIKELY(!table->stat_initialized(stat))) {
|
|
/* The table may have been evicted from dict_sys
|
|
and reloaded internally by InnoDB for FOREIGN KEY
|
|
processing, but not reloaded by the SQL layer.
|
|
|
|
We can (re)compute the transient statistics when the
|
|
table is actually loaded by the SQL layer.
|
|
|
|
Note: If InnoDB persistent statistics are enabled,
|
|
we will skip the updates. We must do this, because
|
|
dict_table_get_n_rows() below assumes that the
|
|
statistics have been initialized. The DBA may have
|
|
to execute ANALYZE TABLE. */
|
|
return;
|
|
}
|
|
|
|
ulonglong counter = table->stat_modified_counter++;
|
|
ulonglong n_rows = dict_table_get_n_rows(table);
|
|
|
|
if (table->stats_is_persistent(stat)) {
|
|
if (table->stats_is_auto_recalc(stat)
|
|
&& counter > n_rows / 10 && !table->name.is_temporary()) {
|
|
#ifdef WITH_WSREP
|
|
/* Do not add table to background
|
|
statistic calculation if this thread is not a
|
|
applier (as all DDL, which is replicated (i.e
|
|
is binlogged in master node), will be executed
|
|
with high priority (a.k.a BF) in slave nodes)
|
|
and is BF. This could again lead BF lock
|
|
waits in applier node but it is better than
|
|
no persistent index/table statistics at
|
|
applier nodes. TODO: allow BF threads
|
|
wait for these InnoDB internal SQL-parser
|
|
generated row locks and allow BF thread
|
|
lock waits to be enqueued at head of waiting
|
|
queue. */
|
|
if (trx.is_wsrep()
|
|
&& !wsrep_thd_is_applying(trx.mysql_thd)
|
|
&& wsrep_thd_is_BF(trx.mysql_thd, 0)) {
|
|
WSREP_DEBUG("Avoiding background statistics"
|
|
" calculation for table %s.",
|
|
table->name.m_name);
|
|
return;
|
|
}
|
|
#endif /* WITH_WSREP */
|
|
|
|
dict_stats_recalc_pool_add(table->id);
|
|
table->stat_modified_counter = 0;
|
|
}
|
|
return;
|
|
}
|
|
|
|
/* Calculate new statistics if 1 / 16 of table has been modified
|
|
since the last time a statistics batch was run.
|
|
We calculate statistics at most every 16th round, since we may have
|
|
a counter table which is very small and updated very often. */
|
|
ulonglong threshold = 16 + n_rows / 16; /* 6.25% */
|
|
|
|
if (srv_stats_modified_counter) {
|
|
threshold = std::min(srv_stats_modified_counter, threshold);
|
|
}
|
|
|
|
if (counter > threshold) {
|
|
/* this will reset table->stat_modified_counter to 0 */
|
|
dict_stats_update_transient(table);
|
|
}
|
|
}
|
|
|
|
/** Delete a table from the auto recalc pool, and ensure that
|
|
no statistics are being updated on it. */
|
|
void dict_stats_recalc_pool_del(table_id_t id, bool have_mdl_exclusive)
|
|
{
|
|
ut_ad(!srv_read_only_mode);
|
|
ut_ad(id);
|
|
|
|
mysql_mutex_lock(&recalc_pool_mutex);
|
|
|
|
auto end= recalc_pool.end();
|
|
auto i= std::find_if(recalc_pool.begin(), end,
|
|
[&](const recalc &r){return r.id == id;});
|
|
if (i != end)
|
|
{
|
|
switch (i->state) {
|
|
case recalc::IN_PROGRESS:
|
|
if (!have_mdl_exclusive)
|
|
{
|
|
i->state= recalc::IN_PROGRESS_DELETING;
|
|
do
|
|
{
|
|
my_cond_wait(&recalc_pool_cond, &recalc_pool_mutex.m_mutex);
|
|
end= recalc_pool.end();
|
|
i= std::find_if(recalc_pool.begin(), end,
|
|
[&](const recalc &r){return r.id == id;});
|
|
if (i == end)
|
|
goto done;
|
|
}
|
|
while (i->state == recalc::IN_PROGRESS_DELETING);
|
|
}
|
|
/* fall through */
|
|
case recalc::IDLE:
|
|
recalc_pool.erase(i);
|
|
break;
|
|
case recalc::IN_PROGRESS_DELETING:
|
|
case recalc::DELETING:
|
|
/* another thread will delete the entry in dict_stats_recalc_pool_del() */
|
|
break;
|
|
}
|
|
}
|
|
|
|
done:
|
|
mysql_mutex_unlock(&recalc_pool_mutex);
|
|
}
|
|
|
|
/*****************************************************************//**
|
|
Initialize global variables needed for the operation of dict_stats_thread()
|
|
Must be called before dict_stats_thread() is started. */
|
|
void dict_stats_init()
|
|
{
|
|
ut_ad(!srv_read_only_mode);
|
|
mysql_mutex_init(recalc_pool_mutex_key, &recalc_pool_mutex, nullptr);
|
|
pthread_cond_init(&recalc_pool_cond, nullptr);
|
|
stats_initialised= true;
|
|
}
|
|
|
|
/*****************************************************************//**
|
|
Free resources allocated by dict_stats_init(), must be called
|
|
after dict_stats task has exited. */
|
|
void dict_stats_deinit()
|
|
{
|
|
if (!stats_initialised) {
|
|
return;
|
|
}
|
|
|
|
ut_ad(!srv_read_only_mode);
|
|
stats_initialised = false;
|
|
|
|
dict_stats_recalc_pool_deinit();
|
|
|
|
mysql_mutex_destroy(&recalc_pool_mutex);
|
|
pthread_cond_destroy(&recalc_pool_cond);
|
|
}
|
|
|
|
/**
|
|
Get the first table that has been added for auto recalc and eventually
|
|
update its stats.
|
|
@return whether the first entry can be processed immediately */
|
|
static bool dict_stats_process_entry_from_recalc_pool(THD *thd)
|
|
{
|
|
ut_ad(!srv_read_only_mode);
|
|
table_id_t table_id;
|
|
mysql_mutex_lock(&recalc_pool_mutex);
|
|
next_table_id_with_mutex:
|
|
for (auto &r : recalc_pool)
|
|
{
|
|
if ((table_id= r.id) && r.state == recalc::IDLE)
|
|
{
|
|
r.state= recalc::IN_PROGRESS;
|
|
mysql_mutex_unlock(&recalc_pool_mutex);
|
|
goto process;
|
|
}
|
|
}
|
|
mysql_mutex_unlock(&recalc_pool_mutex);
|
|
return false;
|
|
|
|
process:
|
|
MDL_ticket *mdl= nullptr;
|
|
dict_table_t *table= dict_table_open_on_id(table_id, false,
|
|
DICT_TABLE_OP_NORMAL, thd, &mdl);
|
|
if (!table)
|
|
{
|
|
invalid_table_id:
|
|
mysql_mutex_lock(&recalc_pool_mutex);
|
|
auto i= std::find_if(recalc_pool.begin(), recalc_pool.end(),
|
|
[&](const recalc &r){return r.id == table_id;});
|
|
if (i == recalc_pool.end());
|
|
else if (UNIV_LIKELY(i->state == recalc::IN_PROGRESS))
|
|
recalc_pool.erase(i);
|
|
else
|
|
{
|
|
ut_ad(i->state == recalc::IN_PROGRESS_DELETING);
|
|
i->state= recalc::DELETING;
|
|
pthread_cond_broadcast(&recalc_pool_cond);
|
|
}
|
|
goto next_table_id_with_mutex;
|
|
}
|
|
|
|
ut_ad(!table->is_temporary());
|
|
|
|
if (!mdl || !table->is_accessible())
|
|
{
|
|
dict_table_close(table, thd, mdl);
|
|
goto invalid_table_id;
|
|
}
|
|
|
|
/* time() could be expensive, the current function
|
|
is called once every time a table has been changed more than 10% and
|
|
on a system with lots of small tables, this could become hot. If we
|
|
find out that this is a problem, then the check below could eventually
|
|
be replaced with something else, though a time interval is the natural
|
|
approach. */
|
|
const bool update_now=
|
|
difftime(time(nullptr), table->stats_last_recalc) >= MIN_RECALC_INTERVAL;
|
|
|
|
const dberr_t err= update_now
|
|
? dict_stats_update_persistent_try(table)
|
|
: DB_SUCCESS_LOCKED_REC;
|
|
|
|
dict_table_close(table, thd, mdl);
|
|
|
|
mysql_mutex_lock(&recalc_pool_mutex);
|
|
auto i= std::find_if(recalc_pool.begin(), recalc_pool.end(),
|
|
[&](const recalc &r){return r.id == table_id;});
|
|
if (i == recalc_pool.end())
|
|
goto done;
|
|
else if (i->state == recalc::IN_PROGRESS_DELETING)
|
|
{
|
|
i->state= recalc::DELETING;
|
|
pthread_cond_broadcast(&recalc_pool_cond);
|
|
done:
|
|
mysql_mutex_unlock(&recalc_pool_mutex);
|
|
}
|
|
else
|
|
{
|
|
ut_ad(i->state == recalc::IN_PROGRESS);
|
|
recalc_pool.erase(i);
|
|
if (err == DB_SUCCESS_LOCKED_REC)
|
|
recalc_pool.emplace_back(recalc{table_id, recalc::IDLE});
|
|
mysql_mutex_unlock(&recalc_pool_mutex);
|
|
}
|
|
|
|
return update_now;
|
|
}
|
|
|
|
/** Check if the recalc pool is empty. */
|
|
static bool is_recalc_pool_empty()
|
|
{
|
|
mysql_mutex_lock(&recalc_pool_mutex);
|
|
bool empty= recalc_pool.empty();
|
|
mysql_mutex_unlock(&recalc_pool_mutex);
|
|
return empty;
|
|
}
|
|
|
|
static tpool::timer* dict_stats_timer;
|
|
static void dict_stats_func(void*)
|
|
{
|
|
if (!dict_stats_thd)
|
|
dict_stats_thd= innobase_create_background_thd("InnoDB statistics");
|
|
set_current_thd(dict_stats_thd);
|
|
|
|
while (dict_stats_process_entry_from_recalc_pool(dict_stats_thd)) {}
|
|
|
|
innobase_reset_background_thd(dict_stats_thd);
|
|
set_current_thd(nullptr);
|
|
if (!is_recalc_pool_empty())
|
|
dict_stats_schedule(MIN_RECALC_INTERVAL * 1000);
|
|
}
|
|
|
|
|
|
void dict_stats_start()
|
|
{
|
|
DBUG_ASSERT(!dict_stats_timer);
|
|
dict_stats_timer= srv_thread_pool->create_timer(dict_stats_func);
|
|
}
|
|
|
|
|
|
static void dict_stats_schedule(int ms)
|
|
{
|
|
if(dict_stats_timer)
|
|
dict_stats_timer->set_time(ms,0);
|
|
}
|
|
|
|
void dict_stats_schedule_now()
|
|
{
|
|
dict_stats_schedule(0);
|
|
}
|
|
|
|
/** Shut down the dict_stats_thread. */
|
|
void dict_stats_shutdown()
|
|
{
|
|
delete dict_stats_timer;
|
|
dict_stats_timer= 0;
|
|
}
|