mirror of
				https://github.com/MariaDB/server.git
				synced 2025-10-26 16:38:11 +01:00 
			
		
		
		
	 9f40f02a8d
			
		
	
	
	9f40f02a8d
	
	
	
		
			
			Marko reported DBUG_ASSERT from dict_stats_shutdown(). destroy_background_thd() does not like when current_thd is set. In galera, it can be the case, dict_stats_shutdown() can be called from user thread, to stop and later restart stats recalculations.
		
			
				
	
	
		
			426 lines
		
	
	
	
		
			13 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			426 lines
		
	
	
	
		
			13 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*****************************************************************************
 | |
| 
 | |
| Copyright (c) 2012, 2017, Oracle and/or its affiliates. All Rights Reserved.
 | |
| Copyright (c) 2017, 2022, MariaDB Corporation.
 | |
| 
 | |
| This program is free software; you can redistribute it and/or modify it under
 | |
| the terms of the GNU General Public License as published by the Free Software
 | |
| Foundation; version 2 of the License.
 | |
| 
 | |
| This program is distributed in the hope that it will be useful, but WITHOUT
 | |
| ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
 | |
| FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
 | |
| 
 | |
| You should have received a copy of the GNU General Public License along with
 | |
| this program; if not, write to the Free Software Foundation, Inc.,
 | |
| 51 Franklin Street, Fifth Floor, Boston, MA 02110-1335 USA
 | |
| 
 | |
| *****************************************************************************/
 | |
| 
 | |
| /**************************************************//**
 | |
| @file dict/dict0stats_bg.cc
 | |
| Code used for background table and index stats gathering.
 | |
| 
 | |
| Created Apr 25, 2012 Vasil Dimov
 | |
| *******************************************************/
 | |
| 
 | |
| #include "dict0dict.h"
 | |
| #include "dict0stats.h"
 | |
| #include "dict0stats_bg.h"
 | |
| #include "dict0defrag_bg.h"
 | |
| #include "row0mysql.h"
 | |
| #include "srv0start.h"
 | |
| #include "fil0fil.h"
 | |
| #include "mysqld.h"
 | |
| #ifdef WITH_WSREP
 | |
| # include "trx0trx.h"
 | |
| # include "mysql/service_wsrep.h"
 | |
| # include "wsrep.h"
 | |
| # include "log.h"
 | |
| #endif
 | |
| 
 | |
| #include <vector>
 | |
| 
 | |
| /** Minimum time interval between stats recalc for a given table */
 | |
| #define MIN_RECALC_INTERVAL	10 /* seconds */
 | |
| static void dict_stats_schedule(int ms);
 | |
| 
 | |
| /** Protects recalc_pool */
 | |
| static mysql_mutex_t recalc_pool_mutex;
 | |
| 
 | |
| /** for signaling recalc::state */
 | |
| static pthread_cond_t recalc_pool_cond;
 | |
| 
 | |
| /** Work item of the recalc_pool; protected by recalc_pool_mutex */
 | |
| struct recalc
 | |
| {
 | |
|   /** identifies a table with persistent statistics */
 | |
|   table_id_t id;
 | |
|   /** state of the entry */
 | |
|   enum { IDLE, IN_PROGRESS, IN_PROGRESS_DELETING, DELETING} state;
 | |
| };
 | |
| 
 | |
| /** The multitude of tables whose stats are to be automatically recalculated */
 | |
| typedef std::vector<recalc, ut_allocator<recalc>> recalc_pool_t;
 | |
| 
 | |
| /** Pool where we store information on which tables are to be processed
 | |
| by background statistics gathering. */
 | |
| static recalc_pool_t		recalc_pool;
 | |
| /** Whether the global data structures have been initialized */
 | |
| static bool			stats_initialised;
 | |
| 
 | |
| static THD *dict_stats_thd;
 | |
| 
 | |
| /*****************************************************************//**
 | |
| Free the resources occupied by the recalc pool, called once during
 | |
| thread de-initialization. */
 | |
| static void dict_stats_recalc_pool_deinit()
 | |
| {
 | |
| 	ut_ad(!srv_read_only_mode);
 | |
| 
 | |
| 	recalc_pool.clear();
 | |
| 	defrag_pool.clear();
 | |
|         /*
 | |
|           recalc_pool may still have its buffer allocated. It will free it when
 | |
|           its destructor is called.
 | |
|           The problem is, memory leak detector is run before the recalc_pool's
 | |
|           destructor is invoked, and will report recalc_pool's buffer as leaked
 | |
|           memory.  To avoid that, we force recalc_pool to surrender its buffer
 | |
|           to empty_pool object, which will free it when leaving this function:
 | |
|         */
 | |
| 	recalc_pool_t recalc_empty_pool;
 | |
| 	defrag_pool_t defrag_empty_pool;
 | |
| 	recalc_pool.swap(recalc_empty_pool);
 | |
| 	defrag_pool.swap(defrag_empty_pool);
 | |
| 
 | |
| 	if (dict_stats_thd)
 | |
| 		destroy_background_thd(dict_stats_thd);
 | |
| }
 | |
| 
 | |
| /*****************************************************************//**
 | |
| Add a table to the recalc pool, which is processed by the
 | |
| background stats gathering thread. Only the table id is added to the
 | |
| list, so the table can be closed after being enqueued and it will be
 | |
| opened when needed. If the table does not exist later (has been DROPped),
 | |
| then it will be removed from the pool and skipped. */
 | |
| static void dict_stats_recalc_pool_add(table_id_t id)
 | |
| {
 | |
|   ut_ad(!srv_read_only_mode);
 | |
|   ut_ad(id);
 | |
|   bool schedule = false;
 | |
|   mysql_mutex_lock(&recalc_pool_mutex);
 | |
| 
 | |
|   const auto begin= recalc_pool.begin(), end= recalc_pool.end();
 | |
|   if (end == std::find_if(begin, end, [&](const recalc &r){return r.id == id;}))
 | |
|   {
 | |
|     recalc_pool.emplace_back(recalc{id, recalc::IDLE});
 | |
|     schedule = true;
 | |
|   }
 | |
| 
 | |
|   mysql_mutex_unlock(&recalc_pool_mutex);
 | |
|   if (schedule)
 | |
|     dict_stats_schedule_now();
 | |
| }
 | |
| 
 | |
| #ifdef WITH_WSREP
 | |
| /** Update the table modification counter and if necessary,
 | |
| schedule new estimates for table and index statistics to be calculated.
 | |
| @param[in,out]	table	persistent or temporary table
 | |
| @param[in]	thd	current session */
 | |
| void dict_stats_update_if_needed(dict_table_t *table, const trx_t &trx)
 | |
| #else
 | |
| /** Update the table modification counter and if necessary,
 | |
| schedule new estimates for table and index statistics to be calculated.
 | |
| @param[in,out]	table	persistent or temporary table */
 | |
| void dict_stats_update_if_needed_func(dict_table_t *table)
 | |
| #endif
 | |
| {
 | |
| 	if (UNIV_UNLIKELY(!table->stat_initialized)) {
 | |
| 		/* The table may have been evicted from dict_sys
 | |
| 		and reloaded internally by InnoDB for FOREIGN KEY
 | |
| 		processing, but not reloaded by the SQL layer.
 | |
| 
 | |
| 		We can (re)compute the transient statistics when the
 | |
| 		table is actually loaded by the SQL layer.
 | |
| 
 | |
| 		Note: If InnoDB persistent statistics are enabled,
 | |
| 		we will skip the updates. We must do this, because
 | |
| 		dict_table_get_n_rows() below assumes that the
 | |
| 		statistics have been initialized. The DBA may have
 | |
| 		to execute ANALYZE TABLE. */
 | |
| 		return;
 | |
| 	}
 | |
| 
 | |
| 	ulonglong	counter = table->stat_modified_counter++;
 | |
| 	ulonglong	n_rows = dict_table_get_n_rows(table);
 | |
| 
 | |
| 	if (dict_stats_is_persistent_enabled(table)) {
 | |
| 		if (table->name.is_temporary()) {
 | |
| 			return;
 | |
| 		}
 | |
| 		if (counter > n_rows / 10 /* 10% */
 | |
| 		    && dict_stats_auto_recalc_is_enabled(table)) {
 | |
| 
 | |
| #ifdef WITH_WSREP
 | |
| 			/* Do not add table to background
 | |
| 			statistic calculation if this thread is not a
 | |
| 			applier (as all DDL, which is replicated (i.e
 | |
| 			is binlogged in master node), will be executed
 | |
| 			with high priority (a.k.a BF) in slave nodes)
 | |
| 			and is BF. This could again lead BF lock
 | |
| 			waits in applier node but it is better than
 | |
| 			no persistent index/table statistics at
 | |
| 			applier nodes. TODO: allow BF threads
 | |
| 			wait for these InnoDB internal SQL-parser
 | |
| 			generated row locks and allow BF thread
 | |
| 			lock waits to be enqueued at head of waiting
 | |
| 			queue. */
 | |
| 			if (trx.is_wsrep()
 | |
| 			    && !wsrep_thd_is_applying(trx.mysql_thd)
 | |
| 			    && wsrep_thd_is_BF(trx.mysql_thd, 0)) {
 | |
| 				WSREP_DEBUG("Avoiding background statistics"
 | |
| 					    " calculation for table %s.",
 | |
| 					table->name.m_name);
 | |
| 				return;
 | |
| 			}
 | |
| #endif /* WITH_WSREP */
 | |
| 
 | |
| 			dict_stats_recalc_pool_add(table->id);
 | |
| 			table->stat_modified_counter = 0;
 | |
| 		}
 | |
| 		return;
 | |
| 	}
 | |
| 
 | |
| 	/* Calculate new statistics if 1 / 16 of table has been modified
 | |
| 	since the last time a statistics batch was run.
 | |
| 	We calculate statistics at most every 16th round, since we may have
 | |
| 	a counter table which is very small and updated very often. */
 | |
| 	ulonglong threshold = 16 + n_rows / 16; /* 6.25% */
 | |
| 
 | |
| 	if (srv_stats_modified_counter) {
 | |
| 		threshold = std::min(srv_stats_modified_counter, threshold);
 | |
| 	}
 | |
| 
 | |
| 	if (counter > threshold) {
 | |
| 		/* this will reset table->stat_modified_counter to 0 */
 | |
| 		dict_stats_update(table, DICT_STATS_RECALC_TRANSIENT);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| /** Delete a table from the auto recalc pool, and ensure that
 | |
| no statistics are being updated on it. */
 | |
| void dict_stats_recalc_pool_del(table_id_t id, bool have_mdl_exclusive)
 | |
| {
 | |
|   ut_ad(!srv_read_only_mode);
 | |
|   ut_ad(id);
 | |
| 
 | |
|   mysql_mutex_lock(&recalc_pool_mutex);
 | |
| 
 | |
|   auto end= recalc_pool.end();
 | |
|   auto i= std::find_if(recalc_pool.begin(), end,
 | |
|                        [&](const recalc &r){return r.id == id;});
 | |
|   if (i != end)
 | |
|   {
 | |
|     switch (i->state) {
 | |
|     case recalc::IN_PROGRESS:
 | |
|       if (!have_mdl_exclusive)
 | |
|       {
 | |
|         i->state= recalc::IN_PROGRESS_DELETING;
 | |
|         do
 | |
|         {
 | |
|           my_cond_wait(&recalc_pool_cond, &recalc_pool_mutex.m_mutex);
 | |
|           end= recalc_pool.end();
 | |
|           i= std::find_if(recalc_pool.begin(), end,
 | |
|                           [&](const recalc &r){return r.id == id;});
 | |
|           if (i == end)
 | |
|             goto done;
 | |
|         }
 | |
|         while (i->state == recalc::IN_PROGRESS_DELETING);
 | |
|       }
 | |
|       /* fall through */
 | |
|     case recalc::IDLE:
 | |
|       recalc_pool.erase(i);
 | |
|       break;
 | |
|     case recalc::IN_PROGRESS_DELETING:
 | |
|     case recalc::DELETING:
 | |
|       /* another thread will delete the entry in dict_stats_recalc_pool_del() */
 | |
|       break;
 | |
|     }
 | |
|   }
 | |
| 
 | |
| done:
 | |
|   mysql_mutex_unlock(&recalc_pool_mutex);
 | |
| }
 | |
| 
 | |
| /*****************************************************************//**
 | |
| Initialize global variables needed for the operation of dict_stats_thread()
 | |
| Must be called before dict_stats_thread() is started. */
 | |
| void dict_stats_init()
 | |
| {
 | |
|   ut_ad(!srv_read_only_mode);
 | |
|   mysql_mutex_init(recalc_pool_mutex_key, &recalc_pool_mutex, nullptr);
 | |
|   pthread_cond_init(&recalc_pool_cond, nullptr);
 | |
|   dict_defrag_pool_init();
 | |
|   stats_initialised= true;
 | |
| }
 | |
| 
 | |
| /*****************************************************************//**
 | |
| Free resources allocated by dict_stats_init(), must be called
 | |
| after dict_stats task has exited. */
 | |
| void dict_stats_deinit()
 | |
| {
 | |
| 	if (!stats_initialised) {
 | |
| 		return;
 | |
| 	}
 | |
| 
 | |
| 	ut_ad(!srv_read_only_mode);
 | |
| 	stats_initialised = false;
 | |
| 
 | |
| 	dict_stats_recalc_pool_deinit();
 | |
| 	dict_defrag_pool_deinit();
 | |
| 
 | |
| 	mysql_mutex_destroy(&recalc_pool_mutex);
 | |
| 	pthread_cond_destroy(&recalc_pool_cond);
 | |
| }
 | |
| 
 | |
| /**
 | |
| Get the first table that has been added for auto recalc and eventually
 | |
| update its stats.
 | |
| @return whether the first entry can be processed immediately */
 | |
| static bool dict_stats_process_entry_from_recalc_pool(THD *thd)
 | |
| {
 | |
|   ut_ad(!srv_read_only_mode);
 | |
|   table_id_t table_id;
 | |
|   mysql_mutex_lock(&recalc_pool_mutex);
 | |
| next_table_id_with_mutex:
 | |
|   for (auto &r : recalc_pool)
 | |
|   {
 | |
|     if ((table_id= r.id) && r.state == recalc::IDLE)
 | |
|     {
 | |
|       r.state= recalc::IN_PROGRESS;
 | |
|       mysql_mutex_unlock(&recalc_pool_mutex);
 | |
|       goto process;
 | |
|     }
 | |
|   }
 | |
|   mysql_mutex_unlock(&recalc_pool_mutex);
 | |
|   return false;
 | |
| 
 | |
| process:
 | |
|   MDL_ticket *mdl= nullptr;
 | |
|   dict_table_t *table= dict_table_open_on_id(table_id, false,
 | |
|                                              DICT_TABLE_OP_NORMAL, thd, &mdl);
 | |
|   if (!table)
 | |
|   {
 | |
| invalid_table_id:
 | |
|     mysql_mutex_lock(&recalc_pool_mutex);
 | |
|     auto i= std::find_if(recalc_pool.begin(), recalc_pool.end(),
 | |
|                          [&](const recalc &r){return r.id == table_id;});
 | |
|     if (i == recalc_pool.end());
 | |
|     else if (UNIV_LIKELY(i->state == recalc::IN_PROGRESS))
 | |
|       recalc_pool.erase(i);
 | |
|     else
 | |
|     {
 | |
|       ut_ad(i->state == recalc::IN_PROGRESS_DELETING);
 | |
|       i->state= recalc::DELETING;
 | |
|       pthread_cond_broadcast(&recalc_pool_cond);
 | |
|     }
 | |
|     goto next_table_id_with_mutex;
 | |
|   }
 | |
| 
 | |
|   ut_ad(!table->is_temporary());
 | |
| 
 | |
|   if (!mdl || !table->is_accessible())
 | |
|   {
 | |
|     dict_table_close(table, false, thd, mdl);
 | |
|     goto invalid_table_id;
 | |
|   }
 | |
| 
 | |
|   /* time() could be expensive, the current function
 | |
|   is called once every time a table has been changed more than 10% and
 | |
|   on a system with lots of small tables, this could become hot. If we
 | |
|   find out that this is a problem, then the check below could eventually
 | |
|   be replaced with something else, though a time interval is the natural
 | |
|   approach. */
 | |
|   const bool update_now=
 | |
|     difftime(time(nullptr), table->stats_last_recalc) >= MIN_RECALC_INTERVAL;
 | |
| 
 | |
|   const dberr_t err= update_now
 | |
|     ? dict_stats_update(table, DICT_STATS_RECALC_PERSISTENT)
 | |
|     : DB_SUCCESS_LOCKED_REC;
 | |
| 
 | |
|   dict_table_close(table, false, thd, mdl);
 | |
| 
 | |
|   mysql_mutex_lock(&recalc_pool_mutex);
 | |
|   auto i= std::find_if(recalc_pool.begin(), recalc_pool.end(),
 | |
|                        [&](const recalc &r){return r.id == table_id;});
 | |
|   if (i == recalc_pool.end())
 | |
|     goto done;
 | |
|   else if (i->state == recalc::IN_PROGRESS_DELETING)
 | |
|   {
 | |
|     i->state= recalc::DELETING;
 | |
|     pthread_cond_broadcast(&recalc_pool_cond);
 | |
| done:
 | |
|     mysql_mutex_unlock(&recalc_pool_mutex);
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     ut_ad(i->state == recalc::IN_PROGRESS);
 | |
|     recalc_pool.erase(i);
 | |
|     if (err == DB_SUCCESS_LOCKED_REC)
 | |
|       recalc_pool.emplace_back(recalc{table_id, recalc::IDLE});
 | |
|     mysql_mutex_unlock(&recalc_pool_mutex);
 | |
|   }
 | |
| 
 | |
|   return update_now;
 | |
| }
 | |
| 
 | |
| /** Check if the recalc pool is empty. */
 | |
| static bool is_recalc_pool_empty()
 | |
| {
 | |
|   mysql_mutex_lock(&recalc_pool_mutex);
 | |
|   bool empty= recalc_pool.empty();
 | |
|   mysql_mutex_unlock(&recalc_pool_mutex);
 | |
|   return empty;
 | |
| }
 | |
| 
 | |
| static tpool::timer* dict_stats_timer;
 | |
| static void dict_stats_func(void*)
 | |
| {
 | |
|   if (!dict_stats_thd)
 | |
|     dict_stats_thd= innobase_create_background_thd("InnoDB statistics");
 | |
|   set_current_thd(dict_stats_thd);
 | |
| 
 | |
|   while (dict_stats_process_entry_from_recalc_pool(dict_stats_thd)) {}
 | |
|   dict_defrag_process_entries_from_defrag_pool(dict_stats_thd);
 | |
| 
 | |
|   innobase_reset_background_thd(dict_stats_thd);
 | |
|   set_current_thd(nullptr);
 | |
|   if (!is_recalc_pool_empty())
 | |
|     dict_stats_schedule(MIN_RECALC_INTERVAL * 1000);
 | |
| }
 | |
| 
 | |
| 
 | |
| void dict_stats_start()
 | |
| {
 | |
|   DBUG_ASSERT(!dict_stats_timer);
 | |
|   dict_stats_timer= srv_thread_pool->create_timer(dict_stats_func);
 | |
| }
 | |
| 
 | |
| 
 | |
| static void dict_stats_schedule(int ms)
 | |
| {
 | |
|   if(dict_stats_timer)
 | |
|     dict_stats_timer->set_time(ms,0);
 | |
| }
 | |
| 
 | |
| void dict_stats_schedule_now()
 | |
| {
 | |
|   dict_stats_schedule(0);
 | |
| }
 | |
| 
 | |
| /** Shut down the dict_stats_thread. */
 | |
| void dict_stats_shutdown()
 | |
| {
 | |
|   delete dict_stats_timer;
 | |
|   dict_stats_timer= 0;
 | |
| }
 |