mirror of
				https://github.com/MariaDB/server.git
				synced 2025-10-31 19:06:14 +01:00 
			
		
		
		
	
		
			
				
	
	
		
			1806 lines
		
	
	
	
		
			50 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			1806 lines
		
	
	
	
		
			50 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*****************************************************************************
 | |
| 
 | |
| Copyright (c) 1995, 2017, Oracle and/or its affiliates. All Rights Reserved.
 | |
| Copyright (c) 2017, 2023, MariaDB Corporation.
 | |
| 
 | |
| This program is free software; you can redistribute it and/or modify it under
 | |
| the terms of the GNU General Public License as published by the Free Software
 | |
| Foundation; version 2 of the License.
 | |
| 
 | |
| This program is distributed in the hope that it will be useful, but WITHOUT
 | |
| ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
 | |
| FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
 | |
| 
 | |
| You should have received a copy of the GNU General Public License along with
 | |
| this program; if not, write to the Free Software Foundation, Inc.,
 | |
| 51 Franklin Street, Fifth Floor, Boston, MA 02110-1335 USA
 | |
| 
 | |
| *****************************************************************************/
 | |
| 
 | |
| /**************************************************//**
 | |
| @file mtr/mtr0mtr.cc
 | |
| Mini-transaction buffer
 | |
| 
 | |
| Created 11/26/1995 Heikki Tuuri
 | |
| *******************************************************/
 | |
| 
 | |
| #include "mtr0log.h"
 | |
| #include "buf0buf.h"
 | |
| #include "buf0flu.h"
 | |
| #include "page0types.h"
 | |
| #include "log0crypt.h"
 | |
| #ifdef BTR_CUR_HASH_ADAPT
 | |
| # include "btr0sea.h"
 | |
| #endif
 | |
| #include "btr0cur.h"
 | |
| #include "srv0start.h"
 | |
| #include "log.h"
 | |
| #include "mariadb_stats.h"
 | |
| #include "my_cpu.h"
 | |
| 
 | |
| #ifdef HAVE_PMEM
 | |
| void (*mtr_t::commit_logger)(mtr_t *, std::pair<lsn_t,page_flush_ahead>);
 | |
| #endif
 | |
| 
 | |
| std::pair<lsn_t,mtr_t::page_flush_ahead> (*mtr_t::finisher)(mtr_t *, size_t);
 | |
| unsigned mtr_t::spin_wait_delay;
 | |
| 
 | |
| void mtr_t::finisher_update()
 | |
| {
 | |
|   ut_ad(log_sys.latch_have_wr());
 | |
| #ifdef HAVE_PMEM
 | |
|   if (log_sys.is_mmap())
 | |
|   {
 | |
|     commit_logger= mtr_t::commit_log<true>;
 | |
|     finisher= spin_wait_delay
 | |
|       ? mtr_t::finish_writer<true,true> : mtr_t::finish_writer<false,true>;
 | |
|     return;
 | |
|   }
 | |
|   commit_logger= mtr_t::commit_log<false>;
 | |
| #endif
 | |
|   finisher=
 | |
|     (spin_wait_delay
 | |
|      ? mtr_t::finish_writer<true,false> : mtr_t::finish_writer<false,false>);
 | |
| }
 | |
| 
 | |
| void mtr_memo_slot_t::release() const
 | |
| {
 | |
|   ut_ad(object);
 | |
| 
 | |
|   switch (type) {
 | |
|   case MTR_MEMO_S_LOCK:
 | |
|     static_cast<index_lock*>(object)->s_unlock();
 | |
|     break;
 | |
|   case MTR_MEMO_X_LOCK:
 | |
|   case MTR_MEMO_SX_LOCK:
 | |
|     static_cast<index_lock*>(object)->
 | |
|       u_or_x_unlock(type == MTR_MEMO_SX_LOCK);
 | |
|     break;
 | |
|   case MTR_MEMO_SPACE_X_LOCK:
 | |
|     static_cast<fil_space_t*>(object)->set_committed_size();
 | |
|     static_cast<fil_space_t*>(object)->x_unlock();
 | |
|     break;
 | |
|   default:
 | |
|     buf_page_t *bpage= static_cast<buf_page_t*>(object);
 | |
|     ut_d(const auto s=)
 | |
|       bpage->unfix();
 | |
|     ut_ad(s < buf_page_t::READ_FIX || s >= buf_page_t::WRITE_FIX);
 | |
|     switch (type) {
 | |
|     case MTR_MEMO_PAGE_S_FIX:
 | |
|       bpage->lock.s_unlock();
 | |
|       break;
 | |
|     case MTR_MEMO_BUF_FIX:
 | |
|       break;
 | |
|     default:
 | |
|       ut_ad(type == MTR_MEMO_PAGE_SX_FIX ||
 | |
|             type == MTR_MEMO_PAGE_X_FIX ||
 | |
|             type == MTR_MEMO_PAGE_SX_MODIFY ||
 | |
|             type == MTR_MEMO_PAGE_X_MODIFY);
 | |
|       bpage->lock.u_or_x_unlock(type & MTR_MEMO_PAGE_SX_FIX);
 | |
|     }
 | |
|   }
 | |
| }
 | |
| 
 | |
| /** Prepare to insert a modified blcok into flush_list.
 | |
| @param lsn start LSN of the mini-transaction
 | |
| @return insert position for insert_into_flush_list() */
 | |
| inline buf_page_t *buf_pool_t::prepare_insert_into_flush_list(lsn_t lsn)
 | |
|   noexcept
 | |
| {
 | |
|   ut_ad(recv_recovery_is_on() || log_sys.latch_have_any());
 | |
|   ut_ad(lsn >= log_sys.last_checkpoint_lsn);
 | |
|   mysql_mutex_assert_owner(&flush_list_mutex);
 | |
|   static_assert(log_t::FIRST_LSN >= 2, "compatibility");
 | |
| 
 | |
| rescan:
 | |
|   buf_page_t *prev= UT_LIST_GET_FIRST(flush_list);
 | |
|   if (prev)
 | |
|   {
 | |
|     lsn_t om= prev->oldest_modification();
 | |
|     if (om == 1)
 | |
|     {
 | |
|       delete_from_flush_list(prev);
 | |
|       goto rescan;
 | |
|     }
 | |
|     ut_ad(om > 2);
 | |
|     if (om <= lsn)
 | |
|       return nullptr;
 | |
|     while (buf_page_t *next= UT_LIST_GET_NEXT(list, prev))
 | |
|     {
 | |
|       om= next->oldest_modification();
 | |
|       if (om == 1)
 | |
|       {
 | |
|         delete_from_flush_list(next);
 | |
|         continue;
 | |
|       }
 | |
|       ut_ad(om > 2);
 | |
|       if (om <= lsn)
 | |
|         break;
 | |
|       prev= next;
 | |
|     }
 | |
|     flush_hp.adjust(prev);
 | |
|   }
 | |
|   return prev;
 | |
| }
 | |
| 
 | |
| /** Insert a modified block into the flush list.
 | |
| @param prev     insert position (from prepare_insert_into_flush_list())
 | |
| @param block    modified block
 | |
| @param lsn      start LSN of the mini-transaction that modified the block */
 | |
| inline void buf_pool_t::insert_into_flush_list(buf_page_t *prev,
 | |
|                                                buf_block_t *block, lsn_t lsn)
 | |
|   noexcept
 | |
| {
 | |
|   ut_ad(!fsp_is_system_temporary(block->page.id().space()));
 | |
|   mysql_mutex_assert_owner(&flush_list_mutex);
 | |
| 
 | |
|   MEM_CHECK_DEFINED(block->page.zip.data
 | |
|                     ? block->page.zip.data : block->page.frame,
 | |
|                     block->physical_size());
 | |
| 
 | |
|   if (const lsn_t old= block->page.oldest_modification())
 | |
|   {
 | |
|     if (old > 1)
 | |
|       return;
 | |
|     flush_hp.adjust(&block->page);
 | |
|     UT_LIST_REMOVE(flush_list, &block->page);
 | |
|   }
 | |
|   else
 | |
|     flush_list_bytes+= block->physical_size();
 | |
| 
 | |
|   ut_ad(flush_list_bytes <= size_in_bytes);
 | |
| 
 | |
|   if (prev)
 | |
|     UT_LIST_INSERT_AFTER(flush_list, prev, &block->page);
 | |
|   else
 | |
|     UT_LIST_ADD_FIRST(flush_list, &block->page);
 | |
| 
 | |
|   block->page.set_oldest_modification(lsn);
 | |
| }
 | |
| 
 | |
| mtr_t::mtr_t()= default;
 | |
| mtr_t::~mtr_t()= default;
 | |
| 
 | |
| /** Start a mini-transaction. */
 | |
| void mtr_t::start()
 | |
| {
 | |
|   ut_ad(m_memo.empty());
 | |
|   ut_ad(!m_freed_pages);
 | |
|   ut_ad(!m_freed_space);
 | |
|   MEM_UNDEFINED(this, sizeof *this);
 | |
|   MEM_MAKE_DEFINED(&m_memo, sizeof m_memo);
 | |
|   MEM_MAKE_DEFINED(&m_freed_space, sizeof m_freed_space);
 | |
|   MEM_MAKE_DEFINED(&m_freed_pages, sizeof m_freed_pages);
 | |
| 
 | |
|   ut_d(m_start= true);
 | |
|   ut_d(m_commit= false);
 | |
|   ut_d(m_freeing_tree= false);
 | |
| 
 | |
|   m_last= nullptr;
 | |
|   m_last_offset= 0;
 | |
| 
 | |
|   new(&m_log) mtr_buf_t();
 | |
| 
 | |
|   m_made_dirty= false;
 | |
|   m_latch_ex= false;
 | |
|   m_modifications= false;
 | |
|   m_log_mode= MTR_LOG_ALL;
 | |
|   ut_d(m_user_space_id= TRX_SYS_SPACE);
 | |
|   m_user_space= nullptr;
 | |
|   m_commit_lsn= 0;
 | |
|   m_trim_pages= false;
 | |
| }
 | |
| 
 | |
| /** Release the resources */
 | |
| inline void mtr_t::release_resources()
 | |
| {
 | |
|   ut_ad(is_active());
 | |
|   ut_ad(m_memo.empty());
 | |
|   m_log.erase();
 | |
|   ut_d(m_commit= true);
 | |
| }
 | |
| 
 | |
| /** Handle any pages that were freed during the mini-transaction. */
 | |
| void mtr_t::process_freed_pages()
 | |
| {
 | |
|   if (m_freed_pages)
 | |
|   {
 | |
|     ut_ad(!m_freed_pages->empty());
 | |
|     ut_ad(m_freed_space);
 | |
|     ut_ad(m_freed_space->is_owner());
 | |
|     ut_ad(is_named_space(m_freed_space));
 | |
| 
 | |
|     /* Update the last freed lsn */
 | |
|     m_freed_space->freed_range_mutex.lock();
 | |
|     m_freed_space->update_last_freed_lsn(m_commit_lsn);
 | |
|     if (!m_trim_pages)
 | |
|       for (const auto &range : *m_freed_pages)
 | |
|         m_freed_space->add_free_range(range);
 | |
|     else
 | |
|       m_freed_space->clear_freed_ranges();
 | |
|     m_freed_space->freed_range_mutex.unlock();
 | |
| 
 | |
|     delete m_freed_pages;
 | |
|     m_freed_pages= nullptr;
 | |
|     m_freed_space= nullptr;
 | |
|     /* mtr_t::start() will reset m_trim_pages */
 | |
|   }
 | |
|   else
 | |
|     ut_ad(!m_freed_space);
 | |
| }
 | |
| 
 | |
| ATTRIBUTE_COLD __attribute__((noinline))
 | |
| /** Insert a modified block into buf_pool.flush_list on IMPORT TABLESPACE. */
 | |
| static void insert_imported(buf_block_t *block)
 | |
| {
 | |
|   if (block->page.oldest_modification() <= 1)
 | |
|   {
 | |
|     log_sys.latch.rd_lock(SRW_LOCK_CALL);
 | |
|     /* For unlogged mtrs (MTR_LOG_NO_REDO), we use the current system LSN. The
 | |
|     mtr that generated the LSN is either already committed or in mtr_t::commit.
 | |
|     Shared latch and relaxed atomics should be fine here as it is guaranteed
 | |
|     that both the current mtr and the mtr that generated the LSN would have
 | |
|     added the dirty pages to flush list before we access the minimum LSN during
 | |
|     checkpoint. log_checkpoint_low() acquires exclusive log_sys.latch before
 | |
|     commencing. */
 | |
|     const lsn_t lsn= log_sys.get_lsn();
 | |
|     mysql_mutex_lock(&buf_pool.flush_list_mutex);
 | |
|     buf_pool.insert_into_flush_list
 | |
|       (buf_pool.prepare_insert_into_flush_list(lsn), block, lsn);
 | |
|     log_sys.latch.rd_unlock();
 | |
|     mysql_mutex_unlock(&buf_pool.flush_list_mutex);
 | |
|   }
 | |
| }
 | |
| 
 | |
| /** Release modified pages when no log was written. */
 | |
| void mtr_t::release_unlogged()
 | |
| {
 | |
|   ut_ad(m_log_mode == MTR_LOG_NO_REDO);
 | |
|   ut_ad(m_log.size() == 0);
 | |
| 
 | |
|   process_freed_pages();
 | |
| 
 | |
|   for (auto it= m_memo.rbegin(); it != m_memo.rend(); it++)
 | |
|   {
 | |
|     mtr_memo_slot_t &slot= *it;
 | |
|     ut_ad(slot.object);
 | |
|     switch (slot.type) {
 | |
|     case MTR_MEMO_S_LOCK:
 | |
|       static_cast<index_lock*>(slot.object)->s_unlock();
 | |
|       break;
 | |
|     case MTR_MEMO_SPACE_X_LOCK:
 | |
|       static_cast<fil_space_t*>(slot.object)->set_committed_size();
 | |
|       static_cast<fil_space_t*>(slot.object)->x_unlock();
 | |
|       break;
 | |
|     case MTR_MEMO_X_LOCK:
 | |
|     case MTR_MEMO_SX_LOCK:
 | |
|       static_cast<index_lock*>(slot.object)->
 | |
|         u_or_x_unlock(slot.type == MTR_MEMO_SX_LOCK);
 | |
|       break;
 | |
|     default:
 | |
|       buf_block_t *block= static_cast<buf_block_t*>(slot.object);
 | |
|       ut_d(const auto s=) block->page.unfix();
 | |
|       ut_ad(s >= buf_page_t::FREED);
 | |
|       ut_ad(s < buf_page_t::READ_FIX);
 | |
| 
 | |
|       if (slot.type & MTR_MEMO_MODIFY)
 | |
|       {
 | |
|         ut_ad(slot.type == MTR_MEMO_PAGE_X_MODIFY ||
 | |
|               slot.type == MTR_MEMO_PAGE_SX_MODIFY);
 | |
|         ut_ad(block->page.id() < end_page_id);
 | |
|         insert_imported(block);
 | |
|       }
 | |
| 
 | |
|       switch (slot.type) {
 | |
|       case MTR_MEMO_PAGE_S_FIX:
 | |
|         block->page.lock.s_unlock();
 | |
|         break;
 | |
|       case MTR_MEMO_BUF_FIX:
 | |
|         break;
 | |
|       default:
 | |
|         ut_ad(slot.type == MTR_MEMO_PAGE_SX_FIX ||
 | |
|               slot.type == MTR_MEMO_PAGE_X_FIX ||
 | |
|               slot.type == MTR_MEMO_PAGE_SX_MODIFY ||
 | |
|               slot.type == MTR_MEMO_PAGE_X_MODIFY);
 | |
|         block->page.lock.u_or_x_unlock(slot.type & MTR_MEMO_PAGE_SX_FIX);
 | |
|       }
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   m_memo.clear();
 | |
| }
 | |
| 
 | |
| void mtr_t::release()
 | |
| {
 | |
|   for (auto it= m_memo.rbegin(); it != m_memo.rend(); it++)
 | |
|     it->release();
 | |
|   m_memo.clear();
 | |
| }
 | |
| 
 | |
| inline lsn_t log_t::get_write_target() const
 | |
| {
 | |
|   ut_ad(latch_have_any());
 | |
|   if (UNIV_LIKELY(buf_free_ok()))
 | |
|     return 0;
 | |
|   /* The LSN corresponding to the end of buf is
 | |
|   write_lsn - (first_lsn & 4095) + buf_free,
 | |
|   but we use simpler arithmetics to return a smaller write target in
 | |
|   order to minimize waiting in log_write_up_to(). */
 | |
|   ut_ad(max_buf_free >= 4096 * 4);
 | |
|   return write_lsn + max_buf_free / 2;
 | |
| }
 | |
| 
 | |
| template<bool mmap>
 | |
| void mtr_t::commit_log(mtr_t *mtr, std::pair<lsn_t,page_flush_ahead> lsns)
 | |
| {
 | |
|   size_t modified= 0;
 | |
|   const lsn_t write_lsn= mmap ? 0 : log_sys.get_write_target();
 | |
| 
 | |
|   if (mtr->m_made_dirty)
 | |
|   {
 | |
|     auto it= mtr->m_memo.rbegin();
 | |
| 
 | |
|     mysql_mutex_lock(&buf_pool.flush_list_mutex);
 | |
| 
 | |
|     buf_page_t *const prev=
 | |
|       buf_pool.prepare_insert_into_flush_list(lsns.first);
 | |
| 
 | |
|     while (it != mtr->m_memo.rend())
 | |
|     {
 | |
|       const mtr_memo_slot_t &slot= *it++;
 | |
|       if (slot.type & MTR_MEMO_MODIFY)
 | |
|       {
 | |
|         ut_ad(slot.type == MTR_MEMO_PAGE_X_MODIFY ||
 | |
|               slot.type == MTR_MEMO_PAGE_SX_MODIFY);
 | |
|         modified++;
 | |
|         buf_block_t *b= static_cast<buf_block_t*>(slot.object);
 | |
|         ut_ad(b->page.id() < end_page_id);
 | |
|         ut_d(const auto s= b->page.state());
 | |
|         ut_ad(s > buf_page_t::FREED);
 | |
|         ut_ad(s < buf_page_t::READ_FIX);
 | |
|         ut_ad(mach_read_from_8(b->page.frame + FIL_PAGE_LSN) <=
 | |
|               mtr->m_commit_lsn);
 | |
|         mach_write_to_8(b->page.frame + FIL_PAGE_LSN, mtr->m_commit_lsn);
 | |
|         if (UNIV_LIKELY_NULL(b->page.zip.data))
 | |
|           memcpy_aligned<8>(FIL_PAGE_LSN + b->page.zip.data,
 | |
|                             FIL_PAGE_LSN + b->page.frame, 8);
 | |
|         buf_pool.insert_into_flush_list(prev, b, lsns.first);
 | |
|       }
 | |
|     }
 | |
| 
 | |
|     ut_ad(modified);
 | |
|     buf_pool.flush_list_requests+= modified;
 | |
|     buf_pool.page_cleaner_wakeup();
 | |
|     mysql_mutex_unlock(&buf_pool.flush_list_mutex);
 | |
| 
 | |
|     if (mtr->m_latch_ex)
 | |
|     {
 | |
|       log_sys.latch.wr_unlock();
 | |
|       mtr->m_latch_ex= false;
 | |
|     }
 | |
|     else
 | |
|       log_sys.latch.rd_unlock();
 | |
| 
 | |
|     mtr->release();
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     if (mtr->m_latch_ex)
 | |
|     {
 | |
|       log_sys.latch.wr_unlock();
 | |
|       mtr->m_latch_ex= false;
 | |
|     }
 | |
|     else
 | |
|       log_sys.latch.rd_unlock();
 | |
| 
 | |
|     for (auto it= mtr->m_memo.rbegin(); it != mtr->m_memo.rend(); )
 | |
|     {
 | |
|       const mtr_memo_slot_t &slot= *it++;
 | |
|       ut_ad(slot.object);
 | |
|       switch (slot.type) {
 | |
|       case MTR_MEMO_S_LOCK:
 | |
|         static_cast<index_lock*>(slot.object)->s_unlock();
 | |
|         break;
 | |
|       case MTR_MEMO_SPACE_X_LOCK:
 | |
|         static_cast<fil_space_t*>(slot.object)->set_committed_size();
 | |
|         static_cast<fil_space_t*>(slot.object)->x_unlock();
 | |
|         break;
 | |
|       case MTR_MEMO_X_LOCK:
 | |
|       case MTR_MEMO_SX_LOCK:
 | |
|         static_cast<index_lock*>(slot.object)->
 | |
|           u_or_x_unlock(slot.type == MTR_MEMO_SX_LOCK);
 | |
|         break;
 | |
|       default:
 | |
|         buf_page_t *bpage= static_cast<buf_page_t*>(slot.object);
 | |
|         ut_d(const auto s=)
 | |
|           bpage->unfix();
 | |
|         if (slot.type & MTR_MEMO_MODIFY)
 | |
|         {
 | |
|           ut_ad(slot.type == MTR_MEMO_PAGE_X_MODIFY ||
 | |
|                 slot.type == MTR_MEMO_PAGE_SX_MODIFY);
 | |
|           ut_ad(bpage->oldest_modification() > 1);
 | |
|           ut_ad(bpage->oldest_modification() < mtr->m_commit_lsn);
 | |
|           ut_ad(bpage->id() < end_page_id);
 | |
|           ut_ad(s >= buf_page_t::FREED);
 | |
|           ut_ad(s < buf_page_t::READ_FIX);
 | |
|           ut_ad(mach_read_from_8(bpage->frame + FIL_PAGE_LSN) <=
 | |
|                 mtr->m_commit_lsn);
 | |
|           mach_write_to_8(bpage->frame + FIL_PAGE_LSN, mtr->m_commit_lsn);
 | |
|           if (UNIV_LIKELY_NULL(bpage->zip.data))
 | |
|             memcpy_aligned<8>(FIL_PAGE_LSN + bpage->zip.data,
 | |
|                               FIL_PAGE_LSN + bpage->frame, 8);
 | |
|           modified++;
 | |
|         }
 | |
|         switch (auto latch= slot.type & ~MTR_MEMO_MODIFY) {
 | |
|         case MTR_MEMO_PAGE_S_FIX:
 | |
|           bpage->lock.s_unlock();
 | |
|           continue;
 | |
|         case MTR_MEMO_PAGE_SX_FIX:
 | |
|         case MTR_MEMO_PAGE_X_FIX:
 | |
|           bpage->lock.u_or_x_unlock(latch == MTR_MEMO_PAGE_SX_FIX);
 | |
|           continue;
 | |
|         default:
 | |
|           ut_ad(latch == MTR_MEMO_BUF_FIX);
 | |
|         }
 | |
|       }
 | |
|     }
 | |
| 
 | |
|     buf_pool.add_flush_list_requests(modified);
 | |
|     mtr->m_memo.clear();
 | |
|   }
 | |
| 
 | |
|   mariadb_increment_pages_updated(modified);
 | |
| 
 | |
|   if (UNIV_UNLIKELY(lsns.second != PAGE_FLUSH_NO))
 | |
|     buf_flush_ahead(mtr->m_commit_lsn, lsns.second == PAGE_FLUSH_SYNC);
 | |
| 
 | |
|   if (!mmap && UNIV_UNLIKELY(write_lsn != 0))
 | |
|     log_write_up_to(write_lsn, false);
 | |
| }
 | |
| 
 | |
| /** Commit a mini-transaction. */
 | |
| void mtr_t::commit()
 | |
| {
 | |
|   ut_ad(is_active());
 | |
| 
 | |
|   /* This is a dirty read, for debugging. */
 | |
|   ut_ad(!m_modifications || !recv_no_log_write);
 | |
|   ut_ad(!m_modifications || m_log_mode != MTR_LOG_NONE);
 | |
|   ut_ad(!m_latch_ex);
 | |
| 
 | |
|   if (m_modifications && (m_log_mode == MTR_LOG_NO_REDO || !m_log.empty()))
 | |
|   {
 | |
|     if (UNIV_UNLIKELY(!is_logged()))
 | |
|     {
 | |
|       release_unlogged();
 | |
|       goto func_exit;
 | |
|     }
 | |
| 
 | |
|     ut_ad(!srv_read_only_mode);
 | |
|     std::pair<lsn_t,page_flush_ahead> lsns{do_write()};
 | |
|     process_freed_pages();
 | |
| #ifdef HAVE_PMEM
 | |
|     commit_logger(this, lsns);
 | |
| #else
 | |
|     commit_log<false>(this, lsns);
 | |
| #endif
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     if (m_freed_pages)
 | |
|     {
 | |
|       ut_ad(!m_freed_pages->empty());
 | |
|       ut_ad(m_freed_space == fil_system.temp_space);
 | |
|       ut_ad(!m_trim_pages);
 | |
|       for (const auto &range : *m_freed_pages)
 | |
|         m_freed_space->add_free_range(range);
 | |
|       delete m_freed_pages;
 | |
|       m_freed_pages= nullptr;
 | |
|       m_freed_space= nullptr;
 | |
|     }
 | |
|     release();
 | |
|   }
 | |
| 
 | |
| func_exit:
 | |
|   release_resources();
 | |
| }
 | |
| 
 | |
| void mtr_t::rollback_to_savepoint(ulint begin, ulint end)
 | |
| {
 | |
|   ut_ad(end <= m_memo.size());
 | |
|   ut_ad(begin <= end);
 | |
|   ulint s= end;
 | |
| 
 | |
|   while (s-- > begin)
 | |
|   {
 | |
|     const mtr_memo_slot_t &slot= m_memo[s];
 | |
|     ut_ad(slot.object);
 | |
|     /* This is intended for releasing latches on indexes or unmodified
 | |
|     buffer pool pages. */
 | |
|     ut_ad(slot.type <= MTR_MEMO_SX_LOCK);
 | |
|     ut_ad(!(slot.type & MTR_MEMO_MODIFY));
 | |
|     slot.release();
 | |
|   }
 | |
| 
 | |
|   m_memo.erase(m_memo.begin() + begin, m_memo.begin() + end);
 | |
| }
 | |
| 
 | |
| /** Set create_lsn. */
 | |
| inline void fil_space_t::set_create_lsn(lsn_t lsn) noexcept
 | |
| {
 | |
|   /* Concurrent log_checkpoint_low() must be impossible. */
 | |
|   ut_ad(latch.have_wr());
 | |
|   create_lsn= lsn;
 | |
| }
 | |
| 
 | |
| /** Commit a mini-transaction that is shrinking a tablespace.
 | |
| @param space   tablespace that is being shrunk
 | |
| @param size    new size in pages */
 | |
| void mtr_t::commit_shrink(fil_space_t &space, uint32_t size)
 | |
| {
 | |
|   ut_ad(is_active());
 | |
|   ut_ad(!high_level_read_only);
 | |
|   ut_ad(m_modifications);
 | |
|   ut_ad(!m_memo.empty());
 | |
|   ut_ad(!recv_recovery_is_on());
 | |
|   ut_ad(m_log_mode == MTR_LOG_ALL);
 | |
|   ut_ad(!m_freed_pages);
 | |
| 
 | |
|   log_write_and_flush_prepare();
 | |
|   m_latch_ex= true;
 | |
|   log_sys.latch.wr_lock(SRW_LOCK_CALL);
 | |
| 
 | |
|   const lsn_t start_lsn= do_write().first;
 | |
|   ut_d(m_log.erase());
 | |
| 
 | |
|   fil_node_t *file= UT_LIST_GET_LAST(space.chain);
 | |
|   mysql_mutex_lock(&fil_system.mutex);
 | |
|   ut_ad(file->is_open());
 | |
|   ut_ad(space.size >= size);
 | |
|   ut_ad(file->size >= space.size - size);
 | |
|   file->size-= space.size - size;
 | |
|   space.size= space.size_in_header= size;
 | |
| 
 | |
|   if (space.id == TRX_SYS_SPACE)
 | |
|     srv_sys_space.set_last_file_size(file->size);
 | |
|   else
 | |
|     space.set_create_lsn(m_commit_lsn);
 | |
| 
 | |
|   mysql_mutex_unlock(&fil_system.mutex);
 | |
| 
 | |
|   space.clear_freed_ranges();
 | |
| 
 | |
|   /* Durably write the reduced FSP_SIZE before truncating the data file. */
 | |
|   log_write_and_flush();
 | |
|   ut_ad(log_sys.latch_have_wr());
 | |
| 
 | |
|   os_file_truncate(file->name, file->handle,
 | |
|                    os_offset_t{file->size} << srv_page_size_shift, true);
 | |
| 
 | |
|   space.clear_freed_ranges();
 | |
| 
 | |
|   const page_id_t high{space.id, size};
 | |
|   size_t modified= 0;
 | |
|   auto it= m_memo.rbegin();
 | |
|   mysql_mutex_lock(&buf_pool.flush_list_mutex);
 | |
| 
 | |
|   buf_page_t *const prev= buf_pool.prepare_insert_into_flush_list(start_lsn);
 | |
| 
 | |
|   while (it != m_memo.rend())
 | |
|   {
 | |
|     mtr_memo_slot_t &slot= *it++;
 | |
| 
 | |
|     ut_ad(slot.object);
 | |
|     if (slot.type == MTR_MEMO_SPACE_X_LOCK)
 | |
|       ut_ad(high.space() == static_cast<fil_space_t*>(slot.object)->id);
 | |
|     else
 | |
|     {
 | |
|       ut_ad(slot.type == MTR_MEMO_PAGE_X_MODIFY ||
 | |
|             slot.type == MTR_MEMO_PAGE_SX_MODIFY ||
 | |
|             slot.type == MTR_MEMO_PAGE_X_FIX ||
 | |
|             slot.type == MTR_MEMO_PAGE_SX_FIX);
 | |
|       buf_block_t *b= static_cast<buf_block_t*>(slot.object);
 | |
|       const page_id_t id{b->page.id()};
 | |
|       const auto s= b->page.state();
 | |
|       ut_ad(s > buf_page_t::FREED);
 | |
|       ut_ad(s < buf_page_t::READ_FIX);
 | |
|       ut_ad(b->page.frame);
 | |
|       ut_ad(mach_read_from_8(b->page.frame + FIL_PAGE_LSN) <= m_commit_lsn);
 | |
|       ut_ad(!b->page.zip.data); // we no not shrink ROW_FORMAT=COMPRESSED
 | |
| 
 | |
|       if (id < high)
 | |
|       {
 | |
|         ut_ad(id.space() == high.space() ||
 | |
|               (id == page_id_t{0, TRX_SYS_PAGE_NO} &&
 | |
|                srv_is_undo_tablespace(high.space())));
 | |
|         if (slot.type & MTR_MEMO_MODIFY)
 | |
|         {
 | |
|           modified++;
 | |
|           mach_write_to_8(b->page.frame + FIL_PAGE_LSN, m_commit_lsn);
 | |
|           buf_pool.insert_into_flush_list(prev, b, start_lsn);
 | |
|         }
 | |
|       }
 | |
|       else
 | |
|       {
 | |
|         ut_ad(id.space() == high.space());
 | |
|         if (s >= buf_page_t::UNFIXED)
 | |
|           b->page.set_freed(s);
 | |
|         if (b->page.oldest_modification() > 1)
 | |
|           b->page.reset_oldest_modification();
 | |
|         slot.type= mtr_memo_type_t(slot.type & ~MTR_MEMO_MODIFY);
 | |
|       }
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   ut_ad(modified);
 | |
|   buf_pool.flush_list_requests+= modified;
 | |
|   buf_pool.page_cleaner_wakeup();
 | |
|   mysql_mutex_unlock(&buf_pool.flush_list_mutex);
 | |
| 
 | |
|   log_sys.latch.wr_unlock();
 | |
|   m_latch_ex= false;
 | |
| 
 | |
|   release();
 | |
|   release_resources();
 | |
| }
 | |
| 
 | |
| /** Commit a mini-transaction that is deleting or renaming a file.
 | |
| @param space   tablespace that is being renamed or deleted
 | |
| @param name    new file name (nullptr=the file will be deleted)
 | |
| @return whether the operation succeeded */
 | |
| bool mtr_t::commit_file(fil_space_t &space, const char *name)
 | |
| {
 | |
|   ut_ad(is_active());
 | |
|   ut_ad(!high_level_read_only);
 | |
|   ut_ad(m_modifications);
 | |
|   ut_ad(!m_made_dirty);
 | |
|   ut_ad(!recv_recovery_is_on());
 | |
|   ut_ad(m_log_mode == MTR_LOG_ALL);
 | |
|   ut_ad(UT_LIST_GET_LEN(space.chain) == 1);
 | |
|   ut_ad(!m_latch_ex);
 | |
| 
 | |
|   m_latch_ex= true;
 | |
| 
 | |
|   log_write_and_flush_prepare();
 | |
| 
 | |
|   log_sys.latch.wr_lock(SRW_LOCK_CALL);
 | |
| 
 | |
|   size_t size= m_log.size() + 5;
 | |
| 
 | |
|   if (log_sys.is_encrypted())
 | |
|   {
 | |
|     /* We will not encrypt any FILE_ records, but we will reserve
 | |
|     a nonce at the end. */
 | |
|     size+= 8;
 | |
|     m_commit_lsn= log_sys.get_lsn();
 | |
|   }
 | |
|   else
 | |
|     m_commit_lsn= 0;
 | |
| 
 | |
|   m_crc= 0;
 | |
|   m_log.for_each_block([this](const mtr_buf_t::block_t *b)
 | |
|   { m_crc= my_crc32c(m_crc, b->begin(), b->used()); return true; });
 | |
|   finish_write(size);
 | |
| 
 | |
|   if (!name && space.max_lsn)
 | |
|   {
 | |
|     ut_d(space.max_lsn= 0);
 | |
|     fil_system.named_spaces.remove(space);
 | |
|   }
 | |
| 
 | |
|   /* Block log_checkpoint(). */
 | |
|   mysql_mutex_lock(&buf_pool.flush_list_mutex);
 | |
| 
 | |
|   /* Durably write the log for the file system operation. */
 | |
|   log_write_and_flush();
 | |
| 
 | |
|   log_sys.latch.wr_unlock();
 | |
|   m_latch_ex= false;
 | |
| 
 | |
|   char *old_name= space.chain.start->name;
 | |
|   bool success= true;
 | |
| 
 | |
|   if (name)
 | |
|   {
 | |
|     char *new_name= mem_strdup(name);
 | |
|     mysql_mutex_lock(&fil_system.mutex);
 | |
|     success= os_file_rename(innodb_data_file_key, old_name, name);
 | |
|     if (success)
 | |
|       space.chain.start->name= new_name;
 | |
|     else
 | |
|       old_name= new_name;
 | |
|     mysql_mutex_unlock(&fil_system.mutex);
 | |
|     ut_free(old_name);
 | |
|   }
 | |
| 
 | |
|   mysql_mutex_unlock(&buf_pool.flush_list_mutex);
 | |
|   release_resources();
 | |
| 
 | |
|   return success;
 | |
| }
 | |
| 
 | |
| /** Commit a mini-transaction that did not modify any pages,
 | |
| but generated some redo log on a higher level, such as
 | |
| FILE_MODIFY records and an optional FILE_CHECKPOINT marker.
 | |
| The caller must hold exclusive log_sys.latch.
 | |
| This is to be used at log_checkpoint().
 | |
| @param checkpoint_lsn   the log sequence number of a checkpoint, or 0
 | |
| @return current LSN */
 | |
| ATTRIBUTE_COLD lsn_t mtr_t::commit_files(lsn_t checkpoint_lsn)
 | |
| {
 | |
|   ut_ad(log_sys.latch_have_wr());
 | |
|   ut_ad(is_active());
 | |
|   ut_ad(m_log_mode == MTR_LOG_ALL);
 | |
|   ut_ad(!m_made_dirty);
 | |
|   ut_ad(m_memo.empty());
 | |
|   ut_ad(!srv_read_only_mode);
 | |
|   ut_ad(!m_freed_space);
 | |
|   ut_ad(!m_freed_pages);
 | |
|   ut_ad(!m_user_space);
 | |
|   ut_ad(!m_latch_ex);
 | |
| 
 | |
|   m_latch_ex= true;
 | |
| 
 | |
|   if (checkpoint_lsn)
 | |
|   {
 | |
|     byte *ptr= m_log.push<byte*>(3 + 8);
 | |
|     *ptr= FILE_CHECKPOINT | (2 + 8);
 | |
|     ::memset(ptr + 1, 0, 2);
 | |
|     mach_write_to_8(ptr + 3, checkpoint_lsn);
 | |
|   }
 | |
| 
 | |
|   size_t size= m_log.size() + 5;
 | |
| 
 | |
|   if (log_sys.is_encrypted())
 | |
|   {
 | |
|     /* We will not encrypt any FILE_ records, but we will reserve
 | |
|     a nonce at the end. */
 | |
|     size+= 8;
 | |
|     m_commit_lsn= log_sys.get_lsn();
 | |
|   }
 | |
|   else
 | |
|     m_commit_lsn= 0;
 | |
| 
 | |
|   m_crc= 0;
 | |
|   m_log.for_each_block([this](const mtr_buf_t::block_t *b)
 | |
|   { m_crc= my_crc32c(m_crc, b->begin(), b->used()); return true; });
 | |
|   finish_write(size);
 | |
|   release_resources();
 | |
| 
 | |
|   if (checkpoint_lsn)
 | |
|     DBUG_PRINT("ib_log",
 | |
|                ("FILE_CHECKPOINT(" LSN_PF ") written at " LSN_PF,
 | |
|                 checkpoint_lsn, m_commit_lsn));
 | |
| 
 | |
|   return m_commit_lsn;
 | |
| }
 | |
| 
 | |
#ifdef UNIV_DEBUG
/** Check if a tablespace is associated with the mini-transaction
(needed for generating a FILE_MODIFY record)
@param[in]	space	tablespace identifier
@return whether the mini-transaction is associated with the space;
always true when the mini-transaction is not logged or the tablespace
is a predefined one */
bool mtr_t::is_named_space(uint32_t space) const
{
  ut_ad(!m_user_space || m_user_space->id != TRX_SYS_SPACE);

  if (!is_logged())
    return true;
  if (m_user_space_id == space)
    return true;
  return is_predefined_tablespace(space);
}

/** Check if a tablespace is associated with the mini-transaction
(needed for generating a FILE_MODIFY record)
@param[in]	space	tablespace object
@return whether the mini-transaction is associated with the space;
always true when the mini-transaction is not logged or the tablespace
is a predefined one */
bool mtr_t::is_named_space(const fil_space_t* space) const
{
  ut_ad(!m_user_space || m_user_space->id != TRX_SYS_SPACE);

  if (!is_logged())
    return true;
  if (m_user_space == space)
    return true;
  return is_predefined_tablespace(space->id);
}
#endif /* UNIV_DEBUG */
 | |
| 
 | |
| /** Acquire a tablespace X-latch.
 | |
| @param[in]	space_id	tablespace ID
 | |
| @return the tablespace object (never NULL) */
 | |
| fil_space_t *mtr_t::x_lock_space(uint32_t space_id)
 | |
| {
 | |
| 	fil_space_t*	space;
 | |
| 
 | |
| 	ut_ad(is_active());
 | |
| 
 | |
| 	if (space_id == TRX_SYS_SPACE) {
 | |
| 		space = fil_system.sys_space;
 | |
| 	} else if ((space = m_user_space) && space_id == space->id) {
 | |
| 	} else {
 | |
| 		space = fil_space_get(space_id);
 | |
| 		ut_ad(m_log_mode != MTR_LOG_NO_REDO
 | |
| 		      || space->is_temporary() || space->is_being_imported());
 | |
| 	}
 | |
| 
 | |
| 	ut_ad(space);
 | |
| 	ut_ad(space->id == space_id);
 | |
| 	x_lock_space(space);
 | |
| 	return(space);
 | |
| }
 | |
| 
 | |
| /** Acquire an exclusive tablespace latch.
 | |
| @param space  tablespace */
 | |
| void mtr_t::x_lock_space(fil_space_t *space)
 | |
| {
 | |
|   if (!memo_contains(*space))
 | |
|   {
 | |
|     memo_push(space, MTR_MEMO_SPACE_X_LOCK);
 | |
|     space->x_lock();
 | |
|   }
 | |
| }
 | |
| 
 | |
| void mtr_t::release(const void *object)
 | |
| {
 | |
|   ut_ad(is_active());
 | |
| 
 | |
|   auto it=
 | |
|     std::find_if(m_memo.begin(), m_memo.end(),
 | |
|                  [object](const mtr_memo_slot_t& slot)
 | |
|                  { return slot.object == object; });
 | |
|   ut_ad(it != m_memo.end());
 | |
|   ut_ad(!(it->type & MTR_MEMO_MODIFY));
 | |
|   it->release();
 | |
|   m_memo.erase(it, it + 1);
 | |
|   ut_ad(std::find_if(m_memo.begin(), m_memo.end(),
 | |
|                      [object](const mtr_memo_slot_t& slot)
 | |
|                      { return slot.object == &object; }) == m_memo.end());
 | |
| }
 | |
| 
 | |
| static time_t log_close_warn_time;
 | |
| 
 | |
| /** Display a warning that the log tail is overwriting the head,
 | |
| making the server crash-unsafe. */
 | |
| ATTRIBUTE_COLD static void log_overwrite_warning(lsn_t lsn)
 | |
| {
 | |
|   if (log_sys.overwrite_warned)
 | |
|     return;
 | |
| 
 | |
|   time_t t= time(nullptr);
 | |
|   if (difftime(t, log_close_warn_time) < 15)
 | |
|     return;
 | |
| 
 | |
|   if (!log_sys.overwrite_warned)
 | |
|     log_sys.overwrite_warned= lsn;
 | |
|   log_close_warn_time= t;
 | |
| 
 | |
|   sql_print_error("InnoDB: Crash recovery is broken due to"
 | |
|                   " insufficient innodb_log_file_size;"
 | |
|                   " last checkpoint LSN=" LSN_PF ", current LSN=" LSN_PF
 | |
|                   "%s.",
 | |
|                   lsn_t{log_sys.last_checkpoint_lsn}, lsn,
 | |
|                   srv_shutdown_state > SRV_SHUTDOWN_INITIATED
 | |
|                   ? ". Shutdown is in progress" : "");
 | |
| }
 | |
| 
 | |
| static ATTRIBUTE_NOINLINE void lsn_delay(size_t delay, size_t mult) noexcept
 | |
| {
 | |
|   delay*= mult * 2; // GCC 13.2.0 -O2 targeting AMD64 wants to unroll twice
 | |
|   HMT_low();
 | |
|   do
 | |
|     MY_RELAX_CPU();
 | |
|   while (--delay);
 | |
|   HMT_medium();
 | |
| }
 | |
| 
 | |
/* LOCK_TSET makes one attempt to set bit 63 (or bit 31 when
SIZEOF_SIZE_T is not 8) of buf_free with a single atomic
test-and-set instruction. If the bit was previously clear, control
leaves the enclosing function: the GCC-compatible variant jumps to a
label named "got" that the enclosing function must provide, and the
Microsoft variant executes a return statement. If the bit was already
set, execution continues after the macro.
NOTE(review): the bit is presumably the one that buf_free_LOCK denotes;
confirm against the declaration of log_t::buf_free_LOCK.
LOCK_TSET remains undefined for the compilers and targets that are not
covered below. */
#if defined __clang_major__ && __clang_major__ < 10
/* Only clang-10 introduced support for asm goto */
#elif defined __APPLE__
/* At least some versions of Apple Xcode do not support asm goto */
#elif defined __GNUC__ && (defined __i386__ || defined __x86_64__)
# if SIZEOF_SIZE_T == 8
#  define LOCK_TSET                                             \
  __asm__ goto("lock btsq $63, %0\n\t" "jnc %l1"                \
               : : "m"(buf_free) : "cc", "memory" : got)
# else
#  define LOCK_TSET                                             \
  __asm__ goto("lock btsl $31, %0\n\t" "jnc %l1"                \
               : : "m"(buf_free) : "cc", "memory" : got)
# endif
#elif defined _MSC_VER && (defined _M_IX86 || defined _M_X64)
# if SIZEOF_SIZE_T == 8
#  define LOCK_TSET                                                     \
  if (!_interlockedbittestandset64                                      \
      (reinterpret_cast<volatile LONG64*>(&buf_free), 63)) return
# else
#  define LOCK_TSET                                                     \
  if (!_interlockedbittestandset                                        \
      (reinterpret_cast<volatile long*>(&buf_free), 31)) return
# endif
#endif
| 
 | |
#ifdef LOCK_TSET
/** Spin until LOCK_TSET succeeds in setting the lock bit of buf_free.
The function is only left through LOCK_TSET. */
ATTRIBUTE_NOINLINE
void log_t::lsn_lock_bts() noexcept
{
  /* First attempt; on success, LOCK_TSET leaves the function. */
  LOCK_TSET;
  {
    const size_t m= mtr_t::spin_wait_delay;
    constexpr size_t DELAY= 10, MAX_ITERATIONS= 10;
    /* The loop has no termination condition: it is only left via
    LOCK_TSET. lsn_delay() is invoked between two rounds. */
    for (size_t delay_count= DELAY, delay_iterations= 1;;
         lsn_delay(delay_iterations, m))
    {
      /* Attempt the atomic test-and-set only when a relaxed load
      shows the lock bit to be clear. */
      if (!(buf_free.load(std::memory_order_relaxed) & buf_free_LOCK))
        LOCK_TSET;
      /* Back-off bookkeeping: delay_iterations grows by one per round
      until it reaches MAX_ITERATIONS; from then on, delay_count is
      decremented until it reaches 0, and nothing changes after that. */
      if (!delay_count);
      else if (delay_iterations < MAX_ITERATIONS)
        delay_count= DELAY, delay_iterations++;
      else
        delay_count--;
    }
  }

# ifdef __GNUC__
  /* Jump target of the asm goto variant of LOCK_TSET */
 got:
  return;
# endif
}

inline
#else
ATTRIBUTE_NOINLINE
#endif
/** Acquire the buf_free_LOCK flag of buf_free by spinning.
@return the value of buf_free, without the buf_free_LOCK flag */
size_t log_t::lock_lsn() noexcept
{
#ifdef LOCK_TSET
  lsn_lock_bts();
  /* We own the lock bit now; mask it out of the returned value. */
  return ~buf_free_LOCK & buf_free.load(std::memory_order_relaxed);
# undef LOCK_TSET
#else
  /* Portable variant: fetch_or() returns the previous value, so the
  flag was acquired by us if it was not set in that value. */
  size_t b= buf_free.fetch_or(buf_free_LOCK, std::memory_order_acquire);
  if (b & buf_free_LOCK)
  {
    const size_t m= mtr_t::spin_wait_delay;
    constexpr size_t DELAY= 10, MAX_ITERATIONS= 10;
    /* Keep polling with a relaxed load while the flag is set, and retry
    fetch_or() only when the flag was seen clear. The loop ends when
    fetch_or() returns a value without the flag. The loop body is the
    same back-off bookkeeping as in lsn_lock_bts(). */
    for (size_t delay_count= DELAY, delay_iterations= 1;
         ((b= buf_free.load(std::memory_order_relaxed)) & buf_free_LOCK) ||
           (buf_free_LOCK & (b= buf_free.fetch_or(buf_free_LOCK,
                                                  std::memory_order_acquire)));
         lsn_delay(delay_iterations, m))
      if (!delay_count);
      else if (delay_iterations < MAX_ITERATIONS)
        delay_count= DELAY, delay_iterations++;
      else
        delay_count--;
  }
  return b;
#endif
}
| 
 | |
| template<bool spin>
 | |
| ATTRIBUTE_COLD size_t log_t::append_prepare_wait(size_t b, bool ex, lsn_t lsn)
 | |
|   noexcept
 | |
| {
 | |
|   waits++;
 | |
|   ut_ad(buf_free.load(std::memory_order_relaxed) ==
 | |
|         (spin ? (b | buf_free_LOCK) : b));
 | |
|   if (spin)
 | |
|     buf_free.store(b, std::memory_order_release);
 | |
|   else
 | |
|     lsn_lock.wr_unlock();
 | |
| 
 | |
|   if (ex)
 | |
|     latch.wr_unlock();
 | |
|   else
 | |
|     latch.rd_unlock();
 | |
| 
 | |
|   log_write_up_to(lsn, is_mmap());
 | |
| 
 | |
|   if (ex)
 | |
|     latch.wr_lock(SRW_LOCK_CALL);
 | |
|   else
 | |
|     latch.rd_lock(SRW_LOCK_CALL);
 | |
| 
 | |
|   if (spin)
 | |
|     return lock_lsn();
 | |
| 
 | |
|   lsn_lock.wr_lock();
 | |
|   return buf_free.load(std::memory_order_relaxed);
 | |
| }
 | |
| 
 | |
| /** Reserve space in the log buffer for appending data.
 | |
| @tparam spin  whether to use the spin-only lock_lsn()
 | |
| @tparam mmap  log_sys.is_mmap()
 | |
| @param size   total length of the data to append(), in bytes
 | |
| @param ex     whether log_sys.latch is exclusively locked
 | |
| @return the start LSN and the buffer position for append() */
 | |
| template<bool spin,bool mmap>
 | |
| inline
 | |
| std::pair<lsn_t,byte*> log_t::append_prepare(size_t size, bool ex) noexcept
 | |
| {
 | |
|   ut_ad(ex ? latch_have_wr() : latch_have_rd());
 | |
|   ut_ad(mmap == is_mmap());
 | |
|   if (!spin)
 | |
|     lsn_lock.wr_lock();
 | |
|   size_t b{spin ? lock_lsn() : buf_free.load(std::memory_order_relaxed)};
 | |
|   write_to_buf++;
 | |
| 
 | |
|   lsn_t l{lsn.load(std::memory_order_relaxed)}, end_lsn{l + size};
 | |
| 
 | |
|   if (UNIV_UNLIKELY(mmap
 | |
|                     ? (end_lsn -
 | |
|                        get_flushed_lsn(std::memory_order_relaxed)) > capacity()
 | |
|                     : b + size >= buf_size))
 | |
|   {
 | |
|     b= append_prepare_wait<spin>(b, ex, l);
 | |
|     /* While flushing log, we had released the lsn lock and LSN could have
 | |
|     progressed in the meantime. */
 | |
|     l= lsn.load(std::memory_order_relaxed);
 | |
|     end_lsn= l + size;
 | |
|   }
 | |
| 
 | |
|   size_t new_buf_free= b + size;
 | |
|   if (mmap && new_buf_free >= file_size)
 | |
|     new_buf_free-= size_t(capacity());
 | |
| 
 | |
|   lsn.store(end_lsn, std::memory_order_relaxed);
 | |
| 
 | |
|   if (UNIV_UNLIKELY(end_lsn >= last_checkpoint_lsn + log_capacity))
 | |
|     set_check_for_checkpoint(true);
 | |
| 
 | |
|   byte *our_buf= buf;
 | |
|   if (spin)
 | |
|     buf_free.store(new_buf_free, std::memory_order_release);
 | |
|   else
 | |
|   {
 | |
|     buf_free.store(new_buf_free, std::memory_order_relaxed);
 | |
|     lsn_lock.wr_unlock();
 | |
|   }
 | |
| 
 | |
|   return {l, our_buf + b};
 | |
| }
 | |
| 
 | |
| /** Finish appending data to the log.
 | |
| @param lsn  the end LSN of the log record
 | |
| @return whether buf_flush_ahead() will have to be invoked */
 | |
| static mtr_t::page_flush_ahead log_close(lsn_t lsn) noexcept
 | |
| {
 | |
|   ut_ad(log_sys.latch_have_any());
 | |
| 
 | |
|   const lsn_t checkpoint_age= lsn - log_sys.last_checkpoint_lsn;
 | |
| 
 | |
|   if (UNIV_UNLIKELY(checkpoint_age >= log_sys.log_capacity) &&
 | |
|       /* silence message on create_log_file() after the log had been deleted */
 | |
|       checkpoint_age != lsn)
 | |
|     log_overwrite_warning(lsn);
 | |
|   else if (UNIV_LIKELY(checkpoint_age <= log_sys.max_modified_age_async))
 | |
|     return mtr_t::PAGE_FLUSH_NO;
 | |
|   else if (UNIV_LIKELY(checkpoint_age <= log_sys.max_checkpoint_age))
 | |
|     return mtr_t::PAGE_FLUSH_ASYNC;
 | |
| 
 | |
|   log_sys.set_check_for_checkpoint();
 | |
|   return mtr_t::PAGE_FLUSH_SYNC;
 | |
| }
 | |
| 
 | |
| inline void mtr_t::page_checksum(const buf_page_t &bpage)
 | |
| {
 | |
|   const byte *page= bpage.frame;
 | |
|   size_t size= srv_page_size;
 | |
| 
 | |
|   if (UNIV_LIKELY_NULL(bpage.zip.data))
 | |
|   {
 | |
|     size= (UNIV_ZIP_SIZE_MIN >> 1) << bpage.zip.ssize;
 | |
|     switch (fil_page_get_type(bpage.zip.data)) {
 | |
|     case FIL_PAGE_TYPE_ALLOCATED:
 | |
|     case FIL_PAGE_INODE:
 | |
|     case FIL_PAGE_IBUF_BITMAP:
 | |
|     case FIL_PAGE_TYPE_FSP_HDR:
 | |
|     case FIL_PAGE_TYPE_XDES:
 | |
|       /* These are essentially uncompressed pages. */
 | |
|       break;
 | |
|     default:
 | |
|       page= bpage.zip.data;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   /* We have to exclude from the checksum the normal
 | |
|   page checksum that is written by buf_flush_init_for_writing()
 | |
|   and FIL_PAGE_LSN which would be updated once we have actually
 | |
|   allocated the LSN.
 | |
| 
 | |
|   Unfortunately, we cannot access fil_space_t easily here. In order to
 | |
|   be compatible with encrypted tablespaces in the pre-full_crc32
 | |
|   format we will unconditionally exclude the 8 bytes at
 | |
|   FIL_PAGE_FILE_FLUSH_LSN_OR_KEY_VERSION
 | |
|   a.k.a. FIL_RTREE_SPLIT_SEQ_NUM. */
 | |
|   const uint32_t checksum=
 | |
|     my_crc32c(my_crc32c(my_crc32c(0, page + FIL_PAGE_OFFSET,
 | |
|                                   FIL_PAGE_LSN - FIL_PAGE_OFFSET),
 | |
|                         page + FIL_PAGE_TYPE, 2),
 | |
|               page + FIL_PAGE_SPACE_ID, size - (FIL_PAGE_SPACE_ID + 8));
 | |
| 
 | |
|   byte *l= log_write<OPTION>(bpage.id(), nullptr, 5, true, 0);
 | |
|   *l++= OPT_PAGE_CHECKSUM;
 | |
|   mach_write_to_4(l, checksum);
 | |
|   m_log.close(l + 4);
 | |
| }
 | |
| 
 | |
| std::pair<lsn_t,mtr_t::page_flush_ahead> mtr_t::do_write()
 | |
| {
 | |
|   ut_ad(!recv_no_log_write);
 | |
|   ut_ad(is_logged());
 | |
|   ut_ad(m_log.size());
 | |
|   ut_ad(!m_latch_ex || log_sys.latch_have_wr());
 | |
|   ut_ad(!m_user_space ||
 | |
|         (m_user_space->id > 0 && m_user_space->id < SRV_SPACE_ID_UPPER_BOUND));
 | |
| 
 | |
| #ifndef DBUG_OFF
 | |
|   do
 | |
|   {
 | |
|     if (m_log_mode != MTR_LOG_ALL ||
 | |
|         _db_keyword_(nullptr, "skip_page_checksum", 1))
 | |
|       continue;
 | |
|     for (const mtr_memo_slot_t& slot : m_memo)
 | |
|       if (slot.type & MTR_MEMO_MODIFY)
 | |
|       {
 | |
|         const buf_page_t &b= *static_cast<const buf_page_t*>(slot.object);
 | |
|         if (!b.is_freed())
 | |
|           page_checksum(b);
 | |
|       }
 | |
|   }
 | |
|   while (0);
 | |
| #endif
 | |
| 
 | |
|   size_t len= m_log.size() + 5;
 | |
|   ut_ad(len > 5);
 | |
| 
 | |
|   if (log_sys.is_encrypted())
 | |
|   {
 | |
|     len+= 8;
 | |
|     encrypt();
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     m_crc= 0;
 | |
|     m_commit_lsn= 0;
 | |
|     m_log.for_each_block([this](const mtr_buf_t::block_t *b)
 | |
|     { m_crc= my_crc32c(m_crc, b->begin(), b->used()); return true; });
 | |
|   }
 | |
| 
 | |
|   if (!m_latch_ex)
 | |
|     log_sys.latch.rd_lock(SRW_LOCK_CALL);
 | |
| 
 | |
|   if (UNIV_UNLIKELY(m_user_space && !m_user_space->max_lsn &&
 | |
|                     !srv_is_undo_tablespace((m_user_space->id))))
 | |
|   {
 | |
|     if (!m_latch_ex)
 | |
|     {
 | |
|       m_latch_ex= true;
 | |
|       log_sys.latch.rd_unlock();
 | |
|       log_sys.latch.wr_lock(SRW_LOCK_CALL);
 | |
|       if (UNIV_UNLIKELY(m_user_space->max_lsn != 0))
 | |
|         goto func_exit;
 | |
|     }
 | |
|     name_write();
 | |
|   }
 | |
| func_exit:
 | |
|   return finish_write(len);
 | |
| }
 | |
| 
 | |
| inline void log_t::resize_write(lsn_t lsn, const byte *end, size_t len,
 | |
|                                 size_t seq) noexcept
 | |
| {
 | |
|   ut_ad(latch_have_any());
 | |
| 
 | |
|   if (UNIV_LIKELY_NULL(resize_buf))
 | |
|   {
 | |
|     ut_ad(end >= buf);
 | |
|     end-= len;
 | |
|     size_t s;
 | |
| 
 | |
| #ifdef HAVE_PMEM
 | |
|     if (!resize_flush_buf)
 | |
|     {
 | |
|       ut_ad(is_mmap());
 | |
|       lsn_lock.wr_lock();
 | |
|       const size_t resize_capacity{resize_target - START_OFFSET};
 | |
|       {
 | |
|         const lsn_t resizing{resize_in_progress()};
 | |
|         /* For memory-mapped log, log_t::resize_start() would never
 | |
|         set log_sys.resize_lsn to less than log_sys.lsn. It cannot
 | |
|         execute concurrently with this thread, because we are holding
 | |
|         log_sys.latch and it would hold an exclusive log_sys.latch. */
 | |
|         if (UNIV_UNLIKELY(lsn < resizing))
 | |
|         {
 | |
|           /* This function may execute in multiple concurrent threads
 | |
|           that hold a shared log_sys.latch. Before we got lsn_lock,
 | |
|           another thread could have executed resize_lsn.store(lsn) below
 | |
|           with a larger lsn than ours.
 | |
| 
 | |
|           append_prepare() guarantees that the concurrent writes
 | |
|           cannot overlap, that is, our entire log must be discarded.
 | |
|           Besides, incomplete mini-transactions cannot be parsed anyway. */
 | |
|           ut_ad(resizing >= lsn + len);
 | |
|           goto mmap_done;
 | |
|         }
 | |
| 
 | |
|         s= START_OFFSET;
 | |
| 
 | |
|         if (UNIV_UNLIKELY(lsn - resizing + len >= resize_capacity))
 | |
|         {
 | |
|           resize_lsn.store(lsn, std::memory_order_relaxed);
 | |
|           lsn= 0;
 | |
|         }
 | |
|         else
 | |
|         {
 | |
|           lsn-= resizing;
 | |
|           s+= lsn;
 | |
|         }
 | |
|       }
 | |
| 
 | |
|       ut_ad(s + len <= resize_target);
 | |
| 
 | |
|       if (UNIV_UNLIKELY(end < &buf[START_OFFSET]))
 | |
|       {
 | |
|         /* The source buffer (log_sys.buf) wrapped around */
 | |
|         ut_ad(end + capacity() < &buf[file_size]);
 | |
|         ut_ad(end + len >= &buf[START_OFFSET]);
 | |
|         ut_ad(end + capacity() + len >= &buf[file_size]);
 | |
| 
 | |
|         size_t l= size_t(buf - (end - START_OFFSET));
 | |
|         memcpy(resize_buf + s, end + capacity(), l);
 | |
|         memcpy(resize_buf + s + l, &buf[START_OFFSET], len - l);
 | |
|       }
 | |
|       else
 | |
|       {
 | |
|         ut_ad(end + len <= &buf[file_size]);
 | |
|         memcpy(resize_buf + s, end, len);
 | |
|       }
 | |
|       s+= len - seq;
 | |
| 
 | |
|       /* Always set the sequence bit. If the resized log were to wrap around,
 | |
|       we will advance resize_lsn. */
 | |
|       ut_ad(resize_buf[s] <= 1);
 | |
|       resize_buf[s]= 1;
 | |
|     mmap_done:
 | |
|       lsn_lock.wr_unlock();
 | |
|     }
 | |
|     else
 | |
| #endif
 | |
|     {
 | |
|       ut_ad(resize_flush_buf);
 | |
|       s= end - buf;
 | |
|       ut_ad(s + len <= buf_size);
 | |
|       memcpy(resize_buf + s, end, len);
 | |
|       s+= len - seq;
 | |
|       /* Always set the sequence bit. If the resized log were to wrap around,
 | |
|       we will advance resize_lsn. */
 | |
|       ut_ad(resize_buf[s] <= 1);
 | |
|       resize_buf[s]= 1;
 | |
|     }
 | |
|   }
 | |
| }
 | |
| 
 | |
| inline void log_t::append(byte *&d, const void *s, size_t size) noexcept
 | |
| {
 | |
|   ut_ad(log_sys.latch_have_any());
 | |
|   ut_ad(d + size <= log_sys.buf +
 | |
|         (log_sys.is_mmap() ? log_sys.file_size : log_sys.buf_size));
 | |
|   memcpy(d, s, size);
 | |
|   d+= size;
 | |
| }
 | |
| 
 | |
| template<bool spin,bool mmap>
 | |
| std::pair<lsn_t,mtr_t::page_flush_ahead>
 | |
| mtr_t::finish_writer(mtr_t *mtr, size_t len)
 | |
| {
 | |
|   ut_ad(log_sys.is_latest());
 | |
|   ut_ad(!recv_no_log_write);
 | |
|   ut_ad(mtr->is_logged());
 | |
|   ut_ad(mtr->m_latch_ex ? log_sys.latch_have_wr() : log_sys.latch_have_rd());
 | |
| 
 | |
|   const size_t size{mtr->m_commit_lsn ? 5U + 8U : 5U};
 | |
|   std::pair<lsn_t, byte*> start=
 | |
|     log_sys.append_prepare<spin,mmap>(len, mtr->m_latch_ex);
 | |
| 
 | |
|   if (!mmap)
 | |
|   {
 | |
|     mtr->m_log.for_each_block([&start](const mtr_buf_t::block_t *b)
 | |
|     { log_sys.append(start.second, b->begin(), b->used()); return true; });
 | |
| 
 | |
|   write_trailer:
 | |
|     *start.second++= log_sys.get_sequence_bit(start.first + len - size);
 | |
|     if (mtr->m_commit_lsn)
 | |
|     {
 | |
|       mach_write_to_8(start.second, mtr->m_commit_lsn);
 | |
|       mtr->m_crc= my_crc32c(mtr->m_crc, start.second, 8);
 | |
|       start.second+= 8;
 | |
|     }
 | |
|     mach_write_to_4(start.second, mtr->m_crc);
 | |
|     start.second+= 4;
 | |
|   }
 | |
|   else
 | |
|   {
 | |
|     if (UNIV_LIKELY(start.second + len <= &log_sys.buf[log_sys.file_size]))
 | |
|     {
 | |
|       mtr->m_log.for_each_block([&start](const mtr_buf_t::block_t *b)
 | |
|       { log_sys.append(start.second, b->begin(), b->used()); return true; });
 | |
|       goto write_trailer;
 | |
|     }
 | |
|     mtr->m_log.for_each_block([&start](const mtr_buf_t::block_t *b)
 | |
|     {
 | |
|       size_t size{b->used()};
 | |
|       const size_t size_left(&log_sys.buf[log_sys.file_size] - start.second);
 | |
|       const byte *src= b->begin();
 | |
|       if (size > size_left)
 | |
|       {
 | |
|         ::memcpy(start.second, src, size_left);
 | |
|         start.second= &log_sys.buf[log_sys.START_OFFSET];
 | |
|         src+= size_left;
 | |
|         size-= size_left;
 | |
|       }
 | |
|       ::memcpy(start.second, src, size);
 | |
|       start.second+= size;
 | |
|       return true;
 | |
|     });
 | |
|     const size_t size_left(&log_sys.buf[log_sys.file_size] - start.second);
 | |
|     if (size_left > size)
 | |
|       goto write_trailer;
 | |
| 
 | |
|     byte tail[5 + 8];
 | |
|     tail[0]= log_sys.get_sequence_bit(start.first + len - size);
 | |
| 
 | |
|     if (mtr->m_commit_lsn)
 | |
|     {
 | |
|       mach_write_to_8(tail + 1, mtr->m_commit_lsn);
 | |
|       mtr->m_crc= my_crc32c(mtr->m_crc, tail + 1, 8);
 | |
|       mach_write_to_4(tail + 9, mtr->m_crc);
 | |
|     }
 | |
|     else
 | |
|       mach_write_to_4(tail + 1, mtr->m_crc);
 | |
| 
 | |
|     ::memcpy(start.second, tail, size_left);
 | |
|     ::memcpy(log_sys.buf + log_sys.START_OFFSET, tail + size_left,
 | |
|              size - size_left);
 | |
|     start.second= log_sys.buf +
 | |
|       ((size >= size_left) ? log_sys.START_OFFSET : log_sys.file_size) +
 | |
|       (size - size_left);
 | |
|   }
 | |
| 
 | |
|   log_sys.resize_write(start.first, start.second, len, size);
 | |
| 
 | |
|   mtr->m_commit_lsn= start.first + len;
 | |
|   return {start.first, log_close(mtr->m_commit_lsn)};
 | |
| }
 | |
| 
 | |
| bool mtr_t::have_x_latch(const buf_block_t &block) const
 | |
| {
 | |
|   ut_d(const mtr_memo_slot_t *found= nullptr);
 | |
| 
 | |
|   for (const mtr_memo_slot_t &slot : m_memo)
 | |
|   {
 | |
|     if (slot.object != &block)
 | |
|       continue;
 | |
| 
 | |
|     ut_d(found= &slot);
 | |
| 
 | |
|     if (!(slot.type & MTR_MEMO_PAGE_X_FIX))
 | |
|       continue;
 | |
| 
 | |
|     ut_ad(block.page.lock.have_x());
 | |
|     return true;
 | |
|   }
 | |
| 
 | |
|   ut_ad(!found);
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| bool mtr_t::have_u_or_x_latch(const buf_block_t &block) const
 | |
| {
 | |
|   for (const mtr_memo_slot_t &slot : m_memo)
 | |
|   {
 | |
|     if (slot.object == &block &&
 | |
|         slot.type & (MTR_MEMO_PAGE_X_FIX | MTR_MEMO_PAGE_SX_FIX))
 | |
|     {
 | |
|       ut_ad(block.page.lock.have_u_or_x());
 | |
|       return true;
 | |
|     }
 | |
|   }
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| /** Check if we are holding exclusive tablespace latch
 | |
| @param space  tablespace to search for
 | |
| @return whether space.latch is being held */
 | |
| bool mtr_t::memo_contains(const fil_space_t& space) const
 | |
| {
 | |
|   for (const mtr_memo_slot_t &slot : m_memo)
 | |
|   {
 | |
|     if (slot.object == &space && slot.type == MTR_MEMO_SPACE_X_LOCK)
 | |
|     {
 | |
|       ut_ad(space.is_owner());
 | |
|       return true;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| buf_block_t *mtr_t::page_lock_upgrade(const buf_block_t &block) noexcept
 | |
| {
 | |
|   ut_ad(block.page.lock.have_x());
 | |
| 
 | |
|   for (mtr_memo_slot_t &slot : m_memo)
 | |
|     if (slot.object == &block && slot.type & MTR_MEMO_PAGE_SX_FIX)
 | |
|       slot.type= mtr_memo_type_t(slot.type ^
 | |
|                                  (MTR_MEMO_PAGE_SX_FIX | MTR_MEMO_PAGE_X_FIX));
 | |
| 
 | |
| #ifdef BTR_CUR_HASH_ADAPT
 | |
|   ut_d(if (dict_index_t *index= block.index))
 | |
|   ut_ad(!index->freed());
 | |
| #endif /* BTR_CUR_HASH_ADAPT */
 | |
|   return const_cast<buf_block_t*>(&block);
 | |
| }
 | |
| 
 | |
| buf_block_t *mtr_t::page_lock(buf_block_t *block, ulint rw_latch) noexcept
 | |
| {
 | |
|   mtr_memo_type_t fix_type;
 | |
|   ut_d(const auto state= block->page.state());
 | |
|   ut_ad(state > buf_page_t::FREED);
 | |
|   ut_ad(state > buf_page_t::WRITE_FIX || state < buf_page_t::READ_FIX);
 | |
|   switch (rw_latch) {
 | |
|   case RW_NO_LATCH:
 | |
|     fix_type= MTR_MEMO_BUF_FIX;
 | |
|     goto done;
 | |
|   case RW_S_LATCH:
 | |
|     fix_type= MTR_MEMO_PAGE_S_FIX;
 | |
|     block->page.lock.s_lock();
 | |
|     break;
 | |
|   case RW_SX_LATCH:
 | |
|     fix_type= MTR_MEMO_PAGE_SX_FIX;
 | |
|     block->page.lock.u_lock();
 | |
|     ut_ad(!block->page.is_io_fixed());
 | |
|     break;
 | |
|   default:
 | |
|     ut_ad(rw_latch == RW_X_LATCH);
 | |
|     fix_type= MTR_MEMO_PAGE_X_FIX;
 | |
|     if (block->page.lock.x_lock_upgraded())
 | |
|     {
 | |
|       block->unfix();
 | |
|       page_lock_upgrade(*block);
 | |
|       return block;
 | |
|     }
 | |
|     ut_ad(!block->page.is_io_fixed());
 | |
|   }
 | |
| 
 | |
| done:
 | |
|   ut_ad(state < buf_page_t::UNFIXED ||
 | |
|         page_id_t(page_get_space_id(block->page.frame),
 | |
|                   page_get_page_no(block->page.frame)) == block->page.id());
 | |
|   memo_push(block, fix_type);
 | |
|   return block;
 | |
| }
 | |
| 
 | |
| void mtr_t::upgrade_buffer_fix(ulint savepoint, rw_lock_type_t rw_latch)
 | |
|   noexcept
 | |
| {
 | |
|   ut_ad(is_active());
 | |
|   mtr_memo_slot_t &slot= m_memo[savepoint];
 | |
|   ut_ad(slot.type == MTR_MEMO_BUF_FIX);
 | |
|   buf_block_t *block= static_cast<buf_block_t*>(slot.object);
 | |
|   ut_d(const auto state= block->page.state());
 | |
|   ut_ad(state > buf_page_t::FREED);
 | |
|   ut_ad(state > buf_page_t::WRITE_FIX || state < buf_page_t::READ_FIX);
 | |
|   static_assert(int{MTR_MEMO_PAGE_S_FIX} == int{RW_S_LATCH}, "");
 | |
|   static_assert(int{MTR_MEMO_PAGE_X_FIX} == int{RW_X_LATCH}, "");
 | |
|   static_assert(int{MTR_MEMO_PAGE_SX_FIX} == int{RW_SX_LATCH}, "");
 | |
|   slot.type= mtr_memo_type_t(rw_latch);
 | |
| 
 | |
|   switch (rw_latch) {
 | |
|   default:
 | |
|     ut_ad("invalid state" == 0);
 | |
|     break;
 | |
|   case RW_S_LATCH:
 | |
|     block->page.lock.s_lock();
 | |
|     break;
 | |
|   case RW_SX_LATCH:
 | |
|     block->page.lock.u_lock();
 | |
|     ut_ad(!block->page.is_io_fixed());
 | |
|     break;
 | |
|   case RW_X_LATCH:
 | |
|     block->page.lock.x_lock();
 | |
|     ut_ad(!block->page.is_io_fixed());
 | |
|   }
 | |
| 
 | |
|   ut_ad(page_id_t(page_get_space_id(block->page.frame),
 | |
|                   page_get_page_no(block->page.frame)) == block->page.id());
 | |
| }
 | |
| 
 | |
| #ifdef UNIV_DEBUG
 | |
| /** Check if we are holding an rw-latch in this mini-transaction
 | |
| @param lock   latch to search for
 | |
| @param type   held latch type
 | |
| @return whether (lock,type) is contained */
 | |
| bool mtr_t::memo_contains(const index_lock &lock, mtr_memo_type_t type) const
 | |
| {
 | |
|   ut_ad(type == MTR_MEMO_X_LOCK || type == MTR_MEMO_S_LOCK ||
 | |
|         type == MTR_MEMO_SX_LOCK);
 | |
| 
 | |
|   for (const mtr_memo_slot_t &slot : m_memo)
 | |
|   {
 | |
|     if (slot.object == &lock && slot.type == type)
 | |
|     {
 | |
|       switch (type) {
 | |
|       case MTR_MEMO_X_LOCK:
 | |
|         ut_ad(lock.have_x());
 | |
|         break;
 | |
|       case MTR_MEMO_SX_LOCK:
 | |
|         ut_ad(lock.have_u_or_x());
 | |
|         break;
 | |
|       case MTR_MEMO_S_LOCK:
 | |
|         ut_ad(lock.have_s());
 | |
|         break;
 | |
|       default:
 | |
|         break;
 | |
|       }
 | |
|       return true;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| /** Check if memo contains the given item.
 | |
| @param object		object to search
 | |
| @param flags		specify types of object (can be ORred) of
 | |
| 			MTR_MEMO_PAGE_S_FIX ... values
 | |
| @return true if contains */
 | |
| bool mtr_t::memo_contains_flagged(const void *object, ulint flags) const
 | |
| {
 | |
|   ut_ad(is_active());
 | |
|   ut_ad(flags);
 | |
|   /* Look for rw-lock-related and page-related flags. */
 | |
|   ut_ad(!(flags & ulint(~(MTR_MEMO_PAGE_S_FIX | MTR_MEMO_PAGE_X_FIX |
 | |
|                           MTR_MEMO_PAGE_SX_FIX | MTR_MEMO_BUF_FIX |
 | |
|                           MTR_MEMO_MODIFY | MTR_MEMO_X_LOCK |
 | |
|                           MTR_MEMO_SX_LOCK | MTR_MEMO_S_LOCK))));
 | |
|   /* Either some rw-lock-related or page-related flags
 | |
|   must be specified, but not both at the same time. */
 | |
|   ut_ad(!(flags & (MTR_MEMO_PAGE_S_FIX | MTR_MEMO_PAGE_X_FIX |
 | |
|                    MTR_MEMO_PAGE_SX_FIX | MTR_MEMO_BUF_FIX |
 | |
|                    MTR_MEMO_MODIFY)) ==
 | |
|         !!(flags & (MTR_MEMO_X_LOCK | MTR_MEMO_SX_LOCK | MTR_MEMO_S_LOCK)));
 | |
| 
 | |
|   for (const mtr_memo_slot_t &slot : m_memo)
 | |
|   {
 | |
|     if (object != slot.object)
 | |
|       continue;
 | |
| 
 | |
|     auto f = flags & slot.type;
 | |
|     if (!f)
 | |
|       continue;
 | |
| 
 | |
|     if (f & (MTR_MEMO_PAGE_S_FIX | MTR_MEMO_PAGE_SX_FIX | MTR_MEMO_PAGE_X_FIX))
 | |
|     {
 | |
|       const block_lock &lock= static_cast<const buf_page_t*>(object)->lock;
 | |
|       ut_ad(!(f & MTR_MEMO_PAGE_S_FIX) || lock.have_s());
 | |
|       ut_ad(!(f & MTR_MEMO_PAGE_SX_FIX) || lock.have_u_or_x());
 | |
|       ut_ad(!(f & MTR_MEMO_PAGE_X_FIX) || lock.have_x());
 | |
|     }
 | |
|     else
 | |
|     {
 | |
|       const index_lock &lock= *static_cast<const index_lock*>(object);
 | |
|       ut_ad(!(f & MTR_MEMO_S_LOCK) || lock.have_s());
 | |
|       ut_ad(!(f & MTR_MEMO_SX_LOCK) || lock.have_u_or_x());
 | |
|       ut_ad(!(f & MTR_MEMO_X_LOCK) || lock.have_x());
 | |
|     }
 | |
| 
 | |
|     return true;
 | |
|   }
 | |
| 
 | |
|   return false;
 | |
| }
 | |
| 
 | |
| buf_block_t* mtr_t::memo_contains_page_flagged(const byte *ptr, ulint flags)
 | |
|   const
 | |
| {
 | |
|   ptr= page_align(ptr);
 | |
| 
 | |
|   for (const mtr_memo_slot_t &slot : m_memo)
 | |
|   {
 | |
|     ut_ad(slot.object);
 | |
|     if (!(flags & slot.type))
 | |
|       continue;
 | |
| 
 | |
|     buf_page_t *bpage= static_cast<buf_page_t*>(slot.object);
 | |
| 
 | |
|     if (ptr != bpage->frame)
 | |
|       continue;
 | |
| 
 | |
|     ut_ad(!(slot.type & MTR_MEMO_PAGE_S_FIX) || bpage->lock.have_s());
 | |
|     ut_ad(!(slot.type & MTR_MEMO_PAGE_SX_FIX) || bpage->lock.have_u_or_x());
 | |
|     ut_ad(!(slot.type & MTR_MEMO_PAGE_X_FIX) || bpage->lock.have_x());
 | |
|     return static_cast<buf_block_t*>(slot.object);
 | |
|   }
 | |
| 
 | |
|   return nullptr;
 | |
| }
 | |
| #endif /* UNIV_DEBUG */
 | |
| 
 | |
| 
 | |
| /** Mark the given latched page as modified.
 | |
| @param block   page that will be modified */
 | |
| void mtr_t::set_modified(const buf_block_t &block)
 | |
| {
 | |
|   if (block.page.id().space() >= SRV_TMP_SPACE_ID)
 | |
|   {
 | |
|     const_cast<buf_block_t&>(block).page.set_temp_modified();
 | |
|     return;
 | |
|   }
 | |
| 
 | |
|   m_modifications= true;
 | |
| 
 | |
|   if (UNIV_UNLIKELY(m_log_mode == MTR_LOG_NONE))
 | |
|     return;
 | |
| 
 | |
|   for (mtr_memo_slot_t &slot : m_memo)
 | |
|   {
 | |
|     if (slot.object == &block &&
 | |
|         slot.type & (MTR_MEMO_PAGE_X_FIX | MTR_MEMO_PAGE_SX_FIX))
 | |
|     {
 | |
|       if (slot.type & MTR_MEMO_MODIFY)
 | |
|         ut_ad(m_made_dirty || block.page.oldest_modification() > 1);
 | |
|       else
 | |
|       {
 | |
|         slot.type= static_cast<mtr_memo_type_t>(slot.type | MTR_MEMO_MODIFY);
 | |
|         if (!m_made_dirty)
 | |
|           m_made_dirty= block.page.oldest_modification() <= 1;
 | |
|       }
 | |
|       return;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   /* This must be PageConverter::update_page() in IMPORT TABLESPACE. */
 | |
|   ut_ad(m_memo.empty());
 | |
|   ut_ad(!block.page.in_LRU_list);
 | |
| }
 | |
| 
 | |
| void mtr_t::init(buf_block_t *b)
 | |
| {
 | |
|   const page_id_t id{b->page.id()};
 | |
|   ut_ad(is_named_space(id.space()));
 | |
|   ut_ad(!m_freed_pages == !m_freed_space);
 | |
|   ut_ad(memo_contains_flagged(b, MTR_MEMO_PAGE_X_FIX));
 | |
| 
 | |
|   if (id.space() >= SRV_TMP_SPACE_ID)
 | |
|     b->page.set_temp_modified();
 | |
|   else
 | |
|   {
 | |
|     for (mtr_memo_slot_t &slot : m_memo)
 | |
|     {
 | |
|       if (slot.object == b && slot.type & MTR_MEMO_PAGE_X_FIX)
 | |
|       {
 | |
|         slot.type= MTR_MEMO_PAGE_X_MODIFY;
 | |
|         m_modifications= true;
 | |
|         if (!m_made_dirty)
 | |
|           m_made_dirty= b->page.oldest_modification() <= 1;
 | |
|         goto found;
 | |
|       }
 | |
|     }
 | |
|     ut_ad("block not X-latched" == 0);
 | |
|   }
 | |
| 
 | |
|  found:
 | |
|   if (UNIV_LIKELY_NULL(m_freed_space) &&
 | |
|       m_freed_space->id == id.space() &&
 | |
|       m_freed_pages->remove_if_exists(id.page_no()) &&
 | |
|       m_freed_pages->empty())
 | |
|   {
 | |
|     delete m_freed_pages;
 | |
|     m_freed_pages= nullptr;
 | |
|     m_freed_space= nullptr;
 | |
|   }
 | |
| 
 | |
|   b->page.set_reinit(b->page.state() & buf_page_t::LRU_MASK);
 | |
| 
 | |
|   if (!is_logged())
 | |
|     return;
 | |
| 
 | |
|   m_log.close(log_write<INIT_PAGE>(id, &b->page));
 | |
|   m_last_offset= FIL_PAGE_TYPE;
 | |
| }
 | |
| 
 | |
| /** Free a page.
 | |
| @param space   tablespace
 | |
| @param offset  offset of the page to be freed */
 | |
| void mtr_t::free(const fil_space_t &space, uint32_t offset)
 | |
| {
 | |
|   ut_ad(is_named_space(&space));
 | |
|   ut_ad(!m_freed_space || m_freed_space == &space);
 | |
| 
 | |
|   buf_block_t *freed= nullptr;
 | |
|   const page_id_t id{space.id, offset};
 | |
| 
 | |
|   for (auto it= m_memo.end(); it != m_memo.begin(); )
 | |
|   {
 | |
|     it--;
 | |
|   next:
 | |
|     mtr_memo_slot_t &slot= *it;
 | |
|     buf_block_t *block= static_cast<buf_block_t*>(slot.object);
 | |
|     ut_ad(block);
 | |
|     if (block == freed)
 | |
|     {
 | |
|       if (slot.type & (MTR_MEMO_PAGE_SX_FIX | MTR_MEMO_PAGE_X_FIX))
 | |
|         slot.type= MTR_MEMO_PAGE_X_FIX;
 | |
|       else
 | |
|       {
 | |
|         ut_ad(slot.type == MTR_MEMO_BUF_FIX);
 | |
|         block->page.unfix();
 | |
|         m_memo.erase(it, it + 1);
 | |
|         goto next;
 | |
|       }
 | |
|     }
 | |
|     else if (slot.type & (MTR_MEMO_PAGE_X_FIX | MTR_MEMO_PAGE_SX_FIX) &&
 | |
|              block->page.id() == id)
 | |
|     {
 | |
|       ut_ad(!block->page.is_freed());
 | |
|       ut_ad(!freed);
 | |
|       freed= block;
 | |
|       if (!(slot.type & MTR_MEMO_PAGE_X_FIX))
 | |
|       {
 | |
|         ut_d(bool upgraded=) block->page.lock.x_lock_upgraded();
 | |
|         ut_ad(upgraded);
 | |
|       }
 | |
|       if (id.space() >= SRV_TMP_SPACE_ID)
 | |
|       {
 | |
|         block->page.set_temp_modified();
 | |
|         slot.type= MTR_MEMO_PAGE_X_FIX;
 | |
|       }
 | |
|       else
 | |
|       {
 | |
|         slot.type= MTR_MEMO_PAGE_X_MODIFY;
 | |
|         if (!m_made_dirty)
 | |
|           m_made_dirty= block->page.oldest_modification() <= 1;
 | |
|       }
 | |
| #ifdef BTR_CUR_HASH_ADAPT
 | |
|       if (block->index)
 | |
|         btr_search_drop_page_hash_index(block, nullptr);
 | |
| #endif /* BTR_CUR_HASH_ADAPT */
 | |
|       block->page.set_freed(block->page.state());
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   if (is_logged())
 | |
|     m_log.close(log_write<FREE_PAGE>(id, nullptr));
 | |
| }
 | |
| 
 | |
| void small_vector_base::grow_by_1(void *small, size_t element_size) noexcept
 | |
| {
 | |
|   const size_t cap= Capacity*= 2, s= cap * element_size;
 | |
|   void *new_begin;
 | |
|   if (BeginX == small)
 | |
|   {
 | |
|     new_begin= my_malloc(PSI_NOT_INSTRUMENTED, s, MYF(0));
 | |
|     memcpy(new_begin, BeginX, s / 2);
 | |
|     TRASH_FREE(small, size() * element_size);
 | |
|   }
 | |
|   else
 | |
|     new_begin= my_realloc(PSI_NOT_INSTRUMENTED, BeginX, s, MYF(0));
 | |
| 
 | |
|   BeginX= new_begin;
 | |
| }
 | 
