/***************************************************************************** Copyright (c) 1995, 2010, Oracle and/or its affiliates. All Rights Reserved. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; version 2 of the License. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Suite 500, Boston, MA 02110-1335 USA *****************************************************************************/ /**************************************************//** @file include/log0log.ic Database log Created 12/9/1995 Heikki Tuuri *******************************************************/ #include "os0file.h" #include "mach0data.h" #include "mtr0mtr.h" #include "srv0mon.h" #include "srv0srv.h" #include "ut0crc32.h" #ifdef UNIV_LOG_DEBUG /******************************************************//** Checks by parsing that the catenated log segment for a single mtr is consistent. */ UNIV_INTERN ibool log_check_log_recs( /*===============*/ const byte* buf, /*!< in: pointer to the start of the log segment in the log_sys->buf log buffer */ ulint len, /*!< in: segment length in bytes */ ib_uint64_t buf_start_lsn); /*!< in: buffer start lsn */ #endif /* UNIV_LOG_DEBUG */ /************************************************************//** Gets a log block flush bit. @return TRUE if this block was the first to be written in a log flush */ UNIV_INLINE ibool log_block_get_flush_bit( /*====================*/ const byte* log_block) /*!< in: log block */ { if (LOG_BLOCK_FLUSH_BIT_MASK & mach_read_from_4(log_block + LOG_BLOCK_HDR_NO)) { return(TRUE); } return(FALSE); } /************************************************************//** Sets the log block flush bit. */ UNIV_INLINE void log_block_set_flush_bit( /*====================*/ byte* log_block, /*!< in/out: log block */ ibool val) /*!< in: value to set */ { ulint field; field = mach_read_from_4(log_block + LOG_BLOCK_HDR_NO); if (val) { field = field | LOG_BLOCK_FLUSH_BIT_MASK; } else { field = field & ~LOG_BLOCK_FLUSH_BIT_MASK; } mach_write_to_4(log_block + LOG_BLOCK_HDR_NO, field); } /************************************************************//** Gets a log block number stored in the header. @return log block number stored in the block header */ UNIV_INLINE ulint log_block_get_hdr_no( /*=================*/ const byte* log_block) /*!< in: log block */ { return(~LOG_BLOCK_FLUSH_BIT_MASK & mach_read_from_4(log_block + LOG_BLOCK_HDR_NO)); } /************************************************************//** Sets the log block number stored in the header; NOTE that this must be set before the flush bit! */ UNIV_INLINE void log_block_set_hdr_no( /*=================*/ byte* log_block, /*!< in/out: log block */ ulint n) /*!< in: log block number: must be > 0 and < LOG_BLOCK_FLUSH_BIT_MASK */ { ut_ad(n > 0); ut_ad(n < LOG_BLOCK_FLUSH_BIT_MASK); mach_write_to_4(log_block + LOG_BLOCK_HDR_NO, n); } /************************************************************//** Gets a log block data length. @return log block data length measured as a byte offset from the block start */ UNIV_INLINE ulint log_block_get_data_len( /*===================*/ const byte* log_block) /*!< in: log block */ { return(mach_read_from_2(log_block + LOG_BLOCK_HDR_DATA_LEN)); } /************************************************************//** Sets the log block data length. */ UNIV_INLINE void log_block_set_data_len( /*===================*/ byte* log_block, /*!< in/out: log block */ ulint len) /*!< in: data length */ { mach_write_to_2(log_block + LOG_BLOCK_HDR_DATA_LEN, len); } /************************************************************//** Gets a log block first mtr log record group offset. @return first mtr log record group byte offset from the block start, 0 if none */ UNIV_INLINE ulint log_block_get_first_rec_group( /*==========================*/ const byte* log_block) /*!< in: log block */ { return(mach_read_from_2(log_block + LOG_BLOCK_FIRST_REC_GROUP)); } /************************************************************//** Sets the log block first mtr log record group offset. */ UNIV_INLINE void log_block_set_first_rec_group( /*==========================*/ byte* log_block, /*!< in/out: log block */ ulint offset) /*!< in: offset, 0 if none */ { mach_write_to_2(log_block + LOG_BLOCK_FIRST_REC_GROUP, offset); } /************************************************************//** Gets a log block checkpoint number field (4 lowest bytes). @return checkpoint no (4 lowest bytes) */ UNIV_INLINE ulint log_block_get_checkpoint_no( /*========================*/ const byte* log_block) /*!< in: log block */ { return(mach_read_from_4(log_block + LOG_BLOCK_CHECKPOINT_NO)); } /************************************************************//** Sets a log block checkpoint number field (4 lowest bytes). */ UNIV_INLINE void log_block_set_checkpoint_no( /*========================*/ byte* log_block, /*!< in/out: log block */ ib_uint64_t no) /*!< in: checkpoint no */ { mach_write_to_4(log_block + LOG_BLOCK_CHECKPOINT_NO, (ulint) no); } /************************************************************//** Converts a lsn to a log block number. @return log block number, it is > 0 and <= 1G */ UNIV_INLINE ulint log_block_convert_lsn_to_no( /*========================*/ lsn_t lsn) /*!< in: lsn of a byte within the block */ { return(((ulint) (lsn / OS_FILE_LOG_BLOCK_SIZE) & 0x3FFFFFFFUL) + 1); } /************************************************************//** Calculates the checksum for a log block using the current algorithm. @return checksum */ UNIV_INLINE ulint log_block_calc_checksum( /*====================*/ const byte* block) /*!< in: log block */ { return(log_checksum_algorithm_ptr(block)); } /************************************************************//** Calculates the checksum for a log block using the default InnoDB algorithm. @return checksum */ UNIV_INLINE ulint log_block_calc_checksum_innodb( /*===========================*/ const byte* block) /*!< in: log block */ { ulint sum; ulint sh; ulint i; sum = 1; sh = 0; for (i = 0; i < OS_FILE_LOG_BLOCK_SIZE - LOG_BLOCK_TRL_SIZE; i++) { ulint b = (ulint) block[i]; sum &= 0x7FFFFFFFUL; sum += b; sum += b << sh; sh++; if (sh > 24) { sh = 0; } } return(sum); } /************************************************************//** Calculates the checksum for a log block using the CRC32 algorithm. @return checksum */ UNIV_INLINE ulint log_block_calc_checksum_crc32( /*==========================*/ const byte* block) /*!< in: log block */ { return(ut_crc32(block, OS_FILE_LOG_BLOCK_SIZE - LOG_BLOCK_TRL_SIZE)); } /************************************************************//** Calculates the checksum for a log block using the "no-op" algorithm. @return checksum */ UNIV_INLINE ulint log_block_calc_checksum_none( /*=========================*/ const byte* block) /*!< in: log block */ { return(LOG_NO_CHECKSUM_MAGIC); } /************************************************************//** Gets a log block checksum field value. @return checksum */ UNIV_INLINE ulint log_block_get_checksum( /*===================*/ const byte* log_block) /*!< in: log block */ { return(mach_read_from_4(log_block + OS_FILE_LOG_BLOCK_SIZE - LOG_BLOCK_CHECKSUM)); } /************************************************************//** Sets a log block checksum field value. */ UNIV_INLINE void log_block_set_checksum( /*===================*/ byte* log_block, /*!< in/out: log block */ ulint checksum) /*!< in: checksum */ { mach_write_to_4(log_block + OS_FILE_LOG_BLOCK_SIZE - LOG_BLOCK_CHECKSUM, checksum); } /************************************************************//** Initializes a log block in the log buffer. */ UNIV_INLINE void log_block_init( /*===========*/ byte* log_block, /*!< in: pointer to the log buffer */ lsn_t lsn) /*!< in: lsn within the log block */ { ulint no; ut_ad(mutex_own(&(log_sys->mutex))); no = log_block_convert_lsn_to_no(lsn); log_block_set_hdr_no(log_block, no); log_block_set_data_len(log_block, LOG_BLOCK_HDR_SIZE); log_block_set_first_rec_group(log_block, 0); } /************************************************************//** Initializes a log block in the log buffer in the old format, where there was no checksum yet. */ UNIV_INLINE void log_block_init_in_old_format( /*=========================*/ byte* log_block, /*!< in: pointer to the log buffer */ lsn_t lsn) /*!< in: lsn within the log block */ { ulint no; ut_ad(mutex_own(&(log_sys->mutex))); no = log_block_convert_lsn_to_no(lsn); log_block_set_hdr_no(log_block, no); mach_write_to_4(log_block + OS_FILE_LOG_BLOCK_SIZE - LOG_BLOCK_CHECKSUM, no); log_block_set_data_len(log_block, LOG_BLOCK_HDR_SIZE); log_block_set_first_rec_group(log_block, 0); } #ifndef UNIV_HOTBACKUP /************************************************************//** Writes to the log the string given. The log must be released with log_release. @return end lsn of the log record, zero if did not succeed */ UNIV_INLINE lsn_t log_reserve_and_write_fast( /*=======================*/ const void* str, /*!< in: string */ ulint len, /*!< in: string length */ lsn_t* start_lsn)/*!< out: start lsn of the log record */ { ulint data_len; #ifdef UNIV_LOG_LSN_DEBUG /* length of the LSN pseudo-record */ ulint lsn_len; #endif /* UNIV_LOG_LSN_DEBUG */ mutex_enter(&log_sys->mutex); #ifdef UNIV_LOG_LSN_DEBUG lsn_len = 1 + mach_get_compressed_size(log_sys->lsn >> 32) + mach_get_compressed_size(log_sys->lsn & 0xFFFFFFFFUL); #endif /* UNIV_LOG_LSN_DEBUG */ data_len = len #ifdef UNIV_LOG_LSN_DEBUG + lsn_len #endif /* UNIV_LOG_LSN_DEBUG */ + log_sys->buf_free % OS_FILE_LOG_BLOCK_SIZE; if (data_len >= OS_FILE_LOG_BLOCK_SIZE - LOG_BLOCK_TRL_SIZE) { /* The string does not fit within the current log block or the log block would become full. Do not release the log mutex, because it has to be reacquired immediately for the "slow" write procedure via log_write_low(). */ return(0); } *start_lsn = log_sys->lsn; #ifdef UNIV_LOG_LSN_DEBUG { /* Write the LSN pseudo-record. */ byte* b = &log_sys->buf[log_sys->buf_free]; *b++ = MLOG_LSN | (MLOG_SINGLE_REC_FLAG & *(const byte*) str); /* Write the LSN in two parts, as a pseudo page number and space id. */ b += mach_write_compressed(b, log_sys->lsn >> 32); b += mach_write_compressed(b, log_sys->lsn & 0xFFFFFFFFUL); ut_a(b - lsn_len == &log_sys->buf[log_sys->buf_free]); memcpy(b, str, len); len += lsn_len; } #else /* UNIV_LOG_LSN_DEBUG */ memcpy(log_sys->buf + log_sys->buf_free, str, len); #endif /* UNIV_LOG_LSN_DEBUG */ log_block_set_data_len((byte*) ut_align_down(log_sys->buf + log_sys->buf_free, OS_FILE_LOG_BLOCK_SIZE), data_len); #ifdef UNIV_LOG_DEBUG log_sys->old_buf_free = log_sys->buf_free; log_sys->old_lsn = log_sys->lsn; #endif log_sys->buf_free += len; ut_ad(log_sys->buf_free <= log_sys->buf_size); log_sys->lsn += len; MONITOR_SET(MONITOR_LSN_CHECKPOINT_AGE, log_sys->lsn - log_sys->last_checkpoint_lsn); #ifdef UNIV_LOG_DEBUG log_check_log_recs(log_sys->buf + log_sys->old_buf_free, log_sys->buf_free - log_sys->old_buf_free, log_sys->old_lsn); #endif return(log_sys->lsn); } /**************************************************************************//** Locks the log mutex and opens the log for log_write_low. The log must be closed with log_close and released with log_release. @return start lsn of the log record */ UNIV_INLINE ib_uint64_t log_reserve_and_open( /*=================*/ ulint len) /*!< in: length of data to be catenated */ { mutex_enter(&(log_sys->mutex)); return log_open(len); } /***********************************************************************//** Releases the log mutex. */ UNIV_INLINE void log_release(void) /*=============*/ { mutex_exit(&(log_sys->mutex)); } /************************************************************//** Gets the current lsn. @return current lsn */ UNIV_INLINE lsn_t log_get_lsn(void) /*=============*/ { lsn_t lsn; mutex_enter(&(log_sys->mutex)); lsn = log_sys->lsn; mutex_exit(&(log_sys->mutex)); return(lsn); } /************************************************************//** Gets the last lsn that is fully flushed to disk. @return last flushed lsn */ UNIV_INLINE ib_uint64_t log_get_flush_lsn(void) /*=============*/ { ib_uint64_t lsn; mutex_enter(&(log_sys->mutex)); lsn = log_sys->flushed_to_disk_lsn; mutex_exit(&(log_sys->mutex)); return(lsn); } /************************************************************//** Gets the current lsn with a trylock @return current lsn or 0 if false*/ UNIV_INLINE lsn_t log_get_lsn_nowait(void) /*=============*/ { lsn_t lsn=0; if (!mutex_enter_nowait(&(log_sys->mutex))) { lsn = log_sys->lsn; mutex_exit(&(log_sys->mutex)); } return(lsn); } /**************************************************************** Gets the log group capacity. It is OK to read the value without holding log_sys->mutex because it is constant. @return log group capacity */ UNIV_INLINE lsn_t log_get_capacity(void) /*==================*/ { return(log_sys->log_group_capacity); } /**************************************************************** Get log_sys::max_modified_age_async. It is OK to read the value without holding log_sys::mutex because it is constant. @return max_modified_age_async */ UNIV_INLINE lsn_t log_get_max_modified_age_async(void) /*================================*/ { return(log_sys->max_modified_age_async); } /***********************************************************************//** Checks if there is need for a log buffer flush or a new checkpoint, and does this if yes. Any database operation should call this when it has modified more than about 4 pages. NOTE that this function may only be called when the OS thread owns no synchronization objects except the dictionary mutex. */ UNIV_INLINE void log_free_check(void) /*================*/ { #ifdef UNIV_SYNC_DEBUG ut_ad(sync_thread_levels_empty_except_dict()); #endif /* UNIV_SYNC_DEBUG */ if (log_sys->check_flush_or_checkpoint) { log_check_margins(); } } #endif /* !UNIV_HOTBACKUP */ /****************************************************************//** Unsafely reads the log_sys->tracked_lsn value. Uses atomic operations if available, or use dirty read. Use for printing only. @return log_sys->tracked_lsn value. */ UNIV_INLINE lsn_t log_get_tracked_lsn_peek(void) /*==========================*/ { #ifdef HAVE_ATOMIC_BUILTINS_64 return os_atomic_increment_uint64(&log_sys->tracked_lsn, 0); #else return log_sys->tracked_lsn; #endif } /****************************************************************//** Safely reads the log_sys->tracked_lsn value. Uses atomic operations if available, otherwise this field is protected with the log system mutex. The writer counterpart function is log_set_tracked_lsn() in log0online.c. @return log_sys->tracked_lsn value. */ UNIV_INLINE lsn_t log_get_tracked_lsn(void) /*=====================*/ { #ifdef HAVE_ATOMIC_BUILTINS_64 return os_atomic_increment_uint64(&log_sys->tracked_lsn, 0); #else ut_ad(mutex_own(&(log_sys->mutex))); return log_sys->tracked_lsn; #endif }