mirror of
https://github.com/MariaDB/server.git
synced 2025-01-22 14:54:20 +01:00
34eef269eb
Always read the full page 0 to determine whether the tablespace contains encryption metadata. Tablespaces that are page compressed, or page compressed and encrypted, do not compare the checksum, as it does not exist. For encrypted tables, use the checksum verification written for encrypted tables; for normal tables, use the normal method. buf_page_is_checksum_valid_crc32, buf_page_is_checksum_valid_innodb, buf_page_is_checksum_valid_none: Modify innochecksum logging to file to avoid compilation warnings. fil0crypt.cc, fil0crypt.h: Modify so that they can be used in the innochecksum compilation, and move fil_space_verify_crypt_checksum to the end of the file. Add innochecksum logging to file. univ.i: Add the innochecksum strict_verify, log_file and cur_page_num variables as extern. page_zip_verify_checksum: Add innochecksum logging to file and remove unnecessary code. innochecksum.cc: A lot of changes; most notably, it is now able to read encryption metadata from page 0 of the tablespace. Added a test case where we intentionally corrupt FIL_PAGE_FILE_FLUSH_LSN_OR_KEY_VERSION (encryption key version), FIL_PAGE_FILE_FLUSH_LSN_OR_KEY_VERSION+4 (post encryption checksum) and FIL_DATA+10 (data).
857 lines
32 KiB
C
857 lines
32 KiB
C
/*****************************************************************************
|
|
|
|
Copyright (c) 1995, 2016, Oracle and/or its affiliates. All Rights Reserved.
|
|
Copyright (c) 2013, 2017, MariaDB Corporation. All Rights Reserved.
|
|
|
|
This program is free software; you can redistribute it and/or modify it under
|
|
the terms of the GNU General Public License as published by the Free Software
|
|
Foundation; version 2 of the License.
|
|
|
|
This program is distributed in the hope that it will be useful, but WITHOUT
|
|
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License along with
|
|
this program; if not, write to the Free Software Foundation, Inc.,
|
|
51 Franklin Street, Suite 500, Boston, MA 02110-1335 USA
|
|
|
|
*****************************************************************************/
|
|
|
|
/**************************************************//**
|
|
@file include/fsp0fsp.h
|
|
File space management
|
|
|
|
Created 12/18/1995 Heikki Tuuri
|
|
*******************************************************/
|
|
|
|
#ifndef fsp0fsp_h
|
|
#define fsp0fsp_h
|
|
|
|
#include "univ.i"
|
|
|
|
#include "fsp0types.h"
|
|
|
|
#ifndef UNIV_INNOCHECKSUM
|
|
|
|
#include "fsp0space.h"
|
|
#include "fut0lst.h"
|
|
#include "mtr0mtr.h"
|
|
#include "page0types.h"
|
|
#include "rem0types.h"
|
|
#include "ut0byte.h"
|
|
|
|
#endif /* !UNIV_INNOCHECKSUM */
|
|
#include "fsp0types.h"
|
|
|
|
/** Encode the current innodb_page_size as the PAGE_SSIZE field.
@return the PAGE_SSIZE flags, already shifted to FSP_FLAGS_POS_PAGE_SSIZE;
0 when UNIV_PAGE_SIZE equals UNIV_PAGE_SIZE_ORIG */
#define FSP_FLAGS_PAGE_SSIZE()						\
	((UNIV_PAGE_SIZE != UNIV_PAGE_SIZE_ORIG)			\
	 ? ((UNIV_PAGE_SIZE_SHIFT - UNIV_ZIP_SIZE_SHIFT_MIN + 1)	\
	    << FSP_FLAGS_POS_PAGE_SSIZE)				\
	 : 0)
|
|
|
|
/* @defgroup Compatibility macros for MariaDB 10.1.0 through 10.1.20;
|
|
see the table in fsp0types.h @{ */
|
|
/** Zero relative shift position of the PAGE_COMPRESSION field:
the first bit above the ATOMIC_BLOBS field */
#define FSP_FLAGS_POS_PAGE_COMPRESSION_MARIADB101			\
	(FSP_FLAGS_POS_ATOMIC_BLOBS + FSP_FLAGS_WIDTH_ATOMIC_BLOBS)
/** Zero relative shift position of the PAGE_COMPRESSION_LEVEL field:
1 bit above PAGE_COMPRESSION */
#define FSP_FLAGS_POS_PAGE_COMPRESSION_LEVEL_MARIADB101			\
	(FSP_FLAGS_POS_PAGE_COMPRESSION_MARIADB101 + 1)
/** Zero relative shift position of the ATOMIC_WRITES field:
4 bits above PAGE_COMPRESSION_LEVEL */
#define FSP_FLAGS_POS_ATOMIC_WRITES_MARIADB101				\
	(FSP_FLAGS_POS_PAGE_COMPRESSION_LEVEL_MARIADB101 + 4)
/** Zero relative shift position of the PAGE_SSIZE field:
2 bits above ATOMIC_WRITES */
#define FSP_FLAGS_POS_PAGE_SSIZE_MARIADB101				\
	(FSP_FLAGS_POS_ATOMIC_WRITES_MARIADB101 + 2)

/** Bit mask of the PAGE_COMPRESSION field (1 bit) */
#define FSP_FLAGS_MASK_PAGE_COMPRESSION_MARIADB101			\
	(0x1U << FSP_FLAGS_POS_PAGE_COMPRESSION_MARIADB101)
/** Bit mask of the PAGE_COMPRESSION_LEVEL field (4 bits) */
#define FSP_FLAGS_MASK_PAGE_COMPRESSION_LEVEL_MARIADB101		\
	(0xFU << FSP_FLAGS_POS_PAGE_COMPRESSION_LEVEL_MARIADB101)
/** Bit mask of the ATOMIC_WRITES field (2 bits) */
#define FSP_FLAGS_MASK_ATOMIC_WRITES_MARIADB101				\
	(0x3U << FSP_FLAGS_POS_ATOMIC_WRITES_MARIADB101)
/** Bit mask of the PAGE_SSIZE field (4 bits) */
#define FSP_FLAGS_MASK_PAGE_SSIZE_MARIADB101				\
	(0xFU << FSP_FLAGS_POS_PAGE_SSIZE_MARIADB101)
|
|
|
|
/** Extract the PAGE_COMPRESSION field.
@param[in]	flags	the contents of FSP_SPACE_FLAGS; the argument is
			parenthesized in the expansion, so a compound
			expression such as (a | b) is masked as a whole
@return the value of the PAGE_COMPRESSION field */
#define FSP_FLAGS_GET_PAGE_COMPRESSION_MARIADB101(flags)		\
	(((flags) & FSP_FLAGS_MASK_PAGE_COMPRESSION_MARIADB101)	\
	 >> FSP_FLAGS_POS_PAGE_COMPRESSION_MARIADB101)
/** Extract the PAGE_COMPRESSION_LEVEL field.
@param[in]	flags	the contents of FSP_SPACE_FLAGS
@return the value of the PAGE_COMPRESSION_LEVEL field */
#define FSP_FLAGS_GET_PAGE_COMPRESSION_LEVEL_MARIADB101(flags)		\
	(((flags) & FSP_FLAGS_MASK_PAGE_COMPRESSION_LEVEL_MARIADB101)	\
	 >> FSP_FLAGS_POS_PAGE_COMPRESSION_LEVEL_MARIADB101)
/** Extract the PAGE_SSIZE field.
@param[in]	flags	the contents of FSP_SPACE_FLAGS
@return the value of the PAGE_SSIZE field */
#define FSP_FLAGS_GET_PAGE_SSIZE_MARIADB101(flags)			\
	(((flags) & FSP_FLAGS_MASK_PAGE_SSIZE_MARIADB101)		\
	 >> FSP_FLAGS_POS_PAGE_SSIZE_MARIADB101)
|
|
|
|
/* @} */
|
|
|
|
/* @defgroup Tablespace Header Constants (moved from fsp0fsp.c) @{ */
|
|
|
|
/** Offset of the space header within a file page */
|
|
#define FSP_HEADER_OFFSET FIL_PAGE_DATA
|
|
|
|
/* The data structures in files are defined just as byte strings in C */
|
|
typedef byte fsp_header_t;
|
|
typedef byte xdes_t;
|
|
|
|
/*			SPACE HEADER
			============

File space header data structure: this data structure is contained in the
first page of a space. The space for this header is reserved in every extent
descriptor page, but used only in the first. */

/*-------------------------------------*/
/** space id */
#define FSP_SPACE_ID		0
/** this field contained a value up to which we know that the
modifications in the database have been flushed to the file space;
not used now */
#define FSP_NOT_USED		4
/** Current size of the space in pages */
#define FSP_SIZE		8
/** Minimum page number for which the free list has not been
initialized: the pages >= this limit are, by definition, free;
note that in a single-table tablespace where size < 64 pages,
this number is 64, i.e., we have initialized the space about the
first extent, but have not physically allocated those pages to the
file */
#define FSP_FREE_LIMIT		12
/** fsp_space_t.flags, similar to dict_table_t::flags */
#define FSP_SPACE_FLAGS		16
/** number of used pages in the FSP_FREE_FRAG list */
#define FSP_FRAG_N_USED		20
/** list of free extents */
#define FSP_FREE		24
/** list of partially free extents not belonging to any segment */
#define FSP_FREE_FRAG		(FSP_FREE + FLST_BASE_NODE_SIZE)
/** list of full extents not belonging to any segment */
#define FSP_FULL_FRAG		(FSP_FREE + 2 * FLST_BASE_NODE_SIZE)
/** 8 bytes which give the first unused segment id */
#define FSP_SEG_ID		(FSP_FREE + 3 * FLST_BASE_NODE_SIZE)
/** list of pages containing segment headers, where all the segment
inode slots are reserved; starts right after the 8 bytes of FSP_SEG_ID */
#define FSP_SEG_INODES_FULL	(FSP_FREE + 8 + 3 * FLST_BASE_NODE_SIZE)
/** list of pages containing segment headers, where not all the segment
header slots are reserved */
#define FSP_SEG_INODES_FREE	(FSP_FREE + 8 + 4 * FLST_BASE_NODE_SIZE)
/*-------------------------------------*/
/** File space header size */
#define FSP_HEADER_SIZE		(FSP_FREE + 8 + 5 * FLST_BASE_NODE_SIZE)

/** this many free extents are added to the free list from above
FSP_FREE_LIMIT at a time */
#define FSP_FREE_ADD		4
|
|
/* @} */
|
|
|
|
/* @defgroup File Segment Inode Constants (moved from fsp0fsp.c) @{ */
|
|
|
|
/* FILE SEGMENT INODE
|
|
==================
|
|
|
|
Segment inode which is created for each segment in a tablespace. NOTE: in
|
|
purge we assume that a segment having only one currently used page can be
|
|
freed in a few steps, so that the freeing cannot fill the file buffer with
|
|
bufferfixed file pages. */
|
|
|
|
/** File segment inode, declared as an alias of byte (a raw byte string) */
typedef byte fseg_inode_t;
|
|
|
|
/** the list node for linking segment inode pages */
#define FSEG_INODE_PAGE_NODE	FSEG_PAGE_DATA

/** start of the inode array: directly after the list node */
#define FSEG_ARR_OFFSET		(FSEG_INODE_PAGE_NODE + FLST_NODE_SIZE)
/*-------------------------------------*/
/** 8 bytes of segment id: if this is 0, it means that the header
is unused */
#define FSEG_ID			0
/** number of used segment pages in the FSEG_NOT_FULL list */
#define FSEG_NOT_FULL_N_USED	8
/** list of free extents of this segment */
#define FSEG_FREE		12
/** list of partially free extents */
#define FSEG_NOT_FULL		(FSEG_FREE + FLST_BASE_NODE_SIZE)
/** list of full extents */
#define FSEG_FULL		(FSEG_FREE + 2 * FLST_BASE_NODE_SIZE)
/** magic number used in debugging */
#define FSEG_MAGIC_N		(FSEG_FREE + 3 * FLST_BASE_NODE_SIZE)
/** array of individual pages belonging to this segment in fsp
fragment extent lists; starts 4 bytes after FSEG_MAGIC_N */
#define FSEG_FRAG_ARR		(FSEG_FREE + 4 + 3 * FLST_BASE_NODE_SIZE)
/** number of slots in the array for the fragment pages */
#define FSEG_FRAG_ARR_N_SLOTS	(FSP_EXTENT_SIZE / 2)
/** a fragment page slot contains its page number within space,
FIL_NULL means that the slot is not in use */
#define FSEG_FRAG_SLOT_SIZE	4
/*-------------------------------------*/
/** size of one segment inode: the fixed fields followed by the
fragment page slot array */
#define FSEG_INODE_SIZE							\
	(FSEG_FRAG_ARR + FSEG_FRAG_ARR_N_SLOTS * FSEG_FRAG_SLOT_SIZE)
|
|
|
|
/** Number of segment inodes which fit on a single page.
@param[in]	page_size	page size object providing physical(); the
				argument is parenthesized in the expansion
				so that an expression such as *ptr can be
				passed
@return (physical page size - FSEG_ARR_OFFSET - 10) / FSEG_INODE_SIZE */
#define FSP_SEG_INODES_PER_PAGE(page_size)		\
	(((page_size).physical() - FSEG_ARR_OFFSET - 10) / FSEG_INODE_SIZE)
|
|
|
|
/** value stored in the FSEG_MAGIC_N field */
#define FSEG_MAGIC_N_VALUE	97937874

/** If this value is x, then if the number of unused but reserved
pages in a segment is less than reserved pages * 1/x, and there are
at least FSEG_FRAG_LIMIT used pages, then we allow a new empty extent
to be added to the segment in fseg_alloc_free_page. Otherwise, we use
unused pages of the segment. */
#define FSEG_FILLFACTOR		8

/** If the segment has >= this many used pages, it may be expanded by
allocating extents to the segment; until that only individual fragment
pages are allocated from the space */
#define FSEG_FRAG_LIMIT		FSEG_FRAG_ARR_N_SLOTS

/** If the reserved size of a segment is at least this many extents,
we allow extents to be put to the free list of the extent: at most
FSEG_FREE_LIST_MAX_LEN many */
#define FSEG_FREE_LIST_LIMIT	40
/** upper bound referred to by FSEG_FREE_LIST_LIMIT */
#define FSEG_FREE_LIST_MAX_LEN	4
|
|
/* @} */
|
|
|
|
/* @defgroup Extent Descriptor Constants (moved from fsp0fsp.c) @{ */
|
|
|
|
/*			EXTENT DESCRIPTOR
			=================

File extent descriptor data structure: contains bits to tell which pages in
the extent are free and which contain old tuple versions to clean. */

/*-------------------------------------*/
/** The identifier of the segment to which this extent belongs */
#define XDES_ID			0
/** The list node data structure for the descriptors */
#define XDES_FLST_NODE		8
/** contains state information of the extent; placed directly after
the list node */
#define XDES_STATE		(XDES_FLST_NODE + FLST_NODE_SIZE)
/** Descriptor bitmap of the pages in the extent; placed 4 bytes
after XDES_STATE */
#define XDES_BITMAP		(XDES_STATE + 4)
/*-------------------------------------*/

/** How many bits are there per page */
#define XDES_BITS_PER_PAGE	2
/** Index of the bit which tells if the page is free */
#define XDES_FREE_BIT		0
/** NOTE: currently not used!
Index of the bit which tells if there are old versions of tuples
on the page */
#define XDES_CLEAN_BIT		1

/* States of a descriptor */
/** extent is in free list of space */
#define XDES_FREE		1
/** extent is in free fragment list of space */
#define XDES_FREE_FRAG		2
/** extent is in full fragment list of space */
#define XDES_FULL_FRAG		3
/** extent belongs to a segment */
#define XDES_FSEG		4

/** File extent data structure size in bytes. */
#define XDES_SIZE							\
	(XDES_BITMAP + UT_BITS_IN_BYTES(FSP_EXTENT_SIZE * XDES_BITS_PER_PAGE))

/** File extent data structure size in bytes for MAX page size. */
#define XDES_SIZE_MAX							\
	(XDES_BITMAP							\
	 + UT_BITS_IN_BYTES(FSP_EXTENT_SIZE_MAX * XDES_BITS_PER_PAGE))

/** File extent data structure size in bytes for MIN page size. */
#define XDES_SIZE_MIN							\
	(XDES_BITMAP							\
	 + UT_BITS_IN_BYTES(FSP_EXTENT_SIZE_MIN * XDES_BITS_PER_PAGE))

/** Offset of the descriptor array on a descriptor page:
the array follows the space header */
#define XDES_ARR_OFFSET		(FSP_HEADER_OFFSET + FSP_HEADER_SIZE)
|
|
|
|
#ifndef UNIV_INNOCHECKSUM
|
|
/* @} */
|
|
|
|
/**********************************************************************//**
|
|
Initializes the file space system. */
|
|
void
|
|
fsp_init(void);
|
|
/*==========*/
|
|
|
|
/**********************************************************************//**
|
|
Gets the size of the system tablespace from the tablespace header. If
|
|
we do not have an auto-extending data file, this should be equal to
|
|
the size of the data files. If there is an auto-extending data file,
|
|
this can be smaller.
|
|
@return size in pages */
|
|
ulint
|
|
fsp_header_get_tablespace_size(void);
|
|
/*================================*/
|
|
|
|
/** Calculate the number of pages to extend a datafile.
|
|
We extend single-table tablespaces first one extent at a time,
|
|
but 4 at a time for bigger tablespaces. It is not enough to extend always
|
|
by one extent, because we need to add at least one extent to FSP_FREE.
|
|
A single extent descriptor page will track many extents. And the extent
|
|
that uses its extent descriptor page is put onto the FSP_FREE_FRAG list.
|
|
Extents that do not use their extent descriptor page are added to FSP_FREE.
|
|
The physical page size is used to determine how many extents are tracked
|
|
on one extent descriptor page. See xdes_calc_descriptor_page().
|
|
@param[in] page_size page_size of the datafile
|
|
@param[in] size current number of pages in the datafile
|
|
@return number of pages to extend the file. */
|
|
ulint
|
|
fsp_get_pages_to_extend_ibd(
|
|
const page_size_t& page_size,
|
|
ulint size);
|
|
|
|
/** Calculate the number of physical pages in an extent for this file.
|
|
@param[in] page_size page_size of the datafile
|
|
@return number of pages in an extent for this file. */
|
|
UNIV_INLINE
|
|
ulint
|
|
fsp_get_extent_size_in_pages(const page_size_t& page_size)
|
|
{
|
|
return(FSP_EXTENT_SIZE * UNIV_PAGE_SIZE / page_size.physical());
|
|
}
|
|
|
|
/**********************************************************************//**
|
|
Reads the space id from the first page of a tablespace.
|
|
@return space id, ULINT_UNDEFINED if error */
|
|
ulint
|
|
fsp_header_get_space_id(
|
|
/*====================*/
|
|
const page_t* page); /*!< in: first page of a tablespace */
|
|
|
|
/** Read a tablespace header field.
|
|
@param[in] page first page of a tablespace
|
|
@param[in] field the header field
|
|
@return the contents of the header field */
|
|
inline
|
|
ulint
|
|
fsp_header_get_field(const page_t* page, ulint field)
|
|
{
|
|
return(mach_read_from_4(FSP_HEADER_OFFSET + field + page));
|
|
}
|
|
|
|
/** Read the flags from the tablespace header page.
|
|
@param[in] page first page of a tablespace
|
|
@return the contents of FSP_SPACE_FLAGS */
|
|
inline
|
|
ulint
|
|
fsp_header_get_flags(const page_t* page)
|
|
{
|
|
return(fsp_header_get_field(page, FSP_SPACE_FLAGS));
|
|
}
|
|
|
|
/** Get the byte offset of encryption information in page 0.
|
|
@param[in] ps page size
|
|
@return byte offset relative to FSP_HEADER_OFFSET */
|
|
inline MY_ATTRIBUTE((pure, warn_unused_result))
|
|
ulint
|
|
fsp_header_get_encryption_offset(const page_size_t& ps)
|
|
{
|
|
return XDES_ARR_OFFSET + XDES_SIZE * ps.physical() / FSP_EXTENT_SIZE;
|
|
}
|
|
|
|
/** Check the encryption key from the first page of a tablespace.
|
|
@param[in] fsp_flags tablespace flags
|
|
@param[in] page first page of a tablespace
|
|
@return true if success */
|
|
bool
|
|
fsp_header_check_encryption_key(
|
|
ulint fsp_flags,
|
|
page_t* page);
|
|
|
|
/**********************************************************************//**
|
|
Writes the space id and flags to a tablespace header. The flags contain
|
|
row type, physical/compressed page size, and logical/uncompressed page
|
|
size of the tablespace. */
|
|
void
|
|
fsp_header_init_fields(
|
|
/*===================*/
|
|
page_t* page, /*!< in/out: first page in the space */
|
|
ulint space_id, /*!< in: space id */
|
|
ulint flags); /*!< in: tablespace flags (FSP_SPACE_FLAGS):
|
|
0, or table->flags if newer than COMPACT */
|
|
/** Initialize a tablespace header.
|
|
@param[in] space_id space id
|
|
@param[in] size current size in blocks
|
|
@param[in,out] mtr mini-transaction */
|
|
void
|
|
fsp_header_init(ulint space_id, ulint size, mtr_t* mtr);
|
|
|
|
/**********************************************************************//**
|
|
Increases the space size field of a space. */
|
|
void
|
|
fsp_header_inc_size(
|
|
/*================*/
|
|
ulint space_id, /*!< in: space id */
|
|
ulint size_inc, /*!< in: size increment in pages */
|
|
mtr_t* mtr); /*!< in/out: mini-transaction */
|
|
/**********************************************************************//**
|
|
Creates a new segment.
|
|
@return the block where the segment header is placed, x-latched, NULL
|
|
if could not create segment because of lack of space */
|
|
buf_block_t*
|
|
fseg_create(
|
|
/*========*/
|
|
ulint space_id,/*!< in: space id */
|
|
ulint page, /*!< in: page where the segment header is placed: if
|
|
this is != 0, the page must belong to another segment,
|
|
if this is 0, a new page will be allocated and it
|
|
will belong to the created segment */
|
|
ulint byte_offset, /*!< in: byte offset of the created segment header
|
|
on the page */
|
|
mtr_t* mtr); /*!< in/out: mini-transaction */
|
|
/**********************************************************************//**
|
|
Creates a new segment.
|
|
@return the block where the segment header is placed, x-latched, NULL
|
|
if could not create segment because of lack of space */
|
|
buf_block_t*
|
|
fseg_create_general(
|
|
/*================*/
|
|
ulint space_id,/*!< in: space id */
|
|
ulint page, /*!< in: page where the segment header is placed: if
|
|
this is != 0, the page must belong to another segment,
|
|
if this is 0, a new page will be allocated and it
|
|
will belong to the created segment */
|
|
ulint byte_offset, /*!< in: byte offset of the created segment header
|
|
on the page */
|
|
ibool has_done_reservation, /*!< in: TRUE if the caller has already
|
|
done the reservation for the pages with
|
|
fsp_reserve_free_extents (at least 2 extents: one for
|
|
the inode and the other for the segment) then there is
|
|
no need to do the check for this individual
|
|
operation */
|
|
mtr_t* mtr); /*!< in/out: mini-transaction */
|
|
/**********************************************************************//**
|
|
Calculates the number of pages reserved by a segment, and how many pages are
|
|
currently used.
|
|
@return number of reserved pages */
|
|
ulint
|
|
fseg_n_reserved_pages(
|
|
/*==================*/
|
|
fseg_header_t* header, /*!< in: segment header */
|
|
ulint* used, /*!< out: number of pages used (<= reserved) */
|
|
mtr_t* mtr); /*!< in/out: mini-transaction */
|
|
/**********************************************************************//**
Allocates a single free page from a segment. This function implements
the intelligent allocation strategy which tries to minimize
file space fragmentation.
This is a wrapper around fseg_alloc_free_page_general() that passes
FALSE for has_done_reservation and uses the same mini-transaction for
both mtr and init_mtr (the mini-transaction argument is expanded twice).
@param[in,out]	header		segment header
@param[in]	hint_page	hint of which page would be desirable
@param[in]	dir		if the new page is needed because
				of an index page split, and records are
				inserted there in order, into which
				direction they go alphabetically: FSP_DOWN,
				FSP_UP, FSP_NO_DIR
@param[in,out]	mini_trx	mini-transaction
@return X-latched block, or NULL if no page could be allocated */
#define fseg_alloc_free_page(header, hint_page, dir, mini_trx)		\
	fseg_alloc_free_page_general(					\
		header, hint_page, dir, FALSE, mini_trx, mini_trx)
|
|
/**********************************************************************//**
|
|
Allocates a single free page from a segment. This function implements
|
|
the intelligent allocation strategy which tries to minimize file space
|
|
fragmentation.
|
|
@retval NULL if no page could be allocated
|
|
@retval block, rw_lock_x_lock_count(&block->lock) == 1 if allocation succeeded
|
|
(init_mtr == mtr, or the page was not previously freed in mtr)
|
|
@retval block (not allocated or initialized) otherwise */
|
|
buf_block_t*
|
|
fseg_alloc_free_page_general(
|
|
/*=========================*/
|
|
fseg_header_t* seg_header,/*!< in/out: segment header */
|
|
ulint hint, /*!< in: hint of which page would be
|
|
desirable */
|
|
byte direction,/*!< in: if the new page is needed because
|
|
of an index page split, and records are
|
|
inserted there in order, into which
|
|
direction they go alphabetically: FSP_DOWN,
|
|
FSP_UP, FSP_NO_DIR */
|
|
ibool has_done_reservation, /*!< in: TRUE if the caller has
|
|
already done the reservation for the page
|
|
with fsp_reserve_free_extents, then there
|
|
is no need to do the check for this individual
|
|
page */
|
|
mtr_t* mtr, /*!< in/out: mini-transaction */
|
|
mtr_t* init_mtr)/*!< in/out: mtr or another mini-transaction
|
|
in which the page should be initialized.
|
|
If init_mtr!=mtr, but the page is already
|
|
latched in mtr, do not initialize the page. */
|
|
MY_ATTRIBUTE((warn_unused_result, nonnull));
|
|
|
|
/** Reserves free pages from a tablespace. All mini-transactions which may
|
|
use several pages from the tablespace should call this function beforehand
|
|
and reserve enough free extents so that they certainly will be able
|
|
to do their operation, like a B-tree page split, fully. Reservations
|
|
must be released with function fil_space_release_free_extents!
|
|
|
|
The alloc_type below has the following meaning: FSP_NORMAL means an
|
|
operation which will probably result in more space usage, like an
|
|
insert in a B-tree; FSP_UNDO means allocation to undo logs: if we are
|
|
deleting rows, then this allocation will in the long run result in
|
|
less space usage (after a purge); FSP_CLEANING means allocation done
|
|
in a physical record delete (like in a purge) or other cleaning operation
|
|
which will result in less space usage in the long run. We prefer the latter
|
|
two types of allocation: when space is scarce, FSP_NORMAL allocations
|
|
will not succeed, but the latter two allocations will succeed, if possible.
|
|
The purpose is to avoid a dead end where the database is full but the
|
|
user cannot free any space because these freeing operations temporarily
|
|
reserve some space.
|
|
|
|
Single-table tablespaces whose size is < FSP_EXTENT_SIZE pages are a special
|
|
case. In this function we would liberally reserve several extents for
|
|
every page split or merge in a B-tree. But we do not want to waste disk space
|
|
if the table only occupies < FSP_EXTENT_SIZE pages. That is why we apply
|
|
different rules in that special case, just ensuring that there are n_pages
|
|
free pages available.
|
|
|
|
@param[out] n_reserved number of extents actually reserved; if we
|
|
return true and the tablespace size is <
|
|
FSP_EXTENT_SIZE pages, then this can be 0,
|
|
otherwise it is n_ext
|
|
@param[in] space_id tablespace identifier
|
|
@param[in] n_ext number of extents to reserve
|
|
@param[in] alloc_type page reservation type (FSP_BLOB, etc)
|
|
@param[in,out] mtr the mini transaction
|
|
@param[in] n_pages for small tablespaces (tablespace size is
|
|
less than FSP_EXTENT_SIZE), number of free
|
|
pages to reserve.
|
|
@return true if we were able to make the reservation */
|
|
bool
|
|
fsp_reserve_free_extents(
|
|
ulint* n_reserved,
|
|
ulint space_id,
|
|
ulint n_ext,
|
|
fsp_reserve_t alloc_type,
|
|
mtr_t* mtr,
|
|
ulint n_pages = 2);
|
|
|
|
/** Calculate how many KiB of new data we will be able to insert to the
|
|
tablespace without running out of space.
|
|
@param[in] space_id tablespace ID
|
|
@return available space in KiB
|
|
@retval UINTMAX_MAX if unknown */
|
|
uintmax_t
|
|
fsp_get_available_space_in_free_extents(
|
|
ulint space_id);
|
|
|
|
/** Calculate how many KiB of new data we will be able to insert to the
|
|
tablespace without running out of space. Start with a space object that has
|
|
been acquired by the caller who holds it for the calculation.
|
|
@param[in] space tablespace object from fil_space_acquire()
|
|
@return available space in KiB */
|
|
uintmax_t
|
|
fsp_get_available_space_in_free_extents(
|
|
const fil_space_t* space);
|
|
|
|
/**********************************************************************//**
|
|
Frees a single page of a segment. */
|
|
void
|
|
fseg_free_page_func(
|
|
fseg_header_t* seg_header, /*!< in: segment header */
|
|
ulint space_id, /*!< in: space id */
|
|
ulint page, /*!< in: page offset */
|
|
#ifdef BTR_CUR_HASH_ADAPT
|
|
bool ahi, /*!< in: whether we may need to drop
|
|
the adaptive hash index */
|
|
#endif /* BTR_CUR_HASH_ADAPT */
|
|
mtr_t* mtr); /*!< in/out: mini-transaction */
|
|
/* fseg_free_page() always takes the ahi argument; it is forwarded to
fseg_free_page_func() only when BTR_CUR_HASH_ADAPT is defined, and is
dropped from the expansion otherwise. */
#ifdef BTR_CUR_HASH_ADAPT
# define fseg_free_page(hdr, space, page_no, ahi, mini_trx)		\
	fseg_free_page_func(hdr, space, page_no, ahi, mini_trx)
#else /* BTR_CUR_HASH_ADAPT */
# define fseg_free_page(hdr, space, page_no, ahi, mini_trx)		\
	fseg_free_page_func(hdr, space, page_no, mini_trx)
#endif /* BTR_CUR_HASH_ADAPT */
|
|
/**********************************************************************//**
|
|
Checks if a single page of a segment is free.
|
|
@return true if free */
|
|
bool
|
|
fseg_page_is_free(
|
|
/*==============*/
|
|
fseg_header_t* seg_header, /*!< in: segment header */
|
|
ulint space_id, /*!< in: space id */
|
|
ulint page) /*!< in: page offset */
|
|
MY_ATTRIBUTE((nonnull, warn_unused_result));
|
|
/**********************************************************************//**
|
|
Frees part of a segment. This function can be used to free a segment
|
|
by repeatedly calling this function in different mini-transactions.
|
|
Doing the freeing in a single mini-transaction might result in
|
|
too big a mini-transaction.
|
|
@return TRUE if freeing completed */
|
|
ibool
|
|
fseg_free_step_func(
|
|
fseg_header_t* header, /*!< in, own: segment header; NOTE: if the header
|
|
resides on the first page of the frag list
|
|
of the segment, this pointer becomes obsolete
|
|
after the last freeing step */
|
|
#ifdef BTR_CUR_HASH_ADAPT
|
|
bool ahi, /*!< in: whether we may need to drop
|
|
the adaptive hash index */
|
|
#endif /* BTR_CUR_HASH_ADAPT */
|
|
mtr_t* mtr) /*!< in/out: mini-transaction */
|
|
MY_ATTRIBUTE((warn_unused_result));
|
|
/* fseg_free_step() always takes the ahi argument; it reaches
fseg_free_step_func() only when BTR_CUR_HASH_ADAPT is defined. */
#ifdef BTR_CUR_HASH_ADAPT
# define fseg_free_step(hdr, ahi, mini_trx)	\
	fseg_free_step_func(hdr, ahi, mini_trx)
#else /* BTR_CUR_HASH_ADAPT */
# define fseg_free_step(hdr, ahi, mini_trx)	\
	fseg_free_step_func(hdr, mini_trx)
#endif /* BTR_CUR_HASH_ADAPT */
|
|
/**********************************************************************//**
|
|
Frees part of a segment. Differs from fseg_free_step because this function
|
|
leaves the header page unfreed.
|
|
@return TRUE if freeing completed, except the header page */
|
|
ibool
|
|
fseg_free_step_not_header_func(
|
|
fseg_header_t* header, /*!< in: segment header which must reside on
|
|
the first fragment page of the segment */
|
|
#ifdef BTR_CUR_HASH_ADAPT
|
|
bool ahi, /*!< in: whether we may need to drop
|
|
the adaptive hash index */
|
|
#endif /* BTR_CUR_HASH_ADAPT */
|
|
mtr_t* mtr) /*!< in/out: mini-transaction */
|
|
MY_ATTRIBUTE((warn_unused_result));
|
|
/* fseg_free_step_not_header() always takes the ahi argument; it reaches
fseg_free_step_not_header_func() only when BTR_CUR_HASH_ADAPT is defined. */
#ifdef BTR_CUR_HASH_ADAPT
# define fseg_free_step_not_header(hdr, ahi, mini_trx)	\
	fseg_free_step_not_header_func(hdr, ahi, mini_trx)
#else /* BTR_CUR_HASH_ADAPT */
# define fseg_free_step_not_header(hdr, ahi, mini_trx)	\
	fseg_free_step_not_header_func(hdr, mini_trx)
#endif /* BTR_CUR_HASH_ADAPT */
|
|
|
|
/** Checks if a page address is an extent descriptor page address.
|
|
@param[in] page_id page id
|
|
@param[in] page_size page size
|
|
@return TRUE if a descriptor page */
|
|
UNIV_INLINE
|
|
ibool
|
|
fsp_descr_page(
|
|
const page_id_t& page_id,
|
|
const page_size_t& page_size);
|
|
|
|
/***********************************************************//**
|
|
Parses a redo log record of a file page init.
|
|
@return end of log record or NULL */
|
|
byte*
|
|
fsp_parse_init_file_page(
|
|
/*=====================*/
|
|
byte* ptr, /*!< in: buffer */
|
|
byte* end_ptr, /*!< in: buffer end */
|
|
buf_block_t* block); /*!< in: block or NULL */
|
|
#ifdef UNIV_BTR_PRINT
|
|
/*******************************************************************//**
|
|
Writes info of a segment. */
|
|
void
|
|
fseg_print(
|
|
/*=======*/
|
|
fseg_header_t* header, /*!< in: segment header */
|
|
mtr_t* mtr); /*!< in/out: mini-transaction */
|
|
#endif /* UNIV_BTR_PRINT */
|
|
|
|
/** Convert FSP_SPACE_FLAGS from the buggy MariaDB 10.1.0..10.1.20 format.
|
|
@param[in] flags the contents of FSP_SPACE_FLAGS
|
|
@return the flags corrected from the buggy MariaDB 10.1 format
|
|
@retval ULINT_UNDEFINED if the flags are not in the buggy 10.1 format */
|
|
MY_ATTRIBUTE((warn_unused_result, const))
|
|
UNIV_INLINE
|
|
ulint
|
|
fsp_flags_convert_from_101(ulint flags)
|
|
{
|
|
DBUG_EXECUTE_IF("fsp_flags_is_valid_failure",
|
|
return(ULINT_UNDEFINED););
|
|
if (flags == 0) {
|
|
return(flags);
|
|
}
|
|
|
|
if (flags >> 18) {
|
|
/* The most significant FSP_SPACE_FLAGS bit that was ever set
|
|
by MariaDB 10.1.0 to 10.1.20 was bit 17 (misplaced DATA_DIR flag).
|
|
The flags must be less than 1<<18 in order to be valid. */
|
|
return(ULINT_UNDEFINED);
|
|
}
|
|
|
|
if ((flags & (FSP_FLAGS_MASK_POST_ANTELOPE | FSP_FLAGS_MASK_ATOMIC_BLOBS))
|
|
== FSP_FLAGS_MASK_ATOMIC_BLOBS) {
|
|
/* If the "atomic blobs" flag (indicating
|
|
ROW_FORMAT=DYNAMIC or ROW_FORMAT=COMPRESSED) flag
|
|
is set, then the "post Antelope" (ROW_FORMAT!=REDUNDANT) flag
|
|
must also be set. */
|
|
return(ULINT_UNDEFINED);
|
|
}
|
|
|
|
/* Bits 6..10 denote compression in MariaDB 10.1.0 to 10.1.20.
|
|
They must be either 0b00000 or 0b00011 through 0b10011.
|
|
In correct versions, these bits would be
|
|
0bd0sss where d is the DATA_DIR flag (garbage bit) and
|
|
sss is the PAGE_SSIZE (3, 4, 6, or 7).
|
|
|
|
NOTE: MariaDB 10.1.0 to 10.1.20 can misinterpret
|
|
uncompressed data files with innodb_page_size=4k or 64k as
|
|
compressed innodb_page_size=16k files. Below is an exhaustive
|
|
state space analysis.
|
|
|
|
-0by1zzz: impossible (the bit 4 must be clean; see above)
|
|
-0b101xx: DATA_DIR, innodb_page_size>4k: invalid (COMPRESSION_LEVEL>9)
|
|
+0bx0011: innodb_page_size=4k:
|
|
!!! Misinterpreted as COMPRESSION_LEVEL=9 or 1, COMPRESSION=1.
|
|
-0bx0010: impossible, because sss must be 0b011 or 0b1xx
|
|
-0bx0001: impossible, because sss must be 0b011 or 0b1xx
|
|
-0b10000: DATA_DIR, innodb_page_size=16:
|
|
invalid (COMPRESSION_LEVEL=8 but COMPRESSION=0)
|
|
+0b00111: no DATA_DIR, innodb_page_size=64k:
|
|
!!! Misinterpreted as COMPRESSION_LEVEL=3, COMPRESSION=1.
|
|
-0b00101: impossible, because sss must be 0 for 16k, not 0b101
|
|
-0b001x0: no DATA_DIR, innodb_page_size=32k or 8k:
|
|
invalid (COMPRESSION_LEVEL=3 but COMPRESSION=0)
|
|
+0b00000: innodb_page_size=16k (looks like COMPRESSION=0)
|
|
??? Could actually be compressed; see PAGE_SSIZE below */
|
|
const ulint level = FSP_FLAGS_GET_PAGE_COMPRESSION_LEVEL_MARIADB101(
|
|
flags);
|
|
if (FSP_FLAGS_GET_PAGE_COMPRESSION_MARIADB101(flags) != (level != 0)
|
|
|| level > 9) {
|
|
/* The compression flags are not in the buggy MariaDB
|
|
10.1 format. */
|
|
return(ULINT_UNDEFINED);
|
|
}
|
|
if (!(~flags & FSP_FLAGS_MASK_ATOMIC_WRITES_MARIADB101)) {
|
|
/* The ATOMIC_WRITES flags cannot be 0b11.
|
|
(The bits 11..12 should actually never be 0b11,
|
|
because in MySQL they would be SHARED|TEMPORARY.) */
|
|
return(ULINT_UNDEFINED);
|
|
}
|
|
|
|
/* Bits 13..16 are the wrong position for PAGE_SSIZE, and they
|
|
should contain one of the values 3,4,6,7, that is, be of the form
|
|
0b0011 or 0b01xx (except 0b0101).
|
|
In correct versions, these bits should be 0bc0se
|
|
where c is the MariaDB COMPRESSED flag
|
|
and e is the MySQL 5.7 ENCRYPTION flag
|
|
and s is the MySQL 8.0 SDI flag. MariaDB can only support s=0, e=0.
|
|
|
|
Compressed innodb_page_size=16k tables with correct FSP_SPACE_FLAGS
|
|
will be properly rejected by older MariaDB 10.1.x because they
|
|
would read as PAGE_SSIZE>=8 which is not valid. */
|
|
|
|
const ulint ssize = FSP_FLAGS_GET_PAGE_SSIZE_MARIADB101(flags);
|
|
if (ssize == 1 || ssize == 2 || ssize == 5 || ssize & 8) {
|
|
/* the page_size is not between 4k and 64k;
|
|
16k should be encoded as 0, not 5 */
|
|
return(ULINT_UNDEFINED);
|
|
}
|
|
const ulint zssize = FSP_FLAGS_GET_ZIP_SSIZE(flags);
|
|
if (zssize == 0) {
|
|
/* not ROW_FORMAT=COMPRESSED */
|
|
} else if (zssize > (ssize ? ssize : 5)) {
|
|
/* invalid KEY_BLOCK_SIZE */
|
|
return(ULINT_UNDEFINED);
|
|
} else if (~flags & (FSP_FLAGS_MASK_POST_ANTELOPE
|
|
| FSP_FLAGS_MASK_ATOMIC_BLOBS)) {
|
|
/* both these flags should be set for
|
|
ROW_FORMAT=COMPRESSED */
|
|
return(ULINT_UNDEFINED);
|
|
}
|
|
|
|
flags = ((flags & 0x3f) | ssize << FSP_FLAGS_POS_PAGE_SSIZE
|
|
| FSP_FLAGS_GET_PAGE_COMPRESSION_MARIADB101(flags)
|
|
<< FSP_FLAGS_POS_PAGE_COMPRESSION);
|
|
ut_ad(fsp_flags_is_valid(flags, false));
|
|
return(flags);
|
|
}
|
|
|
|
/** Compare tablespace flags.
|
|
@param[in] expected expected flags from dict_tf_to_fsp_flags()
|
|
@param[in] actual flags read from FSP_SPACE_FLAGS
|
|
@return whether the flags match */
|
|
MY_ATTRIBUTE((warn_unused_result))
|
|
UNIV_INLINE
|
|
bool
|
|
fsp_flags_match(ulint expected, ulint actual)
|
|
{
|
|
expected &= ~FSP_FLAGS_MEM_MASK;
|
|
ut_ad(fsp_flags_is_valid(expected, false));
|
|
|
|
if (actual == expected) {
|
|
return(true);
|
|
}
|
|
|
|
actual = fsp_flags_convert_from_101(actual);
|
|
return(actual == expected);
|
|
}
|
|
|
|
/** Calculates the descriptor index within a descriptor page.
|
|
@param[in] page_size page size
|
|
@param[in] offset page offset
|
|
@return descriptor index */
|
|
UNIV_INLINE
|
|
ulint
|
|
xdes_calc_descriptor_index(
|
|
const page_size_t& page_size,
|
|
ulint offset);
|
|
|
|
/**********************************************************************//**
|
|
Gets a descriptor bit of a page.
|
|
@return TRUE if free */
|
|
UNIV_INLINE
|
|
ibool
|
|
xdes_get_bit(
|
|
/*=========*/
|
|
const xdes_t* descr, /*!< in: descriptor */
|
|
ulint bit, /*!< in: XDES_FREE_BIT or XDES_CLEAN_BIT */
|
|
ulint offset);/*!< in: page offset within extent:
|
|
0 ... FSP_EXTENT_SIZE - 1 */
|
|
|
|
/** Calculates the page where the descriptor of a page resides.
|
|
@param[in] page_size page size
|
|
@param[in] offset page offset
|
|
@return descriptor page offset */
|
|
UNIV_INLINE
|
|
ulint
|
|
xdes_calc_descriptor_page(
|
|
const page_size_t& page_size,
|
|
ulint offset);
|
|
|
|
/**********************************************************************//**
|
|
Checks if a single page is free.
|
|
@return true if free */
|
|
UNIV_INTERN
|
|
bool
|
|
fsp_page_is_free_func(
|
|
/*==============*/
|
|
ulint space, /*!< in: space id */
|
|
ulint page, /*!< in: page offset */
|
|
mtr_t* mtr, /*!< in/out: mini-transaction */
|
|
const char *file,
|
|
unsigned line);
|
|
|
|
/** Checks if a single page is free, forwarding the source location of
the call site (__FILE__, __LINE__) to fsp_page_is_free_func(). */
#define fsp_page_is_free(space,page,mtr)				\
	fsp_page_is_free_func((space), (page), (mtr), __FILE__, __LINE__)
|
|
|
|
#endif /* UNIV_INNOCHECKSUM */
|
|
|
|
#include "fsp0fsp.ic"
|
|
|
|
#endif
|