mirror of
https://github.com/MariaDB/server.git
synced 2025-01-18 04:53:01 +01:00
1081513a12
Merge 3.23.52 innobase/btr/btr0btr.c: Merge 3.23.52 innobase/btr/btr0cur.c: Merge 3.23.52 innobase/btr/btr0sea.c: Merge 3.23.52 innobase/include/btr0btr.h: Merge 3.23.52 innobase/include/btr0cur.h: Merge 3.23.52 innobase/include/btr0sea.h: Merge 3.23.52 innobase/include/buf0buf.h: Merge 3.23.52 innobase/include/buf0rea.h: Merge 3.23.52 innobase/include/data0data.h: Merge 3.23.52 innobase/include/data0data.ic: Merge 3.23.52 innobase/include/log0log.h: Merge 3.23.52 innobase/include/log0log.ic: Merge 3.23.52 innobase/include/os0file.h: Merge 3.23.52 innobase/include/page0page.h: Merge 3.23.52 innobase/include/page0page.ic: Merge 3.23.52 innobase/include/row0mysql.h: Merge 3.23.52 innobase/include/trx0roll.h: Merge 3.23.52 innobase/include/trx0sys.h: Merge 3.23.52 innobase/include/trx0trx.h: Merge 3.23.52 innobase/include/ut0ut.h: Merge 3.23.52 innobase/include/univ.i: Merge 3.23.52 innobase/include/ut0ut.ic: Merge 3.23.52 innobase/buf/buf0buf.c: Merge 3.23.52 innobase/buf/buf0rea.c: Merge 3.23.52 innobase/data/data0data.c: Merge 3.23.52 innobase/dict/dict0crea.c: Merge 3.23.52 innobase/dict/dict0dict.c: Merge 3.23.52 innobase/dict/dict0load.c: Merge 3.23.52 innobase/dict/dict0mem.c: Merge 3.23.52 innobase/fsp/fsp0fsp.c: Merge 3.23.52 innobase/ibuf/ibuf0ibuf.c: Merge 3.23.52 innobase/lock/lock0lock.c: Merge 3.23.52 innobase/log/log0log.c: Merge 3.23.52 innobase/log/log0recv.c: Merge 3.23.52 innobase/mtr/mtr0log.c: Merge 3.23.52 innobase/mtr/mtr0mtr.c: Merge 3.23.52 innobase/os/os0file.c: Merge 3.23.52 innobase/page/page0cur.c: Merge 3.23.52 innobase/page/page0page.c: Merge 3.23.52 innobase/rem/rem0cmp.c: Merge 3.23.52 innobase/row/row0ins.c: Merge 3.23.52 innobase/row/row0mysql.c: Merge 3.23.52 innobase/row/row0purge.c: Merge 3.23.52 innobase/row/row0upd.c: Merge 3.23.52 innobase/srv/srv0srv.c: Merge 3.23.52 innobase/srv/srv0start.c: Merge 3.23.52 innobase/trx/trx0roll.c: Merge 3.23.52 innobase/trx/trx0sys.c: Merge 3.23.52 innobase/trx/trx0trx.c: Merge 3.23.52 
innobase/trx/trx0undo.c: Merge 3.23.52 innobase/ut/ut0mem.c: Merge 3.23.52 innobase/ut/ut0ut.c: Merge 3.23.52
416 lines
15 KiB
C
416 lines
15 KiB
C
/******************************************************
|
|
The interface to the operating system file io
|
|
|
|
(c) 1995 Innobase Oy
|
|
|
|
Created 10/21/1995 Heikki Tuuri
|
|
*******************************************************/
|
|
|
|
#ifndef os0file_h
|
|
#define os0file_h
|
|
|
|
#include "univ.i"
|
|
|
|
|
|
/* If the following is set to TRUE, we do not call os_file_flush in every
|
|
os_file_write */
|
|
extern ibool os_do_not_call_flush_at_each_write;
|
|
extern ibool os_has_said_disk_full;
|
|
extern ibool os_aio_print_debug;
|
|
|
|
#ifdef __WIN__
|
|
|
|
/* We always define WIN_ASYNC_IO, and check at run-time whether
|
|
the OS actually supports it: Win 95 does not, NT does. */
|
|
#define WIN_ASYNC_IO
|
|
|
|
#define UNIV_NON_BUFFERED_IO
|
|
|
|
#endif
|
|
|
|
#ifdef __WIN__
|
|
#define os_file_t HANDLE
|
|
#else
|
|
typedef int os_file_t;
|
|
#endif
|
|
|
|
extern ulint os_innodb_umask;
|
|
|
|
/* If this flag is TRUE, then we will use the native aio of the
|
|
OS (provided we compiled Innobase with it in), otherwise we will
|
|
use simulated aio we build below with threads */
|
|
|
|
extern ibool os_aio_use_native_aio;
|
|
|
|
#define OS_FILE_SECTOR_SIZE 512
|
|
|
|
/* The next value should be smaller than or equal to the smallest sector size used
|
|
on any disk. A log block is required to be a portion of disk which is written
|
|
so that if the start and the end of a block get written to disk, then the
|
|
whole block gets written. This should be true even in most cases of a crash:
|
|
if this fails for a log block, then it is equivalent to a media failure in the
|
|
log. */
|
|
|
|
#define OS_FILE_LOG_BLOCK_SIZE 512
|
|
|
|
/* Options for file_create */
|
|
#define OS_FILE_OPEN 51
|
|
#define OS_FILE_CREATE 52
|
|
#define OS_FILE_OVERWRITE 53
|
|
|
|
#define OS_FILE_READ_ONLY 333
|
|
#define OS_FILE_READ_WRITE 444
|
|
|
|
/* Purpose options for os_file_create */
|
|
#define OS_FILE_AIO 61
|
|
#define OS_FILE_NORMAL 62
|
|
|
|
/* Types for file create */
|
|
#define OS_DATA_FILE 100
|
|
#define OS_LOG_FILE 101
|
|
|
|
/* Error codes from os_file_get_last_error */
|
|
#define OS_FILE_NOT_FOUND 71
|
|
#define OS_FILE_DISK_FULL 72
|
|
#define OS_FILE_ALREADY_EXISTS 73
|
|
#define OS_FILE_AIO_RESOURCES_RESERVED 74 /* wait for OS aio resources
|
|
to become available again */
|
|
#define OS_FILE_ERROR_NOT_SPECIFIED 75
|
|
|
|
/* Types for aio operations */
|
|
#define OS_FILE_READ 10
|
|
#define OS_FILE_WRITE 11
|
|
|
|
#define OS_FILE_LOG 256 /* This can be ORed to type */
|
|
|
|
#define OS_AIO_N_PENDING_IOS_PER_THREAD 32 /* Win NT does not allow more
|
|
than 64 */
|
|
|
|
/* Modes for aio operations */
|
|
#define OS_AIO_NORMAL 21 /* Normal asynchronous i/o not for ibuf
|
|
pages or ibuf bitmap pages */
|
|
#define OS_AIO_IBUF 22 /* Asynchronous i/o for ibuf pages or ibuf
|
|
bitmap pages */
|
|
#define OS_AIO_LOG 23 /* Asynchronous i/o for the log */
|
|
#define OS_AIO_SYNC 24 /* Asynchronous i/o where the calling thread
|
|
will itself wait for the i/o to complete,
|
|
doing also the job of the i/o-handler thread;
|
|
can be used for any pages, ibuf or non-ibuf.
|
|
This is used to save CPU time, as we can do
|
|
with fewer thread switches. Plain synchronous
|
|
i/o is not as good, because it must serialize
|
|
the file seek and read or write, causing a
|
|
bottleneck for parallelism. */
|
|
|
|
#define OS_AIO_SIMULATED_WAKE_LATER 512 /* This can be ORed to mode
|
|
in the call of os_aio(...),
|
|
if the caller wants to post several i/o
|
|
requests in a batch, and only after that
|
|
wake the i/o-handler thread; this has
|
|
effect only in simulated aio */
|
|
#define OS_WIN31 1
|
|
#define OS_WIN95 2
|
|
#define OS_WINNT 3
|
|
|
|
extern ulint os_n_file_reads;
|
|
extern ulint os_n_file_writes;
|
|
extern ulint os_n_fsyncs;
|
|
|
|
/***************************************************************************
|
|
Gets the operating system version. Currently works only on Windows. */
|
|
|
|
ulint
|
|
os_get_os_version(void);
|
|
/*===================*/
|
|
/* out: OS_WIN95, OS_WIN31, OS_WINNT (2000 == NT) */
|
|
/********************************************************************
|
|
Creates the seek mutexes used in positioned reads and writes. */
|
|
|
|
void
|
|
os_io_init_simple(void);
|
|
/*===================*/
|
|
/********************************************************************
|
|
A simple function to open or create a file. */
|
|
|
|
os_file_t
|
|
os_file_create_simple(
|
|
/*==================*/
|
|
/* out, own: handle to the file, not defined if error,
|
|
error number can be retrieved with os_file_get_last_error */
|
|
char* name, /* in: name of the file or path as a null-terminated
|
|
string */
|
|
ulint create_mode,/* in: OS_FILE_OPEN if an existing file is opened
|
|
(if does not exist, error), or OS_FILE_CREATE if a new
|
|
file is created (if exists, error) */
|
|
ulint access_type,/* in: OS_FILE_READ_ONLY or OS_FILE_READ_WRITE */
|
|
ibool* success);/* out: TRUE if succeed, FALSE if error */
|
|
/********************************************************************
|
|
Opens an existing file or creates a new one. */
|
|
|
|
os_file_t
|
|
os_file_create(
|
|
/*===========*/
|
|
/* out, own: handle to the file, not defined if error,
|
|
error number can be retrieved with os_file_get_last_error */
|
|
char* name, /* in: name of the file or path as a null-terminated
|
|
string */
|
|
ulint create_mode,/* in: OS_FILE_OPEN if an existing file is opened
|
|
(if does not exist, error), or OS_FILE_CREATE if a new
|
|
file is created (if exists, error), OS_FILE_OVERWRITE
|
|
if a new file is created or an old overwritten */
|
|
ulint purpose,/* in: OS_FILE_AIO, if asynchronous, non-buffered i/o
|
|
is desired, OS_FILE_NORMAL, if any normal file */
|
|
ulint type, /* in: OS_DATA_FILE or OS_LOG_FILE */
|
|
ibool* success);/* out: TRUE if succeed, FALSE if error */
|
|
/***************************************************************************
|
|
Closes a file handle. In case of error, error number can be retrieved with
|
|
os_file_get_last_error. */
|
|
|
|
ibool
|
|
os_file_close(
|
|
/*==========*/
|
|
/* out: TRUE if success */
|
|
os_file_t file); /* in, own: handle to a file */
|
|
/***************************************************************************
|
|
Gets a file size. */
|
|
|
|
ibool
|
|
os_file_get_size(
|
|
/*=============*/
|
|
/* out: TRUE if success */
|
|
os_file_t file, /* in: handle to a file */
|
|
ulint* size, /* out: least significant 32 bits of file
|
|
size */
|
|
ulint* size_high);/* out: most significant 32 bits of size */
|
|
/***************************************************************************
|
|
Sets a file size. This function can be used to extend or truncate a file. */
|
|
|
|
ibool
|
|
os_file_set_size(
|
|
/*=============*/
|
|
/* out: TRUE if success */
|
|
char* name, /* in: name of the file or path as a
|
|
null-terminated string */
|
|
os_file_t file, /* in: handle to a file */
|
|
ulint size, /* in: least significant 32 bits of file
|
|
size */
|
|
ulint size_high);/* in: most significant 32 bits of size */
|
|
/***************************************************************************
|
|
Flushes the write buffers of a given file to the disk. */
|
|
|
|
ibool
|
|
os_file_flush(
|
|
/*==========*/
|
|
/* out: TRUE if success */
|
|
os_file_t file); /* in, own: handle to a file */
|
|
/***************************************************************************
|
|
Retrieves the last error number if an error occurs in a file io function.
|
|
The number should be retrieved before any other OS calls (because they may
|
|
overwrite the error number). If the number is not known to this program,
|
|
the OS error number + 100 is returned. */
|
|
|
|
ulint
|
|
os_file_get_last_error(void);
|
|
/*========================*/
|
|
/* out: error number, or OS error number + 100 */
|
|
/***********************************************************************
|
|
Requests a synchronous read operation. */
|
|
|
|
ibool
|
|
os_file_read(
|
|
/*=========*/
|
|
/* out: TRUE if request was
|
|
successful, FALSE if fail */
|
|
os_file_t file, /* in: handle to a file */
|
|
void* buf, /* in: buffer where to read */
|
|
ulint offset, /* in: least significant 32 bits of file
|
|
offset where to read */
|
|
ulint offset_high,/* in: most significant 32 bits of
|
|
offset */
|
|
ulint n); /* in: number of bytes to read */
|
|
/***********************************************************************
|
|
Requests a synchronous write operation. */
|
|
|
|
ibool
|
|
os_file_write(
|
|
/*==========*/
|
|
/* out: TRUE if request was
|
|
successful, FALSE if fail */
|
|
char* name, /* in: name of the file or path as a
|
|
null-terminated string */
|
|
os_file_t file, /* in: handle to a file */
|
|
void* buf, /* in: buffer from which to write */
|
|
ulint offset, /* in: least significant 32 bits of file
|
|
offset where to write */
|
|
ulint offset_high,/* in: most significant 32 bits of
|
|
offset */
|
|
ulint n); /* in: number of bytes to write */
|
|
/****************************************************************************
|
|
Initializes the asynchronous io system. Creates separate aio array for
|
|
non-ibuf read and write, a third aio array for the ibuf i/o, with just one
|
|
segment, two aio arrays for log reads and writes with one segment, and a
|
|
synchronous aio array of the specified size. The combined number of segments
|
|
in the four first aio arrays is the parameter n_segments given to the
|
|
function. The caller must create an i/o handler thread for each segment in
|
|
the four first arrays, but not for the sync aio array. */
|
|
|
|
void
|
|
os_aio_init(
|
|
/*========*/
|
|
ulint n, /* in: maximum number of pending aio operations
|
|
allowed; n must be divisible by n_segments */
|
|
ulint n_segments, /* in: combined number of segments in the four
|
|
first aio arrays; must be >= 4 */
|
|
ulint n_slots_sync); /* in: number of slots in the sync aio array */
|
|
/***********************************************************************
|
|
Requests an asynchronous i/o operation. */
|
|
|
|
ibool
|
|
os_aio(
|
|
/*===*/
|
|
/* out: TRUE if request was queued
|
|
successfully, FALSE if fail */
|
|
ulint type, /* in: OS_FILE_READ or OS_FILE_WRITE */
|
|
ulint mode, /* in: OS_AIO_NORMAL, ..., possibly ORed
|
|
to OS_AIO_SIMULATED_WAKE_LATER: the
|
|
last flag advises this function not to wake
|
|
i/o-handler threads, but the caller will
|
|
do the waking explicitly later, in this
|
|
way the caller can post several requests in
|
|
a batch; NOTE that the batch must not be
|
|
so big that it exhausts the slots in aio
|
|
arrays! NOTE that a simulated batch
|
|
may introduce hidden chances of deadlocks,
|
|
because i/os are not actually handled until
|
|
all have been posted: use with great
|
|
caution! */
|
|
char* name, /* in: name of the file or path as a
|
|
null-terminated string */
|
|
os_file_t file, /* in: handle to a file */
|
|
void* buf, /* in: buffer where to read or from which
|
|
to write */
|
|
ulint offset, /* in: least significant 32 bits of file
|
|
offset where to read or write */
|
|
ulint offset_high, /* in: most significant 32 bits of
|
|
offset */
|
|
ulint n, /* in: number of bytes to read or write */
|
|
void* message1,/* in: messages for the aio handler (these
|
|
can be used to identify a completed aio
|
|
operation); if mode is OS_AIO_SYNC, these
|
|
are ignored */
|
|
void* message2);
|
|
/****************************************************************************
|
|
Waits until there are no pending writes in os_aio_write_array. There can
|
|
be other, synchronous, pending writes. */
|
|
|
|
void
|
|
os_aio_wait_until_no_pending_writes(void);
|
|
/*=====================================*/
|
|
/**************************************************************************
|
|
Wakes up simulated aio i/o-handler threads if they have something to do. */
|
|
|
|
void
|
|
os_aio_simulated_wake_handler_threads(void);
|
|
/*=======================================*/
|
|
/**************************************************************************
|
|
This function can be called if one wants to post a batch of reads and
|
|
prefers an i/o-handler thread to handle them all at once later. You must
|
|
call os_aio_simulated_wake_handler_threads later to ensure the threads
|
|
are not left sleeping! */
|
|
|
|
void
|
|
os_aio_simulated_put_read_threads_to_sleep(void);
|
|
/*============================================*/
|
|
|
|
#ifdef WIN_ASYNC_IO
|
|
/**************************************************************************
|
|
This function is only used in Windows asynchronous i/o.
|
|
Waits for an aio operation to complete. This function is used to wait
|
|
for completed requests. The aio array of pending requests is divided
|
|
into segments. The thread specifies which segment or slot it wants to wait
|
|
for. NOTE: this function will also take care of freeing the aio slot,
|
|
therefore no other thread is allowed to do the freeing! */
|
|
|
|
ibool
|
|
os_aio_windows_handle(
|
|
/*==================*/
|
|
/* out: TRUE if the aio operation succeeded */
|
|
ulint segment, /* in: the number of the segment in the aio
|
|
arrays to wait for; segment 0 is the ibuf
|
|
i/o thread, segment 1 the log i/o thread,
|
|
then follow the non-ibuf read threads, and as
|
|
the last are the non-ibuf write threads; if
|
|
this is ULINT_UNDEFINED, then it means that
|
|
sync aio is used, and this parameter is
|
|
ignored */
|
|
ulint pos, /* this parameter is used only in sync aio:
|
|
wait for the aio slot at this position */
|
|
void** message1, /* out: the messages passed with the aio
|
|
request; note that also in the case where
|
|
the aio operation failed, these output
|
|
parameters are valid and can be used to
|
|
restart the operation, for example */
|
|
void** message2,
|
|
ulint* type); /* out: OS_FILE_WRITE or ..._READ */
|
|
#endif
|
|
|
|
/* Currently we do not use Posix async i/o */
|
|
#ifdef POSIX_ASYNC_IO
|
|
/**************************************************************************
|
|
This function is only used in Posix asynchronous i/o. Waits for an aio
|
|
operation to complete. */
|
|
|
|
ibool
|
|
os_aio_posix_handle(
|
|
/*================*/
|
|
/* out: TRUE if the aio operation succeeded */
|
|
ulint array_no, /* in: array number 0 - 3 */
|
|
void** message1, /* out: the messages passed with the aio
|
|
request; note that also in the case where
|
|
the aio operation failed, these output
|
|
parameters are valid and can be used to
|
|
restart the operation, for example */
|
|
void** message2);
|
|
#endif
|
|
/**************************************************************************
|
|
Does simulated aio. This function should be called by an i/o-handler
|
|
thread. */
|
|
|
|
ibool
|
|
os_aio_simulated_handle(
|
|
/*====================*/
|
|
/* out: TRUE if the aio operation succeeded */
|
|
ulint segment, /* in: the number of the segment in the aio
|
|
arrays to wait for; segment 0 is the ibuf
|
|
i/o thread, segment 1 the log i/o thread,
|
|
then follow the non-ibuf read threads, and as
|
|
the last are the non-ibuf write threads */
|
|
void** message1, /* out: the messages passed with the aio
|
|
request; note that also in the case where
|
|
the aio operation failed, these output
|
|
parameters are valid and can be used to
|
|
restart the operation, for example */
|
|
void** message2,
|
|
ulint* type); /* out: OS_FILE_WRITE or ..._READ */
|
|
/**************************************************************************
|
|
Validates the consistency of the aio system. */
|
|
|
|
ibool
|
|
os_aio_validate(void);
|
|
/*=================*/
|
|
/* out: TRUE if ok */
|
|
/**************************************************************************
|
|
Prints info of the aio arrays. */
|
|
|
|
void
|
|
os_aio_print(void);
|
|
/*==============*/
|
|
/**************************************************************************
|
|
Checks that all slots in the system have been freed, that is, there are
|
|
no pending io operations. */
|
|
|
|
ibool
|
|
os_aio_all_slots_free(void);
|
|
/*=======================*/
|
|
/* out: TRUE if all free */
|
|
#endif
|