2011-06-30 17:37:13 +02:00
|
|
|
/*
|
2012-01-13 15:50:02 +01:00
|
|
|
Copyright (c) 2003, 2011, Oracle and/or its affiliates
|
2003-11-02 15:55:02 +02:00
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU General Public License as published by
|
2006-12-23 20:17:15 +01:00
|
|
|
the Free Software Foundation; version 2 of the License.
|
2003-11-02 15:55:02 +02:00
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
|
|
along with this program; if not, write to the Free Software
|
2011-06-30 17:46:53 +02:00
|
|
|
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */
|
2003-11-02 15:55:02 +02:00
|
|
|
|
|
|
|
#include "mysys_priv.h"
|
|
|
|
#include "mysys_err.h"
|
|
|
|
#include <errno.h>
|
|
|
|
|
2011-07-02 22:08:51 +02:00
|
|
|
|
2010-03-09 21:22:24 +02:00
|
|
|
ulong my_sync_count; /* Count number of sync calls */
|
|
|
|
|
2010-10-28 18:27:25 +02:00
|
|
|
static void (*before_sync_wait)(void)= 0;
|
|
|
|
static void (*after_sync_wait)(void)= 0;
|
|
|
|
|
|
|
|
void thr_set_sync_wait_callback(void (*before_wait)(void),
|
|
|
|
void (*after_wait)(void))
|
|
|
|
{
|
|
|
|
before_sync_wait= before_wait;
|
|
|
|
after_sync_wait= after_wait;
|
|
|
|
}
|
|
|
|
|
2003-11-02 15:55:02 +02:00
|
|
|
/*
|
|
|
|
Sync data in file to disk
|
|
|
|
|
|
|
|
SYNOPSIS
|
|
|
|
my_sync()
|
|
|
|
fd File descritor to sync
|
|
|
|
my_flags Flags (now only MY_WME is supported)
|
|
|
|
|
|
|
|
NOTE
|
2005-04-05 13:17:49 +02:00
|
|
|
If file system supports its, only file data is synced, not inode data.
|
|
|
|
|
|
|
|
MY_IGNORE_BADFD is useful when fd is "volatile" - not protected by a
|
|
|
|
mutex. In this case by the time of fsync(), fd may be already closed by
|
|
|
|
another thread, or even reassigned to a different file. With this flag -
|
|
|
|
MY_IGNORE_BADFD - such a situation will not be considered an error.
|
|
|
|
(which is correct behaviour, if we know that the other thread synced the
|
|
|
|
file before closing)
|
2003-11-02 15:55:02 +02:00
|
|
|
|
2012-08-30 10:53:49 +02:00
|
|
|
MY_SYNC_FILESIZE is useful when syncing a file after it has been extended.
|
|
|
|
On Linux, fdatasync() on ext3/ext4 file systems does not properly flush
|
|
|
|
to disk the inode data required to preserve the added data across a crash
|
|
|
|
(this looks to be a bug). But when a file is extended, inode data will most
|
|
|
|
likely need flushing in any case, so passing MY_SYNC_FILESIZE as flags
|
|
|
|
is not likely to be any slower, and will be crash safe on Linux ext3/ext4.
|
|
|
|
|
2003-11-02 15:55:02 +02:00
|
|
|
RETURN
|
|
|
|
0 ok
|
|
|
|
-1 error
|
|
|
|
*/
|
|
|
|
|
|
|
|
int my_sync(File fd, myf my_flags)
|
|
|
|
{
|
|
|
|
int res;
|
|
|
|
DBUG_ENTER("my_sync");
|
2011-07-02 22:08:51 +02:00
|
|
|
|
2007-12-18 03:21:32 +02:00
|
|
|
DBUG_PRINT("my",("fd: %d my_flags: %d", fd, my_flags));
|
2003-11-02 15:55:02 +02:00
|
|
|
|
2010-08-09 20:05:42 +03:00
|
|
|
if (my_disable_sync)
|
|
|
|
DBUG_RETURN(0);
|
2003-11-02 15:55:02 +02:00
|
|
|
|
2010-03-09 21:22:24 +02:00
|
|
|
statistic_increment(my_sync_count,&THR_LOCK_open);
|
2011-07-02 22:08:51 +02:00
|
|
|
|
2003-11-02 15:55:02 +02:00
|
|
|
DBUG_PRINT("my",("Fd: %d my_flags: %d", fd, my_flags));
|
|
|
|
|
2011-03-04 12:42:20 +01:00
|
|
|
if (before_sync_wait)
|
|
|
|
(*before_sync_wait)();
|
2011-07-02 22:08:51 +02:00
|
|
|
|
2005-01-11 00:14:46 +01:00
|
|
|
do
|
|
|
|
{
|
2007-10-11 18:07:40 +03:00
|
|
|
#if defined(F_FULLFSYNC)
|
|
|
|
/*
|
|
|
|
In Mac OS X >= 10.3 this call is safer than fsync() (it forces the
|
|
|
|
disk's cache and guarantees ordered writes).
|
|
|
|
*/
|
|
|
|
if (!(res= fcntl(fd, F_FULLFSYNC, 0)))
|
|
|
|
break; /* ok */
|
|
|
|
/* Some file systems don't support F_FULLFSYNC and fail above: */
|
|
|
|
DBUG_PRINT("info",("fcntl(F_FULLFSYNC) failed, falling back"));
|
|
|
|
#endif
|
2010-10-19 14:48:03 -02:00
|
|
|
#if defined(HAVE_FDATASYNC) && HAVE_DECL_FDATASYNC
|
2012-08-30 10:53:49 +02:00
|
|
|
if (!(my_flags & MY_SYNC_FILESIZE))
|
|
|
|
res= fdatasync(fd);
|
|
|
|
else
|
|
|
|
{
|
|
|
|
#endif
|
|
|
|
#if defined(HAVE_FSYNC)
|
2005-01-11 00:14:46 +01:00
|
|
|
res= fsync(fd);
|
2010-08-10 19:06:34 +03:00
|
|
|
if (res == -1 && errno == ENOLCK)
|
2010-08-09 20:54:58 +03:00
|
|
|
res= 0; /* Result Bug in Old FreeBSD */
|
This is the downport of
Bug#24509 - 2048 file descriptor limit on windows needs increasing, also
WL#3049 - improved Windows I/O
The patch replaces the use of the POSIX I/O interfaces in mysys on Windows with
the Win32 API calls (CreateFile, WriteFile, etc). The Windows HANDLE for the open
file is stored in the my_file_info struct, along with a flag for append mode
because the Windows API does not support opening files in append mode in all cases)
The default max open files has been increased to 16384 and can be increased further
by setting --max-open-files=<value> during the server start.
Another major change in this patch that almost all Windows specific file IO code
has been moved to a new file my_winfile.c, greatly reducing the amount of code
in #ifdef blocks within mysys, thus improving readability.
Minor enhancements:
- my_(f)stat() is changed to use __stati64 structure with 64 file size
and timestamps. It will return correct file size now (C runtime implementation
used to report outdated information)
- my_lock on Windows is prepared to handle additional timeout parameter
- after review : changed __WIN__ to _WIN32 in the new and changed code.
client/mysqlbinlog.cc:
fileno -> my_fileno
client/readline.cc:
fileno -> my_fileno
include/config-win.h:
Increase OS_FILE_LIMIT for Windows.
Remove O_SHARE - Windows does not support it. Its definition conflicts with
O_SHORT_LIVED, that has different semantics.
include/my_dir.h:
Use stat64 for stat() family of functions on Windows, because of 64 bit file size.
include/my_global.h:
Increased default value for open file limit to 16K
include/my_sys.h:
- my_file_info got new structure members - file handle and open flags
- 2 new Windows-only mysys functions : my_get_osfhandle and my_osmaperr,
modelled after Windows C runtime functions _get_osfhandle and _dosmaperr
libmysql/CMakeLists.txt:
new files my_winfile.c and my_winerr.c
mysql-test/suite/large_tests/r/lock_tables_big.result:
test for more then 2048 open file descriptors on Windows
mysql-test/suite/large_tests/t/lock_tables_big.test:
test for more then 2048 open file descriptors on Windows
mysys/CMakeLists.txt:
new files my_winfile.c and my_winerr.c
mysys/Makefile.am:
new files my_winfile.c and my_winerr.c
mysys/default_modify.c:
fileno -> my_fileno
mysys/my_chsize.c:
implementation of chsize on Windows now moved to my_winfile.c
mysys/my_create.c:
- my_sopen->my_win_open
- close open file before removing (won't generally work on Windows otherwise)
mysys/my_file.c:
On Windows, files returned by my_open will not start with 0, but 2048
(making it simple to detect incompatible mix of CRT and mysys io functions)
mysys/my_fopen.c:
fileno->my_win_fileno , fclose->my_win_fclose, fdopen->my_win_fdopen
Check for legal filename is done by my_win_[f]open functions
mysys/my_fstream.c:
fileno->my_fileno
mysys/my_lib.c:
Windows stat() functions are moved to my_winfile.c
mysys/my_lock.c:
Move Windows code under #ifdef to a separate function win_lock().
Add a parameter for lock wait timeout
mysys/my_mmap.c:
_get_osfhandle->my_get_osfhandle
mysys/my_open.c:
my_sopen->my_win_open (simpler interface)
mysys/my_pread.c:
moved most windows specific code to my_win_file.c
Use my_win_pread
mysys/my_quick.c:
Use my_win_read/my_win_write
mysys/my_read.c:
Moved most of windows specific code to my_win_file.c
Use my_win_read()
mysys/my_seek.c:
On Windows, use my_win_lseek() in my_seek()/my_tell()
Removed dead code (synchronization of lseeks)
Improved DBUG tracing (file position is ulonglong, not ulong)
mysys/my_static.c:
Removed array initialization. my_file_info_default is global variable
thus it is initialized with all zeros anyway
mysys/my_sync.c:
_commit->my_win_fsync
mysys/my_winerr.c:
New file my_winerr.c
Exports my_osmaperr modelled after undocumented C runtime
function _dosmaperr(). The problem with _dosmaperr() used previously is that
1) it is nowhere documented and thus code relying on it is not guaranteed to work
in subsequent releases on the C runtime
2) it is present only in static C runtime (mysqld does not link if compiled with
/MD)
mysys/my_winfile.c:
New file my_winfile.c
Implements ANSI/Posix file IO routines, when possible using native Windows IO, without
C runtime (C runtime dropped because of the 2048 file descriptor limit).
mysys/my_write.c:
write->my_win_write
mysys/mysys_priv.h:
Declaration of Windows Posix functions (private to mysys, shall not be visible
outside)
storage/innobase/handler/ha_innodb.cc:
mysys native Windows IO : correct innodb tmp file handling
mysql_tmpfile does not return valid CRT file descriptor, thus
it is not possible to dup() it. Instead, the native file handle has
to be duplicated and then converted to CRT descriptor.
storage/myisam/mi_locking.c:
_commit->my_sync
2009-09-11 22:26:35 +02:00
|
|
|
#elif defined(_WIN32)
|
|
|
|
res= my_win_fsync(fd);
|
2003-11-02 15:55:02 +02:00
|
|
|
#else
|
2007-10-11 18:07:40 +03:00
|
|
|
#error Cannot find a way to sync a file, durability in danger
|
2005-01-11 00:14:46 +01:00
|
|
|
res= 0; /* No sync (strange OS) */
|
2012-08-30 10:53:49 +02:00
|
|
|
#endif
|
|
|
|
#if defined(HAVE_FDATASYNC) && HAVE_DECL_FDATASYNC
|
|
|
|
}
|
2003-11-02 15:55:02 +02:00
|
|
|
#endif
|
2005-01-11 00:14:46 +01:00
|
|
|
} while (res == -1 && errno == EINTR);
|
|
|
|
|
2003-11-02 15:55:02 +02:00
|
|
|
if (res)
|
|
|
|
{
|
2005-04-05 13:17:49 +02:00
|
|
|
int er= errno;
|
|
|
|
if (!(my_errno= er))
|
|
|
|
my_errno= -1; /* Unknown error */
|
2010-10-28 18:27:25 +02:00
|
|
|
if (after_sync_wait)
|
|
|
|
(*after_sync_wait)();
|
2005-04-06 19:43:35 +03:00
|
|
|
if ((my_flags & MY_IGNORE_BADFD) &&
|
2005-04-05 13:17:49 +02:00
|
|
|
(er == EBADF || er == EINVAL || er == EROFS))
|
2007-10-11 18:07:40 +03:00
|
|
|
{
|
|
|
|
DBUG_PRINT("info", ("ignoring errno %d", er));
|
2005-04-05 13:17:49 +02:00
|
|
|
res= 0;
|
2007-10-11 18:07:40 +03:00
|
|
|
}
|
2005-04-05 13:17:49 +02:00
|
|
|
else if (my_flags & MY_WME)
|
2003-11-02 15:55:02 +02:00
|
|
|
my_error(EE_SYNC, MYF(ME_BELL+ME_WAITTANG), my_filename(fd), my_errno);
|
|
|
|
}
|
2010-10-28 18:27:25 +02:00
|
|
|
else
|
|
|
|
{
|
|
|
|
if (after_sync_wait)
|
|
|
|
(*after_sync_wait)();
|
|
|
|
}
|
2003-11-02 15:55:02 +02:00
|
|
|
DBUG_RETURN(res);
|
2005-04-05 13:17:49 +02:00
|
|
|
} /* my_sync */
|
|
|
|
|
2007-10-11 18:07:40 +03:00
|
|
|
|
|
|
|
static const char cur_dir_name[]= {FN_CURLIB, 0};
|
2010-10-19 11:49:31 -02:00
|
|
|
|
2007-10-11 18:07:40 +03:00
|
|
|
/*
|
|
|
|
Force directory information to disk.
|
|
|
|
|
|
|
|
SYNOPSIS
|
|
|
|
my_sync_dir()
|
|
|
|
dir_name the name of the directory
|
|
|
|
my_flags flags (MY_WME etc)
|
|
|
|
|
|
|
|
RETURN
|
|
|
|
0 if ok, !=0 if error
|
|
|
|
*/
|
2010-10-19 11:49:31 -02:00
|
|
|
|
2010-01-06 23:27:53 +02:00
|
|
|
int my_sync_dir(const char *dir_name __attribute__((unused)),
|
|
|
|
myf my_flags __attribute__((unused)))
|
2007-10-11 18:07:40 +03:00
|
|
|
{
|
2006-11-22 23:38:10 +01:00
|
|
|
#ifdef NEED_EXPLICIT_SYNC_DIR
|
2007-10-11 18:07:40 +03:00
|
|
|
File dir_fd;
|
|
|
|
int res= 0;
|
|
|
|
const char *correct_dir_name;
|
2009-11-25 16:48:29 +01:00
|
|
|
DBUG_ENTER("my_sync_dir");
|
|
|
|
DBUG_PRINT("my",("Dir: '%s' my_flags: %d", dir_name, my_flags));
|
2007-10-11 18:07:40 +03:00
|
|
|
/* Sometimes the path does not contain an explicit directory */
|
|
|
|
correct_dir_name= (dir_name[0] == 0) ? cur_dir_name : dir_name;
|
|
|
|
/*
|
|
|
|
Syncing a dir may give EINVAL on tmpfs on Linux, which is ok.
|
|
|
|
EIO on the other hand is very important. Hence MY_IGNORE_BADFD.
|
|
|
|
*/
|
|
|
|
if ((dir_fd= my_open(correct_dir_name, O_RDONLY, MYF(my_flags))) >= 0)
|
|
|
|
{
|
|
|
|
if (my_sync(dir_fd, MYF(my_flags | MY_IGNORE_BADFD)))
|
|
|
|
res= 2;
|
|
|
|
if (my_close(dir_fd, MYF(my_flags)))
|
|
|
|
res= 3;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
res= 1;
|
|
|
|
DBUG_RETURN(res);
|
2006-11-22 23:38:10 +01:00
|
|
|
#else
|
2007-10-11 18:07:40 +03:00
|
|
|
return 0;
|
2006-11-21 22:22:59 +01:00
|
|
|
#endif
|
2007-10-11 18:07:40 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
Force directory information to disk.
|
|
|
|
|
|
|
|
SYNOPSIS
|
|
|
|
my_sync_dir_by_file()
|
|
|
|
file_name the name of a file in the directory
|
|
|
|
my_flags flags (MY_WME etc)
|
|
|
|
|
|
|
|
RETURN
|
|
|
|
0 if ok, !=0 if error
|
|
|
|
*/
|
2010-10-19 11:49:31 -02:00
|
|
|
|
2010-01-06 23:27:53 +02:00
|
|
|
int my_sync_dir_by_file(const char *file_name __attribute__((unused)),
|
|
|
|
myf my_flags __attribute__((unused)))
|
2007-10-11 18:07:40 +03:00
|
|
|
{
|
2006-11-22 23:38:10 +01:00
|
|
|
#ifdef NEED_EXPLICIT_SYNC_DIR
|
2007-10-11 18:07:40 +03:00
|
|
|
char dir_name[FN_REFLEN];
|
|
|
|
size_t dir_name_length;
|
|
|
|
dirname_part(dir_name, file_name, &dir_name_length);
|
|
|
|
return my_sync_dir(dir_name, my_flags);
|
2006-11-22 23:38:10 +01:00
|
|
|
#else
|
2007-10-11 18:07:40 +03:00
|
|
|
return 0;
|
2006-11-21 22:22:59 +01:00
|
|
|
#endif
|
2007-10-11 18:07:40 +03:00
|
|
|
}
|