mariadb/storage/bdb/os_win32/os_open.c
2005-07-20 15:48:22 -07:00

228 lines
5.8 KiB
C

/*-
* See the file LICENSE for redistribution information.
*
* Copyright (c) 1997-2004
* Sleepycat Software. All rights reserved.
*
* $Id: os_open.c,v 11.37 2004/10/05 14:55:35 mjc Exp $
*/
#include "db_config.h"
#ifndef NO_SYSTEM_INCLUDES
#include <sys/types.h>
#include <fcntl.h>
#include <signal.h>
#include <string.h>
#include <unistd.h>
#endif
#include "db_int.h"
/*
* __os_have_direct --
* Check to see if we support direct I/O.
*
* PUBLIC: int __os_have_direct __P((void));
*/
int
__os_have_direct()
{
return (1);
}
/*
* __os_open --
* Open a file descriptor.
*/
__os_open(dbenv, name, flags, mode, fhpp)
DB_ENV *dbenv;
const char *name;
u_int32_t flags;
int mode;
DB_FH **fhpp;
{
return (__os_open_extend(dbenv, name, 0, flags, mode, fhpp));
}
/*
* __os_open_extend --
* Open a file descriptor (including page size and log size information).
*/
int
__os_open_extend(dbenv, name, page_size, flags, mode, fhpp)
DB_ENV *dbenv;
const char *name;
u_int32_t page_size, flags;
int mode;
DB_FH **fhpp;
{
DB_FH *fhp;
DWORD cluster_size, sector_size, free_clusters, total_clusters;
int access, attr, createflag, nrepeat, oflags, ret, share;
_TCHAR *drive, *tname;
_TCHAR dbuf[4]; /* <letter><colon><slash><nul> */
fhp = NULL;
tname = NULL;
#define OKFLAGS \
(DB_OSO_CREATE | DB_OSO_DIRECT | DB_OSO_DSYNC | DB_OSO_EXCL | \
DB_OSO_LOG | DB_OSO_RDONLY | DB_OSO_REGION | DB_OSO_SEQ | \
DB_OSO_TEMP | DB_OSO_TRUNC)
if ((ret = __db_fchk(dbenv, "__os_open", flags, OKFLAGS)) != 0)
return (ret);
/*
* The "public" interface to the __os_open routine passes around POSIX
* 1003.1 flags, not DB flags. If the user has defined their own open
* interface, use the POSIX flags.
*/
if (DB_GLOBAL(j_open) != NULL) {
oflags = O_BINARY | O_NOINHERIT;
if (LF_ISSET(DB_OSO_CREATE))
oflags |= O_CREAT;
#ifdef O_DSYNC
if (LF_ISSET(DB_OSO_LOG) && LF_ISSET(DB_OSO_DSYNC))
oflags |= O_DSYNC;
#endif
if (LF_ISSET(DB_OSO_EXCL))
oflags |= O_EXCL;
if (LF_ISSET(DB_OSO_RDONLY))
oflags |= O_RDONLY;
else
oflags |= O_RDWR;
if (LF_ISSET(DB_OSO_SEQ))
oflags |= _O_SEQUENTIAL;
else
oflags |= _O_RANDOM;
if (LF_ISSET(DB_OSO_TEMP))
oflags |= _O_TEMPORARY;
if (LF_ISSET(DB_OSO_TRUNC))
oflags |= O_TRUNC;
return (__os_openhandle(dbenv, name, oflags, mode, fhpp));
}
TO_TSTRING(dbenv, name, tname, ret);
if (ret != 0)
goto err;
if ((ret = __os_calloc(dbenv, 1, sizeof(DB_FH), &fhp)) != 0)
goto err;
/*
* Otherwise, use the Windows/32 CreateFile interface so that we can
* play magic games with log files to get data flush effects similar
* to the POSIX O_DSYNC flag.
*
* !!!
* We currently ignore the 'mode' argument. It would be possible
* to construct a set of security attributes that we could pass to
* CreateFile that would accurately represents the mode. In worst
* case, this would require looking up user and all group names and
* creating an entry for each. Alternatively, we could call the
* _chmod (partial emulation) function after file creation, although
* this leaves us with an obvious race. However, these efforts are
* largely meaningless on FAT, the most common file system, which
* only has a "readable" and "writeable" flag, applying to all users.
*/
access = GENERIC_READ;
if (!LF_ISSET(DB_OSO_RDONLY))
access |= GENERIC_WRITE;
share = FILE_SHARE_READ | FILE_SHARE_WRITE;
attr = FILE_ATTRIBUTE_NORMAL;
/*
* Reproduce POSIX 1003.1 semantics: if O_CREATE and O_EXCL are both
* specified, fail, returning EEXIST, unless we create the file.
*/
if (LF_ISSET(DB_OSO_CREATE) && LF_ISSET(DB_OSO_EXCL))
createflag = CREATE_NEW; /* create only if !exist*/
else if (!LF_ISSET(DB_OSO_CREATE) && LF_ISSET(DB_OSO_TRUNC))
createflag = TRUNCATE_EXISTING; /* truncate, fail if !exist */
else if (LF_ISSET(DB_OSO_TRUNC))
createflag = CREATE_ALWAYS; /* create and truncate */
else if (LF_ISSET(DB_OSO_CREATE))
createflag = OPEN_ALWAYS; /* open or create */
else
createflag = OPEN_EXISTING; /* open only if existing */
if (LF_ISSET(DB_OSO_LOG) && LF_ISSET(DB_OSO_DSYNC)) {
F_SET(fhp, DB_FH_NOSYNC);
attr |= FILE_FLAG_WRITE_THROUGH;
}
if (LF_ISSET(DB_OSO_SEQ))
attr |= FILE_FLAG_SEQUENTIAL_SCAN;
else
attr |= FILE_FLAG_RANDOM_ACCESS;
if (LF_ISSET(DB_OSO_TEMP))
attr |= FILE_FLAG_DELETE_ON_CLOSE;
/*
* We can turn filesystem buffering off if the page size is a
* multiple of the disk's sector size. To find the sector size,
* we call GetDiskFreeSpace, which expects a drive name like "d:\\"
* or NULL for the current disk (i.e., a relative path)
*/
if (LF_ISSET(DB_OSO_DIRECT) && page_size != 0 && name[0] != '\0') {
if (name[1] == ':') {
drive = dbuf;
_sntprintf(dbuf, sizeof(dbuf), _T("%c:\\"), tname[0]);
} else
drive = NULL;
/*
* We ignore all results except sectorsize, but some versions
* of Windows require that the parameters are non-NULL.
*/
if (GetDiskFreeSpace(drive, &cluster_size,
&sector_size, &free_clusters, &total_clusters) &&
page_size % sector_size == 0)
attr |= FILE_FLAG_NO_BUFFERING;
}
for (nrepeat = 1;; ++nrepeat) {
fhp->handle =
CreateFile(tname, access, share, NULL, createflag, attr, 0);
if (fhp->handle == INVALID_HANDLE_VALUE) {
/*
* If it's a "temporary" error, we retry up to 3 times,
* waiting up to 12 seconds. While it's not a problem
* if we can't open a database, an inability to open a
* log file is cause for serious dismay.
*/
ret = __os_get_errno();
if ((ret != ENFILE && ret != EMFILE && ret != ENOSPC) ||
nrepeat > 3)
goto err;
__os_sleep(dbenv, nrepeat * 2, 0);
} else
break;
}
FREE_STRING(dbenv, tname);
F_SET(fhp, DB_FH_OPENED);
*fhpp = fhp;
return (0);
err: if (ret == 0)
ret = __os_get_errno();
FREE_STRING(dbenv, tname);
if (fhp != NULL)
(void)__os_closehandle(dbenv, fhp);
return (ret);
}