mariadb/storage/bdb/os/os_open.c
2005-07-20 15:48:22 -07:00

412 lines
9.1 KiB
C

/*-
* See the file LICENSE for redistribution information.
*
* Copyright (c) 1997-2004
* Sleepycat Software. All rights reserved.
*
* $Id: os_open.c,v 11.60 2004/09/24 00:43:19 bostic Exp $
*/
#include "db_config.h"
#ifndef NO_SYSTEM_INCLUDES
#include <sys/types.h>
#include <sys/stat.h>
#ifdef HAVE_SYS_FCNTL_H
#include <sys/fcntl.h>
#endif
#include <fcntl.h>
#include <string.h>
#include <unistd.h>
#endif
#include "db_int.h"
static int __os_intermediate_dir __P((DB_ENV *, const char *));
static int __os_mkdir __P((DB_ENV *, const char *));
#ifdef HAVE_QNX
static int __os_region_open __P((DB_ENV *, const char *, int, int, DB_FH **));
#endif
/*
* __os_have_direct --
* Check to see if we support direct I/O.
*
* PUBLIC: int __os_have_direct __P((void));
*/
int
__os_have_direct()
{
int ret;
ret = 0;
#ifdef HAVE_O_DIRECT
ret = 1;
#endif
#if defined(HAVE_DIRECTIO) && defined(DIRECTIO_ON)
ret = 1;
#endif
return (ret);
}
/*
* __os_open --
* Open a file.
*
* PUBLIC: int __os_open
* PUBLIC: __P((DB_ENV *, const char *, u_int32_t, int, DB_FH **));
*/
int
__os_open(dbenv, name, flags, mode, fhpp)
DB_ENV *dbenv;
const char *name;
u_int32_t flags;
int mode;
DB_FH **fhpp;
{
return (__os_open_extend(dbenv, name, 0, flags, mode, fhpp));
}
/*
* __os_open_extend --
* Open a file descriptor (including page size and log size information).
*
* PUBLIC: int __os_open_extend __P((DB_ENV *,
* PUBLIC: const char *, u_int32_t, u_int32_t, int, DB_FH **));
*/
int
__os_open_extend(dbenv, name, page_size, flags, mode, fhpp)
DB_ENV *dbenv;
const char *name;
u_int32_t page_size, flags;
int mode;
DB_FH **fhpp;
{
DB_FH *fhp;
int oflags, ret;
COMPQUIET(page_size, 0);
*fhpp = NULL;
oflags = 0;
#define OKFLAGS \
(DB_OSO_CREATE | DB_OSO_DIRECT | DB_OSO_DSYNC | DB_OSO_EXCL | \
DB_OSO_LOG | DB_OSO_RDONLY | DB_OSO_REGION | DB_OSO_SEQ | \
DB_OSO_TEMP | DB_OSO_TRUNC)
if ((ret = __db_fchk(dbenv, "__os_open", flags, OKFLAGS)) != 0)
return (ret);
#if defined(O_BINARY)
/*
* If there's a binary-mode open flag, set it, we never want any
* kind of translation. Some systems do translations by default,
* e.g., with Cygwin, the default mode for an open() is set by the
* mode of the mount that underlies the file.
*/
oflags |= O_BINARY;
#endif
/*
* DB requires the POSIX 1003.1 semantic that two files opened at the
* same time with DB_OSO_CREATE/O_CREAT and DB_OSO_EXCL/O_EXCL flags
* set return an EEXIST failure in at least one.
*/
if (LF_ISSET(DB_OSO_CREATE))
oflags |= O_CREAT;
if (LF_ISSET(DB_OSO_EXCL))
oflags |= O_EXCL;
#ifdef HAVE_O_DIRECT
if (LF_ISSET(DB_OSO_DIRECT))
oflags |= O_DIRECT;
#endif
#ifdef O_DSYNC
if (LF_ISSET(DB_OSO_LOG) && LF_ISSET(DB_OSO_DSYNC))
oflags |= O_DSYNC;
#endif
if (LF_ISSET(DB_OSO_RDONLY))
oflags |= O_RDONLY;
else
oflags |= O_RDWR;
if (LF_ISSET(DB_OSO_TRUNC))
oflags |= O_TRUNC;
/*
* Undocumented feature: allow applications to create intermediate
* directories whenever a file is opened.
*/
if (dbenv != NULL &&
dbenv->dir_mode != 0 && LF_ISSET(DB_OSO_CREATE) &&
(ret = __os_intermediate_dir(dbenv, name)) != 0)
return (ret);
#ifdef HAVE_QNX
if (LF_ISSET(DB_OSO_REGION))
return (__os_qnx_region_open(dbenv, name, oflags, mode, fhpp));
#endif
/* Open the file. */
if ((ret = __os_openhandle(dbenv, name, oflags, mode, &fhp)) != 0)
return (ret);
#ifdef O_DSYNC
if (LF_ISSET(DB_OSO_LOG) && LF_ISSET(DB_OSO_DSYNC))
F_SET(fhp, DB_FH_NOSYNC);
#endif
#if defined(HAVE_DIRECTIO) && defined(DIRECTIO_ON)
/*
* The Solaris C library includes directio, but you have to set special
* compile flags to #define DIRECTIO_ON. Require both in order to call
* directio.
*/
if (LF_ISSET(DB_OSO_DIRECT))
(void)directio(fhp->fd, DIRECTIO_ON);
#endif
/*
* Delete any temporary file.
*
* !!!
* There's a race here, where we've created a file and we crash before
* we can unlink it. Temporary files aren't common in DB, regardless,
* it's not a security problem because the file is empty. There's no
* reasonable way to avoid the race (playing signal games isn't worth
* the portability nightmare), so we just live with it.
*/
if (LF_ISSET(DB_OSO_TEMP)) {
#if defined(HAVE_UNLINK_WITH_OPEN_FAILURE) || defined(CONFIG_TEST)
if ((ret = __os_strdup(dbenv, name, &fhp->name)) != 0) {
(void)__os_closehandle(dbenv, fhp);
(void)__os_unlink(dbenv, name);
return (ret);
}
F_SET(fhp, DB_FH_UNLINK);
#else
(void)__os_unlink(dbenv, name);
#endif
}
*fhpp = fhp;
return (0);
}
#ifdef HAVE_QNX
/*
* __os_qnx_region_open --
* Open a shared memory region file using POSIX shm_open.
*/
static int
__os_qnx_region_open(dbenv, name, oflags, mode, fhpp)
DB_ENV *dbenv;
const char *name;
int oflags;
int mode;
DB_FH **fhpp;
{
DB_FH *fhp;
int ret;
char *newname;
if ((ret = __os_calloc(dbenv, 1, sizeof(DB_FH), fhpp)) != 0)
return (ret);
fhp = *fhpp;
if ((ret = __os_shmname(dbenv, name, &newname)) != 0)
goto err;
/*
* Once we have created the object, we don't need the name
* anymore. Other callers of this will convert themselves.
*/
fhp->fd = shm_open(newname, oflags, mode);
__os_free(dbenv, newname);
if (fhp->fd == -1) {
ret = __os_get_errno();
goto err;
}
F_SET(fhp, DB_FH_OPENED);
#ifdef HAVE_FCNTL_F_SETFD
/* Deny file descriptor access to any child process. */
if (fcntl(fhp->fd, F_SETFD, 1) == -1) {
ret = __os_get_errno();
__db_err(dbenv, "fcntl(F_SETFD): %s", strerror(ret));
goto err;
}
#endif
err: if (ret != 0) {
(void)__os_closehandle(dbenv, fhp);
*fhpp = NULL;
}
return (ret);
}
/*
* __os_shmname --
* Translate a pathname into a shm_open memory object name.
*
* PUBLIC: #ifdef HAVE_QNX
* PUBLIC: int __os_shmname __P((DB_ENV *, const char *, char **));
* PUBLIC: #endif
*/
int
__os_shmname(dbenv, name, newnamep)
DB_ENV *dbenv;
const char *name;
char **newnamep;
{
int ret;
size_t size;
char *p, *q, *tmpname;
*newnamep = NULL;
/*
* POSIX states that the name for a shared memory object
* may begin with a slash '/' and support for subsequent
* slashes is implementation-dependent. The one implementation
* we know of right now, QNX, forbids subsequent slashes.
* We don't want to be parsing pathnames for '.' and '..' in
* the middle. In order to allow easy conversion, just take
* the last component as the shared memory name. This limits
* the namespace a bit, but makes our job a lot easier.
*
* We should not be modifying user memory, so we use our own.
* Caller is responsible for freeing the memory we give them.
*/
if ((ret = __os_strdup(dbenv, name, &tmpname)) != 0)
return (ret);
/*
* Skip over filename component.
* We set that separator to '\0' so that we can do another
* __db_rpath. However, we immediately set it then to ':'
* so that we end up with the tailing directory:filename.
* We require a home directory component. Return an error
* if there isn't one.
*/
p = __db_rpath(tmpname);
if (p == NULL)
return (EINVAL);
if (p != tmpname) {
*p = '\0';
q = p;
p = __db_rpath(tmpname);
*q = ':';
}
if (p != NULL) {
/*
* If we have a path component, copy and return it.
*/
ret = __os_strdup(dbenv, p, newnamep);
__os_free(dbenv, tmpname);
return (ret);
}
/*
* We were given just a directory name with no path components.
* Add a leading slash, and copy the remainder.
*/
size = strlen(tmpname) + 2;
if ((ret = __os_malloc(dbenv, size, &p)) != 0)
return (ret);
p[0] = '/';
memcpy(&p[1], tmpname, size-1);
__os_free(dbenv, tmpname);
*newnamep = p;
return (0);
}
#endif
/*
* __os_intermediate_dir --
* Create intermediate directories.
*/
static int
__os_intermediate_dir(dbenv, name)
DB_ENV *dbenv;
const char *name;
{
size_t len;
int ret;
char savech, *p, *t, buf[128];
ret = 0;
/*
* Get a copy so we can modify the string.
*
* Allocate memory if temporary space is too small.
*/
if ((len = strlen(name)) > sizeof(buf) - 1) {
if ((ret = __os_umalloc(dbenv, len, &t)) != 0)
return (ret);
} else
t = buf;
(void)strcpy(t, name);
/*
* Cycle through the path, creating intermediate directories.
*
* Skip the first byte if it's a path separator, it's the start of an
* absolute pathname.
*/
if (PATH_SEPARATOR[1] == '\0') {
for (p = t + 1; p[0] != '\0'; ++p)
if (p[0] == PATH_SEPARATOR[0]) {
savech = *p;
*p = '\0';
if (__os_exists(t, NULL) &&
(ret = __os_mkdir(dbenv, t)) != 0)
break;
*p = savech;
}
} else
for (p = t + 1; p[0] != '\0'; ++p)
if (strchr(PATH_SEPARATOR, p[0]) != NULL) {
savech = *p;
*p = '\0';
if (__os_exists(t, NULL) &&
(ret = __os_mkdir(dbenv, t)) != 0)
break;
*p = savech;
}
if (t != buf)
__os_free(dbenv, t);
return (ret);
}
/*
* __os_mkdir --
* Create a directory.
*/
static int
__os_mkdir(dbenv, name)
DB_ENV *dbenv;
const char *name;
{
int ret;
/* Make the directory, with paranoid permissions. */
#ifdef HAVE_VXWORKS
RETRY_CHK((mkdir((char *)name)), ret);
#else
RETRY_CHK((mkdir(name, 0600)), ret);
if (ret != 0)
return (ret);
/* Set the absolute permissions. */
RETRY_CHK((chmod(name, dbenv->dir_mode)), ret);
#endif
return (ret);
}