mariadb/bdb/db/crdel_rec.c
tim@threads.polyesthetic.msg 89dad52004 Import changeset
2001-03-04 19:42:05 -05:00

646 lines
16 KiB
C

/*-
* See the file LICENSE for redistribution information.
*
* Copyright (c) 1996, 1997, 1998, 1999, 2000
* Sleepycat Software. All rights reserved.
*/
#include "db_config.h"
#ifndef lint
static const char revid[] = "$Id: crdel_rec.c,v 11.43 2000/12/13 08:06:34 krinsky Exp $";
#endif /* not lint */
#ifndef NO_SYSTEM_INCLUDES
#include <sys/types.h>
#include <string.h>
#endif
#include "db_int.h"
#include "db_page.h"
#include "log.h"
#include "hash.h"
#include "mp.h"
#include "db_dispatch.h"
/*
* __crdel_fileopen_recover --
* Recovery function for fileopen.
*
* PUBLIC: int __crdel_fileopen_recover
* PUBLIC: __P((DB_ENV *, DBT *, DB_LSN *, db_recops, void *));
*/
int
__crdel_fileopen_recover(dbenv, dbtp, lsnp, op, info)
DB_ENV *dbenv;
DBT *dbtp;
DB_LSN *lsnp;
db_recops op;
void *info;
{
__crdel_fileopen_args *argp;
DBMETA ondisk;
DB_FH fh;
size_t nr;
int do_unlink, ret;
u_int32_t b, mb, io;
char *real_name;
COMPQUIET(info, NULL);
real_name = NULL;
REC_PRINT(__crdel_fileopen_print);
if ((ret = __crdel_fileopen_read(dbenv, dbtp->data, &argp)) != 0)
goto out;
/*
* If this is an in-memory database, then the name is going to
* be NULL, which looks like a 0-length name in recovery.
*/
if (argp->name.size == 0)
goto done;
if ((ret = __db_appname(dbenv, DB_APP_DATA,
NULL, argp->name.data, 0, NULL, &real_name)) != 0)
goto out;
if (DB_REDO(op)) {
/*
* The create commited, so we need to make sure that the file
* exists. A simple open should suffice.
*/
if ((ret = __os_open(dbenv, real_name,
DB_OSO_CREATE, argp->mode, &fh)) != 0)
goto out;
if ((ret = __os_closehandle(&fh)) != 0)
goto out;
} else if (DB_UNDO(op)) {
/*
* If the file is 0-length then it was in the process of being
* created, so we should unlink it. If it is non-0 length, then
* either someone else created it and we need to leave it
* untouched or we were in the process of creating it, allocated
* the first page on a system that requires you to actually
* write pages as you allocate them, but never got any data
* on it.
* If the file doesn't exist, we never got around to creating
* it, so that's fine.
*/
if (__os_exists(real_name, NULL) != 0)
goto done;
if ((ret = __os_open(dbenv, real_name, 0, 0, &fh)) != 0)
goto out;
if ((ret = __os_ioinfo(dbenv,
real_name, &fh, &mb, &b, &io)) != 0)
goto out;
do_unlink = 0;
if (mb != 0 || b != 0) {
/*
* We need to read the first page
* to see if its got valid data on it.
*/
if ((ret = __os_read(dbenv, &fh,
&ondisk, sizeof(ondisk), &nr)) != 0 ||
nr != sizeof(ondisk))
goto out;
if (ondisk.magic == 0)
do_unlink = 1;
}
if ((ret = __os_closehandle(&fh)) != 0)
goto out;
/* Check for 0-length and if it is, delete it. */
if (do_unlink || (mb == 0 && b == 0))
if ((ret = __os_unlink(dbenv, real_name)) != 0)
goto out;
}
done: *lsnp = argp->prev_lsn;
ret = 0;
out: if (argp != NULL)
__os_free(argp, 0);
if (real_name != NULL)
__os_freestr(real_name);
return (ret);
}
/*
 * __crdel_metasub_recover --
 *	Recovery function for metasub.
 *
 *	Fetches the page named by the log record (argp->pgno) from the memory
 *	pool file and brings it in line with the requested operation:
 *	  redo	if the page LSN equals the LSN stored in the record
 *		(argp->lsn), copy the logged page image over the page and
 *		stamp it with *lsnp;
 *	  undo	reset the page LSN to argp->lsn.
 *	After a redo that wrote a hash, btree or queue meta-data page the
 *	file is reopened through __log_reopen_file.
 *
 *	dbenv	environment handle.
 *	dbtp	log record.
 *	lsnp	in: LSN written onto the page during redo;
 *		out: set to argp->prev_lsn on success.
 *	op	recovery operation, tested with DB_REDO/DB_UNDO.
 *	info	unused.
 *
 *	NOTE(review): REC_PRINT, REC_INTRO, CHECK_LSN and REC_CLOSE are macros
 *	defined outside this file.  argp, file_dbp, dbc and mpf are never
 *	assigned in the visible code, so REC_INTRO presumably sets them (and
 *	may jump to "done" or "out"), and REC_CLOSE presumably performs the
 *	cleanup and the return -- confirm against the macro definitions before
 *	renaming any local or label here.
 *
 * PUBLIC: int __crdel_metasub_recover
 * PUBLIC: __P((DB_ENV *, DBT *, DB_LSN *, db_recops, void *));
 */
int
__crdel_metasub_recover(dbenv, dbtp, lsnp, op, info)
DB_ENV *dbenv;
DBT *dbtp;
DB_LSN *lsnp;
db_recops op;
void *info;
{
__crdel_metasub_args *argp;
DB *file_dbp;
DBC *dbc;
DB_MPOOLFILE *mpf;
PAGE *pagep;
u_int8_t *file_uid, ptype;
int cmp_p, modified, reopen, ret;
COMPQUIET(info, NULL);
REC_PRINT(__crdel_metasub_print);
REC_INTRO(__crdel_metasub_read, 0);
/*
 * Try to get the page as it is.  If that fails: on redo, retry with
 * DB_MPOOL_CREATE so the page can be written; otherwise there is
 * nothing to undo, so report success and skip straight to cleanup.
 */
if ((ret = memp_fget(mpf, &argp->pgno, 0, &pagep)) != 0) {
if (DB_REDO(op)) {
if ((ret = memp_fget(mpf,
&argp->pgno, DB_MPOOL_CREATE, &pagep)) != 0)
goto out;
} else {
*lsnp = argp->prev_lsn;
ret = 0;
goto out;
}
}
modified = 0;
reopen = 0;
/* Compare the LSN on the page with the LSN stored in the log record. */
cmp_p = log_compare(&LSN(pagep), &argp->lsn);
CHECK_LSN(op, cmp_p, &LSN(pagep), &argp->lsn);
if (cmp_p == 0 && DB_REDO(op)) {
/* Redo: install the logged page image and stamp it with this LSN. */
memcpy(pagep, argp->page.data, argp->page.size);
LSN(pagep) = *lsnp;
modified = 1;
/*
 * If this is a meta-data page, then we must reopen;
 * if it was a root page, then we do not.
 */
ptype = ((DBMETA *)argp->page.data)->type;
if (ptype == P_HASHMETA || ptype == P_BTREEMETA ||
ptype == P_QAMMETA)
reopen = 1;
} else if (DB_UNDO(op)) {
/*
 * We want to undo this page creation.  The page creation
 * happened in two parts.  First, we called __bam_new which
 * was logged separately.  Then we wrote the meta-data onto
 * the page.  So long as we restore the LSN, then the recovery
 * for __bam_new will do everything else.
 * Don't bother checking the lsn on the page.  If we
 * are rolling back the next thing is that this page
 * will get freed.  Opening the subdb will have reinitialized
 * the page, but not the lsn.
 */
LSN(pagep) = argp->lsn;
modified = 1;
}
/* Return the page to the pool, marking it dirty only if it was changed. */
if ((ret = memp_fput(mpf, pagep, modified ? DB_MPOOL_DIRTY : 0)) != 0)
goto out;
/*
 * If we are redoing a subdatabase create, we must close and reopen the
 * file to be sure that we have the proper meta information in the
 * in-memory structures.
 */
if (reopen) {
/*
 * Close cursor if it's open.
 * NOTE(review): the return value of c_close is discarded here.
 */
if (dbc != NULL) {
dbc->c_close(dbc);
dbc = NULL;
}
/*
 * The file id is copied into a private buffer before the reopen
 * and the buffer is freed afterwards, whether or not the reopen
 * succeeded.
 */
if ((ret = __os_malloc(dbenv,
DB_FILE_ID_LEN, NULL, &file_uid)) != 0)
goto out;
memcpy(file_uid, &file_dbp->fileid[0], DB_FILE_ID_LEN);
ret = __log_reopen_file(dbenv,
NULL, argp->fileid, file_uid, argp->pgno);
(void)__os_free(file_uid, DB_FILE_ID_LEN);
if (ret != 0)
goto out;
}
/* Success: hand back the previous LSN stored in the record. */
done: *lsnp = argp->prev_lsn;
ret = 0;
out: REC_CLOSE;
}
/*
 * __crdel_metapage_recover --
 *	Recovery function for metapage.
 *
 *	Redo: if the meta-data page at argp->pgno is missing or was allocated
 *	but never written (magic number of 0), write the logged page image,
 *	stamped with *lsnp, and reopen the file through __log_reopen_file.
 *	Undo: remove the file if it is empty or if the page on disk carries
 *	the LSN of this log record; a file whose page has any other LSN is
 *	left alone.
 *
 *	dbenv	environment handle.
 *	dbtp	log record; dbtp->data is decoded by __crdel_metapage_read.
 *	lsnp	in: LSN of this record (stamped on the page during redo and
 *		compared with the on-disk LSN during undo);
 *		out: set to argp->prev_lsn on success.
 *	op	recovery operation, tested with DB_REDO/DB_UNDO.
 *	info	unused.
 *
 *	Returns 0 on success, EIO on a short write, otherwise the error of
 *	the call that failed.
 *
 * PUBLIC: int __crdel_metapage_recover
 * PUBLIC: __P((DB_ENV *, DBT *, DB_LSN *, db_recops, void *));
 */
int
__crdel_metapage_recover(dbenv, dbtp, lsnp, op, info)
	DB_ENV *dbenv;
	DBT *dbtp;
	DB_LSN *lsnp;
	db_recops op;
	void *info;
{
	__crdel_metapage_args *argp;
	DB *dbp;
	DBMETA *meta, ondisk;
	DB_FH fh;
	size_t nr;
	u_int32_t b, io, mb, pagesize;
	int is_done, ret;
	char *real_name;

	COMPQUIET(info, NULL);

	/*
	 * Initialize everything the cleanup code at "out" looks at, so that
	 * an early failure never frees or closes an indeterminate value.
	 */
	argp = NULL;
	real_name = NULL;
	memset(&fh, 0, sizeof(fh));

	REC_PRINT(__crdel_metapage_print);

	if ((ret = __crdel_metapage_read(dbenv, dbtp->data, &argp)) != 0)
		goto out;

	/*
	 * If this is an in-memory database, then the name is going to
	 * be NULL, which looks like a 0-length name in recovery.
	 */
	if (argp->name.size == 0)
		goto done;

	/* The page size is copied out of the logged page image. */
	meta = (DBMETA *)argp->page.data;
	__ua_memcpy(&pagesize, &meta->pagesize, sizeof(pagesize));

	if ((ret = __db_appname(dbenv, DB_APP_DATA,
	    NULL, argp->name.data, 0, NULL, &real_name)) != 0)
		goto out;

	if (DB_REDO(op)) {
		if ((ret = __db_fileid_to_db(dbenv,
		    &dbp, argp->fileid, 0)) != 0) {
			/* A deleted file needs no redo. */
			if (ret == DB_DELETED)
				goto done;
			goto out;
		}

		/*
		 * We simply read the first page and if the magic number is
		 * 0, we write the meta-data page.
		 */
		if ((ret = __os_open(dbenv, real_name, 0, 0, &fh)) != 0)
			goto out;
		if ((ret = __os_seek(dbenv, &fh,
		    pagesize, argp->pgno, 0, 0, DB_OS_SEEK_SET)) != 0)
			goto out;

		/*
		 * If the read succeeds then the page exists, then we need
		 * to verify that the page has actually been written, because
		 * on some systems (e.g., Windows) we preallocate pages because
		 * files aren't allowed to have holes in them.  If the page
		 * looks good then we're done.
		 */
		if ((ret = __os_read(dbenv, &fh, &ondisk,
		    sizeof(ondisk), &nr)) == 0 &&
		    nr == sizeof(ondisk) && ondisk.magic != 0)
			goto done;

		/*
		 * Page didn't exist or was never written.  Reposition
		 * unconditionally: a short or failed read may have moved the
		 * file offset, and the page must land at argp->pgno.
		 */
		if ((ret = __os_seek(dbenv, &fh,
		    pagesize, argp->pgno, 0, 0, DB_OS_SEEK_SET)) != 0)
			goto out;

		/* Update the LSN in the page image and write a new page. */
		__ua_memcpy(&meta->lsn, lsnp, sizeof(DB_LSN));
		if ((ret = __os_write(dbenv, &fh,
		    argp->page.data, argp->page.size, &nr)) != 0)
			goto out;
		if (nr != (size_t)argp->page.size) {
			__db_err(dbenv, "Write failed during recovery");
			ret = EIO;
			goto out;
		}

		/*
		 * We must close and reopen the file to be sure
		 * that we have the proper meta information
		 * in the in memory structures
		 */
		if ((ret = __log_reopen_file(dbenv,
		    argp->name.data, argp->fileid,
		    meta->uid, argp->pgno)) != 0)
			goto out;

		/* Handle will be closed on exit. */
	} else if (DB_UNDO(op)) {
		is_done = 0;

		/* If file does not exist, there is nothing to undo. */
		if (__os_exists(real_name, NULL) != 0)
			goto done;

		/*
		 * Before we can look at anything on disk, we have to check
		 * if there is a valid dbp for this, and if there is, we'd
		 * better flush it.
		 */
		dbp = NULL;
		if ((ret = __db_fileid_to_db(dbenv,
		    &dbp, argp->fileid, 0)) == 0 && dbp != NULL)
			(void)dbp->sync(dbp, 0);

		/*
		 * We need to make sure that we do not remove a file that
		 * someone else created.  If the file is 0-length, then we
		 * can assume that we created it and remove it.  If it is
		 * not 0-length, then we need to check the LSN and make
		 * sure that it's the file we created.
		 */
		if ((ret = __os_open(dbenv, real_name, 0, 0, &fh)) != 0)
			goto out;
		if ((ret = __os_ioinfo(dbenv,
		    real_name, &fh, &mb, &b, &io)) != 0)
			goto out;
		if (mb != 0 || b != 0) {
			/* The file has something in it. */
			if ((ret = __os_seek(dbenv, &fh,
			    pagesize, argp->pgno, 0, 0, DB_OS_SEEK_SET)) != 0)
				goto out;
			if ((ret = __os_read(dbenv, &fh,
			    &ondisk, sizeof(ondisk), &nr)) != 0)
				goto out;
			/*
			 * Only compare the LSN after a complete read; after a
			 * short read ondisk.lsn is not fully populated, so the
			 * page cannot be shown to be ours and the file is kept.
			 */
			if (nr != sizeof(ondisk) ||
			    log_compare(&ondisk.lsn, lsnp) != 0)
				is_done = 1;
		}

		/*
		 * Must close here, because unlink with the file open fails
		 * on some systems.
		 */
		if ((ret = __os_closehandle(&fh)) != 0)
			goto out;

		if (!is_done) {
			/*
			 * On some systems, you cannot unlink an open file so
			 * we close the fd in the dbp here and make sure we
			 * don't try to close it again.  First, check for a
			 * saved_open_fhp, then close down the mpool.
			 */
			if (dbp != NULL && dbp->saved_open_fhp != NULL &&
			    F_ISSET(dbp->saved_open_fhp, DB_FH_VALID) &&
			    (ret = __os_closehandle(dbp->saved_open_fhp)) != 0)
				goto out;
			if (dbp != NULL && dbp->mpf != NULL) {
				(void)__memp_fremove(dbp->mpf);
				if ((ret = memp_fclose(dbp->mpf)) != 0)
					goto out;
				F_SET(dbp, DB_AM_DISCARD);
				dbp->mpf = NULL;
			}
			if ((ret = __os_unlink(dbenv, real_name)) != 0)
				goto out;
		}
	}

done:	*lsnp = argp->prev_lsn;
	ret = 0;

out:	if (argp != NULL)
		__os_free(argp, 0);
	if (real_name != NULL)
		__os_freestr(real_name);
	/* Release the handle if it is still open (redo path, error paths). */
	if (F_ISSET(&fh, DB_FH_VALID))
		(void)__os_closehandle(&fh);
	return (ret);
}
/*
 * __crdel_delete_recover --
 *	Recovery function for delete.
 *
 *	Redo: the delete committed.  If the file still exists and its file id
 *	maps to an open DB handle, close the handle's memory pool file and
 *	unlink the file; a file id reported as DB_DELETED is skipped.  Then
 *	remove the backup file if it exists and call __db_txnlist_delete for
 *	the file name.
 *	Undo: if the backup file exists, rename it back to the original name.
 *
 *	dbenv	environment handle.
 *	dbtp	log record; dbtp->data is decoded by __crdel_delete_read.
 *	lsnp	in: passed to __db_backup_name to build the backup name;
 *		out: set to argp->prev_lsn on success.
 *	op	recovery operation, tested with DB_REDO/DB_UNDO.
 *	info	passed to __db_txnlist_delete during redo.
 *
 *	Returns 0 on success, otherwise the error of the call that failed.
 *
 * PUBLIC: int __crdel_delete_recover
 * PUBLIC: __P((DB_ENV *, DBT *, DB_LSN *, db_recops, void *));
 */
int
__crdel_delete_recover(dbenv, dbtp, lsnp, op, info)
	DB_ENV *dbenv;
	DBT *dbtp;
	DB_LSN *lsnp;
	db_recops op;
	void *info;
{
	DB *dbp;
	__crdel_delete_args *argp;
	int ret;
	char *backup, *real_back, *real_name;

	REC_PRINT(__crdel_delete_print);

	/*
	 * Initialize everything the cleanup code at "out" looks at, so that
	 * a failed read of the log record never frees an indeterminate
	 * pointer.
	 */
	argp = NULL;
	backup = real_back = real_name = NULL;

	if ((ret = __crdel_delete_read(dbenv, dbtp->data, &argp)) != 0)
		goto out;

	if (DB_REDO(op)) {
		/*
		 * On a recovery, as we recreate what was going on, we
		 * recreate the creation of the file.  And so, even though
		 * it committed, we need to delete it.  It is not an error
		 * if the file is already gone; a failed unlink of a file
		 * that does exist is returned to the caller.
		 */
		if ((ret = __db_appname(dbenv, DB_APP_DATA,
		    NULL, argp->name.data, 0, NULL, &real_name)) != 0)
			goto out;
		if (__os_exists(real_name, NULL) == 0) {
			/*
			 * If a file is deleted and then recreated, it's
			 * possible for the __os_exists call above to
			 * return success and for us to get here, but for
			 * the fileid we're looking for to be marked
			 * deleted.  In that case, we needn't redo the
			 * unlink even though the file exists, and it's
			 * not an error.
			 */
			ret = __db_fileid_to_db(dbenv, &dbp, argp->fileid, 0);
			if (ret == 0) {
				/*
				 * On Windows, the underlying file must be
				 * closed to perform a remove.  The pool file
				 * may already have been closed, so guard the
				 * close the same way the other recovery
				 * functions in this file do.
				 */
				if (dbp->mpf != NULL) {
					(void)__memp_fremove(dbp->mpf);
					if ((ret = memp_fclose(dbp->mpf)) != 0)
						goto out;
					dbp->mpf = NULL;
				}
				if ((ret = __os_unlink(dbenv, real_name)) != 0)
					goto out;
			} else if (ret != DB_DELETED)
				goto out;
		}

		/*
		 * The transaction committed, so the only thing that might
		 * be true is that the backup file is still around.  Remove
		 * it if it exists; a missing backup is not an error.
		 */
		if ((ret = __db_backup_name(dbenv, argp->name.data,
		    &backup, lsnp)) != 0)
			goto out;
		if ((ret = __db_appname(dbenv,
		    DB_APP_DATA, NULL, backup, 0, NULL, &real_back)) != 0)
			goto out;
		if (__os_exists(real_back, NULL) == 0)
			if ((ret = __os_unlink(dbenv, real_back)) != 0)
				goto out;
		if ((ret = __db_txnlist_delete(dbenv, info,
		    argp->name.data, TXNLIST_INVALID_ID, 1)) != 0)
			goto out;
	} else if (DB_UNDO(op)) {
		/*
		 * Trying to undo.  File may or may not have been deleted.
		 * Try to move the backup to the original.  If the backup
		 * exists, then this is right.  If it doesn't exist, then
		 * nothing will happen and that's OK.
		 */
		if ((ret = __db_backup_name(dbenv, argp->name.data,
		    &backup, lsnp)) != 0)
			goto out;
		if ((ret = __db_appname(dbenv,
		    DB_APP_DATA, NULL, backup, 0, NULL, &real_back)) != 0)
			goto out;
		if ((ret = __db_appname(dbenv, DB_APP_DATA,
		    NULL, argp->name.data, 0, NULL, &real_name)) != 0)
			goto out;
		if (__os_exists(real_back, NULL) == 0)
			if ((ret =
			    __os_rename(dbenv, real_back, real_name)) != 0)
				goto out;
	}

	*lsnp = argp->prev_lsn;
	ret = 0;

out:	if (argp != NULL)
		__os_free(argp, 0);
	if (backup != NULL)
		__os_freestr(backup);
	if (real_back != NULL)
		__os_freestr(real_back);
	if (real_name != NULL)
		__os_freestr(real_name);
	return (ret);
}
/*
 * __crdel_rename_recover --
 *	Recovery function for rename.
 *
 *	Redo: record the new name for the file id with __log_filelist_update;
 *	if that call reports "set" and the file still exists under the old
 *	name, close the handle's memory pool file and rename old -> new.
 *	Any other operation: the same steps in the opposite direction
 *	(record the old name, rename new -> old).
 *
 *	dbenv	environment handle.
 *	dbtp	log record; dbtp->data is decoded by __crdel_rename_read.
 *	lsnp	on success, set to argp->prev_lsn.
 *	op	recovery operation; only DB_REDO is tested, every other value
 *		takes the reverse path.
 *	info	unused.
 *
 *	Returns 0 on success, otherwise the error of the call that failed.
 *	Any non-zero return from __db_fileid_to_db is returned as is.
 *
 * PUBLIC: int __crdel_rename_recover
 * PUBLIC: __P((DB_ENV *, DBT *, DB_LSN *, db_recops, void *));
 */
int
__crdel_rename_recover(dbenv, dbtp, lsnp, op, info)
	DB_ENV *dbenv;
	DBT *dbtp;
	DB_LSN *lsnp;
	db_recops op;
	void *info;
{
	DB *dbp;
	__crdel_rename_args *argp;
	char *new_name, *real_name;
	int ret, set;

	COMPQUIET(info, NULL);

	REC_PRINT(__crdel_rename_print);

	/*
	 * Initialize everything the cleanup code at "out" looks at, so that
	 * a failed read of the log record never frees an indeterminate
	 * pointer.
	 */
	argp = NULL;
	new_name = real_name = NULL;

	if ((ret = __crdel_rename_read(dbenv, dbtp->data, &argp)) != 0)
		goto out;

	if ((ret = __db_fileid_to_db(dbenv, &dbp, argp->fileid, 0)) != 0)
		goto out;

	if (DB_REDO(op)) {
		/*
		 * We don't use the dbp parameter to __log_filelist_update
		 * in the rename case, so passing NULL for it is OK.
		 */
		if ((ret = __log_filelist_update(dbenv, NULL,
		    argp->fileid, argp->newname.data, &set)) != 0)
			goto out;
		if (set != 0) {
			if ((ret = __db_appname(dbenv, DB_APP_DATA,
			    NULL, argp->name.data, 0, NULL, &real_name)) != 0)
				goto out;
			if (__os_exists(real_name, NULL) == 0) {
				if ((ret = __db_appname(dbenv,
				    DB_APP_DATA, NULL, argp->newname.data,
				    0, NULL, &new_name)) != 0)
					goto out;
				/*
				 * On Windows, the underlying file
				 * must be closed to perform a remove.
				 * The db will be closed by a
				 * log_register record.  Rename
				 * has exclusive access to the db.
				 * Skip the close if the pool file is
				 * already gone, as the reverse path does.
				 */
				if (dbp->mpf != NULL) {
					(void)__memp_fremove(dbp->mpf);
					if ((ret = memp_fclose(dbp->mpf)) != 0)
						goto out;
					dbp->mpf = NULL;
				}
				if ((ret = __os_rename(dbenv,
				    real_name, new_name)) != 0)
					goto out;
			}
		}
	} else {
		/*
		 * We don't use the dbp parameter to __log_filelist_update
		 * in the rename case, so passing NULL for it is OK.
		 */
		if ((ret = __log_filelist_update(dbenv, NULL,
		    argp->fileid, argp->name.data, &set)) != 0)
			goto out;
		if (set != 0) {
			if ((ret = __db_appname(dbenv, DB_APP_DATA,
			    NULL, argp->newname.data, 0, NULL, &new_name)) != 0)
				goto out;
			if (__os_exists(new_name, NULL) == 0) {
				if ((ret = __db_appname(dbenv,
				    DB_APP_DATA, NULL, argp->name.data,
				    0, NULL, &real_name)) != 0)
					goto out;
				/*
				 * On Windows, the underlying file
				 * must be closed to perform a remove.
				 * The file may have already been closed
				 * if we are aborting the transaction.
				 */
				if (dbp->mpf != NULL) {
					(void)__memp_fremove(dbp->mpf);
					if ((ret = memp_fclose(dbp->mpf)) != 0)
						goto out;
					dbp->mpf = NULL;
				}
				if ((ret = __os_rename(dbenv,
				    new_name, real_name)) != 0)
					goto out;
			}
		}
	}

	*lsnp = argp->prev_lsn;
	ret = 0;

out:	if (argp != NULL)
		__os_free(argp, 0);
	/*
	 * Path names built by __db_appname are released with __os_freestr,
	 * as in the other recovery functions in this file.
	 */
	if (new_name != NULL)
		__os_freestr(new_name);
	if (real_name != NULL)
		__os_freestr(real_name);
	return (ret);
}