2001-03-04 19:42:05 -05:00
|
|
|
/*-
|
|
|
|
* See the file LICENSE for redistribution information.
|
|
|
|
*
|
2005-12-05 10:27:46 -08:00
|
|
|
* Copyright (c) 1996-2005
|
2001-03-04 19:42:05 -05:00
|
|
|
* Sleepycat Software. All rights reserved.
|
2005-07-20 15:48:22 -07:00
|
|
|
*
|
2005-12-05 10:27:46 -08:00
|
|
|
* $Id: log.c,v 12.15 2005/10/14 15:20:24 bostic Exp $
|
2001-03-04 19:42:05 -05:00
|
|
|
*/
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
#include "db_config.h"
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
#ifndef NO_SYSTEM_INCLUDES
|
|
|
|
#include <sys/types.h>
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
#include <ctype.h>
|
2001-03-04 19:42:05 -05:00
|
|
|
#include <stdlib.h>
|
|
|
|
#include <string.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include "db_int.h"
|
2002-10-30 15:57:05 +04:00
|
|
|
#include "dbinc/crypto.h"
|
|
|
|
#include "dbinc/hmac.h"
|
|
|
|
#include "dbinc/log.h"
|
|
|
|
#include "dbinc/txn.h"
|
2001-03-04 19:42:05 -05:00
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
static int __log_init __P((DB_ENV *, DB_LOG *));
|
|
|
|
static int __log_recover __P((DB_LOG *));
|
|
|
|
static size_t __log_region_size __P((DB_ENV *));
|
|
|
|
static int __log_zero __P((DB_ENV *, DB_LSN *, DB_LSN *));
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_open --
|
|
|
|
* Internal version of log_open: only called from DB_ENV->open.
|
|
|
|
*
|
|
|
|
* PUBLIC: int __log_open __P((DB_ENV *));
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
__log_open(dbenv)
|
|
|
|
DB_ENV *dbenv;
|
|
|
|
{
|
|
|
|
DB_LOG *dblp;
|
|
|
|
LOG *lp;
|
2005-12-05 10:27:46 -08:00
|
|
|
u_int8_t *bulk;
|
|
|
|
int region_locked, ret;
|
|
|
|
|
|
|
|
region_locked = 0;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/* Create/initialize the DB_LOG structure. */
|
|
|
|
if ((ret = __os_calloc(dbenv, 1, sizeof(DB_LOG), &dblp)) != 0)
|
|
|
|
return (ret);
|
|
|
|
dblp->dbenv = dbenv;
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
/* Set the default buffer size, if not otherwise configured. */
|
|
|
|
if (dbenv->lg_bsize == 0)
|
|
|
|
dbenv->lg_bsize = F_ISSET(dbenv, DB_ENV_LOG_INMEMORY) ?
|
|
|
|
LG_BSIZE_INMEM : LG_BSIZE_DEFAULT;
|
|
|
|
|
2001-03-04 19:42:05 -05:00
|
|
|
/* Join/create the log region. */
|
2005-07-20 15:48:22 -07:00
|
|
|
dblp->reginfo.dbenv = dbenv;
|
2001-03-04 19:42:05 -05:00
|
|
|
dblp->reginfo.type = REGION_TYPE_LOG;
|
|
|
|
dblp->reginfo.id = INVALID_REGION_ID;
|
|
|
|
dblp->reginfo.flags = REGION_JOIN_OK;
|
|
|
|
if (F_ISSET(dbenv, DB_ENV_CREATE))
|
|
|
|
F_SET(&dblp->reginfo, REGION_CREATE_OK);
|
|
|
|
if ((ret = __db_r_attach(
|
2002-10-30 15:57:05 +04:00
|
|
|
dbenv, &dblp->reginfo, __log_region_size(dbenv))) != 0)
|
2001-03-04 19:42:05 -05:00
|
|
|
goto err;
|
|
|
|
|
|
|
|
/* If we created the region, initialize it. */
|
2002-10-30 15:57:05 +04:00
|
|
|
if (F_ISSET(&dblp->reginfo, REGION_CREATE))
|
|
|
|
if ((ret = __log_init(dbenv, dblp)) != 0)
|
|
|
|
goto err;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/* Set the local addresses. */
|
|
|
|
lp = dblp->reginfo.primary =
|
|
|
|
R_ADDR(&dblp->reginfo, dblp->reginfo.rp->primary);
|
2005-12-05 10:27:46 -08:00
|
|
|
dblp->bufp = R_ADDR(&dblp->reginfo, lp->buffer_off);
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/*
|
2005-12-05 10:27:46 -08:00
|
|
|
* If the region is threaded, we have to lock the DBREG list, and we
|
|
|
|
* need to allocate a mutex for that purpose.
|
2001-03-04 19:42:05 -05:00
|
|
|
*/
|
2005-12-05 10:27:46 -08:00
|
|
|
if ((ret = __mutex_alloc(dbenv,
|
|
|
|
MTX_LOG_REGION, DB_MUTEX_THREAD, &dblp->mtx_dbreg)) != 0)
|
2002-10-30 15:57:05 +04:00
|
|
|
goto err;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Set the handle -- we may be about to run recovery, which allocates
|
|
|
|
* log cursors. Log cursors require logging be already configured,
|
|
|
|
* and the handle being set is what demonstrates that.
|
|
|
|
*
|
|
|
|
* If we created the region, run recovery. If that fails, make sure
|
|
|
|
* we reset the log handle before cleaning up, otherwise we will try
|
|
|
|
* and clean up again in the mainline DB_ENV initialization code.
|
|
|
|
*/
|
|
|
|
dbenv->lg_handle = dblp;
|
|
|
|
|
|
|
|
if (F_ISSET(&dblp->reginfo, REGION_CREATE)) {
|
|
|
|
/*
|
|
|
|
* We first take the log file size from the environment, if
|
2005-07-20 15:48:22 -07:00
|
|
|
* specified. If that wasn't set, default it. Regardless,
|
|
|
|
* recovery may set it from the persistent information in a
|
|
|
|
* log file header.
|
2002-10-30 15:57:05 +04:00
|
|
|
*/
|
|
|
|
if (lp->log_size == 0)
|
2005-07-20 15:48:22 -07:00
|
|
|
lp->log_size = F_ISSET(dbenv, DB_ENV_LOG_INMEMORY) ?
|
|
|
|
LG_MAX_INMEM : LG_MAX_DEFAULT;
|
|
|
|
|
|
|
|
if ((ret = __log_recover(dblp)) != 0)
|
|
|
|
goto err;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* If the next log file size hasn't been set yet, default it
|
|
|
|
* to the current log file size.
|
|
|
|
*/
|
|
|
|
if (lp->log_nsize == 0)
|
|
|
|
lp->log_nsize = lp->log_size;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* If we haven't written any log files, write the first one
|
|
|
|
* so that checkpoint gets a valid ckp_lsn value.
|
|
|
|
*/
|
|
|
|
if (IS_INIT_LSN(lp->lsn) &&
|
|
|
|
(ret = __log_newfile(dblp, NULL, 0)) != 0)
|
|
|
|
goto err;
|
|
|
|
|
2005-12-05 10:27:46 -08:00
|
|
|
/*
|
|
|
|
* Initialize replication's next-expected LSN value
|
|
|
|
* and replication's bulk buffer.
|
|
|
|
*/
|
2005-07-20 15:48:22 -07:00
|
|
|
lp->ready_lsn = lp->lsn;
|
2005-12-05 10:27:46 -08:00
|
|
|
if (IS_ENV_REPLICATED(dbenv)) {
|
|
|
|
if ((ret = __db_shalloc(&dblp->reginfo, MEGABYTE, 0,
|
|
|
|
&bulk)) != 0)
|
|
|
|
goto err;
|
|
|
|
lp->bulk_buf = R_OFFSET(&dblp->reginfo, bulk);
|
|
|
|
lp->bulk_len = MEGABYTE;
|
|
|
|
lp->bulk_off = 0;
|
|
|
|
} else {
|
|
|
|
lp->bulk_buf = INVALID_ROFF;
|
|
|
|
lp->bulk_len = 0;
|
|
|
|
lp->bulk_off = 0;
|
|
|
|
}
|
2002-10-30 15:57:05 +04:00
|
|
|
} else {
|
|
|
|
/*
|
|
|
|
* A process joining the region may have reset the log file
|
|
|
|
* size, too. If so, it only affects the next log file we
|
2005-07-20 15:48:22 -07:00
|
|
|
* create. We need to check that the size is reasonable given
|
|
|
|
* the buffer size in the region.
|
2002-10-30 15:57:05 +04:00
|
|
|
*/
|
2005-12-05 10:27:46 -08:00
|
|
|
LOG_SYSTEM_LOCK(dbenv);
|
|
|
|
region_locked = 1;
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
if (dbenv->lg_size != 0) {
|
|
|
|
if ((ret =
|
|
|
|
__log_check_sizes(dbenv, dbenv->lg_size, 0)) != 0)
|
|
|
|
goto err;
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
lp->log_nsize = dbenv->lg_size;
|
2005-07-20 15:48:22 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Migrate persistent flags from the region into the DB_ENV. */
|
|
|
|
if (lp->db_log_autoremove)
|
|
|
|
F_SET(dbenv, DB_ENV_LOG_AUTOREMOVE);
|
|
|
|
if (lp->db_log_inmemory)
|
|
|
|
F_SET(dbenv, DB_ENV_LOG_INMEMORY);
|
2005-12-05 10:27:46 -08:00
|
|
|
|
|
|
|
LOG_SYSTEM_UNLOCK(dbenv);
|
|
|
|
region_locked = 0;
|
2001-03-04 19:42:05 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
return (0);
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
err: dbenv->lg_handle = NULL;
|
|
|
|
if (dblp->reginfo.addr != NULL) {
|
2005-12-05 10:27:46 -08:00
|
|
|
if (region_locked)
|
|
|
|
LOG_SYSTEM_UNLOCK(dbenv);
|
2001-03-04 19:42:05 -05:00
|
|
|
(void)__db_r_detach(dbenv, &dblp->reginfo, 0);
|
|
|
|
}
|
|
|
|
|
2005-12-05 10:27:46 -08:00
|
|
|
(void)__mutex_free(dbenv, &dblp->mtx_dbreg);
|
2002-10-30 15:57:05 +04:00
|
|
|
__os_free(dbenv, dblp);
|
|
|
|
|
2001-03-04 19:42:05 -05:00
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_init --
|
|
|
|
* Initialize a log region in shared memory.
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
__log_init(dbenv, dblp)
|
|
|
|
DB_ENV *dbenv;
|
|
|
|
DB_LOG *dblp;
|
|
|
|
{
|
2005-07-20 15:48:22 -07:00
|
|
|
LOG *lp;
|
2001-03-04 19:42:05 -05:00
|
|
|
int ret;
|
|
|
|
void *p;
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
/*
|
|
|
|
* This is the first point where we can validate the buffer size,
|
|
|
|
* because we know all three settings have been configured (file size,
|
|
|
|
* buffer size and the in-memory flag).
|
|
|
|
*/
|
|
|
|
if ((ret =
|
|
|
|
__log_check_sizes(dbenv, dbenv->lg_size, dbenv->lg_bsize)) != 0)
|
|
|
|
return (ret);
|
|
|
|
|
|
|
|
if ((ret = __db_shalloc(&dblp->reginfo,
|
2005-12-05 10:27:46 -08:00
|
|
|
sizeof(*lp), 0, &dblp->reginfo.primary)) != 0)
|
2001-03-04 19:42:05 -05:00
|
|
|
goto mem_err;
|
|
|
|
dblp->reginfo.rp->primary =
|
|
|
|
R_OFFSET(&dblp->reginfo, dblp->reginfo.primary);
|
2005-07-20 15:48:22 -07:00
|
|
|
lp = dblp->reginfo.primary;
|
|
|
|
memset(lp, 0, sizeof(*lp));
|
2001-03-04 19:42:05 -05:00
|
|
|
|
2005-12-05 10:27:46 -08:00
|
|
|
if ((ret =
|
|
|
|
__mutex_alloc(dbenv, MTX_LOG_REGION, 0, &lp->mtx_region)) != 0)
|
|
|
|
return (ret);
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
lp->fid_max = 0;
|
|
|
|
SH_TAILQ_INIT(&lp->fq);
|
|
|
|
lp->free_fid_stack = INVALID_ROFF;
|
|
|
|
lp->free_fids = lp->free_fids_alloced = 0;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/* Initialize LOG LSNs. */
|
2005-07-20 15:48:22 -07:00
|
|
|
INIT_LSN(lp->lsn);
|
|
|
|
INIT_LSN(lp->t_lsn);
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
/*
|
|
|
|
* It's possible to be waiting for an LSN of [1][0], if a replication
|
|
|
|
* client gets the first log record out of order. An LSN of [0][0]
|
|
|
|
* signifies that we're not waiting.
|
|
|
|
*/
|
2005-07-20 15:48:22 -07:00
|
|
|
ZERO_LSN(lp->waiting_lsn);
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Log makes note of the fact that it ran into a checkpoint on
|
|
|
|
* startup if it did so, as a recovery optimization. A zero
|
|
|
|
* LSN signifies that it hasn't found one [yet].
|
|
|
|
*/
|
2005-07-20 15:48:22 -07:00
|
|
|
ZERO_LSN(lp->cached_ckp_lsn);
|
2002-10-30 15:57:05 +04:00
|
|
|
|
2005-12-05 10:27:46 -08:00
|
|
|
if ((ret =
|
|
|
|
__mutex_alloc(dbenv, MTX_LOG_FILENAME, 0, &lp->mtx_filelist)) != 0)
|
2002-10-30 15:57:05 +04:00
|
|
|
return (ret);
|
2005-12-05 10:27:46 -08:00
|
|
|
if ((ret = __mutex_alloc(dbenv, MTX_LOG_FLUSH, 0, &lp->mtx_flush)) != 0)
|
2002-10-30 15:57:05 +04:00
|
|
|
return (ret);
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/* Initialize the buffer. */
|
2005-07-20 15:48:22 -07:00
|
|
|
if ((ret = __db_shalloc(&dblp->reginfo, dbenv->lg_bsize, 0, &p)) != 0) {
|
2001-03-04 19:42:05 -05:00
|
|
|
mem_err: __db_err(dbenv, "Unable to allocate memory for the log buffer");
|
|
|
|
return (ret);
|
|
|
|
}
|
2005-07-20 15:48:22 -07:00
|
|
|
lp->regionmax = dbenv->lg_regionmax;
|
|
|
|
lp->buffer_off = R_OFFSET(&dblp->reginfo, p);
|
|
|
|
lp->buffer_size = dbenv->lg_bsize;
|
2005-12-05 10:27:46 -08:00
|
|
|
lp->filemode = dbenv->lg_filemode;
|
2005-07-20 15:48:22 -07:00
|
|
|
lp->log_size = lp->log_nsize = dbenv->lg_size;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
/* Initialize the commit Queue. */
|
2005-07-20 15:48:22 -07:00
|
|
|
SH_TAILQ_INIT(&lp->free_commits);
|
|
|
|
SH_TAILQ_INIT(&lp->commits);
|
|
|
|
lp->ncommit = 0;
|
|
|
|
|
|
|
|
/* Initialize the logfiles list for in-memory logs. */
|
|
|
|
SH_TAILQ_INIT(&lp->logfiles);
|
|
|
|
SH_TAILQ_INIT(&lp->free_logfiles);
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Fill in the log's persistent header. Don't fill in the log file
|
|
|
|
* sizes, as they may change at any time and so have to be filled in
|
|
|
|
* as each log file is created.
|
|
|
|
*/
|
2005-07-20 15:48:22 -07:00
|
|
|
lp->persist.magic = DB_LOGMAGIC;
|
|
|
|
lp->persist.version = DB_LOGVERSION;
|
2005-12-05 10:27:46 -08:00
|
|
|
lp->persist.notused = 0;
|
2005-07-20 15:48:22 -07:00
|
|
|
|
|
|
|
/* Migrate persistent flags from the DB_ENV into the region. */
|
|
|
|
if (F_ISSET(dbenv, DB_ENV_LOG_AUTOREMOVE))
|
|
|
|
lp->db_log_autoremove = 1;
|
|
|
|
if (F_ISSET(dbenv, DB_ENV_LOG_INMEMORY))
|
|
|
|
lp->db_log_inmemory = 1;
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
return (0);
|
2001-03-04 19:42:05 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_recover --
|
|
|
|
* Recover a log.
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
__log_recover(dblp)
|
|
|
|
DB_LOG *dblp;
|
|
|
|
{
|
|
|
|
DBT dbt;
|
2002-10-30 15:57:05 +04:00
|
|
|
DB_ENV *dbenv;
|
|
|
|
DB_LOGC *logc;
|
2001-03-04 19:42:05 -05:00
|
|
|
DB_LSN lsn;
|
|
|
|
LOG *lp;
|
2002-10-30 15:57:05 +04:00
|
|
|
u_int32_t cnt, rectype;
|
|
|
|
int ret;
|
2001-03-04 19:42:05 -05:00
|
|
|
logfile_validity status;
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
logc = NULL;
|
|
|
|
dbenv = dblp->dbenv;
|
2001-03-04 19:42:05 -05:00
|
|
|
lp = dblp->reginfo.primary;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Find a log file. If none exist, we simply return, leaving
|
|
|
|
* everything initialized to a new log.
|
|
|
|
*/
|
|
|
|
if ((ret = __log_find(dblp, 0, &cnt, &status)) != 0)
|
|
|
|
return (ret);
|
|
|
|
if (cnt == 0)
|
|
|
|
return (0);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* If the last file is an old version, readable or no, start a new
|
2002-10-30 15:57:05 +04:00
|
|
|
* file. Don't bother finding the end of the last log file;
|
|
|
|
* we assume that it's valid in its entirety, since the user
|
|
|
|
* should have shut down cleanly or run recovery before upgrading.
|
2001-03-04 19:42:05 -05:00
|
|
|
*/
|
|
|
|
if (status == DB_LV_OLD_READABLE || status == DB_LV_OLD_UNREADABLE) {
|
|
|
|
lp->lsn.file = lp->s_lsn.file = cnt + 1;
|
|
|
|
lp->lsn.offset = lp->s_lsn.offset = 0;
|
|
|
|
goto skipsearch;
|
|
|
|
}
|
|
|
|
DB_ASSERT(status == DB_LV_NORMAL);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* We have the last useful log file and we've loaded any persistent
|
|
|
|
* information. Set the end point of the log past the end of the last
|
|
|
|
* file. Read the last file, looking for the last checkpoint and
|
|
|
|
* the log's end.
|
|
|
|
*/
|
|
|
|
lp->lsn.file = cnt + 1;
|
|
|
|
lp->lsn.offset = 0;
|
|
|
|
lsn.file = cnt;
|
|
|
|
lsn.offset = 0;
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
/*
|
|
|
|
* Allocate a cursor and set it to the first record. This shouldn't
|
|
|
|
* fail, leave error messages on.
|
|
|
|
*/
|
2005-07-20 15:48:22 -07:00
|
|
|
if ((ret = __log_cursor(dbenv, &logc)) != 0)
|
2001-03-04 19:42:05 -05:00
|
|
|
return (ret);
|
2002-10-30 15:57:05 +04:00
|
|
|
F_SET(logc, DB_LOG_LOCKED);
|
|
|
|
memset(&dbt, 0, sizeof(dbt));
|
2005-07-20 15:48:22 -07:00
|
|
|
if ((ret = __log_c_get(logc, &lsn, &dbt, DB_SET)) != 0)
|
2002-10-30 15:57:05 +04:00
|
|
|
goto err;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/*
|
2002-10-30 15:57:05 +04:00
|
|
|
* Read to the end of the file. This may fail at some point, so
|
|
|
|
* turn off error messages.
|
2001-03-04 19:42:05 -05:00
|
|
|
*/
|
2002-10-30 15:57:05 +04:00
|
|
|
F_SET(logc, DB_LOG_SILENT_ERR);
|
2005-07-20 15:48:22 -07:00
|
|
|
while (__log_c_get(logc, &lsn, &dbt, DB_NEXT) == 0) {
|
2001-03-04 19:42:05 -05:00
|
|
|
if (dbt.size < sizeof(u_int32_t))
|
|
|
|
continue;
|
2002-10-30 15:57:05 +04:00
|
|
|
memcpy(&rectype, dbt.data, sizeof(u_int32_t));
|
|
|
|
if (rectype == DB___txn_ckp)
|
|
|
|
/*
|
|
|
|
* If we happen to run into a checkpoint, cache its
|
|
|
|
* LSN so that the transaction system doesn't have
|
|
|
|
* to walk this log file again looking for it.
|
|
|
|
*/
|
|
|
|
lp->cached_ckp_lsn = lsn;
|
2001-03-04 19:42:05 -05:00
|
|
|
}
|
2002-10-30 15:57:05 +04:00
|
|
|
F_CLR(logc, DB_LOG_SILENT_ERR);
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/*
|
|
|
|
* We now know where the end of the log is. Set the first LSN that
|
|
|
|
* we want to return to an application and the LSN of the last known
|
|
|
|
* record on disk.
|
|
|
|
*/
|
|
|
|
lp->lsn = lsn;
|
|
|
|
lp->s_lsn = lsn;
|
2002-10-30 15:57:05 +04:00
|
|
|
lp->lsn.offset += logc->c_len;
|
|
|
|
lp->s_lsn.offset += logc->c_len;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/* Set up the current buffer information, too. */
|
2002-10-30 15:57:05 +04:00
|
|
|
lp->len = logc->c_len;
|
2005-07-20 15:48:22 -07:00
|
|
|
lp->a_off = 0;
|
2001-03-04 19:42:05 -05:00
|
|
|
lp->b_off = 0;
|
|
|
|
lp->w_off = lp->lsn.offset;
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
skipsearch:
|
|
|
|
if (FLD_ISSET(dbenv->verbose, DB_VERB_RECOVERY))
|
2005-07-20 15:48:22 -07:00
|
|
|
__db_msg(dbenv,
|
2001-03-04 19:42:05 -05:00
|
|
|
"Finding last valid log LSN: file: %lu offset %lu",
|
|
|
|
(u_long)lp->lsn.file, (u_long)lp->lsn.offset);
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
err: if (logc != NULL)
|
2005-07-20 15:48:22 -07:00
|
|
|
(void)__log_c_close(logc);
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
return (ret);
|
2001-03-04 19:42:05 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_find --
|
|
|
|
* Try to find a log file. If find_first is set, valp will contain
|
|
|
|
* the number of the first readable log file, else it will contain the number
|
|
|
|
* of the last log file (which may be too old to read).
|
|
|
|
*
|
2002-10-30 15:57:05 +04:00
|
|
|
* PUBLIC: int __log_find __P((DB_LOG *, int, u_int32_t *, logfile_validity *));
|
2001-03-04 19:42:05 -05:00
|
|
|
*/
|
|
|
|
int
|
|
|
|
__log_find(dblp, find_first, valp, statusp)
|
|
|
|
DB_LOG *dblp;
|
2002-10-30 15:57:05 +04:00
|
|
|
int find_first;
|
|
|
|
u_int32_t *valp;
|
2001-03-04 19:42:05 -05:00
|
|
|
logfile_validity *statusp;
|
|
|
|
{
|
2002-10-30 15:57:05 +04:00
|
|
|
DB_ENV *dbenv;
|
2005-07-20 15:48:22 -07:00
|
|
|
LOG *lp;
|
2001-05-09 23:02:36 +03:00
|
|
|
logfile_validity logval_status, status;
|
2005-07-20 15:48:22 -07:00
|
|
|
struct __db_filestart *filestart;
|
2001-03-04 19:42:05 -05:00
|
|
|
u_int32_t clv, logval;
|
|
|
|
int cnt, fcnt, ret;
|
|
|
|
const char *dir;
|
2002-10-30 15:57:05 +04:00
|
|
|
char *c, **names, *p, *q, savech;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
dbenv = dblp->dbenv;
|
2005-07-20 15:48:22 -07:00
|
|
|
lp = dblp->reginfo.primary;
|
2001-05-09 23:02:36 +03:00
|
|
|
logval_status = status = DB_LV_NONEXISTENT;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/* Return a value of 0 as the log file number on failure. */
|
|
|
|
*valp = 0;
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
if (lp->db_log_inmemory) {
|
|
|
|
filestart = find_first ?
|
|
|
|
SH_TAILQ_FIRST(&lp->logfiles, __db_filestart) :
|
|
|
|
SH_TAILQ_LAST(&lp->logfiles, links, __db_filestart);
|
|
|
|
if (filestart != NULL) {
|
|
|
|
*valp = filestart->file;
|
|
|
|
logval_status = DB_LV_NORMAL;
|
|
|
|
}
|
|
|
|
*statusp = logval_status;
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
2001-03-04 19:42:05 -05:00
|
|
|
/* Find the directory name. */
|
|
|
|
if ((ret = __log_name(dblp, 1, &p, NULL, 0)) != 0)
|
|
|
|
return (ret);
|
|
|
|
if ((q = __db_rpath(p)) == NULL) {
|
|
|
|
COMPQUIET(savech, 0);
|
|
|
|
dir = PATH_DOT;
|
|
|
|
} else {
|
|
|
|
savech = *q;
|
|
|
|
*q = '\0';
|
|
|
|
dir = p;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Get the list of file names. */
|
2002-10-30 15:57:05 +04:00
|
|
|
ret = __os_dirlist(dbenv, dir, &names, &fcnt);
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/*
|
|
|
|
* !!!
|
|
|
|
* We overwrote a byte in the string with a nul. Restore the string
|
|
|
|
* so that the diagnostic checks in the memory allocation code work
|
|
|
|
* and any error messages display the right file name.
|
|
|
|
*/
|
|
|
|
if (q != NULL)
|
|
|
|
*q = savech;
|
|
|
|
|
|
|
|
if (ret != 0) {
|
2002-10-30 15:57:05 +04:00
|
|
|
__db_err(dbenv, "%s: %s", dir, db_strerror(ret));
|
|
|
|
__os_free(dbenv, p);
|
2001-03-04 19:42:05 -05:00
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Search for a valid log file name. */
|
|
|
|
for (cnt = fcnt, clv = logval = 0; --cnt >= 0;) {
|
|
|
|
if (strncmp(names[cnt], LFPREFIX, sizeof(LFPREFIX) - 1) != 0)
|
|
|
|
continue;
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
/*
|
|
|
|
* Names of the form log\.[0-9]* are reserved for DB. Other
|
|
|
|
* names sharing LFPREFIX, such as "log.db", are legal.
|
|
|
|
*/
|
|
|
|
for (c = names[cnt] + sizeof(LFPREFIX) - 1; *c != '\0'; c++)
|
|
|
|
if (!isdigit((int)*c))
|
|
|
|
break;
|
|
|
|
if (*c != '\0')
|
|
|
|
continue;
|
|
|
|
|
2001-03-04 19:42:05 -05:00
|
|
|
/*
|
|
|
|
* Use atol, not atoi; if an "int" is 16-bits, the largest
|
|
|
|
* log file name won't fit.
|
|
|
|
*/
|
2005-07-20 15:48:22 -07:00
|
|
|
clv = (u_int32_t)atol(names[cnt] + (sizeof(LFPREFIX) - 1));
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
/*
|
|
|
|
* If searching for the first log file, we want to return the
|
|
|
|
* oldest log file we can read, or, if no readable log files
|
|
|
|
* exist, the newest log file we can't read (the crossover
|
|
|
|
* point between the old and new versions of the log file).
|
|
|
|
*
|
|
|
|
* If we're searching for the last log file, we want to return
|
|
|
|
* the newest log file, period.
|
|
|
|
*
|
2005-07-20 15:48:22 -07:00
|
|
|
* Readable log files should never precede unreadable log
|
2002-10-30 15:57:05 +04:00
|
|
|
* files, that would mean the admin seriously screwed up.
|
|
|
|
*/
|
2001-03-04 19:42:05 -05:00
|
|
|
if (find_first) {
|
2002-10-30 15:57:05 +04:00
|
|
|
if (logval != 0 &&
|
|
|
|
status != DB_LV_OLD_UNREADABLE && clv > logval)
|
2001-03-04 19:42:05 -05:00
|
|
|
continue;
|
|
|
|
} else
|
|
|
|
if (logval != 0 && clv < logval)
|
|
|
|
continue;
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
if ((ret = __log_valid(dblp, clv, 1, NULL, 0, &status)) != 0) {
|
2002-10-30 15:57:05 +04:00
|
|
|
__db_err(dbenv, "Invalid log file: %s: %s",
|
|
|
|
names[cnt], db_strerror(ret));
|
2001-03-04 19:42:05 -05:00
|
|
|
goto err;
|
2002-10-30 15:57:05 +04:00
|
|
|
}
|
2001-03-04 19:42:05 -05:00
|
|
|
switch (status) {
|
2002-10-30 15:57:05 +04:00
|
|
|
case DB_LV_NONEXISTENT:
|
|
|
|
/* __log_valid never returns DB_LV_NONEXISTENT. */
|
|
|
|
DB_ASSERT(0);
|
|
|
|
break;
|
2001-03-04 19:42:05 -05:00
|
|
|
case DB_LV_INCOMPLETE:
|
|
|
|
/*
|
2002-10-30 15:57:05 +04:00
|
|
|
* The last log file may not have been initialized --
|
|
|
|
* it's possible to create a log file but not write
|
|
|
|
* anything to it. If performing recovery (that is,
|
|
|
|
* if find_first isn't set), ignore the file, it's
|
|
|
|
* not interesting. If we're searching for the first
|
|
|
|
* log record, return the file (assuming we don't find
|
|
|
|
* something better), as the "real" first log record
|
|
|
|
* is likely to be in the log buffer, and we want to
|
|
|
|
* set the file LSN for our return.
|
2001-03-04 19:42:05 -05:00
|
|
|
*/
|
2002-10-30 15:57:05 +04:00
|
|
|
if (find_first)
|
|
|
|
goto found;
|
2001-03-04 19:42:05 -05:00
|
|
|
break;
|
2002-10-30 15:57:05 +04:00
|
|
|
case DB_LV_OLD_UNREADABLE:
|
|
|
|
/*
|
|
|
|
* If we're searching for the first log file, then we
|
|
|
|
* only want this file if we don't yet have a file or
|
|
|
|
* already have an unreadable file and this one is
|
|
|
|
* newer than that one. If we're searching for the
|
|
|
|
* last log file, we always want this file because we
|
|
|
|
* wouldn't be here if it wasn't newer than our current
|
|
|
|
* choice.
|
|
|
|
*/
|
|
|
|
if (!find_first || logval == 0 ||
|
|
|
|
(status == DB_LV_OLD_UNREADABLE && clv > logval))
|
|
|
|
goto found;
|
2001-05-09 23:02:36 +03:00
|
|
|
break;
|
2001-03-04 19:42:05 -05:00
|
|
|
case DB_LV_NORMAL:
|
|
|
|
case DB_LV_OLD_READABLE:
|
2002-10-30 15:57:05 +04:00
|
|
|
found: logval = clv;
|
2001-05-09 23:02:36 +03:00
|
|
|
logval_status = status;
|
2001-03-04 19:42:05 -05:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
*valp = logval;
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
err: __os_dirfree(dbenv, names, fcnt);
|
|
|
|
__os_free(dbenv, p);
|
2001-05-09 23:02:36 +03:00
|
|
|
*statusp = logval_status;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* log_valid --
|
|
|
|
* Validate a log file. Returns an error code in the event of
|
|
|
|
* a fatal flaw in a the specified log file; returns success with
|
|
|
|
* a code indicating the currentness and completeness of the specified
|
|
|
|
* log file if it is not unexpectedly flawed (that is, if it's perfectly
|
|
|
|
* normal, if it's zero-length, or if it's an old version).
|
|
|
|
*
|
2005-07-20 15:48:22 -07:00
|
|
|
* PUBLIC: int __log_valid __P((DB_LOG *, u_int32_t, int,
|
|
|
|
* PUBLIC: DB_FH **, u_int32_t, logfile_validity *));
|
2001-03-04 19:42:05 -05:00
|
|
|
*/
|
|
|
|
int
|
2005-07-20 15:48:22 -07:00
|
|
|
__log_valid(dblp, number, set_persist, fhpp, flags, statusp)
|
2001-03-04 19:42:05 -05:00
|
|
|
DB_LOG *dblp;
|
|
|
|
u_int32_t number;
|
|
|
|
int set_persist;
|
2005-07-20 15:48:22 -07:00
|
|
|
DB_FH **fhpp;
|
|
|
|
u_int32_t flags;
|
2001-03-04 19:42:05 -05:00
|
|
|
logfile_validity *statusp;
|
|
|
|
{
|
2002-10-30 15:57:05 +04:00
|
|
|
DB_CIPHER *db_cipher;
|
|
|
|
DB_ENV *dbenv;
|
2005-07-20 15:48:22 -07:00
|
|
|
DB_FH *fhp;
|
2002-10-30 15:57:05 +04:00
|
|
|
HDR *hdr;
|
2005-07-20 15:48:22 -07:00
|
|
|
LOG *lp;
|
2002-10-30 15:57:05 +04:00
|
|
|
LOGP *persist;
|
2001-03-04 19:42:05 -05:00
|
|
|
logfile_validity status;
|
2005-07-20 15:48:22 -07:00
|
|
|
size_t hdrsize, nr, recsize;
|
|
|
|
int is_hmac, ret;
|
2002-10-30 15:57:05 +04:00
|
|
|
u_int8_t *tmp;
|
|
|
|
char *fname;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
dbenv = dblp->dbenv;
|
|
|
|
db_cipher = dbenv->crypto_handle;
|
2005-07-20 15:48:22 -07:00
|
|
|
fhp = NULL;
|
2002-10-30 15:57:05 +04:00
|
|
|
persist = NULL;
|
2001-03-04 19:42:05 -05:00
|
|
|
status = DB_LV_NORMAL;
|
2005-07-20 15:48:22 -07:00
|
|
|
tmp = NULL;
|
|
|
|
|
|
|
|
/* Return the file handle to our caller, on request */
|
|
|
|
if (fhpp != NULL)
|
|
|
|
*fhpp = NULL;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
if (flags == 0)
|
|
|
|
flags = DB_OSO_RDONLY | DB_OSO_SEQ;
|
2001-03-04 19:42:05 -05:00
|
|
|
/* Try to open the log file. */
|
2005-07-20 15:48:22 -07:00
|
|
|
if ((ret = __log_name(dblp, number, &fname, &fhp, flags)) != 0) {
|
2002-10-30 15:57:05 +04:00
|
|
|
__os_free(dbenv, fname);
|
2001-03-04 19:42:05 -05:00
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
hdrsize = HDR_NORMAL_SZ;
|
|
|
|
is_hmac = 0;
|
|
|
|
recsize = sizeof(LOGP);
|
|
|
|
if (CRYPTO_ON(dbenv)) {
|
|
|
|
hdrsize = HDR_CRYPTO_SZ;
|
|
|
|
recsize = sizeof(LOGP);
|
|
|
|
recsize += db_cipher->adj_size(recsize);
|
|
|
|
is_hmac = 1;
|
|
|
|
}
|
|
|
|
if ((ret = __os_calloc(dbenv, 1, recsize + hdrsize, &tmp)) != 0)
|
2005-07-20 15:48:22 -07:00
|
|
|
goto err;
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
hdr = (HDR *)tmp;
|
|
|
|
persist = (LOGP *)(tmp + hdrsize);
|
2005-07-20 15:48:22 -07:00
|
|
|
/*
|
|
|
|
* Try to read the header. This can fail if the log is truncated, or
|
|
|
|
* if we find a preallocated log file where the header has not yet been
|
|
|
|
* written, so we need to check whether the header is zero-filled.
|
|
|
|
*/
|
|
|
|
if ((ret = __os_read(dbenv, fhp, tmp, recsize + hdrsize, &nr)) != 0 ||
|
|
|
|
nr != recsize + hdrsize ||
|
|
|
|
(hdr->len == 0 && persist->magic == 0 && persist->log_size == 0)) {
|
2001-03-04 19:42:05 -05:00
|
|
|
if (ret == 0)
|
|
|
|
status = DB_LV_INCOMPLETE;
|
|
|
|
else
|
|
|
|
/*
|
|
|
|
* The error was a fatal read error, not just an
|
|
|
|
* incompletely initialized log file.
|
|
|
|
*/
|
2002-10-30 15:57:05 +04:00
|
|
|
__db_err(dbenv, "Ignoring log file: %s: %s",
|
2001-03-04 19:42:05 -05:00
|
|
|
fname, db_strerror(ret));
|
|
|
|
goto err;
|
|
|
|
}
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Now we have to validate the persistent record. We have
|
|
|
|
* several scenarios we have to deal with:
|
|
|
|
*
|
|
|
|
* 1. User has crypto turned on:
|
|
|
|
* - They're reading an old, unencrypted log file
|
|
|
|
* . We will fail the record size match check below.
|
|
|
|
* - They're reading a current, unencrypted log file
|
|
|
|
* . We will fail the record size match check below.
|
|
|
|
* - They're reading an old, encrypted log file [NOT YET]
|
|
|
|
* . After decryption we'll fail the version check. [NOT YET]
|
|
|
|
* - They're reading a current, encrypted log file
|
|
|
|
* . We should proceed as usual.
|
|
|
|
* 2. User has crypto turned off:
|
|
|
|
* - They're reading an old, unencrypted log file
|
|
|
|
* . We will fail the version check.
|
|
|
|
* - They're reading a current, unencrypted log file
|
|
|
|
* . We should proceed as usual.
|
|
|
|
* - They're reading an old, encrypted log file [NOT YET]
|
|
|
|
* . We'll fail the magic number check (it is encrypted).
|
|
|
|
* - They're reading a current, encrypted log file
|
|
|
|
* . We'll fail the magic number check (it is encrypted).
|
|
|
|
*/
|
|
|
|
if (CRYPTO_ON(dbenv)) {
|
|
|
|
/*
|
|
|
|
* If we are trying to decrypt an unencrypted log
|
|
|
|
* we can only detect that by having an unreasonable
|
|
|
|
* data length for our persistent data.
|
|
|
|
*/
|
|
|
|
if ((hdr->len - hdrsize) != sizeof(LOGP)) {
|
|
|
|
__db_err(dbenv, "log record size mismatch");
|
|
|
|
goto err;
|
|
|
|
}
|
|
|
|
/* Check the checksum and decrypt. */
|
|
|
|
if ((ret = __db_check_chksum(dbenv, db_cipher, &hdr->chksum[0],
|
|
|
|
(u_int8_t *)persist, hdr->len - hdrsize, is_hmac)) != 0) {
|
|
|
|
__db_err(dbenv, "log record checksum mismatch");
|
|
|
|
goto err;
|
|
|
|
}
|
|
|
|
if ((ret = db_cipher->decrypt(dbenv, db_cipher->data,
|
|
|
|
&hdr->iv[0], (u_int8_t *)persist, hdr->len - hdrsize)) != 0)
|
|
|
|
goto err;
|
|
|
|
}
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/* Validate the header. */
|
2002-10-30 15:57:05 +04:00
|
|
|
if (persist->magic != DB_LOGMAGIC) {
|
|
|
|
__db_err(dbenv,
|
2001-03-04 19:42:05 -05:00
|
|
|
"Ignoring log file: %s: magic number %lx, not %lx",
|
2002-10-30 15:57:05 +04:00
|
|
|
fname, (u_long)persist->magic, (u_long)DB_LOGMAGIC);
|
2001-03-04 19:42:05 -05:00
|
|
|
ret = EINVAL;
|
|
|
|
goto err;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2005-07-20 15:48:22 -07:00
|
|
|
* Set our status code to indicate whether the log file belongs to an
|
|
|
|
* unreadable or readable old version; leave it alone if and only if
|
|
|
|
* the log file version is the current one.
|
2001-03-04 19:42:05 -05:00
|
|
|
*/
|
2002-10-30 15:57:05 +04:00
|
|
|
if (persist->version > DB_LOGVERSION) {
|
2001-03-04 19:42:05 -05:00
|
|
|
/* This is a fatal error--the log file is newer than DB. */
|
2002-10-30 15:57:05 +04:00
|
|
|
__db_err(dbenv,
|
2005-07-20 15:48:22 -07:00
|
|
|
"Unacceptable log file %s: unsupported log version %lu",
|
2002-10-30 15:57:05 +04:00
|
|
|
fname, (u_long)persist->version);
|
2001-03-04 19:42:05 -05:00
|
|
|
ret = EINVAL;
|
|
|
|
goto err;
|
2002-10-30 15:57:05 +04:00
|
|
|
} else if (persist->version < DB_LOGOLDVER) {
|
2001-03-04 19:42:05 -05:00
|
|
|
status = DB_LV_OLD_UNREADABLE;
|
2005-07-20 15:48:22 -07:00
|
|
|
/* This is a non-fatal error, but give some feedback. */
|
|
|
|
__db_err(dbenv,
|
|
|
|
"Skipping log file %s: historic log version %lu",
|
|
|
|
fname, (u_long)persist->version);
|
2001-03-04 19:42:05 -05:00
|
|
|
/*
|
2005-07-20 15:48:22 -07:00
|
|
|
* We don't want to set persistent info based on an unreadable
|
|
|
|
* region, so jump to "err".
|
2001-03-04 19:42:05 -05:00
|
|
|
*/
|
|
|
|
goto err;
|
2002-10-30 15:57:05 +04:00
|
|
|
} else if (persist->version < DB_LOGVERSION)
|
2001-03-04 19:42:05 -05:00
|
|
|
status = DB_LV_OLD_READABLE;
|
|
|
|
|
|
|
|
/*
|
2005-07-20 15:48:22 -07:00
|
|
|
* Only if we have a current log do we verify the checksum. We could
|
|
|
|
* not check the checksum before checking the magic and version because
|
|
|
|
* old log headers put the length and checksum in a different location.
|
2002-10-30 15:57:05 +04:00
|
|
|
*/
|
|
|
|
if (!CRYPTO_ON(dbenv) && ((ret = __db_check_chksum(dbenv,
|
|
|
|
db_cipher, &hdr->chksum[0], (u_int8_t *)persist,
|
|
|
|
hdr->len - hdrsize, is_hmac)) != 0)) {
|
|
|
|
__db_err(dbenv, "log record checksum mismatch");
|
|
|
|
goto err;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* If the log is readable so far and we're doing system initialization,
|
|
|
|
* set the region's persistent information based on the headers.
|
|
|
|
*
|
2005-07-20 15:48:22 -07:00
|
|
|
* Override the current log file size.
|
2001-03-04 19:42:05 -05:00
|
|
|
*/
|
|
|
|
if (set_persist) {
|
2005-07-20 15:48:22 -07:00
|
|
|
lp = dblp->reginfo.primary;
|
|
|
|
lp->log_size = persist->log_size;
|
2001-03-04 19:42:05 -05:00
|
|
|
}
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
err: if (fname != NULL)
|
|
|
|
__os_free(dbenv, fname);
|
|
|
|
if (ret == 0 && fhpp != NULL)
|
|
|
|
*fhpp = fhp;
|
|
|
|
else
|
|
|
|
/* Must close on error or if we only used it locally. */
|
|
|
|
(void)__os_closehandle(dbenv, fhp);
|
|
|
|
if (tmp != NULL)
|
2002-10-30 15:57:05 +04:00
|
|
|
__os_free(dbenv, tmp);
|
2005-07-20 15:48:22 -07:00
|
|
|
|
2001-03-04 19:42:05 -05:00
|
|
|
*statusp = status;
|
2005-07-20 15:48:22 -07:00
|
|
|
|
2001-03-04 19:42:05 -05:00
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2002-10-30 15:57:05 +04:00
|
|
|
* __log_dbenv_refresh --
|
2005-07-20 15:48:22 -07:00
|
|
|
* Clean up after the log system on a close or failed open.
|
2001-03-04 19:42:05 -05:00
|
|
|
*
|
2002-10-30 15:57:05 +04:00
|
|
|
* PUBLIC: int __log_dbenv_refresh __P((DB_ENV *));
|
2001-03-04 19:42:05 -05:00
|
|
|
*/
|
|
|
|
int
|
2002-10-30 15:57:05 +04:00
|
|
|
__log_dbenv_refresh(dbenv)
|
2001-03-04 19:42:05 -05:00
|
|
|
DB_ENV *dbenv;
|
|
|
|
{
|
|
|
|
DB_LOG *dblp;
|
2005-07-20 15:48:22 -07:00
|
|
|
LOG *lp;
|
|
|
|
REGINFO *reginfo;
|
2005-12-05 10:27:46 -08:00
|
|
|
struct __fname *fnp;
|
2001-03-04 19:42:05 -05:00
|
|
|
int ret, t_ret;
|
|
|
|
|
|
|
|
dblp = dbenv->lg_handle;
|
2005-07-20 15:48:22 -07:00
|
|
|
reginfo = &dblp->reginfo;
|
|
|
|
lp = reginfo->primary;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/* We may have opened files as part of XA; if so, close them. */
|
2002-10-30 15:57:05 +04:00
|
|
|
ret = __dbreg_close_files(dbenv);
|
2001-03-04 19:42:05 -05:00
|
|
|
|
2005-12-05 10:27:46 -08:00
|
|
|
/*
|
|
|
|
* After we close the files, check for any unlogged closes left in
|
|
|
|
* the shared memory queue. If we find any, we need to panic the
|
|
|
|
* region. Note, just set "ret" -- a panic overrides any previously
|
|
|
|
* set error return.
|
|
|
|
*/
|
|
|
|
for (fnp = SH_TAILQ_FIRST(&lp->fq, __fname); fnp != NULL;
|
|
|
|
fnp = SH_TAILQ_NEXT(fnp, q, __fname))
|
|
|
|
if (F_ISSET(fnp, DB_FNAME_NOTLOGGED))
|
|
|
|
ret = __db_panic(dbenv, EINVAL);
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
/*
|
|
|
|
* If a private region, return the memory to the heap. Not needed for
|
|
|
|
* filesystem-backed or system shared memory regions, that memory isn't
|
|
|
|
* owned by any particular process.
|
|
|
|
*/
|
|
|
|
if (F_ISSET(dbenv, DB_ENV_PRIVATE)) {
|
|
|
|
/* Discard the flush mutex. */
|
2005-12-05 10:27:46 -08:00
|
|
|
if ((t_ret =
|
|
|
|
__mutex_free(dbenv, &lp->mtx_flush)) != 0 && ret == 0)
|
|
|
|
ret = t_ret;
|
2005-07-20 15:48:22 -07:00
|
|
|
|
|
|
|
/* Discard the buffer. */
|
|
|
|
__db_shalloc_free(reginfo, R_ADDR(reginfo, lp->buffer_off));
|
|
|
|
|
|
|
|
/* Discard stack of free file IDs. */
|
|
|
|
if (lp->free_fid_stack != INVALID_ROFF)
|
|
|
|
__db_shalloc_free(reginfo,
|
|
|
|
R_ADDR(reginfo, lp->free_fid_stack));
|
|
|
|
}
|
|
|
|
|
2005-12-05 10:27:46 -08:00
|
|
|
/* Discard the per-thread DBREG mutex. */
|
|
|
|
if ((t_ret = __mutex_free(dbenv, &dblp->mtx_dbreg)) != 0 && ret == 0)
|
|
|
|
ret = t_ret;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/* Detach from the region. */
|
2005-07-20 15:48:22 -07:00
|
|
|
if ((t_ret = __db_r_detach(dbenv, reginfo, 0)) != 0 && ret == 0)
|
2002-10-30 15:57:05 +04:00
|
|
|
ret = t_ret;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
/* Close open files, release allocated memory. */
|
2005-07-20 15:48:22 -07:00
|
|
|
if (dblp->lfhp != NULL) {
|
|
|
|
if ((t_ret =
|
|
|
|
__os_closehandle(dbenv, dblp->lfhp)) != 0 && ret == 0)
|
|
|
|
ret = t_ret;
|
|
|
|
dblp->lfhp = NULL;
|
|
|
|
}
|
2001-03-04 19:42:05 -05:00
|
|
|
if (dblp->dbentry != NULL)
|
2002-10-30 15:57:05 +04:00
|
|
|
__os_free(dbenv, dblp->dbentry);
|
2001-03-04 19:42:05 -05:00
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
__os_free(dbenv, dblp);
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
dbenv->lg_handle = NULL;
|
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2002-10-30 15:57:05 +04:00
|
|
|
* __log_get_cached_ckp_lsn --
|
|
|
|
* Retrieve any last checkpoint LSN that we may have found on startup.
|
|
|
|
*
|
2005-12-05 10:27:46 -08:00
|
|
|
* PUBLIC: int __log_get_cached_ckp_lsn __P((DB_ENV *, DB_LSN *));
|
2002-10-30 15:57:05 +04:00
|
|
|
*/
|
2005-12-05 10:27:46 -08:00
|
|
|
int
|
2002-10-30 15:57:05 +04:00
|
|
|
__log_get_cached_ckp_lsn(dbenv, ckp_lsnp)
|
|
|
|
DB_ENV *dbenv;
|
|
|
|
DB_LSN *ckp_lsnp;
|
|
|
|
{
|
|
|
|
DB_LOG *dblp;
|
|
|
|
LOG *lp;
|
|
|
|
|
|
|
|
dblp = (DB_LOG *)dbenv->lg_handle;
|
|
|
|
lp = (LOG *)dblp->reginfo.primary;
|
|
|
|
|
2005-12-05 10:27:46 -08:00
|
|
|
LOG_SYSTEM_LOCK(dbenv);
|
2002-10-30 15:57:05 +04:00
|
|
|
*ckp_lsnp = lp->cached_ckp_lsn;
|
2005-12-05 10:27:46 -08:00
|
|
|
LOG_SYSTEM_UNLOCK(dbenv);
|
|
|
|
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_region_mutex_count --
|
|
|
|
* Return the number of mutexes the log region will need.
|
|
|
|
*
|
|
|
|
* PUBLIC: u_int32_t __log_region_mutex_count __P((DB_ENV *));
|
|
|
|
*/
|
|
|
|
u_int32_t
|
|
|
|
__log_region_mutex_count(dbenv)
|
|
|
|
DB_ENV *dbenv;
|
|
|
|
{
|
|
|
|
/*
|
|
|
|
* We need a few assorted mutexes, and one per transaction waiting
|
|
|
|
* on the group commit list. We can't know how many that will be,
|
|
|
|
* but it should be bounded by the maximum active transactions.
|
|
|
|
*/
|
|
|
|
return (dbenv->tx_max + 5);
|
2002-10-30 15:57:05 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_region_size --
|
|
|
|
* Return the amount of space needed for the log region.
|
|
|
|
* Make the region large enough to hold txn_max transaction
|
|
|
|
* detail structures plus some space to hold thread handles
|
|
|
|
* and the beginning of the shalloc region and anything we
|
|
|
|
* need for mutex system resource recording.
|
|
|
|
*/
|
|
|
|
static size_t
|
|
|
|
__log_region_size(dbenv)
|
|
|
|
DB_ENV *dbenv;
|
|
|
|
{
|
|
|
|
size_t s;
|
|
|
|
|
|
|
|
s = dbenv->lg_regionmax + dbenv->lg_bsize;
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
/*
|
2005-12-05 10:27:46 -08:00
|
|
|
* If running with replication, add in space for bulk buffer.
|
|
|
|
* Allocate a megabyte and a little bit more space.
|
2005-07-20 15:48:22 -07:00
|
|
|
*/
|
2005-12-05 10:27:46 -08:00
|
|
|
if (IS_ENV_REPLICATED(dbenv))
|
|
|
|
s += MEGABYTE;
|
2005-07-20 15:48:22 -07:00
|
|
|
|
2005-12-05 10:27:46 -08:00
|
|
|
return (s);
|
2002-10-30 15:57:05 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_vtruncate
|
|
|
|
* This is a virtual truncate. We set up the log indicators to
|
|
|
|
* make everyone believe that the given record is the last one in the
|
|
|
|
* log. Returns with the next valid LSN (i.e., the LSN of the next
|
|
|
|
* record to be written). This is used in replication to discard records
|
|
|
|
* in the log file that do not agree with the master.
|
|
|
|
*
|
2005-07-20 15:48:22 -07:00
|
|
|
* PUBLIC: int __log_vtruncate __P((DB_ENV *, DB_LSN *, DB_LSN *, DB_LSN *));
|
2002-10-30 15:57:05 +04:00
|
|
|
*/
|
|
|
|
int
|
2005-07-20 15:48:22 -07:00
|
|
|
__log_vtruncate(dbenv, lsn, ckplsn, trunclsn)
|
2002-10-30 15:57:05 +04:00
|
|
|
DB_ENV *dbenv;
|
2005-07-20 15:48:22 -07:00
|
|
|
DB_LSN *lsn, *ckplsn, *trunclsn;
|
2002-10-30 15:57:05 +04:00
|
|
|
{
|
|
|
|
DBT log_dbt;
|
|
|
|
DB_LOG *dblp;
|
|
|
|
DB_LOGC *logc;
|
|
|
|
DB_LSN end_lsn;
|
|
|
|
LOG *lp;
|
|
|
|
u_int32_t bytes, c_len;
|
2005-07-20 15:48:22 -07:00
|
|
|
int ret, t_ret;
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
/* Need to find out the length of this soon-to-be-last record. */
|
2005-07-20 15:48:22 -07:00
|
|
|
if ((ret = __log_cursor(dbenv, &logc)) != 0)
|
2002-10-30 15:57:05 +04:00
|
|
|
return (ret);
|
|
|
|
memset(&log_dbt, 0, sizeof(log_dbt));
|
2005-07-20 15:48:22 -07:00
|
|
|
ret = __log_c_get(logc, lsn, &log_dbt, DB_SET);
|
2002-10-30 15:57:05 +04:00
|
|
|
c_len = logc->c_len;
|
2005-07-20 15:48:22 -07:00
|
|
|
if ((t_ret = __log_c_close(logc)) != 0 && ret == 0)
|
2002-10-30 15:57:05 +04:00
|
|
|
ret = t_ret;
|
|
|
|
if (ret != 0)
|
|
|
|
return (ret);
|
|
|
|
|
|
|
|
/* Now do the truncate. */
|
|
|
|
dblp = (DB_LOG *)dbenv->lg_handle;
|
|
|
|
lp = (LOG *)dblp->reginfo.primary;
|
|
|
|
|
2005-12-05 10:27:46 -08:00
|
|
|
LOG_SYSTEM_LOCK(dbenv);
|
2005-07-20 15:48:22 -07:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Flush the log so we can simply initialize the in-memory buffer
|
|
|
|
* after the truncate.
|
|
|
|
*/
|
|
|
|
if ((ret = __log_flush_int(dblp, NULL, 0)) != 0)
|
|
|
|
goto err;
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
end_lsn = lp->lsn;
|
|
|
|
lp->lsn = *lsn;
|
|
|
|
lp->len = c_len;
|
|
|
|
lp->lsn.offset += lp->len;
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
if (lp->db_log_inmemory &&
|
|
|
|
(ret = __log_inmem_lsnoff(dblp, &lp->lsn, &lp->b_off)) != 0)
|
|
|
|
goto err;
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
/*
|
|
|
|
* I am going to assume that the number of bytes written since
|
|
|
|
* the last checkpoint doesn't exceed a 32-bit number.
|
|
|
|
*/
|
|
|
|
DB_ASSERT(lp->lsn.file >= ckplsn->file);
|
|
|
|
bytes = 0;
|
|
|
|
if (ckplsn->file != lp->lsn.file) {
|
|
|
|
bytes = lp->log_size - ckplsn->offset;
|
|
|
|
if (lp->lsn.file > ckplsn->file + 1)
|
|
|
|
bytes += lp->log_size *
|
2005-07-20 15:48:22 -07:00
|
|
|
((lp->lsn.file - ckplsn->file) - 1);
|
2002-10-30 15:57:05 +04:00
|
|
|
bytes += lp->lsn.offset;
|
|
|
|
} else
|
|
|
|
bytes = lp->lsn.offset - ckplsn->offset;
|
|
|
|
|
|
|
|
lp->stat.st_wc_mbytes += bytes / MEGABYTE;
|
|
|
|
lp->stat.st_wc_bytes += bytes % MEGABYTE;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* If the saved lsn is greater than our new end of log, reset it
|
|
|
|
* to our current end of log.
|
|
|
|
*/
|
2005-12-05 10:27:46 -08:00
|
|
|
MUTEX_LOCK(dbenv, lp->mtx_flush);
|
2002-10-30 15:57:05 +04:00
|
|
|
if (log_compare(&lp->s_lsn, lsn) > 0)
|
|
|
|
lp->s_lsn = lp->lsn;
|
2005-12-05 10:27:46 -08:00
|
|
|
MUTEX_UNLOCK(dbenv, lp->mtx_flush);
|
2002-10-30 15:57:05 +04:00
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
/* Initialize the in-region buffer to a pristine state. */
|
|
|
|
ZERO_LSN(lp->f_lsn);
|
|
|
|
lp->w_off = lp->lsn.offset;
|
2002-10-30 15:57:05 +04:00
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
if (trunclsn != NULL)
|
|
|
|
*trunclsn = lp->lsn;
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
/* Truncate the log to the new point. */
|
|
|
|
if ((ret = __log_zero(dbenv, &lp->lsn, &end_lsn)) != 0)
|
|
|
|
goto err;
|
|
|
|
|
2005-12-05 10:27:46 -08:00
|
|
|
err: LOG_SYSTEM_UNLOCK(dbenv);
|
2002-10-30 15:57:05 +04:00
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_is_outdated --
|
2005-12-05 10:27:46 -08:00
|
|
|
* Used by the replication system to identify if a client's logs are too
|
|
|
|
* old.
|
2001-03-04 19:42:05 -05:00
|
|
|
*
|
2005-07-20 15:48:22 -07:00
|
|
|
* PUBLIC: int __log_is_outdated __P((DB_ENV *, u_int32_t, int *));
|
2001-03-04 19:42:05 -05:00
|
|
|
*/
|
|
|
|
int
|
2002-10-30 15:57:05 +04:00
|
|
|
__log_is_outdated(dbenv, fnum, outdatedp)
|
2001-03-04 19:42:05 -05:00
|
|
|
DB_ENV *dbenv;
|
2002-10-30 15:57:05 +04:00
|
|
|
u_int32_t fnum;
|
|
|
|
int *outdatedp;
|
2001-03-04 19:42:05 -05:00
|
|
|
{
|
2002-10-30 15:57:05 +04:00
|
|
|
DB_LOG *dblp;
|
2001-03-04 19:42:05 -05:00
|
|
|
LOG *lp;
|
2002-10-30 15:57:05 +04:00
|
|
|
char *name;
|
|
|
|
int ret;
|
|
|
|
u_int32_t cfile;
|
2005-07-20 15:48:22 -07:00
|
|
|
struct __db_filestart *filestart;
|
2001-03-04 19:42:05 -05:00
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
dblp = dbenv->lg_handle;
|
|
|
|
|
2005-12-05 10:27:46 -08:00
|
|
|
/*
|
|
|
|
* The log represented by dbenv is compared to the file number passed
|
|
|
|
* in fnum. If the log file fnum does not exist and is lower-numbered
|
|
|
|
* than the current logs, return *outdatedp non-zero, else we return 0.
|
|
|
|
*/
|
2005-07-20 15:48:22 -07:00
|
|
|
if (F_ISSET(dbenv, DB_ENV_LOG_INMEMORY)) {
|
2005-12-05 10:27:46 -08:00
|
|
|
LOG_SYSTEM_LOCK(dbenv);
|
2005-07-20 15:48:22 -07:00
|
|
|
lp = (LOG *)dblp->reginfo.primary;
|
|
|
|
filestart = SH_TAILQ_FIRST(&lp->logfiles, __db_filestart);
|
2005-12-05 10:27:46 -08:00
|
|
|
*outdatedp = filestart == NULL ? 0 : (fnum < filestart->file);
|
|
|
|
LOG_SYSTEM_UNLOCK(dbenv);
|
2005-07-20 15:48:22 -07:00
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
*outdatedp = 0;
|
2002-10-30 15:57:05 +04:00
|
|
|
if ((ret = __log_name(dblp, fnum, &name, NULL, 0)) != 0)
|
|
|
|
return (ret);
|
|
|
|
|
|
|
|
/* If the file exists, we're just fine. */
|
|
|
|
if (__os_exists(name, NULL) == 0)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* It didn't exist, decide if the file number is too big or
|
|
|
|
* too little. If it's too little, then we need to indicate
|
|
|
|
* that the LSN is outdated.
|
|
|
|
*/
|
2005-12-05 10:27:46 -08:00
|
|
|
LOG_SYSTEM_LOCK(dbenv);
|
2002-10-30 15:57:05 +04:00
|
|
|
lp = (LOG *)dblp->reginfo.primary;
|
|
|
|
cfile = lp->lsn.file;
|
2005-12-05 10:27:46 -08:00
|
|
|
LOG_SYSTEM_UNLOCK(dbenv);
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
if (cfile > fnum)
|
|
|
|
*outdatedp = 1;
|
|
|
|
out: __os_free(dbenv, name);
|
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_zero --
|
|
|
|
* Zero out the tail of a log after a truncate.
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
__log_zero(dbenv, from_lsn, to_lsn)
|
|
|
|
DB_ENV *dbenv;
|
|
|
|
DB_LSN *from_lsn, *to_lsn;
|
|
|
|
{
|
2005-07-20 15:48:22 -07:00
|
|
|
DB_FH *fhp;
|
2002-10-30 15:57:05 +04:00
|
|
|
DB_LOG *dblp;
|
|
|
|
LOG *lp;
|
2005-07-20 15:48:22 -07:00
|
|
|
struct __db_filestart *filestart, *nextstart;
|
2002-10-30 15:57:05 +04:00
|
|
|
size_t nbytes, len, nw;
|
2005-07-20 15:48:22 -07:00
|
|
|
u_int32_t fn, mbytes, bytes;
|
2002-10-30 15:57:05 +04:00
|
|
|
u_int8_t buf[4096];
|
2005-07-20 15:48:22 -07:00
|
|
|
int ret;
|
|
|
|
char *fname;
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
dblp = dbenv->lg_handle;
|
2005-07-20 15:48:22 -07:00
|
|
|
DB_ASSERT(log_compare(from_lsn, to_lsn) <= 0);
|
|
|
|
if (log_compare(from_lsn, to_lsn) > 0) {
|
|
|
|
__db_err(dbenv,
|
|
|
|
"Warning: truncating to point beyond end of log");
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
2002-10-30 15:57:05 +04:00
|
|
|
lp = (LOG *)dblp->reginfo.primary;
|
2005-07-20 15:48:22 -07:00
|
|
|
if (lp->db_log_inmemory) {
|
|
|
|
/*
|
|
|
|
* Remove the first file if it is invalidated by this write.
|
|
|
|
* Log records can't be bigger than a file, so we only need to
|
|
|
|
* check the first file.
|
|
|
|
*/
|
|
|
|
for (filestart = SH_TAILQ_FIRST(&lp->logfiles, __db_filestart);
|
|
|
|
filestart != NULL && from_lsn->file < filestart->file;
|
|
|
|
filestart = nextstart) {
|
|
|
|
nextstart = SH_TAILQ_NEXT(filestart,
|
|
|
|
links, __db_filestart);
|
|
|
|
SH_TAILQ_REMOVE(&lp->logfiles, filestart,
|
|
|
|
links, __db_filestart);
|
|
|
|
SH_TAILQ_INSERT_HEAD(&lp->free_logfiles, filestart,
|
|
|
|
links, __db_filestart);
|
|
|
|
}
|
|
|
|
|
|
|
|
return (0);
|
|
|
|
}
|
2002-10-30 15:57:05 +04:00
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
/* Close any open file handles so unlinks don't fail. */
|
|
|
|
if (dblp->lfhp != NULL) {
|
|
|
|
(void)__os_closehandle(dbenv, dblp->lfhp);
|
|
|
|
dblp->lfhp = NULL;
|
2002-10-30 15:57:05 +04:00
|
|
|
}
|
|
|
|
|
2005-07-20 15:48:22 -07:00
|
|
|
/* Throw away any extra log files that we have around. */
|
|
|
|
for (fn = from_lsn->file + 1;; fn++) {
|
|
|
|
if (__log_name(dblp, fn, &fname, &fhp, DB_OSO_RDONLY) != 0) {
|
|
|
|
__os_free(dbenv, fname);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
(void)__os_closehandle(dbenv, fhp);
|
|
|
|
ret = __os_unlink(dbenv, fname);
|
|
|
|
__os_free(dbenv, fname);
|
|
|
|
if (ret != 0)
|
2002-10-30 15:57:05 +04:00
|
|
|
return (ret);
|
2005-07-20 15:48:22 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
/* We removed some log files; have to 0 to end of file. */
|
|
|
|
if ((ret =
|
|
|
|
__log_name(dblp, from_lsn->file, &fname, &dblp->lfhp, 0)) != 0)
|
|
|
|
return (ret);
|
|
|
|
__os_free(dbenv, fname);
|
|
|
|
if ((ret = __os_ioinfo(dbenv,
|
|
|
|
NULL, dblp->lfhp, &mbytes, &bytes, NULL)) != 0)
|
|
|
|
goto err;
|
|
|
|
DB_ASSERT((mbytes * MEGABYTE + bytes) >= from_lsn->offset);
|
|
|
|
len = (mbytes * MEGABYTE + bytes) - from_lsn->offset;
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
memset(buf, 0, sizeof(buf));
|
|
|
|
|
|
|
|
/* Initialize the write position. */
|
|
|
|
if ((ret = __os_seek(dbenv,
|
2005-07-20 15:48:22 -07:00
|
|
|
dblp->lfhp, 0, 0, from_lsn->offset, 0, DB_OS_SEEK_SET)) != 0)
|
|
|
|
goto err;
|
2002-10-30 15:57:05 +04:00
|
|
|
|
|
|
|
while (len > 0) {
|
|
|
|
nbytes = len > sizeof(buf) ? sizeof(buf) : len;
|
|
|
|
if ((ret =
|
2005-07-20 15:48:22 -07:00
|
|
|
__os_write(dbenv, dblp->lfhp, buf, nbytes, &nw)) != 0)
|
|
|
|
goto err;
|
2002-10-30 15:57:05 +04:00
|
|
|
len -= nbytes;
|
|
|
|
}
|
2005-07-20 15:48:22 -07:00
|
|
|
|
|
|
|
err: (void)__os_closehandle(dbenv, dblp->lfhp);
|
|
|
|
dblp->lfhp = NULL;
|
|
|
|
|
|
|
|
return (ret);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_inmem_lsnoff --
|
|
|
|
* Find the offset in the buffer of a given LSN.
|
|
|
|
*
|
|
|
|
* PUBLIC: int __log_inmem_lsnoff __P((DB_LOG *, DB_LSN *, size_t *));
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
__log_inmem_lsnoff(dblp, lsn, offsetp)
|
|
|
|
DB_LOG *dblp;
|
|
|
|
DB_LSN *lsn;
|
|
|
|
size_t *offsetp;
|
|
|
|
{
|
|
|
|
LOG *lp;
|
|
|
|
struct __db_filestart *filestart;
|
|
|
|
|
|
|
|
lp = (LOG *)dblp->reginfo.primary;
|
|
|
|
|
|
|
|
SH_TAILQ_FOREACH(filestart, &lp->logfiles, links, __db_filestart)
|
|
|
|
if (filestart->file == lsn->file) {
|
|
|
|
*offsetp =
|
|
|
|
(filestart->b_off + lsn->offset) % lp->buffer_size;
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
return (DB_NOTFOUND);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_inmem_newfile --
|
|
|
|
* Records the offset of the beginning of a new file in the in-memory
|
|
|
|
* buffer.
|
|
|
|
*
|
|
|
|
* PUBLIC: int __log_inmem_newfile __P((DB_LOG *, u_int32_t));
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
__log_inmem_newfile(dblp, file)
|
|
|
|
DB_LOG *dblp;
|
|
|
|
u_int32_t file;
|
|
|
|
{
|
|
|
|
HDR hdr;
|
|
|
|
LOG *lp;
|
|
|
|
struct __db_filestart *filestart;
|
|
|
|
int ret;
|
|
|
|
#ifdef DIAGNOSTIC
|
|
|
|
struct __db_filestart *first, *last;
|
|
|
|
#endif
|
|
|
|
|
|
|
|
lp = (LOG *)dblp->reginfo.primary;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* We write an empty header at the end of every in-memory log file.
|
|
|
|
* This is used during cursor traversal to indicate when to switch the
|
|
|
|
* LSN to the next file.
|
|
|
|
*/
|
|
|
|
if (file > 1) {
|
|
|
|
memset(&hdr, 0, sizeof(HDR));
|
|
|
|
__log_inmem_copyin(dblp, lp->b_off, &hdr, sizeof(HDR));
|
|
|
|
lp->b_off = (lp->b_off + sizeof(HDR)) % lp->buffer_size;
|
|
|
|
}
|
|
|
|
|
|
|
|
filestart = SH_TAILQ_FIRST(&lp->free_logfiles, __db_filestart);
|
|
|
|
if (filestart == NULL) {
|
|
|
|
if ((ret = __db_shalloc(&dblp->reginfo,
|
|
|
|
sizeof(struct __db_filestart), 0, &filestart)) != 0)
|
|
|
|
return (ret);
|
|
|
|
memset(filestart, 0, sizeof(*filestart));
|
|
|
|
} else
|
|
|
|
SH_TAILQ_REMOVE(&lp->free_logfiles, filestart,
|
|
|
|
links, __db_filestart);
|
|
|
|
|
|
|
|
filestart->file = file;
|
|
|
|
filestart->b_off = lp->b_off;
|
|
|
|
|
|
|
|
#ifdef DIAGNOSTIC
|
|
|
|
first = SH_TAILQ_FIRST(&lp->logfiles, __db_filestart);
|
|
|
|
last = SH_TAILQ_LAST(&(lp)->logfiles, links, __db_filestart);
|
|
|
|
|
|
|
|
/* Check that we don't wrap. */
|
|
|
|
DB_ASSERT(!first || first == last ||
|
|
|
|
RINGBUF_LEN(lp, first->b_off, lp->b_off) ==
|
|
|
|
RINGBUF_LEN(lp, first->b_off, last->b_off) +
|
|
|
|
RINGBUF_LEN(lp, last->b_off, lp->b_off));
|
|
|
|
#endif
|
|
|
|
|
|
|
|
SH_TAILQ_INSERT_TAIL(&lp->logfiles, filestart, links);
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_inmem_chkspace --
|
|
|
|
* Ensure that the requested amount of space is available in the buffer,
|
|
|
|
* and invalidate the region.
|
|
|
|
* Note: assumes that the region lock is held on entry.
|
|
|
|
*
|
|
|
|
* PUBLIC: int __log_inmem_chkspace __P((DB_LOG *, size_t));
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
__log_inmem_chkspace(dblp, len)
|
|
|
|
DB_LOG *dblp;
|
|
|
|
size_t len;
|
|
|
|
{
|
2005-12-05 10:27:46 -08:00
|
|
|
DB_ENV *dbenv;
|
2005-07-20 15:48:22 -07:00
|
|
|
LOG *lp;
|
|
|
|
DB_LSN active_lsn, old_active_lsn;
|
|
|
|
struct __db_filestart *filestart;
|
2005-12-05 10:27:46 -08:00
|
|
|
int ret;
|
2005-07-20 15:48:22 -07:00
|
|
|
|
2005-12-05 10:27:46 -08:00
|
|
|
dbenv = dblp->dbenv;
|
2005-07-20 15:48:22 -07:00
|
|
|
lp = dblp->reginfo.primary;
|
|
|
|
|
|
|
|
DB_ASSERT(lp->db_log_inmemory);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Allow room for an extra header so that we don't need to check for
|
|
|
|
* space when switching files.
|
|
|
|
*/
|
|
|
|
len += sizeof(HDR);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* If transactions are enabled and we're about to fill available space,
|
|
|
|
* update the active LSN and recheck. If transactions aren't enabled,
|
|
|
|
* don't even bother checking: in that case we can always overwrite old
|
|
|
|
* log records, because we're never going to abort.
|
|
|
|
*/
|
2005-12-05 10:27:46 -08:00
|
|
|
while (TXN_ON(dbenv) &&
|
2005-07-20 15:48:22 -07:00
|
|
|
RINGBUF_LEN(lp, lp->b_off, lp->a_off) <= len) {
|
|
|
|
old_active_lsn = lp->active_lsn;
|
|
|
|
active_lsn = lp->lsn;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Drop the log region lock so we don't hold it while
|
|
|
|
* taking the transaction region lock.
|
|
|
|
*/
|
2005-12-05 10:27:46 -08:00
|
|
|
LOG_SYSTEM_UNLOCK(dbenv);
|
|
|
|
if ((ret = __txn_getactive(dbenv, &active_lsn)) != 0)
|
|
|
|
return (ret);
|
|
|
|
LOG_SYSTEM_LOCK(dbenv);
|
2005-07-20 15:48:22 -07:00
|
|
|
active_lsn.offset = 0;
|
|
|
|
|
|
|
|
/* If we didn't make any progress, give up. */
|
|
|
|
if (log_compare(&active_lsn, &old_active_lsn) == 0) {
|
2005-12-05 10:27:46 -08:00
|
|
|
__db_err(dbenv,
|
2005-07-20 15:48:22 -07:00
|
|
|
"In-memory log buffer is full (an active transaction spans the buffer)");
|
|
|
|
return (DB_LOG_BUFFER_FULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Make sure we're moving the region LSN forwards. */
|
|
|
|
if (log_compare(&active_lsn, &lp->active_lsn) > 0) {
|
|
|
|
lp->active_lsn = active_lsn;
|
|
|
|
(void)__log_inmem_lsnoff(dblp, &active_lsn,
|
|
|
|
&lp->a_off);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Remove the first file if it is invalidated by this write.
|
|
|
|
* Log records can't be bigger than a file, so we only need to
|
|
|
|
* check the first file.
|
|
|
|
*/
|
|
|
|
filestart = SH_TAILQ_FIRST(&lp->logfiles, __db_filestart);
|
|
|
|
if (filestart != NULL &&
|
|
|
|
RINGBUF_LEN(lp, lp->b_off, filestart->b_off) <= len) {
|
|
|
|
SH_TAILQ_REMOVE(&lp->logfiles, filestart,
|
|
|
|
links, __db_filestart);
|
|
|
|
SH_TAILQ_INSERT_HEAD(&lp->free_logfiles, filestart,
|
|
|
|
links, __db_filestart);
|
|
|
|
lp->f_lsn.file = filestart->file + 1;
|
|
|
|
}
|
2001-03-04 19:42:05 -05:00
|
|
|
|
|
|
|
return (0);
|
|
|
|
}
|
2005-07-20 15:48:22 -07:00
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_inmem_copyout --
|
|
|
|
* Copies the given number of bytes from the buffer -- no checking.
|
|
|
|
* Note: assumes that the region lock is held on entry.
|
|
|
|
*
|
|
|
|
* PUBLIC: void __log_inmem_copyout __P((DB_LOG *, size_t, void *, size_t));
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
__log_inmem_copyout(dblp, offset, buf, size)
|
|
|
|
DB_LOG *dblp;
|
|
|
|
size_t offset;
|
|
|
|
void *buf;
|
|
|
|
size_t size;
|
|
|
|
{
|
|
|
|
LOG *lp;
|
|
|
|
size_t nbytes;
|
|
|
|
|
|
|
|
lp = (LOG *)dblp->reginfo.primary;
|
|
|
|
nbytes = (offset + size < lp->buffer_size) ?
|
|
|
|
size : lp->buffer_size - offset;
|
|
|
|
memcpy(buf, dblp->bufp + offset, nbytes);
|
|
|
|
if (nbytes < size)
|
|
|
|
memcpy((u_int8_t *)buf + nbytes, dblp->bufp, size - nbytes);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* __log_inmem_copyin --
|
|
|
|
* Copies the given number of bytes into the buffer -- no checking.
|
|
|
|
* Note: assumes that the region lock is held on entry.
|
|
|
|
*
|
|
|
|
* PUBLIC: void __log_inmem_copyin __P((DB_LOG *, size_t, void *, size_t));
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
__log_inmem_copyin(dblp, offset, buf, size)
|
|
|
|
DB_LOG *dblp;
|
|
|
|
size_t offset;
|
|
|
|
void *buf;
|
|
|
|
size_t size;
|
|
|
|
{
|
|
|
|
LOG *lp;
|
|
|
|
size_t nbytes;
|
|
|
|
|
|
|
|
lp = (LOG *)dblp->reginfo.primary;
|
|
|
|
nbytes = (offset + size < lp->buffer_size) ?
|
|
|
|
size : lp->buffer_size - offset;
|
|
|
|
memcpy(dblp->bufp + offset, buf, nbytes);
|
|
|
|
if (nbytes < size)
|
|
|
|
memcpy(dblp->bufp, (u_int8_t *)buf + nbytes, size - nbytes);
|
|
|
|
}
|