mirror of
https://github.com/MariaDB/server.git
synced 2025-01-22 06:44:16 +01:00
Segrate rollback and recover functions. Write a brt-level test for the cursor static variable problem. Addresses #536, #538.
git-svn-id: file:///svn/tokudb@2829 c7de825b-a66e-492c-adef-691d508d4ae1
This commit is contained in:
parent
86bd15c721
commit
4d369d8572
8 changed files with 588 additions and 529 deletions
|
@ -57,6 +57,7 @@ REGRESSION_TESTS = \
|
|||
brt-test3 \
|
||||
brt-test4 \
|
||||
brt-test-cursor \
|
||||
brt-test-cursor-2 \
|
||||
log-test \
|
||||
log-test2 \
|
||||
log-test3 \
|
||||
|
@ -108,6 +109,7 @@ CHECKS = \
|
|||
test-brt-delete-both \
|
||||
brt-test \
|
||||
brt-test-cursor \
|
||||
brt-test-cursor-2 \
|
||||
brt-test3 \
|
||||
brt-test4 \
|
||||
fifo-test \
|
||||
|
@ -141,7 +143,7 @@ check-fanout:
|
|||
let BRT_FANOUT=BRT_FANOUT+1; \
|
||||
done
|
||||
|
||||
log-test log-test2 log-test3 log-test4 log-test5 log-test6 pma-test benchmark-test brt-test brt-test3 brt-test4 brt-test-cursor test-brt-delete-both brt-serialize-test brtdump test-inc-split test-del-inorder: LDFLAGS+=-lz
|
||||
log-test log-test2 log-test3 log-test4 log-test5 log-test6 pma-test benchmark-test brt-test brt-test3 brt-test4 brt-test-cursor brt-test-cursor-2 test-brt-delete-both brt-serialize-test brtdump test-inc-split test-del-inorder: LDFLAGS+=-lz
|
||||
# pma: PROF_FLAGS=-fprofile-arcs -ftest-coverage
|
||||
|
||||
BRT_INTERNAL_H_INCLUDES = brt-internal.h cachetable.h fifo.h pma.h brt.h brttypes.h yerror.h ybt.h log.h ../include/db.h kv-pair.h memory.h crc.h
|
||||
|
@ -157,10 +159,10 @@ ybt.o: ybt.h brttypes.h ../include/db.h
|
|||
ybt-test: ybt-test.o ybt.o memory.o toku_assert.o
|
||||
ybt-test.o: ybt.h ../include/db.h
|
||||
cachetable.o: cachetable.h hashfun.h memory.h
|
||||
brt-test3 brt-test4 brt-test-cursor brt-test: ybt.o brt.o fifo.o pma.o memory.o brt-serialize.o cachetable.o ybt.o key.o primes.o toku_assert.o log.o mempool.o brt-verify.o fingerprint.o log_code.o roll.o
|
||||
brt-test3 brt-test4 brt-test-cursor brt-test-cursor-2 brt-test: ybt.o brt.o fifo.o pma.o memory.o brt-serialize.o cachetable.o ybt.o key.o primes.o toku_assert.o log.o mempool.o brt-verify.o fingerprint.o log_code.o roll.o
|
||||
log.o: log_header.h log-internal.h log.h wbuf.h crc.h brttypes.h $(BRT_INTERNAL_H_INCLUDES)
|
||||
logformat: logformat.o toku_assert.o
|
||||
brt-test3.o brt-test4.o brt-test-cursor.o brt-test.o brt.o: brt.h ../include/db.h fifo.h pma.h brttypes.h cachetable.h memory.h
|
||||
brt-test3.o brt-test4.o brt-test-cursor.o brt-test-cursor-2.o brt-test.o brt.o: brt.h ../include/db.h fifo.h pma.h brttypes.h cachetable.h memory.h
|
||||
brt-serialize-test.o: $(BRT_INTERNAL_H_INCLUDES)
|
||||
brt.o: $(BRT_INTERNAL_H_INCLUDES) key.h log_header.h
|
||||
fifo.o: fifo.h brttypes.h
|
||||
|
|
111
newbrt/brt-test-cursor-2.c
Normal file
111
newbrt/brt-test-cursor-2.c
Normal file
|
@ -0,0 +1,111 @@
|
|||
/* -*- mode: C; c-basic-offset: 4 -*- */
|
||||
#ident "Copyright (c) 2007, 2008 Tokutek Inc. All rights reserved."
|
||||
|
||||
#include "brt.h"
|
||||
#include "key.h"
|
||||
#include "pma.h"
|
||||
#include "brt-internal.h"
|
||||
#include "memory.h"
|
||||
#include "toku_assert.h"
|
||||
|
||||
#include <fcntl.h>
|
||||
#include <stdio.h>
|
||||
#include <string.h>
|
||||
#include <sys/time.h>
|
||||
#include <stdlib.h>
|
||||
#include <unistd.h>
|
||||
#include <arpa/inet.h>
|
||||
|
||||
#include "test.h"
|
||||
|
||||
static const char fname[]= __FILE__ ".brt";
|
||||
|
||||
static TOKUTXN const null_txn = 0;
|
||||
static DB * const null_db = 0;
|
||||
|
||||
// Verify that different cursors return different data items when a DBT is initialized to all zeros (no flags)
|
||||
static void test_multiple_brt_cursor_dbts(int n, DB *db) {
|
||||
if (verbose) printf("test_multiple_brt_cursors:%d %p\n", n, db);
|
||||
|
||||
int r;
|
||||
CACHETABLE ct;
|
||||
BRT brt;
|
||||
BRT_CURSOR cursors[n];
|
||||
|
||||
unlink(fname);
|
||||
|
||||
r = toku_brt_create_cachetable(&ct, 0, ZERO_LSN, NULL_LOGGER);
|
||||
assert(r==0);
|
||||
|
||||
r = toku_open_brt(fname, 0, 1, &brt, 1<<12, ct, null_txn, toku_default_compare_fun, db);
|
||||
assert(r==0);
|
||||
|
||||
int i;
|
||||
for (i=0; i<n; i++) {
|
||||
DBT kbt,vbt;
|
||||
char key[10],val[10];
|
||||
snprintf(key, sizeof key, "k%04d", i);
|
||||
snprintf(key, sizeof val, "k%04d", i);
|
||||
r = toku_brt_insert(brt,
|
||||
toku_fill_dbt(&kbt, key, strlen(key)),
|
||||
toku_fill_dbt(&vbt, val, strlen(val)),
|
||||
0);
|
||||
assert(r == 0);
|
||||
}
|
||||
|
||||
for (i=0; i<n; i++) {
|
||||
r = toku_brt_cursor(brt, &cursors[i]);
|
||||
assert(r == 0);
|
||||
}
|
||||
|
||||
void *ptrs[n];
|
||||
for (i=0; i<n; i++) {
|
||||
DBT kbt, vbt;
|
||||
char key[10];
|
||||
snprintf(key, sizeof key, "k%04d", i);
|
||||
r = toku_brt_cursor_get(cursors[i],
|
||||
toku_fill_dbt(&kbt, key, strlen(key)),
|
||||
toku_init_dbt(&vbt),
|
||||
DB_SET,
|
||||
null_txn);
|
||||
assert(r == 0);
|
||||
ptrs[i] = vbt.data;
|
||||
}
|
||||
|
||||
for (i=0; i<n; i++) {
|
||||
int j;
|
||||
for (j=i+1; j<n; j++) {
|
||||
assert(ptrs[i]!=ptrs[j]);
|
||||
}
|
||||
}
|
||||
|
||||
for (i=0; i<n; i++) {
|
||||
r = toku_brt_cursor_close(cursors[i]);
|
||||
assert(r == 0);
|
||||
}
|
||||
|
||||
r = toku_close_brt(brt);
|
||||
assert(r==0);
|
||||
|
||||
r = toku_cachetable_close(&ct);
|
||||
assert(r==0);
|
||||
}
|
||||
|
||||
static void test_brt_cursor(DB *db) {
|
||||
test_multiple_brt_cursor_dbts(1, db);
|
||||
test_multiple_brt_cursor_dbts(2, db);
|
||||
test_multiple_brt_cursor_dbts(3, db);
|
||||
}
|
||||
|
||||
|
||||
int main (int argc , const char *argv[]) {
|
||||
default_parse_args(argc, argv);
|
||||
|
||||
DB a_db;
|
||||
DB *db = &a_db;
|
||||
test_brt_cursor(db);
|
||||
|
||||
toku_malloc_cleanup();
|
||||
if (verbose) printf("test ok\n");
|
||||
return 0;
|
||||
}
|
|
@ -92,4 +92,6 @@ struct brt_cmd {
|
|||
};
|
||||
typedef struct brt_cmd BRT_CMD_S, *BRT_CMD;
|
||||
|
||||
#define UU(x) x __attribute__((__unused__))
|
||||
|
||||
#endif
|
||||
|
|
|
@ -129,3 +129,10 @@ static inline int toku_logsizeof_INTPAIRARRAY (INTPAIRARRAY pa) {
|
|||
return 4+(4+4)*pa.size;
|
||||
}
|
||||
|
||||
static inline char *fixup_fname(BYTESTRING *f) {
|
||||
assert(f->len>0);
|
||||
char *fname = toku_malloc(f->len+1);
|
||||
memcpy(fname, f->data, f->len);
|
||||
fname[f->len]=0;
|
||||
return fname;
|
||||
}
|
||||
|
|
|
@ -236,9 +236,9 @@ void generate_log_struct (void) {
|
|||
fprintf(hf, " %-16s crc;\n", "u_int32_t");
|
||||
fprintf(hf, " %-16s len;\n", "u_int32_t");
|
||||
fprintf(hf, "};\n");
|
||||
fprintf(hf, "void toku_recover_%s (LSN lsn", lt->name);
|
||||
DO_FIELDS(ft, lt, fprintf(hf, ", %s %s", ft->type, ft->name));
|
||||
fprintf(hf, ");\n");
|
||||
//fprintf(hf, "void toku_recover_%s (LSN lsn", lt->name);
|
||||
//DO_FIELDS(ft, lt, fprintf(hf, ", %s %s", ft->type, ft->name));
|
||||
//fprintf(hf, ");\n");
|
||||
}));
|
||||
DO_ROLLBACKS(lt,
|
||||
({ fprintf(hf, "struct rolltype_%s {\n", lt->name);
|
||||
|
|
446
newbrt/recover.c
446
newbrt/recover.c
|
@ -19,6 +19,452 @@
|
|||
#include <sys/stat.h>
|
||||
#include <unistd.h>
|
||||
|
||||
//#define DO_VERIFY_COUNTS
|
||||
#ifdef DO_VERIFY_COUNTS
|
||||
#define VERIFY_COUNTS(n) toku_verify_counts(n)
|
||||
#else
|
||||
#define VERIFY_COUNTS(n) ((void)0)
|
||||
#endif
|
||||
|
||||
static DB * const null_db=0;
|
||||
|
||||
// These data structures really should be part of a recovery data structure. Recovery could be multithreaded (on different environments...) But this is OK since recovery can only happen in one
|
||||
static CACHETABLE ct;
|
||||
static struct cf_pair {
|
||||
FILENUM filenum;
|
||||
CACHEFILE cf;
|
||||
BRT brt; // set to zero on an fopen, but filled in when an fheader is seen.
|
||||
} *cf_pairs;
|
||||
static int n_cf_pairs=0, max_cf_pairs=0;;
|
||||
|
||||
int toku_recover_init (void) {
|
||||
int r = toku_create_cachetable(&ct, 1<<25, (LSN){0}, 0);
|
||||
return r;
|
||||
}
|
||||
|
||||
void toku_recover_cleanup (void) {
|
||||
int i;
|
||||
for (i=0; i<n_cf_pairs; i++) {
|
||||
if (cf_pairs[i].brt) {
|
||||
int r = toku_close_brt(cf_pairs[i].brt);
|
||||
//r = toku_cachefile_close(&cf_pairs[i].cf);
|
||||
assert(r==0);
|
||||
}
|
||||
}
|
||||
toku_free(cf_pairs);
|
||||
{
|
||||
int r = toku_cachetable_close(&ct);
|
||||
assert(r==0);
|
||||
}
|
||||
}
|
||||
|
||||
void toku_recover_commit (LSN UU(lsn), TXNID UU(txnid)) {
|
||||
}
|
||||
|
||||
void toku_recover_fcreate (LSN UU(lsn), TXNID UU(txnid),BYTESTRING fname,u_int32_t mode) {
|
||||
char *fixed_fname = fixup_fname(&fname);
|
||||
int fd = creat(fixed_fname, mode);
|
||||
assert(fd>=0);
|
||||
toku_free(fixed_fname);
|
||||
toku_free_BYTESTRING(fname);
|
||||
}
|
||||
|
||||
int toku_recover_note_cachefile (FILENUM fnum, CACHEFILE cf, BRT brt) {
|
||||
if (max_cf_pairs==0) {
|
||||
n_cf_pairs=1;
|
||||
max_cf_pairs=2;
|
||||
MALLOC_N(max_cf_pairs, cf_pairs);
|
||||
if (cf_pairs==0) return errno;
|
||||
} else {
|
||||
if (n_cf_pairs>=max_cf_pairs) {
|
||||
max_cf_pairs*=2;
|
||||
cf_pairs = toku_realloc(cf_pairs, max_cf_pairs*sizeof(*cf_pairs));
|
||||
}
|
||||
n_cf_pairs++;
|
||||
}
|
||||
cf_pairs[n_cf_pairs-1].filenum = fnum;
|
||||
cf_pairs[n_cf_pairs-1].cf = cf;
|
||||
cf_pairs[n_cf_pairs-1].brt = brt;
|
||||
return 0;
|
||||
}
|
||||
|
||||
static int find_cachefile (FILENUM fnum, struct cf_pair **cf_pair) {
|
||||
int i;
|
||||
for (i=0; i<n_cf_pairs; i++) {
|
||||
if (fnum.fileid==cf_pairs[i].filenum.fileid) {
|
||||
*cf_pair = cf_pairs+i;
|
||||
return 0;
|
||||
}
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
|
||||
static void toku_recover_fheader (LSN UU(lsn), TXNID UU(txnid),FILENUM filenum,LOGGEDBRTHEADER header) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
struct brt_header *MALLOC(h);
|
||||
assert(h);
|
||||
h->dirty=0;
|
||||
h->flags = header.flags;
|
||||
h->nodesize = header.nodesize;
|
||||
h->freelist = header.freelist;
|
||||
h->unused_memory = header.unused_memory;
|
||||
h->n_named_roots = header.n_named_roots;
|
||||
if ((signed)header.n_named_roots==-1) {
|
||||
h->unnamed_root = header.u.one.root;
|
||||
} else {
|
||||
assert(0);
|
||||
}
|
||||
toku_cachetable_put(pair->cf, 0, h, 0, toku_brtheader_flush_callback, toku_brtheader_fetch_callback, 0);
|
||||
if (pair->brt) {
|
||||
free(pair->brt->h);
|
||||
} else {
|
||||
MALLOC(pair->brt);
|
||||
pair->brt->cf = pair->cf;
|
||||
pair->brt->database_name = 0; // Special case, we don't know or care what the database name is for recovery.
|
||||
list_init(&pair->brt->cursors);
|
||||
pair->brt->compare_fun = 0;
|
||||
pair->brt->dup_compare = 0;
|
||||
pair->brt->db = 0;
|
||||
pair->brt->skey = pair->brt->sval = 0;
|
||||
}
|
||||
pair->brt->h = h;
|
||||
pair->brt->nodesize = h->nodesize;
|
||||
pair->brt->flags = h->nodesize;
|
||||
r = toku_unpin_brt_header(pair->brt);
|
||||
assert(r==0);
|
||||
}
|
||||
|
||||
void toku_recover_newbrtnode (LSN lsn, FILENUM filenum,DISKOFF diskoff,u_int32_t height,u_int32_t nodesize,u_int8_t is_dup_sort,u_int32_t rand4fingerprint) {
|
||||
int r;
|
||||
struct cf_pair *pair = NULL;
|
||||
r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
TAGMALLOC(BRTNODE, n);
|
||||
n->nodesize = nodesize;
|
||||
n->thisnodename = diskoff;
|
||||
n->log_lsn = n->disk_lsn = lsn;
|
||||
//printf("%s:%d %p->disk_lsn=%"PRId64"\n", __FILE__, __LINE__, n, n->disk_lsn.lsn);
|
||||
n->layout_version = 2;
|
||||
n->height = height;
|
||||
n->rand4fingerprint = rand4fingerprint;
|
||||
n->flags = is_dup_sort ? TOKU_DB_DUPSORT : 0; // Don't have TOKU_DB_DUP ???
|
||||
n->local_fingerprint = 0; // nothing there yet
|
||||
n->dirty = 1;
|
||||
if (height==0) {
|
||||
r=toku_pma_create(&n->u.l.buffer, toku_dont_call_this_compare_fun, null_db, filenum, nodesize);
|
||||
assert(r==0);
|
||||
n->u.l.n_bytes_in_buffer=0;
|
||||
} else {
|
||||
n->u.n.n_children = 0;
|
||||
n->u.n.totalchildkeylens = 0;
|
||||
n->u.n.n_bytes_in_buffers = 0;
|
||||
MALLOC_N(3,n->u.n.childinfos);
|
||||
MALLOC_N(2,n->u.n.childkeys);
|
||||
}
|
||||
// Now put it in the cachetable
|
||||
toku_cachetable_put(pair->cf, diskoff, n, toku_serialize_brtnode_size(n), toku_brtnode_flush_callback, toku_brtnode_fetch_callback, 0);
|
||||
|
||||
VERIFY_COUNTS(n);
|
||||
|
||||
n->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(n));
|
||||
assert(r==0);
|
||||
}
|
||||
|
||||
static void recover_setup_node (FILENUM filenum, DISKOFF diskoff, CACHEFILE *cf, BRTNODE *resultnode) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
assert(pair->brt);
|
||||
void *node_v;
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
*resultnode = node;
|
||||
*cf = pair->cf;
|
||||
}
|
||||
|
||||
void toku_recover_brtdeq (LSN UU(lsn), FILENUM UU(filenum), DISKOFF UU(diskoff), u_int32_t UU(childnum), TXNID UU(xid), u_int32_t UU(typ), BYTESTRING UU(key), BYTESTRING UU(data), u_int32_t UU(oldfingerprint), u_int32_t UU(newfingerprint)) { assert(0); }
|
||||
|
||||
void toku_recover_brtenq (LSN UU(lsn), FILENUM UU(filenum), DISKOFF UU(diskoff), u_int32_t UU(childnum), TXNID UU(xid), u_int32_t UU(typ), BYTESTRING UU(key), BYTESTRING UU(data), u_int32_t UU(oldfingerprint), u_int32_t UU(newfingerprint)) { assert(0); }
|
||||
|
||||
void toku_recover_addchild (LSN lsn, FILENUM filenum, DISKOFF diskoff, u_int32_t childnum, DISKOFF child, u_int32_t childfingerprint) {
|
||||
CACHEFILE cf;
|
||||
BRTNODE node;
|
||||
recover_setup_node(filenum, diskoff, &cf, &node);
|
||||
assert(node->height>0);
|
||||
assert(childnum <= (unsigned)node->u.n.n_children);
|
||||
unsigned int i;
|
||||
REALLOC_N(node->u.n.n_children+1, node->u.n.childinfos);
|
||||
REALLOC_N(node->u.n.n_children, node->u.n.childkeys);
|
||||
for (i=node->u.n.n_children; i>childnum; i--) {
|
||||
node->u.n.childinfos[i]=node->u.n.childinfos[i-1];
|
||||
BNC_NBYTESINBUF(node,i) = BNC_NBYTESINBUF(node,i-1);
|
||||
assert(i>=2);
|
||||
node->u.n.childkeys [i-1] = node->u.n.childkeys [i-2];
|
||||
}
|
||||
if (childnum>0) {
|
||||
node->u.n.childkeys [childnum-1] = 0;
|
||||
}
|
||||
BNC_DISKOFF(node, childnum) = child;
|
||||
BNC_SUBTREE_FINGERPRINT(node, childnum) = childfingerprint;
|
||||
int r= toku_fifo_create(&BNC_BUFFER(node, childnum)); assert(r==0);
|
||||
BNC_NBYTESINBUF(node, childnum) = 0;
|
||||
node->u.n.n_children++;
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
}
|
||||
|
||||
void toku_recover_delchild (LSN lsn, FILENUM filenum, DISKOFF diskoff, u_int32_t childnum, DISKOFF child, u_int32_t childfingerprint, BYTESTRING pivotkey) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height>0);
|
||||
|
||||
assert(childnum < (unsigned)node->u.n.n_children);
|
||||
assert(node->u.n.childinfos[childnum].subtree_fingerprint == childfingerprint);
|
||||
assert(BNC_DISKOFF(node, childnum)==child);
|
||||
assert(toku_fifo_n_entries(BNC_BUFFER(node,childnum))==0);
|
||||
assert(BNC_NBYTESINBUF(node,childnum)==0);
|
||||
assert(node->u.n.n_children>2); // Must be at least two children.
|
||||
u_int32_t i;
|
||||
assert(childnum>0);
|
||||
node->u.n.totalchildkeylens -= toku_brt_pivot_key_len(pair->brt, node->u.n.childkeys[childnum-1]);
|
||||
toku_free((void*)node->u.n.childkeys[childnum-1]);
|
||||
toku_fifo_free(&BNC_BUFFER(node,childnum));
|
||||
for (i=childnum+1; i<(unsigned)node->u.n.n_children; i++) {
|
||||
node->u.n.childinfos[i-1] = node->u.n.childinfos[i];
|
||||
BNC_NBYTESINBUF(node,i-1) = BNC_NBYTESINBUF(node,i);
|
||||
node->u.n.childkeys[i-2] = node->u.n.childkeys[i-1];
|
||||
}
|
||||
node->u.n.n_children--;
|
||||
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
toku_free(pivotkey.data);
|
||||
}
|
||||
|
||||
void toku_recover_setchild (LSN lsn, FILENUM filenum, DISKOFF diskoff, u_int32_t childnum, DISKOFF UU(oldchild), DISKOFF newchild) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height>0);
|
||||
assert(childnum < (unsigned)node->u.n.n_children);
|
||||
BNC_DISKOFF(node, childnum) = newchild;
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
}
|
||||
void toku_recover_setpivot (LSN lsn, FILENUM filenum, DISKOFF diskoff, u_int32_t childnum, BYTESTRING pivotkey) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height>0);
|
||||
|
||||
struct kv_pair *new_pivot = kv_pair_malloc(pivotkey.data, pivotkey.len, 0, 0);
|
||||
|
||||
node->u.n.childkeys[childnum] = new_pivot;
|
||||
node->u.n.totalchildkeylens += toku_brt_pivot_key_len(pair->brt, node->u.n.childkeys[childnum]);
|
||||
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
|
||||
toku_free(pivotkey.data);
|
||||
}
|
||||
|
||||
void toku_recover_changechildfingerprint (LSN lsn, FILENUM filenum, DISKOFF diskoff, u_int32_t childnum, u_int32_t UU(oldfingerprint), u_int32_t newfingerprint) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height>0);
|
||||
assert((signed)childnum < node->u.n.n_children);
|
||||
BNC_SUBTREE_FINGERPRINT(node, childnum) = newfingerprint;
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
|
||||
}
|
||||
|
||||
void toku_recover_fopen (LSN UU(lsn), TXNID UU(txnid), BYTESTRING fname, FILENUM filenum) {
|
||||
char *fixedfname = fixup_fname(&fname);
|
||||
CACHEFILE cf;
|
||||
int fd = open(fixedfname, O_RDWR, 0);
|
||||
assert(fd>=0);
|
||||
BRT MALLOC(brt);
|
||||
assert(errno==0 && brt!=0);
|
||||
brt->database_name = fixedfname;
|
||||
brt->h=0;
|
||||
list_init(&brt->cursors);
|
||||
brt->compare_fun = 0;
|
||||
brt->dup_compare = 0;
|
||||
brt->db = 0;
|
||||
int r = toku_cachetable_openfd(&cf, ct, fd, brt);
|
||||
assert(r==0);
|
||||
brt->skey = brt->sval = 0;
|
||||
brt->cf=cf;
|
||||
toku_recover_note_cachefile(filenum, cf, brt);
|
||||
toku_free_BYTESTRING(fname);
|
||||
}
|
||||
|
||||
void toku_recover_insertinleaf (LSN lsn, TXNID UU(txnid), FILENUM filenum, DISKOFF diskoff, u_int32_t pmaidx, BYTESTRING keybs, BYTESTRING databs) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height==0);
|
||||
VERIFY_COUNTS(node);
|
||||
DBT key,data;
|
||||
r = toku_pma_set_at_index(node->u.l.buffer, pmaidx, toku_fill_dbt(&key, keybs.data, keybs.len), toku_fill_dbt(&data, databs.data, databs.len));
|
||||
assert(r==0);
|
||||
node->local_fingerprint += node->rand4fingerprint*toku_calccrc32_kvpair(keybs.data, keybs.len, databs.data, databs.len);
|
||||
node->u.l.n_bytes_in_buffer += PMA_ITEM_OVERHEAD + KEY_VALUE_OVERHEAD + keybs.len + databs.len;
|
||||
|
||||
VERIFY_COUNTS(node);
|
||||
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
toku_free_BYTESTRING(keybs);
|
||||
toku_free_BYTESTRING(databs);
|
||||
}
|
||||
|
||||
void toku_recover_deleteinleaf (LSN lsn, TXNID UU(txnid), FILENUM filenum, DISKOFF diskoff, u_int32_t pmaidx, BYTESTRING keybs, BYTESTRING databs) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height==0);
|
||||
VERIFY_COUNTS(node);
|
||||
r = toku_pma_clear_at_index(node->u.l.buffer, pmaidx);
|
||||
assert (r==0);
|
||||
node->local_fingerprint -= node->rand4fingerprint*toku_calccrc32_kvpair(keybs.data, keybs.len, databs.data, databs.len);
|
||||
node->u.l.n_bytes_in_buffer -= PMA_ITEM_OVERHEAD + KEY_VALUE_OVERHEAD + keybs.len + databs.len;
|
||||
VERIFY_COUNTS(node);
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
toku_free_BYTESTRING(keybs);
|
||||
toku_free_BYTESTRING(databs);
|
||||
}
|
||||
|
||||
// a newbrtnode should have been done before this
|
||||
void toku_recover_resizepma (LSN lsn, FILENUM filenum, DISKOFF diskoff, u_int32_t oldsize, u_int32_t newsize) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin (pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height==0);
|
||||
r = toku_resize_pma_exactly (node->u.l.buffer, oldsize, newsize);
|
||||
assert(r==0);
|
||||
|
||||
VERIFY_COUNTS(node);
|
||||
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
}
|
||||
|
||||
void toku_recover_pmadistribute (LSN lsn, FILENUM filenum, DISKOFF old_diskoff, DISKOFF new_diskoff, INTPAIRARRAY fromto) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_va, *node_vb;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, old_diskoff, &node_va, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, new_diskoff, &node_vb, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE nodea = node_va; assert(nodea->height==0);
|
||||
BRTNODE nodeb = node_vb; assert(nodeb->height==0);
|
||||
{
|
||||
unsigned int i;
|
||||
for (i=0; i<fromto.size; i++) {
|
||||
assert(fromto.array[i].a < toku_pma_index_limit(nodea->u.l.buffer));
|
||||
assert(fromto.array[i].b < toku_pma_index_limit(nodeb->u.l.buffer));
|
||||
}
|
||||
}
|
||||
r = toku_pma_move_indices (nodea->u.l.buffer, nodeb->u.l.buffer, fromto,
|
||||
nodea->rand4fingerprint, &nodea->local_fingerprint,
|
||||
nodeb->rand4fingerprint, &nodeb->local_fingerprint,
|
||||
&nodea->u.l.n_bytes_in_buffer, &nodeb->u.l.n_bytes_in_buffer
|
||||
);
|
||||
// The bytes in buffer and fingerprint shouldn't change
|
||||
|
||||
VERIFY_COUNTS(nodea);
|
||||
VERIFY_COUNTS(nodeb);
|
||||
|
||||
nodea->log_lsn = lsn;
|
||||
nodeb->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, old_diskoff, 1, toku_serialize_brtnode_size(nodea));
|
||||
assert(r==0);
|
||||
r = toku_cachetable_unpin(pair->cf, new_diskoff, 1, toku_serialize_brtnode_size(nodeb));
|
||||
assert(r==0);
|
||||
|
||||
|
||||
toku_free_INTPAIRARRAY(fromto);
|
||||
}
|
||||
|
||||
void toku_recover_changeunnamedroot (LSN UU(lsn), FILENUM filenum, DISKOFF UU(oldroot), DISKOFF newroot) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
assert(pair->brt);
|
||||
r = toku_read_and_pin_brt_header(pair->cf, &pair->brt->h);
|
||||
assert(r==0);
|
||||
pair->brt->h->unnamed_root = newroot;
|
||||
r = toku_unpin_brt_header(pair->brt);
|
||||
}
|
||||
void toku_recover_changenamedroot (LSN UU(lsn), FILENUM UU(filenum), BYTESTRING UU(name), DISKOFF UU(oldroot), DISKOFF UU(newroot)) { assert(0); }
|
||||
|
||||
void toku_recover_changeunusedmemory (LSN UU(lsn), FILENUM filenum, DISKOFF UU(oldunused), DISKOFF newunused) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
assert(pair->brt);
|
||||
r = toku_read_and_pin_brt_header(pair->cf, &pair->brt->h);
|
||||
assert(r==0);
|
||||
pair->brt->h->unused_memory = newunused;
|
||||
r = toku_unpin_brt_header(pair->brt);
|
||||
}
|
||||
|
||||
|
||||
int tokudb_recover(const char *data_dir, const char *log_dir) {
|
||||
int r;
|
||||
int entrycount=0;
|
||||
|
|
478
newbrt/roll.c
478
newbrt/roll.c
|
@ -12,98 +12,8 @@
|
|||
#include "cachetable.h"
|
||||
#include "key.h"
|
||||
|
||||
//#define DO_VERIFY_COUNTS
|
||||
#ifdef DO_VERIFY_COUNTS
|
||||
#define VERIFY_COUNTS(n) toku_verify_counts(n)
|
||||
#else
|
||||
#define VERIFY_COUNTS(n) ((void)0)
|
||||
#endif
|
||||
|
||||
#define UU(x) x __attribute__((__unused__))
|
||||
|
||||
static DB * const null_db=0;
|
||||
|
||||
// These data structures really should be part of a recovery data structure. Recovery could be multithreaded (on different environments...) But this is OK since recovery can only happen in one
|
||||
static CACHETABLE ct;
|
||||
static struct cf_pair {
|
||||
FILENUM filenum;
|
||||
CACHEFILE cf;
|
||||
BRT brt; // set to zero on an fopen, but filled in when an fheader is seen.
|
||||
} *cf_pairs;
|
||||
static int n_cf_pairs=0, max_cf_pairs=0;;
|
||||
|
||||
int toku_recover_init (void) {
|
||||
int r = toku_create_cachetable(&ct, 1<<25, (LSN){0}, 0);
|
||||
return r;
|
||||
}
|
||||
void toku_recover_cleanup (void) {
|
||||
int i;
|
||||
for (i=0; i<n_cf_pairs; i++) {
|
||||
if (cf_pairs[i].brt) {
|
||||
int r = toku_close_brt(cf_pairs[i].brt);
|
||||
//r = toku_cachefile_close(&cf_pairs[i].cf);
|
||||
assert(r==0);
|
||||
}
|
||||
}
|
||||
toku_free(cf_pairs);
|
||||
{
|
||||
int r = toku_cachetable_close(&ct);
|
||||
assert(r==0);
|
||||
}
|
||||
}
|
||||
|
||||
int toku_recover_note_cachefile (FILENUM fnum, CACHEFILE cf, BRT brt) {
|
||||
if (max_cf_pairs==0) {
|
||||
n_cf_pairs=1;
|
||||
max_cf_pairs=2;
|
||||
MALLOC_N(max_cf_pairs, cf_pairs);
|
||||
if (cf_pairs==0) return errno;
|
||||
} else {
|
||||
if (n_cf_pairs>=max_cf_pairs) {
|
||||
max_cf_pairs*=2;
|
||||
cf_pairs = toku_realloc(cf_pairs, max_cf_pairs*sizeof(*cf_pairs));
|
||||
}
|
||||
n_cf_pairs++;
|
||||
}
|
||||
cf_pairs[n_cf_pairs-1].filenum = fnum;
|
||||
cf_pairs[n_cf_pairs-1].cf = cf;
|
||||
cf_pairs[n_cf_pairs-1].brt = brt;
|
||||
return 0;
|
||||
}
|
||||
|
||||
static int find_cachefile (FILENUM fnum, struct cf_pair **cf_pair) {
|
||||
int i;
|
||||
for (i=0; i<n_cf_pairs; i++) {
|
||||
if (fnum.fileid==cf_pairs[i].filenum.fileid) {
|
||||
*cf_pair = cf_pairs+i;
|
||||
return 0;
|
||||
}
|
||||
}
|
||||
return 1;
|
||||
}
|
||||
|
||||
static char *fixup_fname(BYTESTRING *f) {
|
||||
assert(f->len>0);
|
||||
char *fname = toku_malloc(f->len+1);
|
||||
memcpy(fname, f->data, f->len);
|
||||
fname[f->len]=0;
|
||||
return fname;
|
||||
}
|
||||
|
||||
|
||||
void toku_recover_commit (LSN UU(lsn), TXNID UU(txnid)) {
|
||||
}
|
||||
|
||||
#define ABORTIT { le=le; txn=txn; fprintf(stderr, "%s:%d (%s) not ready to go\n", __FILE__, __LINE__, __func__); abort(); }
|
||||
|
||||
void toku_recover_fcreate (LSN UU(lsn), TXNID UU(txnid),BYTESTRING fname,u_int32_t mode) {
|
||||
char *fixed_fname = fixup_fname(&fname);
|
||||
int fd = creat(fixed_fname, mode);
|
||||
assert(fd>=0);
|
||||
toku_free(fixed_fname);
|
||||
toku_free_BYTESTRING(fname);
|
||||
}
|
||||
|
||||
int toku_rollback_fcreate (BYTESTRING bs_fname,
|
||||
TOKUTXN txn __attribute__((__unused__))) {
|
||||
char *fname = fixup_fname(&bs_fname);
|
||||
|
@ -118,81 +28,6 @@ int toku_rollback_fcreate (BYTESTRING bs_fname,
|
|||
return 0;
|
||||
}
|
||||
|
||||
|
||||
void toku_recover_fheader (LSN UU(lsn), TXNID UU(txnid),FILENUM filenum,LOGGEDBRTHEADER header) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
struct brt_header *MALLOC(h);
|
||||
assert(h);
|
||||
h->dirty=0;
|
||||
h->flags = header.flags;
|
||||
h->nodesize = header.nodesize;
|
||||
h->freelist = header.freelist;
|
||||
h->unused_memory = header.unused_memory;
|
||||
h->n_named_roots = header.n_named_roots;
|
||||
if ((signed)header.n_named_roots==-1) {
|
||||
h->unnamed_root = header.u.one.root;
|
||||
} else {
|
||||
assert(0);
|
||||
}
|
||||
toku_cachetable_put(pair->cf, 0, h, 0, toku_brtheader_flush_callback, toku_brtheader_fetch_callback, 0);
|
||||
if (pair->brt) {
|
||||
free(pair->brt->h);
|
||||
} else {
|
||||
MALLOC(pair->brt);
|
||||
pair->brt->cf = pair->cf;
|
||||
pair->brt->database_name = 0; // Special case, we don't know or care what the database name is for recovery.
|
||||
list_init(&pair->brt->cursors);
|
||||
pair->brt->compare_fun = 0;
|
||||
pair->brt->dup_compare = 0;
|
||||
pair->brt->db = 0;
|
||||
pair->brt->skey = pair->brt->sval = 0;
|
||||
}
|
||||
pair->brt->h = h;
|
||||
pair->brt->nodesize = h->nodesize;
|
||||
pair->brt->flags = h->nodesize;
|
||||
r = toku_unpin_brt_header(pair->brt);
|
||||
assert(r==0);
|
||||
}
|
||||
|
||||
void toku_recover_newbrtnode (LSN lsn, FILENUM filenum,DISKOFF diskoff,u_int32_t height,u_int32_t nodesize,u_int8_t is_dup_sort,u_int32_t rand4fingerprint) {
|
||||
int r;
|
||||
struct cf_pair *pair = NULL;
|
||||
r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
TAGMALLOC(BRTNODE, n);
|
||||
n->nodesize = nodesize;
|
||||
n->thisnodename = diskoff;
|
||||
n->log_lsn = n->disk_lsn = lsn;
|
||||
//printf("%s:%d %p->disk_lsn=%"PRId64"\n", __FILE__, __LINE__, n, n->disk_lsn.lsn);
|
||||
n->layout_version = 2;
|
||||
n->height = height;
|
||||
n->rand4fingerprint = rand4fingerprint;
|
||||
n->flags = is_dup_sort ? TOKU_DB_DUPSORT : 0; // Don't have TOKU_DB_DUP ???
|
||||
n->local_fingerprint = 0; // nothing there yet
|
||||
n->dirty = 1;
|
||||
if (height==0) {
|
||||
r=toku_pma_create(&n->u.l.buffer, toku_dont_call_this_compare_fun, null_db, filenum, nodesize);
|
||||
assert(r==0);
|
||||
n->u.l.n_bytes_in_buffer=0;
|
||||
} else {
|
||||
n->u.n.n_children = 0;
|
||||
n->u.n.totalchildkeylens = 0;
|
||||
n->u.n.n_bytes_in_buffers = 0;
|
||||
MALLOC_N(3,n->u.n.childinfos);
|
||||
MALLOC_N(2,n->u.n.childkeys);
|
||||
}
|
||||
// Now put it in the cachetable
|
||||
toku_cachetable_put(pair->cf, diskoff, n, toku_serialize_brtnode_size(n), toku_brtnode_flush_callback, toku_brtnode_fetch_callback, 0);
|
||||
|
||||
VERIFY_COUNTS(n);
|
||||
|
||||
n->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(n));
|
||||
assert(r==0);
|
||||
}
|
||||
|
||||
//int toku_rollback_newbrtnode (struct logtype_newbrtnode *le, TOKUTXN txn) {
|
||||
// // All that must be done is to put the node on the freelist.
|
||||
// // Since we don't have a freelist right now, we don't have anything to do.
|
||||
|
@ -202,227 +37,6 @@ void toku_recover_newbrtnode (LSN lsn, FILENUM filenum,DISKOFF diskoff,u_int32_t
|
|||
// return 0;
|
||||
//}
|
||||
|
||||
|
||||
static void recover_setup_node (FILENUM filenum, DISKOFF diskoff, CACHEFILE *cf, BRTNODE *resultnode) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
assert(pair->brt);
|
||||
void *node_v;
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
*resultnode = node;
|
||||
*cf = pair->cf;
|
||||
}
|
||||
|
||||
void toku_recover_brtdeq (LSN UU(lsn), FILENUM UU(filenum), DISKOFF UU(diskoff), u_int32_t UU(childnum), TXNID UU(xid), u_int32_t UU(typ), BYTESTRING UU(key), BYTESTRING UU(data), u_int32_t UU(oldfingerprint), u_int32_t UU(newfingerprint)) { assert(0); }
|
||||
|
||||
void toku_recover_brtenq (LSN UU(lsn), FILENUM UU(filenum), DISKOFF UU(diskoff), u_int32_t UU(childnum), TXNID UU(xid), u_int32_t UU(typ), BYTESTRING UU(key), BYTESTRING UU(data), u_int32_t UU(oldfingerprint), u_int32_t UU(newfingerprint)) { assert(0); }
|
||||
|
||||
void toku_recover_addchild (LSN lsn, FILENUM filenum, DISKOFF diskoff, u_int32_t childnum, DISKOFF child, u_int32_t childfingerprint) {
|
||||
CACHEFILE cf;
|
||||
BRTNODE node;
|
||||
recover_setup_node(filenum, diskoff, &cf, &node);
|
||||
assert(node->height>0);
|
||||
assert(childnum <= (unsigned)node->u.n.n_children);
|
||||
unsigned int i;
|
||||
REALLOC_N(node->u.n.n_children+1, node->u.n.childinfos);
|
||||
REALLOC_N(node->u.n.n_children, node->u.n.childkeys);
|
||||
for (i=node->u.n.n_children; i>childnum; i--) {
|
||||
node->u.n.childinfos[i]=node->u.n.childinfos[i-1];
|
||||
BNC_NBYTESINBUF(node,i) = BNC_NBYTESINBUF(node,i-1);
|
||||
assert(i>=2);
|
||||
node->u.n.childkeys [i-1] = node->u.n.childkeys [i-2];
|
||||
}
|
||||
if (childnum>0) {
|
||||
node->u.n.childkeys [childnum-1] = 0;
|
||||
}
|
||||
BNC_DISKOFF(node, childnum) = child;
|
||||
BNC_SUBTREE_FINGERPRINT(node, childnum) = childfingerprint;
|
||||
int r= toku_fifo_create(&BNC_BUFFER(node, childnum)); assert(r==0);
|
||||
BNC_NBYTESINBUF(node, childnum) = 0;
|
||||
node->u.n.n_children++;
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
}
|
||||
|
||||
void toku_recover_delchild (LSN lsn, FILENUM filenum, DISKOFF diskoff, u_int32_t childnum, DISKOFF child, u_int32_t childfingerprint, BYTESTRING pivotkey) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height>0);
|
||||
|
||||
assert(childnum < (unsigned)node->u.n.n_children);
|
||||
assert(node->u.n.childinfos[childnum].subtree_fingerprint == childfingerprint);
|
||||
assert(BNC_DISKOFF(node, childnum)==child);
|
||||
assert(toku_fifo_n_entries(BNC_BUFFER(node,childnum))==0);
|
||||
assert(BNC_NBYTESINBUF(node,childnum)==0);
|
||||
assert(node->u.n.n_children>2); // Must be at least two children.
|
||||
u_int32_t i;
|
||||
assert(childnum>0);
|
||||
node->u.n.totalchildkeylens -= toku_brt_pivot_key_len(pair->brt, node->u.n.childkeys[childnum-1]);
|
||||
toku_free((void*)node->u.n.childkeys[childnum-1]);
|
||||
toku_fifo_free(&BNC_BUFFER(node,childnum));
|
||||
for (i=childnum+1; i<(unsigned)node->u.n.n_children; i++) {
|
||||
node->u.n.childinfos[i-1] = node->u.n.childinfos[i];
|
||||
BNC_NBYTESINBUF(node,i-1) = BNC_NBYTESINBUF(node,i);
|
||||
node->u.n.childkeys[i-2] = node->u.n.childkeys[i-1];
|
||||
}
|
||||
node->u.n.n_children--;
|
||||
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
toku_free(pivotkey.data);
|
||||
}
|
||||
|
||||
void toku_recover_setchild (LSN lsn, FILENUM filenum, DISKOFF diskoff, u_int32_t childnum, DISKOFF UU(oldchild), DISKOFF newchild) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height>0);
|
||||
assert(childnum < (unsigned)node->u.n.n_children);
|
||||
BNC_DISKOFF(node, childnum) = newchild;
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
}
|
||||
void toku_recover_setpivot (LSN lsn, FILENUM filenum, DISKOFF diskoff, u_int32_t childnum, BYTESTRING pivotkey) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height>0);
|
||||
|
||||
struct kv_pair *new_pivot = kv_pair_malloc(pivotkey.data, pivotkey.len, 0, 0);
|
||||
|
||||
node->u.n.childkeys[childnum] = new_pivot;
|
||||
node->u.n.totalchildkeylens += toku_brt_pivot_key_len(pair->brt, node->u.n.childkeys[childnum]);
|
||||
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
|
||||
toku_free(pivotkey.data);
|
||||
}
|
||||
|
||||
void toku_recover_changechildfingerprint (LSN lsn, FILENUM filenum, DISKOFF diskoff, u_int32_t childnum, u_int32_t UU(oldfingerprint), u_int32_t newfingerprint) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height>0);
|
||||
assert((signed)childnum < node->u.n.n_children);
|
||||
BNC_SUBTREE_FINGERPRINT(node, childnum) = newfingerprint;
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
|
||||
}
|
||||
|
||||
void toku_recover_fopen (LSN UU(lsn), TXNID UU(txnid), BYTESTRING fname, FILENUM filenum) {
|
||||
char *fixedfname = fixup_fname(&fname);
|
||||
CACHEFILE cf;
|
||||
int fd = open(fixedfname, O_RDWR, 0);
|
||||
assert(fd>=0);
|
||||
BRT MALLOC(brt);
|
||||
assert(errno==0 && brt!=0);
|
||||
brt->database_name = fixedfname;
|
||||
brt->h=0;
|
||||
list_init(&brt->cursors);
|
||||
brt->compare_fun = 0;
|
||||
brt->dup_compare = 0;
|
||||
brt->db = 0;
|
||||
int r = toku_cachetable_openfd(&cf, ct, fd, brt);
|
||||
assert(r==0);
|
||||
brt->skey = brt->sval = 0;
|
||||
brt->cf=cf;
|
||||
toku_recover_note_cachefile(filenum, cf, brt);
|
||||
toku_free_BYTESTRING(fname);
|
||||
}
|
||||
|
||||
void toku_recover_insertinleaf (LSN lsn, TXNID UU(txnid), FILENUM filenum, DISKOFF diskoff, u_int32_t pmaidx, BYTESTRING keybs, BYTESTRING databs) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height==0);
|
||||
VERIFY_COUNTS(node);
|
||||
DBT key,data;
|
||||
r = toku_pma_set_at_index(node->u.l.buffer, pmaidx, toku_fill_dbt(&key, keybs.data, keybs.len), toku_fill_dbt(&data, databs.data, databs.len));
|
||||
assert(r==0);
|
||||
node->local_fingerprint += node->rand4fingerprint*toku_calccrc32_kvpair(keybs.data, keybs.len, databs.data, databs.len);
|
||||
node->u.l.n_bytes_in_buffer += PMA_ITEM_OVERHEAD + KEY_VALUE_OVERHEAD + keybs.len + databs.len;
|
||||
|
||||
VERIFY_COUNTS(node);
|
||||
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
toku_free_BYTESTRING(keybs);
|
||||
toku_free_BYTESTRING(databs);
|
||||
}
|
||||
|
||||
void toku_recover_deleteinleaf (LSN lsn, TXNID UU(txnid), FILENUM filenum, DISKOFF diskoff, u_int32_t pmaidx, BYTESTRING keybs, BYTESTRING databs) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height==0);
|
||||
VERIFY_COUNTS(node);
|
||||
r = toku_pma_clear_at_index(node->u.l.buffer, pmaidx);
|
||||
assert (r==0);
|
||||
node->local_fingerprint -= node->rand4fingerprint*toku_calccrc32_kvpair(keybs.data, keybs.len, databs.data, databs.len);
|
||||
node->u.l.n_bytes_in_buffer -= PMA_ITEM_OVERHEAD + KEY_VALUE_OVERHEAD + keybs.len + databs.len;
|
||||
VERIFY_COUNTS(node);
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
assert(r==0);
|
||||
toku_free_BYTESTRING(keybs);
|
||||
toku_free_BYTESTRING(databs);
|
||||
}
|
||||
|
||||
int toku_rollback_deleteatleaf (FILENUM filenum, BYTESTRING key, BYTESTRING data,TOKUTXN txn) {
|
||||
CACHEFILE cf;
|
||||
BRT brt;
|
||||
int r = toku_cachefile_of_filenum(txn->logger->ct, filenum, &cf, &brt);
|
||||
assert(r==0);
|
||||
DBT key_dbt,data_dbt;
|
||||
r = toku_brt_insert(brt,
|
||||
toku_fill_dbt(&key_dbt, key.data, key.len),
|
||||
toku_fill_dbt(&data_dbt, data.data, data.len),
|
||||
0); // Do the insertion unconditionally
|
||||
return r;
|
||||
}
|
||||
|
||||
int toku_rollback_insertatleaf (FILENUM filenum, BYTESTRING key,BYTESTRING data, TOKUTXN txn) {
|
||||
CACHEFILE cf;
|
||||
BRT brt;
|
||||
|
@ -436,87 +50,15 @@ int toku_rollback_insertatleaf (FILENUM filenum, BYTESTRING key,BYTESTRING data,
|
|||
return r;
|
||||
}
|
||||
|
||||
// a newbrtnode should have been done before this
|
||||
void toku_recover_resizepma (LSN lsn, FILENUM filenum, DISKOFF diskoff, u_int32_t oldsize, u_int32_t newsize) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_v;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin (pair->cf, diskoff, &node_v, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE node = node_v;
|
||||
assert(node->height==0);
|
||||
r = toku_resize_pma_exactly (node->u.l.buffer, oldsize, newsize);
|
||||
assert(r==0);
|
||||
|
||||
VERIFY_COUNTS(node);
|
||||
|
||||
node->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, diskoff, 1, toku_serialize_brtnode_size(node));
|
||||
int toku_rollback_deleteatleaf (FILENUM filenum, BYTESTRING key, BYTESTRING data,TOKUTXN txn) {
|
||||
CACHEFILE cf;
|
||||
BRT brt;
|
||||
int r = toku_cachefile_of_filenum(txn->logger->ct, filenum, &cf, &brt);
|
||||
assert(r==0);
|
||||
DBT key_dbt,data_dbt;
|
||||
r = toku_brt_insert(brt,
|
||||
toku_fill_dbt(&key_dbt, key.data, key.len),
|
||||
toku_fill_dbt(&data_dbt, data.data, data.len),
|
||||
0); // Do the insertion unconditionally
|
||||
return r;
|
||||
}
|
||||
|
||||
void toku_recover_pmadistribute (LSN lsn, FILENUM filenum, DISKOFF old_diskoff, DISKOFF new_diskoff, INTPAIRARRAY fromto) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
void *node_va, *node_vb;
|
||||
assert(pair->brt);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, old_diskoff, &node_va, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
r = toku_cachetable_get_and_pin(pair->cf, new_diskoff, &node_vb, NULL, toku_brtnode_flush_callback, toku_brtnode_fetch_callback, pair->brt);
|
||||
assert(r==0);
|
||||
BRTNODE nodea = node_va; assert(nodea->height==0);
|
||||
BRTNODE nodeb = node_vb; assert(nodeb->height==0);
|
||||
{
|
||||
unsigned int i;
|
||||
for (i=0; i<fromto.size; i++) {
|
||||
assert(fromto.array[i].a < toku_pma_index_limit(nodea->u.l.buffer));
|
||||
assert(fromto.array[i].b < toku_pma_index_limit(nodeb->u.l.buffer));
|
||||
}
|
||||
}
|
||||
r = toku_pma_move_indices (nodea->u.l.buffer, nodeb->u.l.buffer, fromto,
|
||||
nodea->rand4fingerprint, &nodea->local_fingerprint,
|
||||
nodeb->rand4fingerprint, &nodeb->local_fingerprint,
|
||||
&nodea->u.l.n_bytes_in_buffer, &nodeb->u.l.n_bytes_in_buffer
|
||||
);
|
||||
// The bytes in buffer and fingerprint shouldn't change
|
||||
|
||||
VERIFY_COUNTS(nodea);
|
||||
VERIFY_COUNTS(nodeb);
|
||||
|
||||
nodea->log_lsn = lsn;
|
||||
nodeb->log_lsn = lsn;
|
||||
r = toku_cachetable_unpin(pair->cf, old_diskoff, 1, toku_serialize_brtnode_size(nodea));
|
||||
assert(r==0);
|
||||
r = toku_cachetable_unpin(pair->cf, new_diskoff, 1, toku_serialize_brtnode_size(nodeb));
|
||||
assert(r==0);
|
||||
|
||||
|
||||
toku_free_INTPAIRARRAY(fromto);
|
||||
}
|
||||
|
||||
void toku_recover_changeunnamedroot (LSN UU(lsn), FILENUM filenum, DISKOFF UU(oldroot), DISKOFF newroot) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
assert(pair->brt);
|
||||
r = toku_read_and_pin_brt_header(pair->cf, &pair->brt->h);
|
||||
assert(r==0);
|
||||
pair->brt->h->unnamed_root = newroot;
|
||||
r = toku_unpin_brt_header(pair->brt);
|
||||
}
|
||||
void toku_recover_changenamedroot (LSN UU(lsn), FILENUM UU(filenum), BYTESTRING UU(name), DISKOFF UU(oldroot), DISKOFF UU(newroot)) { assert(0); }
|
||||
|
||||
void toku_recover_changeunusedmemory (LSN UU(lsn), FILENUM filenum, DISKOFF UU(oldunused), DISKOFF newunused) {
|
||||
struct cf_pair *pair = NULL;
|
||||
int r = find_cachefile(filenum, &pair);
|
||||
assert(r==0);
|
||||
assert(pair->brt);
|
||||
r = toku_read_and_pin_brt_header(pair->cf, &pair->brt->h);
|
||||
assert(r==0);
|
||||
pair->brt->h->unused_memory = newunused;
|
||||
r = toku_unpin_brt_header(pair->brt);
|
||||
}
|
||||
|
||||
|
|
|
@ -20,63 +20,12 @@
|
|||
#include <unistd.h>
|
||||
|
||||
int main (int argc, char *argv[]) {
|
||||
const char *dir;
|
||||
int r;
|
||||
int entrycount=0;
|
||||
assert(argc==2);
|
||||
dir = argv[1];
|
||||
int n_logfiles;
|
||||
char **logfiles;
|
||||
|
||||
int lockfd;
|
||||
|
||||
{
|
||||
int namelen=strlen(dir);
|
||||
char lockfname[namelen+20];
|
||||
snprintf(lockfname, sizeof(lockfname), "%s/__recoverylock", dir);
|
||||
lockfd = open(lockfname, O_RDWR|O_CREAT, S_IRUSR | S_IWUSR);
|
||||
if (lockfd<0) {
|
||||
printf("Couldn't open %s\n", lockfname);
|
||||
exit(1);
|
||||
}
|
||||
r=flock(lockfd, LOCK_EX | LOCK_NB);
|
||||
if (r!=0) {
|
||||
printf("Couldn't run recovery because some other process holds the recovery lock %s\n", lockfname);
|
||||
exit(1);
|
||||
}
|
||||
int r=tokudb_recover(argv[1], argv[1]);
|
||||
if (r!=0) {
|
||||
fprintf(stderr, "Recovery failed\n");
|
||||
exit(1);
|
||||
}
|
||||
|
||||
r = toku_logger_find_logfiles(dir, &n_logfiles, &logfiles);
|
||||
if (r!=0) exit(1);
|
||||
int i;
|
||||
toku_recover_init();
|
||||
for (i=0; i<n_logfiles; i++) {
|
||||
//fprintf(stderr, "Opening %s\n", logfiles[i]);
|
||||
FILE *f = fopen(logfiles[i], "r");
|
||||
struct log_entry le;
|
||||
u_int32_t version;
|
||||
r=toku_read_and_print_logmagic(f, &version);
|
||||
assert(r==0 && version==0);
|
||||
while ((r = toku_log_fread(f, &le))==0) {
|
||||
//printf("%lld: Got cmd %c\n", le.u.commit.lsn.lsn, le.cmd);
|
||||
logtype_dispatch_args(&le, toku_recover_);
|
||||
entrycount++;
|
||||
}
|
||||
if (r!=EOF) {
|
||||
if (r==DB_BADFORMAT) {
|
||||
fprintf(stderr, "Bad log format at record %d\n", entrycount);
|
||||
exit(1);
|
||||
} else {
|
||||
fprintf(stderr, "Huh? %s\n", strerror(r));
|
||||
exit(1);
|
||||
}
|
||||
}
|
||||
fclose(f);
|
||||
}
|
||||
toku_recover_cleanup();
|
||||
for (i=0; i<n_logfiles; i++) {
|
||||
toku_free(logfiles[i]);
|
||||
}
|
||||
toku_free(logfiles);
|
||||
return 0;
|
||||
}
|
||||
|
|
Loading…
Add table
Reference in a new issue