mariadb/extra/mariabackup/xbstream.cc

564 lines
12 KiB
C++
Raw Normal View History

2017-04-18 20:43:20 +02:00
/******************************************************
Copyright (c) 2011-2013 Percona LLC and/or its affiliates.
The xbstream utility: serialize/deserialize files in the XBSTREAM format.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; version 2 of the License.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
2019-05-11 21:19:05 +02:00
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1335 USA
2017-04-18 20:43:20 +02:00
*******************************************************/
#include <mysql_version.h>
#include <my_base.h>
#include <my_getopt.h>
#include <hash.h>
2017-04-19 15:09:03 +02:00
#include <my_pthread.h>
2017-04-18 20:43:20 +02:00
#include "common.h"
#include "xbstream.h"
2017-04-19 15:09:03 +02:00
#include "datasink.h"
#include "crc_glue.h"
2017-04-18 20:43:20 +02:00
#define XBSTREAM_VERSION "1.0"
#define XBSTREAM_BUFFER_SIZE (10 * 1024 * 1024UL)
#define START_FILE_HASH_SIZE 16
typedef enum {
RUN_MODE_NONE,
RUN_MODE_CREATE,
RUN_MODE_EXTRACT
} run_mode_t;
/* Need the following definitions to avoid linking with ds_*.o and their link
dependencies */
datasink_t datasink_archive;
datasink_t datasink_xbstream;
datasink_t datasink_compress;
datasink_t datasink_tmpfile;
2017-04-19 15:09:03 +02:00
static run_mode_t opt_mode;
2017-04-18 20:43:20 +02:00
static char * opt_directory = NULL;
static my_bool opt_verbose = 0;
2017-04-19 15:09:03 +02:00
static int opt_parallel = 1;
2017-04-18 20:43:20 +02:00
static struct my_option my_long_options[] =
{
{"help", '?', "Display this help and exit.",
0, 0, 0, GET_NO_ARG, NO_ARG, 0, 0, 0, 0, 0, 0},
{"create", 'c', "Stream the specified files to the standard output.",
0, 0, 0, GET_NO_ARG, NO_ARG, 0, 0, 0, 0, 0, 0},
{"extract", 'x', "Extract to disk files from the stream on the "
"standard input.",
0, 0, 0, GET_NO_ARG, NO_ARG, 0, 0, 0, 0, 0, 0},
{"directory", 'C', "Change the current directory to the specified one "
"before streaming or extracting.", &opt_directory, &opt_directory, 0,
GET_STR_ALLOC, REQUIRED_ARG, 0, 0, 0, 0, 0, 0},
{"verbose", 'v', "Print verbose output.", &opt_verbose, &opt_verbose,
0, GET_BOOL, NO_ARG, 0, 0, 0, 0, 0, 0},
2017-04-19 15:09:03 +02:00
{"parallel", 'p', "Number of worker threads for reading / writing.",
&opt_parallel, &opt_parallel, 0, GET_INT, REQUIRED_ARG,
1, 1, INT_MAX, 0, 0, 0},
2017-04-18 20:43:20 +02:00
{0, 0, 0, 0, 0, 0, GET_NO_ARG, NO_ARG, 0, 0, 0, 0, 0, 0}
};
2017-04-19 15:09:03 +02:00
typedef struct {
HASH *filehash;
xb_rstream_t *stream;
ds_ctxt_t *ds_ctxt;
pthread_mutex_t *mutex;
} extract_ctxt_t;
2017-04-18 20:43:20 +02:00
typedef struct {
char *path;
uint pathlen;
my_off_t offset;
ds_file_t *file;
2017-04-19 15:09:03 +02:00
pthread_mutex_t mutex;
2017-04-18 20:43:20 +02:00
} file_entry_t;
static int get_options(int *argc, char ***argv);
static int mode_create(int argc, char **argv);
2017-04-19 15:09:03 +02:00
static int mode_extract(int n_threads, int argc, char **argv);
2017-04-18 20:43:20 +02:00
static my_bool get_one_option(int optid, const struct my_option *opt,
char *argument);
int
main(int argc, char **argv)
{
MY_INIT(argv[0]);
2017-04-19 15:09:03 +02:00
crc_init();
2017-04-18 20:43:20 +02:00
if (get_options(&argc, &argv)) {
goto err;
}
if (opt_mode == RUN_MODE_NONE) {
msg("%s: either -c or -x must be specified.", my_progname);
2017-04-18 20:43:20 +02:00
goto err;
}
/* Change the current directory if -C is specified */
if (opt_directory && my_setwd(opt_directory, MYF(MY_WME))) {
goto err;
}
if (opt_mode == RUN_MODE_CREATE && mode_create(argc, argv)) {
goto err;
2017-04-19 15:09:03 +02:00
} else if (opt_mode == RUN_MODE_EXTRACT &&
mode_extract(opt_parallel, argc, argv)) {
2017-04-18 20:43:20 +02:00
goto err;
}
my_cleanup_options(my_long_options);
my_end(0);
return EXIT_SUCCESS;
err:
my_cleanup_options(my_long_options);
my_end(0);
exit(EXIT_FAILURE);
}
static
int
get_options(int *argc, char ***argv)
{
int ho_error;
if ((ho_error= handle_options(argc, argv, my_long_options,
get_one_option))) {
exit(EXIT_FAILURE);
}
return 0;
}
static
void
print_version(void)
{
printf("%s Ver %s for %s (%s)\n", my_progname, XBSTREAM_VERSION,
SYSTEM_TYPE, MACHINE_TYPE);
}
static
void
usage(void)
{
print_version();
puts("Copyright (C) 2011-2013 Percona LLC and/or its affiliates.");
puts("This software comes with ABSOLUTELY NO WARRANTY. "
"This is free software,\nand you are welcome to modify and "
"redistribute it under the GPL license.\n");
puts("Serialize/deserialize files in the XBSTREAM format.\n");
puts("Usage: ");
printf(" %s -c [OPTIONS...] FILES... # stream specified files to "
"standard output.\n", my_progname);
printf(" %s -x [OPTIONS...] # extract files from the stream"
"on the standard input.\n", my_progname);
puts("\nOptions:");
my_print_help(my_long_options);
}
static
int
set_run_mode(run_mode_t mode)
{
if (opt_mode != RUN_MODE_NONE) {
msg("%s: can't set specify both -c and -x.", my_progname);
2017-04-18 20:43:20 +02:00
return 1;
}
opt_mode = mode;
return 0;
}
static
my_bool
get_one_option(int optid, const struct my_option *opt __attribute__((unused)),
char *argument __attribute__((unused)))
{
switch (optid) {
case 'c':
if (set_run_mode(RUN_MODE_CREATE)) {
return TRUE;
}
break;
case 'x':
if (set_run_mode(RUN_MODE_EXTRACT)) {
return TRUE;
}
break;
case '?':
usage();
exit(0);
}
return FALSE;
}
static
int
stream_one_file(File file, xb_wstream_file_t *xbfile)
{
uchar *buf;
ssize_t bytes;
my_off_t offset;
2017-04-18 20:43:20 +02:00
posix_fadvise(file, 0, 0, POSIX_FADV_SEQUENTIAL);
offset = my_tell(file, MYF(MY_WME));
buf = (uchar*)(my_malloc(XBSTREAM_BUFFER_SIZE, MYF(MY_FAE)));
while ((bytes = (ssize_t)my_read(file, buf, XBSTREAM_BUFFER_SIZE,
2017-04-18 20:43:20 +02:00
MYF(MY_WME))) > 0) {
if (xb_stream_write_data(xbfile, buf, bytes)) {
msg("%s: xb_stream_write_data() failed.",
2017-04-18 20:43:20 +02:00
my_progname);
my_free(buf);
return 1;
}
posix_fadvise(file, offset, XBSTREAM_BUFFER_SIZE,
POSIX_FADV_DONTNEED);
offset += XBSTREAM_BUFFER_SIZE;
}
my_free(buf);
if (bytes < 0) {
2017-04-18 20:43:20 +02:00
return 1;
}
return 0;
}
static
int
mode_create(int argc, char **argv)
{
int i;
MY_STAT mystat;
xb_wstream_t *stream;
if (argc < 1) {
msg("%s: no files are specified.", my_progname);
2017-04-18 20:43:20 +02:00
return 1;
}
stream = xb_stream_write_new();
if (stream == NULL) {
msg("%s: xb_stream_write_new() failed.", my_progname);
2017-04-18 20:43:20 +02:00
return 1;
}
for (i = 0; i < argc; i++) {
char *filepath = argv[i];
File src_file;
xb_wstream_file_t *file;
if (my_stat(filepath, &mystat, MYF(MY_WME)) == NULL) {
goto err;
}
if (!MY_S_ISREG(mystat.st_mode)) {
msg("%s: %s is not a regular file, exiting.",
2017-04-18 20:43:20 +02:00
my_progname, filepath);
goto err;
}
if ((src_file = my_open(filepath, O_RDONLY, MYF(MY_WME))) < 0) {
msg("%s: failed to open %s.", my_progname, filepath);
2017-04-18 20:43:20 +02:00
goto err;
}
file = xb_stream_write_open(stream, filepath, &mystat, NULL, NULL);
if (file == NULL) {
goto err;
}
if (opt_verbose) {
msg("%s", filepath);
2017-04-18 20:43:20 +02:00
}
if (stream_one_file(src_file, file) ||
xb_stream_write_close(file) ||
my_close(src_file, MYF(MY_WME))) {
goto err;
}
}
xb_stream_write_done(stream);
return 0;
err:
xb_stream_write_done(stream);
return 1;
}
static
file_entry_t *
2017-04-19 15:09:03 +02:00
file_entry_new(extract_ctxt_t *ctxt, const char *path, uint pathlen)
2017-04-18 20:43:20 +02:00
{
file_entry_t *entry;
ds_file_t *file;
entry = (file_entry_t *) my_malloc(sizeof(file_entry_t),
MYF(MY_WME | MY_ZEROFILL));
if (entry == NULL) {
return NULL;
}
entry->path = my_strndup(path, pathlen, MYF(MY_WME));
if (entry->path == NULL) {
goto err;
}
entry->pathlen = pathlen;
file = ds_open(ctxt->ds_ctxt, path, NULL);
2017-04-18 20:43:20 +02:00
if (file == NULL) {
msg("%s: failed to create file.", my_progname);
2017-04-18 20:43:20 +02:00
goto err;
}
if (opt_verbose) {
msg("%s", entry->path);
2017-04-18 20:43:20 +02:00
}
entry->file = file;
2017-04-19 15:09:03 +02:00
pthread_mutex_init(&entry->mutex, NULL);
2017-04-18 20:43:20 +02:00
return entry;
err:
if (entry->path != NULL) {
my_free(entry->path);
}
my_free(entry);
return NULL;
}
static
uchar *
get_file_entry_key(file_entry_t *entry, size_t *length,
my_bool not_used __attribute__((unused)))
{
*length = entry->pathlen;
return (uchar *) entry->path;
}
static
void
file_entry_free(file_entry_t *entry)
{
2017-04-19 15:09:03 +02:00
pthread_mutex_destroy(&entry->mutex);
2017-04-18 20:43:20 +02:00
ds_close(entry->file);
my_free(entry->path);
my_free(entry);
}
static
2017-04-19 15:09:03 +02:00
void *
extract_worker_thread_func(void *arg)
2017-04-18 20:43:20 +02:00
{
xb_rstream_chunk_t chunk;
file_entry_t *entry;
2017-04-19 15:09:03 +02:00
xb_rstream_result_t res;
2017-04-18 20:43:20 +02:00
2017-04-19 15:09:03 +02:00
extract_ctxt_t *ctxt = (extract_ctxt_t *) arg;
2017-04-18 20:43:20 +02:00
2017-04-19 15:09:03 +02:00
my_thread_init();
2017-04-18 20:43:20 +02:00
2017-04-19 15:09:03 +02:00
memset(&chunk, 0, sizeof(chunk));
while (1) {
pthread_mutex_lock(ctxt->mutex);
res = xb_stream_read_chunk(ctxt->stream, &chunk);
if (res != XB_STREAM_READ_CHUNK) {
pthread_mutex_unlock(ctxt->mutex);
break;
}
2017-04-18 20:43:20 +02:00
/* If unknown type and ignorable flag is set, skip this chunk */
if (chunk.type == XB_CHUNK_TYPE_UNKNOWN && \
!(chunk.flags & XB_STREAM_FLAG_IGNORABLE)) {
2017-04-19 15:09:03 +02:00
pthread_mutex_unlock(ctxt->mutex);
2017-04-18 20:43:20 +02:00
continue;
}
/* See if we already have this file open */
2017-04-19 15:09:03 +02:00
entry = (file_entry_t *) my_hash_search(ctxt->filehash,
2017-04-18 20:43:20 +02:00
(uchar *) chunk.path,
chunk.pathlen);
if (entry == NULL) {
2017-04-19 15:09:03 +02:00
entry = file_entry_new(ctxt,
chunk.path,
2017-04-18 20:43:20 +02:00
chunk.pathlen);
if (entry == NULL) {
2017-04-19 15:09:03 +02:00
pthread_mutex_unlock(ctxt->mutex);
break;
2017-04-18 20:43:20 +02:00
}
2017-04-19 15:09:03 +02:00
if (my_hash_insert(ctxt->filehash, (uchar *) entry)) {
msg("%s: my_hash_insert() failed.",
2017-04-18 20:43:20 +02:00
my_progname);
2017-04-19 15:09:03 +02:00
pthread_mutex_unlock(ctxt->mutex);
break;
2017-04-18 20:43:20 +02:00
}
}
2017-04-19 15:09:03 +02:00
pthread_mutex_lock(&entry->mutex);
pthread_mutex_unlock(ctxt->mutex);
2017-04-18 20:43:20 +02:00
2017-04-19 15:09:03 +02:00
res = xb_stream_validate_checksum(&chunk);
if (res != XB_STREAM_READ_CHUNK) {
pthread_mutex_unlock(&entry->mutex);
break;
}
if (chunk.type == XB_CHUNK_TYPE_EOF) {
pthread_mutex_lock(ctxt->mutex);
2017-04-19 15:09:03 +02:00
pthread_mutex_unlock(&entry->mutex);
my_hash_delete(ctxt->filehash, (uchar *) entry);
pthread_mutex_unlock(ctxt->mutex);
2017-04-18 20:43:20 +02:00
continue;
}
if (entry->offset != chunk.offset) {
msg("%s: out-of-order chunk: real offset = 0x%llx, "
"expected offset = 0x%llx", my_progname,
2017-04-18 20:43:20 +02:00
chunk.offset, entry->offset);
2017-04-19 15:09:03 +02:00
pthread_mutex_unlock(&entry->mutex);
res = XB_STREAM_READ_ERROR;
break;
2017-04-18 20:43:20 +02:00
}
if (ds_write(entry->file, chunk.data, chunk.length)) {
msg("%s: my_write() failed.", my_progname);
2017-04-19 15:09:03 +02:00
pthread_mutex_unlock(&entry->mutex);
res = XB_STREAM_READ_ERROR;
break;
2017-04-18 20:43:20 +02:00
}
entry->offset += chunk.length;
2017-04-19 15:09:03 +02:00
pthread_mutex_unlock(&entry->mutex);
2017-04-18 20:43:20 +02:00
}
2017-04-19 15:09:03 +02:00
if (chunk.data)
my_free(chunk.data);
my_thread_end();
return (void *)(res);
}
static
int
mode_extract(int n_threads, int argc __attribute__((unused)),
char **argv __attribute__((unused)))
{
xb_rstream_t *stream = NULL;
HASH filehash;
ds_ctxt_t *ds_ctxt = NULL;
extract_ctxt_t ctxt;
int i;
pthread_t *tids = NULL;
void **retvals = NULL;
pthread_mutex_t mutex;
int ret = 0;
if (my_hash_init(&filehash, &my_charset_bin, START_FILE_HASH_SIZE,
0, 0, (my_hash_get_key) get_file_entry_key,
(my_hash_free_key) file_entry_free, MYF(0))) {
msg("%s: failed to initialize file hash.", my_progname);
2017-04-19 15:09:03 +02:00
return 1;
}
if (pthread_mutex_init(&mutex, NULL)) {
msg("%s: failed to initialize mutex.", my_progname);
2017-04-19 15:09:03 +02:00
my_hash_free(&filehash);
return 1;
}
/* If --directory is specified, it is already set as CWD by now. */
ds_ctxt = ds_create(".", DS_TYPE_LOCAL);
if (ds_ctxt == NULL) {
ret = 1;
goto exit;
}
stream = xb_stream_read_new();
if (stream == NULL) {
msg("%s: xb_stream_read_new() failed.", my_progname);
2017-04-19 15:09:03 +02:00
pthread_mutex_destroy(&mutex);
ret = 1;
goto exit;
}
ctxt.stream = stream;
ctxt.filehash = &filehash;
ctxt.ds_ctxt = ds_ctxt;
ctxt.mutex = &mutex;
tids = (pthread_t *)calloc(n_threads, sizeof(pthread_t));
retvals = (void **)calloc(n_threads, sizeof(void*));
2017-04-19 15:09:03 +02:00
for (i = 0; i < n_threads; i++)
pthread_create(tids + i, NULL, extract_worker_thread_func,
&ctxt);
for (i = 0; i < n_threads; i++)
pthread_join(tids[i], retvals + i);
for (i = 0; i < n_threads; i++) {
if ((size_t)retvals[i] == XB_STREAM_READ_ERROR) {
2017-04-19 15:09:03 +02:00
ret = 1;
goto exit;
}
}
exit:
pthread_mutex_destroy(&mutex);
free(tids);
free(retvals);
2017-04-18 20:43:20 +02:00
my_hash_free(&filehash);
2017-04-19 15:09:03 +02:00
if (ds_ctxt != NULL) {
ds_destroy(ds_ctxt);
}
2017-04-18 20:43:20 +02:00
xb_stream_read_done(stream);
2017-04-19 15:09:03 +02:00
return ret;
2017-04-18 20:43:20 +02:00
}