mirror of
https://github.com/MariaDB/server.git
synced 2025-01-26 00:34:18 +01:00
73453d8b5e
innobase/log/log0log.c: Auto merged mysql-test/r/rpl_failsafe.result: Auto merged mysql-test/t/rpl_failsafe.test: Auto merged
3245 lines
81 KiB
C++
3245 lines
81 KiB
C++
/* Copyright (C) 2000 MySQL AB & MySQL Finland AB & InnoDB Oy
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; if not, write to the Free Software
|
|
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */
|
|
|
|
/* This file defines the InnoDB handler: the interface between MySQL and
|
|
InnoDB */
|
|
|
|
/* TODO list for the InnoDB handler:
|
|
- Ask Monty if strings of different languages can exist in the same
|
|
database. Answer: in near future yes, but not yet.
|
|
*/
|
|
|
|
#ifdef __GNUC__
|
|
#pragma implementation // gcc: Class implementation
|
|
#endif
|
|
|
|
#include "mysql_priv.h"
|
|
#ifdef HAVE_INNOBASE_DB
|
|
#include <m_ctype.h>
|
|
#include <assert.h>
|
|
#include <hash.h>
|
|
#include <myisampack.h>
|
|
|
|
#define MAX_ULONG_BIT ((ulong) 1 << (sizeof(ulong)*8-1))
|
|
|
|
#include "ha_innobase.h"
|
|
|
|
/* We must declare this here because we undef SAFE_MUTEX below */
|
|
pthread_mutex_t innobase_mutex;
|
|
|
|
/* Store MySQL definition of 'byte': in Linux it is char while InnoDB
|
|
uses unsigned char */
|
|
typedef byte mysql_byte;
|
|
|
|
#ifdef SAFE_MUTEX
|
|
#undef pthread_mutex_t
|
|
#endif
|
|
|
|
#define INSIDE_HA_INNOBASE_CC
|
|
|
|
/* Include necessary InnoDB headers */
|
|
extern "C" {
|
|
#include "../innobase/include/univ.i"
|
|
#include "../innobase/include/srv0start.h"
|
|
#include "../innobase/include/srv0srv.h"
|
|
#include "../innobase/include/trx0roll.h"
|
|
#include "../innobase/include/trx0trx.h"
|
|
#include "../innobase/include/row0ins.h"
|
|
#include "../innobase/include/row0mysql.h"
|
|
#include "../innobase/include/row0sel.h"
|
|
#include "../innobase/include/row0upd.h"
|
|
#include "../innobase/include/log0log.h"
|
|
#include "../innobase/include/lock0lock.h"
|
|
#include "../innobase/include/dict0crea.h"
|
|
#include "../innobase/include/btr0cur.h"
|
|
#include "../innobase/include/btr0btr.h"
|
|
#include "../innobase/include/fsp0fsp.h"
|
|
}
|
|
|
|
#define HA_INNOBASE_ROWS_IN_TABLE 10000 /* to get optimization right */
|
|
#define HA_INNOBASE_RANGE_COUNT 100
|
|
|
|
bool innodb_skip = 0;
|
|
uint innobase_init_flags = 0;
|
|
ulong innobase_cache_size = 0;
|
|
|
|
long innobase_mirrored_log_groups, innobase_log_files_in_group,
|
|
innobase_log_file_size, innobase_log_buffer_size,
|
|
innobase_buffer_pool_size, innobase_additional_mem_pool_size,
|
|
innobase_file_io_threads, innobase_lock_wait_timeout;
|
|
|
|
char *innobase_data_home_dir;
|
|
char *innobase_log_group_home_dir, *innobase_log_arch_dir;
|
|
char *innobase_unix_file_flush_method;
|
|
bool innobase_flush_log_at_trx_commit, innobase_log_archive,
|
|
innobase_use_native_aio;
|
|
|
|
/*
|
|
Set default InnoDB size to 64M, to let users use InnoDB without having
|
|
to specify any startup options.
|
|
*/
|
|
|
|
char *innobase_data_file_path= (char*) "ibdata1:64M";
|
|
char *internal_innobase_data_file_path=0;
|
|
|
|
/* The following counter is used to convey information to InnoDB
|
|
about server activity: in selects it is not sensible to call
|
|
srv_active_wake_master_thread after each fetch or search, we only do
|
|
it every INNOBASE_WAKE_INTERVAL'th step. */
|
|
|
|
#define INNOBASE_WAKE_INTERVAL 32
|
|
ulong innobase_active_counter = 0;
|
|
|
|
char* innobase_home = NULL;
|
|
|
|
char innodb_dummy_stmt_trx_handle = 'D';
|
|
|
|
static HASH innobase_open_tables;
|
|
|
|
static mysql_byte* innobase_get_key(INNOBASE_SHARE *share,uint *length,
|
|
my_bool not_used __attribute__((unused)));
|
|
static INNOBASE_SHARE *get_share(const char *table_name);
|
|
static void free_share(INNOBASE_SHARE *share);
|
|
static void innobase_print_error(const char* db_errpfx, char* buffer);
|
|
|
|
/* General functions */
|
|
|
|
/************************************************************************
|
|
Increments innobase_active_counter and every INNOBASE_WAKE_INTERVALth
|
|
time calls srv_active_wake_master_thread. This function should be used
|
|
when a single database operation may introduce a small need for
|
|
server utility activity, like checkpointing. */
|
|
inline
|
|
void
|
|
innobase_active_small(void)
|
|
/*=======================*/
|
|
{
|
|
innobase_active_counter++;
|
|
|
|
if ((innobase_active_counter % INNOBASE_WAKE_INTERVAL) == 0) {
|
|
srv_active_wake_master_thread();
|
|
}
|
|
}
|
|
|
|
/************************************************************************
|
|
Converts an InnoDB error code to a MySQL error code. */
|
|
static
|
|
int
|
|
convert_error_code_to_mysql(
|
|
/*========================*/
|
|
/* out: MySQL error code */
|
|
int error) /* in: InnoDB error code */
|
|
{
|
|
if (error == DB_SUCCESS) {
|
|
|
|
return(0);
|
|
|
|
} else if (error == (int) DB_DUPLICATE_KEY) {
|
|
|
|
return(HA_ERR_FOUND_DUPP_KEY);
|
|
|
|
} else if (error == (int) DB_RECORD_NOT_FOUND) {
|
|
|
|
return(HA_ERR_NO_ACTIVE_RECORD);
|
|
|
|
} else if (error == (int) DB_ERROR) {
|
|
|
|
return(HA_ERR_NO_ACTIVE_RECORD);
|
|
|
|
} else if (error == (int) DB_DEADLOCK) {
|
|
|
|
return(HA_ERR_LOCK_DEADLOCK);
|
|
|
|
} else if (error == (int) DB_LOCK_WAIT_TIMEOUT) {
|
|
|
|
return(1000001);
|
|
|
|
} else if (error == (int) DB_NO_REFERENCED_ROW) {
|
|
|
|
return(1000010);
|
|
|
|
} else if (error == (int) DB_ROW_IS_REFERENCED) {
|
|
|
|
return(1000011);
|
|
|
|
} else if (error == (int) DB_CANNOT_ADD_CONSTRAINT) {
|
|
|
|
return(1000012);
|
|
|
|
} else if (error == (int) DB_OUT_OF_FILE_SPACE) {
|
|
|
|
return(HA_ERR_RECORD_FILE_FULL);
|
|
|
|
} else if (error == (int) DB_TABLE_IS_BEING_USED) {
|
|
|
|
return(HA_ERR_WRONG_COMMAND);
|
|
|
|
} else if (error == (int) DB_TABLE_NOT_FOUND) {
|
|
|
|
return(HA_ERR_KEY_NOT_FOUND);
|
|
|
|
} else if (error == (int) DB_TOO_BIG_RECORD) {
|
|
|
|
return(HA_ERR_TO_BIG_ROW);
|
|
} else {
|
|
dbug_assert(0);
|
|
|
|
return(-1); // Unknown error
|
|
}
|
|
}
|
|
|
|
extern "C" {
|
|
/*****************************************************************
|
|
Prints info of a THD object (== user session thread) to the
|
|
standatd output. NOTE that mysql/innobase/trx/trx0trx.c must contain
|
|
the prototype for this function! */
|
|
|
|
void
|
|
innobase_mysql_print_thd(
|
|
/*=====================*/
|
|
void* input_thd)/* in: pointer to a MySQL THD object */
|
|
{
|
|
THD* thd;
|
|
|
|
thd = (THD*) input_thd;
|
|
|
|
printf("MySQL thread id %lu, query id %lu",
|
|
thd->thread_id, thd->query_id);
|
|
if (thd->host) {
|
|
printf(" %s", thd->host);
|
|
}
|
|
|
|
if (thd->ip) {
|
|
printf(" %s", thd->ip);
|
|
}
|
|
|
|
if (thd->user) {
|
|
printf(" %s", thd->user);
|
|
}
|
|
|
|
if (thd->proc_info) {
|
|
printf(" %s", thd->proc_info);
|
|
}
|
|
|
|
if (thd->query) {
|
|
printf("\n%-.100s", thd->query);
|
|
}
|
|
|
|
printf("\n");
|
|
}
|
|
}
|
|
|
|
/*************************************************************************
|
|
Gets the InnoDB transaction handle for a MySQL handler object, creates
|
|
an InnoDB transaction struct if the corresponding MySQL thread struct still
|
|
lacks one. */
|
|
static
|
|
trx_t*
|
|
check_trx_exists(
|
|
/*=============*/
|
|
/* out: InnoDB transaction handle */
|
|
THD* thd) /* in: user thread handle */
|
|
{
|
|
trx_t* trx;
|
|
|
|
trx = (trx_t*) thd->transaction.all.innobase_tid;
|
|
|
|
if (trx == NULL) {
|
|
dbug_assert(thd != NULL);
|
|
trx = trx_allocate_for_mysql();
|
|
|
|
trx->mysql_thd = thd;
|
|
|
|
thd->transaction.all.innobase_tid = trx;
|
|
|
|
/* The execution of a single SQL statement is denoted by
|
|
a 'transaction' handle which is a dummy pointer: InnoDB
|
|
remembers internally where the latest SQL statement
|
|
started, and if error handling requires rolling back the
|
|
latest statement, InnoDB does a rollback to a savepoint. */
|
|
|
|
thd->transaction.stmt.innobase_tid =
|
|
(void*)&innodb_dummy_stmt_trx_handle;
|
|
}
|
|
|
|
return(trx);
|
|
}
|
|
|
|
/*************************************************************************
|
|
Updates the user_thd field in a handle and also allocates a new InnoDB
|
|
transaction handle if needed, and updates the transaction fields in the
|
|
prebuilt struct. */
|
|
inline
|
|
int
|
|
ha_innobase::update_thd(
|
|
/*====================*/
|
|
/* out: 0 or error code */
|
|
THD* thd) /* in: thd to use the handle */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
trx_t* trx;
|
|
|
|
trx = check_trx_exists(thd);
|
|
|
|
if (prebuilt->trx != trx) {
|
|
|
|
row_update_prebuilt_trx(prebuilt, trx);
|
|
}
|
|
|
|
user_thd = thd;
|
|
|
|
return(0);
|
|
}
|
|
|
|
/*************************************************************************
|
|
Reads the data files and their sizes from a character string given in
|
|
the .cnf file. */
|
|
static
|
|
bool
|
|
innobase_parse_data_file_paths_and_sizes(void)
|
|
/*==========================================*/
|
|
/* out: TRUE if ok, FALSE if parsing
|
|
error */
|
|
{
|
|
char* str;
|
|
char* endp;
|
|
char* path;
|
|
ulint size;
|
|
ulint i = 0;
|
|
|
|
str = internal_innobase_data_file_path;
|
|
|
|
/* First calculate the number of data files and check syntax:
|
|
path:size[M];path:size[M]... . Note that a Windows path may
|
|
contain a drive name and a ':'. */
|
|
|
|
while (*str != '\0') {
|
|
path = str;
|
|
|
|
while ((*str != ':' && *str != '\0')
|
|
|| (*str == ':'
|
|
&& (*(str + 1) == '\\' || *(str + 1) == '/'))) {
|
|
str++;
|
|
}
|
|
|
|
if (*str == '\0') {
|
|
return(FALSE);
|
|
}
|
|
|
|
str++;
|
|
|
|
size = strtoul(str, &endp, 10);
|
|
|
|
str = endp;
|
|
|
|
if ((*str != 'M') && (*str != 'G')) {
|
|
size = size / (1024 * 1024);
|
|
} else if (*str == 'G') {
|
|
size = size * 1024;
|
|
str++;
|
|
} else {
|
|
str++;
|
|
}
|
|
|
|
if (size >= 4096) {
|
|
fprintf(stderr,
|
|
"InnoDB: error: data file size must not be >= 4096M\n");
|
|
return(FALSE);
|
|
}
|
|
|
|
if (strlen(str) >= 6
|
|
&& *str == 'n'
|
|
&& *(str + 1) == 'e'
|
|
&& *(str + 2) == 'w') {
|
|
str += 3;
|
|
}
|
|
|
|
if (strlen(str) >= 3
|
|
&& *str == 'r'
|
|
&& *(str + 1) == 'a'
|
|
&& *(str + 2) == 'w') {
|
|
str += 3;
|
|
}
|
|
|
|
if (size == 0) {
|
|
return(FALSE);
|
|
}
|
|
|
|
i++;
|
|
|
|
if (*str == ';') {
|
|
str++;
|
|
} else if (*str != '\0') {
|
|
|
|
return(FALSE);
|
|
}
|
|
}
|
|
|
|
srv_data_file_names = (char**)ut_malloc(i * sizeof(void*));
|
|
srv_data_file_sizes = (ulint*)ut_malloc(i * sizeof(ulint));
|
|
srv_data_file_is_raw_partition = (ulint*)ut_malloc(i * sizeof(ulint));
|
|
|
|
srv_n_data_files = i;
|
|
|
|
/* Then store the actual values to our arrays */
|
|
|
|
str = internal_innobase_data_file_path;
|
|
i = 0;
|
|
|
|
while (*str != '\0') {
|
|
path = str;
|
|
|
|
/* Note that we must ignore the ':' in a Windows path */
|
|
|
|
while ((*str != ':' && *str != '\0')
|
|
|| (*str == ':'
|
|
&& (*(str + 1) == '\\' || *(str + 1) == '/'))) {
|
|
str++;
|
|
}
|
|
|
|
if (*str == ':') {
|
|
/* Make path a null-terminated string */
|
|
*str = '\0';
|
|
str++;
|
|
}
|
|
|
|
size = strtoul(str, &endp, 10);
|
|
|
|
str = endp;
|
|
|
|
if ((*str != 'M') && (*str != 'G')) {
|
|
size = size / (1024 * 1024);
|
|
} else if (*str == 'G') {
|
|
size = size * 1024;
|
|
str++;
|
|
} else {
|
|
str++;
|
|
}
|
|
|
|
srv_data_file_is_raw_partition[i] = 0;
|
|
|
|
if (strlen(str) >= 6
|
|
&& *str == 'n'
|
|
&& *(str + 1) == 'e'
|
|
&& *(str + 2) == 'w') {
|
|
str += 3;
|
|
srv_data_file_is_raw_partition[i] = SRV_NEW_RAW;
|
|
}
|
|
|
|
if (strlen(str) >= 3
|
|
&& *str == 'r'
|
|
&& *(str + 1) == 'a'
|
|
&& *(str + 2) == 'w') {
|
|
str += 3;
|
|
|
|
if (srv_data_file_is_raw_partition[i] == 0) {
|
|
srv_data_file_is_raw_partition[i] = SRV_OLD_RAW;
|
|
}
|
|
}
|
|
|
|
srv_data_file_names[i] = path;
|
|
srv_data_file_sizes[i] = size;
|
|
|
|
i++;
|
|
|
|
if (*str == ';') {
|
|
str++;
|
|
}
|
|
}
|
|
|
|
return(TRUE);
|
|
}
|
|
|
|
/*************************************************************************
|
|
Reads log group home directories from a character string given in
|
|
the .cnf file. */
|
|
static
|
|
bool
|
|
innobase_parse_log_group_home_dirs(void)
|
|
/*====================================*/
|
|
/* out: TRUE if ok, FALSE if parsing
|
|
error */
|
|
{
|
|
char* str;
|
|
char* path;
|
|
ulint i = 0;
|
|
|
|
str = innobase_log_group_home_dir;
|
|
|
|
/* First calculate the number of directories and check syntax:
|
|
path;path;... */
|
|
|
|
while (*str != '\0') {
|
|
path = str;
|
|
|
|
while (*str != ';' && *str != '\0') {
|
|
str++;
|
|
}
|
|
|
|
i++;
|
|
|
|
if (*str == ';') {
|
|
str++;
|
|
} else if (*str != '\0') {
|
|
|
|
return(FALSE);
|
|
}
|
|
}
|
|
|
|
if (i != (ulint) innobase_mirrored_log_groups) {
|
|
|
|
return(FALSE);
|
|
}
|
|
|
|
srv_log_group_home_dirs = (char**) ut_malloc(i * sizeof(void*));
|
|
|
|
/* Then store the actual values to our array */
|
|
|
|
str = innobase_log_group_home_dir;
|
|
i = 0;
|
|
|
|
while (*str != '\0') {
|
|
path = str;
|
|
|
|
while (*str != ';' && *str != '\0') {
|
|
str++;
|
|
}
|
|
|
|
if (*str == ';') {
|
|
*str = '\0';
|
|
str++;
|
|
}
|
|
|
|
srv_log_group_home_dirs[i] = path;
|
|
|
|
i++;
|
|
}
|
|
|
|
return(TRUE);
|
|
}
|
|
|
|
/*************************************************************************
|
|
Opens an InnoDB database. */
|
|
|
|
bool
|
|
innobase_init(void)
|
|
/*===============*/
|
|
/* out: TRUE if error */
|
|
{
|
|
int err;
|
|
bool ret;
|
|
char current_lib[2], *default_path;
|
|
|
|
DBUG_ENTER("innobase_init");
|
|
|
|
/*
|
|
When using the embedded server, the datadirectory is not
|
|
in the current directory.
|
|
*/
|
|
if (!mysql_embedded)
|
|
default_path=mysql_real_data_home;
|
|
else
|
|
{
|
|
/* It's better to use current lib, to keep path's short */
|
|
current_lib[0]=FN_CURLIB;
|
|
current_lib[1]=FN_LIBCHAR;
|
|
default_path=current_lib;
|
|
}
|
|
|
|
if (specialflag & SPECIAL_NO_PRIOR) {
|
|
srv_set_thread_priorities = FALSE;
|
|
} else {
|
|
srv_set_thread_priorities = TRUE;
|
|
srv_query_thread_priority = QUERY_PRIOR;
|
|
}
|
|
|
|
/* Set InnoDB initialization parameters according to the values
|
|
read from MySQL .cnf file */
|
|
|
|
// Make a copy of innobase_data_file_path to not modify the original
|
|
internal_innobase_data_file_path=my_strdup(innobase_data_file_path,
|
|
MYF(MY_WME));
|
|
|
|
srv_data_home = (innobase_data_home_dir ? innobase_data_home_dir :
|
|
default_path);
|
|
srv_logs_home = (char*) "";
|
|
srv_arch_dir = (innobase_log_arch_dir ? innobase_log_arch_dir :
|
|
default_path);
|
|
|
|
ret = innobase_parse_data_file_paths_and_sizes();
|
|
|
|
if (ret == FALSE) {
|
|
fprintf(stderr, "InnoDB: syntax error in innodb_data_file_path\n");
|
|
DBUG_RETURN(TRUE);
|
|
}
|
|
|
|
if (!innobase_log_group_home_dir)
|
|
innobase_log_group_home_dir= default_path;
|
|
ret = innobase_parse_log_group_home_dirs();
|
|
|
|
if (ret == FALSE) {
|
|
DBUG_RETURN(TRUE);
|
|
}
|
|
|
|
srv_unix_file_flush_method_str = (innobase_unix_file_flush_method ?
|
|
innobase_unix_file_flush_method :
|
|
(char*)"fdatasync");
|
|
|
|
srv_n_log_groups = (ulint) innobase_mirrored_log_groups;
|
|
srv_n_log_files = (ulint) innobase_log_files_in_group;
|
|
srv_log_file_size = (ulint) innobase_log_file_size;
|
|
|
|
srv_log_archive_on = (ulint) innobase_log_archive;
|
|
srv_log_buffer_size = (ulint) innobase_log_buffer_size;
|
|
srv_flush_log_at_trx_commit = (ulint) innobase_flush_log_at_trx_commit;
|
|
|
|
srv_use_native_aio = 0;
|
|
|
|
srv_pool_size = (ulint) innobase_buffer_pool_size;
|
|
srv_mem_pool_size = (ulint) innobase_additional_mem_pool_size;
|
|
|
|
srv_n_file_io_threads = (ulint) innobase_file_io_threads;
|
|
|
|
srv_lock_wait_timeout = (ulint) innobase_lock_wait_timeout;
|
|
|
|
srv_print_verbose_log = mysql_embedded ? 0 : 1;
|
|
if (strcmp(default_charset_info->name, "latin1") == 0) {
|
|
/* Store the character ordering table to InnoDB.
|
|
For non-latin1 charsets we use the MySQL comparison
|
|
functions, and consequently we do not need to know
|
|
the ordering internally in InnoDB. */
|
|
|
|
memcpy(srv_latin1_ordering,
|
|
default_charset_info->sort_order, 256);
|
|
}
|
|
|
|
err = innobase_start_or_create_for_mysql();
|
|
|
|
if (err != DB_SUCCESS) {
|
|
|
|
DBUG_RETURN(1);
|
|
}
|
|
(void) hash_init(&innobase_open_tables,32,0,0,
|
|
(hash_get_key) innobase_get_key,0,0);
|
|
pthread_mutex_init(&innobase_mutex,MY_MUTEX_INIT_FAST);
|
|
DBUG_RETURN(0);
|
|
}
|
|
|
|
/***********************************************************************
|
|
Closes an InnoDB database. */
|
|
|
|
bool
|
|
innobase_end(void)
|
|
/*==============*/
|
|
/* out: TRUE if error */
|
|
{
|
|
int err;
|
|
|
|
DBUG_ENTER("innobase_end");
|
|
|
|
err = innobase_shutdown_for_mysql();
|
|
hash_free(&innobase_open_tables);
|
|
my_free(internal_innobase_data_file_path,MYF(MY_ALLOW_ZERO_PTR));
|
|
|
|
if (err != DB_SUCCESS) {
|
|
|
|
DBUG_RETURN(1);
|
|
}
|
|
|
|
DBUG_RETURN(0);
|
|
}
|
|
|
|
/********************************************************************
|
|
Flushes InnoDB logs to disk and makes a checkpoint. Really, a commit
|
|
flushes logs, and the name of this function should be innobase_checkpoint. */
|
|
|
|
bool
|
|
innobase_flush_logs(void)
|
|
/*=====================*/
|
|
/* out: TRUE if error */
|
|
{
|
|
bool result = 0;
|
|
|
|
DBUG_ENTER("innobase_flush_logs");
|
|
|
|
log_flush_up_to(ut_dulint_max, LOG_WAIT_ONE_GROUP);
|
|
|
|
DBUG_RETURN(result);
|
|
}
|
|
|
|
/*************************************************************************
|
|
Gets the free space in an InnoDB database: returned in units of kB. */
|
|
|
|
uint
|
|
innobase_get_free_space(void)
|
|
/*=========================*/
|
|
/* out: free space in kB */
|
|
{
|
|
return((uint) fsp_get_available_space_in_free_extents(0));
|
|
}
|
|
|
|
/*********************************************************************
|
|
Commits a transaction in an InnoDB database. */
|
|
|
|
int
|
|
innobase_commit(
|
|
/*============*/
|
|
/* out: 0 or error number */
|
|
THD* thd, /* in: MySQL thread handle of the user for whom
|
|
the transaction should be committed */
|
|
void* trx_handle)/* in: InnoDB trx handle or NULL: NULL means
|
|
that the current SQL statement ended, and we should
|
|
mark the start of a new statement with a savepoint */
|
|
{
|
|
int error = 0;
|
|
trx_t* trx;
|
|
|
|
DBUG_ENTER("innobase_commit");
|
|
DBUG_PRINT("trans", ("ending transaction"));
|
|
|
|
trx = check_trx_exists(thd);
|
|
|
|
if (trx_handle != (void*)&innodb_dummy_stmt_trx_handle) {
|
|
trx_commit_for_mysql(trx);
|
|
trx_mark_sql_stat_end_do_not_start_new(trx);
|
|
} else {
|
|
trx_mark_sql_stat_end(trx);
|
|
}
|
|
|
|
#ifndef DBUG_OFF
|
|
if (error) {
|
|
DBUG_PRINT("error", ("error: %d", error));
|
|
}
|
|
#endif
|
|
/* Tell InnoDB server that there might be work for
|
|
utility threads: */
|
|
|
|
srv_active_wake_master_thread();
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/*********************************************************************
|
|
Rolls back a transaction in an InnoDB database. */
|
|
|
|
int
|
|
innobase_rollback(
|
|
/*==============*/
|
|
/* out: 0 or error number */
|
|
THD* thd, /* in: handle to the MySQL thread of the user
|
|
whose transaction should be rolled back */
|
|
void* trx_handle)/* in: InnoDB trx handle or a dummy stmt handle */
|
|
{
|
|
int error = 0;
|
|
trx_t* trx;
|
|
|
|
DBUG_ENTER("innobase_rollback");
|
|
DBUG_PRINT("trans", ("aborting transaction"));
|
|
|
|
trx = check_trx_exists(thd);
|
|
|
|
if (trx_handle != (void*)&innodb_dummy_stmt_trx_handle) {
|
|
error = trx_rollback_for_mysql(trx);
|
|
trx_mark_sql_stat_end_do_not_start_new(trx);
|
|
} else {
|
|
error = trx_rollback_last_sql_stat_for_mysql(trx);
|
|
trx_mark_sql_stat_end(trx);
|
|
}
|
|
|
|
DBUG_RETURN(convert_error_code_to_mysql(error));
|
|
}
|
|
|
|
/*********************************************************************
|
|
Frees a possible InnoDB trx object associated with the current
|
|
THD. */
|
|
|
|
int
|
|
innobase_close_connection(
|
|
/*======================*/
|
|
/* out: 0 or error number */
|
|
THD* thd) /* in: handle to the MySQL thread of the user
|
|
whose transaction should be rolled back */
|
|
{
|
|
if (NULL != thd->transaction.all.innobase_tid) {
|
|
trx_rollback_for_mysql((trx_t*)
|
|
(thd->transaction.all.innobase_tid));
|
|
trx_free_for_mysql((trx_t*)
|
|
(thd->transaction.all.innobase_tid));
|
|
}
|
|
|
|
return(0);
|
|
}
|
|
|
|
/**********************************************************************
|
|
Prints an error message. */
|
|
static
|
|
void
|
|
innobase_print_error(
|
|
/*=================*/
|
|
const char* db_errpfx, /* in: error prefix text */
|
|
char* buffer) /* in: error text */
|
|
{
|
|
sql_print_error("%s: %s", db_errpfx, buffer);
|
|
}
|
|
|
|
|
|
/*****************************************************************************
|
|
** InnoDB database tables
|
|
*****************************************************************************/
|
|
|
|
/********************************************************************
|
|
This function is not relevant since we store the tables and indexes
|
|
into our own tablespace, not as files, whose extension this function would
|
|
give. */
|
|
|
|
const char**
|
|
ha_innobase::bas_ext() const
|
|
/*========================*/
|
|
/* out: file extension strings, currently not
|
|
used */
|
|
{
|
|
static const char* ext[] = {".InnoDB", NullS};
|
|
|
|
return(ext);
|
|
}
|
|
|
|
/*********************************************************************
|
|
Normalizes a table name string. A normalized name consists of the
|
|
database name catenated to '/' and table name. An example:
|
|
test/mytable. */
|
|
static
|
|
void
|
|
normalize_table_name(
|
|
/*=================*/
|
|
char* norm_name, /* out: normalized name as a
|
|
null-terminated string */
|
|
const char* name) /* in: table name string */
|
|
{
|
|
char* name_ptr;
|
|
char* db_ptr;
|
|
char* ptr;
|
|
|
|
/* Scan name from the end */
|
|
|
|
ptr = strend(name)-1;
|
|
|
|
while (ptr >= name && *ptr != '\\' && *ptr != '/') {
|
|
ptr--;
|
|
}
|
|
|
|
name_ptr = ptr + 1;
|
|
|
|
dbug_assert(ptr > name);
|
|
|
|
ptr--;
|
|
|
|
while (ptr >= name && *ptr != '\\' && *ptr != '/') {
|
|
ptr--;
|
|
}
|
|
|
|
db_ptr = ptr + 1;
|
|
|
|
memcpy(norm_name, db_ptr, strlen(name) + 1 - (db_ptr - name));
|
|
|
|
norm_name[name_ptr - db_ptr - 1] = '/';
|
|
}
|
|
|
|
/*********************************************************************
|
|
Creates and opens a handle to a table which already exists in an Innobase
|
|
database. */
|
|
|
|
int
|
|
ha_innobase::open(
|
|
/*==============*/
|
|
/* out: 1 if error, 0 if success */
|
|
const char* name, /* in: table name */
|
|
int mode, /* in: not used */
|
|
uint test_if_locked) /* in: not used */
|
|
{
|
|
dict_table_t* ib_table;
|
|
int error = 0;
|
|
uint buff_len;
|
|
char norm_name[1000];
|
|
|
|
DBUG_ENTER("ha_innobase::open");
|
|
|
|
UT_NOT_USED(mode);
|
|
UT_NOT_USED(test_if_locked);
|
|
|
|
normalize_table_name(norm_name, name);
|
|
|
|
user_thd = NULL;
|
|
|
|
last_query_id = (ulong)-1;
|
|
|
|
if (!(share=get_share(name)))
|
|
DBUG_RETURN(1);
|
|
|
|
/* Create buffers for packing the fields of a record. Why
|
|
table->reclength did not work here? Obviously, because char
|
|
fields when packed actually became 1 byte longer, when we also
|
|
stored the string length as the first byte. */
|
|
|
|
buff_len = table->reclength + table->max_key_length
|
|
+ MAX_REF_PARTS * 3;
|
|
if (!(mysql_byte*) my_multi_malloc(MYF(MY_WME),
|
|
&upd_buff, buff_len,
|
|
&key_val_buff, buff_len,
|
|
NullS)) {
|
|
free_share(share);
|
|
DBUG_RETURN(1);
|
|
}
|
|
|
|
/* Get pointer to a table object in InnoDB dictionary cache */
|
|
|
|
if (NULL == (ib_table = dict_table_get(norm_name, NULL))) {
|
|
|
|
fprintf(stderr,
|
|
"InnoDB: Cannot find table %s from the internal data dictionary\n"
|
|
"InnoDB: of InnoDB though the .frm file for the table exists. Maybe you\n"
|
|
"InnoDB: have deleted and recreated InnoDB data files but have forgotten\n"
|
|
"InnoDB: to delete the corresponding .frm files of InnoDB tables?\n",
|
|
norm_name);
|
|
|
|
free_share(share);
|
|
my_free((char*) upd_buff, MYF(0));
|
|
my_errno = ENOENT;
|
|
DBUG_RETURN(1);
|
|
}
|
|
|
|
innobase_prebuilt = row_create_prebuilt(ib_table);
|
|
|
|
((row_prebuilt_t*)innobase_prebuilt)->mysql_row_len = table->reclength;
|
|
|
|
primary_key = MAX_KEY;
|
|
|
|
if (!row_table_got_default_clust_index(ib_table)) {
|
|
|
|
/* If we automatically created the clustered index,
|
|
then MySQL does not know about it and it must not be aware
|
|
of the index used on scan, to avoid checking if we update
|
|
the column of the index. The column is the row id in
|
|
the automatical case, and it will not be updated. */
|
|
|
|
((row_prebuilt_t*)innobase_prebuilt)
|
|
->clust_index_was_generated = FALSE;
|
|
|
|
primary_key = 0;
|
|
key_used_on_scan = 0;
|
|
|
|
/* MySQL allocates the buffer for ref */
|
|
|
|
ref_length = table->key_info->key_length
|
|
+ table->key_info->key_parts + 10;
|
|
|
|
/* One byte per key field is consumed to the SQL NULL
|
|
info of the field; we add also 10 bytes of safety margin */
|
|
} else {
|
|
((row_prebuilt_t*)innobase_prebuilt)
|
|
->clust_index_was_generated = TRUE;
|
|
|
|
ref_length = DATA_ROW_ID_LEN + 10;
|
|
|
|
dbug_assert(key_used_on_scan == MAX_KEY);
|
|
}
|
|
|
|
/* Init table lock structure */
|
|
thr_lock_data_init(&share->lock,&lock,(void*) 0);
|
|
|
|
info(HA_STATUS_NO_LOCK | HA_STATUS_VARIABLE | HA_STATUS_CONST);
|
|
|
|
DBUG_RETURN(0);
|
|
}
|
|
|
|
/*********************************************************************
|
|
Does nothing. */
|
|
|
|
void
|
|
ha_innobase::initialize(void)
|
|
/*=========================*/
|
|
{
|
|
}
|
|
|
|
/**********************************************************************
|
|
Closes a handle to an InnoDB table. */
|
|
|
|
int
|
|
ha_innobase::close(void)
|
|
/*====================*/
|
|
/* out: error number */
|
|
{
|
|
DBUG_ENTER("ha_innobase::close");
|
|
|
|
row_prebuilt_free((row_prebuilt_t*) innobase_prebuilt);
|
|
|
|
my_free((char*) upd_buff, MYF(0));
|
|
free_share(share);
|
|
|
|
/* Tell InnoDB server that there might be work for
|
|
utility threads: */
|
|
|
|
srv_active_wake_master_thread();
|
|
|
|
DBUG_RETURN(0);
|
|
}
|
|
|
|
/* The following accessor functions should really be inside MySQL code! */
|
|
|
|
/******************************************************************
|
|
Gets field offset for a field in a table. */
|
|
inline
|
|
uint
|
|
get_field_offset(
|
|
/*=============*/
|
|
/* out: offset */
|
|
TABLE* table, /* in: MySQL table object */
|
|
Field* field) /* in: MySQL field object */
|
|
{
|
|
return((uint) (field->ptr - (char*) table->record[0]));
|
|
}
|
|
|
|
/******************************************************************
|
|
Checks if a field in a record is SQL NULL. Uses the record format
|
|
information in table to track the null bit in record. */
|
|
inline
|
|
uint
|
|
field_in_record_is_null(
|
|
/*====================*/
|
|
/* out: 1 if NULL, 0 otherwise */
|
|
TABLE* table, /* in: MySQL table object */
|
|
Field* field, /* in: MySQL field object */
|
|
char* record) /* in: a row in MySQL format */
|
|
{
|
|
int null_offset;
|
|
|
|
if (!field->null_ptr) {
|
|
|
|
return(0);
|
|
}
|
|
|
|
null_offset = (uint) ((char*) field->null_ptr
|
|
- (char*) table->record[0]);
|
|
|
|
if (record[null_offset] & field->null_bit) {
|
|
|
|
return(1);
|
|
}
|
|
|
|
return(0);
|
|
}
|
|
|
|
/******************************************************************
|
|
Sets a field in a record to SQL NULL. Uses the record format
|
|
information in table to track the null bit in record. */
|
|
inline
|
|
void
|
|
set_field_in_record_to_null(
|
|
/*========================*/
|
|
TABLE* table, /* in: MySQL table object */
|
|
Field* field, /* in: MySQL field object */
|
|
char* record) /* in: a row in MySQL format */
|
|
{
|
|
int null_offset;
|
|
|
|
null_offset = (uint) ((char*) field->null_ptr
|
|
- (char*) table->record[0]);
|
|
|
|
record[null_offset] = record[null_offset] | field->null_bit;
|
|
}
|
|
|
|
/******************************************************************
|
|
Resets SQL NULL bits in a record to zero. */
|
|
inline
|
|
void
|
|
reset_null_bits(
|
|
/*============*/
|
|
TABLE* table, /* in: MySQL table object */
|
|
char* record) /* in: a row in MySQL format */
|
|
{
|
|
bzero(record, table->null_bytes);
|
|
}
|
|
|
|
extern "C" {
|
|
/*****************************************************************
|
|
InnoDB uses this function is to compare two data fields for which the
|
|
data type is such that we must use MySQL code to compare them. NOTE that the
|
|
prototype of this function is in rem0cmp.c in InnoDB source code!
|
|
If you change this function, remember to update the prototype there! */
|
|
|
|
int
|
|
innobase_mysql_cmp(
|
|
/*===============*/
|
|
/* out: 1, 0, -1, if a is greater,
|
|
equal, less than b, respectively */
|
|
int mysql_type, /* in: MySQL type */
|
|
unsigned char* a, /* in: data field */
|
|
unsigned int a_length, /* in: data field length,
|
|
not UNIV_SQL_NULL */
|
|
unsigned char* b, /* in: data field */
|
|
unsigned int b_length) /* in: data field length,
|
|
not UNIV_SQL_NULL */
|
|
{
|
|
enum_field_types mysql_tp;
|
|
int ret;
|
|
|
|
dbug_assert(a_length != UNIV_SQL_NULL);
|
|
dbug_assert(b_length != UNIV_SQL_NULL);
|
|
|
|
mysql_tp = (enum_field_types) mysql_type;
|
|
|
|
switch (mysql_tp) {
|
|
|
|
case FIELD_TYPE_STRING:
|
|
case FIELD_TYPE_VAR_STRING:
|
|
ret = my_sortncmp((const char*) a, a_length,
|
|
(const char*) b, b_length);
|
|
if (ret < 0) {
|
|
return(-1);
|
|
} else if (ret > 0) {
|
|
return(1);
|
|
} else {
|
|
return(0);
|
|
}
|
|
default:
|
|
assert(0);
|
|
}
|
|
|
|
return(0);
|
|
}
|
|
}
|
|
|
|
/******************************************************************
|
|
Converts a MySQL type to an InnoDB type. */
|
|
inline
|
|
ulint
|
|
get_innobase_type_from_mysql_type(
|
|
/*==============================*/
|
|
/* out: DATA_BINARY, DATA_VARCHAR, ... */
|
|
Field* field) /* in: MySQL field */
|
|
{
|
|
/* The following asserts check that MySQL type code fits in
|
|
8 bits: this is used in ibuf and also when DATA_NOT_NULL is
|
|
ORed to the type */
|
|
|
|
dbug_assert((ulint)FIELD_TYPE_STRING < 256);
|
|
dbug_assert((ulint)FIELD_TYPE_VAR_STRING < 256);
|
|
dbug_assert((ulint)FIELD_TYPE_DOUBLE < 256);
|
|
dbug_assert((ulint)FIELD_TYPE_FLOAT < 256);
|
|
dbug_assert((ulint)FIELD_TYPE_DECIMAL < 256);
|
|
|
|
switch (field->type()) {
|
|
case FIELD_TYPE_VAR_STRING: if (field->flags & BINARY_FLAG) {
|
|
|
|
return(DATA_BINARY);
|
|
} else if (strcmp(
|
|
default_charset_info->name,
|
|
"latin1") == 0) {
|
|
return(DATA_VARCHAR);
|
|
} else {
|
|
return(DATA_VARMYSQL);
|
|
}
|
|
case FIELD_TYPE_STRING: if (field->flags & BINARY_FLAG) {
|
|
|
|
return(DATA_FIXBINARY);
|
|
} else if (strcmp(
|
|
default_charset_info->name,
|
|
"latin1") == 0) {
|
|
return(DATA_CHAR);
|
|
} else {
|
|
return(DATA_MYSQL);
|
|
}
|
|
case FIELD_TYPE_LONG:
|
|
case FIELD_TYPE_LONGLONG:
|
|
case FIELD_TYPE_TINY:
|
|
case FIELD_TYPE_SHORT:
|
|
case FIELD_TYPE_INT24:
|
|
case FIELD_TYPE_DATE:
|
|
case FIELD_TYPE_DATETIME:
|
|
case FIELD_TYPE_YEAR:
|
|
case FIELD_TYPE_NEWDATE:
|
|
case FIELD_TYPE_ENUM:
|
|
case FIELD_TYPE_SET:
|
|
case FIELD_TYPE_TIME:
|
|
case FIELD_TYPE_TIMESTAMP:
|
|
return(DATA_INT);
|
|
case FIELD_TYPE_FLOAT:
|
|
return(DATA_FLOAT);
|
|
case FIELD_TYPE_DOUBLE:
|
|
return(DATA_DOUBLE);
|
|
case FIELD_TYPE_DECIMAL:
|
|
return(DATA_DECIMAL);
|
|
case FIELD_TYPE_TINY_BLOB:
|
|
case FIELD_TYPE_MEDIUM_BLOB:
|
|
case FIELD_TYPE_BLOB:
|
|
case FIELD_TYPE_LONG_BLOB:
|
|
return(DATA_BLOB);
|
|
default:
|
|
assert(0);
|
|
}
|
|
|
|
return(0);
|
|
}
|
|
|
|
/***********************************************************************
|
|
Stores a key value for a row to a buffer. */
|
|
|
|
uint
|
|
ha_innobase::store_key_val_for_row(
|
|
/*===============================*/
|
|
/* out: key value length as stored in buff */
|
|
uint keynr, /* in: key number */
|
|
char* buff, /* in/out: buffer for the key value (in MySQL
|
|
format) */
|
|
const mysql_byte* record)/* in: row in MySQL format */
|
|
{
|
|
KEY* key_info = table->key_info + keynr;
|
|
KEY_PART_INFO* key_part = key_info->key_part;
|
|
KEY_PART_INFO* end = key_part + key_info->key_parts;
|
|
char* buff_start = buff;
|
|
|
|
DBUG_ENTER("store_key_val_for_row");
|
|
|
|
for (; key_part != end; key_part++) {
|
|
|
|
if (key_part->null_bit) {
|
|
/* Store 0 if the key part is a NULL part */
|
|
|
|
if (record[key_part->null_offset]
|
|
& key_part->null_bit) {
|
|
*buff++ = 1;
|
|
continue;
|
|
}
|
|
|
|
*buff++ = 0;
|
|
}
|
|
|
|
memcpy(buff, record + key_part->offset, key_part->length);
|
|
buff += key_part->length;
|
|
}
|
|
|
|
DBUG_RETURN(buff - buff_start);
|
|
}
|
|
|
|
/******************************************************************
|
|
Builds a template to the prebuilt struct. */
|
|
static
|
|
void
|
|
build_template(
|
|
/*===========*/
|
|
row_prebuilt_t* prebuilt, /* in: prebuilt struct */
|
|
THD* thd, /* in: current user thread, used
|
|
only if templ_type is
|
|
ROW_MYSQL_REC_FIELDS */
|
|
TABLE* table, /* in: MySQL table */
|
|
ulint templ_type) /* in: ROW_MYSQL_WHOLE_ROW or
|
|
ROW_MYSQL_REC_FIELDS */
|
|
{
|
|
dict_index_t* index;
|
|
dict_index_t* clust_index;
|
|
mysql_row_templ_t* templ;
|
|
Field* field;
|
|
ulint n_fields;
|
|
ulint n_requested_fields = 0;
|
|
ulint i;
|
|
|
|
clust_index = dict_table_get_first_index_noninline(prebuilt->table);
|
|
|
|
if (!prebuilt->in_update_remember_pos) {
|
|
/* We are building a temporary table: fetch all columns */
|
|
|
|
templ_type = ROW_MYSQL_WHOLE_ROW;
|
|
}
|
|
|
|
if (prebuilt->select_lock_type == LOCK_X) {
|
|
/* TODO: should fix the code in sql_update so that we could do
|
|
with fetching only the needed columns */
|
|
|
|
templ_type = ROW_MYSQL_WHOLE_ROW;
|
|
}
|
|
|
|
|
|
if (templ_type == ROW_MYSQL_REC_FIELDS) {
|
|
|
|
if (prebuilt->select_lock_type != LOCK_NONE) {
|
|
/* Let index be the clustered index */
|
|
|
|
index = clust_index;
|
|
} else {
|
|
index = prebuilt->index;
|
|
}
|
|
} else {
|
|
index = clust_index;
|
|
}
|
|
|
|
if (index == clust_index) {
|
|
prebuilt->need_to_access_clustered = TRUE;
|
|
} else {
|
|
prebuilt->need_to_access_clustered = FALSE;
|
|
/* Below we check column by column if we need to access
|
|
the clustered index */
|
|
}
|
|
|
|
n_fields = (ulint)table->fields;
|
|
|
|
if (!prebuilt->mysql_template) {
|
|
prebuilt->mysql_template = (mysql_row_templ_t*)
|
|
mem_alloc_noninline(
|
|
n_fields * sizeof(mysql_row_templ_t));
|
|
}
|
|
|
|
prebuilt->template_type = templ_type;
|
|
prebuilt->null_bitmap_len = table->null_bytes;
|
|
|
|
prebuilt->templ_contains_blob = FALSE;
|
|
|
|
for (i = 0; i < n_fields; i++) {
|
|
templ = prebuilt->mysql_template + n_requested_fields;
|
|
field = table->field[i];
|
|
|
|
if (templ_type == ROW_MYSQL_REC_FIELDS
|
|
&& thd->query_id != field->query_id
|
|
&& thd->query_id != (field->query_id ^ MAX_ULONG_BIT)
|
|
&& thd->query_id !=
|
|
(field->query_id ^ (MAX_ULONG_BIT >> 1))) {
|
|
|
|
/* This field is not needed in the query, skip it */
|
|
|
|
goto skip_field;
|
|
}
|
|
|
|
n_requested_fields++;
|
|
|
|
templ->col_no = i;
|
|
|
|
if (index == clust_index) {
|
|
templ->rec_field_no = (index->table->cols + i)
|
|
->clust_pos;
|
|
} else {
|
|
templ->rec_field_no = dict_index_get_nth_col_pos(
|
|
index, i);
|
|
}
|
|
|
|
if (templ->rec_field_no == ULINT_UNDEFINED) {
|
|
prebuilt->need_to_access_clustered = TRUE;
|
|
}
|
|
|
|
if (field->null_ptr) {
|
|
templ->mysql_null_byte_offset =
|
|
(ulint) ((char*) field->null_ptr
|
|
- (char*) table->record[0]);
|
|
|
|
templ->mysql_null_bit_mask = (ulint) field->null_bit;
|
|
} else {
|
|
templ->mysql_null_bit_mask = 0;
|
|
}
|
|
|
|
templ->mysql_col_offset = (ulint)
|
|
get_field_offset(table, field);
|
|
|
|
templ->mysql_col_len = (ulint) field->pack_length();
|
|
templ->type = get_innobase_type_from_mysql_type(field);
|
|
templ->is_unsigned = (ulint) (field->flags & UNSIGNED_FLAG);
|
|
|
|
if (templ->type == DATA_BLOB) {
|
|
prebuilt->templ_contains_blob = TRUE;
|
|
}
|
|
skip_field:
|
|
;
|
|
}
|
|
|
|
prebuilt->n_template = n_requested_fields;
|
|
|
|
if (prebuilt->need_to_access_clustered) {
|
|
/* Change rec_field_no's to correspond to the clustered index
|
|
record */
|
|
for (i = 0; i < n_requested_fields; i++) {
|
|
templ = prebuilt->mysql_template + i;
|
|
|
|
templ->rec_field_no =
|
|
(index->table->cols + templ->col_no)->clust_pos;
|
|
}
|
|
}
|
|
|
|
if (templ_type == ROW_MYSQL_REC_FIELDS
|
|
&& prebuilt->select_lock_type != LOCK_NONE) {
|
|
|
|
prebuilt->need_to_access_clustered = TRUE;
|
|
}
|
|
}
|
|
|
|
/************************************************************************
|
|
Stores a row in an InnoDB database, to the table specified in this
|
|
handle. */
|
|
|
|
int
|
|
ha_innobase::write_row(
|
|
/*===================*/
|
|
/* out: error code */
|
|
mysql_byte* record) /* in: a row in MySQL format */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*)innobase_prebuilt;
|
|
int error;
|
|
longlong auto_inc;
|
|
|
|
DBUG_ENTER("ha_innobase::write_row");
|
|
|
|
statistic_increment(ha_write_count, &LOCK_status);
|
|
|
|
if (table->time_stamp) {
|
|
update_timestamp(record + table->time_stamp - 1);
|
|
}
|
|
|
|
if (last_query_id != user_thd->query_id) {
|
|
prebuilt->sql_stat_start = TRUE;
|
|
last_query_id = user_thd->query_id;
|
|
}
|
|
|
|
if (table->next_number_field && record == table->record[0]) {
|
|
/* Set the 'in_update_remember_pos' flag to FALSE to
|
|
make sure all columns are fetched in the select done by
|
|
update_auto_increment */
|
|
|
|
/* Fetch the value the user possibly has set in the
|
|
autoincrement field */
|
|
|
|
auto_inc = table->next_number_field->val_int();
|
|
|
|
/* In replication and also otherwise the auto-inc column
|
|
can be set with SET INSERT_ID. Then we must look at
|
|
user_thd->next_insert_id. If it is nonzero and the user
|
|
has not supplied a value, we must use it. */
|
|
|
|
if (auto_inc == 0 && user_thd->next_insert_id != 0) {
|
|
auto_inc = user_thd->next_insert_id;
|
|
}
|
|
|
|
if (auto_inc != 0) {
|
|
/* This call will calculate the max of the
|
|
current value and the value supplied by the user, if
|
|
the auto_inc counter is already initialized
|
|
for the table */
|
|
|
|
/* We have to use the transactional lock mechanism
|
|
on the auto-inc counter of the table to ensure
|
|
that replication and roll-forward of the binlog
|
|
exactly imitates also the given auto-inc values.
|
|
The lock is released at each SQL statement's
|
|
end. */
|
|
|
|
error = row_lock_table_autoinc_for_mysql(prebuilt);
|
|
|
|
if (error != DB_SUCCESS) {
|
|
|
|
error = convert_error_code_to_mysql(error);
|
|
goto func_exit;
|
|
}
|
|
|
|
dict_table_autoinc_update(prebuilt->table, auto_inc);
|
|
} else {
|
|
if (!prebuilt->trx->auto_inc_lock) {
|
|
|
|
error = row_lock_table_autoinc_for_mysql(
|
|
prebuilt);
|
|
if (error != DB_SUCCESS) {
|
|
|
|
error = convert_error_code_to_mysql(
|
|
error);
|
|
goto func_exit;
|
|
}
|
|
}
|
|
|
|
auto_inc = dict_table_autoinc_get(prebuilt->table);
|
|
|
|
/* If auto_inc is now != 0 the autoinc counter
|
|
was already initialized for the table: we can give
|
|
the new value for MySQL to place in the field */
|
|
|
|
if (auto_inc != 0) {
|
|
user_thd->next_insert_id = auto_inc;
|
|
}
|
|
}
|
|
|
|
prebuilt->in_update_remember_pos = FALSE;
|
|
|
|
update_auto_increment();
|
|
|
|
if (auto_inc == 0) {
|
|
/* The autoinc counter for our table was not yet
|
|
initialized, initialize it now */
|
|
|
|
auto_inc = table->next_number_field->val_int();
|
|
|
|
dict_table_autoinc_initialize(prebuilt->table,
|
|
auto_inc);
|
|
}
|
|
|
|
/* We have to set sql_stat_start to TRUE because
|
|
update_auto_increment has called a select, and
|
|
has reset that flag; row_insert_for_mysql has to
|
|
know to set the IX intention lock on the table, something
|
|
it only does at the start of each statement */
|
|
|
|
prebuilt->sql_stat_start = TRUE;
|
|
}
|
|
|
|
if (prebuilt->mysql_template == NULL
|
|
|| prebuilt->template_type != ROW_MYSQL_WHOLE_ROW) {
|
|
/* Build the template used in converting quickly between
|
|
the two database formats */
|
|
|
|
build_template(prebuilt, NULL, table, ROW_MYSQL_WHOLE_ROW);
|
|
}
|
|
|
|
if (user_thd->lex.sql_command == SQLCOM_INSERT
|
|
&& user_thd->lex.duplicates == DUP_IGNORE) {
|
|
prebuilt->trx->ignore_duplicates_in_insert = TRUE;
|
|
} else {
|
|
prebuilt->trx->ignore_duplicates_in_insert = FALSE;
|
|
}
|
|
|
|
error = row_insert_for_mysql((byte*) record, prebuilt);
|
|
|
|
prebuilt->trx->ignore_duplicates_in_insert = FALSE;
|
|
|
|
error = convert_error_code_to_mysql(error);
|
|
|
|
/* Tell InnoDB server that there might be work for
|
|
utility threads: */
|
|
func_exit:
|
|
innobase_active_small();
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/******************************************************************
|
|
Converts field data for storage in an InnoDB update vector. */
|
|
inline
|
|
mysql_byte*
|
|
innobase_convert_and_store_changed_col(
|
|
/*===================================*/
|
|
/* out: pointer to the end of the converted
|
|
data in the buffer */
|
|
upd_field_t* ufield, /* in/out: field in the update vector */
|
|
mysql_byte* buf, /* in: buffer we can use in conversion */
|
|
mysql_byte* data, /* in: column data to store */
|
|
ulint len, /* in: data len */
|
|
ulint col_type,/* in: data type in InnoDB type numbers */
|
|
ulint is_unsigned)/* in: != 0 if an unsigned integer type */
|
|
{
|
|
uint i;
|
|
|
|
if (len == UNIV_SQL_NULL) {
|
|
data = NULL;
|
|
} else if (col_type == DATA_VARCHAR || col_type == DATA_BINARY
|
|
|| col_type == DATA_VARMYSQL) {
|
|
/* Remove trailing spaces */
|
|
while (len > 0 && data[len - 1] == ' ') {
|
|
len--;
|
|
}
|
|
|
|
} else if (col_type == DATA_INT) {
|
|
/* Store integer data in InnoDB in a big-endian
|
|
format, sign bit negated, if signed */
|
|
|
|
for (i = 0; i < len; i++) {
|
|
buf[len - 1 - i] = data[i];
|
|
}
|
|
|
|
if (!is_unsigned) {
|
|
buf[0] = buf[0] ^ 128;
|
|
}
|
|
|
|
data = buf;
|
|
|
|
buf += len;
|
|
}
|
|
|
|
ufield->new_val.data = data;
|
|
ufield->new_val.len = len;
|
|
|
|
return(buf);
|
|
}
|
|
|
|
/**************************************************************************
|
|
Checks which fields have changed in a row and stores information
|
|
of them to an update vector. */
|
|
static
|
|
int
|
|
calc_row_difference(
|
|
/*================*/
|
|
/* out: error number or 0 */
|
|
upd_t* uvect, /* in/out: update vector */
|
|
mysql_byte* old_row, /* in: old row in MySQL format */
|
|
mysql_byte* new_row, /* in: new row in MySQL format */
|
|
struct st_table* table, /* in: table in MySQL data dictionary */
|
|
mysql_byte* upd_buff, /* in: buffer to use */
|
|
row_prebuilt_t* prebuilt, /* in: InnoDB prebuilt struct */
|
|
THD* thd) /* in: user thread */
|
|
{
|
|
Field* field;
|
|
uint n_fields;
|
|
ulint o_len;
|
|
ulint n_len;
|
|
byte* o_ptr;
|
|
byte* n_ptr;
|
|
byte* buf;
|
|
upd_field_t* ufield;
|
|
ulint col_type;
|
|
ulint is_unsigned;
|
|
ulint n_changed = 0;
|
|
uint i;
|
|
|
|
n_fields = table->fields;
|
|
|
|
/* We use upd_buff to convert changed fields */
|
|
buf = (byte*) upd_buff;
|
|
|
|
for (i = 0; i < n_fields; i++) {
|
|
field = table->field[i];
|
|
|
|
/* if (thd->query_id != field->query_id) { */
|
|
/* TODO: check that these fields cannot have
|
|
changed! */
|
|
|
|
/* goto skip_field;
|
|
}*/
|
|
|
|
o_ptr = (byte*) old_row + get_field_offset(table, field);
|
|
n_ptr = (byte*) new_row + get_field_offset(table, field);
|
|
o_len = field->pack_length();
|
|
n_len = field->pack_length();
|
|
|
|
col_type = get_innobase_type_from_mysql_type(field);
|
|
is_unsigned = (ulint) (field->flags & UNSIGNED_FLAG);
|
|
|
|
switch (col_type) {
|
|
|
|
case DATA_BLOB:
|
|
o_ptr = row_mysql_read_blob_ref(&o_len, o_ptr, o_len);
|
|
n_ptr = row_mysql_read_blob_ref(&n_len, n_ptr, n_len);
|
|
break;
|
|
case DATA_VARCHAR:
|
|
case DATA_BINARY:
|
|
case DATA_VARMYSQL:
|
|
o_ptr = row_mysql_read_var_ref_noninline(&o_len, o_ptr);
|
|
n_ptr = row_mysql_read_var_ref_noninline(&n_len, n_ptr);
|
|
default:
|
|
;
|
|
}
|
|
|
|
if (field->null_ptr) {
|
|
if (field_in_record_is_null(table, field,
|
|
(char*) old_row)) {
|
|
o_len = UNIV_SQL_NULL;
|
|
}
|
|
|
|
if (field_in_record_is_null(table, field,
|
|
(char*) new_row)) {
|
|
n_len = UNIV_SQL_NULL;
|
|
}
|
|
}
|
|
|
|
if (o_len != n_len || (o_len != UNIV_SQL_NULL &&
|
|
0 != memcmp(o_ptr, n_ptr, o_len))) {
|
|
/* The field has changed */
|
|
|
|
ufield = uvect->fields + n_changed;
|
|
|
|
buf = (byte*)
|
|
innobase_convert_and_store_changed_col(ufield,
|
|
(mysql_byte*)buf,
|
|
(mysql_byte*)n_ptr, n_len, col_type,
|
|
is_unsigned);
|
|
ufield->exp = NULL;
|
|
ufield->field_no =
|
|
(prebuilt->table->cols + i)->clust_pos;
|
|
n_changed++;
|
|
}
|
|
;
|
|
}
|
|
|
|
uvect->n_fields = n_changed;
|
|
uvect->info_bits = 0;
|
|
|
|
return(0);
|
|
}
|
|
|
|
/**************************************************************************
|
|
Updates a row given as a parameter to a new value. Note that we are given
|
|
whole rows, not just the fields which are updated: this incurs some
|
|
overhead for CPU when we check which fields are actually updated.
|
|
TODO: currently InnoDB does not prevent the 'Halloween problem':
|
|
in a searched update a single row can get updated several times
|
|
if its index columns are updated! */
|
|
|
|
int
|
|
ha_innobase::update_row(
|
|
/*====================*/
|
|
/* out: error number or 0 */
|
|
const mysql_byte* old_row,/* in: old row in MySQL format */
|
|
mysql_byte* new_row)/* in: new row in MySQL format */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
upd_t* uvect;
|
|
int error = 0;
|
|
|
|
DBUG_ENTER("ha_innobase::update_row");
|
|
|
|
if (table->time_stamp) {
|
|
update_timestamp(new_row + table->time_stamp - 1);
|
|
}
|
|
|
|
if (last_query_id != user_thd->query_id) {
|
|
prebuilt->sql_stat_start = TRUE;
|
|
last_query_id = user_thd->query_id;
|
|
}
|
|
|
|
if (prebuilt->upd_node) {
|
|
uvect = prebuilt->upd_node->update;
|
|
} else {
|
|
uvect = row_get_prebuilt_update_vector(prebuilt);
|
|
}
|
|
|
|
/* Build an update vector from the modified fields in the rows
|
|
(uses upd_buff of the handle) */
|
|
|
|
calc_row_difference(uvect, (mysql_byte*) old_row, new_row, table,
|
|
upd_buff, prebuilt, user_thd);
|
|
/* This is not a delete */
|
|
prebuilt->upd_node->is_delete = FALSE;
|
|
|
|
if (!prebuilt->in_update_remember_pos) {
|
|
assert(prebuilt->template_type == ROW_MYSQL_WHOLE_ROW);
|
|
}
|
|
|
|
error = row_update_for_mysql((byte*) old_row, prebuilt);
|
|
|
|
error = convert_error_code_to_mysql(error);
|
|
|
|
/* Tell InnoDB server that there might be work for
|
|
utility threads: */
|
|
|
|
innobase_active_small();
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/**************************************************************************
|
|
Deletes a row given as the parameter. */
|
|
|
|
int
|
|
ha_innobase::delete_row(
|
|
/*====================*/
|
|
/* out: error number or 0 */
|
|
const mysql_byte* record) /* in: a row in MySQL format */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
int error = 0;
|
|
|
|
DBUG_ENTER("ha_innobase::delete_row");
|
|
|
|
if (last_query_id != user_thd->query_id) {
|
|
prebuilt->sql_stat_start = TRUE;
|
|
last_query_id = user_thd->query_id;
|
|
}
|
|
|
|
if (!prebuilt->upd_node) {
|
|
row_get_prebuilt_update_vector(prebuilt);
|
|
}
|
|
|
|
/* This is a delete */
|
|
|
|
prebuilt->upd_node->is_delete = TRUE;
|
|
prebuilt->in_update_remember_pos = TRUE;
|
|
|
|
error = row_update_for_mysql((byte*) record, prebuilt);
|
|
|
|
error = convert_error_code_to_mysql(error);
|
|
|
|
/* Tell the InnoDB server that there might be work for
|
|
utility threads: */
|
|
|
|
innobase_active_small();
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/**********************************************************************
|
|
Initializes a handle to use an index. */
|
|
|
|
int
|
|
ha_innobase::index_init(
|
|
/*====================*/
|
|
/* out: 0 or error number */
|
|
uint keynr) /* in: key (index) number */
|
|
{
|
|
int error = 0;
|
|
DBUG_ENTER("index_init");
|
|
|
|
change_active_index(keynr);
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/**********************************************************************
|
|
Currently does nothing. */
|
|
|
|
int
|
|
ha_innobase::index_end(void)
|
|
/*========================*/
|
|
{
|
|
int error = 0;
|
|
DBUG_ENTER("index_end");
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/*************************************************************************
|
|
Converts a search mode flag understood by MySQL to a flag understood
|
|
by InnoDB. */
|
|
inline
|
|
ulint
|
|
convert_search_mode_to_innobase(
|
|
/*============================*/
|
|
enum ha_rkey_function find_flag)
|
|
{
|
|
switch (find_flag) {
|
|
case HA_READ_KEY_EXACT: return(PAGE_CUR_GE);
|
|
/* the above does not require the index to be UNIQUE */
|
|
case HA_READ_KEY_OR_NEXT: return(PAGE_CUR_GE);
|
|
case HA_READ_KEY_OR_PREV: return(PAGE_CUR_LE);
|
|
case HA_READ_AFTER_KEY: return(PAGE_CUR_G);
|
|
case HA_READ_BEFORE_KEY: return(PAGE_CUR_L);
|
|
case HA_READ_PREFIX: return(PAGE_CUR_GE);
|
|
case HA_READ_PREFIX_LAST: return(PAGE_CUR_LE);
|
|
/* the above PREFIX flags mean that the last
|
|
field in the key value may just be a prefix
|
|
of the complete fixed length field */
|
|
default: assert(0);
|
|
}
|
|
|
|
return(0);
|
|
}
|
|
|
|
/**************************************************************************
|
|
Positions an index cursor to the index specified in the handle. Fetches the
|
|
row if any. */
|
|
|
|
int
|
|
ha_innobase::index_read(
|
|
/*====================*/
|
|
/* out: 0, HA_ERR_KEY_NOT_FOUND,
|
|
or error number */
|
|
mysql_byte* buf, /* in/out: buffer for the returned
|
|
row */
|
|
const mysql_byte* key_ptr,/* in: key value; if this is NULL
|
|
we position the cursor at the
|
|
start or end of index */
|
|
uint key_len,/* in: key value length */
|
|
enum ha_rkey_function find_flag)/* in: search flags from my_base.h */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
ulint mode;
|
|
dict_index_t* index;
|
|
ulint match_mode = 0;
|
|
int error;
|
|
ulint ret;
|
|
|
|
DBUG_ENTER("index_read");
|
|
statistic_increment(ha_read_key_count, &LOCK_status);
|
|
|
|
if (last_query_id != user_thd->query_id) {
|
|
prebuilt->sql_stat_start = TRUE;
|
|
last_query_id = user_thd->query_id;
|
|
}
|
|
|
|
index = prebuilt->index;
|
|
|
|
/* Note that if the select is used for an update, we always
|
|
fetch the clustered index record: therefore the index for which the
|
|
template is built is not necessarily prebuilt->index, but can also
|
|
be the clustered index */
|
|
|
|
if (prebuilt->sql_stat_start) {
|
|
build_template(prebuilt, user_thd, table,
|
|
ROW_MYSQL_REC_FIELDS);
|
|
}
|
|
|
|
if (key_ptr) {
|
|
row_sel_convert_mysql_key_to_innobase(prebuilt->search_tuple,
|
|
(byte*) key_val_buff,
|
|
index,
|
|
(byte*) key_ptr,
|
|
(ulint) key_len);
|
|
} else {
|
|
/* We position the cursor to the last or the first entry
|
|
in the index */
|
|
|
|
dtuple_set_n_fields(prebuilt->search_tuple, 0);
|
|
}
|
|
|
|
mode = convert_search_mode_to_innobase(find_flag);
|
|
|
|
match_mode = 0;
|
|
|
|
if (find_flag == HA_READ_KEY_EXACT) {
|
|
match_mode = ROW_SEL_EXACT;
|
|
|
|
} else if (find_flag == HA_READ_PREFIX
|
|
|| find_flag == HA_READ_PREFIX_LAST) {
|
|
match_mode = ROW_SEL_EXACT_PREFIX;
|
|
}
|
|
|
|
last_match_mode = match_mode;
|
|
|
|
ret = row_search_for_mysql((byte*) buf, mode, prebuilt, match_mode, 0);
|
|
|
|
if (ret == DB_SUCCESS) {
|
|
error = 0;
|
|
table->status = 0;
|
|
|
|
} else if (ret == DB_RECORD_NOT_FOUND) {
|
|
error = HA_ERR_KEY_NOT_FOUND;
|
|
table->status = STATUS_NOT_FOUND;
|
|
|
|
} else if (ret == DB_END_OF_INDEX) {
|
|
error = HA_ERR_KEY_NOT_FOUND;
|
|
table->status = STATUS_NOT_FOUND;
|
|
} else {
|
|
error = convert_error_code_to_mysql(ret);
|
|
table->status = STATUS_NOT_FOUND;
|
|
}
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/************************************************************************
|
|
Changes the active index of a handle. */
|
|
|
|
int
|
|
ha_innobase::change_active_index(
|
|
/*=============================*/
|
|
/* out: 0 or error code */
|
|
uint keynr) /* in: use this index; MAX_KEY means always clustered
|
|
index, even if it was internally generated by
|
|
InnoDB */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
KEY* key;
|
|
|
|
statistic_increment(ha_read_key_count, &LOCK_status);
|
|
|
|
DBUG_ENTER("index_read_idx");
|
|
|
|
active_index = keynr;
|
|
|
|
if (keynr != MAX_KEY && table->keys > 0) {
|
|
key = table->key_info + active_index;
|
|
|
|
prebuilt->index = dict_table_get_index_noninline(
|
|
prebuilt->table, key->name);
|
|
} else {
|
|
prebuilt->index = dict_table_get_first_index_noninline(
|
|
prebuilt->table);
|
|
}
|
|
|
|
dtuple_set_n_fields(prebuilt->search_tuple, prebuilt->index->n_fields);
|
|
|
|
dict_index_copy_types(prebuilt->search_tuple, prebuilt->index,
|
|
prebuilt->index->n_fields);
|
|
assert(prebuilt->index);
|
|
|
|
/* Maybe MySQL changes the active index for a handle also
|
|
during some queries, we do not know: then it is safest to build
|
|
the template such that all columns will be fetched */
|
|
|
|
build_template(prebuilt, user_thd, table, ROW_MYSQL_WHOLE_ROW);
|
|
|
|
DBUG_RETURN(0);
|
|
}
|
|
|
|
/**************************************************************************
|
|
Positions an index cursor to the index specified in keynr. Fetches the
|
|
row if any. */
|
|
/* ??? This is only used to read whole keys ??? */
|
|
|
|
int
|
|
ha_innobase::index_read_idx(
|
|
/*========================*/
|
|
/* out: error number or 0 */
|
|
mysql_byte* buf, /* in/out: buffer for the returned
|
|
row */
|
|
uint keynr, /* in: use this index */
|
|
const mysql_byte* key, /* in: key value; if this is NULL
|
|
we position the cursor at the
|
|
start or end of index */
|
|
uint key_len, /* in: key value length */
|
|
enum ha_rkey_function find_flag)/* in: search flags from my_base.h */
|
|
{
|
|
change_active_index(keynr);
|
|
|
|
return(index_read(buf, key, key_len, find_flag));
|
|
}
|
|
|
|
/***************************************************************************
|
|
Reads the next or previous row from a cursor, which must have previously been
|
|
positioned using index_read. */
|
|
|
|
int
|
|
ha_innobase::general_fetch(
|
|
/*=======================*/
|
|
/* out: 0, HA_ERR_END_OF_FILE, or error
|
|
number */
|
|
mysql_byte* buf, /* in/out: buffer for next row in MySQL
|
|
format */
|
|
uint direction, /* in: ROW_SEL_NEXT or ROW_SEL_PREV */
|
|
uint match_mode) /* in: 0, ROW_SEL_EXACT, or
|
|
ROW_SEL_EXACT_PREFIX */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
ulint ret;
|
|
int error = 0;
|
|
|
|
DBUG_ENTER("general_fetch");
|
|
|
|
ret = row_search_for_mysql((byte*)buf, 0, prebuilt,
|
|
match_mode, direction);
|
|
|
|
if (ret == DB_SUCCESS) {
|
|
error = 0;
|
|
table->status = 0;
|
|
|
|
} else if (ret == DB_RECORD_NOT_FOUND) {
|
|
error = HA_ERR_END_OF_FILE;
|
|
table->status = STATUS_NOT_FOUND;
|
|
|
|
} else if (ret == DB_END_OF_INDEX) {
|
|
error = HA_ERR_END_OF_FILE;
|
|
table->status = STATUS_NOT_FOUND;
|
|
} else {
|
|
error = convert_error_code_to_mysql(ret);
|
|
table->status = STATUS_NOT_FOUND;
|
|
}
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/***************************************************************************
|
|
Reads the next row from a cursor, which must have previously been
|
|
positioned using index_read. */
|
|
|
|
int
|
|
ha_innobase::index_next(
|
|
/*====================*/
|
|
/* out: 0, HA_ERR_END_OF_FILE, or error
|
|
number */
|
|
mysql_byte* buf) /* in/out: buffer for next row in MySQL
|
|
format */
|
|
{
|
|
statistic_increment(ha_read_next_count, &LOCK_status);
|
|
|
|
return(general_fetch(buf, ROW_SEL_NEXT, 0));
|
|
}
|
|
|
|
/***********************************************************************
|
|
Reads the next row matching to the key value given as the parameter. */
|
|
|
|
int
|
|
ha_innobase::index_next_same(
|
|
/*=========================*/
|
|
/* out: 0, HA_ERR_END_OF_FILE, or error
|
|
number */
|
|
mysql_byte* buf, /* in/out: buffer for the row */
|
|
const mysql_byte* key, /* in: key value */
|
|
uint keylen) /* in: key value length */
|
|
{
|
|
statistic_increment(ha_read_next_count, &LOCK_status);
|
|
|
|
return(general_fetch(buf, ROW_SEL_NEXT, last_match_mode));
|
|
}
|
|
|
|
/***************************************************************************
|
|
Reads the previous row from a cursor, which must have previously been
|
|
positioned using index_read. */
|
|
|
|
int
|
|
ha_innobase::index_prev(
|
|
/*====================*/
|
|
/* out: 0, HA_ERR_END_OF_FILE, or error
|
|
number */
|
|
mysql_byte* buf) /* in/out: buffer for previous row in MySQL
|
|
format */
|
|
{
|
|
return(general_fetch(buf, ROW_SEL_PREV, 0));
|
|
}
|
|
|
|
/************************************************************************
|
|
Positions a cursor on the first record in an index and reads the
|
|
corresponding row to buf. */
|
|
|
|
int
|
|
ha_innobase::index_first(
|
|
/*=====================*/
|
|
/* out: 0, HA_ERR_END_OF_FILE,
|
|
or error code */
|
|
mysql_byte* buf) /* in/out: buffer for the row */
|
|
{
|
|
int error;
|
|
|
|
DBUG_ENTER("index_first");
|
|
statistic_increment(ha_read_first_count, &LOCK_status);
|
|
|
|
error = index_read(buf, NULL, 0, HA_READ_AFTER_KEY);
|
|
|
|
/* MySQL does not seem to allow this to return HA_ERR_KEY_NOT_FOUND */
|
|
|
|
if (error == HA_ERR_KEY_NOT_FOUND) {
|
|
error = HA_ERR_END_OF_FILE;
|
|
}
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/************************************************************************
|
|
Positions a cursor on the last record in an index and reads the
|
|
corresponding row to buf. */
|
|
|
|
int
|
|
ha_innobase::index_last(
|
|
/*====================*/
|
|
/* out: 0, HA_ERR_END_OF_FILE, or error code */
|
|
mysql_byte* buf) /* in/out: buffer for the row */
|
|
{
|
|
int error;
|
|
|
|
DBUG_ENTER("index_first");
|
|
statistic_increment(ha_read_last_count, &LOCK_status);
|
|
|
|
error = index_read(buf, NULL, 0, HA_READ_BEFORE_KEY);
|
|
|
|
/* MySQL does not seem to allow this to return HA_ERR_KEY_NOT_FOUND */
|
|
|
|
if (error == HA_ERR_KEY_NOT_FOUND) {
|
|
error = HA_ERR_END_OF_FILE;
|
|
}
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/********************************************************************
|
|
Initialize a table scan. */
|
|
|
|
int
|
|
ha_innobase::rnd_init(
|
|
/*==================*/
|
|
/* out: 0 or error number */
|
|
bool scan) /* in: ???????? */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
|
|
if (prebuilt->clust_index_was_generated) {
|
|
change_active_index(MAX_KEY);
|
|
} else {
|
|
change_active_index(primary_key);
|
|
}
|
|
|
|
start_of_scan = 1;
|
|
|
|
return(0);
|
|
}
|
|
|
|
/*********************************************************************
|
|
Ends a table scan ???????????????? */
|
|
|
|
int
|
|
ha_innobase::rnd_end(void)
|
|
/*======================*/
|
|
/* out: 0 or error number */
|
|
{
|
|
return(index_end());
|
|
}
|
|
|
|
/*********************************************************************
|
|
Reads the next row in a table scan (also used to read the FIRST row
|
|
in a table scan). */
|
|
|
|
int
|
|
ha_innobase::rnd_next(
|
|
/*==================*/
|
|
/* out: 0, HA_ERR_END_OF_FILE, or error number */
|
|
mysql_byte* buf)/* in/out: returns the row in this buffer,
|
|
in MySQL format */
|
|
{
|
|
int error;
|
|
|
|
DBUG_ENTER("rnd_next");
|
|
statistic_increment(ha_read_rnd_next_count, &LOCK_status);
|
|
|
|
if (start_of_scan) {
|
|
error = index_first(buf);
|
|
if (error == HA_ERR_KEY_NOT_FOUND) {
|
|
error = HA_ERR_END_OF_FILE;
|
|
}
|
|
start_of_scan = 0;
|
|
} else {
|
|
error = general_fetch(buf, ROW_SEL_NEXT, 0);
|
|
}
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/**************************************************************************
|
|
Fetches a row from the table based on a reference. TODO: currently we use
|
|
'ref_stored_len' of the handle as the key length. This may change. */
|
|
|
|
int
|
|
ha_innobase::rnd_pos(
|
|
/*=================*/
|
|
/* out: 0, HA_ERR_KEY_NOT_FOUND,
|
|
or error code */
|
|
mysql_byte* buf, /* in/out: buffer for the row */
|
|
mysql_byte* pos) /* in: primary key value in MySQL format */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
int error;
|
|
uint keynr = active_index;
|
|
|
|
DBUG_ENTER("rnd_pos");
|
|
statistic_increment(ha_read_rnd_count, &LOCK_status);
|
|
|
|
if (prebuilt->clust_index_was_generated) {
|
|
/* No primary key was defined for the table and we
|
|
generated the clustered index from the row id: the
|
|
row reference is the row id, not any key value
|
|
that MySQL knows */
|
|
|
|
change_active_index(MAX_KEY);
|
|
} else {
|
|
change_active_index(primary_key);
|
|
}
|
|
|
|
error = index_read(buf, pos, ref_stored_len, HA_READ_KEY_EXACT);
|
|
|
|
change_active_index(keynr);
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/*************************************************************************
|
|
Stores a reference to the current row to 'ref' field of the handle. Note
|
|
that the function parameter is illogical: we must assume that 'record'
|
|
is the current 'position' of the handle, because if row ref is actually
|
|
the row id internally generated in InnoDB, then 'record' does not contain
|
|
it. We just guess that the row id must be for the record where the handle
|
|
was positioned the last time. */
|
|
|
|
void
|
|
ha_innobase::position(
|
|
/*==================*/
|
|
const mysql_byte* record) /* in: row in MySQL format */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
uint len;
|
|
|
|
if (prebuilt->clust_index_was_generated) {
|
|
/* No primary key was defined for the table and we
|
|
generated the clustered index from row id: the
|
|
row reference will be the row id, not any key value
|
|
that MySQL knows */
|
|
|
|
len = DATA_ROW_ID_LEN;
|
|
|
|
memcpy(ref, prebuilt->row_id, len);
|
|
} else {
|
|
len = store_key_val_for_row(primary_key, (char*) ref, record);
|
|
}
|
|
|
|
dbug_assert(len <= ref_length);
|
|
|
|
ref_stored_len = len;
|
|
}
|
|
|
|
/***********************************************************************
|
|
Tells something additional to the handler about how to do things. */
|
|
|
|
int
|
|
ha_innobase::extra(
|
|
/*===============*/
|
|
/* out: 0 or error number */
|
|
enum ha_extra_function operation)
|
|
/* in: HA_EXTRA_DONT_USE_CURSOR_TO_UPDATE */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
|
|
switch (operation) {
|
|
case HA_EXTRA_DONT_USE_CURSOR_TO_UPDATE:
|
|
prebuilt->in_update_remember_pos = FALSE;
|
|
break;
|
|
default: /* Do nothing */
|
|
;
|
|
}
|
|
|
|
return(0);
|
|
}
|
|
|
|
int ha_innobase::reset(void)
|
|
{
|
|
return(0);
|
|
}
|
|
|
|
/**********************************************************************
|
|
As MySQL will execute an external lock for every new table it uses when it
|
|
starts to process an SQL statement, we can use this function to store the
|
|
pointer to the THD in the handle. We will also use this function to communicate
|
|
to InnoDB that a new SQL statement has started and that we must store a
|
|
savepoint to our transaction handle, so that we are able to roll back
|
|
the SQL statement in case of an error. */
|
|
|
|
int
|
|
ha_innobase::external_lock(
|
|
/*=======================*/
|
|
THD* thd, /* in: handle to the user thread */
|
|
int lock_type) /* in: lock type */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
int error = 0;
|
|
trx_t* trx;
|
|
|
|
DBUG_ENTER("ha_innobase::external_lock");
|
|
|
|
update_thd(thd);
|
|
|
|
trx = prebuilt->trx;
|
|
|
|
prebuilt->sql_stat_start = TRUE;
|
|
prebuilt->in_update_remember_pos = TRUE;
|
|
|
|
if (lock_type == F_WRLCK) {
|
|
|
|
/* If this is a SELECT, then it is in UPDATE TABLE ...
|
|
or SELECT ... FOR UPDATE */
|
|
prebuilt->select_lock_type = LOCK_X;
|
|
}
|
|
|
|
if (lock_type != F_UNLCK) {
|
|
if (trx->n_mysql_tables_in_use == 0) {
|
|
trx_mark_sql_stat_end(trx);
|
|
}
|
|
thd->transaction.all.innodb_active_trans = 1;
|
|
trx->n_mysql_tables_in_use++;
|
|
|
|
if (prebuilt->select_lock_type != LOCK_NONE) {
|
|
|
|
trx->mysql_n_tables_locked++;
|
|
}
|
|
} else {
|
|
trx->n_mysql_tables_in_use--;
|
|
|
|
if (trx->n_mysql_tables_in_use == 0) {
|
|
|
|
trx->mysql_n_tables_locked = 0;
|
|
|
|
if (trx->has_search_latch) {
|
|
|
|
trx_search_latch_release_if_reserved(trx);
|
|
}
|
|
|
|
if (trx->auto_inc_lock) {
|
|
|
|
/* If we had reserved the auto-inc lock for
|
|
some table in this SQL statement, we release
|
|
it now */
|
|
|
|
row_unlock_table_autoinc_for_mysql(trx);
|
|
}
|
|
|
|
if (!(thd->options
|
|
& (OPTION_NOT_AUTO_COMMIT | OPTION_BEGIN))) {
|
|
innobase_commit(thd, trx);
|
|
}
|
|
}
|
|
}
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/*********************************************************************
|
|
Creates a table definition to an InnoDB database. */
|
|
static
|
|
int
|
|
create_table_def(
|
|
/*=============*/
|
|
trx_t* trx, /* in: InnoDB transaction handle */
|
|
TABLE* form, /* in: information on table
|
|
columns and indexes */
|
|
const char* table_name) /* in: table name */
|
|
{
|
|
Field* field;
|
|
dict_table_t* table;
|
|
ulint n_cols;
|
|
int error;
|
|
ulint col_type;
|
|
ulint nulls_allowed;
|
|
ulint unsigned_type;
|
|
ulint i;
|
|
|
|
DBUG_ENTER("create_table_def");
|
|
DBUG_PRINT("enter", ("table_name: %s", table_name));
|
|
|
|
n_cols = form->fields;
|
|
|
|
/* The '0' below specifies that everything is currently
|
|
created in tablespace 0 */
|
|
|
|
table = dict_mem_table_create((char*) table_name, 0, n_cols);
|
|
|
|
for (i = 0; i < n_cols; i++) {
|
|
field = form->field[i];
|
|
|
|
col_type = get_innobase_type_from_mysql_type(field);
|
|
if (field->null_ptr) {
|
|
nulls_allowed = 0;
|
|
} else {
|
|
nulls_allowed = DATA_NOT_NULL;
|
|
}
|
|
|
|
if (field->flags & UNSIGNED_FLAG) {
|
|
unsigned_type = DATA_UNSIGNED;
|
|
} else {
|
|
unsigned_type = 0;
|
|
}
|
|
|
|
dict_mem_table_add_col(table, (char*) field->field_name,
|
|
col_type, (ulint)field->type()
|
|
| nulls_allowed | unsigned_type,
|
|
field->pack_length(), 0);
|
|
}
|
|
|
|
error = row_create_table_for_mysql(table, trx);
|
|
|
|
error = convert_error_code_to_mysql(error);
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/*********************************************************************
|
|
Creates an index in an InnoDB database. */
|
|
static
|
|
int
|
|
create_index(
|
|
/*=========*/
|
|
trx_t* trx, /* in: InnoDB transaction handle */
|
|
TABLE* form, /* in: information on table
|
|
columns and indexes */
|
|
const char* table_name, /* in: table name */
|
|
uint key_num) /* in: index number */
|
|
{
|
|
dict_index_t* index;
|
|
int error;
|
|
ulint n_fields;
|
|
KEY* key;
|
|
KEY_PART_INFO* key_part;
|
|
ulint ind_type;
|
|
ulint i;
|
|
|
|
DBUG_ENTER("create_index");
|
|
|
|
key = form->key_info + key_num;
|
|
|
|
n_fields = key->key_parts;
|
|
|
|
ind_type = 0;
|
|
|
|
if (strcmp(key->name, "PRIMARY") == 0) {
|
|
ind_type = ind_type | DICT_CLUSTERED;
|
|
}
|
|
|
|
if (key->flags & HA_NOSAME ) {
|
|
ind_type = ind_type | DICT_UNIQUE;
|
|
}
|
|
|
|
/* The '0' below specifies that everything in InnoDB is currently
|
|
created in tablespace 0 */
|
|
|
|
index = dict_mem_index_create((char*) table_name, key->name, 0,
|
|
ind_type, n_fields);
|
|
for (i = 0; i < n_fields; i++) {
|
|
key_part = key->key_part + i;
|
|
|
|
/* We assume all fields should be sorted in ascending
|
|
order, hence the '0': */
|
|
dict_mem_index_add_field(index,
|
|
(char*) key_part->field->field_name, 0);
|
|
}
|
|
|
|
error = row_create_index_for_mysql(index, trx);
|
|
|
|
error = convert_error_code_to_mysql(error);
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/*********************************************************************
|
|
Creates an index to an InnoDB table when the user has defined no
|
|
primary index. */
|
|
static
|
|
int
|
|
create_clustered_index_when_no_primary(
|
|
/*===================================*/
|
|
trx_t* trx, /* in: InnoDB transaction handle */
|
|
const char* table_name) /* in: table name */
|
|
{
|
|
dict_index_t* index;
|
|
int error;
|
|
|
|
/* The first '0' below specifies that everything in InnoDB is
|
|
currently created in file space 0 */
|
|
|
|
index = dict_mem_index_create((char*) table_name,
|
|
(char*) "GEN_CLUST_INDEX",
|
|
0, DICT_CLUSTERED, 0);
|
|
error = row_create_index_for_mysql(index, trx);
|
|
|
|
error = convert_error_code_to_mysql(error);
|
|
|
|
return(error);
|
|
}
|
|
|
|
/*********************************************************************
|
|
Creates a new table to an InnoDB database. */
|
|
|
|
int
|
|
ha_innobase::create(
|
|
/*================*/
|
|
/* out: error number */
|
|
const char* name, /* in: table name */
|
|
TABLE* form, /* in: information on table
|
|
columns and indexes */
|
|
HA_CREATE_INFO* create_info) /* in: more information of the
|
|
created table, contains also the
|
|
create statement string */
|
|
{
|
|
int error;
|
|
dict_table_t* innobase_table;
|
|
trx_t* trx;
|
|
int primary_key_no = -1;
|
|
KEY* key;
|
|
uint i;
|
|
char name2[FN_REFLEN];
|
|
char norm_name[FN_REFLEN];
|
|
|
|
DBUG_ENTER("ha_innobase::create");
|
|
|
|
trx = trx_allocate_for_mysql();
|
|
|
|
fn_format(name2, name, "", "",2); // Remove the .frm extension
|
|
|
|
normalize_table_name(norm_name, name2);
|
|
|
|
/* Create the table definition in InnoDB */
|
|
|
|
if ((error = create_table_def(trx, form, norm_name))) {
|
|
|
|
trx_commit_for_mysql(trx);
|
|
|
|
trx_free_for_mysql(trx);
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/* Look for a primary key */
|
|
|
|
for (i = 0; i < form->keys; i++) {
|
|
key = form->key_info + i;
|
|
|
|
if (strcmp(key->name, "PRIMARY") == 0) {
|
|
primary_key_no = (int) i;
|
|
}
|
|
}
|
|
|
|
/* Our function row_get_mysql_key_number_for_index assumes
|
|
the primary key is always number 0, if it exists */
|
|
|
|
assert(primary_key_no == -1 || primary_key_no == 0);
|
|
|
|
/* Create the keys */
|
|
|
|
if (form->keys == 0 || primary_key_no == -1) {
|
|
/* Create an index which is used as the clustered index;
|
|
order the rows by their row id which is internally generated
|
|
by InnoDB */
|
|
|
|
error = create_clustered_index_when_no_primary(trx,
|
|
norm_name);
|
|
if (error) {
|
|
trx_commit_for_mysql(trx);
|
|
|
|
trx_free_for_mysql(trx);
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
}
|
|
|
|
if (primary_key_no != -1) {
|
|
/* In InnoDB the clustered index must always be created
|
|
first */
|
|
if ((error = create_index(trx, form, norm_name,
|
|
(uint) primary_key_no))) {
|
|
trx_commit_for_mysql(trx);
|
|
|
|
trx_free_for_mysql(trx);
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
}
|
|
|
|
for (i = 0; i < form->keys; i++) {
|
|
|
|
if (i != (uint) primary_key_no) {
|
|
|
|
if ((error = create_index(trx, form, norm_name, i))) {
|
|
|
|
trx_commit_for_mysql(trx);
|
|
|
|
trx_free_for_mysql(trx);
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
}
|
|
}
|
|
|
|
error = row_table_add_foreign_constraints(trx,
|
|
create_info->create_statement, norm_name);
|
|
|
|
error = convert_error_code_to_mysql(error);
|
|
|
|
if (error) {
|
|
trx_commit_for_mysql(trx);
|
|
|
|
trx_free_for_mysql(trx);
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
trx_commit_for_mysql(trx);
|
|
|
|
innobase_table = dict_table_get(norm_name, NULL);
|
|
|
|
assert(innobase_table);
|
|
|
|
/* Tell the InnoDB server that there might be work for
|
|
utility threads: */
|
|
|
|
srv_active_wake_master_thread();
|
|
|
|
trx_free_for_mysql(trx);
|
|
|
|
DBUG_RETURN(0);
|
|
}
|
|
|
|
/*********************************************************************
|
|
Drops a table from an InnoDB database. Before calling this function,
|
|
MySQL calls innobase_commit to commit the transaction of the current user.
|
|
Then the current user cannot have locks set on the table. Drop table
|
|
operation inside InnoDB will remove all locks any user has on the table
|
|
inside InnoDB. */
|
|
|
|
int
|
|
ha_innobase::delete_table(
|
|
/*======================*/
|
|
/* out: error number */
|
|
const char* name) /* in: table name */
|
|
{
|
|
ulint name_len;
|
|
int error;
|
|
trx_t* trx;
|
|
char norm_name[1000];
|
|
|
|
DBUG_ENTER("ha_innobase::delete_table");
|
|
|
|
trx = trx_allocate_for_mysql();
|
|
|
|
name_len = strlen(name);
|
|
|
|
assert(name_len < 1000);
|
|
|
|
/* Strangely, MySQL passes the table name without the '.frm'
|
|
extension, in contrast to ::create */
|
|
|
|
normalize_table_name(norm_name, name);
|
|
|
|
/* Drop the table in InnoDB */
|
|
|
|
error = row_drop_table_for_mysql(norm_name, trx, FALSE);
|
|
|
|
/* Tell the InnoDB server that there might be work for
|
|
utility threads: */
|
|
|
|
srv_active_wake_master_thread();
|
|
|
|
trx_free_for_mysql(trx);
|
|
|
|
error = convert_error_code_to_mysql(error);
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/*********************************************************************
|
|
Removes all tables in the named database inside InnoDB. */
|
|
|
|
int
|
|
innobase_drop_database(
|
|
/*===================*/
|
|
/* out: error number */
|
|
char* path) /* in: database path; inside InnoDB the name
|
|
of the last directory in the path is used as
|
|
the database name: for example, in 'mysql/data/test'
|
|
the database name is 'test' */
|
|
{
|
|
ulint len = 0;
|
|
trx_t* trx;
|
|
char* ptr;
|
|
int error;
|
|
char namebuf[10000];
|
|
|
|
ptr = strend(path) - 2;
|
|
|
|
while (ptr >= path && *ptr != '\\' && *ptr != '/') {
|
|
ptr--;
|
|
len++;
|
|
}
|
|
|
|
ptr++;
|
|
|
|
memcpy(namebuf, ptr, len);
|
|
namebuf[len] = '/';
|
|
namebuf[len + 1] = '\0';
|
|
|
|
trx = trx_allocate_for_mysql();
|
|
|
|
error = row_drop_database_for_mysql(namebuf, trx);
|
|
|
|
/* Tell the InnoDB server that there might be work for
|
|
utility threads: */
|
|
|
|
srv_active_wake_master_thread();
|
|
|
|
trx_free_for_mysql(trx);
|
|
|
|
error = convert_error_code_to_mysql(error);
|
|
|
|
return(error);
|
|
}
|
|
|
|
/*************************************************************************
|
|
Renames an InnoDB table. */
|
|
|
|
int
|
|
ha_innobase::rename_table(
|
|
/*======================*/
|
|
/* out: 0 or error code */
|
|
const char* from, /* in: old name of the table */
|
|
const char* to) /* in: new name of the table */
|
|
{
|
|
ulint name_len1;
|
|
ulint name_len2;
|
|
int error;
|
|
trx_t* trx;
|
|
char norm_from[1000];
|
|
char norm_to[1000];
|
|
|
|
DBUG_ENTER("ha_innobase::rename_table");
|
|
|
|
trx = trx_allocate_for_mysql();
|
|
|
|
name_len1 = strlen(from);
|
|
name_len2 = strlen(to);
|
|
|
|
assert(name_len1 < 1000);
|
|
assert(name_len2 < 1000);
|
|
|
|
normalize_table_name(norm_from, from);
|
|
normalize_table_name(norm_to, to);
|
|
|
|
/* Rename the table in InnoDB */
|
|
|
|
error = row_rename_table_for_mysql(norm_from, norm_to, trx);
|
|
|
|
/* Tell the InnoDB server that there might be work for
|
|
utility threads: */
|
|
|
|
srv_active_wake_master_thread();
|
|
|
|
trx_free_for_mysql(trx);
|
|
|
|
error = convert_error_code_to_mysql(error);
|
|
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
/*************************************************************************
|
|
Estimates the number of index records in a range. */
|
|
|
|
ha_rows
|
|
ha_innobase::records_in_range(
|
|
/*==========================*/
|
|
/* out: estimated number of rows,
|
|
currently 32-bit int or uint */
|
|
int keynr, /* in: index number */
|
|
const mysql_byte* start_key, /* in: start key value of the
|
|
range, may also be empty */
|
|
uint start_key_len, /* in: start key val len, may
|
|
also be 0 */
|
|
enum ha_rkey_function start_search_flag,/* in: start search condition
|
|
e.g., 'greater than' */
|
|
const mysql_byte* end_key, /* in: range end key val, may
|
|
also be empty */
|
|
uint end_key_len, /* in: range end key val len,
|
|
may also be 0 */
|
|
enum ha_rkey_function end_search_flag)/* in: range end search cond */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
KEY* key;
|
|
dict_index_t* index;
|
|
mysql_byte* key_val_buff2 = (mysql_byte*) my_malloc(
|
|
table->reclength,
|
|
MYF(MY_WME));
|
|
dtuple_t* range_start;
|
|
dtuple_t* range_end;
|
|
ulint n_rows;
|
|
ulint mode1;
|
|
ulint mode2;
|
|
void* heap1;
|
|
void* heap2;
|
|
|
|
DBUG_ENTER("records_in_range");
|
|
|
|
if (prebuilt->trx) {
|
|
prebuilt->trx->op_info = (char*) "estimating range size";
|
|
}
|
|
|
|
active_index = keynr;
|
|
|
|
key = table->key_info + active_index;
|
|
|
|
index = dict_table_get_index_noninline(prebuilt->table, key->name);
|
|
|
|
range_start = dtuple_create_for_mysql(&heap1, key->key_parts);
|
|
dict_index_copy_types(range_start, index, key->key_parts);
|
|
|
|
range_end = dtuple_create_for_mysql(&heap2, key->key_parts);
|
|
dict_index_copy_types(range_end, index, key->key_parts);
|
|
|
|
row_sel_convert_mysql_key_to_innobase(
|
|
range_start, (byte*) key_val_buff, index,
|
|
(byte*) start_key,
|
|
(ulint) start_key_len);
|
|
|
|
row_sel_convert_mysql_key_to_innobase(
|
|
range_end, (byte*) key_val_buff2, index,
|
|
(byte*) end_key,
|
|
(ulint) end_key_len);
|
|
|
|
mode1 = convert_search_mode_to_innobase(start_search_flag);
|
|
mode2 = convert_search_mode_to_innobase(end_search_flag);
|
|
|
|
n_rows = btr_estimate_n_rows_in_range(index, range_start,
|
|
mode1, range_end, mode2);
|
|
dtuple_free_for_mysql(heap1);
|
|
dtuple_free_for_mysql(heap2);
|
|
|
|
my_free((char*) key_val_buff2, MYF(0));
|
|
|
|
if (prebuilt->trx) {
|
|
prebuilt->trx->op_info = (char*) "";
|
|
}
|
|
|
|
DBUG_RETURN((ha_rows) n_rows);
|
|
}
|
|
|
|
/*************************************************************************
|
|
Gives an UPPER BOUND to the number of rows in a table. This is used in
|
|
filesort.cc and the upper bound must hold. TODO: Since the number of
|
|
rows in a table may change after this function is called, we still may
|
|
get a 'Sort aborted' error in filesort.cc of MySQL. The ultimate fix is to
|
|
improve the algorithm of filesort.cc. */
|
|
|
|
ha_rows
|
|
ha_innobase::estimate_number_of_rows(void)
|
|
/*======================================*/
|
|
/* out: upper bound of rows */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
dict_index_t* index;
|
|
ulonglong estimate;
|
|
ulonglong data_file_length;
|
|
|
|
if (prebuilt->trx) {
|
|
prebuilt->trx->op_info =
|
|
(char*) "estimating upper bound of table size";
|
|
}
|
|
|
|
DBUG_ENTER("info");
|
|
|
|
dict_update_statistics(prebuilt->table);
|
|
|
|
index = dict_table_get_first_index_noninline(prebuilt->table);
|
|
|
|
data_file_length = ((ulonglong) index->stat_n_leaf_pages)
|
|
* UNIV_PAGE_SIZE;
|
|
/* Calculate a minimum length for a clustered index record */
|
|
|
|
estimate = data_file_length / dict_index_calc_min_rec_len(index);
|
|
|
|
if (prebuilt->trx) {
|
|
prebuilt->trx->op_info = (char*) "";
|
|
}
|
|
|
|
return((ha_rows) estimate);
|
|
}
|
|
|
|
/*************************************************************************
|
|
How many seeks it will take to read through the table. This is to be
|
|
comparable to the number returned by records_in_range so that we can
|
|
decide if we should scan the table or use keys. */
|
|
|
|
double
|
|
ha_innobase::scan_time()
|
|
/*====================*/
|
|
/* out: estimated time measured in disk seeks */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
|
|
/* In the following formula we assume that scanning 10 pages
|
|
takes the same time as a disk seek: */
|
|
|
|
return((double) (prebuilt->table->stat_clustered_index_size / 10));
|
|
}
|
|
|
|
/*************************************************************************
|
|
Returns statistics information of the table to the MySQL interpreter,
|
|
in various fields of the handle object. */
|
|
|
|
void
|
|
ha_innobase::info(
|
|
/*==============*/
|
|
uint flag) /* in: what information MySQL requests */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
dict_table_t* ib_table;
|
|
dict_index_t* index;
|
|
ulong rec_per_key;
|
|
ulong j;
|
|
ulong i;
|
|
|
|
DBUG_ENTER("info");
|
|
|
|
if (prebuilt->trx) {
|
|
prebuilt->trx->op_info = (char*) "calculating table stats";
|
|
}
|
|
|
|
ib_table = prebuilt->table;
|
|
|
|
if (flag & HA_STATUS_TIME) {
|
|
/* In sql_show we call with this flag: update then statistics
|
|
so that they are up-to-date */
|
|
|
|
dict_update_statistics(ib_table);
|
|
}
|
|
|
|
if (flag & HA_STATUS_VARIABLE) {
|
|
records = (ha_rows)ib_table->stat_n_rows;
|
|
deleted = 0;
|
|
data_file_length = ((ulonglong)
|
|
ib_table->stat_clustered_index_size)
|
|
* UNIV_PAGE_SIZE;
|
|
index_file_length = ((ulonglong)
|
|
ib_table->stat_sum_of_other_index_sizes)
|
|
* UNIV_PAGE_SIZE;
|
|
delete_length = 0;
|
|
check_time = 0;
|
|
|
|
if (records == 0) {
|
|
mean_rec_length = 0;
|
|
} else {
|
|
mean_rec_length = (ulong) (data_file_length / records);
|
|
}
|
|
}
|
|
|
|
if (flag & HA_STATUS_CONST) {
|
|
index = dict_table_get_first_index_noninline(ib_table);
|
|
|
|
if (prebuilt->clust_index_was_generated) {
|
|
index = dict_table_get_next_index_noninline(index);
|
|
}
|
|
|
|
for (i = 0; i < table->keys; i++) {
|
|
for (j = 0; j < table->key_info[i].key_parts; j++) {
|
|
|
|
if (index->stat_n_diff_key_vals[j + 1] == 0) {
|
|
|
|
rec_per_key = records;
|
|
} else {
|
|
rec_per_key = (ulong)(records /
|
|
index->stat_n_diff_key_vals[j + 1]);
|
|
}
|
|
|
|
if (rec_per_key == 0) {
|
|
rec_per_key = 1;
|
|
}
|
|
|
|
table->key_info[i].rec_per_key[j]
|
|
= rec_per_key;
|
|
}
|
|
|
|
index = dict_table_get_next_index_noninline(index);
|
|
}
|
|
}
|
|
|
|
/* The trx struct in InnoDB contains a pthread mutex embedded:
|
|
in the debug version of MySQL that it replaced by a 'safe mutex'
|
|
which is of a different size. We have to use a function to access
|
|
trx fields. Otherwise trx->error_info will be a random
|
|
pointer and cause a seg fault. */
|
|
|
|
if (flag & HA_STATUS_ERRKEY) {
|
|
errkey = (unsigned int) row_get_mysql_key_number_for_index(
|
|
(dict_index_t*)
|
|
trx_get_error_info(prebuilt->trx));
|
|
}
|
|
|
|
if (prebuilt->trx) {
|
|
prebuilt->trx->op_info = (char*) "";
|
|
}
|
|
|
|
DBUG_VOID_RETURN;
|
|
}
|
|
|
|
/***********************************************************************
|
|
Tries to check that an InnoDB table is not corrupted. If corruption is
|
|
noticed, prints to stderr information about it. In case of corruption
|
|
may also assert a failure and crash the server. */
|
|
|
|
int
|
|
ha_innobase::check(
|
|
/*===============*/
|
|
/* out: HA_ADMIN_CORRUPT or
|
|
HA_ADMIN_OK */
|
|
THD* thd, /* in: user thread handle */
|
|
HA_CHECK_OPT* check_opt) /* in: check options, currently
|
|
ignored */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
ulint ret;
|
|
|
|
if (prebuilt->mysql_template == NULL) {
|
|
/* Build the template; we will use a dummy template
|
|
in index scans done in checking */
|
|
|
|
build_template(prebuilt, NULL, table, ROW_MYSQL_WHOLE_ROW);
|
|
}
|
|
|
|
ret = row_check_table_for_mysql(prebuilt);
|
|
|
|
if (ret == DB_SUCCESS) {
|
|
return(HA_ADMIN_OK);
|
|
}
|
|
|
|
return(HA_ADMIN_CORRUPT);
|
|
}
|
|
|
|
/*****************************************************************
|
|
Adds information about free space in the InnoDB tablespace to a
|
|
table comment which is printed out when a user calls SHOW TABLE STATUS. */
|
|
|
|
char*
|
|
ha_innobase::update_table_comment(
|
|
/*==============================*/
|
|
const char* comment)
|
|
{
|
|
uint length=strlen(comment);
|
|
|
|
char *str=my_malloc(length + 100,MYF(0)), *pos;
|
|
|
|
if (!str)
|
|
return (char*)comment;
|
|
|
|
pos=str;
|
|
if (length)
|
|
{
|
|
pos=strmov(str,comment);
|
|
*pos++=';';
|
|
*pos++=' ';
|
|
}
|
|
sprintf(pos, "InnoDB free: %lu kB", (ulong) innobase_get_free_space());
|
|
|
|
return(str);
|
|
}
|
|
|
|
/****************************************************************************
|
|
Handling the shared INNOBASE_SHARE structure that is needed to provide table
|
|
locking.
|
|
****************************************************************************/
|
|
|
|
static mysql_byte* innobase_get_key(INNOBASE_SHARE *share,uint *length,
|
|
my_bool not_used __attribute__((unused)))
|
|
{
|
|
*length=share->table_name_length;
|
|
return (mysql_byte*) share->table_name;
|
|
}
|
|
|
|
static INNOBASE_SHARE *get_share(const char *table_name)
|
|
{
|
|
INNOBASE_SHARE *share;
|
|
pthread_mutex_lock(&innobase_mutex);
|
|
uint length=(uint) strlen(table_name);
|
|
if (!(share=(INNOBASE_SHARE*) hash_search(&innobase_open_tables,
|
|
(mysql_byte*) table_name,
|
|
length)))
|
|
{
|
|
if ((share=(INNOBASE_SHARE *) my_malloc(sizeof(*share)+length+1,
|
|
MYF(MY_WME | MY_ZEROFILL))))
|
|
{
|
|
share->table_name_length=length;
|
|
share->table_name=(char*) (share+1);
|
|
strmov(share->table_name,table_name);
|
|
if (hash_insert(&innobase_open_tables, (mysql_byte*) share))
|
|
{
|
|
pthread_mutex_unlock(&innobase_mutex);
|
|
my_free((gptr) share,0);
|
|
return 0;
|
|
}
|
|
thr_lock_init(&share->lock);
|
|
pthread_mutex_init(&share->mutex,MY_MUTEX_INIT_FAST);
|
|
}
|
|
}
|
|
share->use_count++;
|
|
pthread_mutex_unlock(&innobase_mutex);
|
|
return share;
|
|
}
|
|
|
|
static void free_share(INNOBASE_SHARE *share)
|
|
{
|
|
pthread_mutex_lock(&innobase_mutex);
|
|
if (!--share->use_count)
|
|
{
|
|
hash_delete(&innobase_open_tables, (mysql_byte*) share);
|
|
thr_lock_delete(&share->lock);
|
|
pthread_mutex_destroy(&share->mutex);
|
|
my_free((gptr) share, MYF(0));
|
|
}
|
|
pthread_mutex_unlock(&innobase_mutex);
|
|
}
|
|
|
|
/*********************************************************************
|
|
Stores a MySQL lock into a 'lock' field in a handle. */
|
|
|
|
THR_LOCK_DATA**
|
|
ha_innobase::store_lock(
|
|
/*====================*/
|
|
/* out: pointer to the next
|
|
element in the 'to' array */
|
|
THD* thd, /* in: user thread handle */
|
|
THR_LOCK_DATA** to, /* in: pointer to an array
|
|
of pointers to lock structs;
|
|
pointer to the 'lock' field
|
|
of current handle is stored
|
|
next to this array */
|
|
enum thr_lock_type lock_type) /* in: lock type to store in
|
|
'lock' */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
|
|
if (lock_type == TL_READ_WITH_SHARED_LOCKS ||
|
|
lock_type == TL_READ_NO_INSERT) {
|
|
/* This is a SELECT ... IN SHARE MODE, or
|
|
we are doing a complex SQL statement like
|
|
INSERT INTO ... SELECT ... and the logical logging
|
|
requires the use of a locking read */
|
|
|
|
prebuilt->select_lock_type = LOCK_S;
|
|
} else {
|
|
/* We set possible LOCK_X value in external_lock, not yet
|
|
here even if this would be SELECT ... FOR UPDATE */
|
|
|
|
prebuilt->select_lock_type = LOCK_NONE;
|
|
}
|
|
|
|
if (lock_type != TL_IGNORE && lock.type == TL_UNLOCK) {
|
|
|
|
/* If we are not doing a LOCK TABLE, then allow multiple
|
|
writers */
|
|
|
|
if ((lock_type >= TL_WRITE_CONCURRENT_INSERT &&
|
|
lock_type <= TL_WRITE) && !thd->in_lock_tables) {
|
|
|
|
lock_type = TL_WRITE_ALLOW_WRITE;
|
|
}
|
|
|
|
lock.type=lock_type;
|
|
}
|
|
|
|
*to++= &lock;
|
|
|
|
return(to);
|
|
}
|
|
|
|
/***********************************************************************
|
|
Returns the next auto-increment column value for the table. write_row
|
|
normally fetches the value from the cache in the data dictionary. This
|
|
function in used by SHOW TABLE STATUS and when the first insert to the table
|
|
is done after database startup. */
|
|
|
|
longlong
|
|
ha_innobase::get_auto_increment()
|
|
/*=============================*/
|
|
/* out: the next auto-increment column value */
|
|
{
|
|
row_prebuilt_t* prebuilt = (row_prebuilt_t*) innobase_prebuilt;
|
|
longlong nr;
|
|
int error;
|
|
|
|
(void) extra(HA_EXTRA_KEYREAD);
|
|
index_init(table->next_number_index);
|
|
|
|
/* We use an exclusive lock when we read the max key value from the
|
|
auto-increment column index. This is because then build_template will
|
|
advise InnoDB to fetch all columns. In SHOW TABLE STATUS the query
|
|
id of the auto-increment column is not changed, and previously InnoDB
|
|
did not fetch it, causing SHOW TABLE STATUS to show wrong values
|
|
for the autoinc column. */
|
|
|
|
prebuilt->select_lock_type = LOCK_X;
|
|
prebuilt->trx->mysql_n_tables_locked += 1;
|
|
|
|
error=index_last(table->record[1]);
|
|
|
|
if (error) {
|
|
nr = 1;
|
|
} else {
|
|
nr = (longlong) table->next_number_field->
|
|
val_int_offset(table->rec_buff_length) + 1;
|
|
}
|
|
|
|
(void) extra(HA_EXTRA_NO_KEYREAD);
|
|
|
|
index_end();
|
|
|
|
return(nr);
|
|
}
|
|
|
|
|
|
#endif /* HAVE_INNOBASE_DB */
|