2008-02-05 16:00:53 +00:00
# ifdef USE_PRAGMA_IMPLEMENTATION
2008-02-07 20:19:44 +00:00
# pragma implementation // gcc: Class implementation
2008-02-05 16:00:53 +00:00
# endif
# define MYSQL_SERVER 1
2012-07-18 17:29:49 +00:00
# include "hatoku_defines.h"
2009-03-25 20:25:06 +00:00
# include "hatoku_cmp.h"
2008-12-22 20:08:10 +00:00
extern " C " {
# include "stdint.h"
# if defined(_WIN32)
# include "misc.h"
# endif
}
2008-02-05 16:00:53 +00:00
2008-05-02 17:36:22 +00:00
static inline void * thd_data_get ( THD * thd , int slot ) {
return thd - > ha_data [ slot ] . ha_ptr ;
}
static inline void thd_data_set ( THD * thd , int slot , void * data ) {
thd - > ha_data [ slot ] . ha_ptr = data ;
}
2008-02-05 16:00:53 +00:00
# undef PACKAGE
# undef VERSION
# undef HAVE_DTRACE
# undef _DTRACE_VERSION
/* We define DTRACE after mysql_priv.h in case it disabled dtrace in the main server */
# ifdef HAVE_DTRACE
# define _DTRACE_VERSION 1
# else
# endif
# include "ha_tokudb.h"
2008-11-18 22:20:06 +00:00
# include "hatoku_hton.h"
2008-02-05 16:00:53 +00:00
# include <mysql/plugin.h>
2009-04-17 18:29:25 +00:00
static const char * ha_tokudb_exts [ ] = {
ha_tokudb_ext ,
NullS
} ;
2009-04-13 21:23:37 +00:00
2009-04-17 18:29:25 +00:00
//
// This offset is calculated starting from AFTER the NULL bytes
//
2012-07-25 20:48:53 +00:00
static inline uint32_t get_fixed_field_size ( KEY_AND_COL_INFO * kc_info , TABLE_SHARE * table_share , uint keynr ) {
2009-04-17 18:29:25 +00:00
uint offset = 0 ;
for ( uint i = 0 ; i < table_share - > fields ; i + + ) {
2010-01-11 18:14:37 +00:00
if ( kc_info - > field_lengths [ i ] & & ! bitmap_is_set ( & kc_info - > key_filters [ keynr ] , i ) ) {
offset + = kc_info - > field_lengths [ i ] ;
2009-04-17 18:29:25 +00:00
}
}
return offset ;
}
2012-07-25 20:48:53 +00:00
static inline uint32_t get_len_of_offsets ( KEY_AND_COL_INFO * kc_info , TABLE_SHARE * table_share , uint keynr ) {
2009-04-17 18:29:25 +00:00
uint len = 0 ;
for ( uint i = 0 ; i < table_share - > fields ; i + + ) {
2010-01-11 18:14:37 +00:00
if ( kc_info - > length_bytes [ i ] & & ! bitmap_is_set ( & kc_info - > key_filters [ keynr ] , i ) ) {
len + = kc_info - > num_offset_bytes ;
2009-04-17 18:29:25 +00:00
}
}
return len ;
}
2010-01-20 21:14:23 +00:00
static int allocate_key_and_col_info ( TABLE_SHARE * table_share , KEY_AND_COL_INFO * kc_info ) {
2010-01-11 18:14:37 +00:00
int error ;
//
// initialize all of the bitmaps
//
for ( uint i = 0 ; i < MAX_KEY + 1 ; i + + ) {
error = bitmap_init (
& kc_info - > key_filters [ i ] ,
NULL ,
table_share - > fields ,
false
) ;
if ( error ) {
goto exit ;
}
}
//
// create the field lengths
//
2012-07-25 20:48:53 +00:00
kc_info - > field_lengths = ( uint16_t * ) my_malloc ( table_share - > fields * sizeof ( uint16_t ) , MYF ( MY_WME | MY_ZEROFILL ) ) ;
2010-01-11 18:14:37 +00:00
kc_info - > length_bytes = ( uchar * ) my_malloc ( table_share - > fields , MYF ( MY_WME | MY_ZEROFILL ) ) ;
2012-07-25 20:48:53 +00:00
kc_info - > blob_fields = ( uint32_t * ) my_malloc ( table_share - > fields * sizeof ( uint32_t ) , MYF ( MY_WME | MY_ZEROFILL ) ) ;
2010-01-11 18:14:37 +00:00
if ( kc_info - > field_lengths = = NULL | |
kc_info - > length_bytes = = NULL | |
kc_info - > blob_fields = = NULL ) {
error = ENOMEM ;
goto exit ;
}
exit :
if ( error ) {
for ( uint i = 0 ; MAX_KEY + 1 ; i + + ) {
bitmap_free ( & kc_info - > key_filters [ i ] ) ;
}
my_free ( kc_info - > field_lengths , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
my_free ( kc_info - > length_bytes , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
my_free ( kc_info - > blob_fields , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
}
return error ;
}
2008-02-05 16:00:53 +00:00
/** @brief
Simple lock controls . The " share " it creates is a structure we will
pass to each tokudb handler . Do you have to have one of these ? Well , you have
pieces that are used for locking , and they are needed to function .
*/
2010-01-20 21:14:23 +00:00
static TOKUDB_SHARE * get_share ( const char * table_name , TABLE_SHARE * table_share ) {
2009-04-17 18:29:25 +00:00
TOKUDB_SHARE * share = NULL ;
int error = 0 ;
2008-02-07 20:19:44 +00:00
uint length ;
2008-02-05 16:00:53 +00:00
2008-02-07 20:19:44 +00:00
pthread_mutex_lock ( & tokudb_mutex ) ;
length = ( uint ) strlen ( table_name ) ;
2010-01-20 21:25:11 +00:00
if ( ! ( share = ( TOKUDB_SHARE * ) my_hash_search ( & tokudb_open_tables , ( uchar * ) table_name , length ) ) ) {
2008-02-07 20:19:44 +00:00
char * tmp_name ;
2008-06-28 01:52:30 +00:00
//
// create share and fill it with all zeroes
// hence, all pointers are initialized to NULL
//
2008-02-20 21:31:18 +00:00
if ( ! ( share = ( TOKUDB_SHARE * )
my_multi_malloc ( MYF ( MY_WME | MY_ZEROFILL ) ,
& share , sizeof ( * share ) ,
& tmp_name , length + 1 ,
NullS ) ) ) {
2008-02-07 20:19:44 +00:00
pthread_mutex_unlock ( & tokudb_mutex ) ;
return NULL ;
}
share - > use_count = 0 ;
share - > table_name_length = length ;
share - > table_name = tmp_name ;
strmov ( share - > table_name , table_name ) ;
2008-02-05 16:00:53 +00:00
2010-01-11 18:14:37 +00:00
error = allocate_key_and_col_info ( table_share , & share - > kc_info ) ;
if ( error ) {
2009-04-17 18:29:25 +00:00
goto exit ;
}
2012-05-09 18:36:52 +00:00
memset ( ( void * ) share - > key_file , 0 , sizeof ( share - > key_file ) ) ;
2008-02-07 20:19:44 +00:00
2009-04-17 18:29:25 +00:00
error = my_hash_insert ( & tokudb_open_tables , ( uchar * ) share ) ;
if ( error ) {
goto exit ;
}
2008-02-07 20:19:44 +00:00
thr_lock_init ( & share - > lock ) ;
pthread_mutex_init ( & share - > mutex , MY_MUTEX_INIT_FAST ) ;
2010-11-17 23:09:06 +00:00
my_rwlock_init ( & share - > num_DBs_lock , 0 ) ;
2008-02-05 16:00:53 +00:00
}
2009-04-17 18:29:25 +00:00
exit :
if ( error ) {
pthread_mutex_destroy ( & share - > mutex ) ;
my_free ( ( uchar * ) share , MYF ( 0 ) ) ;
share = NULL ;
}
2010-07-10 18:42:04 +00:00
pthread_mutex_unlock ( & tokudb_mutex ) ;
2008-02-07 20:19:44 +00:00
return share ;
2008-02-05 16:00:53 +00:00
}
2010-01-11 18:14:37 +00:00
2012-05-23 17:51:36 +00:00
static void free_key_and_col_info ( KEY_AND_COL_INFO * kc_info ) {
2010-01-11 18:14:37 +00:00
for ( uint i = 0 ; i < MAX_KEY + 1 ; i + + ) {
bitmap_free ( & kc_info - > key_filters [ i ] ) ;
}
for ( uint i = 0 ; i < MAX_KEY + 1 ; i + + ) {
my_free ( kc_info - > cp_info [ i ] , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
2010-12-17 15:47:52 +00:00
kc_info - > cp_info [ i ] = NULL ; // 3144
2010-01-11 18:14:37 +00:00
}
my_free ( kc_info - > field_lengths , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
my_free ( kc_info - > length_bytes , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
my_free ( kc_info - > blob_fields , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
}
2009-04-02 15:24:14 +00:00
static int free_share ( TOKUDB_SHARE * share , bool mutex_is_locked ) {
2008-02-07 20:19:44 +00:00
int error , result = 0 ;
pthread_mutex_lock ( & tokudb_mutex ) ;
if ( mutex_is_locked )
pthread_mutex_unlock ( & share - > mutex ) ;
if ( ! - - share - > use_count ) {
DBUG_PRINT ( " info " , ( " share->use_count %u " , share - > use_count ) ) ;
2008-06-28 01:52:30 +00:00
//
// number of open DB's may not be equal to number of keys we have because add_index
// may have added some. So, we loop through entire array and close any non-NULL value
// It is imperative that we reset a DB to NULL once we are done with it.
//
for ( uint i = 0 ; i < sizeof ( share - > key_file ) / sizeof ( share - > key_file [ 0 ] ) ; i + + ) {
if ( tokudb_debug & TOKUDB_DEBUG_OPEN ) {
TOKUDB_TRACE ( " dbclose:%p \n " , share - > key_file [ i ] ) ;
}
if ( share - > key_file [ i ] ) {
error = share - > key_file [ i ] - > close ( share - > key_file [ i ] , 0 ) ;
2009-12-03 15:49:42 +00:00
assert ( error = = 0 ) ;
2008-06-28 01:52:30 +00:00
if ( error ) {
result = error ;
}
share - > key_file [ i ] = NULL ;
}
2008-02-07 20:19:44 +00:00
}
2009-04-17 18:29:25 +00:00
2010-01-11 18:14:37 +00:00
free_key_and_col_info ( & share - > kc_info ) ;
2008-02-07 20:19:44 +00:00
2008-06-28 01:52:30 +00:00
if ( share - > status_block & & ( error = share - > status_block - > close ( share - > status_block , 0 ) ) ) {
2009-12-03 15:49:42 +00:00
assert ( error = = 0 ) ;
2008-02-07 20:19:44 +00:00
result = error ;
2008-06-28 01:52:30 +00:00
}
2008-02-07 20:19:44 +00:00
2010-01-20 21:25:11 +00:00
my_hash_delete ( & tokudb_open_tables , ( uchar * ) share ) ;
2008-02-07 20:19:44 +00:00
thr_lock_delete ( & share - > lock ) ;
pthread_mutex_destroy ( & share - > mutex ) ;
2010-11-17 23:09:06 +00:00
rwlock_destroy ( & share - > num_DBs_lock ) ;
2008-02-07 20:19:44 +00:00
my_free ( ( uchar * ) share , MYF ( 0 ) ) ;
}
pthread_mutex_unlock ( & tokudb_mutex ) ;
return result ;
2008-02-05 16:00:53 +00:00
}
2008-05-26 14:07:31 +00:00
2008-07-30 14:43:19 +00:00
# define HANDLE_INVALID_CURSOR() \
2008-06-10 17:03:09 +00:00
if ( cursor = = NULL ) { \
error = last_cursor_error ; \
goto cleanup ; \
}
2012-03-19 12:15:50 +00:00
const char * ha_tokudb : : table_type ( ) const {
extern const char * const tokudb_hton_name ;
return tokudb_hton_name ;
}
2008-02-05 16:00:53 +00:00
2012-03-19 12:15:50 +00:00
const char * ha_tokudb : : index_type ( uint inx ) {
return " BTREE " ;
}
2008-02-05 16:00:53 +00:00
2008-04-17 20:56:40 +00:00
/*
* returns NULL terminated file extension string
*/
2008-02-07 20:19:44 +00:00
const char * * ha_tokudb : : bas_ext ( ) const {
2008-05-05 18:38:04 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::bas_ext " ) ;
DBUG_RETURN ( ha_tokudb_exts ) ;
2008-02-07 20:19:44 +00:00
}
2010-03-05 20:21:08 +00:00
static inline bool is_insert_ignore ( THD * thd ) {
//
// from http://lists.mysql.com/internals/37735
//
return thd - > lex - > ignore & & thd - > lex - > duplicates = = DUP_ERROR ;
}
static inline bool is_replace_into ( THD * thd ) {
2010-05-19 16:26:23 +00:00
return thd - > lex - > duplicates = = DUP_REPLACE ;
2010-03-05 20:21:08 +00:00
}
2010-05-06 04:19:11 +00:00
static inline bool do_ignore_flag_optimization ( THD * thd , TABLE * table , bool opt_eligible ) {
2010-03-05 20:21:08 +00:00
uint pk_insert_mode = get_pk_insert_mode ( thd ) ;
return (
2010-05-06 04:19:11 +00:00
opt_eligible & &
2010-05-19 16:26:23 +00:00
( is_replace_into ( thd ) | | is_insert_ignore ( thd ) ) & &
2010-03-05 20:21:08 +00:00
( ( ! table - > triggers & & pk_insert_mode < 2 ) | | pk_insert_mode = = 0 )
) ;
}
2012-12-12 18:37:24 +00:00
static inline uint get_key_parts ( const KEY * key ) {
# if 50609 <= MYSQL_VERSION_ID && MYSQL_VERSION_ID <= 50699
2012-12-14 19:53:19 +00:00
return key - > user_defined_key_parts ;
2012-12-12 18:37:24 +00:00
# else
return key - > key_parts ;
# endif
}
2013-02-26 21:17:51 +00:00
# if TOKU_INCLUDE_EXTENDED_KEYS
static inline uint get_ext_key_parts ( const KEY * key ) {
2013-02-27 15:55:15 +00:00
# if 50609 <= MYSQL_VERSION_ID && MYSQL_VERSION_ID <= 50699
return key - > actual_key_parts ;
# elif defined(MARIADB_BASE_VERSION)
2013-02-26 21:17:51 +00:00
return key - > ext_key_parts ;
# else
2013-02-27 15:55:15 +00:00
# error
2013-02-26 21:17:51 +00:00
# endif
}
# endif
2010-03-05 20:21:08 +00:00
ulonglong ha_tokudb : : table_flags ( ) const {
2010-05-06 04:19:11 +00:00
return ( table & & do_ignore_flag_optimization ( ha_thd ( ) , table , share - > replace_into_fast ) ?
2010-03-05 20:21:08 +00:00
int_table_flags | HA_BINLOG_STMT_CAPABLE :
2011-03-25 12:08:58 +00:00
int_table_flags | HA_BINLOG_ROW_CAPABLE | HA_BINLOG_STMT_CAPABLE ) ;
2010-03-05 20:21:08 +00:00
}
2008-04-17 20:56:40 +00:00
//
// Returns a bit mask of capabilities of the key or its part specified by
// the arguments. The capabilities are defined in sql/handler.h.
//
2008-02-07 20:19:44 +00:00
ulong ha_tokudb : : index_flags ( uint idx , uint part , bool all_parts ) const {
2008-05-05 18:38:04 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::index_flags " ) ;
2010-04-30 14:51:09 +00:00
assert ( table_share ) ;
2008-02-07 20:19:44 +00:00
ulong flags = ( HA_READ_NEXT | HA_READ_PREV | HA_READ_ORDER | HA_KEYREAD_ONLY | HA_READ_RANGE ) ;
2013-02-20 21:45:09 +00:00
# if defined(MARIADB_BASE_VERSION) || (50600 <= MYSQL_VERSION_ID && MYSQL_VERSION_ID <= 50699)
2013-02-20 20:36:28 +00:00
flags | = HA_DO_INDEX_COND_PUSHDOWN ;
# endif
2010-04-30 14:51:09 +00:00
if ( table_share - > key_info [ idx ] . flags & HA_CLUSTERING ) {
flags | = HA_CLUSTERED_INDEX ;
}
2008-05-05 18:38:04 +00:00
DBUG_RETURN ( flags ) ;
2008-02-07 20:19:44 +00:00
}
2008-04-15 19:13:38 +00:00
2008-07-30 14:43:19 +00:00
//
// struct that will be used as a context for smart DBT callbacks
// contains parameters needed to complete the smart DBT cursor call
//
typedef struct smart_dbt_info {
ha_tokudb * ha ; //instance to ha_tokudb needed for reading the row
uchar * buf ; // output buffer where row will be written
uint keynr ; // index into share->key_file that represents DB we are currently operating on
} * SMART_DBT_INFO ;
2011-08-16 12:50:38 +00:00
typedef struct smart_dbt_bf_info {
ha_tokudb * ha ;
bool need_val ;
int direction ;
THD * thd ;
2013-02-20 20:36:28 +00:00
uchar * buf ;
2011-08-16 12:50:38 +00:00
} * SMART_DBT_BF_INFO ;
2009-08-20 17:01:16 +00:00
typedef struct index_read_info {
struct smart_dbt_info smart_dbt_info ;
int cmp ;
DBT * orig_key ;
} * INDEX_READ_INFO ;
2010-03-29 02:08:34 +00:00
2012-05-23 17:51:36 +00:00
static int ai_poll_fun ( void * extra , float progress ) {
2010-11-17 23:09:06 +00:00
LOADER_CONTEXT context = ( LOADER_CONTEXT ) extra ;
if ( context - > thd - > killed ) {
sprintf ( context - > write_status_msg , " The process has been killed, aborting add index. " ) ;
2010-11-22 17:20:27 +00:00
return ER_ABORTING_CONNECTION ;
2010-11-17 23:09:06 +00:00
}
2012-06-30 16:51:25 +00:00
float percentage = progress * 100 ;
sprintf ( context - > write_status_msg , " Adding of indexes about %.1f%% done " , percentage ) ;
2010-11-17 23:09:06 +00:00
thd_proc_info ( context - > thd , context - > write_status_msg ) ;
2012-06-30 16:51:25 +00:00
# ifdef HA_TOKUDB_HAS_THD_PROGRESS
thd_progress_report ( context - > thd , ( unsigned long long ) percentage , 100 ) ;
# endif
2010-11-17 23:09:06 +00:00
return 0 ;
}
2012-06-30 16:51:25 +00:00
static int loader_poll_fun ( void * extra , float progress ) {
2010-03-29 02:08:34 +00:00
LOADER_CONTEXT context = ( LOADER_CONTEXT ) extra ;
if ( context - > thd - > killed ) {
sprintf ( context - > write_status_msg , " The process has been killed, aborting bulk load. " ) ;
2010-11-22 17:20:27 +00:00
return ER_ABORTING_CONNECTION ;
2010-03-29 02:08:34 +00:00
}
2012-06-30 16:51:25 +00:00
float percentage = progress * 100 ;
sprintf ( context - > write_status_msg , " Loading of data about %.1f%% done " , percentage ) ;
2010-03-29 02:08:34 +00:00
thd_proc_info ( context - > thd , context - > write_status_msg ) ;
2012-06-30 16:51:25 +00:00
# ifdef HA_TOKUDB_HAS_THD_PROGRESS
thd_progress_report ( context - > thd , ( unsigned long long ) percentage , 100 ) ;
# endif
2010-03-29 02:08:34 +00:00
return 0 ;
}
2012-05-23 17:51:36 +00:00
static void loader_ai_err_fun ( DB * db , int i , int err , DBT * key , DBT * val , void * error_extra ) {
2010-03-29 02:08:34 +00:00
LOADER_CONTEXT context = ( LOADER_CONTEXT ) error_extra ;
assert ( context - > ha ) ;
context - > ha - > set_loader_error ( err ) ;
}
2012-05-23 17:51:36 +00:00
static void loader_dup_fun ( DB * db , int i , int err , DBT * key , DBT * val , void * error_extra ) {
2010-03-29 02:08:34 +00:00
LOADER_CONTEXT context = ( LOADER_CONTEXT ) error_extra ;
assert ( context - > ha ) ;
context - > ha - > set_loader_error ( err ) ;
if ( err = = DB_KEYEXIST ) {
context - > ha - > set_dup_value_for_pk ( key ) ;
}
2008-07-30 14:43:19 +00:00
}
2008-08-12 02:25:50 +00:00
//
// smart DBT callback function for optimize
// in optimize, we want to flatten DB by doing
// a full table scan. Therefore, we don't
// want to actually do anything with the data, hence
// callback does nothing
//
2009-07-27 14:52:30 +00:00
static int smart_dbt_do_nothing ( DBT const * key , DBT const * row , void * context ) {
2009-02-09 20:20:30 +00:00
return 0 ;
2008-08-12 02:25:50 +00:00
}
2009-09-10 20:52:19 +00:00
static int smart_dbt_metacallback ( DBT const * key , DBT const * row , void * context ) {
DBT * val = ( DBT * ) context ;
val - > data = my_malloc ( row - > size , MYF ( MY_WME | MY_ZEROFILL ) ) ;
2009-09-11 17:13:45 +00:00
if ( val - > data = = NULL ) return ENOMEM ;
memcpy ( val - > data , row - > data , row - > size ) ;
val - > size = row - > size ;
return 0 ;
2009-09-10 20:52:19 +00:00
}
2008-08-12 02:25:50 +00:00
2009-08-06 15:49:36 +00:00
static int
smart_dbt_callback_rowread_ptquery ( DBT const * key , DBT const * row , void * context ) {
SMART_DBT_INFO info = ( SMART_DBT_INFO ) context ;
2009-11-25 21:00:52 +00:00
info - > ha - > extract_hidden_primary_key ( info - > keynr , key ) ;
2009-08-06 15:57:33 +00:00
return info - > ha - > read_row_callback ( info - > buf , info - > keynr , row , key ) ;
2009-08-06 15:49:36 +00:00
}
2008-07-30 14:43:19 +00:00
//
// Smart DBT callback function in case where we have a covering index
//
2009-02-09 20:20:30 +00:00
static int
smart_dbt_callback_keyread ( DBT const * key , DBT const * row , void * context ) {
2008-07-30 14:43:19 +00:00
SMART_DBT_INFO info = ( SMART_DBT_INFO ) context ;
2009-11-25 21:00:52 +00:00
info - > ha - > extract_hidden_primary_key ( info - > keynr , key ) ;
info - > ha - > read_key_only ( info - > buf , info - > keynr , key ) ;
2009-02-09 20:20:30 +00:00
return 0 ;
2008-07-30 14:43:19 +00:00
}
//
// Smart DBT callback function in case where we do NOT have a covering index
//
2009-02-09 20:20:30 +00:00
static int
smart_dbt_callback_rowread ( DBT const * key , DBT const * row , void * context ) {
2009-04-20 02:36:43 +00:00
int error = 0 ;
2008-07-30 14:43:19 +00:00
SMART_DBT_INFO info = ( SMART_DBT_INFO ) context ;
2009-11-25 21:00:52 +00:00
info - > ha - > extract_hidden_primary_key ( info - > keynr , key ) ;
2009-04-20 02:36:43 +00:00
error = info - > ha - > read_primary_key ( info - > buf , info - > keynr , row , key ) ;
return error ;
2008-07-30 14:43:19 +00:00
}
2009-08-20 17:01:16 +00:00
//
// Smart DBT callback function in case where we have a covering index
//
static int
smart_dbt_callback_ir_keyread ( DBT const * key , DBT const * row , void * context ) {
INDEX_READ_INFO ir_info = ( INDEX_READ_INFO ) context ;
ir_info - > cmp = ir_info - > smart_dbt_info . ha - > prefix_cmp_dbts ( ir_info - > smart_dbt_info . keynr , ir_info - > orig_key , key ) ;
if ( ir_info - > cmp ) {
return 0 ;
}
return smart_dbt_callback_keyread ( key , row , & ir_info - > smart_dbt_info ) ;
}
2009-11-25 21:00:52 +00:00
static int
smart_dbt_callback_lookup ( DBT const * key , DBT const * row , void * context ) {
INDEX_READ_INFO ir_info = ( INDEX_READ_INFO ) context ;
ir_info - > cmp = ir_info - > smart_dbt_info . ha - > prefix_cmp_dbts ( ir_info - > smart_dbt_info . keynr , ir_info - > orig_key , key ) ;
return 0 ;
}
2009-08-20 17:01:16 +00:00
//
// Smart DBT callback function in case where we do NOT have a covering index
//
static int
smart_dbt_callback_ir_rowread ( DBT const * key , DBT const * row , void * context ) {
INDEX_READ_INFO ir_info = ( INDEX_READ_INFO ) context ;
ir_info - > cmp = ir_info - > smart_dbt_info . ha - > prefix_cmp_dbts ( ir_info - > smart_dbt_info . keynr , ir_info - > orig_key , key ) ;
if ( ir_info - > cmp ) {
return 0 ;
}
return smart_dbt_callback_rowread ( key , row , & ir_info - > smart_dbt_info ) ;
}
2008-07-30 14:43:19 +00:00
//
// macro for Smart DBT callback function,
// so we do not need to put this long line of code in multiple places
//
# define SMART_DBT_CALLBACK ( this->key_read ? smart_dbt_callback_keyread : smart_dbt_callback_rowread )
2009-08-20 17:01:16 +00:00
# define SMART_DBT_IR_CALLBACK ( this->key_read ? smart_dbt_callback_ir_keyread : smart_dbt_callback_ir_rowread )
2008-07-03 16:30:01 +00:00
2008-06-26 15:43:33 +00:00
//
// macro that modifies read flag for cursor operations depending on whether
// we have preacquired lock or not
//
2011-06-13 18:01:03 +00:00
# define SET_PRELOCK_FLAG(flg) ((flg) | (range_lock_grabbed ? (use_write_locks ? DB_PRELOCKED_WRITE : DB_PRELOCKED) : 0))
2008-08-18 18:35:32 +00:00
//
// This method retrieves the value of the auto increment column of a record in MySQL format
// This was basically taken from MyISAM
// Parameters:
// type - the type of the auto increment column (e.g. int, float, double...)
// offset - offset into the record where the auto increment column is stored
// [in] record - MySQL row whose auto increment value we want to extract
// Returns:
// The value of the auto increment column in record
//
ulonglong retrieve_auto_increment ( uint16 type , uint32 offset , const uchar * record )
{
2008-09-19 20:39:23 +00:00
const uchar * key ; /* Key */
2008-11-18 22:26:11 +00:00
ulonglong unsigned_autoinc = 0 ; /* Unsigned auto-increment */
longlong signed_autoinc = 0 ; /* Signed auto-increment */
2008-09-19 20:39:23 +00:00
enum { unsigned_type , signed_type } autoinc_type ;
float float_tmp ; /* Temporary variable */
double double_tmp ; /* Temporary variable */
key = ( ( uchar * ) record ) + offset ;
/* Set default autoincrement type */
autoinc_type = unsigned_type ;
switch ( type ) {
case HA_KEYTYPE_INT8 :
signed_autoinc = ( longlong ) * ( char * ) key ;
autoinc_type = signed_type ;
break ;
case HA_KEYTYPE_BINARY :
unsigned_autoinc = ( ulonglong ) * ( uchar * ) key ;
break ;
case HA_KEYTYPE_SHORT_INT :
signed_autoinc = ( longlong ) sint2korr ( key ) ;
autoinc_type = signed_type ;
break ;
case HA_KEYTYPE_USHORT_INT :
unsigned_autoinc = ( ulonglong ) uint2korr ( key ) ;
break ;
case HA_KEYTYPE_LONG_INT :
signed_autoinc = ( longlong ) sint4korr ( key ) ;
autoinc_type = signed_type ;
break ;
case HA_KEYTYPE_ULONG_INT :
unsigned_autoinc = ( ulonglong ) uint4korr ( key ) ;
break ;
case HA_KEYTYPE_INT24 :
signed_autoinc = ( longlong ) sint3korr ( key ) ;
autoinc_type = signed_type ;
break ;
case HA_KEYTYPE_UINT24 :
unsigned_autoinc = ( ulonglong ) uint3korr ( key ) ;
2008-08-18 18:35:32 +00:00
break ;
2008-09-19 20:39:23 +00:00
case HA_KEYTYPE_LONGLONG :
signed_autoinc = sint8korr ( key ) ;
autoinc_type = signed_type ;
break ;
case HA_KEYTYPE_ULONGLONG :
unsigned_autoinc = uint8korr ( key ) ;
break ;
/* The remaining two cases should not be used but are included for
compatibility */
case HA_KEYTYPE_FLOAT :
float4get ( float_tmp , key ) ; /* Note: float4get is a macro */
signed_autoinc = ( longlong ) float_tmp ;
autoinc_type = signed_type ;
break ;
case HA_KEYTYPE_DOUBLE :
float8get ( double_tmp , key ) ; /* Note: float8get is a macro */
signed_autoinc = ( longlong ) double_tmp ;
autoinc_type = signed_type ;
break ;
default :
DBUG_ASSERT ( 0 ) ;
unsigned_autoinc = 0 ;
}
if ( signed_autoinc < 0 ) {
signed_autoinc = 0 ;
}
return autoinc_type = = unsigned_type ?
unsigned_autoinc : ( ulonglong ) signed_autoinc ;
2008-08-18 18:35:32 +00:00
}
2012-05-23 17:51:36 +00:00
static inline bool
2008-09-17 19:32:10 +00:00
is_null_field ( TABLE * table , Field * field , const uchar * record ) {
2008-11-18 22:20:06 +00:00
uint null_offset ;
2008-09-17 19:32:10 +00:00
bool ret_val ;
2012-08-08 17:45:04 +00:00
if ( ! field - > real_maybe_null ( ) ) {
2008-11-18 22:20:06 +00:00
ret_val = false ;
2008-09-17 19:32:10 +00:00
goto exitpt ;
2008-11-18 22:20:06 +00:00
}
null_offset = get_null_offset ( table , field ) ;
2008-09-17 19:32:10 +00:00
ret_val = ( record [ null_offset ] & field - > null_bit ) ? true : false ;
exitpt :
2008-11-18 22:20:06 +00:00
return ret_val ;
}
2012-05-23 17:51:36 +00:00
static inline ulong field_offset ( Field * field , TABLE * table ) {
2008-11-18 22:20:06 +00:00
return ( ( ulong ) ( field - > ptr - table - > record [ 0 ] ) ) ;
2008-09-17 19:32:10 +00:00
}
2012-05-23 17:51:36 +00:00
static inline HA_TOKU_ISO_LEVEL tx_to_toku_iso ( ulong tx_isolation ) {
2008-10-08 18:29:32 +00:00
if ( tx_isolation = = ISO_READ_UNCOMMITTED ) {
return hatoku_iso_read_uncommitted ;
}
2010-04-06 17:16:02 +00:00
else if ( tx_isolation = = ISO_READ_COMMITTED ) {
return hatoku_iso_read_committed ;
}
2010-09-03 20:47:01 +00:00
else if ( tx_isolation = = ISO_REPEATABLE_READ ) {
return hatoku_iso_repeatable_read ;
}
2008-10-08 18:29:32 +00:00
else {
return hatoku_iso_serializable ;
}
}
2012-07-25 20:48:53 +00:00
static inline uint32_t toku_iso_to_txn_flag ( HA_TOKU_ISO_LEVEL lvl ) {
2008-10-08 18:29:32 +00:00
if ( lvl = = hatoku_iso_read_uncommitted ) {
2008-11-10 21:05:47 +00:00
return DB_READ_UNCOMMITTED ;
2008-10-08 18:29:32 +00:00
}
2010-04-06 17:16:02 +00:00
else if ( lvl = = hatoku_iso_read_committed ) {
return DB_READ_COMMITTED ;
}
2010-09-03 20:47:01 +00:00
else if ( lvl = = hatoku_iso_repeatable_read ) {
return DB_TXN_SNAPSHOT ;
}
2008-10-08 18:29:32 +00:00
else {
return 0 ;
}
}
2012-05-23 17:51:36 +00:00
static int filter_key_part_compare ( const void * left , const void * right ) {
2009-04-17 18:29:25 +00:00
FILTER_KEY_PART_INFO * left_part = ( FILTER_KEY_PART_INFO * ) left ;
FILTER_KEY_PART_INFO * right_part = ( FILTER_KEY_PART_INFO * ) right ;
return left_part - > offset - right_part - > offset ;
}
//
// Be very careful with parameters passed to this function. Who knows
// if key, table have proper info set. I had to verify by checking
// in the debugger.
//
void set_key_filter ( MY_BITMAP * key_filter , KEY * key , TABLE * table , bool get_offset_from_keypart ) {
FILTER_KEY_PART_INFO parts [ MAX_REF_PARTS ] ;
uint curr_skip_index = 0 ;
2012-12-12 18:37:24 +00:00
for ( uint i = 0 ; i < get_key_parts ( key ) ; i + + ) {
2009-04-17 18:29:25 +00:00
//
// horrendous hack due to bugs in mysql, basically
// we cannot always reliably get the offset from the same source
//
parts [ i ] . offset = get_offset_from_keypart ? key - > key_part [ i ] . offset : field_offset ( key - > key_part [ i ] . field , table ) ;
parts [ i ] . part_index = i ;
}
qsort (
parts , // start of array
2012-12-12 18:37:24 +00:00
get_key_parts ( key ) , //num elements
2009-04-17 18:29:25 +00:00
sizeof ( * parts ) , //size of each element
filter_key_part_compare
) ;
for ( uint i = 0 ; i < table - > s - > fields ; i + + ) {
Field * field = table - > field [ i ] ;
uint curr_field_offset = field_offset ( field , table ) ;
2012-12-12 18:37:24 +00:00
if ( curr_skip_index < get_key_parts ( key ) ) {
2009-04-17 18:29:25 +00:00
uint curr_skip_offset = 0 ;
curr_skip_offset = parts [ curr_skip_index ] . offset ;
if ( curr_skip_offset = = curr_field_offset ) {
//
// we have hit a field that is a portion of the primary key
//
uint curr_key_index = parts [ curr_skip_index ] . part_index ;
curr_skip_index + + ;
//
// only choose to continue over the key if the key's length matches the field's length
// otherwise, we may have a situation where the column is a varchar(10), the
// key is only the first 3 characters, and we end up losing the last 7 bytes of the
// column
//
2012-11-27 15:23:21 +00:00
TOKU_TYPE toku_type = mysql_to_toku_type ( field ) ;
switch ( toku_type ) {
case toku_type_blob :
2009-04-17 18:29:25 +00:00
break ;
2012-11-27 15:23:21 +00:00
case toku_type_varbinary :
case toku_type_varstring :
case toku_type_fixbinary :
case toku_type_fixstring :
2009-04-17 18:29:25 +00:00
if ( key - > key_part [ curr_key_index ] . length = = field - > field_length ) {
bitmap_set_bit ( key_filter , i ) ;
}
break ;
default :
bitmap_set_bit ( key_filter , i ) ;
break ;
}
}
}
}
}
2012-05-23 17:51:36 +00:00
static inline uchar * pack_fixed_field (
2009-04-17 18:29:25 +00:00
uchar * to_tokudb ,
const uchar * from_mysql ,
2012-07-25 20:48:53 +00:00
uint32_t num_bytes
2009-04-17 18:29:25 +00:00
)
{
switch ( num_bytes ) {
case ( 1 ) :
memcpy ( to_tokudb , from_mysql , 1 ) ;
break ;
case ( 2 ) :
memcpy ( to_tokudb , from_mysql , 2 ) ;
break ;
case ( 3 ) :
memcpy ( to_tokudb , from_mysql , 3 ) ;
break ;
case ( 4 ) :
memcpy ( to_tokudb , from_mysql , 4 ) ;
break ;
case ( 8 ) :
memcpy ( to_tokudb , from_mysql , 8 ) ;
break ;
default :
memcpy ( to_tokudb , from_mysql , num_bytes ) ;
break ;
}
return to_tokudb + num_bytes ;
}
2012-05-23 17:51:36 +00:00
static inline const uchar * unpack_fixed_field (
2009-04-17 18:29:25 +00:00
uchar * to_mysql ,
const uchar * from_tokudb ,
2012-07-25 20:48:53 +00:00
uint32_t num_bytes
2009-04-17 18:29:25 +00:00
)
{
switch ( num_bytes ) {
case ( 1 ) :
memcpy ( to_mysql , from_tokudb , 1 ) ;
break ;
case ( 2 ) :
memcpy ( to_mysql , from_tokudb , 2 ) ;
break ;
case ( 3 ) :
memcpy ( to_mysql , from_tokudb , 3 ) ;
break ;
case ( 4 ) :
memcpy ( to_mysql , from_tokudb , 4 ) ;
break ;
case ( 8 ) :
memcpy ( to_mysql , from_tokudb , 8 ) ;
break ;
default :
memcpy ( to_mysql , from_tokudb , num_bytes ) ;
break ;
}
return from_tokudb + num_bytes ;
}
2012-05-23 17:51:36 +00:00
static inline uchar * write_var_field (
2009-04-17 18:29:25 +00:00
uchar * to_tokudb_offset_ptr , //location where offset data is going to be written
2011-03-04 19:54:23 +00:00
uchar * to_tokudb_data , // location where data is going to be written
uchar * to_tokudb_offset_start , //location where offset starts, IS THIS A BAD NAME????
const uchar * data , // the data to write
2012-07-25 20:48:53 +00:00
uint32_t data_length , // length of data to write
uint32_t offset_bytes // number of offset bytes
2009-04-17 18:29:25 +00:00
)
{
2011-03-04 19:54:23 +00:00
memcpy ( to_tokudb_data , data , data_length ) ;
2009-04-17 18:29:25 +00:00
//
// for offset, we pack the offset where the data ENDS!
//
2012-07-25 20:48:53 +00:00
uint32_t offset = to_tokudb_data + data_length - to_tokudb_offset_start ;
2009-04-17 18:29:25 +00:00
switch ( offset_bytes ) {
case ( 1 ) :
to_tokudb_offset_ptr [ 0 ] = ( uchar ) offset ;
break ;
case ( 2 ) :
int2store ( to_tokudb_offset_ptr , offset ) ;
break ;
default :
assert ( false ) ;
break ;
}
return to_tokudb_data + data_length ;
}
2012-07-25 20:48:53 +00:00
static inline uint32_t get_var_data_length (
2011-03-04 19:54:23 +00:00
const uchar * from_mysql ,
2012-07-25 20:48:53 +00:00
uint32_t mysql_length_bytes
2011-03-04 19:54:23 +00:00
)
{
2012-07-25 20:48:53 +00:00
uint32_t data_length ;
2011-03-04 19:54:23 +00:00
switch ( mysql_length_bytes ) {
case ( 1 ) :
data_length = from_mysql [ 0 ] ;
break ;
case ( 2 ) :
data_length = uint2korr ( from_mysql ) ;
break ;
default :
assert ( false ) ;
break ;
}
return data_length ;
}
2012-05-23 17:51:36 +00:00
static inline uchar * pack_var_field (
2011-03-04 19:54:23 +00:00
uchar * to_tokudb_offset_ptr , //location where offset data is going to be written
uchar * to_tokudb_data , // pointer to where tokudb data should be written
uchar * to_tokudb_offset_start , //location where data starts, IS THIS A BAD NAME????
const uchar * from_mysql , // mysql data
2012-07-25 20:48:53 +00:00
uint32_t mysql_length_bytes , //number of bytes used to store length in from_mysql
uint32_t offset_bytes //number of offset_bytes used in tokudb row
2011-03-04 19:54:23 +00:00
)
{
uint data_length = get_var_data_length ( from_mysql , mysql_length_bytes ) ;
return write_var_field (
to_tokudb_offset_ptr ,
to_tokudb_data ,
to_tokudb_offset_start ,
from_mysql + mysql_length_bytes ,
data_length ,
offset_bytes
) ;
}
2012-05-23 17:51:36 +00:00
static inline void unpack_var_field (
2009-04-17 18:29:25 +00:00
uchar * to_mysql ,
const uchar * from_tokudb_data ,
2012-07-25 20:48:53 +00:00
uint32_t from_tokudb_data_len ,
uint32_t mysql_length_bytes
2009-04-17 18:29:25 +00:00
)
{
//
// store the length
//
switch ( mysql_length_bytes ) {
case ( 1 ) :
to_mysql [ 0 ] = ( uchar ) from_tokudb_data_len ;
break ;
case ( 2 ) :
int2store ( to_mysql , from_tokudb_data_len ) ;
break ;
default :
assert ( false ) ;
break ;
}
//
// store the data
//
memcpy ( to_mysql + mysql_length_bytes , from_tokudb_data , from_tokudb_data_len ) ;
}
2012-05-23 17:51:36 +00:00
static uchar * pack_toku_field_blob (
2009-06-10 18:51:38 +00:00
uchar * to_tokudb ,
const uchar * from_mysql ,
Field * field
)
{
2012-07-25 20:48:53 +00:00
uint32_t len_bytes = field - > row_pack_length ( ) ;
uint32_t length = 0 ;
2009-06-10 18:51:38 +00:00
uchar * data_ptr = NULL ;
memcpy ( to_tokudb , from_mysql , len_bytes ) ;
switch ( len_bytes ) {
case ( 1 ) :
2012-07-25 20:48:53 +00:00
length = ( uint32_t ) ( * from_mysql ) ;
2009-06-10 18:51:38 +00:00
break ;
case ( 2 ) :
length = uint2korr ( from_mysql ) ;
break ;
case ( 3 ) :
length = uint3korr ( from_mysql ) ;
break ;
case ( 4 ) :
length = uint4korr ( from_mysql ) ;
break ;
default :
assert ( false ) ;
}
if ( length > 0 ) {
memcpy_fixed ( ( uchar * ) ( & data_ptr ) , from_mysql + len_bytes , sizeof ( uchar * ) ) ;
memcpy ( to_tokudb + len_bytes , data_ptr , length ) ;
}
return ( to_tokudb + len_bytes + length ) ;
}
2009-09-10 20:52:19 +00:00
2009-11-10 19:22:08 +00:00
static int add_table_to_metadata ( const char * name , TABLE * table , DB_TXN * txn ) {
2009-09-10 20:52:19 +00:00
int error = 0 ;
DBT key ;
DBT val ;
uchar hidden_primary_key = ( table - > s - > primary_key > = MAX_KEY ) ;
2009-11-10 19:22:08 +00:00
assert ( txn ) ;
2009-09-10 20:52:19 +00:00
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & key , 0 , sizeof ( key ) ) ;
memset ( ( void * ) & val , 0 , sizeof ( val ) ) ;
2009-09-10 20:52:19 +00:00
key . data = ( void * ) name ;
key . size = strlen ( name ) + 1 ;
val . data = & hidden_primary_key ;
val . size = sizeof ( hidden_primary_key ) ;
error = metadata_db - > put (
metadata_db ,
txn ,
& key ,
& val ,
2011-06-06 21:08:45 +00:00
0
2009-09-10 20:52:19 +00:00
) ;
return error ;
}
2009-11-10 19:22:08 +00:00
static int drop_table_from_metadata ( const char * name , DB_TXN * txn ) {
2009-09-10 20:52:19 +00:00
int error = 0 ;
DBT key ;
DBT data ;
2009-11-10 19:22:08 +00:00
assert ( txn ) ;
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & key , 0 , sizeof ( key ) ) ;
memset ( ( void * ) & data , 0 , sizeof ( data ) ) ;
2009-09-10 20:52:19 +00:00
key . data = ( void * ) name ;
key . size = strlen ( name ) + 1 ;
error = metadata_db - > del (
metadata_db ,
txn ,
& key ,
DB_DELETE_ANY
) ;
return error ;
}
2009-11-10 19:22:08 +00:00
static int rename_table_in_metadata ( const char * from , const char * to , DB_TXN * txn ) {
2009-09-10 20:52:19 +00:00
int error = 0 ;
DBT from_key ;
2009-09-10 21:09:41 +00:00
DBT to_key ;
DBT val ;
2009-11-10 19:22:08 +00:00
assert ( txn ) ;
2009-09-10 20:52:19 +00:00
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & from_key , 0 , sizeof ( from_key ) ) ;
memset ( ( void * ) & to_key , 0 , sizeof ( to_key ) ) ;
memset ( ( void * ) & val , 0 , sizeof ( val ) ) ;
2009-09-10 20:52:19 +00:00
from_key . data = ( void * ) from ;
from_key . size = strlen ( from ) + 1 ;
to_key . data = ( void * ) to ;
to_key . size = strlen ( to ) + 1 ;
error = metadata_db - > getf_set (
metadata_db ,
txn ,
0 ,
& from_key ,
smart_dbt_metacallback ,
& val
) ;
if ( error ) {
2009-09-10 21:09:41 +00:00
goto cleanup ;
2009-09-10 20:52:19 +00:00
}
error = metadata_db - > put (
metadata_db ,
txn ,
& to_key ,
& val ,
2011-06-06 21:08:45 +00:00
0
2009-09-10 20:52:19 +00:00
) ;
2009-09-10 21:09:41 +00:00
if ( error ) {
goto cleanup ;
}
2009-09-10 20:52:19 +00:00
2009-09-10 21:09:41 +00:00
error = metadata_db - > del (
2009-09-10 20:52:19 +00:00
metadata_db ,
txn ,
& from_key ,
DB_DELETE_ANY
) ;
2009-09-10 21:09:41 +00:00
if ( error ) {
goto cleanup ;
}
2009-09-10 20:52:19 +00:00
error = 0 ;
cleanup :
my_free ( val . data , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
return error ;
}
2011-09-06 18:42:31 +00:00
static int check_table_in_metadata ( const char * name , bool * table_found , DB_TXN * txn ) {
2009-09-10 20:52:19 +00:00
int error = 0 ;
DBT key ;
pthread_mutex_lock ( & tokudb_meta_mutex ) ;
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & key , 0 , sizeof ( key ) ) ;
2009-09-10 20:52:19 +00:00
key . data = ( void * ) name ;
key . size = strlen ( name ) + 1 ;
error = metadata_db - > getf_set (
metadata_db ,
txn ,
0 ,
& key ,
smart_dbt_do_nothing ,
NULL
) ;
if ( error = = 0 ) {
* table_found = true ;
}
else if ( error = = DB_NOTFOUND ) {
* table_found = false ;
error = 0 ;
}
pthread_mutex_unlock ( & tokudb_meta_mutex ) ;
return error ;
}
2012-05-23 17:51:36 +00:00
static int create_tokudb_trx_data_instance ( tokudb_trx_data * * out_trx ) {
2009-09-29 21:47:37 +00:00
int error ;
tokudb_trx_data * trx = NULL ;
trx = ( tokudb_trx_data * ) my_malloc ( sizeof ( * trx ) , MYF ( MY_ZEROFILL ) ) ;
if ( ! trx ) {
error = ENOMEM ;
goto cleanup ;
}
* out_trx = trx ;
2009-09-30 12:23:33 +00:00
error = 0 ;
2009-09-29 21:47:37 +00:00
cleanup :
return error ;
}
2010-11-04 18:51:18 +00:00
2012-05-23 17:51:36 +00:00
static inline int tokudb_generate_row (
2010-01-21 19:24:11 +00:00
DB * dest_db ,
DB * src_db ,
DBT * dest_key ,
DBT * dest_val ,
const DBT * src_key ,
2010-11-15 14:24:42 +00:00
const DBT * src_val
2010-01-21 19:24:11 +00:00
)
{
2010-01-11 18:14:37 +00:00
int error ;
2010-01-21 19:24:11 +00:00
DB * curr_db = dest_db ;
uchar * row_desc = NULL ;
2012-07-25 20:48:53 +00:00
uint32_t desc_size ;
2010-01-21 19:24:11 +00:00
uchar * buff = NULL ;
2012-07-25 20:48:53 +00:00
uint32_t max_key_len = 0 ;
2010-01-11 18:14:37 +00:00
2010-05-28 21:08:32 +00:00
row_desc = ( uchar * ) curr_db - > descriptor - > dbt . data ;
2012-07-25 20:48:53 +00:00
row_desc + = ( * ( uint32_t * ) row_desc ) ;
desc_size = ( * ( uint32_t * ) row_desc ) - 4 ;
2010-01-21 19:24:11 +00:00
row_desc + = 4 ;
if ( is_key_pk ( row_desc , desc_size ) ) {
if ( dest_key - > flags = = DB_DBT_REALLOC & & dest_key - > data ! = NULL ) {
free ( dest_key - > data ) ;
}
2010-11-08 21:09:28 +00:00
if ( dest_val ! = NULL ) {
2010-11-04 18:51:18 +00:00
if ( dest_val - > flags = = DB_DBT_REALLOC & & dest_val - > data ! = NULL ) {
free ( dest_val - > data ) ;
}
2010-01-21 19:24:11 +00:00
}
dest_key - > data = src_key - > data ;
dest_key - > size = src_key - > size ;
2010-01-22 21:56:44 +00:00
dest_key - > flags = 0 ;
2010-11-08 21:09:28 +00:00
if ( dest_val ! = NULL ) {
2010-11-04 18:51:18 +00:00
dest_val - > data = src_val - > data ;
dest_val - > size = src_val - > size ;
dest_val - > flags = 0 ;
}
2010-01-21 19:24:11 +00:00
error = 0 ;
goto cleanup ;
}
2011-09-08 02:55:20 +00:00
// at this point, we need to create the key/val and set it
// in the DBTs
if ( dest_key - > flags = = 0 ) {
dest_key - > ulen = 0 ;
dest_key - > size = 0 ;
dest_key - > data = NULL ;
dest_key - > flags = DB_DBT_REALLOC ;
}
if ( dest_key - > flags = = DB_DBT_REALLOC ) {
2010-01-21 19:24:11 +00:00
max_key_len = max_key_size_from_desc ( row_desc , desc_size ) ;
max_key_len + = src_key - > size ;
2010-01-11 18:14:37 +00:00
2010-01-21 19:24:11 +00:00
if ( max_key_len > dest_key - > ulen ) {
void * old_ptr = dest_key - > data ;
void * new_ptr = NULL ;
new_ptr = realloc ( old_ptr , max_key_len ) ;
assert ( new_ptr ) ;
dest_key - > data = new_ptr ;
dest_key - > ulen = max_key_len ;
2010-01-11 18:14:37 +00:00
}
2010-01-21 19:24:11 +00:00
buff = ( uchar * ) dest_key - > data ;
assert ( buff ! = NULL & & max_key_len > 0 ) ;
}
else {
assert ( false ) ;
}
dest_key - > size = pack_key_from_desc (
buff ,
row_desc ,
desc_size ,
src_key ,
src_val
) ;
assert ( dest_key - > ulen > = dest_key - > size ) ;
if ( tokudb_debug & TOKUDB_DEBUG_CHECK_KEY & & ! max_key_len ) {
max_key_len = max_key_size_from_desc ( row_desc , desc_size ) ;
max_key_len + = src_key - > size ;
}
if ( max_key_len ) {
assert ( max_key_len > = dest_key - > size ) ;
}
row_desc + = desc_size ;
2012-07-25 20:48:53 +00:00
desc_size = ( * ( uint32_t * ) row_desc ) - 4 ;
2010-01-21 19:24:11 +00:00
row_desc + = 4 ;
2010-11-08 21:09:28 +00:00
if ( dest_val ! = NULL ) {
2012-06-04 20:40:17 +00:00
if ( ! is_key_clustering ( row_desc , desc_size ) | | src_val - > size = = 0 ) {
2010-11-04 18:51:18 +00:00
dest_val - > size = 0 ;
2010-01-11 18:14:37 +00:00
}
else {
2012-06-04 20:40:17 +00:00
uchar * buff = NULL ;
2011-09-08 02:55:20 +00:00
if ( dest_val - > flags = = 0 ) {
dest_val - > ulen = 0 ;
dest_val - > size = 0 ;
dest_val - > data = NULL ;
dest_val - > flags = DB_DBT_REALLOC ;
2010-11-04 18:51:18 +00:00
}
2011-09-08 02:55:20 +00:00
if ( dest_val - > flags = = DB_DBT_REALLOC ) {
2010-11-04 18:51:18 +00:00
if ( dest_val - > ulen < src_val - > size ) {
void * old_ptr = dest_val - > data ;
void * new_ptr = NULL ;
new_ptr = realloc ( old_ptr , src_val - > size ) ;
assert ( new_ptr ) ;
dest_val - > data = new_ptr ;
dest_val - > ulen = src_val - > size ;
}
buff = ( uchar * ) dest_val - > data ;
assert ( buff ! = NULL ) ;
}
else {
assert ( false ) ;
}
dest_val - > size = pack_clustering_val_from_desc (
buff ,
row_desc ,
desc_size ,
src_val
) ;
assert ( dest_val - > ulen > = dest_val - > size ) ;
2010-01-11 18:14:37 +00:00
}
}
error = 0 ;
2010-01-21 19:24:11 +00:00
cleanup :
2010-01-11 18:14:37 +00:00
return error ;
}
2012-05-23 17:51:36 +00:00
static int generate_row_for_del (
2010-11-04 18:51:18 +00:00
DB * dest_db ,
DB * src_db ,
DBT * dest_key ,
const DBT * src_key ,
2010-11-15 14:24:42 +00:00
const DBT * src_val
)
2010-11-04 18:51:18 +00:00
{
return tokudb_generate_row (
dest_db ,
src_db ,
dest_key ,
NULL ,
src_key ,
2010-11-15 14:24:42 +00:00
src_val
2010-11-04 18:51:18 +00:00
) ;
}
2012-05-23 17:51:36 +00:00
static int generate_row_for_put (
2010-11-04 18:51:18 +00:00
DB * dest_db ,
DB * src_db ,
DBT * dest_key ,
DBT * dest_val ,
const DBT * src_key ,
2010-11-15 20:02:32 +00:00
const DBT * src_val
2010-11-04 18:51:18 +00:00
)
{
return tokudb_generate_row (
dest_db ,
src_db ,
dest_key ,
dest_val ,
src_key ,
2010-11-15 14:24:42 +00:00
src_val
2010-11-04 18:51:18 +00:00
) ;
}
2009-04-17 18:29:25 +00:00
ha_tokudb : : ha_tokudb ( handlerton * hton , TABLE_SHARE * table_arg ) : handler ( hton , table_arg )
// flags defined in sql\handler.h
{
2012-08-14 21:24:38 +00:00
share = NULL ;
2009-06-02 19:39:54 +00:00
int_table_flags = HA_REC_NOT_IN_SEQ | HA_NULL_IN_KEY | HA_CAN_INDEX_BLOBS | HA_PRIMARY_KEY_IN_READ_INDEX |
2012-05-22 20:39:30 +00:00
HA_FILE_BASED | HA_AUTO_PART_KEY | HA_TABLE_SCAN_ON_INDEX | HA_CAN_WRITE_DURING_OPTIMIZE ;
2009-04-17 18:29:25 +00:00
alloc_ptr = NULL ;
rec_buff = NULL ;
2010-11-10 21:34:29 +00:00
rec_update_buff = NULL ;
2009-04-17 18:29:25 +00:00
transaction = NULL ;
2011-03-04 19:54:23 +00:00
is_fast_alter_running = false ;
2009-04-17 18:29:25 +00:00
cursor = NULL ;
fixed_cols_for_query = NULL ;
var_cols_for_query = NULL ;
num_fixed_cols_for_query = 0 ;
num_var_cols_for_query = 0 ;
unpack_entire_row = true ;
read_blobs = false ;
read_key = false ;
added_rows = 0 ;
deleted_rows = 0 ;
last_dup_key = UINT_MAX ;
using_ignore = 0 ;
last_cursor_error = 0 ;
range_lock_grabbed = false ;
2009-04-18 18:12:30 +00:00
blob_buff = NULL ;
num_blob_bytes = 0 ;
2009-07-27 14:52:30 +00:00
delay_updating_ai_metadata = false ;
ai_metadata_update_required = false ;
2012-05-09 18:36:52 +00:00
memset ( mult_key_dbt , 0 , sizeof ( mult_key_dbt ) ) ;
memset ( mult_rec_dbt , 0 , sizeof ( mult_rec_dbt ) ) ;
2010-03-29 02:08:34 +00:00
loader = NULL ;
abort_loader = false ;
2012-05-09 18:36:52 +00:00
memset ( & lc , 0 , sizeof ( lc ) ) ;
2010-09-03 20:47:01 +00:00
lock . type = TL_IGNORE ;
2012-07-25 20:48:53 +00:00
for ( uint32_t i = 0 ; i < MAX_KEY + 1 ; i + + ) {
2011-06-06 21:08:45 +00:00
mult_put_flags [ i ] = 0 ;
2010-11-04 18:51:18 +00:00
mult_del_flags [ i ] = DB_DELETE_ANY ;
2010-11-02 18:17:17 +00:00
mult_dbt_flags [ i ] = DB_DBT_REALLOC ;
}
2010-12-09 20:24:59 +00:00
num_DBs_locked_in_bulk = false ;
lock_count = 0 ;
2011-08-12 18:56:15 +00:00
use_write_locks = false ;
2011-08-16 12:50:38 +00:00
range_query_buff = NULL ;
size_range_query_buff = 0 ;
bytes_used_in_range_query_buff = 0 ;
curr_range_query_buff_offset = 0 ;
doing_bulk_fetch = false ;
prelocked_left_range_size = 0 ;
prelocked_right_range_size = 0 ;
2012-08-23 14:16:01 +00:00
tokudb_active_index = MAX_KEY ;
2013-02-20 20:36:28 +00:00
invalidate_icp ( ) ;
2009-04-17 18:29:25 +00:00
}
2012-03-19 12:15:50 +00:00
ha_tokudb : : ~ ha_tokudb ( ) {
}
2009-04-17 18:29:25 +00:00
//
// states if table has an auto increment column, if so, sets index where auto inc column is to index
// Parameters:
// [out] index - if auto inc exists, then this param is set to where it exists in table, if not, then unchanged
// Returns:
// true if auto inc column exists, false otherwise
//
bool ha_tokudb : : has_auto_increment_flag ( uint * index ) {
//
// check to see if we have auto increment field
//
bool ai_found = false ;
uint ai_index = 0 ;
for ( uint i = 0 ; i < table_share - > fields ; i + + , ai_index + + ) {
Field * field = table - > field [ i ] ;
if ( field - > flags & AUTO_INCREMENT_FLAG ) {
ai_found = true ;
* index = ai_index ;
break ;
}
}
return ai_found ;
}
2012-06-25 18:50:33 +00:00
# define status_dict_pagesize 1024
2012-05-23 17:51:36 +00:00
static int open_status_dictionary ( DB * * ptr , const char * name , DB_TXN * txn ) {
2009-11-10 19:22:08 +00:00
int error ;
char * newname = NULL ;
uint open_mode = DB_THREAD ;
2012-07-25 20:48:53 +00:00
uint32_t pagesize = 0 ;
2009-11-10 19:22:08 +00:00
newname = ( char * ) my_malloc (
get_max_dict_name_path_length ( name ) ,
MYF ( MY_WME )
) ;
if ( newname = = NULL ) {
error = ENOMEM ;
goto cleanup ;
}
make_name ( newname , name , " status " ) ;
if ( tokudb_debug & TOKUDB_DEBUG_OPEN ) {
TOKUDB_TRACE ( " open:%s \n " , newname ) ;
}
error = db_create ( ptr , db_env , 0 ) ;
if ( error ) { goto cleanup ; }
error = ( * ptr ) - > open ( ( * ptr ) , txn , newname , NULL , DB_BTREE , open_mode , 0 ) ;
if ( error ) {
goto cleanup ;
}
2012-06-25 18:50:33 +00:00
error = ( * ptr ) - > get_pagesize ( * ptr , & pagesize ) ;
if ( error ) {
goto cleanup ;
}
if ( pagesize > status_dict_pagesize ) {
error = ( * ptr ) - > change_pagesize ( * ptr , status_dict_pagesize ) ;
if ( error ) { goto cleanup ; }
}
2009-11-10 19:22:08 +00:00
cleanup :
if ( error ) {
if ( * ptr ) {
2009-12-03 15:49:42 +00:00
int r = ( * ptr ) - > close ( * ptr , 0 ) ;
assert ( r = = 0 ) ;
2009-11-10 19:22:08 +00:00
* ptr = NULL ;
}
}
my_free ( newname , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
return error ;
}
2009-12-02 14:02:47 +00:00
int ha_tokudb : : open_main_dictionary ( const char * name , bool is_read_only , DB_TXN * txn ) {
2009-11-10 19:22:08 +00:00
int error ;
char * newname = NULL ;
2009-12-02 14:02:47 +00:00
uint open_flags = ( is_read_only ? DB_RDONLY : 0 ) | DB_THREAD ;
2009-11-10 19:22:08 +00:00
assert ( share - > file = = NULL ) ;
assert ( share - > key_file [ primary_key ] = = NULL ) ;
newname = ( char * ) my_malloc (
get_max_dict_name_path_length ( name ) ,
MYF ( MY_WME | MY_ZEROFILL )
) ;
if ( newname = = NULL ) {
error = ENOMEM ;
goto exit ;
}
make_name ( newname , name , " main " ) ;
error = db_create ( & share - > file , db_env , 0 ) ;
if ( error ) {
goto exit ;
}
share - > key_file [ primary_key ] = share - > file ;
2009-04-17 18:29:25 +00:00
2009-11-10 19:22:08 +00:00
error = share - > file - > open ( share - > file , txn , newname , NULL , DB_BTREE , open_flags , 0 ) ;
if ( error ) {
goto exit ;
}
if ( tokudb_debug & TOKUDB_DEBUG_OPEN ) {
TOKUDB_TRACE ( " open:%s:file=%p \n " , newname , share - > file ) ;
}
2009-12-03 15:39:53 +00:00
error = 0 ;
2009-11-10 19:22:08 +00:00
exit :
if ( error ) {
if ( share - > file ) {
2009-12-03 15:49:42 +00:00
int r = share - > file - > close (
2009-11-10 19:22:08 +00:00
share - > file ,
0
) ;
2009-12-03 15:49:42 +00:00
assert ( r = = 0 ) ;
2009-11-10 19:22:08 +00:00
share - > file = NULL ;
share - > key_file [ primary_key ] = NULL ;
}
}
my_free ( newname , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
return error ;
}
2008-09-17 19:32:10 +00:00
2008-05-26 14:07:31 +00:00
//
// Open a secondary table, the key will be a secondary index, the data will be a primary key
//
2009-12-02 14:02:47 +00:00
int ha_tokudb : : open_secondary_dictionary ( DB * * ptr , KEY * key_info , const char * name , bool is_read_only , DB_TXN * txn ) {
2008-05-26 14:07:31 +00:00
int error = ENOSYS ;
2009-05-07 20:25:14 +00:00
char dict_name [ MAX_DICT_NAME_LEN ] ;
2009-12-02 14:02:47 +00:00
uint open_flags = ( is_read_only ? DB_RDONLY : 0 ) | DB_THREAD ;
2008-10-13 17:50:40 +00:00
char * newname = NULL ;
2009-05-07 20:25:14 +00:00
uint newname_len = 0 ;
sprintf ( dict_name , " key-%s " , key_info - > name ) ;
newname_len = get_max_dict_name_path_length ( name ) ;
newname = ( char * ) my_malloc ( newname_len , MYF ( MY_WME | MY_ZEROFILL ) ) ;
2008-10-13 17:50:40 +00:00
if ( newname = = NULL ) {
error = ENOMEM ;
goto cleanup ;
}
2009-05-07 20:25:14 +00:00
make_name ( newname , name , dict_name ) ;
2008-05-26 14:07:31 +00:00
if ( ( error = db_create ( ptr , db_env , 0 ) ) ) {
my_errno = error ;
goto cleanup ;
}
2009-11-25 21:00:52 +00:00
2008-08-10 16:39:16 +00:00
2009-11-10 19:22:08 +00:00
if ( ( error = ( * ptr ) - > open ( * ptr , txn , newname , NULL , DB_BTREE , open_flags , 0 ) ) ) {
2008-05-26 14:07:31 +00:00
my_errno = error ;
goto cleanup ;
}
if ( tokudb_debug & TOKUDB_DEBUG_OPEN ) {
TOKUDB_TRACE ( " open:%s:file=%p \n " , newname , * ptr ) ;
}
cleanup :
2009-11-10 19:22:08 +00:00
if ( error ) {
if ( * ptr ) {
2009-12-03 15:49:42 +00:00
int r = ( * ptr ) - > close ( * ptr , 0 ) ;
assert ( r = = 0 ) ;
2009-11-10 19:22:08 +00:00
* ptr = NULL ;
}
}
2008-10-13 17:50:40 +00:00
my_free ( newname , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
2008-05-26 14:07:31 +00:00
return error ;
}
2012-05-23 17:51:36 +00:00
static int initialize_col_pack_info ( KEY_AND_COL_INFO * kc_info , TABLE_SHARE * table_share , uint keynr ) {
2009-04-17 18:29:25 +00:00
int error = ENOSYS ;
//
// set up the cp_info
//
2010-01-11 18:14:37 +00:00
assert ( kc_info - > cp_info [ keynr ] = = NULL ) ;
kc_info - > cp_info [ keynr ] = ( COL_PACK_INFO * ) my_malloc (
2009-04-17 18:29:25 +00:00
table_share - > fields * sizeof ( COL_PACK_INFO ) ,
MYF ( MY_WME | MY_ZEROFILL )
) ;
2010-01-11 18:14:37 +00:00
if ( kc_info - > cp_info [ keynr ] = = NULL ) {
2009-04-17 18:29:25 +00:00
error = ENOMEM ;
goto exit ;
}
{
2012-07-25 20:48:53 +00:00
uint32_t curr_fixed_offset = 0 ;
uint32_t curr_var_index = 0 ;
2009-04-17 18:29:25 +00:00
for ( uint j = 0 ; j < table_share - > fields ; j + + ) {
2010-01-11 18:14:37 +00:00
COL_PACK_INFO * curr = & kc_info - > cp_info [ keynr ] [ j ] ;
2009-04-17 18:29:25 +00:00
//
// need to set the offsets / indexes
// offsets are calculated AFTER the NULL bytes
//
2010-01-11 18:14:37 +00:00
if ( ! bitmap_is_set ( & kc_info - > key_filters [ keynr ] , j ) ) {
if ( kc_info - > field_lengths [ j ] ) {
2009-04-17 18:29:25 +00:00
curr - > col_pack_val = curr_fixed_offset ;
2010-01-11 18:14:37 +00:00
curr_fixed_offset + = kc_info - > field_lengths [ j ] ;
2009-04-17 18:29:25 +00:00
}
2010-01-11 18:14:37 +00:00
else if ( kc_info - > length_bytes [ j ] ) {
2009-04-17 18:29:25 +00:00
curr - > col_pack_val = curr_var_index ;
curr_var_index + + ;
}
}
}
//
// set up the mcp_info
//
2011-03-04 19:54:23 +00:00
kc_info - > mcp_info [ keynr ] . fixed_field_size = get_fixed_field_size (
2010-01-11 18:14:37 +00:00
kc_info ,
2009-04-17 18:29:25 +00:00
table_share ,
keynr
) ;
2010-01-11 18:14:37 +00:00
kc_info - > mcp_info [ keynr ] . len_of_offsets = get_len_of_offsets (
kc_info ,
2009-04-17 18:29:25 +00:00
table_share ,
keynr
) ;
error = 0 ;
}
exit :
return error ;
}
2010-12-17 15:47:52 +00:00
// reset the kc_info state at keynr
static void reset_key_and_col_info ( KEY_AND_COL_INFO * kc_info , uint keynr ) {
bitmap_clear_all ( & kc_info - > key_filters [ keynr ] ) ;
my_free ( kc_info - > cp_info [ keynr ] , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
kc_info - > cp_info [ keynr ] = NULL ;
kc_info - > mcp_info [ keynr ] = ( MULTI_COL_PACK_INFO ) { 0 , 0 } ;
}
2012-05-23 17:51:36 +00:00
static int initialize_key_and_col_info ( TABLE_SHARE * table_share , TABLE * table , KEY_AND_COL_INFO * kc_info , uint hidden_primary_key , uint primary_key ) {
2010-03-25 13:30:54 +00:00
int error = 0 ;
2012-07-25 20:48:53 +00:00
uint32_t curr_blob_field_index = 0 ;
uint32_t max_var_bytes = 0 ;
2009-04-17 18:29:25 +00:00
//
// fill in the field lengths. 0 means it is a variable sized field length
// fill in length_bytes, 0 means it is fixed or blob
//
for ( uint i = 0 ; i < table_share - > fields ; i + + ) {
Field * field = table_share - > field [ i ] ;
TOKU_TYPE toku_type = mysql_to_toku_type ( field ) ;
uint32 pack_length = 0 ;
switch ( toku_type ) {
case toku_type_int :
case toku_type_double :
case toku_type_float :
case toku_type_fixbinary :
case toku_type_fixstring :
pack_length = field - > pack_length ( ) ;
2010-02-18 15:57:15 +00:00
assert ( pack_length < 1 < < 16 ) ;
2012-07-25 20:48:53 +00:00
kc_info - > field_lengths [ i ] = ( uint16_t ) pack_length ;
2010-01-11 18:14:37 +00:00
kc_info - > length_bytes [ i ] = 0 ;
2009-04-17 18:29:25 +00:00
break ;
case toku_type_blob :
2010-01-11 18:14:37 +00:00
kc_info - > field_lengths [ i ] = 0 ;
kc_info - > length_bytes [ i ] = 0 ;
kc_info - > blob_fields [ curr_blob_field_index ] = i ;
2009-04-17 18:29:25 +00:00
curr_blob_field_index + + ;
break ;
case toku_type_varstring :
case toku_type_varbinary :
//
// meaning it is variable sized
//
2010-01-11 18:14:37 +00:00
kc_info - > field_lengths [ i ] = 0 ;
kc_info - > length_bytes [ i ] = ( uchar ) ( ( Field_varstring * ) field ) - > length_bytes ;
2009-04-18 21:07:54 +00:00
max_var_bytes + = field - > field_length ;
2009-04-17 18:29:25 +00:00
break ;
default :
assert ( false ) ;
}
}
2010-01-11 18:14:37 +00:00
kc_info - > num_blobs = curr_blob_field_index ;
2009-04-17 18:29:25 +00:00
2009-04-18 21:07:54 +00:00
//
// initialize share->num_offset_bytes
// because MAX_REF_LENGTH is 65536, we
// can safely set num_offset_bytes to 1 or 2
//
if ( max_var_bytes < 256 ) {
2010-01-11 18:14:37 +00:00
kc_info - > num_offset_bytes = 1 ;
2009-04-18 21:07:54 +00:00
}
else {
2010-01-11 18:14:37 +00:00
kc_info - > num_offset_bytes = 2 ;
2009-04-18 21:07:54 +00:00
}
2009-04-17 18:29:25 +00:00
for ( uint i = 0 ; i < table_share - > keys + test ( hidden_primary_key ) ; i + + ) {
//
// do the cluster/primary key filtering calculations
//
if ( ! ( i = = primary_key & & hidden_primary_key ) ) {
if ( i = = primary_key ) {
set_key_filter (
2010-01-11 18:14:37 +00:00
& kc_info - > key_filters [ primary_key ] ,
2009-04-17 18:29:25 +00:00
& table_share - > key_info [ primary_key ] ,
table ,
true
) ;
}
2010-05-06 04:19:11 +00:00
else {
2009-04-17 18:29:25 +00:00
set_key_filter (
2010-01-11 18:14:37 +00:00
& kc_info - > key_filters [ i ] ,
2009-04-17 18:29:25 +00:00
& table_share - > key_info [ i ] ,
table ,
true
) ;
if ( ! hidden_primary_key ) {
set_key_filter (
2010-01-11 18:14:37 +00:00
& kc_info - > key_filters [ i ] ,
2009-04-17 18:29:25 +00:00
& table_share - > key_info [ primary_key ] ,
table ,
true
) ;
}
}
}
if ( i = = primary_key | | table_share - > key_info [ i ] . flags & HA_CLUSTERING ) {
2010-01-11 18:14:37 +00:00
error = initialize_col_pack_info ( kc_info , table_share , i ) ;
2009-04-17 18:29:25 +00:00
if ( error ) {
goto exit ;
}
}
}
2010-01-11 18:14:37 +00:00
exit :
return error ;
}
2009-04-17 18:29:25 +00:00
2010-05-06 04:19:11 +00:00
bool ha_tokudb : : can_replace_into_be_fast ( TABLE_SHARE * table_share , KEY_AND_COL_INFO * kc_info , uint pk ) {
uint curr_num_DBs = table_share - > keys + test ( hidden_primary_key ) ;
2010-05-07 22:18:37 +00:00
bool ret_val ;
if ( curr_num_DBs = = 1 ) {
ret_val = true ;
goto exit ;
}
ret_val = true ;
2010-05-06 04:19:11 +00:00
for ( uint curr_index = 0 ; curr_index < table_share - > keys ; curr_index + + ) {
if ( curr_index = = pk ) continue ;
KEY * curr_key_info = & table_share - > key_info [ curr_index ] ;
2012-12-12 18:37:24 +00:00
for ( uint i = 0 ; i < get_key_parts ( curr_key_info ) ; i + + ) {
2010-05-06 04:19:11 +00:00
uint16 curr_field_index = curr_key_info - > key_part [ i ] . field - > field_index ;
if ( ! bitmap_is_set ( & kc_info - > key_filters [ curr_index ] , curr_field_index ) ) {
ret_val = false ;
goto exit ;
}
if ( bitmap_is_set ( & kc_info - > key_filters [ curr_index ] , curr_field_index ) & &
! bitmap_is_set ( & kc_info - > key_filters [ pk ] , curr_field_index ) ) {
ret_val = false ;
goto exit ;
}
}
2010-05-13 14:59:29 +00:00
}
2010-05-06 04:19:11 +00:00
exit :
return ret_val ;
}
2010-01-11 18:14:37 +00:00
int ha_tokudb : : initialize_share (
const char * name ,
int mode
)
{
int error = 0 ;
2012-07-25 20:48:53 +00:00
uint64_t num_rows = 0 ;
2010-01-11 18:14:37 +00:00
bool table_exists ;
2011-09-06 18:42:31 +00:00
DB_TXN * txn = NULL ;
bool do_commit = false ;
2011-09-07 15:43:50 +00:00
THD * thd = ha_thd ( ) ;
2011-09-06 18:42:31 +00:00
tokudb_trx_data * trx = NULL ;
trx = ( tokudb_trx_data * ) thd_data_get ( ha_thd ( ) , tokudb_hton - > slot ) ;
2011-09-07 15:43:50 +00:00
if ( thd_sql_command ( thd ) = = SQLCOM_CREATE_TABLE & & trx & & trx - > sub_sp_level ) {
2011-09-06 18:42:31 +00:00
txn = trx - > sub_sp_level ;
}
else {
do_commit = true ;
error = db_env - > txn_begin ( db_env , 0 , & txn , 0 ) ;
if ( error ) { goto exit ; }
}
2010-01-11 18:14:37 +00:00
DBUG_PRINT ( " info " , ( " share->use_count %u " , share - > use_count ) ) ;
table_exists = true ;
2011-09-06 18:42:31 +00:00
error = check_table_in_metadata ( name , & table_exists , txn ) ;
2010-01-11 18:14:37 +00:00
if ( error ) {
goto exit ;
}
if ( ! table_exists ) {
sql_print_error ( " table %s does not exist in metadata, was it moved from someplace else? Not opening table " , name ) ;
error = HA_ADMIN_FAILED ;
goto exit ;
}
2011-04-21 00:53:18 +00:00
2011-09-06 18:42:31 +00:00
error = get_status ( txn ) ;
2011-04-21 00:53:18 +00:00
if ( error ) {
goto exit ;
}
2011-05-03 16:04:15 +00:00
if ( share - > version ! = HA_TOKU_VERSION ) {
2011-04-21 00:53:18 +00:00
error = ENOSYS ;
goto exit ;
}
2012-12-18 20:14:09 +00:00
# if TOKU_PARTITION_WRITE_FRM_DATA
// verify frm data for all tables
error = verify_frm_data ( table - > s - > path . str , txn ) ;
if ( error )
goto exit ;
# else
// verify frm data for non-partitioned tables
if ( table - > part_info = = NULL ) {
2011-09-06 18:42:31 +00:00
error = verify_frm_data ( table - > s - > path . str , txn ) ;
2012-09-20 13:34:32 +00:00
if ( error )
2011-04-21 00:53:18 +00:00
goto exit ;
2012-09-20 13:34:32 +00:00
} else {
2012-12-18 20:14:09 +00:00
// remove the frm data for partitions since we are not maintaining it
error = remove_frm_data ( share - > status_block , txn ) ;
if ( error )
goto exit ;
2011-04-21 00:53:18 +00:00
}
2012-12-18 20:14:09 +00:00
# endif
2012-09-20 13:34:32 +00:00
2010-01-11 18:14:37 +00:00
error = initialize_key_and_col_info (
table_share ,
table ,
& share - > kc_info ,
hidden_primary_key ,
primary_key
) ;
2009-11-10 19:22:08 +00:00
if ( error ) { goto exit ; }
2009-04-17 18:29:25 +00:00
2011-09-06 18:42:31 +00:00
error = open_main_dictionary ( name , mode = = O_RDONLY , txn ) ;
2010-01-11 18:14:37 +00:00
if ( error ) { goto exit ; }
share - > has_unique_keys = false ;
2009-04-17 18:29:25 +00:00
/* Open other keys; These are part of the share structure */
2012-04-19 14:51:34 +00:00
for ( uint i = 0 ; i < table_share - > keys ; i + + ) {
2010-01-11 18:14:37 +00:00
if ( table_share - > key_info [ i ] . flags & HA_NOSAME ) {
share - > has_unique_keys = true ;
}
2009-04-17 18:29:25 +00:00
if ( i ! = primary_key ) {
2009-11-10 19:22:08 +00:00
error = open_secondary_dictionary (
2009-04-17 18:29:25 +00:00
& share - > key_file [ i ] ,
& table_share - > key_info [ i ] ,
name ,
2009-12-02 14:02:47 +00:00
mode = = O_RDONLY ,
2011-09-06 18:42:31 +00:00
txn
2009-04-17 18:29:25 +00:00
) ;
if ( error ) {
goto exit ;
}
}
}
2010-05-06 04:19:11 +00:00
share - > replace_into_fast = can_replace_into_be_fast (
table_share ,
& share - > kc_info ,
primary_key
) ;
2009-04-17 18:29:25 +00:00
if ( ! hidden_primary_key ) {
//
// We need to set the ref_length to start at 5, to account for
// the "infinity byte" in keys, and for placing the DBT size in the first four bytes
//
2012-07-25 20:48:53 +00:00
ref_length = sizeof ( uint32_t ) + sizeof ( uchar ) ;
2009-04-17 18:29:25 +00:00
KEY_PART_INFO * key_part = table - > key_info [ primary_key ] . key_part ;
2012-12-12 18:37:24 +00:00
KEY_PART_INFO * end = key_part + get_key_parts ( & table - > key_info [ primary_key ] ) ;
2009-04-17 18:29:25 +00:00
for ( ; key_part ! = end ; key_part + + ) {
ref_length + = key_part - > field - > max_packed_col_length ( key_part - > length ) ;
}
share - > status | = STATUS_PRIMARY_KEY_INIT ;
}
share - > ref_length = ref_length ;
2011-09-06 18:42:31 +00:00
error = estimate_num_rows ( share - > file , & num_rows , txn ) ;
2009-04-17 18:29:25 +00:00
//
// estimate_num_rows should not fail under normal conditions
//
if ( error = = 0 ) {
share - > rows = num_rows ;
}
else {
goto exit ;
}
//
// initialize auto increment data
//
share - > has_auto_inc = has_auto_increment_flag ( & share - > ai_field_index ) ;
if ( share - > has_auto_inc ) {
init_auto_increment ( ) ;
}
2011-10-05 21:55:09 +00:00
if ( may_table_be_empty ( NULL ) ) {
2009-09-11 18:34:16 +00:00
share - > try_table_lock = true ;
}
else {
share - > try_table_lock = false ;
}
2010-11-17 23:09:06 +00:00
share - > num_DBs = table_share - > keys + test ( hidden_primary_key ) ;
2009-04-17 18:29:25 +00:00
error = 0 ;
exit :
2011-09-06 18:42:31 +00:00
if ( do_commit & & txn ) {
commit_txn ( txn , 0 ) ;
}
2009-04-17 18:29:25 +00:00
return error ;
}
2008-05-26 14:07:31 +00:00
2008-04-17 20:56:40 +00:00
//
// Creates and opens a handle to a table which already exists in a tokudb
// database.
// Parameters:
// [in] name - table name
// mode - seems to specify if table is read only
// test_if_locked - unused
// Returns:
// 0 on success
// 1 on error
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : open ( const char * name , int mode , uint test_if_locked ) {
2008-04-17 11:12:01 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::open %p %s " , this , name ) ;
2011-08-16 12:50:38 +00:00
THD * thd = ha_thd ( ) ;
2008-02-07 20:19:44 +00:00
2009-04-17 18:29:25 +00:00
int error = 0 ;
int ret_val = 0 ;
2010-11-08 21:09:28 +00:00
uint curr_num_DBs = 0 ;
2008-02-07 20:19:44 +00:00
2008-07-04 02:24:49 +00:00
transaction = NULL ;
cursor = NULL ;
2008-10-13 19:01:14 +00:00
2008-02-07 20:19:44 +00:00
/* Open primary key */
hidden_primary_key = 0 ;
if ( ( primary_key = table_share - > primary_key ) > = MAX_KEY ) {
// No primary key
primary_key = table_share - > keys ;
key_used_on_scan = MAX_KEY ;
2009-04-08 17:54:52 +00:00
hidden_primary_key = TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH ;
2012-07-25 20:48:53 +00:00
ref_length = TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH + sizeof ( uint32_t ) ;
2009-04-17 18:29:25 +00:00
}
2008-10-13 19:01:14 +00:00
else {
2008-02-07 20:19:44 +00:00
key_used_on_scan = primary_key ;
2008-10-13 19:01:14 +00:00
}
2010-11-08 21:09:28 +00:00
curr_num_DBs = table_share - > keys + test ( hidden_primary_key ) ;
2009-04-17 18:29:25 +00:00
2008-02-07 20:19:44 +00:00
/* Need some extra memory in case of packed keys */
2008-09-17 19:01:39 +00:00
// the "+ 1" is for the first byte that states +/- infinity
2008-11-03 20:42:59 +00:00
// multiply everything by 2 to account for clustered keys having a key and primary key together
max_key_length = 2 * ( table_share - > max_key_length + MAX_REF_PARTS * 3 + sizeof ( uchar ) ) ;
2009-04-17 18:29:25 +00:00
alloc_ptr = my_multi_malloc ( MYF ( MY_WME ) ,
& key_buff , max_key_length ,
& key_buff2 , max_key_length ,
2009-04-20 16:56:22 +00:00
& key_buff3 , max_key_length ,
2011-08-16 12:50:38 +00:00
& prelocked_left_range , max_key_length ,
& prelocked_right_range , max_key_length ,
2009-04-17 18:29:25 +00:00
& primary_key_buff , ( hidden_primary_key ? 0 : max_key_length ) ,
2012-07-25 20:48:53 +00:00
& fixed_cols_for_query , table_share - > fields * sizeof ( uint32_t ) ,
& var_cols_for_query , table_share - > fields * sizeof ( uint32_t ) ,
2009-04-17 18:29:25 +00:00
NullS
) ;
if ( alloc_ptr = = NULL ) {
ret_val = 1 ;
goto exit ;
2008-02-07 20:19:44 +00:00
}
2011-08-16 12:50:38 +00:00
size_range_query_buff = get_tokudb_read_buf_size ( thd ) ;
range_query_buff = ( uchar * ) my_malloc ( size_range_query_buff , MYF ( MY_WME ) ) ;
if ( range_query_buff = = NULL ) {
ret_val = 1 ;
goto exit ;
}
2009-04-17 18:29:25 +00:00
alloced_rec_buff_length = table_share - > rec_buff_length + table_share - > fields ;
2010-01-21 19:24:11 +00:00
rec_buff = ( uchar * ) my_malloc ( alloced_rec_buff_length , MYF ( MY_WME ) ) ;
2009-04-17 18:29:25 +00:00
if ( rec_buff = = NULL ) {
ret_val = 1 ;
goto exit ;
2008-02-07 20:19:44 +00:00
}
2009-04-17 18:29:25 +00:00
2010-11-10 21:34:29 +00:00
alloced_update_rec_buff_length = alloced_rec_buff_length ;
rec_update_buff = ( uchar * ) my_malloc ( alloced_update_rec_buff_length , MYF ( MY_WME ) ) ;
if ( rec_update_buff = = NULL ) {
ret_val = 1 ;
goto exit ;
}
2012-07-25 20:48:53 +00:00
for ( uint32_t i = 0 ; i < sizeof ( mult_key_dbt ) / sizeof ( mult_key_dbt [ 0 ] ) ; i + + ) {
2011-09-08 02:55:20 +00:00
mult_key_dbt [ i ] . flags = DB_DBT_REALLOC ;
2010-11-10 21:34:29 +00:00
}
2012-07-25 20:48:53 +00:00
for ( uint32_t i = 0 ; i < curr_num_DBs ; i + + ) {
2011-09-08 02:55:20 +00:00
mult_rec_dbt [ i ] . flags = DB_DBT_REALLOC ;
2010-01-11 18:14:37 +00:00
}
2009-04-17 18:29:25 +00:00
/* Init shared structure */
share = get_share ( name , table_share ) ;
if ( share = = NULL ) {
ret_val = 1 ;
goto exit ;
2008-05-29 18:22:48 +00:00
}
2008-02-07 20:19:44 +00:00
thr_lock_data_init ( & share - > lock , & lock , NULL ) ;
/* Fill in shared structure, if needed */
pthread_mutex_lock ( & share - > mutex ) ;
2008-10-13 17:50:40 +00:00
if ( tokudb_debug & TOKUDB_DEBUG_OPEN ) {
2008-04-24 17:30:05 +00:00
TOKUDB_TRACE ( " tokudbopen:%p:share=%p:file=%p:table=%p:table->s=%p:%d \n " ,
this , share , share - > file , table , table - > s , share - > use_count ) ;
2008-10-13 17:50:40 +00:00
}
2008-02-07 20:19:44 +00:00
if ( ! share - > use_count + + ) {
2009-04-17 18:29:25 +00:00
ret_val = initialize_share (
name ,
mode
) ;
if ( ret_val ) {
2009-04-02 15:24:14 +00:00
free_share ( share , 1 ) ;
2010-01-11 18:14:37 +00:00
goto exit ;
2008-08-18 18:35:32 +00:00
}
2008-02-07 20:19:44 +00:00
}
ref_length = share - > ref_length ; // If second open
pthread_mutex_unlock ( & share - > mutex ) ;
2008-04-18 19:54:14 +00:00
key_read = false ;
2008-02-12 20:26:48 +00:00
stats . block_size = 1 < < 20 ; // QQQ Tokudb DB block size
2008-02-07 20:19:44 +00:00
2008-07-04 15:07:07 +00:00
init_hidden_prim_key_info ( ) ;
2008-02-07 20:19:44 +00:00
info ( HA_STATUS_NO_LOCK | HA_STATUS_VARIABLE | HA_STATUS_CONST ) ;
2009-04-17 18:29:25 +00:00
exit :
if ( ret_val ) {
2011-08-16 12:50:38 +00:00
my_free ( range_query_buff , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
range_query_buff = NULL ;
2009-04-17 18:29:25 +00:00
my_free ( alloc_ptr , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
alloc_ptr = NULL ;
my_free ( rec_buff , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
rec_buff = NULL ;
2010-11-10 21:34:29 +00:00
my_free ( rec_update_buff , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
rec_update_buff = NULL ;
2010-01-11 18:14:37 +00:00
2009-04-17 18:29:25 +00:00
if ( error ) {
my_errno = error ;
}
}
TOKUDB_DBUG_RETURN ( ret_val ) ;
2008-02-07 20:19:44 +00:00
}
2008-07-03 16:30:01 +00:00
//
// estimate the number of rows in a DB
// Parameters:
// [in] db - DB whose number of rows will be estimated
// [out] num_rows - number of estimated rows in db
// Returns:
// 0 on success
// error otherwise
//
2012-07-25 20:48:53 +00:00
int ha_tokudb : : estimate_num_rows ( DB * db , uint64_t * num_rows , DB_TXN * txn ) {
2008-07-03 16:30:01 +00:00
int error = ENOSYS ;
DBC * crsr = NULL ;
bool do_commit = false ;
2011-07-07 17:57:46 +00:00
DB_BTREE_STAT64 dict_stats ;
2010-03-06 00:58:21 +00:00
DB_TXN * txn_to_use = NULL ;
2008-07-03 16:30:01 +00:00
2010-03-06 00:58:21 +00:00
if ( txn = = NULL ) {
error = db_env - > txn_begin ( db_env , 0 , & txn_to_use , DB_READ_UNCOMMITTED ) ;
2008-07-03 16:30:01 +00:00
if ( error ) goto cleanup ;
do_commit = true ;
}
2010-03-06 00:58:21 +00:00
else {
txn_to_use = txn ;
}
2008-07-03 16:30:01 +00:00
2011-07-07 17:57:46 +00:00
error = db - > stat64 (
share - > file ,
2010-03-06 00:58:21 +00:00
txn_to_use ,
2011-07-07 17:57:46 +00:00
& dict_stats
2008-07-03 16:30:01 +00:00
) ;
2011-07-07 17:57:46 +00:00
if ( error ) { goto cleanup ; }
2008-07-03 16:30:01 +00:00
2011-07-07 17:57:46 +00:00
* num_rows = dict_stats . bt_ndata ;
2008-07-03 16:30:01 +00:00
error = 0 ;
cleanup :
2008-07-14 17:27:10 +00:00
if ( crsr ! = NULL ) {
2009-12-03 16:59:52 +00:00
int r = crsr - > c_close ( crsr ) ;
assert ( r = = 0 ) ;
2008-07-14 17:27:10 +00:00
crsr = NULL ;
}
2009-08-04 14:20:12 +00:00
if ( do_commit ) {
2010-03-06 00:58:21 +00:00
commit_txn ( txn_to_use , 0 ) ;
txn_to_use = NULL ;
2009-08-04 14:20:12 +00:00
}
2008-07-03 16:30:01 +00:00
return error ;
}
2009-10-26 20:09:07 +00:00
2009-11-10 19:22:08 +00:00
int ha_tokudb : : write_to_status ( DB * db , HA_METADATA_KEY curr_key_data , void * data , uint size , DB_TXN * txn ) {
2012-04-02 18:27:34 +00:00
return write_metadata ( db , & curr_key_data , sizeof curr_key_data , data , size , txn ) ;
2009-11-10 19:22:08 +00:00
}
2012-04-02 18:27:34 +00:00
int ha_tokudb : : remove_from_status ( DB * db , HA_METADATA_KEY curr_key_data , DB_TXN * txn ) {
return remove_metadata ( db , & curr_key_data , sizeof curr_key_data , txn ) ;
}
2009-11-10 19:22:08 +00:00
int ha_tokudb : : remove_metadata ( DB * db , void * key_data , uint key_size , DB_TXN * transaction ) {
int error ;
DBT key ;
DB_TXN * txn = NULL ;
bool do_commit = false ;
//
// transaction to be used for putting metadata into status.tokudb
//
if ( transaction = = NULL ) {
error = db_env - > txn_begin ( db_env , 0 , & txn , 0 ) ;
if ( error ) {
goto cleanup ;
}
do_commit = true ;
}
else {
txn = transaction ;
}
2012-05-09 18:36:52 +00:00
memset ( & key , 0 , sizeof ( key ) ) ;
2009-11-10 19:22:08 +00:00
key . data = key_data ;
key . size = key_size ;
error = db - > del ( db , txn , & key , DB_DELETE_ANY ) ;
if ( error ) {
goto cleanup ;
}
error = 0 ;
cleanup :
if ( do_commit & & txn ) {
if ( ! error ) {
commit_txn ( txn , DB_TXN_NOSYNC ) ;
}
else {
abort_txn ( txn ) ;
}
}
return error ;
2009-10-26 20:09:07 +00:00
}
2008-08-18 18:35:32 +00:00
//
// helper function to write a piece of metadata in to status.tokudb
//
2009-11-10 19:22:08 +00:00
int ha_tokudb : : write_metadata ( DB * db , void * key_data , uint key_size , void * val_data , uint val_size , DB_TXN * transaction ) {
2008-08-18 18:35:32 +00:00
int error ;
DBT key ;
DBT value ;
DB_TXN * txn = NULL ;
2009-11-10 19:22:08 +00:00
bool do_commit = false ;
2008-08-18 18:35:32 +00:00
//
// transaction to be used for putting metadata into status.tokudb
//
2009-11-10 19:22:08 +00:00
if ( transaction = = NULL ) {
error = db_env - > txn_begin ( db_env , 0 , & txn , 0 ) ;
if ( error ) {
goto cleanup ;
}
do_commit = true ;
}
else {
txn = transaction ;
2008-08-18 18:35:32 +00:00
}
2012-05-09 18:36:52 +00:00
memset ( & key , 0 , sizeof ( key ) ) ;
memset ( & value , 0 , sizeof ( value ) ) ;
2009-10-26 20:09:07 +00:00
key . data = key_data ;
key . size = key_size ;
value . data = val_data ;
value . size = val_size ;
2008-08-18 18:35:32 +00:00
error = db - > put ( db , txn , & key , & value , 0 ) ;
if ( error ) {
goto cleanup ;
}
error = 0 ;
cleanup :
2009-11-10 19:22:08 +00:00
if ( do_commit & & txn ) {
2008-08-18 18:35:32 +00:00
if ( ! error ) {
2009-11-10 19:22:08 +00:00
commit_txn ( txn , DB_TXN_NOSYNC ) ;
2008-08-18 18:35:32 +00:00
}
else {
2009-11-10 19:22:08 +00:00
abort_txn ( txn ) ;
2008-08-18 18:35:32 +00:00
}
}
return error ;
}
2011-04-21 00:53:18 +00:00
int ha_tokudb : : write_frm_data ( DB * db , DB_TXN * txn , const char * frm_name ) {
2012-08-14 21:24:38 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::write_frm_data %p %p %p %s " , this , db , txn , frm_name ) ;
2012-04-02 18:27:34 +00:00
2011-04-21 00:53:18 +00:00
uchar * frm_data = NULL ;
size_t frm_len = 0 ;
int error = 0 ;
error = readfrm ( frm_name , & frm_data , & frm_len ) ;
if ( error ) { goto cleanup ; }
error = write_to_status ( db , hatoku_frm_data , frm_data , ( uint ) frm_len , txn ) ;
if ( error ) { goto cleanup ; }
error = 0 ;
cleanup :
my_free ( frm_data , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
TOKUDB_DBUG_RETURN ( error ) ;
}
2012-04-02 18:27:34 +00:00
int ha_tokudb : : remove_frm_data ( DB * db , DB_TXN * txn ) {
return remove_from_status ( db , hatoku_frm_data , txn ) ;
}
2011-04-21 01:25:50 +00:00
static int
smart_dbt_callback_verify_frm ( DBT const * key , DBT const * row , void * context ) {
DBT * stored_frm = ( DBT * ) context ;
stored_frm - > size = row - > size ;
2011-05-02 14:57:14 +00:00
stored_frm - > data = ( uchar * ) my_malloc ( row - > size , MYF ( MY_WME ) ) ;
assert ( stored_frm - > data ) ;
memcpy ( stored_frm - > data , row - > data , row - > size ) ;
2011-04-21 01:25:50 +00:00
return 0 ;
}
2011-09-06 18:42:31 +00:00
int ha_tokudb : : verify_frm_data ( const char * frm_name , DB_TXN * txn ) {
2012-04-02 18:27:34 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::verify_frm_data %s " , frm_name ) ;
2011-04-21 00:53:18 +00:00
uchar * mysql_frm_data = NULL ;
size_t mysql_frm_len = 0 ;
2011-04-21 01:25:50 +00:00
DBT key , stored_frm ;
2011-04-21 00:53:18 +00:00
int error = 0 ;
HA_METADATA_KEY curr_key = hatoku_frm_data ;
2012-05-09 18:36:52 +00:00
memset ( & key , 0 , sizeof ( key ) ) ;
memset ( & stored_frm , 0 , sizeof ( & stored_frm ) ) ;
2011-04-21 00:53:18 +00:00
// get the frm data from MySQL
error = readfrm ( frm_name , & mysql_frm_data , & mysql_frm_len ) ;
if ( error ) { goto cleanup ; }
key . data = & curr_key ;
key . size = sizeof ( curr_key ) ;
2011-04-21 01:25:50 +00:00
error = share - > status_block - > getf_set (
2011-04-21 00:53:18 +00:00
share - > status_block ,
2011-04-21 01:25:50 +00:00
txn ,
0 ,
2011-04-21 00:53:18 +00:00
& key ,
2011-04-21 01:25:50 +00:00
smart_dbt_callback_verify_frm ,
& stored_frm
2011-04-21 00:53:18 +00:00
) ;
if ( error = = DB_NOTFOUND ) {
// if not found, write it
error = write_frm_data (
share - > status_block ,
txn ,
frm_name
) ;
goto cleanup ;
}
else if ( error ) {
goto cleanup ;
}
2011-04-21 01:25:50 +00:00
if ( stored_frm . size ! = mysql_frm_len | |
memcmp ( stored_frm . data , mysql_frm_data , stored_frm . size ) )
2011-04-21 00:53:18 +00:00
{
error = HA_ERR_TABLE_DEF_CHANGED ;
goto cleanup ;
}
2008-08-18 18:35:32 +00:00
2011-04-21 00:53:18 +00:00
error = 0 ;
cleanup :
my_free ( mysql_frm_data , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
2011-05-02 14:57:14 +00:00
my_free ( stored_frm . data , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
2011-04-21 00:53:18 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
}
2008-08-18 18:35:32 +00:00
//
// Updates status.tokudb with a new max value used for the auto increment column
// Parameters:
// [in] db - this will always be status.tokudb
// val - value to store
// Returns:
// 0 on success, error otherwise
//
//
int ha_tokudb : : update_max_auto_inc ( DB * db , ulonglong val ) {
2009-11-10 19:22:08 +00:00
return write_to_status ( db , hatoku_max_ai , & val , sizeof ( val ) , NULL ) ;
2008-08-18 18:35:32 +00:00
}
//
// Writes the initial auto increment value, as specified by create table
// so if a user does "create table t1 (a int auto_increment, primary key (a)) auto_increment=100",
// then the value 100 will be stored here in val
// Parameters:
// [in] db - this will always be status.tokudb
// val - value to store
// Returns:
// 0 on success, error otherwise
//
//
2009-11-10 19:22:08 +00:00
int ha_tokudb : : write_auto_inc_create ( DB * db , ulonglong val , DB_TXN * txn ) {
return write_to_status ( db , hatoku_ai_create_value , & val , sizeof ( val ) , txn ) ;
2008-08-18 18:35:32 +00:00
}
2008-07-03 16:30:01 +00:00
2008-04-17 20:56:40 +00:00
//
// Closes a handle to a table.
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : close ( void ) {
2008-04-17 11:12:01 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::close %p " , this ) ;
2008-03-21 23:47:22 +00:00
TOKUDB_DBUG_RETURN ( __close ( 0 ) ) ;
2008-02-07 20:19:44 +00:00
}
int ha_tokudb : : __close ( int mutex_is_locked ) {
2008-04-17 11:12:01 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::__close %p " , this ) ;
2008-03-20 16:13:43 +00:00
if ( tokudb_debug & TOKUDB_DEBUG_OPEN )
2008-04-24 17:30:05 +00:00
TOKUDB_TRACE ( " close:%p \n " , this ) ;
2008-02-07 20:19:44 +00:00
my_free ( rec_buff , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
2010-11-10 21:34:29 +00:00
my_free ( rec_update_buff , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
2009-06-10 18:52:24 +00:00
my_free ( blob_buff , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
2008-02-07 20:19:44 +00:00
my_free ( alloc_ptr , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
2011-08-16 12:50:38 +00:00
my_free ( range_query_buff , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
2012-07-25 20:48:53 +00:00
for ( uint32_t i = 0 ; i < sizeof ( mult_rec_dbt ) / sizeof ( mult_rec_dbt [ 0 ] ) ; i + + ) {
2011-09-30 14:16:40 +00:00
if ( mult_rec_dbt [ i ] . flags = = DB_DBT_REALLOC & &
mult_rec_dbt [ i ] . data ! = NULL ) {
free ( mult_rec_dbt [ i ] . data ) ;
}
2010-11-10 21:34:29 +00:00
}
2012-07-25 20:48:53 +00:00
for ( uint32_t i = 0 ; i < sizeof ( mult_key_dbt ) / sizeof ( mult_key_dbt [ 0 ] ) ; i + + ) {
2011-09-30 14:16:40 +00:00
if ( mult_key_dbt [ i ] . flags = = DB_DBT_REALLOC & &
mult_key_dbt [ i ] . data ! = NULL ) {
free ( mult_key_dbt [ i ] . data ) ;
}
2010-01-11 18:14:37 +00:00
}
2008-12-02 18:09:53 +00:00
rec_buff = NULL ;
2010-11-10 21:34:29 +00:00
rec_update_buff = NULL ;
2008-12-02 18:09:53 +00:00
alloc_ptr = NULL ;
2009-08-06 15:59:37 +00:00
ha_tokudb : : reset ( ) ;
2009-04-02 15:24:14 +00:00
TOKUDB_DBUG_RETURN ( free_share ( share , mutex_is_locked ) ) ;
2008-02-05 16:00:53 +00:00
}
2008-04-21 18:19:07 +00:00
//
// Reallocate record buffer (rec_buff) if needed
// If not needed, does nothing
// Parameters:
// length - size of buffer required for rec_buff
//
2008-02-07 20:19:44 +00:00
bool ha_tokudb : : fix_rec_buff_for_blob ( ulong length ) {
2010-01-11 18:14:37 +00:00
if ( ! rec_buff | | ( length > alloced_rec_buff_length ) ) {
2008-02-07 20:19:44 +00:00
uchar * newptr ;
2010-01-21 19:24:11 +00:00
if ( ! ( newptr = ( uchar * ) my_realloc ( ( void * ) rec_buff , length , MYF ( MY_ALLOW_ZERO_PTR ) ) ) )
2008-02-07 20:19:44 +00:00
return 1 ;
rec_buff = newptr ;
alloced_rec_buff_length = length ;
}
return 0 ;
2008-02-05 16:00:53 +00:00
}
2010-11-10 21:34:29 +00:00
//
// Reallocate record buffer (rec_buff) if needed
// If not needed, does nothing
// Parameters:
// length - size of buffer required for rec_buff
//
bool ha_tokudb : : fix_rec_update_buff_for_blob ( ulong length ) {
if ( ! rec_update_buff | | ( length > alloced_update_rec_buff_length ) ) {
uchar * newptr ;
if ( ! ( newptr = ( uchar * ) my_realloc ( ( void * ) rec_update_buff , length , MYF ( MY_ALLOW_ZERO_PTR ) ) ) )
return 1 ;
rec_update_buff = newptr ;
alloced_update_rec_buff_length = length ;
}
return 0 ;
}
2008-02-05 16:00:53 +00:00
/* Calculate max length needed for row */
2008-02-07 20:19:44 +00:00
ulong ha_tokudb : : max_row_length ( const uchar * buf ) {
ulong length = table_share - > reclength + table_share - > fields * 2 ;
uint * ptr , * end ;
for ( ptr = table_share - > blob_field , end = ptr + table_share - > blob_fields ; ptr ! = end ; ptr + + ) {
Field_blob * blob = ( ( Field_blob * ) table - > field [ * ptr ] ) ;
2008-11-18 22:20:06 +00:00
length + = blob - > get_length ( ( uchar * ) ( buf + field_offset ( blob , table ) ) ) + 2 ;
2008-02-07 20:19:44 +00:00
}
return length ;
2008-02-05 16:00:53 +00:00
}
/*
*/
2008-04-24 19:20:26 +00:00
//
// take the row passed in as a DBT*, and convert it into a row in MySQL format in record
// Pack a row for storage.
// If the row is of fixed length, just store the row 'as is'.
// If not, we will generate a packed row suitable for storage.
// This will only fail if we don't have enough memory to pack the row,
// which may only happen in rows with blobs, as the default row length is
// pre-allocated.
// Parameters:
// [out] row - row stored in DBT to be converted
2010-01-11 18:14:37 +00:00
// [out] buf - buffer where row is packed
2008-04-24 19:20:26 +00:00
// [in] record - row in MySQL format
//
2008-02-05 16:00:53 +00:00
2010-11-10 21:34:29 +00:00
int ha_tokudb : : pack_row_in_buff (
2009-04-07 15:14:03 +00:00
DBT * row ,
2009-04-17 18:29:25 +00:00
const uchar * record ,
2010-11-10 21:34:29 +00:00
uint index ,
uchar * row_buff
2009-04-07 15:14:03 +00:00
)
{
2009-04-17 18:29:25 +00:00
uchar * fixed_field_ptr = NULL ;
uchar * var_field_offset_ptr = NULL ;
uchar * start_field_data_ptr = NULL ;
uchar * var_field_data_ptr = NULL ;
2008-05-29 18:22:48 +00:00
int r = ENOSYS ;
2012-05-09 18:36:52 +00:00
memset ( ( void * ) row , 0 , sizeof ( * row ) ) ;
2008-05-29 18:22:48 +00:00
my_bitmap_map * old_map = dbug_tmp_use_all_columns ( table , table - > write_set ) ;
2012-09-05 17:48:50 +00:00
// Copy null bytes
2010-11-10 21:34:29 +00:00
memcpy ( row_buff , record , table_share - > null_bytes ) ;
fixed_field_ptr = row_buff + table_share - > null_bytes ;
2011-03-04 19:54:23 +00:00
var_field_offset_ptr = fixed_field_ptr + share - > kc_info . mcp_info [ index ] . fixed_field_size ;
2010-01-11 18:14:37 +00:00
start_field_data_ptr = var_field_offset_ptr + share - > kc_info . mcp_info [ index ] . len_of_offsets ;
var_field_data_ptr = var_field_offset_ptr + share - > kc_info . mcp_info [ index ] . len_of_offsets ;
2008-02-07 20:19:44 +00:00
2008-05-29 18:22:48 +00:00
// assert that when the hidden primary key exists, primary_key_offsets is NULL
2009-04-17 18:29:25 +00:00
for ( uint i = 0 ; i < table_share - > fields ; i + + ) {
Field * field = table - > field [ i ] ;
uint curr_field_offset = field_offset ( field , table ) ;
2010-01-11 18:14:37 +00:00
if ( bitmap_is_set ( & share - > kc_info . key_filters [ index ] , i ) ) {
2008-09-17 19:32:10 +00:00
continue ;
}
2010-01-11 18:14:37 +00:00
if ( share - > kc_info . field_lengths [ i ] ) {
2009-04-17 18:29:25 +00:00
fixed_field_ptr = pack_fixed_field (
fixed_field_ptr ,
record + curr_field_offset ,
2010-01-11 18:14:37 +00:00
share - > kc_info . field_lengths [ i ]
2009-04-17 18:29:25 +00:00
) ;
}
2010-01-11 18:14:37 +00:00
else if ( share - > kc_info . length_bytes [ i ] ) {
2009-04-17 18:29:25 +00:00
var_field_data_ptr = pack_var_field (
var_field_offset_ptr ,
var_field_data_ptr ,
start_field_data_ptr ,
record + curr_field_offset ,
2010-01-11 18:14:37 +00:00
share - > kc_info . length_bytes [ i ] ,
share - > kc_info . num_offset_bytes
2009-04-17 18:29:25 +00:00
) ;
2010-01-11 18:14:37 +00:00
var_field_offset_ptr + = share - > kc_info . num_offset_bytes ;
2009-04-17 18:29:25 +00:00
}
}
2010-01-11 18:14:37 +00:00
for ( uint i = 0 ; i < share - > kc_info . num_blobs ; i + + ) {
Field * field = table - > field [ share - > kc_info . blob_fields [ i ] ] ;
2009-06-10 18:51:38 +00:00
var_field_data_ptr = pack_toku_field_blob (
2009-04-17 18:29:25 +00:00
var_field_data_ptr ,
2009-06-10 18:51:38 +00:00
record + field_offset ( field , table ) ,
field
2009-04-17 18:29:25 +00:00
) ;
2008-02-07 20:19:44 +00:00
}
2008-05-12 14:27:43 +00:00
2010-11-10 21:34:29 +00:00
row - > data = row_buff ;
row - > size = ( size_t ) ( var_field_data_ptr - row_buff ) ;
2008-05-29 18:22:48 +00:00
r = 0 ;
dbug_tmp_restore_column_map ( table - > write_set , old_map ) ;
return r ;
2008-02-07 20:19:44 +00:00
}
2009-04-18 18:12:30 +00:00
2010-11-10 21:34:29 +00:00
int ha_tokudb : : pack_row (
DBT * row ,
const uchar * record ,
uint index
)
{
return pack_row_in_buff ( row , record , index , rec_buff ) ;
}
int ha_tokudb : : pack_old_row_for_update (
DBT * row ,
const uchar * record ,
uint index
)
{
return pack_row_in_buff ( row , record , index , rec_update_buff ) ;
}
2009-04-20 02:36:43 +00:00
int ha_tokudb : : unpack_blobs (
2009-04-18 18:12:30 +00:00
uchar * record ,
const uchar * from_tokudb_blob ,
2012-07-25 20:48:53 +00:00
uint32_t num_bytes ,
2010-01-12 03:41:56 +00:00
bool check_bitmap
2009-04-18 18:12:30 +00:00
)
{
2009-04-20 02:36:43 +00:00
uint error = 0 ;
uchar * ptr = NULL ;
const uchar * buff = NULL ;
2009-04-18 18:12:30 +00:00
//
2009-04-20 02:36:43 +00:00
// assert that num_bytes > 0 iff share->num_blobs > 0
2009-04-18 18:12:30 +00:00
//
2010-01-11 18:14:37 +00:00
assert ( ! ( ( share - > kc_info . num_blobs = = 0 ) & & ( num_bytes > 0 ) ) ) ;
2009-04-20 02:36:43 +00:00
if ( num_bytes > num_blob_bytes ) {
ptr = ( uchar * ) my_realloc ( ( void * ) blob_buff , num_bytes , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
if ( ptr = = NULL ) {
error = ENOMEM ;
goto exit ;
}
blob_buff = ptr ;
num_blob_bytes = num_bytes ;
}
memcpy ( blob_buff , from_tokudb_blob , num_bytes ) ;
buff = blob_buff ;
2010-01-11 18:14:37 +00:00
for ( uint i = 0 ; i < share - > kc_info . num_blobs ; i + + ) {
2012-07-25 20:48:53 +00:00
uint32_t curr_field_index = share - > kc_info . blob_fields [ i ] ;
2010-01-12 03:41:56 +00:00
bool skip = check_bitmap ?
! ( bitmap_is_set ( table - > read_set , curr_field_index ) | |
bitmap_is_set ( table - > write_set , curr_field_index ) ) :
false ;
Field * field = table - > field [ curr_field_index ] ;
2012-07-25 20:48:53 +00:00
uint32_t len_bytes = field - > row_pack_length ( ) ;
2009-06-10 18:51:38 +00:00
buff = unpack_toku_field_blob (
2009-04-18 18:12:30 +00:00
record + field_offset ( field , table ) ,
2009-06-10 18:51:38 +00:00
buff ,
2010-01-11 18:14:37 +00:00
len_bytes ,
2010-01-12 03:41:56 +00:00
skip
2009-04-18 18:12:30 +00:00
) ;
}
2009-04-20 02:36:43 +00:00
error = 0 ;
exit :
return error ;
2009-04-18 18:12:30 +00:00
}
2008-04-18 19:54:14 +00:00
//
// take the row passed in as a DBT*, and convert it into a row in MySQL format in record
// Parameters:
// [out] record - row in MySQL format
// [in] row - row stored in DBT to be converted
//
2009-04-20 02:36:43 +00:00
int ha_tokudb : : unpack_row (
2009-04-07 15:14:03 +00:00
uchar * record ,
DBT const * row ,
2009-04-17 18:29:25 +00:00
DBT const * key ,
uint index
2009-04-07 15:14:03 +00:00
)
{
2008-05-29 18:22:48 +00:00
//
// two cases, fixed length row, and variable length row
// fixed length row is first below
//
2009-04-17 18:29:25 +00:00
/* Copy null bits */
2009-04-20 02:36:43 +00:00
int error = 0 ;
2009-04-17 18:29:25 +00:00
const uchar * fixed_field_ptr = ( const uchar * ) row - > data ;
const uchar * var_field_offset_ptr = NULL ;
const uchar * var_field_data_ptr = NULL ;
2012-07-25 20:48:53 +00:00
uint32_t data_end_offset = 0 ;
2009-04-17 18:29:25 +00:00
memcpy ( record , fixed_field_ptr , table_share - > null_bytes ) ;
fixed_field_ptr + = table_share - > null_bytes ;
2008-05-29 18:22:48 +00:00
2011-03-04 19:54:23 +00:00
var_field_offset_ptr = fixed_field_ptr + share - > kc_info . mcp_info [ index ] . fixed_field_size ;
2010-01-11 18:14:37 +00:00
var_field_data_ptr = var_field_offset_ptr + share - > kc_info . mcp_info [ index ] . len_of_offsets ;
2008-05-29 18:22:48 +00:00
2009-04-17 18:29:25 +00:00
//
// unpack the key, if necessary
//
if ( ! ( hidden_primary_key & & index = = primary_key ) ) {
unpack_key ( record , key , index ) ;
}
2012-07-25 20:48:53 +00:00
uint32_t last_offset = 0 ;
2009-04-17 18:29:25 +00:00
//
// we have two methods of unpacking, one if we need to unpack the entire row
// the second if we unpack a subset of the entire row
// first method here is if we unpack the entire row
//
if ( unpack_entire_row ) {
//
// fill in parts of record that are not part of the key
//
for ( uint i = 0 ; i < table_share - > fields ; i + + ) {
Field * field = table - > field [ i ] ;
2010-01-11 18:14:37 +00:00
if ( bitmap_is_set ( & share - > kc_info . key_filters [ index ] , i ) ) {
2009-04-17 18:29:25 +00:00
continue ;
}
2008-05-29 18:22:48 +00:00
2010-01-11 18:14:37 +00:00
if ( share - > kc_info . field_lengths [ i ] ) {
2009-04-17 18:29:25 +00:00
fixed_field_ptr = unpack_fixed_field (
record + field_offset ( field , table ) ,
fixed_field_ptr ,
2010-01-11 18:14:37 +00:00
share - > kc_info . field_lengths [ i ]
2009-04-17 18:29:25 +00:00
) ;
}
2008-05-29 18:22:48 +00:00
//
2009-04-17 18:29:25 +00:00
// here, we DO modify var_field_data_ptr or var_field_offset_ptr
// as we unpack variable sized fields
2008-05-29 18:22:48 +00:00
//
2010-01-11 18:14:37 +00:00
else if ( share - > kc_info . length_bytes [ i ] ) {
switch ( share - > kc_info . num_offset_bytes ) {
2009-04-17 18:29:25 +00:00
case ( 1 ) :
data_end_offset = var_field_offset_ptr [ 0 ] ;
break ;
case ( 2 ) :
data_end_offset = uint2korr ( var_field_offset_ptr ) ;
break ;
default :
assert ( false ) ;
break ;
}
unpack_var_field (
record + field_offset ( field , table ) ,
var_field_data_ptr ,
data_end_offset - last_offset ,
2010-01-11 18:14:37 +00:00
share - > kc_info . length_bytes [ i ]
2009-04-17 18:29:25 +00:00
) ;
2010-01-11 18:14:37 +00:00
var_field_offset_ptr + = share - > kc_info . num_offset_bytes ;
2009-04-17 18:29:25 +00:00
var_field_data_ptr + = data_end_offset - last_offset ;
last_offset = data_end_offset ;
2009-04-18 18:12:30 +00:00
}
2008-05-29 18:22:48 +00:00
}
2009-04-20 02:36:43 +00:00
error = unpack_blobs (
2009-04-18 18:12:30 +00:00
record ,
var_field_data_ptr ,
2012-07-25 20:48:53 +00:00
row - > size - ( uint32_t ) ( var_field_data_ptr - ( const uchar * ) row - > data ) ,
2010-01-12 03:41:56 +00:00
false
2009-04-18 18:12:30 +00:00
) ;
2009-04-20 02:36:43 +00:00
if ( error ) {
goto exit ;
}
2008-05-29 18:22:48 +00:00
}
2009-04-17 18:29:25 +00:00
//
// in this case, we unpack only what is specified
// in fixed_cols_for_query and var_cols_for_query
//
2008-02-07 20:19:44 +00:00
else {
2009-04-17 18:29:25 +00:00
//
// first the fixed fields
//
2012-07-25 20:48:53 +00:00
for ( uint32_t i = 0 ; i < num_fixed_cols_for_query ; i + + ) {
2009-04-17 18:29:25 +00:00
uint field_index = fixed_cols_for_query [ i ] ;
Field * field = table - > field [ field_index ] ;
unpack_fixed_field (
record + field_offset ( field , table ) ,
2010-01-11 18:14:37 +00:00
fixed_field_ptr + share - > kc_info . cp_info [ index ] [ field_index ] . col_pack_val ,
share - > kc_info . field_lengths [ field_index ]
2009-04-17 18:29:25 +00:00
) ;
2008-05-29 18:22:48 +00:00
}
//
2009-04-17 18:29:25 +00:00
// now the var fields
// here, we do NOT modify var_field_data_ptr or var_field_offset_ptr
2008-05-29 18:22:48 +00:00
//
2012-07-25 20:48:53 +00:00
for ( uint32_t i = 0 ; i < num_var_cols_for_query ; i + + ) {
2009-04-17 18:29:25 +00:00
uint field_index = var_cols_for_query [ i ] ;
Field * field = table - > field [ field_index ] ;
2012-07-25 20:48:53 +00:00
uint32_t var_field_index = share - > kc_info . cp_info [ index ] [ field_index ] . col_pack_val ;
uint32_t data_start_offset ;
uint32_t field_len ;
2009-04-17 18:29:25 +00:00
2010-01-11 18:14:37 +00:00
get_var_field_info (
& field_len ,
& data_start_offset ,
var_field_index ,
var_field_offset_ptr ,
share - > kc_info . num_offset_bytes
) ;
2009-04-17 18:29:25 +00:00
unpack_var_field (
record + field_offset ( field , table ) ,
var_field_data_ptr + data_start_offset ,
2010-01-11 18:14:37 +00:00
field_len ,
share - > kc_info . length_bytes [ field_index ]
2009-04-17 18:29:25 +00:00
) ;
}
2009-04-18 18:12:30 +00:00
if ( read_blobs ) {
//
// now the blobs
//
2010-01-11 18:14:37 +00:00
get_blob_field_info (
& data_end_offset ,
share - > kc_info . mcp_info [ index ] . len_of_offsets ,
var_field_data_ptr ,
share - > kc_info . num_offset_bytes
) ;
2009-04-17 18:29:25 +00:00
2010-01-11 18:14:37 +00:00
var_field_data_ptr + = data_end_offset ;
2009-04-20 02:36:43 +00:00
error = unpack_blobs (
2009-04-18 18:12:30 +00:00
record ,
var_field_data_ptr ,
2012-07-25 20:48:53 +00:00
row - > size - ( uint32_t ) ( var_field_data_ptr - ( const uchar * ) row - > data ) ,
2010-01-12 03:41:56 +00:00
true
2009-04-17 18:29:25 +00:00
) ;
2009-04-20 02:36:43 +00:00
if ( error ) {
goto exit ;
}
2008-05-29 18:22:48 +00:00
}
2008-02-07 20:19:44 +00:00
}
2009-04-20 02:36:43 +00:00
error = 0 ;
exit :
return error ;
2008-02-05 16:00:53 +00:00
}
2012-07-25 20:48:53 +00:00
uint32_t ha_tokudb : : place_key_into_mysql_buff (
2009-04-07 15:14:03 +00:00
KEY * key_info ,
uchar * record ,
uchar * data
)
{
2012-12-12 18:37:24 +00:00
KEY_PART_INFO * key_part = key_info - > key_part , * end = key_part + get_key_parts ( key_info ) ;
2008-11-03 20:42:59 +00:00
uchar * pos = data ;
2008-02-07 20:19:44 +00:00
for ( ; key_part ! = end ; key_part + + ) {
2010-03-29 02:08:34 +00:00
if ( key_part - > field - > null_bit ) {
uint null_offset = get_null_offset ( table , key_part - > field ) ;
2008-09-17 19:32:10 +00:00
if ( * pos + + = = NULL_COL_VAL ) { // Null value
2009-03-26 01:25:59 +00:00
//
// We don't need to reset the record data as we will not access it
// if the null data is set
//
2010-03-29 02:08:34 +00:00
record [ null_offset ] | = key_part - > field - > null_bit ;
2008-02-07 20:19:44 +00:00
continue ;
}
2010-03-29 02:08:34 +00:00
record [ null_offset ] & = ~ key_part - > field - > null_bit ;
2008-02-07 20:19:44 +00:00
}
2012-04-16 20:04:07 +00:00
# if !defined(MARIADB_BASE_VERSION)
2009-03-26 14:20:49 +00:00
//
// HOPEFULLY TEMPORARY
//
assert ( table - > s - > db_low_byte_first ) ;
2012-04-16 20:04:07 +00:00
# endif
2009-04-07 15:08:03 +00:00
pos = unpack_toku_key_field (
2009-03-26 14:20:49 +00:00
record + field_offset ( key_part - > field , table ) ,
2009-03-25 14:24:25 +00:00
pos ,
2009-03-26 14:20:49 +00:00
key_part - > field ,
key_part - > length
2009-03-25 14:24:25 +00:00
) ;
2008-02-07 20:19:44 +00:00
}
2008-11-03 20:42:59 +00:00
return pos - data ;
2008-02-05 16:00:53 +00:00
}
2008-05-08 15:50:34 +00:00
//
2008-11-03 20:42:59 +00:00
// Store the key and the primary key into the row
2008-05-08 15:50:34 +00:00
// Parameters:
2008-11-03 20:42:59 +00:00
// [out] record - key stored in MySQL format
// [in] key - key stored in DBT to be converted
// index -index into key_file that represents the DB
// unpacking a key of
2008-05-08 15:50:34 +00:00
//
2008-11-03 20:42:59 +00:00
void ha_tokudb : : unpack_key ( uchar * record , DBT const * key , uint index ) {
2012-07-25 20:48:53 +00:00
uint32_t bytes_read ;
2008-11-03 20:42:59 +00:00
uchar * pos = ( uchar * ) key - > data + 1 ;
2009-03-25 20:41:04 +00:00
bytes_read = place_key_into_mysql_buff (
& table - > key_info [ index ] ,
record ,
pos
) ;
2009-11-25 21:00:52 +00:00
if ( ( index ! = primary_key ) & & ! hidden_primary_key ) {
2008-11-03 20:42:59 +00:00
//
// also unpack primary key
//
2009-03-25 20:41:04 +00:00
place_key_into_mysql_buff (
& table - > key_info [ primary_key ] ,
record ,
pos + bytes_read
) ;
2008-11-03 20:42:59 +00:00
}
}
2008-02-05 16:00:53 +00:00
2012-07-25 20:48:53 +00:00
uint32_t ha_tokudb : : place_key_into_dbt_buff (
2009-04-07 15:14:03 +00:00
KEY * key_info ,
uchar * buff ,
const uchar * record ,
bool * has_null ,
int key_length
)
{
2008-11-03 20:42:59 +00:00
KEY_PART_INFO * key_part = key_info - > key_part ;
2012-12-12 18:37:24 +00:00
KEY_PART_INFO * end = key_part + get_key_parts ( key_info ) ;
2008-11-03 20:42:59 +00:00
uchar * curr_buff = buff ;
2008-08-10 16:39:16 +00:00
* has_null = false ;
2008-02-07 20:19:44 +00:00
for ( ; key_part ! = end & & key_length > 0 ; key_part + + ) {
2008-05-26 14:07:31 +00:00
//
// accessing key_part->field->null_bit instead off key_part->null_bit
// because key_part->null_bit is not set in add_index
// filed ticket 862 to look into this
//
if ( key_part - > field - > null_bit ) {
2008-02-07 20:19:44 +00:00
/* Store 0 if the key part is a NULL part */
2009-03-25 20:41:04 +00:00
uint null_offset = get_null_offset ( table , key_part - > field ) ;
2008-09-16 13:34:59 +00:00
if ( record [ null_offset ] & key_part - > field - > null_bit ) {
2008-11-03 20:42:59 +00:00
* curr_buff + + = NULL_COL_VAL ;
2008-08-10 16:39:16 +00:00
* has_null = true ;
2008-02-07 20:19:44 +00:00
continue ;
}
2008-11-03 20:42:59 +00:00
* curr_buff + + = NONNULL_COL_VAL ; // Store NOT NULL marker
2008-02-07 20:19:44 +00:00
}
2012-04-16 20:04:07 +00:00
# if !defined(MARIADB_BASE_VERSION)
2008-05-26 14:07:31 +00:00
//
2009-03-26 14:11:14 +00:00
// HOPEFULLY TEMPORARY
//
assert ( table - > s - > db_low_byte_first ) ;
2012-04-16 20:04:07 +00:00
# endif
2009-03-26 14:11:14 +00:00
//
2008-05-26 14:07:31 +00:00
// accessing field_offset(key_part->field) instead off key_part->offset
// because key_part->offset is SET INCORRECTLY in add_index
// filed ticket 862 to look into this
//
2009-04-07 15:08:03 +00:00
curr_buff = pack_toku_key_field (
2009-03-26 14:11:14 +00:00
curr_buff ,
2009-03-25 14:24:25 +00:00
( uchar * ) ( record + field_offset ( key_part - > field , table ) ) ,
2009-03-26 14:11:14 +00:00
key_part - > field ,
key_part - > length
2009-03-25 14:24:25 +00:00
) ;
2008-02-07 20:19:44 +00:00
key_length - = key_part - > length ;
}
2008-11-03 20:42:59 +00:00
return curr_buff - buff ;
}
//
// Create a packed key from a row. This key will be written as such
// to the index tree. This will never fail as the key buffer is pre-allocated.
// Parameters:
// [out] key - DBT that holds the key
// [in] key_info - holds data about the key, such as it's length and offset into record
// [out] buff - buffer that will hold the data for key (unless
// we have a hidden primary key)
// [in] record - row from which to create the key
// key_length - currently set to MAX_KEY_LENGTH, is it size of buff?
// Returns:
// the parameter key
//
2009-04-07 15:14:03 +00:00
DBT * ha_tokudb : : create_dbt_key_from_key (
2009-11-25 21:00:52 +00:00
DBT * key ,
2009-04-07 15:14:03 +00:00
KEY * key_info ,
2009-11-25 21:00:52 +00:00
uchar * buff ,
2009-04-07 15:14:03 +00:00
const uchar * record ,
2009-11-25 21:00:52 +00:00
bool * has_null ,
bool dont_pack_pk ,
2009-04-07 15:14:03 +00:00
int key_length
)
{
2012-07-25 20:48:53 +00:00
uint32_t size = 0 ;
2008-11-03 20:42:59 +00:00
uchar * tmp_buff = buff ;
my_bitmap_map * old_map = dbug_tmp_use_all_columns ( table , table - > write_set ) ;
key - > data = buff ;
//
// first put the "infinity" byte at beginning. States if missing columns are implicitly
2009-08-19 14:11:01 +00:00
// positive infinity or negative infinity or zero. For this, because we are creating key
2008-11-03 20:42:59 +00:00
// from a row, there is no way that columns can be missing, so in practice,
// this will be meaningless. Might as well put in a value
//
2009-08-19 14:11:01 +00:00
* tmp_buff + + = COL_ZERO ;
2008-11-03 20:42:59 +00:00
size + + ;
2009-04-07 15:14:03 +00:00
size + = place_key_into_dbt_buff (
key_info ,
tmp_buff ,
record ,
has_null ,
key_length
) ;
2009-11-25 21:00:52 +00:00
if ( ! dont_pack_pk ) {
2008-11-03 20:42:59 +00:00
tmp_buff = buff + size ;
if ( hidden_primary_key ) {
memcpy_fixed ( tmp_buff , current_ident , TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH ) ;
size + = TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH ;
}
else {
bool tmp_bool = false ;
size + = place_key_into_dbt_buff (
& table - > key_info [ primary_key ] ,
tmp_buff ,
record ,
& tmp_bool ,
MAX_KEY_LENGTH //this parameter does not matter
) ;
}
}
key - > size = size ;
2008-02-07 20:19:44 +00:00
DBUG_DUMP ( " key " , ( uchar * ) key - > data , key - > size ) ;
dbug_tmp_restore_column_map ( table - > write_set , old_map ) ;
2008-05-26 14:07:31 +00:00
return key ;
}
//
// Create a packed key from a row. This key will be written as such
// to the index tree. This will never fail as the key buffer is pre-allocated.
// Parameters:
// [out] key - DBT that holds the key
// keynr - index for which to create the key
// [out] buff - buffer that will hold the data for key (unless
// we have a hidden primary key)
// [in] record - row from which to create the key
2008-09-17 19:01:39 +00:00
// [out] has_null - says if the key has a NULL value for one of its columns
2008-05-26 14:07:31 +00:00
// key_length - currently set to MAX_KEY_LENGTH, is it size of buff?
// Returns:
// the parameter key
//
2009-04-07 15:14:03 +00:00
DBT * ha_tokudb : : create_dbt_key_from_table (
DBT * key ,
uint keynr ,
uchar * buff ,
const uchar * record ,
bool * has_null ,
int key_length
)
{
2008-05-26 14:07:31 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::create_dbt_key_from_table " ) ;
2012-05-09 18:36:52 +00:00
memset ( ( void * ) key , 0 , sizeof ( * key ) ) ;
2008-05-26 14:07:31 +00:00
if ( hidden_primary_key & & keynr = = primary_key ) {
2010-01-11 18:14:37 +00:00
key - > data = buff ;
memcpy ( buff , & current_ident , TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH ) ;
2008-05-26 14:07:31 +00:00
key - > size = TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH ;
2008-08-10 16:39:16 +00:00
* has_null = false ;
2008-05-26 14:07:31 +00:00
DBUG_RETURN ( key ) ;
}
2009-11-25 21:00:52 +00:00
DBUG_RETURN ( create_dbt_key_from_key ( key , & table - > key_info [ keynr ] , buff , record , has_null , ( keynr = = primary_key ) , key_length ) ) ;
2008-02-05 16:00:53 +00:00
}
2009-11-25 21:00:52 +00:00
DBT * ha_tokudb : : create_dbt_key_for_lookup (
DBT * key ,
KEY * key_info ,
uchar * buff ,
const uchar * record ,
bool * has_null ,
int key_length
)
{
TOKUDB_DBUG_ENTER ( " ha_tokudb::create_dbt_key_from_lookup " ) ;
DBUG_RETURN ( create_dbt_key_from_key ( key , key_info , buff , record , has_null , true , key_length ) ) ;
}
2008-02-05 16:00:53 +00:00
2008-05-08 15:50:34 +00:00
//
// Create a packed key from from a MySQL unpacked key (like the one that is
// sent from the index_read() This key is to be used to read a row
// Parameters:
// [out] key - DBT that holds the key
// keynr - index for which to pack the key
// [out] buff - buffer that will hold the data for key
// [in] key_ptr - MySQL unpacked key
// key_length - length of key_ptr
// Returns:
// the parameter key
//
2009-04-07 15:14:03 +00:00
DBT * ha_tokudb : : pack_key (
DBT * key ,
uint keynr ,
uchar * buff ,
const uchar * key_ptr ,
uint key_length ,
2009-08-19 14:11:01 +00:00
int8_t inf_byte
2009-04-07 15:14:03 +00:00
)
{
2008-03-26 02:47:07 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::pack_key " ) ;
2013-02-26 21:17:51 +00:00
# if TOKU_INCLUDE_EXTENDED_KEYS
if ( keynr ! = primary_key & & ! test ( hidden_primary_key ) ) {
DBUG_RETURN ( pack_ext_key ( key , keynr , buff , key_ptr , key_length , inf_byte ) ) ;
}
# endif
KEY * key_info = & table - > key_info [ keynr ] ;
KEY_PART_INFO * key_part = key_info - > key_part ;
KEY_PART_INFO * end = key_part + get_key_parts ( key_info ) ;
my_bitmap_map * old_map = dbug_tmp_use_all_columns ( table , table - > write_set ) ;
memset ( ( void * ) key , 0 , sizeof ( * key ) ) ;
key - > data = buff ;
// first put the "infinity" byte at beginning. States if missing columns are implicitly
// positive infinity or negative infinity
* buff + + = ( uchar ) inf_byte ;
for ( ; key_part ! = end & & ( int ) key_length > 0 ; key_part + + ) {
uint offset = 0 ;
if ( key_part - > null_bit ) {
if ( ! ( * key_ptr = = 0 ) ) {
* buff + + = NULL_COL_VAL ;
key_length - = key_part - > store_length ;
key_ptr + = key_part - > store_length ;
continue ;
}
* buff + + = NONNULL_COL_VAL ;
offset = 1 ; // Data is at key_ptr+1
}
# if !defined(MARIADB_BASE_VERSION)
assert ( table - > s - > db_low_byte_first ) ;
# endif
buff = pack_key_toku_key_field (
buff ,
( uchar * ) key_ptr + offset ,
key_part - > field ,
key_part - > length
) ;
key_ptr + = key_part - > store_length ;
key_length - = key_part - > store_length ;
}
key - > size = ( buff - ( uchar * ) key - > data ) ;
DBUG_DUMP ( " key " , ( uchar * ) key - > data , key - > size ) ;
dbug_tmp_restore_column_map ( table - > write_set , old_map ) ;
DBUG_RETURN ( key ) ;
}
# if TOKU_INCLUDE_EXTENDED_KEYS
DBT * ha_tokudb : : pack_ext_key (
DBT * key ,
uint keynr ,
uchar * buff ,
const uchar * key_ptr ,
uint key_length ,
int8_t inf_byte
)
{
TOKUDB_DBUG_ENTER ( " ha_tokudb::pack_ext_key " ) ;
// build a list of PK parts that are in the SK. we will use this list to build the
// extended key if necessary.
KEY * pk_key_info = & table - > key_info [ primary_key ] ;
uint pk_parts = get_key_parts ( pk_key_info ) ;
uint pk_next = 0 ;
struct {
const uchar * key_ptr ;
KEY_PART_INFO * key_part ;
} pk_info [ pk_parts ] ;
2009-03-31 20:43:42 +00:00
KEY * key_info = & table - > key_info [ keynr ] ;
2008-02-07 20:19:44 +00:00
KEY_PART_INFO * key_part = key_info - > key_part ;
2012-12-12 18:37:24 +00:00
KEY_PART_INFO * end = key_part + get_key_parts ( key_info ) ;
2008-02-07 20:19:44 +00:00
my_bitmap_map * old_map = dbug_tmp_use_all_columns ( table , table - > write_set ) ;
2012-05-09 18:36:52 +00:00
memset ( ( void * ) key , 0 , sizeof ( * key ) ) ;
2008-02-07 20:19:44 +00:00
key - > data = buff ;
2008-09-17 19:01:39 +00:00
// first put the "infinity" byte at beginning. States if missing columns are implicitly
// positive infinity or negative infinity
2009-08-19 14:11:01 +00:00
* buff + + = ( uchar ) inf_byte ;
2008-09-17 19:01:39 +00:00
2008-02-07 20:19:44 +00:00
for ( ; key_part ! = end & & ( int ) key_length > 0 ; key_part + + ) {
2013-02-26 21:17:51 +00:00
// if the SK part is part of the PK, then append it to the list.
if ( key_part - > field - > part_of_key . is_set ( primary_key ) ) {
assert ( pk_next < pk_parts ) ;
pk_info [ pk_next ] . key_ptr = key_ptr ;
pk_info [ pk_next ] . key_part = key_part ;
pk_next + + ;
}
2008-02-07 20:19:44 +00:00
uint offset = 0 ;
if ( key_part - > null_bit ) {
2008-09-17 19:01:39 +00:00
if ( ! ( * key_ptr = = 0 ) ) {
* buff + + = NULL_COL_VAL ;
2008-02-07 20:19:44 +00:00
key_length - = key_part - > store_length ;
key_ptr + = key_part - > store_length ;
continue ;
}
2008-09-17 19:01:39 +00:00
* buff + + = NONNULL_COL_VAL ;
2008-02-07 20:19:44 +00:00
offset = 1 ; // Data is at key_ptr+1
}
2012-04-16 20:04:07 +00:00
# if !defined(MARIADB_BASE_VERSION)
2009-03-26 15:03:15 +00:00
assert ( table - > s - > db_low_byte_first ) ;
2012-04-16 20:04:07 +00:00
# endif
2009-04-07 15:08:03 +00:00
buff = pack_key_toku_key_field (
2009-03-26 15:03:15 +00:00
buff ,
2009-03-25 14:24:25 +00:00
( uchar * ) key_ptr + offset ,
2009-03-26 15:03:15 +00:00
key_part - > field ,
key_part - > length
2009-03-25 14:24:25 +00:00
) ;
2009-03-26 15:03:15 +00:00
2008-02-07 20:19:44 +00:00
key_ptr + = key_part - > store_length ;
key_length - = key_part - > store_length ;
}
2013-02-26 21:17:51 +00:00
if ( key_length > 0 ) {
assert ( key_part = = end ) ;
end = key_info - > key_part + get_ext_key_parts ( key_info ) ;
// pack PK in order of PK key parts
for ( uint pk_index = 0 ; key_part ! = end & & ( int ) key_length > 0 & & pk_index < pk_parts ; pk_index + + ) {
uint i ;
for ( i = 0 ; i < pk_next ; i + + ) {
2013-02-27 15:55:15 +00:00
if ( pk_info [ i ] . key_part - > fieldnr = = pk_key_info - > key_part [ pk_index ] . fieldnr )
2013-02-26 21:17:51 +00:00
break ;
}
if ( i < pk_next ) {
const uchar * this_key_ptr = pk_info [ i ] . key_ptr ;
KEY_PART_INFO * this_key_part = pk_info [ i ] . key_part ;
buff = pack_key_toku_key_field ( buff , ( uchar * ) this_key_ptr , this_key_part - > field , this_key_part - > length ) ;
} else {
buff = pack_key_toku_key_field ( buff , ( uchar * ) key_ptr , key_part - > field , key_part - > length ) ;
key_ptr + = key_part - > store_length ;
key_length - = key_part - > store_length ;
key_part + + ;
}
}
}
2008-02-07 20:19:44 +00:00
key - > size = ( buff - ( uchar * ) key - > data ) ;
DBUG_DUMP ( " key " , ( uchar * ) key - > data , key - > size ) ;
dbug_tmp_restore_column_map ( table - > write_set , old_map ) ;
DBUG_RETURN ( key ) ;
2008-02-05 16:00:53 +00:00
}
2013-02-26 21:17:51 +00:00
# endif
2008-02-05 16:00:53 +00:00
2008-07-04 02:24:49 +00:00
//
// get max used hidden primary key value
//
void ha_tokudb : : init_hidden_prim_key_info ( ) {
TOKUDB_DBUG_ENTER ( " ha_tokudb::init_prim_key_info " ) ;
2008-07-04 16:34:36 +00:00
pthread_mutex_lock ( & share - > mutex ) ;
2008-07-03 18:58:58 +00:00
if ( ! ( share - > status & STATUS_PRIMARY_KEY_INIT ) ) {
2011-09-07 20:25:11 +00:00
int error = 0 ;
THD * thd = ha_thd ( ) ;
DB_TXN * txn = NULL ;
DBC * c = NULL ;
tokudb_trx_data * trx = NULL ;
trx = ( tokudb_trx_data * ) thd_data_get ( ha_thd ( ) , tokudb_hton - > slot ) ;
bool do_commit = false ;
if ( thd_sql_command ( thd ) = = SQLCOM_CREATE_TABLE & & trx & & trx - > sub_sp_level ) {
txn = trx - > sub_sp_level ;
}
else {
do_commit = true ;
error = db_env - > txn_begin ( db_env , 0 , & txn , 0 ) ;
assert ( error = = 0 ) ;
}
error = share - > key_file [ primary_key ] - > cursor (
share - > key_file [ primary_key ] ,
txn ,
& c ,
0
) ;
assert ( error = = 0 ) ;
DBT key , val ;
2012-05-09 18:36:52 +00:00
memset ( & key , 0 , sizeof ( key ) ) ;
memset ( & val , 0 , sizeof ( val ) ) ;
2011-09-07 20:25:11 +00:00
error = c - > c_get ( c , & key , & val , DB_LAST ) ;
2008-07-03 18:58:58 +00:00
if ( error = = 0 ) {
2011-09-07 20:25:11 +00:00
assert ( key . size = = TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH ) ;
share - > auto_ident = hpk_char_to_num ( ( uchar * ) key . data ) ;
}
error = c - > c_close ( c ) ;
assert ( error = = 0 ) ;
if ( do_commit ) {
commit_txn ( txn , 0 ) ;
2008-02-07 20:19:44 +00:00
}
2008-07-03 22:04:11 +00:00
share - > status | = STATUS_PRIMARY_KEY_INIT ;
2008-07-04 16:34:36 +00:00
}
pthread_mutex_unlock ( & share - > mutex ) ;
2008-07-04 02:24:49 +00:00
DBUG_VOID_RETURN ;
}
2008-07-03 22:04:11 +00:00
2008-07-04 02:24:49 +00:00
/** @brief
Get metadata info stored in status . tokudb
*/
2011-09-06 18:42:31 +00:00
int ha_tokudb : : get_status ( DB_TXN * txn ) {
2008-07-04 02:24:49 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::get_status " ) ;
2008-07-04 02:34:12 +00:00
DBT key , value ;
HA_METADATA_KEY curr_key ;
int error ;
2011-09-06 18:42:31 +00:00
2008-07-03 22:04:11 +00:00
//
// open status.tokudb
//
if ( ! share - > status_block ) {
2009-11-10 19:22:08 +00:00
error = open_status_dictionary (
& share - > status_block ,
share - > table_name ,
2011-09-06 18:42:31 +00:00
txn
2009-05-07 20:25:14 +00:00
) ;
2009-01-22 21:44:54 +00:00
if ( error ) {
goto cleanup ;
}
2008-02-07 20:19:44 +00:00
}
2008-07-03 22:04:11 +00:00
2008-07-04 02:01:46 +00:00
//
// transaction to be used for putting metadata into status.tokudb
//
2012-05-09 18:36:52 +00:00
memset ( & key , 0 , sizeof ( key ) ) ;
memset ( & value , 0 , sizeof ( value ) ) ;
2008-07-04 02:01:46 +00:00
key . data = & curr_key ;
key . size = sizeof ( curr_key ) ;
2009-08-05 18:23:40 +00:00
value . flags = DB_DBT_USERMEM ;
2008-07-04 02:01:46 +00:00
2009-11-10 19:22:08 +00:00
assert ( share - > status_block ) ;
//
// get version
//
value . ulen = sizeof ( share - > version ) ;
value . data = & share - > version ;
2011-05-03 16:04:15 +00:00
curr_key = hatoku_new_version ;
2009-11-10 19:22:08 +00:00
error = share - > status_block - > get (
share - > status_block ,
txn ,
& key ,
& value ,
0
) ;
if ( error = = DB_NOTFOUND ) {
2011-05-03 16:04:15 +00:00
//
// hack to keep handle the issues of going back and forth
// between 5.0.3 to 5.0.4
// the problem with going back and forth
// is with storing the frm file, 5.0.4 stores it, 5.0.3 does not
// so, if a user goes back and forth and alters the schema
// the frm stored can get out of sync with the schema of the table
// This can cause issues.
// To take care of this, we are doing this versioning work here.
// We change the key that stores the version.
// In 5.0.3, it is hatoku_old_version, in 5.0.4 it is hatoku_new_version
// When we encounter a table that does not have hatoku_new_version
// set, we give it the right one, and overwrite the old one with zero.
// This ensures that 5.0.3 cannot open the table. Once it has been opened by 5.0.4
//
uint dummy_version = 0 ;
share - > version = HA_TOKU_ORIG_VERSION ;
error = write_to_status (
share - > status_block ,
hatoku_new_version ,
& share - > version ,
sizeof ( share - > version ) ,
txn
) ;
if ( error ) { goto cleanup ; }
error = write_to_status (
share - > status_block ,
hatoku_old_version ,
& dummy_version ,
sizeof ( dummy_version ) ,
txn
) ;
if ( error ) { goto cleanup ; }
2009-11-10 19:22:08 +00:00
}
else if ( error | | value . size ! = sizeof ( share - > version ) ) {
if ( error = = 0 ) {
error = HA_ERR_INTERNAL_ERROR ;
2008-07-04 02:01:46 +00:00
}
2009-11-10 19:22:08 +00:00
goto cleanup ;
}
//
// get capabilities
//
curr_key = hatoku_capabilities ;
value . ulen = sizeof ( share - > capabilities ) ;
value . data = & share - > capabilities ;
error = share - > status_block - > get (
share - > status_block ,
txn ,
& key ,
& value ,
0
) ;
if ( error = = DB_NOTFOUND ) {
share - > capabilities = 0 ;
}
else if ( error | | value . size ! = sizeof ( share - > version ) ) {
if ( error = = 0 ) {
error = HA_ERR_INTERNAL_ERROR ;
2008-07-04 02:01:46 +00:00
}
2009-11-10 19:22:08 +00:00
goto cleanup ;
2008-07-04 02:01:46 +00:00
}
2009-11-10 19:22:08 +00:00
2008-07-04 02:34:12 +00:00
error = 0 ;
cleanup :
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-07 20:19:44 +00:00
}
2008-02-05 16:00:53 +00:00
/** @brief
Return an estimated of the number of rows in the table .
Used when sorting to allocate buffers and by the optimizer .
2008-04-17 20:56:40 +00:00
This is used in filesort . cc .
2008-02-05 16:00:53 +00:00
*/
2008-02-07 20:19:44 +00:00
ha_rows ha_tokudb : : estimate_rows_upper_bound ( ) {
2008-05-05 18:38:04 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::estimate_rows_upper_bound " ) ;
2008-07-08 01:59:46 +00:00
DBUG_RETURN ( share - > rows + HA_TOKUDB_EXTRA_ROWS ) ;
2008-02-07 20:19:44 +00:00
}
2008-02-05 16:00:53 +00:00
2009-03-24 18:20:58 +00:00
//
// Function that compares two primary keys that were saved as part of rnd_pos
// and ::position
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : cmp_ref ( const uchar * ref1 , const uchar * ref2 ) {
2009-03-24 18:20:58 +00:00
int ret_val = 0 ;
ret_val = tokudb_compare_two_keys (
2012-07-25 20:48:53 +00:00
ref1 + sizeof ( uint32_t ) ,
* ( uint32_t * ) ref1 ,
ref2 + sizeof ( uint32_t ) ,
* ( uint32_t * ) ref2 ,
2010-05-28 21:08:32 +00:00
( uchar * ) share - > file - > descriptor - > dbt . data + 4 ,
2012-07-25 20:48:53 +00:00
* ( uint32_t * ) share - > file - > descriptor - > dbt . data - 4 ,
2009-03-24 19:27:28 +00:00
false
2009-03-24 18:20:58 +00:00
) ;
return ret_val ;
2008-02-05 16:00:53 +00:00
}
2008-02-07 20:19:44 +00:00
bool ha_tokudb : : check_if_incompatible_data ( HA_CREATE_INFO * info , uint table_changes ) {
2011-03-09 13:16:25 +00:00
//
// This is a horrendous hack for now, as copied by InnoDB.
// This states that if the auto increment create field has changed,
// via a "alter table foo auto_increment=new_val", that this
// change is incompatible, and to rebuild the entire table
// This will need to be fixed
//
if ( ( info - > used_fields & HA_CREATE_USED_AUTO ) & &
info - > auto_increment_value ! = 0 ) {
return COMPATIBLE_DATA_NO ;
}
if ( table_changes ! = IS_EQUAL_YES )
2011-03-04 19:54:23 +00:00
return COMPATIBLE_DATA_NO ;
2011-03-09 13:16:25 +00:00
return COMPATIBLE_DATA_YES ;
2008-02-07 20:19:44 +00:00
}
2009-07-10 20:01:20 +00:00
2009-07-27 14:52:30 +00:00
//
// Method that is called before the beginning of many calls
// to insert rows (ha_tokudb::write_row). There is no guarantee
// that start_bulk_insert is called, however there is a guarantee
// that if start_bulk_insert is called, then end_bulk_insert may be
// called as well.
// Parameters:
// [in] rows - an estimate of the number of rows that will be inserted
// if number of rows is unknown (such as if doing
// "insert into foo select * from bar), then rows
// will be 0
//
2009-09-11 18:34:16 +00:00
//
// This function returns true if the table MAY be empty.
// It is NOT meant to be a 100% check for emptiness.
// This is used for a bulk load optimization.
//
2011-10-05 21:55:09 +00:00
bool ha_tokudb : : may_table_be_empty ( DB_TXN * txn ) {
2009-09-11 18:34:16 +00:00
int error ;
bool ret_val = false ;
DBC * tmp_cursor = NULL ;
2011-10-05 21:55:09 +00:00
DB_TXN * tmp_txn = NULL ;
2009-09-11 18:34:16 +00:00
2011-10-05 21:55:09 +00:00
if ( txn = = NULL ) {
error = db_env - > txn_begin ( db_env , 0 , & tmp_txn , 0 ) ;
if ( error ) {
goto cleanup ;
}
txn = tmp_txn ;
2009-09-11 18:34:16 +00:00
}
error = share - > file - > cursor ( share - > file , txn , & tmp_cursor , 0 ) ;
if ( error ) {
goto cleanup ;
}
error = tmp_cursor - > c_getf_next ( tmp_cursor , 0 , smart_dbt_do_nothing , NULL ) ;
if ( error = = DB_NOTFOUND ) {
ret_val = true ;
}
else {
ret_val = false ;
}
error = 0 ;
cleanup :
if ( tmp_cursor ) {
2009-12-03 16:59:52 +00:00
int r = tmp_cursor - > c_close ( tmp_cursor ) ;
assert ( r = = 0 ) ;
2009-09-11 18:34:16 +00:00
tmp_cursor = NULL ;
}
2011-10-05 21:55:09 +00:00
if ( tmp_txn ) {
commit_txn ( tmp_txn , 0 ) ;
tmp_txn = NULL ;
2009-09-11 18:34:16 +00:00
}
return ret_val ;
}
2010-01-11 18:14:37 +00:00
void ha_tokudb : : start_bulk_insert ( ha_rows rows ) {
2010-04-30 14:18:43 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::start_bulk_insert " ) ;
THD * thd = ha_thd ( ) ;
2010-07-15 16:18:56 +00:00
tokudb_trx_data * trx = ( tokudb_trx_data * ) thd_data_get ( thd , tokudb_hton - > slot ) ;
2010-01-11 18:53:10 +00:00
delay_updating_ai_metadata = true ;
2010-01-11 18:14:37 +00:00
ai_metadata_update_required = false ;
2010-03-29 02:08:34 +00:00
abort_loader = false ;
2010-12-09 20:24:59 +00:00
rw_rdlock ( & share - > num_DBs_lock ) ;
uint curr_num_DBs = table - > s - > keys + test ( hidden_primary_key ) ;
num_DBs_locked_in_bulk = true ;
lock_count = 0 ;
2010-01-11 18:14:37 +00:00
if ( share - > try_table_lock ) {
2011-10-05 21:55:09 +00:00
if ( get_prelock_empty ( thd ) & & may_table_be_empty ( transaction ) ) {
2012-06-09 21:00:05 +00:00
if ( using_ignore | | is_insert_ignore ( thd ) | | thd - > lex - > duplicates ! = DUP_ERROR ) {
2010-03-29 02:08:34 +00:00
acquire_table_lock ( transaction , lock_write ) ;
}
else {
mult_dbt_flags [ primary_key ] = 0 ;
if ( ! thd_test_options ( thd , OPTION_RELAXED_UNIQUE_CHECKS ) & & ! hidden_primary_key ) {
mult_put_flags [ primary_key ] = DB_NOOVERWRITE ;
}
2012-07-25 20:48:53 +00:00
uint32_t loader_flags = ( get_load_save_space ( thd ) ) ?
2012-11-20 16:11:50 +00:00
LOADER_COMPRESS_INTERMEDIATES : 0 ;
2012-06-30 16:51:25 +00:00
2010-03-29 02:08:34 +00:00
int error = db_env - > create_loader (
db_env ,
transaction ,
& loader ,
NULL , // no src_db needed
curr_num_DBs ,
share - > key_file ,
mult_put_flags ,
mult_dbt_flags ,
2012-04-12 15:07:54 +00:00
loader_flags
2010-03-29 02:08:34 +00:00
) ;
2010-05-05 21:04:19 +00:00
if ( error ) {
assert ( loader = = NULL ) ;
goto exit_try_table_lock ;
}
2010-03-29 02:08:34 +00:00
lc . thd = thd ;
lc . ha = this ;
2012-06-30 16:51:25 +00:00
error = loader - > set_poll_function ( loader , loader_poll_fun , & lc ) ;
2010-03-29 02:08:34 +00:00
assert ( ! error ) ;
error = loader - > set_error_callback ( loader , loader_dup_fun , & lc ) ;
assert ( ! error ) ;
2010-07-15 16:18:56 +00:00
trx - > stmt_progress . using_loader = true ;
2010-03-29 02:08:34 +00:00
}
2010-01-11 18:14:37 +00:00
}
2010-05-05 21:04:19 +00:00
exit_try_table_lock :
2010-01-11 18:14:37 +00:00
pthread_mutex_lock ( & share - > mutex ) ;
2012-04-02 18:27:34 +00:00
share - > try_table_lock = false ;
2010-01-11 18:14:37 +00:00
pthread_mutex_unlock ( & share - > mutex ) ;
}
2010-04-30 14:18:43 +00:00
DBUG_VOID_RETURN ;
2010-01-11 18:14:37 +00:00
}
//
// Method that is called at the end of many calls to insert rows
// (ha_tokudb::write_row). If start_bulk_insert is called, then
// this is guaranteed to be called.
//
2010-07-16 19:39:13 +00:00
int ha_tokudb : : end_bulk_insert ( bool abort ) {
2010-04-30 14:18:43 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::end_bulk_insert " ) ;
2010-01-11 18:14:37 +00:00
int error = 0 ;
2010-06-08 20:39:23 +00:00
THD * thd = ha_thd ( ) ;
2010-07-15 16:18:56 +00:00
tokudb_trx_data * trx = ( tokudb_trx_data * ) thd_data_get ( thd , tokudb_hton - > slot ) ;
2010-06-10 17:26:49 +00:00
bool using_loader = ( loader ! = NULL ) ;
2010-01-11 18:14:37 +00:00
if ( ai_metadata_update_required ) {
pthread_mutex_lock ( & share - > mutex ) ;
error = update_max_auto_inc ( share - > status_block , share - > last_auto_increment ) ;
pthread_mutex_unlock ( & share - > mutex ) ;
2010-03-29 02:08:34 +00:00
if ( error ) { goto cleanup ; }
2010-01-11 18:14:37 +00:00
}
delay_updating_ai_metadata = false ;
ai_metadata_update_required = false ;
2010-03-29 02:08:34 +00:00
loader_error = 0 ;
if ( loader ) {
2010-06-08 20:39:23 +00:00
if ( ! abort_loader & & ! thd - > killed ) {
2010-03-29 02:08:34 +00:00
error = loader - > close ( loader ) ;
loader = NULL ;
2010-06-09 17:45:49 +00:00
if ( error ) {
if ( thd - > killed ) {
my_error ( ER_QUERY_INTERRUPTED , MYF ( 0 ) ) ;
}
goto cleanup ;
}
2010-03-29 02:08:34 +00:00
for ( uint i = 0 ; i < table_share - > keys ; i + + ) {
if ( table_share - > key_info [ i ] . flags & HA_NOSAME ) {
bool is_unique ;
2010-05-13 14:59:29 +00:00
if ( i = = primary_key ) {
continue ;
}
2010-03-29 02:08:34 +00:00
error = is_index_unique (
& is_unique ,
transaction ,
share - > key_file [ i ] ,
& table - > key_info [ i ]
) ;
if ( error ) goto cleanup ;
if ( ! is_unique ) {
error = HA_ERR_FOUND_DUPP_KEY ;
last_dup_key = i ;
goto cleanup ;
}
}
}
}
else {
2010-06-16 19:17:54 +00:00
error = sprintf ( write_status_msg , " aborting bulk load " ) ;
thd_proc_info ( thd , write_status_msg ) ;
2010-03-29 02:08:34 +00:00
loader - > abort ( loader ) ;
loader = NULL ;
2010-06-09 18:09:40 +00:00
share - > try_table_lock = true ;
2010-03-29 02:08:34 +00:00
}
}
cleanup :
2010-12-09 20:24:59 +00:00
if ( num_DBs_locked_in_bulk ) {
rw_unlock ( & share - > num_DBs_lock ) ;
}
num_DBs_locked_in_bulk = false ;
lock_count = 0 ;
2010-03-29 02:08:34 +00:00
if ( loader ) {
2010-06-16 19:17:54 +00:00
error = sprintf ( write_status_msg , " aborting bulk load " ) ;
thd_proc_info ( thd , write_status_msg ) ;
2010-03-29 02:08:34 +00:00
loader - > abort ( loader ) ;
loader = NULL ;
}
abort_loader = false ;
2012-05-09 18:36:52 +00:00
memset ( & lc , 0 , sizeof ( lc ) ) ;
2010-03-29 02:08:34 +00:00
if ( error | | loader_error ) {
my_errno = error ? error : loader_error ;
2010-06-10 17:26:49 +00:00
if ( using_loader ) {
share - > try_table_lock = true ;
}
2010-03-29 02:08:34 +00:00
}
2010-07-15 16:18:56 +00:00
trx - > stmt_progress . using_loader = false ;
2010-04-30 14:18:43 +00:00
TOKUDB_DBUG_RETURN ( error ? error : loader_error ) ;
2010-01-11 18:14:37 +00:00
}
2010-07-16 19:39:13 +00:00
int ha_tokudb : : end_bulk_insert ( ) {
return end_bulk_insert ( false ) ;
}
2010-01-11 18:14:37 +00:00
2010-03-29 02:08:34 +00:00
int ha_tokudb : : is_index_unique ( bool * is_unique , DB_TXN * txn , DB * db , KEY * key_info ) {
int error ;
DBC * tmp_cursor1 = NULL ;
DBC * tmp_cursor2 = NULL ;
DBT key1 , key2 , val , packed_key1 , packed_key2 ;
2012-07-25 20:48:53 +00:00
uint64_t cnt = 0 ;
2010-06-17 15:56:23 +00:00
char status_msg [ MAX_ALIAS_NAME + 200 ] ; //buffer of 200 should be a good upper bound.
2010-06-16 19:50:11 +00:00
THD * thd = ha_thd ( ) ;
2012-05-09 18:36:52 +00:00
memset ( & key1 , 0 , sizeof ( key1 ) ) ;
memset ( & key2 , 0 , sizeof ( key2 ) ) ;
memset ( & val , 0 , sizeof ( val ) ) ;
memset ( & packed_key1 , 0 , sizeof ( packed_key1 ) ) ;
memset ( & packed_key2 , 0 , sizeof ( packed_key2 ) ) ;
2010-03-29 02:08:34 +00:00
* is_unique = true ;
error = db - > cursor (
db ,
txn ,
& tmp_cursor1 ,
2010-09-03 20:47:01 +00:00
DB_SERIALIZABLE
2010-03-29 02:08:34 +00:00
) ;
if ( error ) { goto cleanup ; }
error = db - > cursor (
db ,
txn ,
& tmp_cursor2 ,
2010-09-03 20:47:01 +00:00
DB_SERIALIZABLE
2010-03-29 02:08:34 +00:00
) ;
if ( error ) { goto cleanup ; }
error = tmp_cursor1 - > c_get (
tmp_cursor1 ,
& key1 ,
& val ,
DB_NEXT
) ;
if ( error = = DB_NOTFOUND ) {
* is_unique = true ;
error = 0 ;
goto cleanup ;
}
else if ( error ) { goto cleanup ; }
error = tmp_cursor2 - > c_get (
tmp_cursor2 ,
& key2 ,
& val ,
DB_NEXT
) ;
if ( error ) { goto cleanup ; }
error = tmp_cursor2 - > c_get (
tmp_cursor2 ,
& key2 ,
& val ,
DB_NEXT
) ;
if ( error = = DB_NOTFOUND ) {
* is_unique = true ;
error = 0 ;
goto cleanup ;
}
else if ( error ) { goto cleanup ; }
while ( error ! = DB_NOTFOUND ) {
bool has_null1 ;
bool has_null2 ;
int cmp ;
place_key_into_mysql_buff (
key_info ,
table - > record [ 0 ] ,
( uchar * ) key1 . data + 1
) ;
place_key_into_mysql_buff (
key_info ,
table - > record [ 1 ] ,
( uchar * ) key2 . data + 1
) ;
create_dbt_key_for_lookup (
& packed_key1 ,
key_info ,
key_buff ,
table - > record [ 0 ] ,
& has_null1
) ;
create_dbt_key_for_lookup (
& packed_key2 ,
key_info ,
key_buff2 ,
table - > record [ 1 ] ,
& has_null2
) ;
if ( ! has_null1 & & ! has_null2 ) {
cmp = tokudb_prefix_cmp_dbt_key ( db , & packed_key1 , & packed_key2 ) ;
if ( cmp = = 0 ) {
2010-05-13 21:46:12 +00:00
memcpy ( key_buff , key1 . data , key1 . size ) ;
place_key_into_mysql_buff (
key_info ,
table - > record [ 0 ] ,
( uchar * ) key_buff + 1
) ;
2010-03-29 02:08:34 +00:00
* is_unique = false ;
break ;
}
}
error = tmp_cursor1 - > c_get (
tmp_cursor1 ,
& key1 ,
& val ,
DB_NEXT
) ;
if ( error ) { goto cleanup ; }
error = tmp_cursor2 - > c_get (
tmp_cursor2 ,
& key2 ,
& val ,
DB_NEXT
) ;
if ( error & & ( error ! = DB_NOTFOUND ) ) { goto cleanup ; }
2010-06-16 19:50:11 +00:00
cnt + + ;
2010-06-17 15:56:23 +00:00
if ( ( cnt % 10000 ) = = 0 ) {
sprintf (
status_msg ,
" Verifying index uniqueness: Checked %llu of %llu rows in key-%s. " ,
2010-11-15 14:24:42 +00:00
( long long unsigned ) cnt ,
2010-06-17 15:56:23 +00:00
share - > rows ,
key_info - > name ) ;
thd_proc_info ( thd , status_msg ) ;
2010-06-16 19:50:11 +00:00
if ( thd - > killed ) {
my_error ( ER_QUERY_INTERRUPTED , MYF ( 0 ) ) ;
error = ER_QUERY_INTERRUPTED ;
goto cleanup ;
}
}
2010-03-29 02:08:34 +00:00
}
error = 0 ;
cleanup :
if ( tmp_cursor1 ) {
tmp_cursor1 - > c_close ( tmp_cursor1 ) ;
tmp_cursor1 = NULL ;
}
if ( tmp_cursor2 ) {
tmp_cursor2 - > c_close ( tmp_cursor2 ) ;
tmp_cursor2 = NULL ;
}
return error ;
}
2010-01-11 18:14:37 +00:00
int ha_tokudb : : is_val_unique ( bool * is_unique , uchar * record , KEY * key_info , uint dict_index , DB_TXN * txn ) {
DBT key ;
int error = 0 ;
bool has_null ;
DBC * tmp_cursor = NULL ;
struct index_read_info ir_info ;
struct smart_dbt_info info ;
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & key , 0 , sizeof ( key ) ) ;
2010-01-11 18:14:37 +00:00
info . ha = this ;
info . buf = NULL ;
info . keynr = dict_index ;
ir_info . smart_dbt_info = info ;
create_dbt_key_for_lookup (
& key ,
key_info ,
key_buff3 ,
record ,
& has_null
) ;
ir_info . orig_key = & key ;
if ( has_null ) {
error = 0 ;
* is_unique = true ;
goto cleanup ;
}
error = share - > key_file [ dict_index ] - > cursor (
share - > key_file [ dict_index ] ,
txn ,
& tmp_cursor ,
2010-09-03 20:47:01 +00:00
DB_SERIALIZABLE
2010-01-11 18:14:37 +00:00
) ;
if ( error ) { goto cleanup ; }
error = tmp_cursor - > c_getf_set_range (
tmp_cursor ,
0 ,
& key ,
smart_dbt_callback_lookup ,
& ir_info
) ;
if ( error = = DB_NOTFOUND ) {
* is_unique = true ;
error = 0 ;
goto cleanup ;
}
else if ( error ) {
goto cleanup ;
}
if ( ir_info . cmp ) {
* is_unique = true ;
}
else {
* is_unique = false ;
}
error = 0 ;
cleanup :
if ( tmp_cursor ) {
int r = tmp_cursor - > c_close ( tmp_cursor ) ;
assert ( r = = 0 ) ;
tmp_cursor = NULL ;
}
return error ;
}
int ha_tokudb : : do_uniqueness_checks ( uchar * record , DB_TXN * txn , THD * thd ) {
int error ;
//
// first do uniqueness checks
//
if ( share - > has_unique_keys & & ! thd_test_options ( thd , OPTION_RELAXED_UNIQUE_CHECKS ) ) {
for ( uint keynr = 0 ; keynr < table_share - > keys ; keynr + + ) {
bool is_unique_key = table - > key_info [ keynr ] . flags & HA_NOSAME ;
bool is_unique = false ;
2010-02-25 17:18:53 +00:00
//
// don't need to do check for primary key
//
if ( keynr = = primary_key ) {
continue ;
}
2010-01-11 18:14:37 +00:00
if ( ! is_unique_key ) {
continue ;
}
//
// if unique key, check uniqueness constraint
// but, we do not need to check it if the key has a null
// and we do not need to check it if unique_checks is off
//
error = is_val_unique ( & is_unique , record , & table - > key_info [ keynr ] , keynr , txn ) ;
if ( error ) { goto cleanup ; }
if ( ! is_unique ) {
error = DB_KEYEXIST ;
last_dup_key = keynr ;
goto cleanup ;
}
}
}
error = 0 ;
cleanup :
return error ;
}
2010-05-22 14:32:25 +00:00
void ha_tokudb : : test_row_packing ( uchar * record , DBT * pk_key , DBT * pk_val ) {
2010-01-11 18:14:37 +00:00
int error ;
DBT row , key ;
//
// variables for testing key packing, only used in some debug modes
//
uchar * tmp_pk_key_data = NULL ;
uchar * tmp_pk_val_data = NULL ;
DBT tmp_pk_key ;
DBT tmp_pk_val ;
bool has_null ;
2010-05-22 20:46:13 +00:00
int cmp ;
2010-01-11 18:14:37 +00:00
2012-05-09 18:36:52 +00:00
memset ( & tmp_pk_key , 0 , sizeof ( DBT ) ) ;
memset ( & tmp_pk_val , 0 , sizeof ( DBT ) ) ;
2010-01-11 18:14:37 +00:00
//
//use for testing the packing of keys
//
tmp_pk_key_data = ( uchar * ) my_malloc ( pk_key - > size , MYF ( MY_WME ) ) ;
assert ( tmp_pk_key_data ) ;
tmp_pk_val_data = ( uchar * ) my_malloc ( pk_val - > size , MYF ( MY_WME ) ) ;
assert ( tmp_pk_val_data ) ;
memcpy ( tmp_pk_key_data , pk_key - > data , pk_key - > size ) ;
memcpy ( tmp_pk_val_data , pk_val - > data , pk_val - > size ) ;
tmp_pk_key . data = tmp_pk_key_data ;
tmp_pk_key . size = pk_key - > size ;
tmp_pk_val . data = tmp_pk_val_data ;
tmp_pk_val . size = pk_val - > size ;
for ( uint keynr = 0 ; keynr < table_share - > keys ; keynr + + ) {
2012-07-25 20:48:53 +00:00
uint32_t tmp_num_bytes = 0 ;
2010-01-11 18:14:37 +00:00
uchar * row_desc = NULL ;
2012-07-25 20:48:53 +00:00
uint32_t desc_size = 0 ;
2010-01-11 18:14:37 +00:00
if ( keynr = = primary_key ) {
continue ;
}
2011-09-08 02:55:20 +00:00
create_dbt_key_from_table ( & key , keynr , key_buff2 , record , & has_null ) ;
2010-01-11 18:14:37 +00:00
//
// TEST
//
2010-05-28 21:08:32 +00:00
row_desc = ( uchar * ) share - > key_file [ keynr ] - > descriptor - > dbt . data ;
2012-07-25 20:48:53 +00:00
row_desc + = ( * ( uint32_t * ) row_desc ) ;
desc_size = ( * ( uint32_t * ) row_desc ) - 4 ;
2010-01-11 18:14:37 +00:00
row_desc + = 4 ;
tmp_num_bytes = pack_key_from_desc (
key_buff3 ,
row_desc ,
desc_size ,
& tmp_pk_key ,
& tmp_pk_val
) ;
assert ( tmp_num_bytes = = key . size ) ;
2011-09-08 02:55:20 +00:00
cmp = memcmp ( key_buff3 , key_buff2 , tmp_num_bytes ) ;
2010-01-11 18:14:37 +00:00
assert ( cmp = = 0 ) ;
//
// test key packing of clustering keys
//
if ( table - > key_info [ keynr ] . flags & HA_CLUSTERING ) {
2010-01-21 19:24:11 +00:00
error = pack_row ( & row , ( const uchar * ) record , keynr ) ;
2010-05-22 14:32:25 +00:00
assert ( error = = 0 ) ;
2010-01-11 18:14:37 +00:00
uchar * tmp_buff = NULL ;
tmp_buff = ( uchar * ) my_malloc ( alloced_rec_buff_length , MYF ( MY_WME ) ) ;
assert ( tmp_buff ) ;
2010-05-28 21:08:32 +00:00
row_desc = ( uchar * ) share - > key_file [ keynr ] - > descriptor - > dbt . data ;
2012-07-25 20:48:53 +00:00
row_desc + = ( * ( uint32_t * ) row_desc ) ;
row_desc + = ( * ( uint32_t * ) row_desc ) ;
desc_size = ( * ( uint32_t * ) row_desc ) - 4 ;
2010-01-11 18:14:37 +00:00
row_desc + = 4 ;
tmp_num_bytes = pack_clustering_val_from_desc (
tmp_buff ,
row_desc ,
desc_size ,
& tmp_pk_val
) ;
assert ( tmp_num_bytes = = row . size ) ;
2010-01-21 19:24:11 +00:00
cmp = memcmp ( tmp_buff , rec_buff , tmp_num_bytes ) ;
2010-01-11 18:14:37 +00:00
assert ( cmp = = 0 ) ;
my_free ( tmp_buff , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
}
}
2010-05-22 14:32:25 +00:00
//
// copy stuff back out
//
error = pack_row ( pk_val , ( const uchar * ) record , primary_key ) ;
2010-05-22 20:46:13 +00:00
assert ( pk_val - > size = = tmp_pk_val . size ) ;
cmp = memcmp ( pk_val - > data , tmp_pk_val_data , pk_val - > size ) ;
assert ( cmp = = 0 ) ;
2010-05-22 14:32:25 +00:00
2010-01-11 18:14:37 +00:00
my_free ( tmp_pk_key_data , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
my_free ( tmp_pk_val_data , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
}
2010-05-06 04:19:11 +00:00
//
// set the put flags for the main dictionary
//
2010-12-09 20:24:59 +00:00
void ha_tokudb : : set_main_dict_put_flags (
THD * thd ,
2012-01-08 22:08:12 +00:00
bool opt_eligible ,
2012-07-25 20:48:53 +00:00
uint32_t * put_flags
2010-12-09 20:24:59 +00:00
)
{
2012-07-25 20:48:53 +00:00
uint32_t old_prelock_flags = 0 ;
2011-04-27 17:01:36 +00:00
uint curr_num_DBs = table - > s - > keys + test ( hidden_primary_key ) ;
bool in_hot_index = share - > num_DBs > curr_num_DBs ;
2011-12-24 04:54:30 +00:00
bool using_ignore_flag_opt = do_ignore_flag_optimization (
thd , table , share - > replace_into_fast ) ;
2010-01-11 18:14:37 +00:00
//
2010-03-05 20:21:08 +00:00
// optimization for "REPLACE INTO..." (and "INSERT IGNORE") command
2010-01-11 18:14:37 +00:00
// if the command is "REPLACE INTO" and the only table
2010-05-06 04:19:11 +00:00
// is the main table (or all indexes are a subset of the pk),
// then we can simply insert the element
2010-01-11 18:14:37 +00:00
// with DB_YESOVERWRITE. If the element does not exist,
// it will act as a normal insert, and if it does exist, it
// will act as a replace, which is exactly what REPLACE INTO is supposed
2010-05-06 04:19:11 +00:00
// to do. We cannot do this if otherwise, because then we lose
2010-01-11 18:14:37 +00:00
// consistency between indexes
//
2011-12-24 04:54:30 +00:00
if ( hidden_primary_key )
{
2011-06-06 21:08:45 +00:00
* put_flags = old_prelock_flags ;
2010-05-06 04:19:11 +00:00
}
2011-12-24 04:54:30 +00:00
else if ( thd_test_options ( thd , OPTION_RELAXED_UNIQUE_CHECKS )
& & ! is_replace_into ( thd ) & & ! is_insert_ignore ( thd ) )
2010-03-05 20:21:08 +00:00
{
2011-06-06 21:08:45 +00:00
* put_flags = old_prelock_flags ;
2010-02-25 17:18:53 +00:00
}
2011-12-24 04:54:30 +00:00
else if ( using_ignore_flag_opt & & is_replace_into ( thd )
& & ! in_hot_index )
2010-05-06 04:19:11 +00:00
{
2011-06-06 21:08:45 +00:00
* put_flags = old_prelock_flags ;
2010-03-05 20:21:08 +00:00
}
2012-01-08 22:08:12 +00:00
else if ( opt_eligible & & using_ignore_flag_opt & & is_insert_ignore ( thd )
2011-12-24 04:54:30 +00:00
& & ! in_hot_index )
2010-05-06 04:19:11 +00:00
{
2011-12-24 04:54:30 +00:00
* put_flags = DB_NOOVERWRITE_NO_ERROR | old_prelock_flags ;
2010-05-06 04:19:11 +00:00
}
else
{
2011-12-24 04:54:30 +00:00
* put_flags = DB_NOOVERWRITE | old_prelock_flags ;
2010-02-25 17:18:53 +00:00
}
2010-05-06 04:19:11 +00:00
}
int ha_tokudb : : insert_row_to_main_dictionary ( uchar * record , DBT * pk_key , DBT * pk_val , DB_TXN * txn ) {
int error = 0 ;
2012-07-25 20:48:53 +00:00
uint32_t put_flags = mult_put_flags [ primary_key ] ;
2010-05-06 04:19:11 +00:00
THD * thd = ha_thd ( ) ;
uint curr_num_DBs = table - > s - > keys + test ( hidden_primary_key ) ;
assert ( curr_num_DBs = = 1 ) ;
2012-01-08 22:08:12 +00:00
set_main_dict_put_flags ( thd , true , & put_flags ) ;
2010-01-11 18:14:37 +00:00
2011-10-05 21:55:09 +00:00
error = share - > file - > put (
share - > file ,
txn ,
pk_key ,
pk_val ,
put_flags
) ;
2010-01-11 18:14:37 +00:00
if ( error ) {
last_dup_key = primary_key ;
goto cleanup ;
}
cleanup :
2009-07-10 20:01:20 +00:00
return error ;
}
2010-01-21 19:24:11 +00:00
int ha_tokudb : : insert_rows_to_dictionaries_mult ( DBT * pk_key , DBT * pk_val , DB_TXN * txn , THD * thd ) {
2010-03-25 13:30:54 +00:00
int error = 0 ;
2011-01-03 16:11:07 +00:00
uint curr_num_DBs = share - > num_DBs ;
2012-01-08 22:08:12 +00:00
set_main_dict_put_flags ( thd , true , & mult_put_flags [ primary_key ] ) ;
2011-12-24 04:54:30 +00:00
uint32_t i , flags = mult_put_flags [ primary_key ] ;
// the insert ignore optimization uses DB_NOOVERWRITE_NO_ERROR,
// which is not allowed with env->put_multiple.
// we have to insert the rows one by one in this case.
if ( flags & DB_NOOVERWRITE_NO_ERROR ) {
DB * src_db = share - > key_file [ primary_key ] ;
for ( i = 0 ; i < curr_num_DBs ; i + + ) {
DB * db = share - > key_file [ i ] ;
if ( i = = primary_key ) {
// if it's the primary key, insert the rows
// as they are.
error = db - > put ( db , txn , pk_key , pk_val , flags ) ;
} else {
// generate a row for secondary keys.
// use our multi put key/rec buffers
// just as the ydb layer would have in
// env->put_multiple(), except that
// we will just do a put() right away.
error = tokudb_generate_row ( db , src_db ,
& mult_key_dbt [ i ] , & mult_rec_dbt [ i ] ,
pk_key , pk_val ) ;
if ( error ! = 0 ) {
goto out ;
}
error = db - > put ( db , txn , & mult_key_dbt [ i ] ,
& mult_rec_dbt [ i ] , flags ) ;
}
if ( error ! = 0 ) {
goto out ;
}
}
} else {
// not insert ignore, so we can use put multiple
error = db_env - > put_multiple (
db_env ,
share - > key_file [ primary_key ] ,
txn ,
pk_key ,
pk_val ,
curr_num_DBs ,
share - > key_file ,
mult_key_dbt ,
mult_rec_dbt ,
mult_put_flags
) ;
}
2009-11-25 21:00:52 +00:00
2011-12-24 04:54:30 +00:00
out :
2010-01-11 18:14:37 +00:00
//
// We break if we hit an error, unless it is a dup key error
// and MySQL told us to ignore duplicate key errors
//
if ( error ) {
last_dup_key = primary_key ;
2009-11-25 21:00:52 +00:00
}
return error ;
}
2010-01-11 18:14:37 +00:00
2012-03-19 12:15:50 +00:00
volatile int ha_tokudb_write_row_wait = 0 ; // debug
2008-04-17 20:56:40 +00:00
//
// Stores a row in the table, called when handling an INSERT query
// Parameters:
// [in] record - a row in MySQL format
// Returns:
// 0 on success
// error otherwise
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : write_row ( uchar * record ) {
2008-04-17 11:12:01 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::write_row " ) ;
2012-03-19 12:15:50 +00:00
while ( ha_tokudb_write_row_wait ) sleep ( 1 ) ; // debug
2010-01-11 18:14:37 +00:00
DBT row , prim_key ;
2008-02-07 20:19:44 +00:00
int error ;
2009-09-28 19:08:52 +00:00
THD * thd = ha_thd ( ) ;
2008-08-10 16:39:16 +00:00
bool has_null ;
2008-08-10 17:46:23 +00:00
DB_TXN * sub_trans = NULL ;
DB_TXN * txn = NULL ;
2009-04-13 21:23:37 +00:00
tokudb_trx_data * trx = NULL ;
2010-11-17 23:09:06 +00:00
uint curr_num_DBs ;
2010-02-12 22:37:55 +00:00
bool create_sub_trans = false ;
2008-02-07 20:19:44 +00:00
2008-08-08 19:20:52 +00:00
//
// some crap that needs to be done because MySQL does not properly abstract
// this work away from us, namely filling in auto increment and setting auto timestamp
//
2013-02-15 18:25:37 +00:00
ha_statistic_increment ( & SSV : : ha_write_count ) ;
2012-05-09 18:36:52 +00:00
# if MYSQL_VERSION_ID < 50600
2008-05-12 14:27:43 +00:00
if ( table - > timestamp_field_type & TIMESTAMP_AUTO_SET_ON_INSERT ) {
2008-02-07 20:19:44 +00:00
table - > timestamp_field - > set_time ( ) ;
2008-05-12 14:27:43 +00:00
}
2012-05-09 18:36:52 +00:00
# endif
2008-05-12 14:27:43 +00:00
if ( table - > next_number_field & & record = = table - > record [ 0 ] ) {
2012-12-09 18:54:32 +00:00
error = update_auto_increment ( ) ;
if ( error )
goto cleanup ;
2008-05-12 14:27:43 +00:00
}
2008-08-18 18:35:32 +00:00
//
// check to see if some value for the auto increment column that is bigger
// than anything else til now is being used. If so, update the metadata to reflect it
// the goal here is we never want to have a dup key error due to a bad increment
// of the auto inc field.
//
if ( share - > has_auto_inc & & record = = table - > record [ 0 ] ) {
pthread_mutex_lock ( & share - > mutex ) ;
ulonglong curr_auto_inc = retrieve_auto_increment (
table - > field [ share - > ai_field_index ] - > key_type ( ) ,
2008-11-18 22:20:06 +00:00
field_offset ( table - > field [ share - > ai_field_index ] , table ) ,
2008-08-18 18:35:32 +00:00
record
) ;
if ( curr_auto_inc > share - > last_auto_increment ) {
2009-07-10 20:01:20 +00:00
share - > last_auto_increment = curr_auto_inc ;
2009-07-27 14:52:30 +00:00
if ( delay_updating_ai_metadata ) {
ai_metadata_update_required = true ;
2008-08-18 18:35:32 +00:00
}
2009-07-10 20:01:20 +00:00
else {
update_max_auto_inc ( share - > status_block , share - > last_auto_increment ) ;
}
2012-11-27 15:23:21 +00:00
}
2008-08-18 18:35:32 +00:00
pthread_mutex_unlock ( & share - > mutex ) ;
}
2010-11-17 23:09:06 +00:00
//
// grab reader lock on numDBs_lock
//
2010-12-09 20:24:59 +00:00
if ( ! num_DBs_locked_in_bulk ) {
rw_rdlock ( & share - > num_DBs_lock ) ;
}
else {
lock_count + + ;
if ( lock_count > = 2000 ) {
rw_unlock ( & share - > num_DBs_lock ) ;
rw_rdlock ( & share - > num_DBs_lock ) ;
lock_count = 0 ;
}
}
2010-11-17 23:09:06 +00:00
curr_num_DBs = share - > num_DBs ;
2008-05-12 14:27:43 +00:00
if ( hidden_primary_key ) {
get_auto_primary_key ( current_ident ) ;
}
2008-02-07 20:19:44 +00:00
2010-01-11 18:14:37 +00:00
if ( table_share - > blob_fields ) {
if ( fix_rec_buff_for_blob ( max_row_length ( record ) ) ) {
error = HA_ERR_OUT_OF_MEM ;
2008-08-10 17:46:23 +00:00
goto cleanup ;
}
}
2010-01-11 18:14:37 +00:00
2010-01-21 19:24:11 +00:00
create_dbt_key_from_table ( & prim_key , primary_key , primary_key_buff , record , & has_null ) ;
if ( ( error = pack_row ( & row , ( const uchar * ) record , primary_key ) ) ) {
2010-01-11 18:14:37 +00:00
goto cleanup ;
2009-04-13 21:23:37 +00:00
}
2010-05-10 14:06:01 +00:00
create_sub_trans = ( using_ignore & & ! ( do_ignore_flag_optimization ( thd , table , share - > replace_into_fast ) ) ) ;
2010-02-12 22:37:55 +00:00
if ( create_sub_trans ) {
2010-01-11 18:15:50 +00:00
error = db_env - > txn_begin ( db_env , transaction , & sub_trans , DB_INHERIT_ISOLATION ) ;
2010-01-11 18:14:37 +00:00
if ( error ) {
goto cleanup ;
}
2008-08-08 19:20:52 +00:00
}
2008-11-03 20:42:59 +00:00
2012-06-02 13:20:58 +00:00
txn = create_sub_trans ? sub_trans : transaction ;
2010-01-11 18:14:37 +00:00
if ( tokudb_debug & TOKUDB_DEBUG_CHECK_KEY ) {
2010-05-22 14:32:25 +00:00
test_row_packing ( record , & prim_key , & row ) ;
2010-01-11 18:14:37 +00:00
}
2009-11-25 21:00:52 +00:00
2010-03-29 02:08:34 +00:00
if ( loader ) {
error = loader - > put ( loader , & prim_key , & row ) ;
if ( error ) {
abort_loader = true ;
goto cleanup ;
}
2010-01-11 18:14:37 +00:00
}
else {
2010-03-29 02:08:34 +00:00
if ( curr_num_DBs = = 1 ) {
error = insert_row_to_main_dictionary ( record , & prim_key , & row , txn ) ;
if ( error ) { goto cleanup ; }
}
else {
error = do_uniqueness_checks ( record , txn , thd ) ;
2012-03-27 04:38:26 +00:00
if ( error ) {
// for #4633
// if we have a duplicate key error, let's check the primary key to see
// if there is a duplicate there. If so, set last_dup_key to the pk
if ( error = = DB_KEYEXIST & & ! test ( hidden_primary_key ) ) {
int r = share - > file - > getf_set (
share - > file ,
txn ,
0 ,
& prim_key ,
smart_dbt_do_nothing ,
NULL
) ;
if ( r = = 0 ) {
// if we get no error, that means the row
// was found and this is a duplicate key,
// so we set last_dup_key
last_dup_key = primary_key ;
}
else if ( r ! = DB_NOTFOUND ) {
// if some other error is returned, return that to the user.
error = r ;
}
}
goto cleanup ;
}
2010-02-25 17:18:53 +00:00
2010-03-29 02:08:34 +00:00
error = insert_rows_to_dictionaries_mult ( & prim_key , & row , txn , thd ) ;
if ( error ) { goto cleanup ; }
}
2012-11-30 01:55:42 +00:00
if ( error = = 0 ) {
uint64_t full_row_size = prim_key . size + row . size ;
toku_hton_update_primary_key_bytes_inserted ( full_row_size ) ;
}
2008-02-05 16:00:53 +00:00
}
2008-08-08 19:20:52 +00:00
2010-01-11 18:14:37 +00:00
trx = ( tokudb_trx_data * ) thd_data_get ( thd , tokudb_hton - > slot ) ;
2008-08-08 19:20:52 +00:00
if ( ! error ) {
added_rows + + ;
2009-09-28 19:08:52 +00:00
trx - > stmt_progress . inserted + + ;
track_progress ( thd ) ;
2008-08-08 19:20:52 +00:00
}
cleanup :
2010-12-09 20:24:59 +00:00
if ( ! num_DBs_locked_in_bulk ) {
rw_unlock ( & share - > num_DBs_lock ) ;
}
2008-07-03 16:38:38 +00:00
if ( error = = DB_KEYEXIST ) {
2008-02-07 20:19:44 +00:00
error = HA_ERR_FOUND_DUPP_KEY ;
2008-07-03 16:38:38 +00:00
}
2008-08-10 17:46:23 +00:00
if ( sub_trans ) {
// no point in recording error value of abort.
// nothing we can do about it anyway and it is not what
// we want to return.
if ( error ) {
2009-11-10 19:22:08 +00:00
abort_txn ( sub_trans ) ;
2008-08-10 17:46:23 +00:00
}
else {
2009-11-10 19:22:08 +00:00
commit_txn ( sub_trans , DB_TXN_NOSYNC ) ;
2008-08-10 17:46:23 +00:00
}
}
2008-03-21 23:47:22 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-07 20:19:44 +00:00
}
/* Compare if a key in a row has changed */
2012-03-28 15:29:11 +00:00
bool ha_tokudb : : key_changed ( uint keynr , const uchar * old_row , const uchar * new_row ) {
DBT old_key ;
DBT new_key ;
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & old_key , 0 , sizeof ( old_key ) ) ;
memset ( ( void * ) & new_key , 0 , sizeof ( new_key ) ) ;
2008-02-07 20:19:44 +00:00
2012-03-28 15:29:11 +00:00
bool has_null ;
create_dbt_key_from_table ( & new_key , keynr , key_buff2 , new_row , & has_null ) ;
create_dbt_key_for_lookup ( & old_key , & table - > key_info [ keynr ] , key_buff3 , old_row , & has_null ) ;
return tokudb_prefix_cmp_dbt_key ( share - > key_file [ keynr ] , & old_key , & new_key ) ;
2008-02-05 16:00:53 +00:00
}
2008-04-17 20:56:40 +00:00
//
// Updates a row in the table, called when handling an UPDATE query
// Parameters:
// [in] old_row - row to be updated, in MySQL format
// [in] new_row - new row, in MySQL format
// Returns:
// 0 on success
// error otherwise
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : update_row ( const uchar * old_row , uchar * new_row ) {
2008-03-26 02:47:07 +00:00
TOKUDB_DBUG_ENTER ( " update_row " ) ;
2010-11-10 21:34:29 +00:00
DBT prim_key , old_prim_key , prim_row , old_prim_row ;
2008-02-07 20:19:44 +00:00
int error ;
2008-08-10 16:39:16 +00:00
bool has_null ;
THD * thd = ha_thd ( ) ;
2008-08-10 17:46:23 +00:00
DB_TXN * sub_trans = NULL ;
DB_TXN * txn = NULL ;
2010-01-24 00:38:17 +00:00
tokudb_trx_data * trx = ( tokudb_trx_data * ) thd_data_get ( thd , tokudb_hton - > slot ) ;
2010-11-17 23:09:06 +00:00
uint curr_num_DBs ;
2008-02-07 20:19:44 +00:00
LINT_INIT ( error ) ;
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & prim_key , 0 , sizeof ( prim_key ) ) ;
memset ( ( void * ) & old_prim_key , 0 , sizeof ( old_prim_key ) ) ;
memset ( ( void * ) & prim_row , 0 , sizeof ( prim_row ) ) ;
memset ( ( void * ) & old_prim_row , 0 , sizeof ( old_prim_row ) ) ;
2010-01-24 00:38:17 +00:00
2013-02-15 18:25:37 +00:00
ha_statistic_increment ( & SSV : : ha_update_count ) ;
2012-05-09 18:36:52 +00:00
# if MYSQL_VERSION_ID < 50600
2008-08-08 19:20:52 +00:00
if ( table - > timestamp_field_type & TIMESTAMP_AUTO_SET_ON_UPDATE ) {
2008-02-07 20:19:44 +00:00
table - > timestamp_field - > set_time ( ) ;
2008-08-08 19:20:52 +00:00
}
2012-05-09 18:36:52 +00:00
# endif
2008-08-18 18:35:32 +00:00
//
// check to see if some value for the auto increment column that is bigger
// than anything else til now is being used. If so, update the metadata to reflect it
// the goal here is we never want to have a dup key error due to a bad increment
// of the auto inc field.
//
if ( share - > has_auto_inc & & new_row = = table - > record [ 0 ] ) {
pthread_mutex_lock ( & share - > mutex ) ;
ulonglong curr_auto_inc = retrieve_auto_increment (
table - > field [ share - > ai_field_index ] - > key_type ( ) ,
2008-11-18 22:20:06 +00:00
field_offset ( table - > field [ share - > ai_field_index ] , table ) ,
2008-08-18 18:35:32 +00:00
new_row
) ;
if ( curr_auto_inc > share - > last_auto_increment ) {
error = update_max_auto_inc ( share - > status_block , curr_auto_inc ) ;
if ( ! error ) {
share - > last_auto_increment = curr_auto_inc ;
}
}
pthread_mutex_unlock ( & share - > mutex ) ;
}
2010-11-17 23:09:06 +00:00
//
// grab reader lock on numDBs_lock
//
rw_rdlock ( & share - > num_DBs_lock ) ;
curr_num_DBs = share - > num_DBs ;
2010-01-24 00:38:17 +00:00
if ( using_ignore ) {
error = db_env - > txn_begin ( db_env , transaction , & sub_trans , DB_INHERIT_ISOLATION ) ;
if ( error ) {
goto cleanup ;
}
2010-02-12 21:50:47 +00:00
}
2010-01-24 00:38:17 +00:00
txn = using_ignore ? sub_trans : transaction ;
2008-08-18 18:35:32 +00:00
2008-02-07 20:19:44 +00:00
if ( hidden_primary_key ) {
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & prim_key , 0 , sizeof ( prim_key ) ) ;
2008-02-07 20:19:44 +00:00
prim_key . data = ( void * ) current_ident ;
prim_key . size = TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH ;
old_prim_key = prim_key ;
2008-08-08 19:20:52 +00:00
}
else {
2008-08-10 16:39:16 +00:00
create_dbt_key_from_table ( & prim_key , primary_key , key_buff , new_row , & has_null ) ;
2012-03-29 15:03:22 +00:00
create_dbt_key_from_table ( & old_prim_key , primary_key , primary_key_buff , old_row , & has_null ) ;
2008-02-07 20:19:44 +00:00
}
2010-11-10 21:34:29 +00:00
//
// do uniqueness checks
//
if ( share - > has_unique_keys & & ! thd_test_options ( thd , OPTION_RELAXED_UNIQUE_CHECKS ) ) {
for ( uint keynr = 0 ; keynr < table_share - > keys ; keynr + + ) {
2009-11-25 21:00:52 +00:00
bool is_unique_key = table - > key_info [ keynr ] . flags & HA_NOSAME ;
2010-11-10 21:34:29 +00:00
if ( keynr = = primary_key ) {
continue ;
2008-08-08 19:20:52 +00:00
}
2010-11-10 21:34:29 +00:00
if ( is_unique_key ) {
2012-03-28 15:29:11 +00:00
bool key_ch = key_changed ( keynr , old_row , new_row ) ;
if ( key_ch ) {
2010-11-10 21:34:29 +00:00
bool is_unique ;
error = is_val_unique ( & is_unique , new_row , & table - > key_info [ keynr ] , keynr , txn ) ;
if ( error ) goto cleanup ;
if ( ! is_unique ) {
error = DB_KEYEXIST ;
last_dup_key = keynr ;
goto cleanup ;
}
2009-11-25 21:00:52 +00:00
}
2008-08-10 16:39:16 +00:00
}
2010-11-10 21:34:29 +00:00
}
}
if ( table_share - > blob_fields ) {
if ( fix_rec_buff_for_blob ( max_row_length ( new_row ) ) ) {
error = HA_ERR_OUT_OF_MEM ;
goto cleanup ;
}
if ( fix_rec_update_buff_for_blob ( max_row_length ( old_row ) ) ) {
error = HA_ERR_OUT_OF_MEM ;
goto cleanup ;
2008-02-07 20:19:44 +00:00
}
}
2008-08-18 18:35:32 +00:00
2010-11-10 21:34:29 +00:00
error = pack_row ( & prim_row , new_row , primary_key ) ;
if ( error ) { goto cleanup ; }
error = pack_old_row_for_update ( & old_prim_row , old_row , primary_key ) ;
if ( error ) { goto cleanup ; }
2012-01-08 22:08:12 +00:00
set_main_dict_put_flags ( thd , false , & mult_put_flags [ primary_key ] ) ;
2011-10-05 21:55:09 +00:00
error = db_env - > update_multiple (
db_env ,
share - > key_file [ primary_key ] ,
txn ,
& old_prim_key ,
& old_prim_row ,
& prim_key ,
& prim_row ,
curr_num_DBs ,
share - > key_file ,
mult_put_flags ,
2 * curr_num_DBs ,
mult_key_dbt ,
curr_num_DBs ,
mult_rec_dbt
) ;
2010-02-25 22:23:04 +00:00
if ( error = = DB_KEYEXIST ) {
last_dup_key = primary_key ;
}
else if ( ! error ) {
2009-09-28 19:08:52 +00:00
trx - > stmt_progress . updated + + ;
track_progress ( thd ) ;
2009-01-20 21:06:49 +00:00
}
2008-08-18 18:35:32 +00:00
2008-08-08 19:20:52 +00:00
cleanup :
2010-11-17 23:09:06 +00:00
rw_unlock ( & share - > num_DBs_lock ) ;
2008-08-08 19:20:52 +00:00
if ( error = = DB_KEYEXIST ) {
2008-02-07 20:19:44 +00:00
error = HA_ERR_FOUND_DUPP_KEY ;
2008-08-08 19:20:52 +00:00
}
2008-08-10 17:46:23 +00:00
if ( sub_trans ) {
// no point in recording error value of abort.
// nothing we can do about it anyway and it is not what
// we want to return.
if ( error ) {
2009-11-10 19:22:08 +00:00
abort_txn ( sub_trans ) ;
2008-08-10 17:46:23 +00:00
}
else {
2009-11-10 19:22:08 +00:00
commit_txn ( sub_trans , DB_TXN_NOSYNC ) ;
2008-08-10 17:46:23 +00:00
}
}
2008-03-21 23:47:22 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-05 16:00:53 +00:00
}
2008-04-17 20:56:40 +00:00
//
2008-05-08 15:50:34 +00:00
// Deletes a row in the table, called when handling a DELETE query
2008-04-17 20:56:40 +00:00
// Parameters:
// [in] record - row to be deleted, in MySQL format
// Returns:
// 0 on success
// error otherwise
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : delete_row ( const uchar * record ) {
2008-04-04 21:09:51 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::delete_row " ) ;
2008-05-08 16:01:22 +00:00
int error = ENOSYS ;
2010-11-04 18:51:18 +00:00
DBT row , prim_key ;
2008-08-10 16:39:16 +00:00
bool has_null ;
2009-01-20 21:06:49 +00:00
THD * thd = ha_thd ( ) ;
2010-11-17 23:09:06 +00:00
uint curr_num_DBs ;
2009-09-28 19:08:52 +00:00
tokudb_trx_data * trx = ( tokudb_trx_data * ) thd_data_get ( thd , tokudb_hton - > slot ) ; ;
2009-04-20 18:52:14 +00:00
2013-02-15 18:25:37 +00:00
ha_statistic_increment ( & SSV : : ha_delete_count ) ;
2008-02-07 20:19:44 +00:00
2010-11-17 23:09:06 +00:00
//
// grab reader lock on numDBs_lock
//
rw_rdlock ( & share - > num_DBs_lock ) ;
curr_num_DBs = share - > num_DBs ;
2008-08-10 16:39:16 +00:00
create_dbt_key_from_table ( & prim_key , primary_key , key_buff , record , & has_null ) ;
2010-11-04 18:51:18 +00:00
if ( table_share - > blob_fields ) {
if ( fix_rec_buff_for_blob ( max_row_length ( record ) ) ) {
error = HA_ERR_OUT_OF_MEM ;
goto cleanup ;
}
2008-08-08 19:20:52 +00:00
}
2010-11-04 18:51:18 +00:00
if ( ( error = pack_row ( & row , ( const uchar * ) record , primary_key ) ) ) {
goto cleanup ;
}
2011-10-05 21:55:09 +00:00
error = db_env - > del_multiple (
db_env ,
share - > key_file [ primary_key ] ,
transaction ,
& prim_key ,
& row ,
curr_num_DBs ,
share - > key_file ,
mult_key_dbt ,
mult_del_flags
) ;
2010-11-04 18:51:18 +00:00
2008-08-08 19:20:52 +00:00
if ( error ) {
DBUG_PRINT ( " error " , ( " Got error %d " , error ) ) ;
2008-02-05 16:00:53 +00:00
}
2008-08-08 19:20:52 +00:00
else {
2008-07-08 01:59:46 +00:00
deleted_rows + + ;
2009-09-28 19:08:52 +00:00
trx - > stmt_progress . deleted + + ;
track_progress ( thd ) ;
2008-07-08 01:59:46 +00:00
}
2010-11-04 18:51:18 +00:00
cleanup :
2010-11-17 23:09:06 +00:00
rw_unlock ( & share - > num_DBs_lock ) ;
2008-03-21 23:47:22 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-05 16:00:53 +00:00
}
2009-04-17 18:29:25 +00:00
//
// takes as input table->read_set and table->write_set
// and puts list of field indexes that need to be read in
// unpack_row in the member variables fixed_cols_for_query
// and var_cols_for_query
//
void ha_tokudb : : set_query_columns ( uint keynr ) {
2012-07-25 20:48:53 +00:00
uint32_t curr_fixed_col_index = 0 ;
uint32_t curr_var_col_index = 0 ;
2009-04-17 18:29:25 +00:00
read_key = false ;
read_blobs = false ;
//
// i know this is probably confusing and will need to be explained better
//
uint key_index = 0 ;
2009-04-21 15:13:09 +00:00
if ( keynr = = primary_key | | keynr = = MAX_KEY ) {
2009-04-17 18:29:25 +00:00
key_index = primary_key ;
}
else {
key_index = ( table - > key_info [ keynr ] . flags & HA_CLUSTERING ? keynr : primary_key ) ;
}
for ( uint i = 0 ; i < table_share - > fields ; i + + ) {
if ( bitmap_is_set ( table - > read_set , i ) | |
bitmap_is_set ( table - > write_set , i )
)
{
2010-01-11 18:14:37 +00:00
if ( bitmap_is_set ( & share - > kc_info . key_filters [ key_index ] , i ) ) {
2009-04-17 18:29:25 +00:00
read_key = true ;
}
else {
//
// if fixed field length
//
2010-01-11 18:14:37 +00:00
if ( share - > kc_info . field_lengths [ i ] ! = 0 ) {
2009-04-17 18:29:25 +00:00
//
// save the offset into the list
//
fixed_cols_for_query [ curr_fixed_col_index ] = i ;
curr_fixed_col_index + + ;
}
//
// varchar or varbinary
//
2010-01-11 18:14:37 +00:00
else if ( share - > kc_info . length_bytes [ i ] ! = 0 ) {
2009-04-17 18:29:25 +00:00
var_cols_for_query [ curr_var_col_index ] = i ;
curr_var_col_index + + ;
}
//
// it is a blob
//
else {
read_blobs = true ;
}
}
}
}
num_fixed_cols_for_query = curr_fixed_col_index ;
num_var_cols_for_query = curr_var_col_index ;
}
2009-04-21 15:13:09 +00:00
void ha_tokudb : : column_bitmaps_signal ( ) {
2009-04-22 14:17:41 +00:00
//
// if we have max number of indexes, then MAX_KEY == primary_key
//
2012-08-23 14:16:01 +00:00
if ( tokudb_active_index ! = MAX_KEY | | tokudb_active_index = = primary_key ) {
set_query_columns ( tokudb_active_index ) ;
2009-04-21 15:13:09 +00:00
}
}
2009-04-17 18:29:25 +00:00
2008-06-27 20:33:01 +00:00
//
// Notification that a scan of entire secondary table is about
// to take place. Will pre acquire table read lock
// Returns:
// 0 on success
// error otherwise
//
int ha_tokudb : : prepare_index_scan ( ) {
2010-03-25 13:15:03 +00:00
int error = 0 ;
2010-09-03 20:47:01 +00:00
HANDLE_INVALID_CURSOR ( ) ;
2011-08-16 12:50:38 +00:00
error = prelock_range ( NULL , NULL ) ;
2008-06-27 20:33:01 +00:00
if ( error ) { last_cursor_error = error ; goto cleanup ; }
range_lock_grabbed = true ;
error = 0 ;
cleanup :
return error ;
}
2009-07-05 02:00:36 +00:00
//
// Notification that a range query getting all elements that equal a key
// to take place. Will pre acquire read lock
// Returns:
// 0 on success
// error otherwise
//
2011-10-05 21:55:09 +00:00
int ha_tokudb : : prepare_index_key_scan ( const uchar * key , uint key_len ) {
2009-07-05 02:00:36 +00:00
int error = 0 ;
DBT start_key , end_key ;
2011-08-16 12:50:38 +00:00
THD * thd = ha_thd ( ) ;
2010-09-03 20:47:01 +00:00
HANDLE_INVALID_CURSOR ( ) ;
2012-08-23 14:16:01 +00:00
pack_key ( & start_key , tokudb_active_index , prelocked_left_range , key , key_len , COL_NEG_INF ) ;
2011-08-16 12:50:38 +00:00
prelocked_left_range_size = start_key . size ;
2012-08-23 14:16:01 +00:00
pack_key ( & end_key , tokudb_active_index , prelocked_right_range , key , key_len , COL_POS_INF ) ;
2011-08-16 12:50:38 +00:00
prelocked_right_range_size = end_key . size ;
2009-07-05 02:00:36 +00:00
2011-10-05 21:55:09 +00:00
error = cursor - > c_pre_acquire_range_lock (
cursor ,
& start_key ,
& end_key
) ;
2009-07-05 02:00:36 +00:00
if ( error ) {
goto cleanup ;
}
range_lock_grabbed = true ;
2011-08-16 12:50:38 +00:00
doing_bulk_fetch = ( thd_sql_command ( thd ) = = SQLCOM_SELECT ) ;
2012-01-23 21:21:23 +00:00
bulk_fetch_iteration = 0 ;
rows_fetched_using_bulk_fetch = 0 ;
2009-07-05 02:00:36 +00:00
error = 0 ;
cleanup :
if ( error ) {
2012-11-19 19:12:47 +00:00
if ( error = = DB_LOCK_NOTGRANTED ) {
error = HA_ERR_LOCK_WAIT_TIMEOUT ;
}
2009-07-05 02:00:36 +00:00
last_cursor_error = error ;
//
2011-10-05 21:55:09 +00:00
// cursor should be initialized here, but in case it is not,
// we still check
2009-07-05 02:00:36 +00:00
//
if ( cursor ) {
2009-12-03 16:59:52 +00:00
int r = cursor - > c_close ( cursor ) ;
assert ( r = = 0 ) ;
2009-07-05 02:00:36 +00:00
cursor = NULL ;
}
}
return error ;
}
2011-08-16 12:50:38 +00:00
void ha_tokudb : : invalidate_bulk_fetch ( ) {
bytes_used_in_range_query_buff = 0 ;
curr_range_query_buff_offset = 0 ;
}
2009-07-05 02:00:36 +00:00
2013-02-20 20:36:28 +00:00
void ha_tokudb : : invalidate_icp ( ) {
toku_pushed_idx_cond = NULL ;
toku_pushed_idx_cond_keyno = MAX_KEY ;
icp_went_out_of_range = false ;
}
2012-03-19 12:15:50 +00:00
volatile int ha_tokudb_index_init_wait = 0 ; // debug
2008-04-17 20:56:40 +00:00
//
// Initializes local cursor on DB with index keynr
// Parameters:
// keynr - key (index) number
// sorted - 1 if result MUST be sorted according to index
// Returns:
// 0 on success
// error otherwise
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : index_init ( uint keynr , bool sorted ) {
2008-04-17 11:12:01 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::index_init %p %d " , this , keynr ) ;
2012-03-19 12:15:50 +00:00
while ( ha_tokudb_index_init_wait ) sleep ( 1 ) ; // debug
2008-02-07 20:19:44 +00:00
int error ;
2009-04-17 18:29:25 +00:00
THD * thd = ha_thd ( ) ;
2008-02-07 20:19:44 +00:00
DBUG_PRINT ( " enter " , ( " table: '%s' key: %d " , table_share - > table_name . str , keynr ) ) ;
/*
Under some very rare conditions ( like full joins ) we may already have
an active cursor at this point
*/
if ( cursor ) {
DBUG_PRINT ( " note " , ( " Closing active cursor " ) ) ;
2009-12-03 16:59:52 +00:00
int r = cursor - > c_close ( cursor ) ;
assert ( r = = 0 ) ;
2008-02-07 20:19:44 +00:00
}
active_index = keynr ;
2012-08-23 14:16:01 +00:00
if ( active_index < MAX_KEY ) {
DBUG_ASSERT ( keynr < = table - > s - > keys ) ;
} else {
DBUG_ASSERT ( active_index = = MAX_KEY ) ;
keynr = primary_key ;
}
tokudb_active_index = keynr ;
2008-06-10 17:03:09 +00:00
last_cursor_error = 0 ;
2008-06-17 14:31:53 +00:00
range_lock_grabbed = false ;
2008-05-26 14:07:31 +00:00
DBUG_ASSERT ( share - > key_file [ keynr ] ) ;
2010-09-03 20:47:01 +00:00
cursor_flags = get_cursor_isolation_flags ( lock . type , thd ) ;
2011-12-11 01:56:53 +00:00
if ( use_write_locks ) {
2011-06-13 18:01:03 +00:00
cursor_flags | = DB_RMW ;
2011-12-11 01:56:53 +00:00
}
if ( get_disable_prefetching ( thd ) ) {
cursor_flags | = DBC_DISABLE_PREFETCHING ;
}
2010-09-03 20:47:01 +00:00
if ( ( error = share - > key_file [ keynr ] - > cursor ( share - > key_file [ keynr ] , transaction , & cursor , cursor_flags ) ) ) {
if ( error = = TOKUDB_MVCC_DICTIONARY_TOO_NEW ) {
2010-09-09 13:54:59 +00:00
error = HA_ERR_TABLE_DEF_CHANGED ;
2010-09-03 20:47:01 +00:00
my_error ( ER_TABLE_DEF_CHANGED , MYF ( 0 ) ) ;
}
2011-02-15 21:42:47 +00:00
if ( error = = DB_LOCK_NOTGRANTED ) {
error = HA_ERR_LOCK_WAIT_TIMEOUT ;
my_error ( ER_LOCK_WAIT_TIMEOUT , MYF ( 0 ) ) ;
}
2010-09-03 20:47:01 +00:00
table - > status = STATUS_NOT_FOUND ;
2008-06-10 17:03:09 +00:00
last_cursor_error = error ;
2008-04-18 19:54:14 +00:00
cursor = NULL ; // Safety
2009-04-17 18:29:25 +00:00
goto exit ;
2008-06-10 17:03:09 +00:00
}
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & last_key , 0 , sizeof ( last_key ) ) ;
2009-04-17 18:29:25 +00:00
if ( thd_sql_command ( thd ) = = SQLCOM_SELECT ) {
set_query_columns ( keynr ) ;
unpack_entire_row = false ;
}
else {
unpack_entire_row = true ;
}
2011-08-16 12:50:38 +00:00
invalidate_bulk_fetch ( ) ;
doing_bulk_fetch = false ;
2009-04-17 18:29:25 +00:00
error = 0 ;
exit :
2008-03-21 23:47:22 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-07 20:19:44 +00:00
}
2008-04-17 20:56:40 +00:00
//
// closes the local cursor
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : index_end ( ) {
2008-04-17 11:12:01 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::index_end %p " , this ) ;
2008-06-17 14:31:53 +00:00
range_lock_grabbed = false ;
2008-02-07 20:19:44 +00:00
if ( cursor ) {
DBUG_PRINT ( " enter " , ( " table: '%s' " , table_share - > table_name . str ) ) ;
2010-11-24 14:01:48 +00:00
int r = cursor - > c_close ( cursor ) ;
assert ( r = = 0 ) ;
2008-04-18 19:54:14 +00:00
cursor = NULL ;
2008-06-10 17:03:09 +00:00
last_cursor_error = 0 ;
2008-02-05 16:00:53 +00:00
}
2012-08-23 14:16:01 +00:00
active_index = tokudb_active_index = MAX_KEY ;
2009-04-17 22:07:40 +00:00
//
// reset query variables
//
unpack_entire_row = true ;
read_blobs = true ;
read_key = true ;
num_fixed_cols_for_query = 0 ;
num_var_cols_for_query = 0 ;
2011-08-16 12:50:38 +00:00
invalidate_bulk_fetch ( ) ;
2013-02-20 20:36:28 +00:00
invalidate_icp ( ) ;
2011-08-16 12:50:38 +00:00
doing_bulk_fetch = false ;
2013-02-17 00:14:14 +00:00
close_dsmrr ( ) ;
2010-11-24 14:01:48 +00:00
TOKUDB_DBUG_RETURN ( 0 ) ;
2008-02-07 20:19:44 +00:00
}
2008-07-30 14:43:19 +00:00
int ha_tokudb : : handle_cursor_error ( int error , int err_to_return , uint keynr ) {
TOKUDB_DBUG_ENTER ( " ha_tokudb::handle_cursor_error " ) ;
2008-02-07 20:19:44 +00:00
if ( error ) {
2010-09-14 13:27:08 +00:00
if ( error = = DB_LOCK_NOTGRANTED ) {
error = HA_ERR_LOCK_WAIT_TIMEOUT ;
}
2008-06-10 17:03:09 +00:00
last_cursor_error = error ;
2008-02-07 20:19:44 +00:00
table - > status = STATUS_NOT_FOUND ;
2009-02-09 20:20:30 +00:00
if ( error = = DB_NOTFOUND ) {
2008-07-30 14:43:19 +00:00
error = err_to_return ;
2008-06-10 17:03:09 +00:00
}
2008-02-07 20:19:44 +00:00
}
2008-07-30 14:43:19 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
}
//
// Helper function for read_row and smart_dbt_callback_xxx functions
// When using a hidden primary key, upon reading a row,
// we set the current_ident field to whatever the primary key we retrieved
// was
//
2009-11-25 21:00:52 +00:00
void ha_tokudb : : extract_hidden_primary_key ( uint keynr , DBT const * found_key ) {
2008-04-21 18:19:07 +00:00
//
2008-05-09 21:07:09 +00:00
// extract hidden primary key to current_ident
2008-04-21 18:19:07 +00:00
//
if ( hidden_primary_key ) {
2008-05-09 21:07:09 +00:00
if ( keynr = = primary_key ) {
memcpy_fixed ( current_ident , ( char * ) found_key - > data , TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH ) ;
}
2008-11-03 20:42:59 +00:00
//
2009-11-25 21:00:52 +00:00
// if secondary key, hidden primary key is at end of found_key
2008-11-03 20:42:59 +00:00
//
2009-11-25 21:00:52 +00:00
else {
2008-11-03 20:42:59 +00:00
memcpy_fixed (
current_ident ,
( char * ) found_key - > data + found_key - > size - TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH ,
TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH
) ;
}
2008-04-21 18:19:07 +00:00
}
2008-07-30 14:43:19 +00:00
}
2009-08-06 15:49:36 +00:00
2009-08-06 15:57:33 +00:00
int ha_tokudb : : read_row_callback ( uchar * buf , uint keynr , DBT const * row , DBT const * found_key ) {
2009-08-06 15:49:36 +00:00
assert ( keynr = = primary_key ) ;
2009-08-06 15:57:33 +00:00
return unpack_row ( buf , row , found_key , keynr ) ;
2009-08-06 15:49:36 +00:00
}
2008-07-30 14:43:19 +00:00
//
// Reads the contents of row and found_key, DBT's retrieved from the DB associated to keynr, into buf
// This function assumes that we are using a covering index, as a result, if keynr is the primary key,
// we do not read row into buf
// Parameters:
// [out] buf - buffer for the row, in MySQL format
// keynr - index into key_file that represents DB we are currently operating on.
// [in] row - the row that has been read from the preceding DB call
// [in] found_key - key used to retrieve the row
//
2009-11-25 21:00:52 +00:00
void ha_tokudb : : read_key_only ( uchar * buf , uint keynr , DBT const * found_key ) {
2008-07-30 14:43:19 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::read_key_only " ) ;
table - > status = 0 ;
2009-11-25 21:00:52 +00:00
//
// only case when we do not unpack the key is if we are dealing with the main dictionary
// of a table with a hidden primary key
//
2009-08-19 17:01:05 +00:00
if ( ! ( hidden_primary_key & & keynr = = primary_key ) ) {
unpack_key ( buf , found_key , keynr ) ;
}
2008-07-30 14:43:19 +00:00
DBUG_VOID_RETURN ;
}
//
// Helper function used to try to retrieve the entire row
// If keynr is associated with the main table, reads contents of found_key and row into buf, otherwise,
// makes copy of primary key and saves it to last_key. This can later be used to retrieve the entire row
// Parameters:
// [out] buf - buffer for the row, in MySQL format
// keynr - index into key_file that represents DB we are currently operating on.
// [in] row - the row that has been read from the preceding DB call
// [in] found_key - key used to retrieve the row
//
2009-04-20 02:36:43 +00:00
int ha_tokudb : : read_primary_key ( uchar * buf , uint keynr , DBT const * row , DBT const * found_key ) {
2008-07-30 14:43:19 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::read_primary_key " ) ;
2009-04-20 02:36:43 +00:00
int error = 0 ;
2008-07-30 14:43:19 +00:00
table - > status = 0 ;
2008-11-03 20:42:59 +00:00
//
// case where we read from secondary table that is not clustered
//
if ( keynr ! = primary_key & & ! ( table - > key_info [ keynr ] . flags & HA_CLUSTERING ) ) {
2009-11-25 21:00:52 +00:00
bool has_null ;
2008-07-30 14:43:19 +00:00
//
2009-11-25 21:00:52 +00:00
// create a DBT that has the same data as row, this is inefficient
// extract_hidden_primary_key MUST have been called before this
2008-07-30 14:43:19 +00:00
//
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & last_key , 0 , sizeof ( last_key ) ) ;
2009-11-25 21:00:52 +00:00
if ( ! hidden_primary_key ) {
unpack_key ( buf , found_key , keynr ) ;
}
create_dbt_key_from_table (
& last_key ,
primary_key ,
key_buff ,
buf ,
& has_null
) ;
2008-07-30 14:43:19 +00:00
}
2008-11-03 20:42:59 +00:00
//
2009-04-17 18:29:25 +00:00
// else read from clustered/primary key
2008-11-03 20:42:59 +00:00
//
2008-07-30 14:43:19 +00:00
else {
2009-04-20 02:36:43 +00:00
error = unpack_row ( buf , row , found_key , keynr ) ;
if ( error ) { goto exit ; }
2008-07-30 14:43:19 +00:00
}
if ( found_key ) { DBUG_DUMP ( " read row key " , ( uchar * ) found_key - > data , found_key - > size ) ; }
2009-04-20 02:36:43 +00:00
error = 0 ;
exit :
TOKUDB_DBUG_RETURN ( error ) ;
2008-07-30 14:43:19 +00:00
}
//
// This function reads an entire row into buf. This function also assumes that
// the key needed to retrieve the row is stored in the member variable last_key
// Parameters:
// [out] buf - buffer for the row, in MySQL format
// Returns:
// 0 on success, error otherwise
//
int ha_tokudb : : read_full_row ( uchar * buf ) {
TOKUDB_DBUG_ENTER ( " ha_tokudb::read_full_row " ) ;
2010-03-25 13:15:03 +00:00
int error = 0 ;
2009-08-06 15:49:36 +00:00
struct smart_dbt_info info ;
info . ha = this ;
info . buf = buf ;
info . keynr = primary_key ;
2008-07-30 14:43:19 +00:00
//
2009-08-06 15:49:36 +00:00
// assumes key is stored in this->last_key
2008-07-30 14:43:19 +00:00
//
2011-10-05 21:55:09 +00:00
error = share - > file - > getf_set (
share - > file ,
transaction ,
cursor_flags ,
& last_key ,
smart_dbt_callback_rowread_ptquery ,
& info
) ;
2009-08-06 15:49:36 +00:00
if ( error ) {
2010-09-14 13:27:08 +00:00
if ( error = = DB_LOCK_NOTGRANTED ) {
error = HA_ERR_LOCK_WAIT_TIMEOUT ;
}
2008-07-30 14:43:19 +00:00
table - > status = STATUS_NOT_FOUND ;
TOKUDB_DBUG_RETURN ( error = = DB_NOTFOUND ? HA_ERR_CRASHED : error ) ;
}
2009-04-20 02:36:43 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-07-30 14:43:19 +00:00
}
2009-04-20 16:56:22 +00:00
//
// Reads the next row matching to the key, on success, advances cursor
// Parameters:
// [out] buf - buffer for the next row, in MySQL format
// [in] key - key value
// keylen - length of key
// Returns:
// 0 on success
// HA_ERR_END_OF_FILE if not found
// error otherwise
//
int ha_tokudb : : index_next_same ( uchar * buf , const uchar * key , uint keylen ) {
2011-08-16 12:50:38 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::index_next_same " ) ;
2013-02-15 18:25:37 +00:00
ha_statistic_increment ( & SSV : : ha_read_next_count ) ;
2011-08-16 12:50:38 +00:00
2009-04-20 16:56:22 +00:00
DBT curr_key ;
DBT found_key ;
bool has_null ;
int cmp ;
2011-08-16 12:50:38 +00:00
int error = get_next ( buf , 1 ) ;
2009-04-20 16:56:22 +00:00
if ( error ) {
goto cleanup ;
}
//
// now do the comparison
//
2012-08-23 14:16:01 +00:00
pack_key ( & curr_key , tokudb_active_index , key_buff2 , key , keylen , COL_ZERO ) ;
create_dbt_key_from_table ( & found_key , tokudb_active_index , key_buff3 , buf , & has_null ) ;
cmp = tokudb_prefix_cmp_dbt_key ( share - > key_file [ tokudb_active_index ] , & curr_key , & found_key ) ;
2009-04-20 16:56:22 +00:00
if ( cmp ) {
error = HA_ERR_END_OF_FILE ;
}
2011-08-16 12:50:38 +00:00
cleanup :
TOKUDB_DBUG_RETURN ( error ) ;
}
2009-04-20 16:56:22 +00:00
2008-04-17 20:56:40 +00:00
//
// According to InnoDB handlerton: Positions an index cursor to the index
// specified in keynr. Fetches the row if any
// Parameters:
// [out] buf - buffer for the returned row
// [in] key - key value, according to InnoDB, if NULL,
// position cursor at start or end of index,
// not sure if this is done now
// key_len - length of key
// find_flag - according to InnoDB, search flags from my_base.h
// Returns:
// 0 on success
// HA_ERR_KEY_NOT_FOUND if not found (per InnoDB),
// we seem to return HA_ERR_END_OF_FILE if find_flag != HA_READ_KEY_EXACT
// TODO: investigate this for correctness
// error otherwise
//
2008-04-17 11:12:01 +00:00
int ha_tokudb : : index_read ( uchar * buf , const uchar * key , uint key_len , enum ha_rkey_function find_flag ) {
TOKUDB_DBUG_ENTER ( " ha_tokudb::index_read %p find %d " , this , find_flag ) ;
2011-08-16 12:50:38 +00:00
invalidate_bulk_fetch ( ) ;
2008-04-18 17:07:17 +00:00
// TOKUDB_DBUG_DUMP("key=", key, key_len);
2008-04-17 11:12:01 +00:00
DBT row ;
2009-08-19 19:37:32 +00:00
DBT lookup_key ;
2010-03-25 13:15:03 +00:00
int error = 0 ;
2012-07-25 20:48:53 +00:00
uint32_t flags = 0 ;
2009-09-28 19:08:52 +00:00
THD * thd = ha_thd ( ) ;
tokudb_trx_data * trx = ( tokudb_trx_data * ) thd_data_get ( thd , tokudb_hton - > slot ) ; ;
2008-07-30 14:43:19 +00:00
struct smart_dbt_info info ;
2009-08-20 17:01:16 +00:00
struct index_read_info ir_info ;
2008-04-17 11:12:01 +00:00
2008-07-30 14:43:19 +00:00
HANDLE_INVALID_CURSOR ( ) ;
2008-06-10 17:03:09 +00:00
2013-02-15 18:25:37 +00:00
ha_statistic_increment ( & SSV : : ha_read_key_count ) ;
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & row , 0 , sizeof ( row ) ) ;
2008-04-17 11:12:01 +00:00
2008-07-30 14:43:19 +00:00
info . ha = this ;
info . buf = buf ;
2012-08-23 14:16:01 +00:00
info . keynr = tokudb_active_index ;
2008-07-30 14:43:19 +00:00
2009-08-20 17:01:16 +00:00
ir_info . smart_dbt_info = info ;
2010-01-11 18:14:37 +00:00
ir_info . cmp = 0 ;
2009-08-20 17:01:16 +00:00
2011-06-13 18:01:03 +00:00
flags = SET_PRELOCK_FLAG ( 0 ) ;
2008-02-28 01:27:14 +00:00
switch ( find_flag ) {
2008-04-17 20:56:40 +00:00
case HA_READ_KEY_EXACT : /* Find first record else error */
2012-08-23 14:16:01 +00:00
pack_key ( & lookup_key , tokudb_active_index , key_buff3 , key , key_len , COL_NEG_INF ) ;
2009-08-20 17:01:16 +00:00
ir_info . orig_key = & lookup_key ;
2011-10-05 21:55:09 +00:00
error = cursor - > c_getf_set_range ( cursor , flags ,
& lookup_key , SMART_DBT_IR_CALLBACK , & ir_info ) ;
2009-08-20 17:01:16 +00:00
if ( ir_info . cmp ) {
error = DB_NOTFOUND ;
2008-04-02 11:17:40 +00:00
}
2008-02-28 01:27:14 +00:00
break ;
2008-04-17 20:56:40 +00:00
case HA_READ_AFTER_KEY : /* Find next rec. after key-record */
2012-08-23 14:16:01 +00:00
pack_key ( & lookup_key , tokudb_active_index , key_buff3 , key , key_len , COL_POS_INF ) ;
2011-10-05 21:55:09 +00:00
error = cursor - > c_getf_set_range ( cursor , flags ,
& lookup_key , SMART_DBT_CALLBACK , & info ) ;
2008-02-28 01:27:14 +00:00
break ;
2008-04-17 20:56:40 +00:00
case HA_READ_BEFORE_KEY : /* Find next rec. before key-record */
2012-08-23 14:16:01 +00:00
pack_key ( & lookup_key , tokudb_active_index , key_buff3 , key , key_len , COL_NEG_INF ) ;
2011-10-05 21:55:09 +00:00
error = cursor - > c_getf_set_range_reverse ( cursor , flags ,
& lookup_key , SMART_DBT_CALLBACK , & info ) ;
2008-03-03 20:27:58 +00:00
break ;
2008-04-17 20:56:40 +00:00
case HA_READ_KEY_OR_NEXT : /* Record or next record */
2012-08-23 14:16:01 +00:00
pack_key ( & lookup_key , tokudb_active_index , key_buff3 , key , key_len , COL_NEG_INF ) ;
2011-10-05 21:55:09 +00:00
error = cursor - > c_getf_set_range ( cursor , flags ,
& lookup_key , SMART_DBT_CALLBACK , & info ) ;
2008-02-28 01:27:14 +00:00
break ;
2009-08-19 19:37:32 +00:00
//
// This case does not seem to ever be used, it is ok for it to be slow
//
2008-04-17 20:56:40 +00:00
case HA_READ_KEY_OR_PREV : /* Record or previous */
2012-08-23 14:16:01 +00:00
pack_key ( & lookup_key , tokudb_active_index , key_buff3 , key , key_len , COL_NEG_INF ) ;
2009-08-20 17:01:16 +00:00
ir_info . orig_key = & lookup_key ;
2011-10-05 21:55:09 +00:00
error = cursor - > c_getf_set_range ( cursor , flags ,
& lookup_key , SMART_DBT_IR_CALLBACK , & ir_info ) ;
2009-08-20 17:01:16 +00:00
if ( error = = DB_NOTFOUND ) {
2009-08-19 16:14:54 +00:00
error = cursor - > c_getf_last ( cursor , flags , SMART_DBT_CALLBACK , & info ) ;
}
2009-08-20 17:01:16 +00:00
else if ( ir_info . cmp ) {
error = cursor - > c_getf_prev ( cursor , flags , SMART_DBT_CALLBACK , & info ) ;
}
2008-03-21 23:47:22 +00:00
break ;
2008-04-17 20:56:40 +00:00
case HA_READ_PREFIX_LAST_OR_PREV : /* Last or prev key with the same prefix */
2012-08-23 14:16:01 +00:00
pack_key ( & lookup_key , tokudb_active_index , key_buff3 , key , key_len , COL_POS_INF ) ;
2011-10-05 21:55:09 +00:00
error = cursor - > c_getf_set_range_reverse ( cursor , flags ,
& lookup_key , SMART_DBT_CALLBACK , & info ) ;
2008-02-28 01:27:14 +00:00
break ;
2008-10-07 19:57:02 +00:00
case HA_READ_PREFIX_LAST :
2012-08-23 14:16:01 +00:00
pack_key ( & lookup_key , tokudb_active_index , key_buff3 , key , key_len , COL_POS_INF ) ;
2009-08-20 17:01:16 +00:00
ir_info . orig_key = & lookup_key ;
2011-10-05 21:55:09 +00:00
error = cursor - > c_getf_set_range_reverse ( cursor , flags , & lookup_key , SMART_DBT_IR_CALLBACK , & ir_info ) ;
2009-08-20 17:01:16 +00:00
if ( ir_info . cmp ) {
error = DB_NOTFOUND ;
2008-10-07 19:57:02 +00:00
}
break ;
2008-02-28 01:27:14 +00:00
default :
2008-04-24 17:30:05 +00:00
TOKUDB_TRACE ( " unsupported:%d \n " , find_flag ) ;
2008-03-21 23:47:22 +00:00
error = HA_ERR_UNSUPPORTED ;
2008-02-28 01:27:14 +00:00
break ;
2008-02-07 20:19:44 +00:00
}
2012-08-23 14:16:01 +00:00
error = handle_cursor_error ( error , HA_ERR_KEY_NOT_FOUND , tokudb_active_index ) ;
if ( ! error & & ! key_read & & tokudb_active_index ! = primary_key & & ! ( table - > key_info [ tokudb_active_index ] . flags & HA_CLUSTERING ) ) {
2008-07-30 14:43:19 +00:00
error = read_full_row ( buf ) ;
2008-07-17 19:10:36 +00:00
}
2008-07-30 14:43:19 +00:00
if ( error & & ( tokudb_debug & TOKUDB_DEBUG_ERROR ) ) {
TOKUDB_TRACE ( " error:%d:%d \n " , error , find_flag ) ;
}
2009-09-28 19:08:52 +00:00
trx - > stmt_progress . queried + + ;
track_progress ( thd ) ;
2008-07-30 14:43:19 +00:00
cleanup :
2008-03-21 23:47:22 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-05 16:00:53 +00:00
}
2008-02-07 20:19:44 +00:00
2011-08-16 12:50:38 +00:00
int ha_tokudb : : read_data_from_range_query_buff ( uchar * buf , bool need_val ) {
// buffer has the next row, get it from there
int error ;
uchar * curr_pos = range_query_buff + curr_range_query_buff_offset ;
DBT curr_key ;
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & curr_key , 0 , sizeof ( curr_key ) ) ;
2011-08-16 12:50:38 +00:00
// get key info
2012-07-25 20:48:53 +00:00
uint32_t key_size = * ( uint32_t * ) curr_pos ;
2011-08-16 12:50:38 +00:00
curr_pos + = sizeof ( key_size ) ;
uchar * curr_key_buff = curr_pos ;
curr_pos + = key_size ;
curr_key . data = curr_key_buff ;
curr_key . size = key_size ;
// if this is a covering index, this is all we need
if ( this - > key_read ) {
assert ( ! need_val ) ;
2012-08-23 14:16:01 +00:00
extract_hidden_primary_key ( tokudb_active_index , & curr_key ) ;
read_key_only ( buf , tokudb_active_index , & curr_key ) ;
2011-08-16 12:50:38 +00:00
error = 0 ;
}
// we need to get more data
else {
DBT curr_val ;
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & curr_val , 0 , sizeof ( curr_val ) ) ;
2011-08-16 12:50:38 +00:00
uchar * curr_val_buff = NULL ;
2012-07-25 20:48:53 +00:00
uint32_t val_size = 0 ;
2011-08-16 12:50:38 +00:00
// in this case, we don't have a val, we are simply extracting the pk
if ( ! need_val ) {
curr_val . data = curr_val_buff ;
curr_val . size = val_size ;
2012-08-23 14:16:01 +00:00
extract_hidden_primary_key ( tokudb_active_index , & curr_key ) ;
error = read_primary_key ( buf , tokudb_active_index , & curr_val , & curr_key ) ;
2011-08-16 12:50:38 +00:00
}
else {
2012-08-23 14:16:01 +00:00
extract_hidden_primary_key ( tokudb_active_index , & curr_key ) ;
2011-08-16 12:50:38 +00:00
// need to extract a val and place it into buf
if ( unpack_entire_row ) {
// get val info
2012-07-25 20:48:53 +00:00
val_size = * ( uint32_t * ) curr_pos ;
2011-08-16 12:50:38 +00:00
curr_pos + = sizeof ( val_size ) ;
curr_val_buff = curr_pos ;
curr_pos + = val_size ;
curr_val . data = curr_val_buff ;
curr_val . size = val_size ;
2012-08-23 14:16:01 +00:00
error = unpack_row ( buf , & curr_val , & curr_key , tokudb_active_index ) ;
2011-08-16 12:50:38 +00:00
}
else {
2012-08-23 14:16:01 +00:00
if ( ! ( hidden_primary_key & & tokudb_active_index = = primary_key ) ) {
unpack_key ( buf , & curr_key , tokudb_active_index ) ;
2011-08-16 12:50:38 +00:00
}
// read rows we care about
// first the null bytes;
memcpy ( buf , curr_pos , table_share - > null_bytes ) ;
curr_pos + = table_share - > null_bytes ;
// now the fixed sized rows
2012-07-25 20:48:53 +00:00
for ( uint32_t i = 0 ; i < num_fixed_cols_for_query ; i + + ) {
2011-08-16 12:50:38 +00:00
uint field_index = fixed_cols_for_query [ i ] ;
Field * field = table - > field [ field_index ] ;
unpack_fixed_field (
buf + field_offset ( field , table ) ,
curr_pos ,
share - > kc_info . field_lengths [ field_index ]
) ;
curr_pos + = share - > kc_info . field_lengths [ field_index ] ;
}
// now the variable sized rows
2012-07-25 20:48:53 +00:00
for ( uint32_t i = 0 ; i < num_var_cols_for_query ; i + + ) {
2011-08-16 12:50:38 +00:00
uint field_index = var_cols_for_query [ i ] ;
Field * field = table - > field [ field_index ] ;
2012-07-25 20:48:53 +00:00
uint32_t field_len = * ( uint32_t * ) curr_pos ;
2011-08-16 12:50:38 +00:00
curr_pos + = sizeof ( field_len ) ;
unpack_var_field (
buf + field_offset ( field , table ) ,
curr_pos ,
field_len ,
share - > kc_info . length_bytes [ field_index ]
) ;
curr_pos + = field_len ;
}
// now the blobs
if ( read_blobs ) {
2012-07-25 20:48:53 +00:00
uint32_t blob_size = * ( uint32_t * ) curr_pos ;
2011-08-16 12:50:38 +00:00
curr_pos + = sizeof ( blob_size ) ;
error = unpack_blobs (
buf ,
curr_pos ,
blob_size ,
true
) ;
curr_pos + = blob_size ;
if ( error ) {
invalidate_bulk_fetch ( ) ;
goto exit ;
}
}
error = 0 ;
}
}
}
curr_range_query_buff_offset = curr_pos - range_query_buff ;
exit :
return error ;
}
2008-02-07 20:19:44 +00:00
2011-08-16 12:50:38 +00:00
static int
smart_dbt_bf_callback ( DBT const * key , DBT const * row , void * context ) {
SMART_DBT_BF_INFO info = ( SMART_DBT_BF_INFO ) context ;
2013-02-20 20:36:28 +00:00
return info - > ha - > fill_range_query_buf ( info - > need_val , key , row , info - > direction , info - > thd , info - > buf ) ;
2011-08-16 12:50:38 +00:00
}
2013-02-20 21:45:09 +00:00
# if defined(MARIADB_BASE_VERSION) || (50600 <= MYSQL_VERSION_ID && MYSQL_VERSION_ID <= 50699)
2013-02-20 20:36:28 +00:00
enum icp_result ha_tokudb : : toku_handler_index_cond_check ( Item * pushed_idx_cond )
{
2013-02-20 21:45:09 +00:00
enum icp_result res ;
if ( end_range ) {
int cmp ;
# ifdef MARIADB_BASE_VERSION
cmp = compare_key2 ( end_range ) ;
# else
cmp = compare_key_icp ( end_range ) ;
# endif
if ( cmp > 0 ) {
return ICP_OUT_OF_RANGE ;
}
}
res = pushed_idx_cond - > val_int ( ) ? ICP_MATCH : ICP_NO_MATCH ;
return res ;
2013-02-20 20:36:28 +00:00
}
# endif
2011-08-16 12:50:38 +00:00
// fill in the range query buf for bulk fetch
int ha_tokudb : : fill_range_query_buf (
bool need_val ,
DBT const * key ,
DBT const * row ,
int direction ,
2013-02-20 20:36:28 +00:00
THD * thd ,
uchar * buf
2011-08-16 12:50:38 +00:00
) {
int error ;
//
// first put the value into range_query_buf
//
2012-07-25 20:48:53 +00:00
uint32_t size_remaining = size_range_query_buff - bytes_used_in_range_query_buff ;
uint32_t size_needed ;
uint32_t user_defined_size = get_tokudb_read_buf_size ( thd ) ;
2011-08-16 12:50:38 +00:00
uchar * curr_pos = NULL ;
2013-02-20 20:36:28 +00:00
2013-02-20 21:45:09 +00:00
# if defined(MARIADB_BASE_VERSION) || (50600 <= MYSQL_VERSION_ID && MYSQL_VERSION_ID <= 50699)
2013-02-20 20:36:28 +00:00
// if we have an index condition pushed down, we check it
if ( toku_pushed_idx_cond & & ( tokudb_active_index = = toku_pushed_idx_cond_keyno ) ) {
unpack_key ( buf , key , tokudb_active_index ) ;
enum icp_result result = toku_handler_index_cond_check ( toku_pushed_idx_cond ) ;
// If we have reason to stop, we set icp_went_out_of_range and get out
2013-02-20 21:45:09 +00:00
if ( result = = ICP_OUT_OF_RANGE | | thd_killed ( thd ) ) {
2013-02-20 20:36:28 +00:00
icp_went_out_of_range = true ;
error = 0 ;
goto cleanup ;
}
// otherwise, if we simply see that the current key is no match,
// we tell the cursor to continue and don't store
// the key locally
else if ( result = = ICP_NO_MATCH ) {
error = TOKUDB_CURSOR_CONTINUE ;
goto cleanup ;
}
}
# endif
// at this point, if ICP is on, we have verified that the key is one
// we are interested in, so we proceed with placing the data
// into the range query buffer
2011-08-16 12:50:38 +00:00
if ( need_val ) {
if ( unpack_entire_row ) {
2012-07-25 20:48:53 +00:00
size_needed = 2 * sizeof ( uint32_t ) + key - > size + row - > size ;
2011-08-16 12:50:38 +00:00
}
else {
// this is an upper bound
2012-07-25 20:48:53 +00:00
size_needed = sizeof ( uint32_t ) + // size of key length
2011-08-16 12:50:38 +00:00
key - > size + row - > size + //key and row
2012-07-25 20:48:53 +00:00
num_var_cols_for_query * ( sizeof ( uint32_t ) ) + //lengths of varchars stored
sizeof ( uint32_t ) ; //length of blobs
2011-08-16 12:50:38 +00:00
}
}
else {
2012-07-25 20:48:53 +00:00
size_needed = sizeof ( uint32_t ) + key - > size ;
2011-08-16 12:50:38 +00:00
}
if ( size_remaining < size_needed ) {
range_query_buff = ( uchar * ) my_realloc (
( void * ) range_query_buff ,
bytes_used_in_range_query_buff + size_needed ,
MYF ( MY_WME )
) ;
if ( range_query_buff = = NULL ) {
error = ENOMEM ;
2011-08-17 13:30:33 +00:00
invalidate_bulk_fetch ( ) ;
2011-08-16 12:50:38 +00:00
goto cleanup ;
}
2011-08-17 13:30:33 +00:00
size_range_query_buff = bytes_used_in_range_query_buff + size_needed ;
2011-08-16 12:50:38 +00:00
}
//
// now we know we have the size, let's fill the buffer, starting with the key
//
curr_pos = range_query_buff + bytes_used_in_range_query_buff ;
2012-07-25 20:48:53 +00:00
* ( uint32_t * ) curr_pos = key - > size ;
curr_pos + = sizeof ( uint32_t ) ;
2011-08-16 12:50:38 +00:00
memcpy ( curr_pos , key - > data , key - > size ) ;
curr_pos + = key - > size ;
if ( need_val ) {
if ( unpack_entire_row ) {
2012-07-25 20:48:53 +00:00
* ( uint32_t * ) curr_pos = row - > size ;
curr_pos + = sizeof ( uint32_t ) ;
2011-08-16 12:50:38 +00:00
memcpy ( curr_pos , row - > data , row - > size ) ;
curr_pos + = row - > size ;
}
else {
// need to unpack just the data we care about
const uchar * fixed_field_ptr = ( const uchar * ) row - > data ;
fixed_field_ptr + = table_share - > null_bytes ;
const uchar * var_field_offset_ptr = NULL ;
const uchar * var_field_data_ptr = NULL ;
2012-08-23 14:16:01 +00:00
var_field_offset_ptr = fixed_field_ptr + share - > kc_info . mcp_info [ tokudb_active_index ] . fixed_field_size ;
var_field_data_ptr = var_field_offset_ptr + share - > kc_info . mcp_info [ tokudb_active_index ] . len_of_offsets ;
2011-08-16 12:50:38 +00:00
// first the null bytes
memcpy ( curr_pos , row - > data , table_share - > null_bytes ) ;
curr_pos + = table_share - > null_bytes ;
// now the fixed fields
//
// first the fixed fields
//
2012-07-25 20:48:53 +00:00
for ( uint32_t i = 0 ; i < num_fixed_cols_for_query ; i + + ) {
2011-08-16 12:50:38 +00:00
uint field_index = fixed_cols_for_query [ i ] ;
memcpy (
curr_pos ,
2012-08-23 14:16:01 +00:00
fixed_field_ptr + share - > kc_info . cp_info [ tokudb_active_index ] [ field_index ] . col_pack_val ,
2011-08-16 12:50:38 +00:00
share - > kc_info . field_lengths [ field_index ]
) ;
curr_pos + = share - > kc_info . field_lengths [ field_index ] ;
}
//
// now the var fields
//
2012-07-25 20:48:53 +00:00
for ( uint32_t i = 0 ; i < num_var_cols_for_query ; i + + ) {
2011-08-16 12:50:38 +00:00
uint field_index = var_cols_for_query [ i ] ;
2012-08-23 14:16:01 +00:00
uint32_t var_field_index = share - > kc_info . cp_info [ tokudb_active_index ] [ field_index ] . col_pack_val ;
2012-07-25 20:48:53 +00:00
uint32_t data_start_offset ;
uint32_t field_len ;
2011-08-16 12:50:38 +00:00
get_var_field_info (
& field_len ,
& data_start_offset ,
var_field_index ,
var_field_offset_ptr ,
share - > kc_info . num_offset_bytes
) ;
memcpy ( curr_pos , & field_len , sizeof ( field_len ) ) ;
curr_pos + = sizeof ( field_len ) ;
memcpy ( curr_pos , var_field_data_ptr + data_start_offset , field_len ) ;
curr_pos + = field_len ;
}
if ( read_blobs ) {
2012-07-25 20:48:53 +00:00
uint32_t blob_offset = 0 ;
uint32_t data_size = 0 ;
2011-08-16 12:50:38 +00:00
//
// now the blobs
//
get_blob_field_info (
& blob_offset ,
2012-08-23 14:16:01 +00:00
share - > kc_info . mcp_info [ tokudb_active_index ] . len_of_offsets ,
2011-08-16 12:50:38 +00:00
var_field_data_ptr ,
share - > kc_info . num_offset_bytes
) ;
2012-07-25 20:48:53 +00:00
data_size = row - > size - blob_offset - ( uint32_t ) ( var_field_data_ptr - ( const uchar * ) row - > data ) ;
2011-08-16 12:50:38 +00:00
memcpy ( curr_pos , & data_size , sizeof ( data_size ) ) ;
curr_pos + = sizeof ( data_size ) ;
memcpy ( curr_pos , var_field_data_ptr + blob_offset , data_size ) ;
curr_pos + = data_size ;
}
}
}
bytes_used_in_range_query_buff = curr_pos - range_query_buff ;
assert ( bytes_used_in_range_query_buff < = size_range_query_buff ) ;
//
// now determine if we should continue with the bulk fetch
// we want to stop under these conditions:
// - we overran the prelocked range
// - we are close to the end of the buffer
2012-01-23 21:21:23 +00:00
// - we have fetched an exponential amount of rows with
// respect to the bulk fetch iteration, which is initialized
// to 0 in index_init() and prelock_range().
rows_fetched_using_bulk_fetch + + ;
// if the iteration is less than the number of possible shifts on
// a 64 bit integer, check that we haven't exceeded this iterations
// row fetch upper bound.
if ( bulk_fetch_iteration < HA_TOKU_BULK_FETCH_ITERATION_MAX ) {
uint64_t row_fetch_upper_bound = 1LLU < < bulk_fetch_iteration ;
assert ( row_fetch_upper_bound > 0 ) ;
if ( rows_fetched_using_bulk_fetch > = row_fetch_upper_bound ) {
error = 0 ;
goto cleanup ;
}
}
2011-08-16 12:50:38 +00:00
if ( bytes_used_in_range_query_buff + table_share - > rec_buff_length > user_defined_size ) {
error = 0 ;
goto cleanup ;
}
if ( direction > 0 ) {
// compare what we got to the right endpoint of prelocked range
// because we are searching keys in ascending order
if ( prelocked_right_range_size = = 0 ) {
error = TOKUDB_CURSOR_CONTINUE ;
goto cleanup ;
}
DBT right_range ;
2012-05-09 18:36:52 +00:00
memset ( & right_range , 0 , sizeof ( right_range ) ) ;
2011-08-16 12:50:38 +00:00
right_range . size = prelocked_right_range_size ;
right_range . data = prelocked_right_range ;
int cmp = tokudb_cmp_dbt_key (
2012-08-23 14:16:01 +00:00
share - > key_file [ tokudb_active_index ] ,
2011-08-16 12:50:38 +00:00
key ,
& right_range
) ;
error = ( cmp > 0 ) ? 0 : TOKUDB_CURSOR_CONTINUE ;
}
else {
// compare what we got to the left endpoint of prelocked range
// because we are searching keys in descending order
if ( prelocked_left_range_size = = 0 ) {
error = TOKUDB_CURSOR_CONTINUE ;
goto cleanup ;
}
DBT left_range ;
2012-05-09 18:36:52 +00:00
memset ( & left_range , 0 , sizeof ( left_range ) ) ;
2011-08-16 12:50:38 +00:00
left_range . size = prelocked_left_range_size ;
left_range . data = prelocked_left_range ;
int cmp = tokudb_cmp_dbt_key (
2012-08-23 14:16:01 +00:00
share - > key_file [ tokudb_active_index ] ,
2011-08-16 12:50:38 +00:00
key ,
& left_range
) ;
error = ( cmp < 0 ) ? 0 : TOKUDB_CURSOR_CONTINUE ;
}
cleanup :
return error ;
}
int ha_tokudb : : get_next ( uchar * buf , int direction ) {
2010-03-25 13:15:03 +00:00
int error = 0 ;
2012-07-25 20:48:53 +00:00
uint32_t flags = SET_PRELOCK_FLAG ( 0 ) ;
2009-09-28 19:08:52 +00:00
THD * thd = ha_thd ( ) ;
tokudb_trx_data * trx = ( tokudb_trx_data * ) thd_data_get ( thd , tokudb_hton - > slot ) ; ;
2011-08-16 12:50:38 +00:00
bool need_val ;
2008-07-30 14:43:19 +00:00
HANDLE_INVALID_CURSOR ( ) ;
2011-08-16 12:50:38 +00:00
// we need to read the val of what we retrieve if
// we do NOT have a covering index AND we are using a clustering secondary
// key
need_val = ( this - > key_read = = 0 ) & &
2012-08-23 14:16:01 +00:00
( tokudb_active_index = = primary_key | |
table - > key_info [ tokudb_active_index ] . flags & HA_CLUSTERING
2011-08-16 12:50:38 +00:00
) ;
2009-11-13 21:21:30 +00:00
2011-08-16 12:50:38 +00:00
if ( ( bytes_used_in_range_query_buff - curr_range_query_buff_offset ) > 0 ) {
error = read_data_from_range_query_buff ( buf , need_val ) ;
2009-11-13 21:21:30 +00:00
}
2013-02-20 20:36:28 +00:00
else if ( icp_went_out_of_range ) {
2013-02-25 23:03:11 +00:00
icp_went_out_of_range = false ;
2013-02-20 20:36:28 +00:00
error = HA_ERR_END_OF_FILE ;
}
2011-08-16 12:50:38 +00:00
else {
invalidate_bulk_fetch ( ) ;
if ( doing_bulk_fetch ) {
struct smart_dbt_bf_info bf_info ;
bf_info . ha = this ;
// you need the val if you have a clustering index and key_read is not 0;
bf_info . direction = direction ;
bf_info . thd = ha_thd ( ) ;
bf_info . need_val = need_val ;
2013-02-20 20:36:28 +00:00
bf_info . buf = buf ;
2011-08-16 12:50:38 +00:00
//
// call c_getf_next with purpose of filling in range_query_buff
//
2012-01-23 21:21:23 +00:00
rows_fetched_using_bulk_fetch = 0 ;
2013-02-20 20:36:28 +00:00
// it is expected that we can do ICP in the smart_dbt_bf_callback
// as a result, it's possible we don't return any data because
// none of the rows matched the index condition. Therefore, we need
// this while loop. icp_out_of_range will be set if we hit a row that
// the index condition states is out of our range. When that hits,
// we know all the data in the buffer is the last data we will retrieve
while ( bytes_used_in_range_query_buff = = 0 & & ! icp_went_out_of_range & & error = = 0 ) {
if ( direction > 0 ) {
error = cursor - > c_getf_next ( cursor , flags , smart_dbt_bf_callback , & bf_info ) ;
} else {
error = cursor - > c_getf_prev ( cursor , flags , smart_dbt_bf_callback , & bf_info ) ;
}
}
// if there is no data set and we went out of range,
// then there is nothing to return
if ( bytes_used_in_range_query_buff = = 0 & & icp_went_out_of_range ) {
2013-02-25 23:01:32 +00:00
icp_went_out_of_range = false ;
2013-02-20 20:36:28 +00:00
error = HA_ERR_END_OF_FILE ;
2011-08-16 12:50:38 +00:00
}
2012-01-23 21:21:23 +00:00
if ( bulk_fetch_iteration < HA_TOKU_BULK_FETCH_ITERATION_MAX ) {
bulk_fetch_iteration + + ;
}
2011-08-16 12:50:38 +00:00
2012-08-23 14:16:01 +00:00
error = handle_cursor_error ( error , HA_ERR_END_OF_FILE , tokudb_active_index ) ;
2011-08-16 12:50:38 +00:00
if ( error ) { goto cleanup ; }
//
// now that range_query_buff is filled, read an element
//
error = read_data_from_range_query_buff ( buf , need_val ) ;
}
else {
struct smart_dbt_info info ;
info . ha = this ;
info . buf = buf ;
2012-08-23 14:16:01 +00:00
info . keynr = tokudb_active_index ;
2012-04-02 19:44:50 +00:00
if ( direction > 0 ) {
error = cursor - > c_getf_next ( cursor , flags , SMART_DBT_CALLBACK , & info ) ;
} else {
error = cursor - > c_getf_prev ( cursor , flags , SMART_DBT_CALLBACK , & info ) ;
}
2012-08-23 14:16:01 +00:00
error = handle_cursor_error ( error , HA_ERR_END_OF_FILE , tokudb_active_index ) ;
2011-08-16 12:50:38 +00:00
}
}
2008-07-30 14:43:19 +00:00
//
2011-08-16 12:50:38 +00:00
// at this point, one of two things has happened
// either we have unpacked the data into buf, and we
// are done, or we have unpacked the primary key
// into last_key, and we use the code below to
// read the full row by doing a point query into the
// main table.
2008-07-30 14:43:19 +00:00
//
2011-08-16 12:50:38 +00:00
2012-08-23 14:16:01 +00:00
if ( ! error & & ! key_read & & ( tokudb_active_index ! = primary_key ) & & ! ( table - > key_info [ tokudb_active_index ] . flags & HA_CLUSTERING ) ) {
2008-07-30 14:43:19 +00:00
error = read_full_row ( buf ) ;
}
2009-09-28 19:08:52 +00:00
trx - > stmt_progress . queried + + ;
track_progress ( thd ) ;
2008-06-10 17:03:09 +00:00
cleanup :
2011-08-16 12:50:38 +00:00
return error ;
}
//
// Reads the next row from the active index (cursor) into buf, and advances cursor
// Parameters:
// [out] buf - buffer for the next row, in MySQL format
// Returns:
// 0 on success
// HA_ERR_END_OF_FILE if not found
// error otherwise
//
int ha_tokudb : : index_next ( uchar * buf ) {
TOKUDB_DBUG_ENTER ( " ha_tokudb::index_next " ) ;
2013-02-15 18:25:37 +00:00
ha_statistic_increment ( & SSV : : ha_read_next_count ) ;
2011-08-16 12:50:38 +00:00
int error = get_next ( buf , 1 ) ;
2008-06-09 20:19:52 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-07 20:19:44 +00:00
}
2009-06-13 18:39:42 +00:00
int ha_tokudb : : index_read_last ( uchar * buf , const uchar * key , uint key_len ) {
return ( index_read ( buf , key , key_len , HA_READ_PREFIX_LAST ) ) ;
}
2008-04-17 20:56:40 +00:00
//
// Reads the previous row from the active index (cursor) into buf, and advances cursor
// Parameters:
// [out] buf - buffer for the next row, in MySQL format
// Returns:
// 0 on success
// HA_ERR_END_OF_FILE if not found
// error otherwise
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : index_prev ( uchar * buf ) {
2011-08-16 12:50:38 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::index_prev " ) ;
2013-02-20 21:45:09 +00:00
ha_statistic_increment ( & SSV : : ha_read_prev_count ) ;
2011-08-16 12:50:38 +00:00
int error = get_next ( buf , - 1 ) ;
2008-06-09 20:19:52 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-07 20:19:44 +00:00
}
2008-04-17 20:56:40 +00:00
//
// Reads the first row from the active index (cursor) into buf, and advances cursor
// Parameters:
// [out] buf - buffer for the next row, in MySQL format
// Returns:
// 0 on success
// HA_ERR_END_OF_FILE if not found
// error otherwise
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : index_first ( uchar * buf ) {
2008-03-26 02:47:07 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::index_first " ) ;
2011-08-16 12:50:38 +00:00
invalidate_bulk_fetch ( ) ;
2010-03-25 13:15:03 +00:00
int error = 0 ;
2009-08-19 14:17:12 +00:00
struct smart_dbt_info info ;
2012-07-25 20:48:53 +00:00
uint32_t flags = SET_PRELOCK_FLAG ( 0 ) ;
2009-09-28 19:08:52 +00:00
THD * thd = ha_thd ( ) ;
tokudb_trx_data * trx = ( tokudb_trx_data * ) thd_data_get ( thd , tokudb_hton - > slot ) ; ;
2008-07-30 14:43:19 +00:00
HANDLE_INVALID_CURSOR ( ) ;
2009-08-19 14:17:12 +00:00
2013-02-15 18:25:37 +00:00
ha_statistic_increment ( & SSV : : ha_read_first_count ) ;
2008-07-30 14:43:19 +00:00
2009-08-19 14:17:12 +00:00
info . ha = this ;
info . buf = buf ;
2012-08-23 14:16:01 +00:00
info . keynr = tokudb_active_index ;
2009-08-19 14:17:12 +00:00
2011-10-05 21:55:09 +00:00
error = cursor - > c_getf_first ( cursor , flags ,
SMART_DBT_CALLBACK , & info ) ;
2012-08-23 14:16:01 +00:00
error = handle_cursor_error ( error , HA_ERR_END_OF_FILE , tokudb_active_index ) ;
2009-11-13 21:21:30 +00:00
2009-08-19 14:17:12 +00:00
//
// still need to get entire contents of the row if operation done on
// secondary DB and it was NOT a covering index
//
2012-08-23 14:16:01 +00:00
if ( ! error & & ! key_read & & ( tokudb_active_index ! = primary_key ) & & ! ( table - > key_info [ tokudb_active_index ] . flags & HA_CLUSTERING ) ) {
2009-08-19 14:17:12 +00:00
error = read_full_row ( buf ) ;
2008-07-30 14:43:19 +00:00
}
2009-09-28 19:08:52 +00:00
trx - > stmt_progress . queried + + ;
track_progress ( thd ) ;
2008-06-10 17:03:09 +00:00
cleanup :
2008-06-09 20:19:52 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-07 20:19:44 +00:00
}
2008-04-17 20:56:40 +00:00
//
// Reads the last row from the active index (cursor) into buf, and advances cursor
// Parameters:
// [out] buf - buffer for the next row, in MySQL format
// Returns:
// 0 on success
// HA_ERR_END_OF_FILE if not found
// error otherwise
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : index_last ( uchar * buf ) {
2008-03-26 02:47:07 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::index_last " ) ;
2011-08-16 12:50:38 +00:00
invalidate_bulk_fetch ( ) ;
2010-03-25 13:15:03 +00:00
int error = 0 ;
2009-08-19 14:17:12 +00:00
struct smart_dbt_info info ;
2012-07-25 20:48:53 +00:00
uint32_t flags = SET_PRELOCK_FLAG ( 0 ) ;
2009-09-28 19:08:52 +00:00
THD * thd = ha_thd ( ) ;
tokudb_trx_data * trx = ( tokudb_trx_data * ) thd_data_get ( thd , tokudb_hton - > slot ) ; ;
2008-07-30 14:43:19 +00:00
HANDLE_INVALID_CURSOR ( ) ;
2009-08-19 14:17:12 +00:00
2013-02-15 18:25:37 +00:00
ha_statistic_increment ( & SSV : : ha_read_last_count ) ;
2008-07-30 14:43:19 +00:00
2009-08-19 14:17:12 +00:00
info . ha = this ;
info . buf = buf ;
2012-08-23 14:16:01 +00:00
info . keynr = tokudb_active_index ;
2009-08-19 14:17:12 +00:00
2011-10-05 21:55:09 +00:00
error = cursor - > c_getf_last ( cursor , flags ,
SMART_DBT_CALLBACK , & info ) ;
2012-08-23 14:16:01 +00:00
error = handle_cursor_error ( error , HA_ERR_END_OF_FILE , tokudb_active_index ) ;
2009-08-19 14:17:12 +00:00
//
// still need to get entire contents of the row if operation done on
// secondary DB and it was NOT a covering index
//
2012-08-23 14:16:01 +00:00
if ( ! error & & ! key_read & & ( tokudb_active_index ! = primary_key ) & & ! ( table - > key_info [ tokudb_active_index ] . flags & HA_CLUSTERING ) ) {
2009-08-19 14:17:12 +00:00
error = read_full_row ( buf ) ;
2008-07-30 14:43:19 +00:00
}
2009-09-28 19:08:52 +00:00
if ( trx ) {
trx - > stmt_progress . queried + + ;
}
track_progress ( thd ) ;
2008-06-10 17:03:09 +00:00
cleanup :
2008-06-09 20:19:52 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-07 20:19:44 +00:00
}
2008-04-17 20:56:40 +00:00
//
// Initialize a scan of the table (which is why index_init is called on primary_key)
// Parameters:
// scan - unused
// Returns:
// 0 on success
// error otherwise
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : rnd_init ( bool scan ) {
2008-03-26 02:47:07 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::rnd_init " ) ;
2010-03-25 13:15:03 +00:00
int error = 0 ;
2008-06-17 14:31:53 +00:00
range_lock_grabbed = false ;
2012-08-23 14:16:01 +00:00
error = index_init ( MAX_KEY , 0 ) ;
2010-09-03 20:47:01 +00:00
if ( error ) { goto cleanup ; }
2008-06-06 18:41:08 +00:00
if ( scan ) {
2011-08-16 12:50:38 +00:00
error = prelock_range ( NULL , NULL ) ;
2010-11-24 14:01:48 +00:00
if ( error ) { goto cleanup ; }
2008-06-06 18:41:08 +00:00
}
2008-06-11 21:09:47 +00:00
//
2008-06-17 14:31:53 +00:00
// only want to set range_lock_grabbed to true after index_init
2008-06-11 21:09:47 +00:00
// successfully executed for two reasons:
// 1) index_init will reset it to false anyway
// 2) if it fails, we don't want prelocking on,
//
2008-06-17 14:31:53 +00:00
if ( scan ) { range_lock_grabbed = true ; }
2008-06-11 21:09:47 +00:00
error = 0 ;
2008-06-06 18:41:08 +00:00
cleanup :
2010-11-24 14:01:48 +00:00
if ( error ) {
index_end ( ) ;
last_cursor_error = error ;
}
2008-06-06 18:41:08 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-07 20:19:44 +00:00
}
2008-04-17 20:56:40 +00:00
//
// End a scan of the table
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : rnd_end ( ) {
2008-05-05 18:38:04 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::rnd_end " ) ;
2008-06-17 14:31:53 +00:00
range_lock_grabbed = false ;
2008-05-05 18:38:04 +00:00
TOKUDB_DBUG_RETURN ( index_end ( ) ) ;
2008-02-07 20:19:44 +00:00
}
2008-07-30 14:43:19 +00:00
2008-04-17 20:56:40 +00:00
//
// Read the next row in a table scan
// Parameters:
// [out] buf - buffer for the next row, in MySQL format
// Returns:
// 0 on success
// HA_ERR_END_OF_FILE if not found
// error otherwise
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : rnd_next ( uchar * buf ) {
2008-03-26 02:47:07 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::ha_tokudb::rnd_next " ) ;
2013-02-15 18:25:37 +00:00
ha_statistic_increment ( & SSV : : ha_read_rnd_next_count ) ;
2011-08-16 12:50:38 +00:00
int error = get_next ( buf , 1 ) ;
2008-06-09 20:19:52 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-07 20:19:44 +00:00
}
2009-09-28 19:08:52 +00:00
void ha_tokudb : : track_progress ( THD * thd ) {
tokudb_trx_data * trx = ( tokudb_trx_data * ) thd_data_get ( thd , tokudb_hton - > slot ) ;
if ( trx ) {
2009-10-06 18:07:44 +00:00
ulonglong num_written = trx - > stmt_progress . inserted + trx - > stmt_progress . updated + trx - > stmt_progress . deleted ;
2009-09-28 19:53:20 +00:00
bool update_status =
2009-10-12 13:48:53 +00:00
( trx - > stmt_progress . queried & & tokudb_read_status_frequency & & ( trx - > stmt_progress . queried % tokudb_read_status_frequency ) = = 0 ) | |
2010-02-23 16:42:08 +00:00
( num_written & & tokudb_write_status_frequency & & ( num_written % tokudb_write_status_frequency ) = = 0 ) ;
2009-09-28 19:08:52 +00:00
if ( update_status ) {
2009-10-08 21:06:31 +00:00
char * next_status = write_status_msg ;
bool first = true ;
int r ;
if ( trx - > stmt_progress . queried ) {
2009-10-09 12:25:54 +00:00
r = sprintf ( next_status , " Queried about %llu row%s " , trx - > stmt_progress . queried , trx - > stmt_progress . queried = = 1 ? " " : " s " ) ;
assert ( r > = 0 ) ;
2009-10-08 21:06:31 +00:00
next_status + = r ;
first = false ;
}
if ( trx - > stmt_progress . inserted ) {
2010-07-15 16:18:56 +00:00
if ( trx - > stmt_progress . using_loader ) {
r = sprintf ( next_status , " %sFetched about %llu row%s, loading data still remains " , first ? " " : " , " , trx - > stmt_progress . inserted , trx - > stmt_progress . inserted = = 1 ? " " : " s " ) ;
}
else {
r = sprintf ( next_status , " %sInserted about %llu row%s " , first ? " " : " , " , trx - > stmt_progress . inserted , trx - > stmt_progress . inserted = = 1 ? " " : " s " ) ;
}
2009-10-09 12:25:54 +00:00
assert ( r > = 0 ) ;
2009-10-08 21:06:31 +00:00
next_status + = r ;
first = false ;
}
if ( trx - > stmt_progress . updated ) {
2009-10-09 12:25:54 +00:00
r = sprintf ( next_status , " %sUpdated about %llu row%s " , first ? " " : " , " , trx - > stmt_progress . updated , trx - > stmt_progress . updated = = 1 ? " " : " s " ) ;
assert ( r > = 0 ) ;
2009-10-08 21:06:31 +00:00
next_status + = r ;
first = false ;
}
if ( trx - > stmt_progress . deleted ) {
2009-10-09 12:25:54 +00:00
r = sprintf ( next_status , " %sDeleted about %llu row%s " , first ? " " : " , " , trx - > stmt_progress . deleted , trx - > stmt_progress . deleted = = 1 ? " " : " s " ) ;
assert ( r > = 0 ) ;
2009-10-08 21:06:31 +00:00
next_status + = r ;
first = false ;
}
2009-10-10 12:05:34 +00:00
if ( ! first )
2012-07-26 12:44:37 +00:00
thd_proc_info ( thd , write_status_msg ) ;
2009-09-28 19:08:52 +00:00
}
}
}
2008-02-07 20:19:44 +00:00
DBT * ha_tokudb : : get_pos ( DBT * to , uchar * pos ) {
2008-05-05 18:38:04 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::get_pos " ) ;
2008-02-07 20:19:44 +00:00
/* We don't need to set app_data here */
2012-05-09 18:36:52 +00:00
memset ( ( void * ) to , 0 , sizeof ( * to ) ) ;
2012-07-25 20:48:53 +00:00
to - > data = pos + sizeof ( uint32_t ) ;
to - > size = * ( uint32_t * ) pos ;
2008-02-07 20:19:44 +00:00
DBUG_DUMP ( " key " , ( const uchar * ) to - > data , to - > size ) ;
2008-05-05 18:38:04 +00:00
DBUG_RETURN ( to ) ;
2008-02-07 20:19:44 +00:00
}
2008-04-17 20:56:40 +00:00
//
2008-04-24 22:17:41 +00:00
// Retrieves a row with based on the primary key saved in pos
2008-04-17 20:56:40 +00:00
// Returns:
// 0 on success
// HA_ERR_KEY_NOT_FOUND if not found
// error otherwise
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : rnd_pos ( uchar * buf , uchar * pos ) {
2008-03-26 02:47:07 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::rnd_pos " ) ;
2008-02-07 20:19:44 +00:00
DBT db_pos ;
2010-03-25 13:15:03 +00:00
int error = 0 ;
2009-08-06 15:49:36 +00:00
struct smart_dbt_info info ;
bool old_unpack_entire_row = unpack_entire_row ;
DBT * key = get_pos ( & db_pos , pos ) ;
unpack_entire_row = true ;
2013-02-15 18:25:37 +00:00
ha_statistic_increment ( & SSV : : ha_read_rnd_count ) ;
2012-08-23 14:16:01 +00:00
tokudb_active_index = MAX_KEY ;
2009-08-06 15:49:36 +00:00
info . ha = this ;
info . buf = buf ;
info . keynr = primary_key ;
2011-10-05 21:55:09 +00:00
error = share - > file - > getf_set ( share - > file , transaction ,
get_cursor_isolation_flags ( lock . type , ha_thd ( ) ) ,
key , smart_dbt_callback_rowread_ptquery , & info ) ;
2010-02-12 22:19:57 +00:00
2009-02-09 20:20:30 +00:00
if ( error = = DB_NOTFOUND ) {
2008-07-30 14:43:19 +00:00
error = HA_ERR_KEY_NOT_FOUND ;
goto cleanup ;
}
cleanup :
2009-08-06 15:49:36 +00:00
unpack_entire_row = old_unpack_entire_row ;
2008-07-30 14:43:19 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-05 16:00:53 +00:00
}
2009-07-08 19:08:19 +00:00
int ha_tokudb : : prelock_range ( const key_range * start_key , const key_range * end_key ) {
2011-06-13 18:01:03 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::prelock_range " ) ;
2011-08-16 12:50:38 +00:00
THD * thd = ha_thd ( ) ;
2010-03-25 13:15:03 +00:00
int error = 0 ;
2008-06-06 21:41:22 +00:00
DBT start_dbt_key ;
DBT end_dbt_key ;
2011-08-16 12:50:38 +00:00
uchar * start_key_buff = prelocked_left_range ;
uchar * end_key_buff = prelocked_right_range ;
2008-10-13 17:50:40 +00:00
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & start_dbt_key , 0 , sizeof ( start_dbt_key ) ) ;
memset ( ( void * ) & end_dbt_key , 0 , sizeof ( end_dbt_key ) ) ;
2008-06-06 21:41:22 +00:00
2010-09-03 20:47:01 +00:00
HANDLE_INVALID_CURSOR ( ) ;
2008-06-06 21:41:22 +00:00
if ( start_key ) {
switch ( start_key - > flag ) {
case HA_READ_AFTER_KEY :
2012-08-23 14:16:01 +00:00
pack_key ( & start_dbt_key , tokudb_active_index , start_key_buff , start_key - > key , start_key - > length , COL_POS_INF ) ;
2008-06-06 21:41:22 +00:00
break ;
default :
2012-08-23 14:16:01 +00:00
pack_key ( & start_dbt_key , tokudb_active_index , start_key_buff , start_key - > key , start_key - > length , COL_NEG_INF ) ;
2008-06-06 21:41:22 +00:00
break ;
}
2011-08-16 12:50:38 +00:00
prelocked_left_range_size = start_dbt_key . size ;
}
else {
prelocked_left_range_size = 0 ;
2008-06-06 21:41:22 +00:00
}
2010-09-03 20:47:01 +00:00
2008-06-06 21:41:22 +00:00
if ( end_key ) {
switch ( end_key - > flag ) {
case HA_READ_BEFORE_KEY :
2012-08-23 14:16:01 +00:00
pack_key ( & end_dbt_key , tokudb_active_index , end_key_buff , end_key - > key , end_key - > length , COL_NEG_INF ) ;
2008-06-06 21:41:22 +00:00
break ;
default :
2012-08-23 14:16:01 +00:00
pack_key ( & end_dbt_key , tokudb_active_index , end_key_buff , end_key - > key , end_key - > length , COL_POS_INF ) ;
2008-06-06 21:41:22 +00:00
break ;
2011-06-13 18:01:03 +00:00
}
2011-08-16 12:50:38 +00:00
prelocked_right_range_size = end_dbt_key . size ;
}
else {
prelocked_right_range_size = 0 ;
2008-06-06 21:41:22 +00:00
}
2011-10-05 21:55:09 +00:00
error = cursor - > c_pre_acquire_range_lock (
cursor ,
2012-08-23 14:16:01 +00:00
start_key ? & start_dbt_key : share - > key_file [ tokudb_active_index ] - > dbt_neg_infty ( ) ,
end_key ? & end_dbt_key : share - > key_file [ tokudb_active_index ] - > dbt_pos_infty ( )
2011-10-05 21:55:09 +00:00
) ;
2008-06-10 17:03:09 +00:00
if ( error ) {
last_cursor_error = error ;
//
// cursor should be initialized here, but in case it is not, we still check
//
if ( cursor ) {
2009-12-03 16:59:52 +00:00
int r = cursor - > c_close ( cursor ) ;
assert ( r = = 0 ) ;
2008-06-10 17:03:09 +00:00
cursor = NULL ;
}
goto cleanup ;
}
2008-06-06 21:41:22 +00:00
2011-08-16 12:50:38 +00:00
//
// at this point, determine if we will be doing bulk fetch
// as of now, only do it if we are doing a select
//
doing_bulk_fetch = ( thd_sql_command ( thd ) = = SQLCOM_SELECT ) ;
2012-01-23 21:21:23 +00:00
bulk_fetch_iteration = 0 ;
rows_fetched_using_bulk_fetch = 0 ;
2011-08-16 12:50:38 +00:00
2008-06-06 21:41:22 +00:00
cleanup :
TOKUDB_DBUG_RETURN ( error ) ;
2008-06-05 18:43:49 +00:00
}
2009-07-08 19:08:19 +00:00
2009-07-27 14:52:30 +00:00
//
// Prelock range if possible, start_key is leftmost, end_key is rightmost
// whether scanning forward or backward. This function is called by MySQL
// for backward range queries (in QUICK_SELECT_DESC::get_next).
// Forward scans use read_range_first()/read_range_next().
//
2009-07-08 19:08:19 +00:00
int ha_tokudb : : prepare_range_scan ( const key_range * start_key , const key_range * end_key ) {
2009-07-20 14:23:05 +00:00
int error = prelock_range ( start_key , end_key ) ;
if ( ! error ) {
range_lock_grabbed = true ;
}
return error ;
2009-07-08 19:08:19 +00:00
}
int ha_tokudb : : read_range_first (
const key_range * start_key ,
const key_range * end_key ,
bool eq_range ,
bool sorted )
{
2011-06-13 18:01:03 +00:00
int error = prelock_range ( start_key , end_key ) ;
2009-07-08 19:08:19 +00:00
if ( error ) { goto cleanup ; }
range_lock_grabbed = true ;
error = handler : : read_range_first ( start_key , end_key , eq_range , sorted ) ;
cleanup :
return error ;
}
2011-06-13 18:01:03 +00:00
2008-06-05 18:43:49 +00:00
int ha_tokudb : : read_range_next ( )
{
2008-06-11 21:09:47 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::read_range_next " ) ;
int error ;
error = handler : : read_range_next ( ) ;
if ( error ) {
2008-06-17 14:31:53 +00:00
range_lock_grabbed = false ;
2008-06-11 21:09:47 +00:00
}
TOKUDB_DBUG_RETURN ( error ) ;
2008-06-05 18:43:49 +00:00
}
2008-02-05 16:00:53 +00:00
/*
Set a reference to the current record in ( ref , ref_length ) .
SYNOPSIS
ha_tokudb : : position ( )
record The current record buffer
DESCRIPTION
The BDB handler stores the primary key in ( ref , ref_length ) .
There is either an explicit primary key , or an implicit ( hidden )
primary key .
During open ( ) , ' ref_length ' is calculated as the maximum primary
key length . When an actual key is shorter than that , the rest of
the buffer must be cleared out . The row cannot be identified , if
garbage follows behind the end of the key . There is no length
field for the current key , so that the whole ref_length is used
for comparison .
RETURN
nothing
*/
2008-02-07 20:19:44 +00:00
void ha_tokudb : : position ( const uchar * record ) {
2008-03-26 02:47:07 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::position " ) ;
2008-02-07 20:19:44 +00:00
DBT key ;
if ( hidden_primary_key ) {
2012-07-25 20:48:53 +00:00
DBUG_ASSERT ( ref_length = = ( TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH + sizeof ( uint32_t ) ) ) ;
memcpy_fixed ( ref + sizeof ( uint32_t ) , current_ident , TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH ) ;
* ( uint32_t * ) ref = TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH ;
2008-08-10 16:39:16 +00:00
}
else {
2009-03-24 19:27:28 +00:00
bool has_null ;
//
// save the data
//
2012-07-25 20:48:53 +00:00
create_dbt_key_from_table ( & key , primary_key , ref + sizeof ( uint32_t ) , record , & has_null ) ;
2009-03-24 19:27:28 +00:00
//
// save the size of data in the first four bytes of ref
//
2012-07-25 20:48:53 +00:00
memcpy ( ref , & key . size , sizeof ( uint32_t ) ) ;
2008-02-07 20:19:44 +00:00
}
DBUG_VOID_RETURN ;
}
2008-04-17 20:56:40 +00:00
//
// Per InnoDB: Returns statistics information of the table to the MySQL interpreter,
// in various fields of the handle object.
// Return:
// 0, always success
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : info ( uint flag ) {
2010-03-25 13:30:54 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::info %p %d %lld " , this , flag , ( long long ) share - > rows ) ;
2009-09-04 02:30:35 +00:00
int error ;
DB_TXN * txn = NULL ;
uint curr_num_DBs = table - > s - > keys + test ( hidden_primary_key ) ;
DB_BTREE_STAT64 dict_stats ;
2008-02-07 20:19:44 +00:00
if ( flag & HA_STATUS_VARIABLE ) {
// Just to get optimizations right
2008-12-30 17:41:26 +00:00
stats . records = share - > rows + share - > rows_from_locked_table ;
2010-12-08 21:14:13 +00:00
if ( stats . records = = 0 ) {
stats . records + + ;
}
2008-02-07 20:19:44 +00:00
stats . deleted = 0 ;
2009-09-04 02:30:35 +00:00
if ( ! ( flag & HA_STATUS_NO_LOCK ) ) {
2012-07-25 20:48:53 +00:00
uint64_t num_rows = 0 ;
2010-12-08 15:06:06 +00:00
TOKU_DB_FRAGMENTATION_S frag_info ;
memset ( & frag_info , 0 , sizeof frag_info ) ;
2010-03-25 13:30:54 +00:00
2009-09-04 02:30:35 +00:00
error = db_env - > txn_begin ( db_env , NULL , & txn , DB_READ_UNCOMMITTED ) ;
if ( error ) { goto cleanup ; }
2012-03-23 15:49:27 +00:00
// we should always have a primary key
assert ( share - > file ! = NULL ) ;
2010-03-06 00:58:21 +00:00
error = estimate_num_rows ( share - > file , & num_rows , txn ) ;
if ( error = = 0 ) {
share - > rows = num_rows ;
stats . records = num_rows ;
2010-12-08 21:14:13 +00:00
if ( stats . records = = 0 ) {
stats . records + + ;
}
2010-03-06 00:58:21 +00:00
}
else {
goto cleanup ;
}
2010-03-09 02:55:50 +00:00
error = share - > file - > get_fragmentation (
share - > file ,
& frag_info
) ;
if ( error ) { goto cleanup ; }
stats . delete_length = frag_info . unused_bytes ;
2010-03-06 00:58:21 +00:00
2009-09-04 02:30:35 +00:00
error = share - > file - > stat64 (
share - > file ,
txn ,
& dict_stats
) ;
if ( error ) { goto cleanup ; }
2009-09-22 14:49:41 +00:00
2011-10-13 03:19:36 +00:00
stats . create_time = dict_stats . bt_create_time_sec ;
stats . update_time = dict_stats . bt_modify_time_sec ;
2012-03-08 22:12:09 +00:00
stats . check_time = dict_stats . bt_verify_time_sec ;
2009-09-04 02:30:35 +00:00
stats . data_file_length = dict_stats . bt_dsize ;
2009-09-22 14:49:41 +00:00
if ( hidden_primary_key ) {
//
// in this case, we have a hidden primary key, do not
// want to report space taken up by the hidden primary key to the user
//
2012-07-25 20:48:53 +00:00
uint64_t hpk_space = TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH * dict_stats . bt_ndata ;
2009-09-22 14:49:41 +00:00
stats . data_file_length = ( hpk_space > stats . data_file_length ) ? 0 : stats . data_file_length - hpk_space ;
}
else {
//
// one infinity byte per key needs to be subtracted
//
2012-07-25 20:48:53 +00:00
uint64_t inf_byte_space = dict_stats . bt_ndata ;
2009-09-22 14:49:41 +00:00
stats . data_file_length = ( inf_byte_space > stats . data_file_length ) ? 0 : stats . data_file_length - inf_byte_space ;
}
2009-09-09 14:16:39 +00:00
stats . mean_rec_length = stats . records ? ( ulong ) ( stats . data_file_length / stats . records ) : 0 ;
2009-09-04 02:30:35 +00:00
stats . index_file_length = 0 ;
2012-03-23 15:49:27 +00:00
// curr_num_DBs is the number of keys we have, according
// to the mysql layer. if drop index is running concurrently
// with info() (it can, because info does not take table locks),
// then it could be the case that one of the dbs was dropped
// and set to NULL before mysql was able to set table->s->keys
// accordingly.
//
// we should just ignore any DB * that is NULL.
//
// this solution is much simpler than trying to maintain an
// accurate number of valid keys at the handlerton layer.
2009-09-04 02:30:35 +00:00
for ( uint i = 0 ; i < curr_num_DBs ; i + + ) {
2012-03-23 15:49:27 +00:00
// skip the primary key, skip dropped indexes
if ( i = = primary_key | | share - > key_file [ i ] = = NULL ) {
2009-09-04 02:30:35 +00:00
continue ;
}
error = share - > key_file [ i ] - > stat64 (
share - > key_file [ i ] ,
txn ,
& dict_stats
) ;
if ( error ) { goto cleanup ; }
stats . index_file_length + = dict_stats . bt_dsize ;
2010-03-09 02:55:50 +00:00
error = share - > file - > get_fragmentation (
share - > file ,
& frag_info
) ;
if ( error ) { goto cleanup ; }
stats . delete_length + = frag_info . unused_bytes ;
2009-09-04 02:30:35 +00:00
}
}
2008-02-07 20:19:44 +00:00
}
2008-07-03 19:42:49 +00:00
if ( ( flag & HA_STATUS_CONST ) ) {
2009-09-09 16:48:15 +00:00
stats . max_data_file_length = 9223372036854775807ULL ;
2008-02-07 20:19:44 +00:00
for ( uint i = 0 ; i < table_share - > keys ; i + + ) {
2012-10-12 14:22:20 +00:00
bool is_unique_key = ( i = = primary_key ) | | ( table - > key_info [ i ] . flags & HA_NOSAME ) ;
ulong val = ( is_unique_key ) ? 1 : 0 ;
2012-12-12 18:37:24 +00:00
table - > key_info [ i ] . rec_per_key [ get_key_parts ( & table - > key_info [ i ] ) - 1 ] = val ;
2008-02-07 20:19:44 +00:00
}
}
/* Don't return key if we got an error for the internal primary key */
2008-10-10 21:13:23 +00:00
if ( flag & HA_STATUS_ERRKEY & & last_dup_key < table_share - > keys ) {
2008-02-07 20:19:44 +00:00
errkey = last_dup_key ;
2008-10-10 21:13:23 +00:00
}
2008-11-18 22:20:06 +00:00
if ( flag & HA_STATUS_AUTO & & table - > found_next_number_field ) {
2008-10-10 21:13:23 +00:00
THD * thd = table - > in_use ;
struct system_variables * variables = & thd - > variables ;
2008-11-18 22:20:06 +00:00
stats . auto_increment_value = share - > last_auto_increment + variables - > auto_increment_increment ;
}
2009-09-04 02:30:35 +00:00
error = 0 ;
cleanup :
if ( txn ! = NULL ) {
2009-11-10 19:22:08 +00:00
commit_txn ( txn , DB_TXN_NOSYNC ) ;
2009-09-04 02:30:35 +00:00
txn = NULL ;
}
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-07 20:19:44 +00:00
}
2008-04-17 20:56:40 +00:00
//
// Per InnoDB: Tells something additional to the handler about how to do things.
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : extra ( enum ha_extra_function operation ) {
2008-04-17 11:12:01 +00:00
TOKUDB_DBUG_ENTER ( " extra %p %d " , this , operation ) ;
2008-02-07 20:19:44 +00:00
switch ( operation ) {
case HA_EXTRA_RESET_STATE :
reset ( ) ;
break ;
case HA_EXTRA_KEYREAD :
key_read = 1 ; // Query satisfied with key
break ;
case HA_EXTRA_NO_KEYREAD :
key_read = 0 ;
break ;
case HA_EXTRA_IGNORE_DUP_KEY :
using_ignore = 1 ;
break ;
case HA_EXTRA_NO_IGNORE_DUP_KEY :
using_ignore = 0 ;
break ;
default :
break ;
}
2008-04-17 11:12:01 +00:00
TOKUDB_DBUG_RETURN ( 0 ) ;
2008-02-07 20:19:44 +00:00
}
int ha_tokudb : : reset ( void ) {
2008-05-05 18:38:04 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::reset " ) ;
2008-02-07 20:19:44 +00:00
key_read = 0 ;
using_ignore = 0 ;
2013-02-17 03:44:31 +00:00
reset_dsmrr ( ) ;
2013-02-20 20:36:28 +00:00
invalidate_icp ( ) ;
2008-05-05 18:38:04 +00:00
TOKUDB_DBUG_RETURN ( 0 ) ;
2008-02-05 16:00:53 +00:00
}
2008-06-26 15:43:33 +00:00
//
// helper function that iterates through all DB's
// and grabs a lock (either read or write, but not both)
// Parameters:
// [in] trans - transaction to be used to pre acquire the lock
// lt - type of lock to get, either lock_read or lock_write
// Returns:
// 0 on success
// error otherwise
//
int ha_tokudb : : acquire_table_lock ( DB_TXN * trans , TABLE_LOCK_TYPE lt ) {
int error = ENOSYS ;
2010-11-17 23:09:06 +00:00
rw_rdlock ( & share - > num_DBs_lock ) ;
uint curr_num_DBs = share - > num_DBs ;
2008-06-26 15:43:33 +00:00
if ( lt = = lock_read ) {
2010-09-03 20:47:01 +00:00
error = 0 ;
goto cleanup ;
2008-06-26 15:43:33 +00:00
}
else if ( lt = = lock_write ) {
2009-04-13 21:23:37 +00:00
if ( tokudb_debug & TOKUDB_DEBUG_LOCK )
TOKUDB_TRACE ( " %s \n " , __FUNCTION__ ) ;
2008-06-26 15:43:33 +00:00
for ( uint i = 0 ; i < curr_num_DBs ; i + + ) {
DB * db = share - > key_file [ i ] ;
error = db - > pre_acquire_table_lock ( db , trans ) ;
2009-04-13 21:23:37 +00:00
if ( error = = EINVAL )
TOKUDB_TRACE ( " %s %d db=%p trans=%p \n " , __FUNCTION__ , i , db , trans ) ;
if ( error ) break ;
2008-06-26 15:43:33 +00:00
}
2009-04-13 21:23:37 +00:00
if ( tokudb_debug & TOKUDB_DEBUG_LOCK )
TOKUDB_TRACE ( " %s error=%d \n " , __FUNCTION__ , error ) ;
if ( error ) goto cleanup ;
2008-06-26 15:43:33 +00:00
}
else {
error = ENOSYS ;
goto cleanup ;
}
error = 0 ;
cleanup :
2010-11-17 23:09:06 +00:00
rw_unlock ( & share - > num_DBs_lock ) ;
2008-06-26 15:43:33 +00:00
return error ;
}
2009-08-25 20:48:12 +00:00
int ha_tokudb : : create_txn ( THD * thd , tokudb_trx_data * trx ) {
int error ;
ulong tx_isolation = thd_tx_isolation ( thd ) ;
HA_TOKU_ISO_LEVEL toku_iso_level = tx_to_toku_iso ( tx_isolation ) ;
2011-11-04 01:48:38 +00:00
bool is_autocommit = ! thd_test_options (
thd , OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN ) ;
2009-08-25 20:48:12 +00:00
/* First table lock, start transaction */
2010-05-04 17:11:34 +00:00
if ( thd_test_options ( thd , OPTION_NOT_AUTOCOMMIT | OPTION_BEGIN ) & &
2009-08-25 20:48:12 +00:00
! trx - > all & &
( thd_sql_command ( thd ) ! = SQLCOM_CREATE_TABLE ) & &
( thd_sql_command ( thd ) ! = SQLCOM_DROP_TABLE ) & &
2011-03-04 19:54:23 +00:00
( thd_sql_command ( thd ) ! = SQLCOM_DROP_INDEX ) & &
( thd_sql_command ( thd ) ! = SQLCOM_CREATE_INDEX ) & &
2009-08-25 20:48:12 +00:00
( thd_sql_command ( thd ) ! = SQLCOM_ALTER_TABLE ) ) {
/* QQQ We have to start a master transaction */
2010-05-04 17:11:34 +00:00
// DBUG_PRINT("trans", ("starting transaction all "));
2009-08-25 20:48:12 +00:00
if ( ( error = db_env - > txn_begin ( db_env , NULL , & trx - > all , toku_iso_to_txn_flag ( toku_iso_level ) ) ) ) {
trx - > tokudb_lock_count - - ; // We didn't get the lock
goto cleanup ;
}
if ( tokudb_debug & TOKUDB_DEBUG_TXN ) {
2010-07-05 14:35:31 +00:00
TOKUDB_TRACE ( " just created master:%p \n " , trx - > all ) ;
2009-08-25 20:48:12 +00:00
}
trx - > sp_level = trx - > all ;
2012-07-25 20:48:53 +00:00
trans_register_ha ( thd , true , tokudb_hton ) ;
2009-08-25 20:48:12 +00:00
}
DBUG_PRINT ( " trans " , ( " starting transaction stmt " ) ) ;
if ( trx - > stmt ) {
if ( tokudb_debug & TOKUDB_DEBUG_TXN ) {
TOKUDB_TRACE ( " warning:stmt=%p \n " , trx - > stmt ) ;
}
}
2012-07-25 20:48:53 +00:00
uint32_t txn_begin_flags ;
2010-01-11 18:24:50 +00:00
if ( trx - > all = = NULL ) {
2009-08-25 20:48:12 +00:00
txn_begin_flags = toku_iso_to_txn_flag ( toku_iso_level ) ;
2012-11-16 14:45:19 +00:00
//
// if the isolation level that the user has set is serializable,
// but autocommit is on and this is just a select,
// then we can go ahead and set the isolation level to
// be a snapshot read, because we can serialize
// the transaction to be the point in time at which the snapshot began.
//
2011-11-14 19:00:44 +00:00
if ( txn_begin_flags = = 0 & & is_autocommit & & thd_sql_command ( thd ) = = SQLCOM_SELECT ) {
2011-11-04 01:48:38 +00:00
txn_begin_flags = DB_TXN_SNAPSHOT ;
}
2009-08-25 20:48:12 +00:00
}
else {
2010-01-11 18:24:50 +00:00
txn_begin_flags = DB_INHERIT_ISOLATION ;
2009-08-25 20:48:12 +00:00
}
if ( ( error = db_env - > txn_begin ( db_env , trx - > sp_level , & trx - > stmt , txn_begin_flags ) ) ) {
/* We leave the possible master transaction open */
trx - > tokudb_lock_count - - ; // We didn't get the lock
goto cleanup ;
}
2010-07-05 14:35:31 +00:00
trx - > sub_sp_level = trx - > stmt ;
2009-08-25 20:48:12 +00:00
if ( tokudb_debug & TOKUDB_DEBUG_TXN ) {
2010-07-05 14:35:31 +00:00
TOKUDB_TRACE ( " just created stmt:%p:%p \n " , trx - > sp_level , trx - > stmt ) ;
2009-08-25 20:48:12 +00:00
}
2009-09-28 19:08:52 +00:00
reset_stmt_progress ( & trx - > stmt_progress ) ;
2012-07-25 20:48:53 +00:00
trans_register_ha ( thd , false , tokudb_hton ) ;
2009-08-25 20:48:12 +00:00
cleanup :
return error ;
}
2008-06-26 15:43:33 +00:00
2008-02-05 16:00:53 +00:00
/*
As MySQL will execute an external lock for every new table it uses
we can use this to start the transactions .
If we are in auto_commit mode we just need to start a transaction
for the statement to be able to rollback the statement .
If not , we have to start a master transaction if there doesn ' t exist
one from before .
*/
2008-04-17 20:56:40 +00:00
//
// Parameters:
// [in] thd - handle to the user thread
// lock_type - the type of lock
// Returns:
// 0 on success
// error otherwise
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : external_lock ( THD * thd , int lock_type ) {
2009-04-13 21:23:37 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::external_lock cmd=%d %d " , thd_sql_command ( thd ) , lock_type ) ;
if ( tokudb_debug & TOKUDB_DEBUG_LOCK )
TOKUDB_TRACE ( " %s cmd=%d %d \n " , __FUNCTION__ , thd_sql_command ( thd ) , lock_type ) ;
2011-06-13 18:01:03 +00:00
2008-06-25 19:12:59 +00:00
int error = 0 ;
tokudb_trx_data * trx = NULL ;
trx = ( tokudb_trx_data * ) thd_data_get ( thd , tokudb_hton - > slot ) ;
2008-02-07 20:19:44 +00:00
if ( ! trx ) {
2009-09-29 21:47:37 +00:00
error = create_tokudb_trx_data_instance ( & trx ) ;
if ( error ) { goto cleanup ; }
2008-05-02 17:36:22 +00:00
thd_data_set ( thd , tokudb_hton - > slot , trx ) ;
2008-02-07 20:19:44 +00:00
}
2008-10-08 18:29:32 +00:00
if ( trx - > all = = NULL ) {
trx - > sp_level = NULL ;
2008-06-17 14:31:53 +00:00
}
2008-02-07 20:19:44 +00:00
if ( lock_type ! = F_UNLCK ) {
2011-03-04 19:54:23 +00:00
is_fast_alter_running = false ;
2011-06-13 18:01:03 +00:00
use_write_locks = false ;
2011-06-21 18:18:06 +00:00
if ( lock_type = = F_WRLCK )
2011-06-13 18:01:03 +00:00
use_write_locks = true ;
2008-02-07 20:19:44 +00:00
if ( ! trx - > tokudb_lock_count + + ) {
DBUG_ASSERT ( trx - > stmt = = 0 ) ;
2008-04-18 19:54:14 +00:00
transaction = NULL ; // Safety
2009-08-25 20:48:12 +00:00
error = create_txn ( thd , trx ) ;
if ( error ) {
2008-06-25 19:12:59 +00:00
goto cleanup ;
2008-02-07 20:19:44 +00:00
}
}
2010-07-05 14:35:31 +00:00
assert ( thd - > in_sub_stmt = = 0 ) ;
transaction = trx - > sub_sp_level ;
2008-06-17 14:31:53 +00:00
}
else {
2008-07-08 01:59:46 +00:00
pthread_mutex_lock ( & share - > mutex ) ;
// hate dealing with comparison of signed vs unsigned, so doing this
if ( deleted_rows > added_rows & & share - > rows < ( deleted_rows - added_rows ) ) {
share - > rows = 0 ;
}
else {
share - > rows + = ( added_rows - deleted_rows ) ;
}
pthread_mutex_unlock ( & share - > mutex ) ;
added_rows = 0 ;
deleted_rows = 0 ;
2008-12-30 17:41:26 +00:00
share - > rows_from_locked_table = 0 ;
2012-08-08 17:45:04 +00:00
if ( trx - > tokudb_lock_count > 0 & & ! - - trx - > tokudb_lock_count ) {
2008-02-07 20:19:44 +00:00
if ( trx - > stmt ) {
/*
F_UNLCK is done without a transaction commit / rollback .
This happens if the thread didn ' t update any rows
We must in this case commit the work to keep the row locks
*/
DBUG_PRINT ( " trans " , ( " commiting non-updating transaction " ) ) ;
2009-09-28 19:08:52 +00:00
reset_stmt_progress ( & trx - > stmt_progress ) ;
2011-03-04 19:54:23 +00:00
if ( ! is_fast_alter_running ) {
2012-10-11 20:36:38 +00:00
commit_txn ( trx - > stmt , 0 ) ;
if ( tokudb_debug & TOKUDB_DEBUG_TXN ) {
TOKUDB_TRACE ( " commit:%p:%d \n " , trx - > stmt , error ) ;
2011-03-04 19:54:23 +00:00
}
trx - > stmt = NULL ;
trx - > sub_sp_level = NULL ;
}
2008-03-06 19:00:18 +00:00
}
}
2008-07-03 16:30:01 +00:00
transaction = NULL ;
2011-03-04 19:54:23 +00:00
is_fast_alter_running = false ;
2008-02-07 20:19:44 +00:00
}
2008-06-25 19:12:59 +00:00
cleanup :
2009-04-13 21:23:37 +00:00
if ( tokudb_debug & TOKUDB_DEBUG_LOCK )
TOKUDB_TRACE ( " %s error=%d \n " , __FUNCTION__ , error ) ;
2008-03-21 23:47:22 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-05 16:00:53 +00:00
}
/*
When using LOCK TABLE ' s external_lock is only called when the actual
TABLE LOCK is done .
Under LOCK TABLES , each used tables will force a call to start_stmt .
*/
2008-02-07 20:19:44 +00:00
int ha_tokudb : : start_stmt ( THD * thd , thr_lock_type lock_type ) {
2010-07-05 14:35:31 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::start_stmt cmd=%d %d " , thd_sql_command ( thd ) , lock_type ) ;
2008-02-07 20:19:44 +00:00
int error = 0 ;
2009-01-20 21:06:49 +00:00
2008-05-02 17:36:22 +00:00
tokudb_trx_data * trx = ( tokudb_trx_data * ) thd_data_get ( thd , tokudb_hton - > slot ) ;
2008-02-07 20:19:44 +00:00
DBUG_ASSERT ( trx ) ;
/*
note that trx - > stmt may have been already initialized as start_stmt ( )
is called for * each table * not for each storage engine ,
and there could be many bdb tables referenced in the query
*/
if ( ! trx - > stmt ) {
2009-08-25 20:48:12 +00:00
error = create_txn ( thd , trx ) ;
if ( error ) {
goto cleanup ;
}
2008-02-07 20:19:44 +00:00
}
2010-07-05 14:35:31 +00:00
else {
if ( tokudb_debug & TOKUDB_DEBUG_TXN ) {
TOKUDB_TRACE ( " trx->stmt already existed \n " ) ;
}
}
2009-08-11 16:52:44 +00:00
//
// we know we are in lock tables
// attempt to grab a table lock
// if fail, continue, do not return error
// This is because a failure ok, it simply means
// another active transaction has some locks.
// That other transaction modify this table
// until it is unlocked, therefore having acquire_table_lock
// potentially grab some locks but not all is ok.
//
if ( lock . type < = TL_READ_NO_INSERT ) {
2010-07-05 14:35:31 +00:00
acquire_table_lock ( trx - > sub_sp_level , lock_read ) ;
2009-08-11 16:52:44 +00:00
}
else {
2010-08-25 14:30:20 +00:00
if ( ! ( thd_sql_command ( thd ) = = SQLCOM_CREATE_INDEX | |
thd_sql_command ( thd ) = = SQLCOM_ALTER_TABLE | |
thd_sql_command ( thd ) = = SQLCOM_DROP_INDEX | |
thd_sql_command ( thd ) = = SQLCOM_TRUNCATE ) ) {
acquire_table_lock ( trx - > sub_sp_level , lock_write ) ;
}
2009-08-11 16:52:44 +00:00
}
2008-12-30 17:41:26 +00:00
if ( added_rows > deleted_rows ) {
share - > rows_from_locked_table = added_rows - deleted_rows ;
}
2010-07-05 14:35:31 +00:00
transaction = trx - > sub_sp_level ;
2012-07-25 20:48:53 +00:00
trans_register_ha ( thd , false , tokudb_hton ) ;
2009-08-25 20:48:12 +00:00
cleanup :
2008-03-21 23:47:22 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-05 16:00:53 +00:00
}
2010-09-03 20:47:01 +00:00
2012-07-25 20:48:53 +00:00
uint32_t ha_tokudb : : get_cursor_isolation_flags ( enum thr_lock_type lock_type , THD * thd ) {
2010-09-03 20:47:01 +00:00
uint sql_command = thd_sql_command ( thd ) ;
bool in_lock_tables = thd_in_lock_tables ( thd ) ;
2010-09-16 14:55:19 +00:00
//
// following InnoDB's lead and having checksum command use a snapshot read if told
//
if ( sql_command = = SQLCOM_CHECKSUM ) {
return 0 ;
}
else if ( ( lock_type = = TL_READ & & in_lock_tables ) | |
2011-06-13 18:01:03 +00:00
( lock_type = = TL_READ_HIGH_PRIORITY & & in_lock_tables ) | |
sql_command ! = SQLCOM_SELECT | |
( sql_command = = SQLCOM_SELECT & & lock_type > = TL_WRITE_ALLOW_WRITE ) ) { // select for update
2013-02-07 16:56:44 +00:00
ulong tx_isolation = thd_tx_isolation ( thd ) ;
// pattern matched from InnoDB
if ( ( tx_isolation = = ISO_READ_COMMITTED | | tx_isolation = = ISO_READ_UNCOMMITTED ) & &
( lock_type = = TL_READ | | lock_type = = TL_READ_NO_INSERT ) & &
( sql_command = = SQLCOM_INSERT_SELECT
| | sql_command = = SQLCOM_REPLACE_SELECT
| | sql_command = = SQLCOM_UPDATE
| | sql_command = = SQLCOM_CREATE_TABLE ) )
{
return 0 ;
}
else {
return DB_SERIALIZABLE ;
}
2010-09-03 20:47:01 +00:00
}
else {
return 0 ;
}
}
2008-02-05 16:00:53 +00:00
/*
The idea with handler : : store_lock ( ) is the following :
The statement decided which locks we should need for the table
for updates / deletes / inserts we get WRITE locks , for SELECT . . . we get
read locks .
Before adding the lock into the table lock handler ( see thr_lock . c )
mysqld calls store lock with the requested locks . Store lock can now
modify a write lock to a read lock ( or some other lock ) , ignore the
lock ( if we don ' t want to use MySQL table locks at all ) or add locks
for many tables ( like we do when we are using a MERGE handler ) .
Tokudb DB changes all WRITE locks to TL_WRITE_ALLOW_WRITE ( which
signals that we are doing WRITES , but we are still allowing other
reader ' s and writer ' s .
When releasing locks , store_lock ( ) are also called . In this case one
usually doesn ' t have to do anything .
In some exceptional cases MySQL may send a request for a TL_IGNORE ;
This means that we are requesting the same lock as last time and this
should also be ignored . ( This may happen when someone does a flush
table when we have opened a part of the tables , in which case mysqld
closes and reopens the tables and tries to get the same locks at last
time ) . In the future we will probably try to remove this .
*/
2008-02-07 20:19:44 +00:00
THR_LOCK_DATA * * ha_tokudb : : store_lock ( THD * thd , THR_LOCK_DATA * * to , enum thr_lock_type lock_type ) {
2008-07-21 13:27:13 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::store_lock, lock_type=%d cmd=%d " , lock_type , thd_sql_command ( thd ) ) ;
2010-11-17 23:09:06 +00:00
if ( tokudb_debug & TOKUDB_DEBUG_LOCK ) {
2009-04-13 21:23:37 +00:00
TOKUDB_TRACE ( " %s lock_type=%d cmd=%d \n " , __FUNCTION__ , lock_type , thd_sql_command ( thd ) ) ;
2010-11-17 23:09:06 +00:00
}
2011-01-21 15:09:18 +00:00
if ( lock_type ! = TL_IGNORE & & lock . type = = TL_UNLOCK ) {
// if creating a hot index
2012-10-18 17:41:38 +00:00
if ( thd_sql_command ( thd ) = = SQLCOM_CREATE_INDEX & & get_create_index_online ( thd ) ) {
2011-01-21 15:09:18 +00:00
rw_rdlock ( & share - > num_DBs_lock ) ;
if ( share - > num_DBs = = ( table - > s - > keys + test ( hidden_primary_key ) ) ) {
lock_type = TL_WRITE_ALLOW_WRITE ;
}
lock . type = lock_type ;
rw_unlock ( & share - > num_DBs_lock ) ;
2012-02-08 19:44:10 +00:00
}
2012-05-21 18:56:56 +00:00
2012-04-02 18:27:34 +00:00
// 5.5 supports reads concurrent with alter table. just use the default lock type.
2012-05-21 18:56:56 +00:00
# if MYSQL_VERSION_ID < 50500
2012-02-08 19:44:10 +00:00
else if ( thd_sql_command ( thd ) = = SQLCOM_CREATE_INDEX | |
thd_sql_command ( thd ) = = SQLCOM_ALTER_TABLE | |
thd_sql_command ( thd ) = = SQLCOM_DROP_INDEX ) {
2012-04-02 18:27:34 +00:00
// force alter table to lock out other readers
2012-02-08 19:44:10 +00:00
lock_type = TL_WRITE ;
2012-02-08 19:50:06 +00:00
lock . type = lock_type ;
2012-02-08 19:44:10 +00:00
}
2012-04-02 18:27:34 +00:00
# endif
2012-02-08 19:44:10 +00:00
else {
2011-01-21 15:09:18 +00:00
// If we are not doing a LOCK TABLE, then allow multiple writers
if ( ( lock_type > = TL_WRITE_CONCURRENT_INSERT & & lock_type < = TL_WRITE ) & &
! thd - > in_lock_tables & & thd_sql_command ( thd ) ! = SQLCOM_TRUNCATE & & ! thd_tablespace_op ( thd ) ) {
lock_type = TL_WRITE_ALLOW_WRITE ;
}
lock . type = lock_type ;
2008-06-17 14:31:53 +00:00
}
2008-02-05 16:00:53 +00:00
}
2008-02-07 20:19:44 +00:00
* to + + = & lock ;
2009-04-13 21:23:37 +00:00
if ( tokudb_debug & TOKUDB_DEBUG_LOCK )
TOKUDB_TRACE ( " %s lock_type=%d \n " , __FUNCTION__ , lock_type ) ;
2008-05-05 18:38:04 +00:00
DBUG_RETURN ( to ) ;
2008-02-07 20:19:44 +00:00
}
2012-04-03 04:25:26 +00:00
static inline enum row_type
compression_method_to_row_type ( enum toku_compression_method method )
{
switch ( method ) {
2012-05-01 15:42:21 +00:00
# if TOKU_INCLUDE_ROW_TYPE_COMPRESSION
2012-04-03 04:25:26 +00:00
case TOKU_NO_COMPRESSION :
return ROW_TYPE_TOKU_UNCOMPRESSED ;
case TOKU_ZLIB_METHOD :
2013-01-23 21:22:33 +00:00
case TOKU_ZLIB_WITHOUT_CHECKSUM_METHOD :
2012-04-03 04:25:26 +00:00
return ROW_TYPE_TOKU_ZLIB ;
case TOKU_QUICKLZ_METHOD :
return ROW_TYPE_TOKU_QUICKLZ ;
case TOKU_LZMA_METHOD :
return ROW_TYPE_TOKU_LZMA ;
case TOKU_FAST_COMPRESSION_METHOD :
return ROW_TYPE_TOKU_FAST ;
case TOKU_SMALL_COMPRESSION_METHOD :
return ROW_TYPE_TOKU_SMALL ;
2012-04-16 20:04:07 +00:00
# endif
2012-04-05 22:14:13 +00:00
case TOKU_DEFAULT_COMPRESSION_METHOD :
return ROW_TYPE_DEFAULT ;
2012-04-03 04:25:26 +00:00
default :
assert ( false ) ;
}
}
2012-04-04 15:12:36 +00:00
static enum row_type
get_row_type_for_key ( DB * file )
2012-04-03 04:25:26 +00:00
{
enum toku_compression_method method ;
2012-04-04 15:12:36 +00:00
int r = file - > get_compression_method ( file , & method ) ;
2012-04-03 04:25:26 +00:00
assert ( r = = 0 ) ;
return compression_method_to_row_type ( method ) ;
}
2012-04-04 15:12:36 +00:00
enum row_type
2012-04-04 20:44:23 +00:00
# if MYSQL_VERSION_ID >= 50521
ha_tokudb : : get_row_type ( void ) const
# else
2012-04-04 15:12:36 +00:00
ha_tokudb : : get_row_type ( void )
2012-04-04 20:44:23 +00:00
# endif
2012-04-04 15:12:36 +00:00
{
return get_row_type_for_key ( share - > file ) ;
}
2012-04-03 04:25:26 +00:00
static inline enum toku_compression_method
row_type_to_compression_method ( enum row_type type )
{
switch ( type ) {
2012-05-01 15:42:21 +00:00
# if TOKU_INCLUDE_ROW_TYPE_COMPRESSION
2012-04-03 04:25:26 +00:00
case ROW_TYPE_TOKU_UNCOMPRESSED :
return TOKU_NO_COMPRESSION ;
case ROW_TYPE_TOKU_ZLIB :
2013-01-23 21:22:33 +00:00
return TOKU_ZLIB_WITHOUT_CHECKSUM_METHOD ;
2012-04-03 04:25:26 +00:00
case ROW_TYPE_TOKU_QUICKLZ :
return TOKU_QUICKLZ_METHOD ;
case ROW_TYPE_TOKU_LZMA :
return TOKU_LZMA_METHOD ;
case ROW_TYPE_TOKU_SMALL :
return TOKU_SMALL_COMPRESSION_METHOD ;
2012-04-03 20:25:47 +00:00
case ROW_TYPE_TOKU_FAST :
return TOKU_FAST_COMPRESSION_METHOD ;
2012-04-16 20:04:07 +00:00
# endif
2012-04-05 22:14:13 +00:00
default :
DBUG_PRINT ( " info " , ( " Ignoring ROW_FORMAT not used by TokuDB, using TOKUDB_FAST by default instead " ) ) ;
case ROW_TYPE_DEFAULT :
return TOKU_DEFAULT_COMPRESSION_METHOD ;
2012-04-03 04:25:26 +00:00
}
}
2011-07-12 21:56:07 +00:00
static int create_sub_table (
const char * table_name ,
DBT * row_descriptor ,
DB_TXN * txn ,
uint32_t block_size ,
2012-04-03 04:25:26 +00:00
uint32_t read_block_size ,
2012-04-04 15:12:36 +00:00
enum toku_compression_method compression_method ,
2011-07-12 21:56:07 +00:00
bool is_hot_index
)
{
2008-03-26 02:47:07 +00:00
TOKUDB_DBUG_ENTER ( " create_sub_table " ) ;
2008-02-07 20:19:44 +00:00
int error ;
2009-04-01 17:54:56 +00:00
DB * file = NULL ;
2012-07-25 20:48:53 +00:00
uint32_t create_flags ;
2009-04-01 20:08:32 +00:00
2009-04-01 17:54:56 +00:00
error = db_create ( & file , db_env , 0 ) ;
if ( error ) {
DBUG_PRINT ( " error " , ( " Got error: %d when creating table " , error ) ) ;
my_errno = error ;
goto exit ;
}
2010-12-17 18:16:54 +00:00
2010-12-20 18:56:29 +00:00
if ( block_size ! = 0 ) {
error = file - > set_pagesize ( file , block_size ) ;
2010-12-17 18:16:54 +00:00
if ( error ! = 0 ) {
2010-12-20 18:56:29 +00:00
DBUG_PRINT ( " error " , ( " Got error: %d when setting block size %u for table '%s' " , error , block_size , table_name ) ) ;
2010-12-17 18:16:54 +00:00
goto exit ;
}
}
2011-07-12 21:56:07 +00:00
if ( read_block_size ! = 0 ) {
error = file - > set_readpagesize ( file , read_block_size ) ;
if ( error ! = 0 ) {
DBUG_PRINT ( " error " , ( " Got error: %d when setting read block size %u for table '%s' " , error , read_block_size , table_name ) ) ;
goto exit ;
}
}
2012-05-15 14:09:02 +00:00
error = file - > set_compression_method ( file , compression_method ) ;
if ( error ! = 0 ) {
DBUG_PRINT ( " error " , ( " Got error: %d when setting compression type %u for table '%s' " , error , compression_method , table_name ) ) ;
goto exit ;
}
2011-01-06 19:02:48 +00:00
create_flags = DB_THREAD | DB_CREATE | DB_EXCL | ( is_hot_index ? DB_IS_HOT_INDEX : 0 ) ;
error = file - > open ( file , txn , table_name , NULL , DB_BTREE , create_flags , my_umask ) ;
2009-04-01 17:54:56 +00:00
if ( error ) {
DBUG_PRINT ( " error " , ( " Got error: %d when opening table '%s' " , error , table_name ) ) ;
goto exit ;
}
2008-02-07 20:19:44 +00:00
2012-04-04 19:53:17 +00:00
error = file - > change_descriptor ( file , txn , row_descriptor , ( is_hot_index ? DB_IS_HOT_INDEX | DB_UPDATE_CMP_DESCRIPTOR : DB_UPDATE_CMP_DESCRIPTOR ) ) ;
2011-03-04 19:54:23 +00:00
if ( error ) {
DBUG_PRINT ( " error " , ( " Got error: %d when setting row descriptor for table '%s' " , error , table_name ) ) ;
goto exit ;
}
2009-04-01 17:54:56 +00:00
error = 0 ;
exit :
2009-11-10 19:22:08 +00:00
if ( file ) {
2009-12-03 15:49:42 +00:00
int r = file - > close ( file , 0 ) ;
assert ( r = = 0 ) ;
2008-02-07 20:19:44 +00:00
}
2008-03-21 23:47:22 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-07 20:19:44 +00:00
}
2009-02-28 23:04:28 +00:00
void ha_tokudb : : update_create_info ( HA_CREATE_INFO * create_info ) {
if ( share - > has_auto_inc ) {
info ( HA_STATUS_AUTO ) ;
2012-05-07 20:14:23 +00:00
if ( ! ( create_info - > used_fields & HA_CREATE_USED_AUTO ) | |
create_info - > auto_increment_value < stats . auto_increment_value ) {
create_info - > auto_increment_value = stats . auto_increment_value ;
}
}
if ( ! ( create_info - > used_fields & HA_CREATE_USED_ROW_FORMAT ) ) {
// show create table asks us to update this create_info, this makes it
// so we'll always show what compression type we're using
create_info - > row_type = get_row_type ( ) ;
2009-02-28 23:04:28 +00:00
}
}
2008-04-17 20:56:40 +00:00
//
2009-11-10 19:22:08 +00:00
// removes key name from status.tokudb.
// needed for when we are dropping indexes, so that
// during drop table, we do not attempt to remove already dropped
// indexes because we did not keep status.tokudb in sync with list of indexes.
2008-04-17 20:56:40 +00:00
//
2009-11-10 19:22:08 +00:00
int ha_tokudb : : remove_key_name_from_status ( DB * status_block , char * key_name , DB_TXN * txn ) {
2008-02-07 20:19:44 +00:00
int error ;
2009-11-10 19:22:08 +00:00
uchar status_key_info [ FN_REFLEN + sizeof ( HA_METADATA_KEY ) ] ;
HA_METADATA_KEY md_key = hatoku_key_name ;
memcpy ( status_key_info , & md_key , sizeof ( HA_METADATA_KEY ) ) ;
//
// put index name in status.tokudb
//
memcpy (
status_key_info + sizeof ( HA_METADATA_KEY ) ,
key_name ,
strlen ( key_name ) + 1
) ;
error = remove_metadata (
status_block ,
status_key_info ,
sizeof ( HA_METADATA_KEY ) + strlen ( key_name ) + 1 ,
txn
) ;
return error ;
}
2008-10-13 18:13:41 +00:00
2009-11-10 19:22:08 +00:00
//
// writes the key name in status.tokudb, so that we may later delete or rename
// the dictionary associated with key_name
//
int ha_tokudb : : write_key_name_to_status ( DB * status_block , char * key_name , DB_TXN * txn ) {
int error ;
uchar status_key_info [ FN_REFLEN + sizeof ( HA_METADATA_KEY ) ] ;
HA_METADATA_KEY md_key = hatoku_key_name ;
memcpy ( status_key_info , & md_key , sizeof ( HA_METADATA_KEY ) ) ;
//
// put index name in status.tokudb
//
memcpy (
status_key_info + sizeof ( HA_METADATA_KEY ) ,
key_name ,
strlen ( key_name ) + 1
) ;
error = write_metadata (
status_block ,
status_key_info ,
sizeof ( HA_METADATA_KEY ) + strlen ( key_name ) + 1 ,
NULL ,
0 ,
txn
) ;
return error ;
}
2008-02-07 20:19:44 +00:00
2009-11-10 19:22:08 +00:00
//
// some tracing moved out of ha_tokudb::create, because ::create was getting cluttered
//
void ha_tokudb : : trace_create_table_info ( const char * name , TABLE * form ) {
uint i ;
2008-05-26 14:07:31 +00:00
//
// tracing information about what type of table we are creating
//
2008-04-23 17:19:03 +00:00
if ( tokudb_debug & TOKUDB_DEBUG_OPEN ) {
for ( i = 0 ; i < form - > s - > fields ; i + + ) {
Field * field = form - > s - > field [ i ] ;
TOKUDB_TRACE ( " field:%d:%s:type=%d:flags=%x \n " , i , field - > field_name , field - > type ( ) , field - > flags ) ;
}
for ( i = 0 ; i < form - > s - > keys ; i + + ) {
KEY * key = & form - > s - > key_info [ i ] ;
2012-12-12 18:37:24 +00:00
TOKUDB_TRACE ( " key:%d:%s:%d \n " , i , key - > name , get_key_parts ( key ) ) ;
2008-04-23 17:19:03 +00:00
uint p ;
2012-12-12 18:37:24 +00:00
for ( p = 0 ; p < get_key_parts ( key ) ; p + + ) {
2008-04-23 17:19:03 +00:00
KEY_PART_INFO * key_part = & key - > key_part [ p ] ;
Field * field = key_part - > field ;
TOKUDB_TRACE ( " key:%d:%d:length=%d:%s:type=%d:flags=%x \n " ,
i , p , key_part - > length , field - > field_name , field - > type ( ) , field - > flags ) ;
}
}
}
2009-11-10 19:22:08 +00:00
}
2012-07-25 20:48:53 +00:00
static uint32_t get_max_desc_size ( KEY_AND_COL_INFO * kc_info , TABLE * form ) {
uint32_t max_row_desc_buff_size ;
2011-03-04 19:54:23 +00:00
max_row_desc_buff_size = 2 * ( form - > s - > fields * 6 ) + 10 ; // upper bound of key comparison descriptor
max_row_desc_buff_size + = get_max_secondary_key_pack_desc_size ( kc_info ) ; // upper bound for sec. key part
max_row_desc_buff_size + = get_max_clustering_val_pack_desc_size ( form - > s ) ; // upper bound for clustering val part
return max_row_desc_buff_size ;
}
2012-07-25 20:48:53 +00:00
static uint32_t create_secondary_key_descriptor (
2011-03-04 19:54:23 +00:00
uchar * buf ,
KEY * key_info ,
KEY * prim_key ,
uint hpk ,
TABLE * form ,
uint primary_key ,
2012-07-25 20:48:53 +00:00
uint32_t keynr ,
2011-03-04 19:54:23 +00:00
KEY_AND_COL_INFO * kc_info
)
{
uchar * ptr = NULL ;
ptr = buf ;
ptr + = create_toku_key_descriptor (
ptr ,
false ,
key_info ,
hpk ,
prim_key
) ;
ptr + = create_toku_secondary_key_pack_descriptor (
ptr ,
hpk ,
primary_key ,
form - > s ,
form ,
kc_info ,
key_info ,
prim_key
) ;
ptr + = create_toku_clustering_val_pack_descriptor (
ptr ,
primary_key ,
form - > s ,
kc_info ,
keynr ,
key_info - > flags & HA_CLUSTERING
) ;
return ptr - buf ;
}
2009-11-10 19:22:08 +00:00
//
// creates dictionary for secondary index, with key description key_info, all using txn
//
2011-01-06 19:02:48 +00:00
int ha_tokudb : : create_secondary_dictionary (
const char * name , TABLE * form ,
KEY * key_info ,
DB_TXN * txn ,
KEY_AND_COL_INFO * kc_info ,
2012-07-25 20:48:53 +00:00
uint32_t keynr ,
2012-04-04 15:12:36 +00:00
bool is_hot_index ,
enum row_type row_type
2011-01-06 19:02:48 +00:00
)
{
2009-11-10 19:22:08 +00:00
int error ;
DBT row_descriptor ;
uchar * row_desc_buff = NULL ;
char * newname = NULL ;
KEY * prim_key = NULL ;
char dict_name [ MAX_DICT_NAME_LEN ] ;
2012-07-25 20:48:53 +00:00
uint32_t max_row_desc_buff_size ;
2009-11-10 19:22:08 +00:00
uint hpk = ( form - > s - > primary_key > = MAX_KEY ) ? TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH : 0 ;
2010-12-20 18:56:29 +00:00
uint32_t block_size ;
2011-07-12 21:56:07 +00:00
uint32_t read_block_size ;
THD * thd = ha_thd ( ) ;
2008-03-31 11:43:28 +00:00
2012-05-09 18:36:52 +00:00
memset ( & row_descriptor , 0 , sizeof ( row_descriptor ) ) ;
2010-01-11 18:14:37 +00:00
2011-03-04 19:54:23 +00:00
max_row_desc_buff_size = get_max_desc_size ( kc_info , form ) ;
2010-01-11 18:14:37 +00:00
row_desc_buff = ( uchar * ) my_malloc ( max_row_desc_buff_size , MYF ( MY_WME ) ) ;
2009-11-10 19:22:08 +00:00
if ( row_desc_buff = = NULL ) { error = ENOMEM ; goto cleanup ; }
newname = ( char * ) my_malloc ( get_max_dict_name_path_length ( name ) , MYF ( MY_WME ) ) ;
if ( newname = = NULL ) { error = ENOMEM ; goto cleanup ; }
sprintf ( dict_name , " key-%s " , key_info - > name ) ;
make_name ( newname , name , dict_name ) ;
prim_key = ( hpk ) ? NULL : & form - > s - > key_info [ primary_key ] ;
//
// setup the row descriptor
//
row_descriptor . data = row_desc_buff ;
2010-01-11 18:14:37 +00:00
//
// save data necessary for key comparisons
//
2011-03-04 19:54:23 +00:00
row_descriptor . size = create_secondary_key_descriptor (
2009-11-10 19:22:08 +00:00
row_desc_buff ,
key_info ,
2011-03-04 19:54:23 +00:00
prim_key ,
2009-11-10 19:22:08 +00:00
hpk ,
2010-01-11 18:14:37 +00:00
form ,
primary_key ,
keynr ,
2011-03-04 19:54:23 +00:00
kc_info
2010-01-11 18:14:37 +00:00
) ;
assert ( row_descriptor . size < = max_row_desc_buff_size ) ;
2010-12-20 18:56:29 +00:00
block_size = key_info - > block_size < < 10 ;
if ( block_size = = 0 ) {
block_size = get_tokudb_block_size ( thd ) ;
}
2011-07-12 21:56:07 +00:00
read_block_size = get_tokudb_read_block_size ( thd ) ;
2010-12-20 18:56:29 +00:00
2012-04-04 15:12:36 +00:00
error = create_sub_table ( newname , & row_descriptor , txn , block_size , read_block_size , row_type_to_compression_method ( row_type ) , is_hot_index ) ;
2009-11-10 19:22:08 +00:00
cleanup :
my_free ( newname , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
my_free ( row_desc_buff , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
return error ;
}
2011-03-04 19:54:23 +00:00
2012-07-25 20:48:53 +00:00
static uint32_t create_main_key_descriptor (
2011-03-04 19:54:23 +00:00
uchar * buf ,
KEY * prim_key ,
uint hpk ,
uint primary_key ,
TABLE * form ,
KEY_AND_COL_INFO * kc_info
)
{
uchar * ptr = buf ;
ptr + = create_toku_key_descriptor (
ptr ,
hpk ,
prim_key ,
false ,
NULL
) ;
ptr + = create_toku_main_key_pack_descriptor (
ptr
) ;
ptr + = create_toku_clustering_val_pack_descriptor (
ptr ,
primary_key ,
form - > s ,
kc_info ,
primary_key ,
false
) ;
return ptr - buf ;
}
2009-11-10 19:22:08 +00:00
//
// create and close the main dictionarr with name of "name" using table form, all within
// transaction txn.
//
2012-04-04 15:12:36 +00:00
int ha_tokudb : : create_main_dictionary ( const char * name , TABLE * form , DB_TXN * txn , KEY_AND_COL_INFO * kc_info , enum row_type row_type ) {
2009-11-10 19:22:08 +00:00
int error ;
DBT row_descriptor ;
uchar * row_desc_buff = NULL ;
char * newname = NULL ;
KEY * prim_key = NULL ;
2012-07-25 20:48:53 +00:00
uint32_t max_row_desc_buff_size ;
2009-11-10 19:22:08 +00:00
uint hpk = ( form - > s - > primary_key > = MAX_KEY ) ? TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH : 0 ;
2010-12-20 18:56:29 +00:00
uint32_t block_size ;
2011-07-12 21:56:07 +00:00
uint32_t read_block_size ;
THD * thd = ha_thd ( ) ;
2009-11-10 19:22:08 +00:00
2012-05-09 18:36:52 +00:00
memset ( & row_descriptor , 0 , sizeof ( row_descriptor ) ) ;
2011-03-04 19:54:23 +00:00
max_row_desc_buff_size = get_max_desc_size ( kc_info , form ) ;
2010-01-11 18:14:37 +00:00
row_desc_buff = ( uchar * ) my_malloc ( max_row_desc_buff_size , MYF ( MY_WME ) ) ;
2009-11-10 19:22:08 +00:00
if ( row_desc_buff = = NULL ) { error = ENOMEM ; goto cleanup ; }
newname = ( char * ) my_malloc ( get_max_dict_name_path_length ( name ) , MYF ( MY_WME ) ) ;
if ( newname = = NULL ) { error = ENOMEM ; goto cleanup ; }
2008-03-19 20:21:49 +00:00
2008-03-03 20:27:58 +00:00
make_name ( newname , name , " main " ) ;
2009-11-10 19:22:08 +00:00
prim_key = ( hpk ) ? NULL : & form - > s - > key_info [ primary_key ] ;
2008-02-07 20:19:44 +00:00
2009-04-02 18:39:30 +00:00
//
// setup the row descriptor
//
row_descriptor . data = row_desc_buff ;
2010-01-11 18:14:37 +00:00
//
// save data necessary for key comparisons
//
2011-03-04 19:54:23 +00:00
row_descriptor . size = create_main_key_descriptor (
row_desc_buff ,
2009-04-02 18:39:30 +00:00
prim_key ,
2011-03-04 19:54:23 +00:00
hpk ,
2010-01-11 18:14:37 +00:00
primary_key ,
2011-03-04 19:54:23 +00:00
form ,
kc_info
2010-01-11 18:14:37 +00:00
) ;
assert ( row_descriptor . size < = max_row_desc_buff_size ) ;
2009-04-02 18:39:30 +00:00
2010-12-20 18:56:29 +00:00
block_size = 0 ;
if ( prim_key )
block_size = prim_key - > block_size < < 10 ;
if ( block_size = = 0 ) {
block_size = get_tokudb_block_size ( thd ) ;
}
2011-07-12 21:56:07 +00:00
read_block_size = get_tokudb_read_block_size ( thd ) ;
2010-12-20 18:56:29 +00:00
2008-02-07 20:19:44 +00:00
/* Create the main table that will hold the real rows */
2012-04-04 15:12:36 +00:00
error = create_sub_table ( newname , & row_descriptor , txn , block_size , read_block_size , row_type_to_compression_method ( row_type ) , false ) ;
2009-11-10 19:22:08 +00:00
cleanup :
my_free ( newname , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
my_free ( row_desc_buff , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
return error ;
}
2012-04-03 04:25:26 +00:00
static inline enum row_type
row_format_to_row_type ( srv_row_format_t row_format )
{
2012-05-01 15:42:21 +00:00
# if TOKU_INCLUDE_ROW_TYPE_COMPRESSION
2012-05-09 18:36:52 +00:00
switch ( row_format ) {
2012-04-03 04:25:26 +00:00
case SRV_ROW_FORMAT_UNCOMPRESSED :
return ROW_TYPE_TOKU_UNCOMPRESSED ;
case SRV_ROW_FORMAT_ZLIB :
return ROW_TYPE_TOKU_ZLIB ;
case SRV_ROW_FORMAT_QUICKLZ :
return ROW_TYPE_TOKU_QUICKLZ ;
case SRV_ROW_FORMAT_LZMA :
return ROW_TYPE_TOKU_LZMA ;
case SRV_ROW_FORMAT_SMALL :
return ROW_TYPE_TOKU_SMALL ;
2012-04-03 20:25:47 +00:00
case SRV_ROW_FORMAT_FAST :
return ROW_TYPE_TOKU_FAST ;
2012-05-03 15:42:35 +00:00
case SRV_ROW_FORMAT_DEFAULT :
2012-04-05 22:14:13 +00:00
return ROW_TYPE_DEFAULT ;
2012-04-03 04:25:26 +00:00
}
2012-05-09 18:36:52 +00:00
assert ( 0 ) ;
# endif
return ROW_TYPE_DEFAULT ; ;
2012-04-03 04:25:26 +00:00
}
2009-11-10 19:22:08 +00:00
//
// Creates a new table
// Parameters:
// [in] name - table name
// [in] form - info on table, columns and indexes
// [in] create_info - more info on table, CURRENTLY UNUSED
// Returns:
// 0 on success
// error otherwise
//
int ha_tokudb : : create ( const char * name , TABLE * form , HA_CREATE_INFO * create_info ) {
TOKUDB_DBUG_ENTER ( " ha_tokudb::create " ) ;
int error ;
DB * status_block = NULL ;
uint version ;
uint capabilities ;
DB_TXN * txn = NULL ;
2011-09-06 18:42:31 +00:00
bool do_commit = false ;
2009-11-10 19:22:08 +00:00
char * newname = NULL ;
2010-01-11 18:14:37 +00:00
KEY_AND_COL_INFO kc_info ;
2011-09-06 18:42:31 +00:00
tokudb_trx_data * trx = NULL ;
2011-09-07 15:43:50 +00:00
THD * thd = ha_thd ( ) ;
2011-04-21 00:53:18 +00:00
bool create_from_engine = ( create_info - > table_options & HA_OPTION_CREATE_FROM_ENGINE ) ;
2012-05-09 18:36:52 +00:00
memset ( & kc_info , 0 , sizeof ( kc_info ) ) ;
2008-02-07 20:19:44 +00:00
2009-11-10 19:22:08 +00:00
pthread_mutex_lock ( & tokudb_meta_mutex ) ;
2008-02-07 20:19:44 +00:00
2011-09-06 18:42:31 +00:00
trx = ( tokudb_trx_data * ) thd_data_get ( ha_thd ( ) , tokudb_hton - > slot ) ;
2012-04-04 15:32:08 +00:00
const enum row_type row_type = ( ( create_info - > used_fields & HA_CREATE_USED_ROW_FORMAT )
? create_info - > row_type
: row_format_to_row_type ( get_row_format ( thd ) ) ) ;
2011-04-21 00:53:18 +00:00
if ( create_from_engine ) {
// table already exists, nothing to do
error = 0 ;
goto cleanup ;
}
2012-04-03 04:25:26 +00:00
2009-11-10 19:22:08 +00:00
newname = ( char * ) my_malloc ( get_max_dict_name_path_length ( name ) , MYF ( MY_WME ) ) ;
if ( newname = = NULL ) { error = ENOMEM ; goto cleanup ; }
2008-02-05 16:00:53 +00:00
2011-09-07 15:43:50 +00:00
if ( thd_sql_command ( thd ) = = SQLCOM_CREATE_TABLE & & trx & & trx - > sub_sp_level ) {
2011-09-06 18:42:31 +00:00
txn = trx - > sub_sp_level ;
}
else {
do_commit = true ;
error = db_env - > txn_begin ( db_env , 0 , & txn , 0 ) ;
if ( error ) { goto cleanup ; }
}
2009-11-10 19:22:08 +00:00
primary_key = form - > s - > primary_key ;
hidden_primary_key = ( primary_key > = MAX_KEY ) ? TOKUDB_HIDDEN_PRIMARY_KEY_LENGTH : 0 ;
2010-01-11 18:14:37 +00:00
if ( hidden_primary_key ) {
primary_key = form - > s - > keys ;
}
2009-11-10 19:22:08 +00:00
/* do some tracing */
trace_create_table_info ( name , form ) ;
2008-07-04 02:24:49 +00:00
/* Create status.tokudb and save relevant metadata */
2009-10-26 17:24:15 +00:00
make_name ( newname , name , " status " ) ;
2009-04-17 18:29:25 +00:00
2009-11-10 19:22:08 +00:00
error = db_create ( & status_block , db_env , 0 ) ;
if ( error ) { goto cleanup ; }
2012-06-25 18:50:33 +00:00
error = status_block - > set_pagesize ( status_block , status_dict_pagesize ) ;
2012-06-22 19:49:45 +00:00
if ( error ) { goto cleanup ; }
2009-12-03 15:39:53 +00:00
error = status_block - > open ( status_block , txn , newname , NULL , DB_BTREE , DB_CREATE | DB_EXCL , 0 ) ;
2009-10-26 17:24:15 +00:00
if ( error ) { goto cleanup ; }
2008-08-18 18:59:52 +00:00
2009-10-26 17:24:15 +00:00
version = HA_TOKU_VERSION ;
capabilities = HA_TOKU_CAP ;
2011-05-03 16:04:15 +00:00
error = write_to_status ( status_block , hatoku_new_version , & version , sizeof ( version ) , txn ) ;
2009-10-26 17:24:15 +00:00
if ( error ) { goto cleanup ; }
2008-08-18 18:35:32 +00:00
2009-11-10 19:22:08 +00:00
error = write_to_status ( status_block , hatoku_capabilities , & capabilities , sizeof ( capabilities ) , txn ) ;
2009-10-26 17:24:15 +00:00
if ( error ) { goto cleanup ; }
2009-11-10 19:22:08 +00:00
error = write_auto_inc_create ( status_block , create_info - > auto_increment_value , txn ) ;
2009-10-26 17:24:15 +00:00
if ( error ) { goto cleanup ; }
2008-08-18 18:35:32 +00:00
2012-12-18 20:14:09 +00:00
# if TOKU_PARTITION_WRITE_FRM_DATA
error = write_frm_data ( status_block , txn , form - > s - > path . str ) ;
if ( error ) { goto cleanup ; }
# else
2011-04-21 00:53:18 +00:00
// only for tables that are not partitioned
2012-12-18 20:14:09 +00:00
if ( form - > part_info = = NULL ) {
2011-04-21 00:53:18 +00:00
error = write_frm_data ( status_block , txn , form - > s - > path . str ) ;
if ( error ) { goto cleanup ; }
}
2012-12-18 20:14:09 +00:00
# endif
2010-01-11 18:14:37 +00:00
error = allocate_key_and_col_info ( form - > s , & kc_info ) ;
if ( error ) { goto cleanup ; }
error = initialize_key_and_col_info (
form - > s ,
form ,
& kc_info ,
hidden_primary_key ,
primary_key
) ;
if ( error ) { goto cleanup ; }
2008-04-02 17:34:05 +00:00
2012-04-04 15:12:36 +00:00
error = create_main_dictionary ( name , form , txn , & kc_info , row_type ) ;
2009-09-10 20:52:19 +00:00
if ( error ) {
goto cleanup ;
}
2009-11-10 19:22:08 +00:00
for ( uint i = 0 ; i < form - > s - > keys ; i + + ) {
if ( i ! = primary_key ) {
2012-04-04 15:12:36 +00:00
error = create_secondary_dictionary ( name , form , & form - > key_info [ i ] , txn , & kc_info , i , false , row_type ) ;
2009-11-10 19:22:08 +00:00
if ( error ) {
goto cleanup ;
}
error = write_key_name_to_status ( status_block , form - > s - > key_info [ i ] . name , txn ) ;
if ( error ) { goto cleanup ; }
}
}
error = add_table_to_metadata ( name , form , txn ) ;
if ( error ) { goto cleanup ; }
2009-09-10 20:52:19 +00:00
error = 0 ;
2008-10-13 18:13:41 +00:00
cleanup :
if ( status_block ! = NULL ) {
2009-12-03 15:49:42 +00:00
int r = status_block - > close ( status_block , 0 ) ;
assert ( r = = 0 ) ;
2008-10-13 18:13:41 +00:00
}
2010-01-12 02:52:33 +00:00
free_key_and_col_info ( & kc_info ) ;
2011-09-06 18:42:31 +00:00
if ( do_commit & & txn ) {
2009-11-10 19:22:08 +00:00
if ( error ) {
abort_txn ( txn ) ;
}
else {
commit_txn ( txn , 0 ) ;
}
2009-09-10 20:52:19 +00:00
}
2008-10-13 18:13:41 +00:00
my_free ( newname , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
2009-09-17 17:51:06 +00:00
pthread_mutex_unlock ( & tokudb_meta_mutex ) ;
2008-03-21 23:47:22 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-05 16:00:53 +00:00
}
2009-09-10 20:52:19 +00:00
int ha_tokudb : : discard_or_import_tablespace ( my_bool discard ) {
/*
if ( discard ) {
my_errno = HA_ERR_WRONG_COMMAND ;
return my_errno ;
}
return add_table_to_metadata ( share - > table_name ) ;
*/
my_errno = HA_ERR_WRONG_COMMAND ;
return my_errno ;
}
2008-04-17 20:56:40 +00:00
//
2009-11-10 19:22:08 +00:00
// deletes from_name or renames from_name to to_name, all using transaction txn.
// is_delete specifies which we are doing
// is_key specifies if it is a secondary index (and hence a "key-" needs to be prepended) or
// if it is not a secondary index
2008-04-17 20:56:40 +00:00
//
2010-01-11 18:14:37 +00:00
int ha_tokudb : : delete_or_rename_dictionary ( const char * from_name , const char * to_name , const char * secondary_name , bool is_key , DB_TXN * txn , bool is_delete ) {
2009-11-10 19:22:08 +00:00
int error ;
char dict_name [ MAX_DICT_NAME_LEN ] ;
char * new_from_name = NULL ;
char * new_to_name = NULL ;
assert ( txn ) ;
new_from_name = ( char * ) my_malloc (
get_max_dict_name_path_length ( from_name ) ,
MYF ( MY_WME )
) ;
if ( new_from_name = = NULL ) {
error = ENOMEM ;
goto cleanup ;
}
if ( ! is_delete ) {
assert ( to_name ) ;
new_to_name = ( char * ) my_malloc (
get_max_dict_name_path_length ( to_name ) ,
MYF ( MY_WME )
) ;
if ( new_to_name = = NULL ) {
error = ENOMEM ;
goto cleanup ;
}
}
if ( is_key ) {
sprintf ( dict_name , " key-%s " , secondary_name ) ;
make_name ( new_from_name , from_name , dict_name ) ;
}
else {
make_name ( new_from_name , from_name , secondary_name ) ;
}
if ( ! is_delete ) {
if ( is_key ) {
sprintf ( dict_name , " key-%s " , secondary_name ) ;
make_name ( new_to_name , to_name , dict_name ) ;
}
else {
make_name ( new_to_name , to_name , secondary_name ) ;
}
}
if ( is_delete ) {
error = db_env - > dbremove ( db_env , txn , new_from_name , NULL , 0 ) ;
}
else {
error = db_env - > dbrename ( db_env , txn , new_from_name , NULL , new_to_name , 0 ) ;
}
if ( error ) { goto cleanup ; }
2009-09-10 20:52:19 +00:00
2009-11-10 19:22:08 +00:00
cleanup :
my_free ( new_from_name , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
my_free ( new_to_name , MYF ( MY_ALLOW_ZERO_PTR ) ) ;
return error ;
}
//
// deletes or renames a table. if is_delete is true, then we delete, and to_name can be NULL
// if is_delete is false, then to_name must be non-NULL, as we are renaming the table.
//
int ha_tokudb : : delete_or_rename_table ( const char * from_name , const char * to_name , bool is_delete ) {
2008-02-07 20:19:44 +00:00
int error ;
2009-12-03 15:39:53 +00:00
DB * status_db = NULL ;
2009-11-10 19:22:08 +00:00
DBC * status_cursor = NULL ;
DB_TXN * txn = NULL ;
DBT curr_key ;
DBT curr_val ;
2012-05-09 18:36:52 +00:00
memset ( & curr_key , 0 , sizeof ( curr_key ) ) ;
memset ( & curr_val , 0 , sizeof ( curr_val ) ) ;
2009-09-17 17:51:06 +00:00
pthread_mutex_lock ( & tokudb_meta_mutex ) ;
2009-09-25 21:31:19 +00:00
2009-11-10 19:22:08 +00:00
error = db_env - > txn_begin ( db_env , 0 , & txn , 0 ) ;
if ( error ) { goto cleanup ; }
2009-09-25 21:31:19 +00:00
//
2009-11-10 19:22:08 +00:00
// modify metadata db
2009-09-25 21:31:19 +00:00
//
2009-11-10 19:22:08 +00:00
if ( is_delete ) {
error = drop_table_from_metadata ( from_name , txn ) ;
2009-09-10 20:52:19 +00:00
}
2009-11-10 19:22:08 +00:00
else {
error = rename_table_in_metadata ( from_name , to_name , txn ) ;
2008-10-13 17:50:40 +00:00
}
2009-11-10 19:22:08 +00:00
if ( error ) { goto cleanup ; }
//
// open status db,
// create cursor,
// for each name read out of there, create a db and delete or rename it
//
error = open_status_dictionary ( & status_db , from_name , txn ) ;
if ( error ) { goto cleanup ; }
error = status_db - > cursor ( status_db , txn , & status_cursor , 0 ) ;
if ( error ) { goto cleanup ; }
while ( error ! = DB_NOTFOUND ) {
error = status_cursor - > c_get (
status_cursor ,
& curr_key ,
& curr_val ,
DB_NEXT
) ;
if ( error & & error ! = DB_NOTFOUND ) { goto cleanup ; }
if ( error = = DB_NOTFOUND ) { break ; }
HA_METADATA_KEY mk = * ( HA_METADATA_KEY * ) curr_key . data ;
if ( mk ! = hatoku_key_name ) {
continue ;
}
error = delete_or_rename_dictionary ( from_name , to_name , ( char * ) ( ( char * ) curr_key . data + sizeof ( HA_METADATA_KEY ) ) , true , txn , is_delete ) ;
if ( error ) { goto cleanup ; }
}
//
// delete or rename main.tokudb
//
error = delete_or_rename_dictionary ( from_name , to_name , " main " , false , txn , is_delete ) ;
if ( error ) { goto cleanup ; }
error = status_cursor - > c_close ( status_cursor ) ;
2009-12-03 16:59:52 +00:00
assert ( error = = 0 ) ;
2009-11-10 19:22:08 +00:00
status_cursor = NULL ;
2009-12-03 15:49:42 +00:00
if ( error ) { goto cleanup ; }
2009-11-10 19:22:08 +00:00
error = status_db - > close ( status_db , 0 ) ;
2009-12-03 15:49:42 +00:00
assert ( error = = 0 ) ;
2009-11-10 19:22:08 +00:00
status_db = NULL ;
//
// delete or rename status.tokudb
//
error = delete_or_rename_dictionary ( from_name , to_name , " status " , false , txn , is_delete ) ;
if ( error ) { goto cleanup ; }
2008-02-07 20:19:44 +00:00
my_errno = error ;
2008-10-13 17:50:40 +00:00
cleanup :
2009-11-10 19:22:08 +00:00
if ( status_cursor ) {
2009-12-03 16:59:52 +00:00
int r = status_cursor - > c_close ( status_cursor ) ;
assert ( r = = 0 ) ;
2009-11-10 19:22:08 +00:00
}
if ( status_db ) {
2009-12-03 15:49:42 +00:00
int r = status_db - > close ( status_db , 0 ) ;
assert ( r = = 0 ) ;
2009-11-10 19:22:08 +00:00
}
if ( txn ) {
if ( error ) {
abort_txn ( txn ) ;
}
else {
commit_txn ( txn , 0 ) ;
}
2009-09-25 21:31:19 +00:00
}
2009-09-17 17:51:06 +00:00
pthread_mutex_unlock ( & tokudb_meta_mutex ) ;
2009-11-10 19:22:08 +00:00
return error ;
}
//
// Drops table
// Parameters:
// [in] name - name of table to be deleted
// Returns:
// 0 on success
// error otherwise
//
int ha_tokudb : : delete_table ( const char * name ) {
TOKUDB_DBUG_ENTER ( " ha_tokudb::delete_table " ) ;
2009-11-12 19:36:40 +00:00
int error ;
error = delete_or_rename_table ( name , NULL , true ) ;
2010-05-21 03:41:23 +00:00
if ( error = = DB_LOCK_NOTGRANTED & & ( ( tokudb_debug & TOKUDB_DEBUG_HIDE_DDL_LOCK_ERRORS ) = = 0 ) ) {
2009-11-12 19:36:40 +00:00
sql_print_error ( " Could not delete table %s because \
another transaction has accessed the table . \
To drop the table , make sure no transactions touch the table . " , name);
}
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-07 20:19:44 +00:00
}
2008-04-17 20:56:40 +00:00
//
// renames table from "from" to "to"
// Parameters:
// [in] name - old name of table
// [in] to - new name of table
// Returns:
// 0 on success
// error otherwise
//
2008-02-07 20:19:44 +00:00
int ha_tokudb : : rename_table ( const char * from , const char * to ) {
2008-04-24 17:30:05 +00:00
TOKUDB_DBUG_ENTER ( " %s %s %s " , __FUNCTION__ , from , to ) ;
2008-02-07 20:19:44 +00:00
int error ;
2009-11-10 19:22:08 +00:00
error = delete_or_rename_table ( from , to , false ) ;
2010-05-21 03:41:23 +00:00
if ( error = = DB_LOCK_NOTGRANTED & & ( ( tokudb_debug & TOKUDB_DEBUG_HIDE_DDL_LOCK_ERRORS ) = = 0 ) ) {
2009-11-12 19:36:40 +00:00
sql_print_error ( " Could not rename table from %s to %s because \
another transaction has accessed the table . \
To rename the table , make sure no transactions touch the table . " , from, to);
}
2008-04-24 17:30:05 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2008-02-05 16:00:53 +00:00
}
/*
2008-04-17 20:56:40 +00:00
Returns estimate on number of seeks it will take to read through the table
2008-02-05 16:00:53 +00:00
This is to be comparable to the number returned by records_in_range so
that we can decide if we should scan the table or use keys .
*/
2008-02-18 20:18:50 +00:00
/// QQQ why divide by 3
2008-02-07 20:19:44 +00:00
double ha_tokudb : : scan_time ( ) {
2008-05-05 18:38:04 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::scan_time " ) ;
2008-10-10 20:48:40 +00:00
double ret_val = ( double ) stats . records / 3 ;
2008-05-05 18:38:04 +00:00
DBUG_RETURN ( ret_val ) ;
2008-02-07 20:19:44 +00:00
}
2010-11-22 18:16:38 +00:00
double ha_tokudb : : keyread_time ( uint index , uint ranges , ha_rows rows )
{
2012-11-30 17:02:29 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::keyread_time " ) ;
double ret_val ;
if ( ( table - > key_info [ index ] . flags & HA_CLUSTERING ) | | ( index = = primary_key ) ) {
ret_val = read_time ( index , ranges , rows ) ;
DBUG_RETURN ( ret_val ) ;
}
/*
It is assumed that we will read trough the whole key range and that all
key blocks are half full ( normally things are much better ) . It is also
assumed that each time we read the next key from the index , the handler
performs a random seek , thus the cost is proportional to the number of
blocks read . This model does not take into account clustered indexes -
engines that support that ( e . g . InnoDB ) may want to overwrite this method .
*/
double keys_per_block = ( stats . block_size / 2.0 /
( table - > key_info [ index ] . key_length +
ref_length ) + 1 ) ;
ret_val = ( rows + keys_per_block - 1 ) / keys_per_block ;
DBUG_RETURN ( ret_val ) ;
2010-11-22 18:16:38 +00:00
}
2008-06-17 17:04:08 +00:00
//
// Calculate the time it takes to read a set of ranges through an index
// This enables us to optimize reads for clustered indexes.
// Implementation pulled from InnoDB
// Parameters:
// index - index to use
// ranges - number of ranges
// rows - estimated number of rows in the range
// Returns:
// estimated time measured in disk seeks
//
double ha_tokudb : : read_time (
2009-09-11 17:13:45 +00:00
uint index ,
uint ranges ,
ha_rows rows
)
2008-06-17 17:04:08 +00:00
{
2012-11-30 17:02:29 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::read_time " ) ;
2008-06-17 17:04:08 +00:00
double total_scan ;
double ret_val ;
2010-11-30 22:23:54 +00:00
bool is_primary = ( index = = primary_key ) ;
2011-01-21 14:51:44 +00:00
bool is_clustering ;
2008-06-17 17:04:08 +00:00
2008-11-19 23:05:49 +00:00
//
// in case for hidden primary key, this is called
//
if ( index > = table_share - > keys ) {
ret_val = handler : : read_time ( index , ranges , rows ) ;
goto cleanup ;
}
2011-01-21 14:51:44 +00:00
is_clustering = ( table - > key_info [ index ] . flags & HA_CLUSTERING ) ;
2008-11-19 23:05:49 +00:00
2008-11-03 20:42:59 +00:00
//
// if it is not the primary key, and it is not a clustering key, then return handler::read_time
//
2010-11-30 22:23:54 +00:00
if ( ! ( is_primary | | is_clustering ) ) {
2008-06-17 17:04:08 +00:00
ret_val = handler : : read_time ( index , ranges , rows ) ;
goto cleanup ;
}
2008-11-03 20:42:59 +00:00
//
// for primary key and for clustered keys, return a fraction of scan_time()
//
2008-06-17 17:04:08 +00:00
total_scan = scan_time ( ) ;
if ( stats . records < rows ) {
2010-12-01 16:30:16 +00:00
ret_val = is_clustering ? total_scan + 0.00001 : total_scan ;
2008-06-17 17:04:08 +00:00
goto cleanup ;
}
//
// one disk seek per range plus the proportional scan time of the rows
//
ret_val = ( ranges + ( double ) rows / ( double ) stats . records * total_scan ) ;
2010-12-01 16:30:16 +00:00
ret_val = is_clustering ? ret_val + 0.00001 : ret_val ;
2010-11-30 22:23:54 +00:00
2008-06-17 17:04:08 +00:00
cleanup :
2012-11-30 17:02:29 +00:00
DBUG_RETURN ( ret_val ) ;
2008-06-17 17:04:08 +00:00
}
2012-11-30 17:02:29 +00:00
double ha_tokudb : : index_only_read_time ( uint keynr , double records ) {
TOKUDB_DBUG_ENTER ( " ha_tokudb::index_only_read_time " ) ;
2012-12-07 00:01:22 +00:00
double ret_val = keyread_time ( keynr , 1 , ( ha_rows ) records ) ;
2012-11-30 17:02:29 +00:00
DBUG_RETURN ( ret_val ) ;
}
2008-06-17 17:04:08 +00:00
2008-04-17 20:56:40 +00:00
//
2008-05-06 17:43:04 +00:00
// Estimates the number of index records in a range. In case of errors, return
// HA_TOKUDB_RANGE_COUNT instead of HA_POS_ERROR. This was behavior
// when we got the handlerton from MySQL.
// Parameters:
// keynr -index to use
// [in] start_key - low end of the range
// [in] end_key - high end of the range
// Returns:
// 0 - There are no matching keys in the given range
// number > 0 - There are approximately number matching rows in the range
// HA_POS_ERROR - Something is wrong with the index tree
2008-04-17 20:56:40 +00:00
//
2008-05-06 17:43:04 +00:00
ha_rows ha_tokudb : : records_in_range ( uint keynr , key_range * start_key , key_range * end_key ) {
2008-03-26 02:47:07 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::records_in_range " ) ;
2009-06-18 17:24:11 +00:00
DBT key ;
2008-05-06 17:43:04 +00:00
ha_rows ret_val = HA_TOKUDB_RANGE_COUNT ;
2008-05-26 14:07:31 +00:00
DB * kfile = share - > key_file [ keynr ] ;
2012-07-25 20:48:53 +00:00
uint64_t less , equal , greater ;
uint64_t total_rows_estimate = HA_TOKUDB_RANGE_COUNT ;
uint64_t start_rows , end_rows , rows ;
2008-05-13 15:26:50 +00:00
int is_exact ;
2008-05-06 17:43:04 +00:00
int error ;
2009-06-18 17:24:11 +00:00
uchar inf_byte ;
2008-02-07 20:19:44 +00:00
2008-05-06 17:43:04 +00:00
//
2008-05-13 15:26:50 +00:00
// get start_rows and end_rows values so that we can estimate range
2008-09-12 17:12:44 +00:00
// when calling key_range64, the only value we can trust is the value for less
// The reason is that the key being passed in may be a prefix of keys in the DB
// As a result, equal may be 0 and greater may actually be equal+greater
// So, we call key_range64 on the key, and the key that is after it.
2008-05-06 17:43:04 +00:00
//
2010-09-03 20:47:01 +00:00
if ( ! start_key & & ! end_key ) {
error = estimate_num_rows ( kfile , & end_rows , transaction ) ;
if ( error ) {
ret_val = HA_TOKUDB_RANGE_COUNT ;
goto cleanup ;
}
2010-09-05 18:59:44 +00:00
ret_val = ( end_rows < = 1 ) ? 1 : end_rows ;
goto cleanup ;
2010-09-03 20:47:01 +00:00
}
2008-05-06 17:43:04 +00:00
if ( start_key ) {
2009-06-18 17:24:11 +00:00
inf_byte = ( start_key - > flag = = HA_READ_KEY_EXACT ) ?
COL_NEG_INF : COL_POS_INF ;
pack_key (
& key ,
keynr ,
key_buff ,
start_key - > key ,
start_key - > length ,
inf_byte
) ;
2008-05-13 15:26:50 +00:00
error = kfile - > key_range64 (
2008-05-06 17:43:04 +00:00
kfile ,
transaction ,
2008-09-12 17:12:44 +00:00
& key ,
2008-05-13 15:26:50 +00:00
& less ,
& equal ,
& greater ,
& is_exact
2008-05-06 17:43:04 +00:00
) ;
if ( error ) {
ret_val = HA_TOKUDB_RANGE_COUNT ;
goto cleanup ;
}
2009-06-18 17:24:11 +00:00
start_rows = less ;
2010-09-03 20:47:01 +00:00
total_rows_estimate = less + equal + greater ;
2008-02-07 20:19:44 +00:00
}
2008-05-06 17:43:04 +00:00
else {
2008-05-13 15:26:50 +00:00
start_rows = 0 ;
2008-05-06 17:43:04 +00:00
}
if ( end_key ) {
2009-06-18 17:24:11 +00:00
inf_byte = ( end_key - > flag = = HA_READ_BEFORE_KEY ) ?
COL_NEG_INF : COL_POS_INF ;
pack_key (
& key ,
keynr ,
key_buff ,
end_key - > key ,
end_key - > length ,
inf_byte
) ;
2008-05-13 15:26:50 +00:00
error = kfile - > key_range64 (
2008-05-06 17:43:04 +00:00
kfile ,
transaction ,
2008-09-12 17:12:44 +00:00
& key ,
2008-05-13 15:26:50 +00:00
& less ,
& equal ,
& greater ,
& is_exact
2008-05-06 17:43:04 +00:00
) ;
if ( error ) {
ret_val = HA_TOKUDB_RANGE_COUNT ;
goto cleanup ;
}
2009-06-18 17:24:11 +00:00
end_rows = less ;
2008-05-06 17:43:04 +00:00
}
else {
2010-09-03 20:47:01 +00:00
//
// first if-clause ensures that start_key is non-NULL
//
assert ( start_key ) ;
end_rows = total_rows_estimate ;
2008-05-06 17:43:04 +00:00
}
2008-09-12 17:12:44 +00:00
rows = ( end_rows > start_rows ) ? end_rows - start_rows : 1 ;
2008-05-13 15:26:50 +00:00
2008-05-06 17:43:04 +00:00
//
2008-05-13 15:26:50 +00:00
// MySQL thinks a return value of 0 means there are exactly 0 rows
// Therefore, always return non-zero so this assumption is not made
2008-05-06 17:43:04 +00:00
//
2008-05-13 15:26:50 +00:00
ret_val = ( ha_rows ) ( rows < = 1 ? 1 : rows ) ;
2008-05-06 17:43:04 +00:00
cleanup :
2008-10-10 20:48:40 +00:00
DBUG_RETURN ( ret_val ) ;
2008-02-05 16:00:53 +00:00
}
2008-08-18 18:35:32 +00:00
//
2009-07-27 14:52:30 +00:00
// Initializes the auto-increment data in the local "share" object to the
// greater of two values: what's stored in the metadata or the last inserted
// auto-increment field (if auto-increment field is the first field of a key).
2008-08-18 18:35:32 +00:00
//
void ha_tokudb : : init_auto_increment ( ) {
DBT key ;
DBT value ;
int error ;
HA_METADATA_KEY key_val = hatoku_max_ai ;
2012-05-09 18:36:52 +00:00
memset ( & key , 0 , sizeof ( key ) ) ;
memset ( & value , 0 , sizeof ( value ) ) ;
2008-08-18 18:35:32 +00:00
key . data = & key_val ;
key . size = sizeof ( key_val ) ;
2009-08-05 18:23:40 +00:00
value . flags = DB_DBT_USERMEM ;
2008-08-18 18:35:32 +00:00
DB_TXN * txn = NULL ;
error = db_env - > txn_begin ( db_env , 0 , & txn , 0 ) ;
if ( error ) {
share - > last_auto_increment = 0 ;
}
else {
//
// First retrieve hatoku_max_ai, which is max value used by auto increment
// column so far, the max value could have been auto generated (e.g. insert (NULL))
// or it could have been manually inserted by user (e.g. insert (345))
//
2009-08-05 18:23:40 +00:00
value . ulen = sizeof ( share - > last_auto_increment ) ;
value . data = & share - > last_auto_increment ;
2008-08-18 18:35:32 +00:00
error = share - > status_block - > get (
share - > status_block ,
txn ,
& key ,
& value ,
0
) ;
2009-08-05 18:23:40 +00:00
if ( error | | value . size ! = sizeof ( share - > last_auto_increment ) ) {
2008-08-18 18:35:32 +00:00
share - > last_auto_increment = 0 ;
}
2010-01-11 18:53:10 +00:00
2008-08-18 18:35:32 +00:00
//
// Now retrieve the initial auto increment value, as specified by create table
// so if a user does "create table t1 (a int auto_increment, primary key (a)) auto_increment=100",
// then the value 100 should be stored here
//
key_val = hatoku_ai_create_value ;
2009-08-05 18:23:40 +00:00
value . ulen = sizeof ( share - > auto_inc_create_value ) ;
value . data = & share - > auto_inc_create_value ;
2008-08-18 18:35:32 +00:00
error = share - > status_block - > get (
share - > status_block ,
txn ,
& key ,
& value ,
0
) ;
2009-08-05 18:23:40 +00:00
if ( error | | value . size ! = sizeof ( share - > auto_inc_create_value ) ) {
2008-08-18 18:35:32 +00:00
share - > auto_inc_create_value = 0 ;
}
2009-11-10 19:22:08 +00:00
commit_txn ( txn , 0 ) ;
2008-08-18 18:35:32 +00:00
}
if ( tokudb_debug & TOKUDB_DEBUG_AUTO_INCREMENT ) {
TOKUDB_TRACE ( " init auto increment:%lld \n " , share - > last_auto_increment ) ;
}
}
2008-02-07 20:19:44 +00:00
void ha_tokudb : : get_auto_increment ( ulonglong offset , ulonglong increment , ulonglong nb_desired_values , ulonglong * first_value , ulonglong * nb_reserved_values ) {
2008-05-05 18:38:04 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::get_auto_increment " ) ;
2008-03-18 21:06:01 +00:00
ulonglong nr ;
2012-12-09 18:54:32 +00:00
bool over ;
2008-03-18 21:06:01 +00:00
2008-04-02 17:34:05 +00:00
pthread_mutex_lock ( & share - > mutex ) ;
2008-08-18 18:35:32 +00:00
if ( share - > auto_inc_create_value > share - > last_auto_increment ) {
nr = share - > auto_inc_create_value ;
2012-12-09 18:54:32 +00:00
over = false ;
2008-08-18 18:35:32 +00:00
share - > last_auto_increment = share - > auto_inc_create_value ;
2008-03-18 21:06:01 +00:00
}
2008-08-18 18:35:32 +00:00
else {
nr = share - > last_auto_increment + increment ;
2012-12-09 18:54:32 +00:00
over = nr < share - > last_auto_increment ;
if ( over )
nr = ULONGLONG_MAX ;
2008-08-18 18:35:32 +00:00
}
2012-12-09 18:54:32 +00:00
if ( ! over ) {
share - > last_auto_increment = nr + ( nb_desired_values - 1 ) * increment ;
if ( delay_updating_ai_metadata ) {
ai_metadata_update_required = true ;
}
else {
update_max_auto_inc ( share - > status_block , share - > last_auto_increment ) ;
}
2009-07-10 20:01:20 +00:00
}
2012-12-09 18:54:32 +00:00
2008-08-18 18:35:32 +00:00
if ( tokudb_debug & TOKUDB_DEBUG_AUTO_INCREMENT ) {
2008-04-24 17:30:05 +00:00
TOKUDB_TRACE ( " get_auto_increment(%lld,%lld,%lld):got:%lld:%lld \n " ,
offset , increment , nb_desired_values , nr , nb_desired_values ) ;
2008-08-18 18:35:32 +00:00
}
2008-03-18 21:06:01 +00:00
* first_value = nr ;
2008-03-24 20:59:46 +00:00
* nb_reserved_values = nb_desired_values ;
2008-08-18 18:35:32 +00:00
pthread_mutex_unlock ( & share - > mutex ) ;
2008-05-05 18:38:04 +00:00
DBUG_VOID_RETURN ;
2008-02-07 20:19:44 +00:00
}
2012-01-09 03:10:29 +00:00
bool ha_tokudb : : is_optimize_blocking ( ) {
return false ;
}
2008-09-15 19:03:16 +00:00
bool ha_tokudb : : is_auto_inc_singleton ( ) {
return false ;
}
2012-03-09 20:47:36 +00:00
volatile int ha_tokudb_tokudb_add_index_wait = 0 ; // debug
2012-11-28 22:27:15 +00:00
volatile int ha_tokudb_build_index_wait = 0 ; // debug
2012-03-09 20:47:36 +00:00
2011-03-05 00:29:11 +00:00
//
// Internal function called by ha_tokudb::add_index and ha_tokudb::alter_table_phase2
// With a transaction, drops dictionaries associated with indexes in key_num
//
2008-05-26 14:07:31 +00:00
//
// Adds indexes to the table. Takes the array of KEY passed in key_info, and creates
// DB's that will go at the end of share->key_file. THE IMPLICIT ASSUMPTION HERE is
// that the table will be modified and that these added keys will be appended to the end
// of the array table->key_info
// Parameters:
// [in] table_arg - table that is being modified, seems to be identical to this->table
// [in] key_info - array of KEY's to be added
// num_of_keys - number of keys to be added, number of elements in key_info
// Returns:
// 0 on success, error otherwise
//
2011-03-04 19:54:23 +00:00
int ha_tokudb : : tokudb_add_index (
TABLE * table_arg ,
KEY * key_info ,
uint num_of_keys ,
DB_TXN * txn ,
bool * inc_num_DBs ,
bool * modified_DBs
)
{
TOKUDB_DBUG_ENTER ( " ha_tokudb::tokudb_add_index " ) ;
2012-05-21 18:56:56 +00:00
assert ( txn ) ;
2012-03-09 20:47:36 +00:00
while ( ha_tokudb_tokudb_add_index_wait ) sleep ( 1 ) ; // debug
2008-05-26 14:07:31 +00:00
int error ;
uint curr_index = 0 ;
DBC * tmp_cursor = NULL ;
int cursor_ret_val = 0 ;
2010-03-29 02:08:34 +00:00
DBT curr_pk_key , curr_pk_val ;
2008-11-04 13:41:54 +00:00
THD * thd = ha_thd ( ) ;
2010-03-29 02:08:34 +00:00
DB_LOADER * loader = NULL ;
2010-11-17 23:09:06 +00:00
DB_INDEXER * indexer = NULL ;
2012-11-20 16:11:50 +00:00
bool loader_save_space = get_load_save_space ( thd ) ;
2010-11-17 23:09:06 +00:00
bool use_hot_index = ( lock . type = = TL_WRITE_ALLOW_WRITE ) ;
2012-11-20 16:11:50 +00:00
uint32_t loader_flags = loader_save_space ? LOADER_COMPRESS_INTERMEDIATES : 0 ;
2012-07-25 20:48:53 +00:00
uint32_t indexer_flags = 0 ;
uint32_t mult_db_flags [ MAX_KEY + 1 ] = { 0 } ;
uint32_t mult_put_flags [ MAX_KEY + 1 ] ;
uint32_t mult_dbt_flags [ MAX_KEY + 1 ] ;
2011-01-06 19:02:48 +00:00
bool creating_hot_index = false ;
2010-12-08 15:06:06 +00:00
struct loader_context lc ;
memset ( & lc , 0 , sizeof lc ) ;
2010-03-29 02:08:34 +00:00
lc . thd = thd ;
lc . ha = this ;
loader_error = 0 ;
2010-11-17 23:09:06 +00:00
bool rw_lock_taken = false ;
2011-03-04 19:54:23 +00:00
* inc_num_DBs = false ;
* modified_DBs = false ;
2011-10-16 02:02:29 +00:00
invalidate_bulk_fetch ( ) ;
unpack_entire_row = true ; // for bulk fetching rows
2012-07-25 20:48:53 +00:00
for ( uint32_t i = 0 ; i < MAX_KEY + 1 ; i + + ) {
2011-06-06 21:08:45 +00:00
mult_put_flags [ i ] = 0 ;
2010-11-02 18:17:17 +00:00
mult_dbt_flags [ i ] = DB_DBT_REALLOC ;
}
2008-11-04 14:00:33 +00:00
//
// number of DB files we have open currently, before add_index is executed
//
uint curr_num_DBs = table_arg - > s - > keys + test ( hidden_primary_key ) ;
2008-07-30 14:43:19 +00:00
2012-04-04 15:12:36 +00:00
//
// get the row type to use for the indexes we're adding
//
2012-04-04 15:32:08 +00:00
const enum row_type row_type = get_row_type_for_key ( share - > file ) ;
2012-04-04 15:12:36 +00:00
2009-01-17 00:15:44 +00:00
//
// status message to be shown in "show process list"
//
char status_msg [ MAX_ALIAS_NAME + 200 ] ; //buffer of 200 should be a good upper bound.
ulonglong num_processed = 0 ; //variable that stores number of elements inserted thus far
thd_proc_info ( thd , " Adding indexes " ) ;
2008-05-26 14:07:31 +00:00
//
// in unpack_row, MySQL passes a buffer that is this long,
// so this length should be good enough for us as well
//
2012-05-09 18:36:52 +00:00
memset ( ( void * ) & curr_pk_key , 0 , sizeof ( curr_pk_key ) ) ;
memset ( ( void * ) & curr_pk_val , 0 , sizeof ( curr_pk_val ) ) ;
2008-05-29 14:32:50 +00:00
//
// The files for secondary tables are derived from the name of keys
// If we try to add a key with the same name as an already existing key,
// We can crash. So here we check if any of the keys added has the same
// name of an existing key, and if so, we fail gracefully
//
for ( uint i = 0 ; i < num_of_keys ; i + + ) {
for ( uint j = 0 ; j < table_arg - > s - > keys ; j + + ) {
if ( strcmp ( key_info [ i ] . name , table_arg - > s - > key_info [ j ] . name ) = = 0 ) {
error = HA_ERR_WRONG_COMMAND ;
goto cleanup ;
}
}
}
2010-11-17 23:09:06 +00:00
rw_wrlock ( & share - > num_DBs_lock ) ;
rw_lock_taken = true ;
2008-05-26 14:07:31 +00:00
//
// open all the DB files and set the appropriate variables in share
// they go to the end of share->key_file
//
2011-01-06 19:02:48 +00:00
creating_hot_index = use_hot_index & & num_of_keys = = 1 & & ( key_info [ 0 ] . flags & HA_NOSAME ) = = 0 ;
2011-01-19 15:57:00 +00:00
if ( use_hot_index & & ( share - > num_DBs > curr_num_DBs ) ) {
//
// already have hot index in progress, get out
//
error = HA_ERR_INTERNAL_ERROR ;
goto cleanup ;
}
2008-06-17 14:55:31 +00:00
curr_index = curr_num_DBs ;
2011-03-04 19:54:23 +00:00
* modified_DBs = true ;
2008-05-26 14:07:31 +00:00
for ( uint i = 0 ; i < num_of_keys ; i + + , curr_index + + ) {
2009-04-17 18:29:25 +00:00
if ( key_info [ i ] . flags & HA_CLUSTERING ) {
set_key_filter (
2010-01-11 18:14:37 +00:00
& share - > kc_info . key_filters [ curr_index ] ,
2009-04-17 18:29:25 +00:00
& key_info [ i ] ,
table_arg ,
false
) ;
if ( ! hidden_primary_key ) {
set_key_filter (
2010-01-11 18:14:37 +00:00
& share - > kc_info . key_filters [ curr_index ] ,
2009-04-17 18:29:25 +00:00
& table_arg - > key_info [ primary_key ] ,
table_arg ,
false
) ;
}
2010-01-11 18:14:37 +00:00
error = initialize_col_pack_info ( & share - > kc_info , table_arg - > s , curr_index ) ;
2009-04-17 18:29:25 +00:00
if ( error ) {
goto cleanup ;
}
}
2012-04-04 15:12:36 +00:00
error = create_secondary_dictionary ( share - > table_name , table_arg , & key_info [ i ] , txn , & share - > kc_info , curr_index , creating_hot_index , row_type ) ;
2010-01-11 18:14:37 +00:00
if ( error ) { goto cleanup ; }
2009-11-10 19:22:08 +00:00
error = open_secondary_dictionary (
2008-05-26 14:07:31 +00:00
& share - > key_file [ curr_index ] ,
& key_info [ i ] ,
share - > table_name ,
2009-12-02 14:02:47 +00:00
false ,
2009-11-10 19:22:08 +00:00
txn
2008-05-26 14:07:31 +00:00
) ;
if ( error ) { goto cleanup ; }
}
2011-01-06 19:02:48 +00:00
if ( creating_hot_index ) {
2010-11-17 23:09:06 +00:00
share - > num_DBs + + ;
2011-03-04 19:54:23 +00:00
* inc_num_DBs = true ;
2010-11-17 23:09:06 +00:00
error = db_env - > create_indexer (
db_env ,
txn ,
& indexer ,
share - > file ,
num_of_keys ,
& share - > key_file [ curr_num_DBs ] ,
mult_db_flags ,
indexer_flags
) ;
if ( error ) { goto cleanup ; }
2010-03-29 02:08:34 +00:00
2010-11-17 23:09:06 +00:00
error = indexer - > set_poll_function ( indexer , ai_poll_fun , & lc ) ;
if ( error ) { goto cleanup ; }
2010-03-29 02:08:34 +00:00
2010-11-17 23:09:06 +00:00
error = indexer - > set_error_callback ( indexer , loader_ai_err_fun , & lc ) ;
if ( error ) { goto cleanup ; }
2008-06-12 20:20:54 +00:00
2010-11-17 23:09:06 +00:00
rw_unlock ( & share - > num_DBs_lock ) ;
rw_lock_taken = false ;
2012-06-30 16:51:25 +00:00
# ifdef HA_TOKUDB_HAS_THD_PROGRESS
// initialize a one phase progress report.
// incremental reports are done in the indexer's callback function.
thd_progress_init ( thd , 1 ) ;
# endif
2012-11-28 22:27:15 +00:00
while ( ha_tokudb_build_index_wait ) sleep ( 1 ) ; // debug
2010-11-17 23:09:06 +00:00
error = indexer - > build ( indexer ) ;
2012-06-30 16:51:25 +00:00
2010-11-17 23:09:06 +00:00
if ( error ) { goto cleanup ; }
2008-05-26 14:07:31 +00:00
2012-06-02 13:20:58 +00:00
rw_wrlock ( & share - > num_DBs_lock ) ;
2010-11-17 23:09:06 +00:00
error = indexer - > close ( indexer ) ;
2012-06-02 13:20:58 +00:00
rw_unlock ( & share - > num_DBs_lock ) ;
2010-11-17 23:09:06 +00:00
if ( error ) { goto cleanup ; }
indexer = NULL ;
2010-09-03 20:47:01 +00:00
}
2010-11-17 23:09:06 +00:00
else {
rw_unlock ( & share - > num_DBs_lock ) ;
rw_lock_taken = false ;
2011-10-19 15:26:48 +00:00
prelocked_right_range_size = 0 ;
prelocked_left_range_size = 0 ;
2011-10-16 02:02:29 +00:00
struct smart_dbt_bf_info bf_info ;
bf_info . ha = this ;
// you need the val if you have a clustering index and key_read is not 0;
bf_info . direction = 1 ;
bf_info . thd = ha_thd ( ) ;
2012-07-25 20:48:53 +00:00
bf_info . need_val = true ;
2011-10-16 02:02:29 +00:00
2010-11-17 23:09:06 +00:00
error = db_env - > create_loader (
db_env ,
txn ,
& loader ,
NULL , // no src_db needed
num_of_keys ,
& share - > key_file [ curr_num_DBs ] ,
mult_put_flags ,
mult_dbt_flags ,
loader_flags
) ;
if ( error ) { goto cleanup ; }
2010-09-03 20:47:01 +00:00
2012-06-30 16:51:25 +00:00
error = loader - > set_poll_function ( loader , loader_poll_fun , & lc ) ;
2010-11-17 23:09:06 +00:00
if ( error ) { goto cleanup ; }
2008-07-30 14:43:19 +00:00
2010-11-17 23:09:06 +00:00
error = loader - > set_error_callback ( loader , loader_ai_err_fun , & lc ) ;
if ( error ) { goto cleanup ; }
//
// scan primary table, create each secondary key, add to each DB
//
2011-03-04 19:54:23 +00:00
if ( ( error = share - > file - > cursor ( share - > file , txn , & tmp_cursor , DB_SERIALIZABLE ) ) ) {
2010-11-17 23:09:06 +00:00
tmp_cursor = NULL ; // Safety
2008-05-26 14:07:31 +00:00
goto cleanup ;
}
2008-07-30 14:43:19 +00:00
2010-11-17 23:09:06 +00:00
//
// grab some locks to make this go faster
// first a global read lock on the main DB, because
// we intend to scan the entire thing
//
2011-10-05 21:55:09 +00:00
error = tmp_cursor - > c_pre_acquire_range_lock (
tmp_cursor ,
share - > file - > dbt_neg_infty ( ) ,
share - > file - > dbt_pos_infty ( )
) ;
2010-03-29 02:08:34 +00:00
if ( error ) { goto cleanup ; }
2009-11-25 21:00:52 +00:00
2012-01-23 21:21:23 +00:00
// set the bulk fetch iteration to its max so that adding an
// index fills the bulk fetch buffer every time. we do not
// want it to grow exponentially fast.
rows_fetched_using_bulk_fetch = 0 ;
bulk_fetch_iteration = HA_TOKU_BULK_FETCH_ITERATION_MAX ;
2011-10-16 02:02:29 +00:00
cursor_ret_val = tmp_cursor - > c_getf_next ( tmp_cursor , DB_PRELOCKED , smart_dbt_bf_callback , & bf_info ) ;
2009-01-17 00:15:44 +00:00
2012-06-30 16:51:25 +00:00
# ifdef HA_TOKUDB_HAS_THD_PROGRESS
// initialize a two phase progress report.
// first phase: putting rows into the loader
thd_progress_init ( thd , 2 ) ;
# endif
2011-10-16 02:02:29 +00:00
while ( cursor_ret_val ! = DB_NOTFOUND | | ( ( bytes_used_in_range_query_buff - curr_range_query_buff_offset ) > 0 ) ) {
if ( ( bytes_used_in_range_query_buff - curr_range_query_buff_offset ) = = 0 ) {
2011-10-19 15:26:48 +00:00
invalidate_bulk_fetch ( ) ; // reset the buffers
2011-10-16 02:02:29 +00:00
cursor_ret_val = tmp_cursor - > c_getf_next ( tmp_cursor , DB_PRELOCKED , smart_dbt_bf_callback , & bf_info ) ;
if ( cursor_ret_val ! = DB_NOTFOUND & & cursor_ret_val ! = 0 ) {
error = cursor_ret_val ;
goto cleanup ;
}
2009-03-20 03:39:23 +00:00
}
2011-10-19 15:26:48 +00:00
// do this check in case the the c_getf_next did not put anything into the buffer because
// there was no more data
2011-10-16 02:02:29 +00:00
if ( ( bytes_used_in_range_query_buff - curr_range_query_buff_offset ) = = 0 ) {
break ;
}
2011-10-19 15:26:48 +00:00
// at this point, we know the range query buffer has at least one key/val pair
2011-10-16 02:02:29 +00:00
uchar * curr_pos = range_query_buff + curr_range_query_buff_offset ;
2012-07-25 20:48:53 +00:00
uint32_t key_size = * ( uint32_t * ) curr_pos ;
2011-10-16 02:02:29 +00:00
curr_pos + = sizeof ( key_size ) ;
uchar * curr_key_buff = curr_pos ;
curr_pos + = key_size ;
curr_pk_key . data = curr_key_buff ;
curr_pk_key . size = key_size ;
2012-07-25 20:48:53 +00:00
uint32_t val_size = * ( uint32_t * ) curr_pos ;
2011-10-16 02:02:29 +00:00
curr_pos + = sizeof ( val_size ) ;
uchar * curr_val_buff = curr_pos ;
curr_pos + = val_size ;
curr_pk_val . data = curr_val_buff ;
curr_pk_val . size = val_size ;
curr_range_query_buff_offset = curr_pos - range_query_buff ;
2008-08-13 20:40:43 +00:00
2010-11-17 23:09:06 +00:00
error = loader - > put ( loader , & curr_pk_key , & curr_pk_val ) ;
if ( error ) { goto cleanup ; }
2009-01-17 00:15:44 +00:00
2010-11-17 23:09:06 +00:00
num_processed + + ;
if ( ( num_processed % 1000 ) = = 0 ) {
2012-11-20 16:11:50 +00:00
sprintf ( status_msg , " Adding indexes: Fetched %llu of about %llu rows, loading of data still remains. " , num_processed , ( long long unsigned ) share - > rows ) ;
2010-11-17 23:09:06 +00:00
thd_proc_info ( thd , status_msg ) ;
2012-06-30 16:51:25 +00:00
# ifdef HA_TOKUDB_HAS_THD_PROGRESS
thd_progress_report ( thd , num_processed , ( long long unsigned ) share - > rows ) ;
# endif
2010-11-17 23:09:06 +00:00
if ( thd - > killed ) {
error = ER_ABORTING_CONNECTION ;
goto cleanup ;
}
}
}
error = tmp_cursor - > c_close ( tmp_cursor ) ;
assert ( error = = 0 ) ;
tmp_cursor = NULL ;
2012-06-30 16:51:25 +00:00
# ifdef HA_TOKUDB_HAS_THD_PROGRESS
// next progress report phase: closing the loader.
// incremental reports are done in the loader's callback function.
thd_progress_next_stage ( thd ) ;
# endif
2010-11-17 23:09:06 +00:00
error = loader - > close ( loader ) ;
loader = NULL ;
2012-06-30 16:51:25 +00:00
2010-11-17 23:09:06 +00:00
if ( error ) goto cleanup ;
}
2010-03-29 02:08:34 +00:00
curr_index = curr_num_DBs ;
for ( uint i = 0 ; i < num_of_keys ; i + + , curr_index + + ) {
if ( key_info [ i ] . flags & HA_NOSAME ) {
bool is_unique ;
error = is_index_unique (
& is_unique ,
txn ,
share - > key_file [ curr_index ] ,
& key_info [ i ]
) ;
if ( error ) goto cleanup ;
if ( ! is_unique ) {
error = HA_ERR_FOUND_DUPP_KEY ;
last_dup_key = i ;
2008-08-13 20:40:43 +00:00
goto cleanup ;
}
}
}
2010-03-29 02:08:34 +00:00
//
// We have an accurate row count, might as well update share->rows
//
2012-04-11 16:42:12 +00:00
if ( ! creating_hot_index ) {
pthread_mutex_lock ( & share - > mutex ) ;
share - > rows = num_processed ;
pthread_mutex_unlock ( & share - > mutex ) ;
}
2009-11-10 19:22:08 +00:00
//
// now write stuff to status.tokudb
//
pthread_mutex_lock ( & share - > mutex ) ;
for ( uint i = 0 ; i < num_of_keys ; i + + ) {
write_key_name_to_status ( share - > status_block , key_info [ i ] . name , txn ) ;
}
pthread_mutex_unlock ( & share - > mutex ) ;
2008-05-26 14:07:31 +00:00
error = 0 ;
cleanup :
2012-06-30 16:51:25 +00:00
# ifdef HA_TOKUDB_HAS_THD_PROGRESS
thd_progress_end ( thd ) ;
# endif
2010-11-17 23:09:06 +00:00
if ( rw_lock_taken ) {
rw_unlock ( & share - > num_DBs_lock ) ;
rw_lock_taken = false ;
}
2009-11-10 19:22:08 +00:00
if ( tmp_cursor ) {
2009-12-03 16:59:52 +00:00
int r = tmp_cursor - > c_close ( tmp_cursor ) ;
assert ( r = = 0 ) ;
2009-11-10 19:22:08 +00:00
tmp_cursor = NULL ;
}
2010-03-29 02:08:34 +00:00
if ( loader ! = NULL ) {
2010-06-16 20:56:08 +00:00
sprintf ( status_msg , " aborting creation of indexes. " ) ;
thd_proc_info ( thd , status_msg ) ;
2010-03-29 02:08:34 +00:00
loader - > abort ( loader ) ;
}
2010-11-17 23:09:06 +00:00
if ( indexer ! = NULL ) {
sprintf ( status_msg , " aborting creation of indexes. " ) ;
thd_proc_info ( thd , status_msg ) ;
2012-06-02 13:20:58 +00:00
rw_wrlock ( & share - > num_DBs_lock ) ;
2010-11-17 23:09:06 +00:00
indexer - > abort ( indexer ) ;
2012-06-02 13:20:58 +00:00
rw_unlock ( & share - > num_DBs_lock ) ;
2010-11-17 23:09:06 +00:00
}
2011-03-04 19:54:23 +00:00
if ( error = = DB_LOCK_NOTGRANTED & & ( ( tokudb_debug & TOKUDB_DEBUG_HIDE_DDL_LOCK_ERRORS ) = = 0 ) ) {
sql_print_error ( " Could not add indexes to table %s because \
2009-11-12 19:36:40 +00:00
another transaction has accessed the table . \
To add indexes , make sure no transactions touch the table . " , share->table_name);
2011-03-04 19:54:23 +00:00
}
2010-03-29 02:08:34 +00:00
TOKUDB_DBUG_RETURN ( error ? error : loader_error ) ;
2008-05-26 14:07:31 +00:00
}
2011-03-05 00:29:11 +00:00
//
// Internal function called by ha_tokudb::add_index and ha_tokudb::alter_table_phase2
// Closes added indexes in case of error in error path of add_index and alter_table_phase2
//
2011-03-04 19:54:23 +00:00
void ha_tokudb : : restore_add_index ( TABLE * table_arg , uint num_of_keys , bool incremented_numDBs , bool modified_DBs ) {
uint curr_num_DBs = table_arg - > s - > keys + test ( hidden_primary_key ) ;
uint curr_index = 0 ;
//
// need to restore num_DBs, and we have to do it before we close the dictionaries
// so that there is not a window
//
if ( incremented_numDBs ) {
rw_wrlock ( & share - > num_DBs_lock ) ;
share - > num_DBs - - ;
}
if ( modified_DBs ) {
curr_index = curr_num_DBs ;
for ( uint i = 0 ; i < num_of_keys ; i + + , curr_index + + ) {
reset_key_and_col_info ( & share - > kc_info , curr_index ) ;
}
curr_index = curr_num_DBs ;
for ( uint i = 0 ; i < num_of_keys ; i + + , curr_index + + ) {
if ( share - > key_file [ curr_index ] ) {
int r = share - > key_file [ curr_index ] - > close (
share - > key_file [ curr_index ] ,
0
) ;
assert ( r = = 0 ) ;
share - > key_file [ curr_index ] = NULL ;
}
}
}
if ( incremented_numDBs ) {
rw_unlock ( & share - > num_DBs_lock ) ;
}
}
2008-05-26 14:07:31 +00:00
2012-03-19 12:15:50 +00:00
volatile int ha_tokudb_drop_indexes_wait = 0 ; // debug
2011-03-05 00:29:11 +00:00
//
// Internal function called by ha_tokudb::prepare_drop_index and ha_tokudb::alter_table_phase2
// With a transaction, drops dictionaries associated with indexes in key_num
//
2012-08-02 19:43:03 +00:00
int ha_tokudb : : drop_indexes ( TABLE * table_arg , uint * key_num , uint num_of_keys , KEY * key_info , DB_TXN * txn ) {
2011-03-04 19:54:23 +00:00
TOKUDB_DBUG_ENTER ( " ha_tokudb::drop_indexes " ) ;
2012-05-21 18:56:56 +00:00
assert ( txn ) ;
2012-04-02 18:27:34 +00:00
while ( ha_tokudb_drop_indexes_wait ) sleep ( 1 ) ; // debug
2012-03-19 12:15:50 +00:00
2011-04-21 01:37:04 +00:00
int error = 0 ;
2010-10-28 20:36:27 +00:00
for ( uint i = 0 ; i < num_of_keys ; i + + ) {
uint curr_index = key_num [ i ] ;
error = share - > key_file [ curr_index ] - > pre_acquire_fileops_lock ( share - > key_file [ curr_index ] , txn ) ;
if ( error ! = 0 ) {
goto cleanup ;
}
}
2008-05-26 14:07:31 +00:00
for ( uint i = 0 ; i < num_of_keys ; i + + ) {
uint curr_index = key_num [ i ] ;
2009-12-03 15:49:42 +00:00
int r = share - > key_file [ curr_index ] - > close ( share - > key_file [ curr_index ] , 0 ) ;
assert ( r = = 0 ) ;
2008-05-26 14:07:31 +00:00
share - > key_file [ curr_index ] = NULL ;
2012-08-02 19:43:03 +00:00
error = remove_key_name_from_status ( share - > status_block , key_info [ curr_index ] . name , txn ) ;
2009-11-10 19:22:08 +00:00
if ( error ) { goto cleanup ; }
2012-08-02 19:43:03 +00:00
error = delete_or_rename_dictionary ( share - > table_name , NULL , key_info [ curr_index ] . name , true , txn , true ) ;
2009-11-10 19:22:08 +00:00
if ( error ) { goto cleanup ; }
2008-05-26 14:07:31 +00:00
}
2010-08-16 18:58:33 +00:00
2008-05-26 14:07:31 +00:00
cleanup :
2010-08-16 18:58:33 +00:00
if ( error = = DB_LOCK_NOTGRANTED & & ( ( tokudb_debug & TOKUDB_DEBUG_HIDE_DDL_LOCK_ERRORS ) = = 0 ) ) {
sql_print_error ( " Could not drop indexes from table %s because \
2009-11-12 19:36:40 +00:00
another transaction has accessed the table . \
To drop indexes , make sure no transactions touch the table . " , share->table_name);
2010-08-16 18:58:33 +00:00
}
2008-05-26 14:07:31 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
}
2011-03-05 00:29:11 +00:00
//
// Internal function called by ha_tokudb::prepare_drop_index and ha_tokudb::alter_table_phase2
// Restores dropped indexes in case of error in error path of prepare_drop_index and alter_table_phase2
//
2011-03-04 19:54:23 +00:00
void ha_tokudb : : restore_drop_indexes ( TABLE * table_arg , uint * key_num , uint num_of_keys ) {
2012-03-23 15:49:27 +00:00
2011-03-04 19:54:23 +00:00
//
// reopen closed dictionaries
//
for ( uint i = 0 ; i < num_of_keys ; i + + ) {
int r ;
uint curr_index = key_num [ i ] ;
if ( share - > key_file [ curr_index ] = = NULL ) {
r = open_secondary_dictionary (
& share - > key_file [ curr_index ] ,
& table_share - > key_info [ curr_index ] ,
share - > table_name ,
false , //
NULL
) ;
assert ( ! r ) ;
}
}
}
2012-03-19 12:15:50 +00:00
2008-02-07 20:19:44 +00:00
void ha_tokudb : : print_error ( int error , myf errflag ) {
2008-04-03 11:17:39 +00:00
if ( error = = DB_LOCK_DEADLOCK )
2008-02-07 20:19:44 +00:00
error = HA_ERR_LOCK_DEADLOCK ;
2008-04-03 11:17:39 +00:00
if ( error = = DB_LOCK_NOTGRANTED )
2008-04-03 18:45:00 +00:00
error = HA_ERR_LOCK_WAIT_TIMEOUT ;
2010-07-01 16:36:17 +00:00
# if defined(HA_ERR_DISK_FULL)
2010-01-25 13:25:19 +00:00
if ( error = = ENOSPC ) {
error = HA_ERR_DISK_FULL ;
}
2010-07-01 16:36:17 +00:00
# endif
2010-03-29 02:08:34 +00:00
if ( error = = DB_KEYEXIST ) {
error = HA_ERR_FOUND_DUPP_KEY ;
}
2011-03-25 12:08:58 +00:00
# if defined(HA_ALTER_ERROR)
2011-03-04 19:54:23 +00:00
if ( error = = HA_ALTER_ERROR ) {
error = HA_ERR_UNSUPPORTED ;
2011-03-25 12:08:58 +00:00
}
# endif
2012-01-02 19:51:33 +00:00
// TODO: should rename debug code to something better
// just reusing this so that tests don' start complaining
2012-01-20 17:43:58 +00:00
# if MYSQL_VERSION_ID < 50500
2012-01-02 19:51:33 +00:00
if ( ( tokudb_debug & TOKUDB_DEBUG_HIDE_DDL_LOCK_ERRORS ) = = 0 ) {
2012-01-20 17:43:58 +00:00
THD * thd = ha_thd ( ) ;
2012-03-27 03:35:56 +00:00
if ( get_log_client_errors ( thd ) ) {
sql_print_error ( " query \" %s \" returned handler error %d " , thd - > query_string . str , error ) ;
}
2012-01-02 19:51:33 +00:00
}
2012-01-20 17:43:58 +00:00
# endif
2008-02-07 20:19:44 +00:00
handler : : print_error ( error , errflag ) ;
}
2008-02-05 16:00:53 +00:00
2009-11-10 19:22:08 +00:00
//
// truncate's dictionary associated with keynr index using transaction txn
// does so by deleting and then recreating the dictionary in the context
// of a transaction
//
int ha_tokudb : : truncate_dictionary ( uint keynr , DB_TXN * txn ) {
int error ;
bool is_pk = ( keynr = = primary_key ) ;
2012-04-03 23:44:18 +00:00
2012-04-04 15:12:36 +00:00
const enum row_type row_type = get_row_type_for_key ( share - > key_file [ keynr ] ) ;
2009-11-10 19:22:08 +00:00
error = share - > key_file [ keynr ] - > close ( share - > key_file [ keynr ] , 0 ) ;
2009-12-03 15:49:42 +00:00
assert ( error = = 0 ) ;
2009-11-10 19:22:08 +00:00
share - > key_file [ keynr ] = NULL ;
if ( is_pk ) { share - > file = NULL ; }
if ( is_pk ) {
error = delete_or_rename_dictionary (
share - > table_name ,
NULL ,
" main " ,
2009-12-03 15:39:53 +00:00
false , //is_key
2009-11-10 19:22:08 +00:00
txn ,
true // is a delete
) ;
if ( error ) { goto cleanup ; }
}
else {
error = delete_or_rename_dictionary (
share - > table_name ,
NULL ,
table_share - > key_info [ keynr ] . name ,
2009-12-03 15:39:53 +00:00
true , //is_key
2009-11-10 19:22:08 +00:00
txn ,
true // is a delete
) ;
if ( error ) { goto cleanup ; }
}
if ( is_pk ) {
2012-04-04 15:12:36 +00:00
error = create_main_dictionary ( share - > table_name , table , txn , & share - > kc_info , row_type ) ;
2009-11-10 19:22:08 +00:00
}
else {
error = create_secondary_dictionary (
share - > table_name ,
table ,
& table_share - > key_info [ keynr ] ,
2010-01-11 18:14:37 +00:00
txn ,
& share - > kc_info ,
2011-01-06 19:02:48 +00:00
keynr ,
2012-04-04 15:12:36 +00:00
false ,
row_type
2009-11-10 19:22:08 +00:00
) ;
}
if ( error ) { goto cleanup ; }
cleanup :
return error ;
}
2012-04-02 18:27:34 +00:00
volatile int ha_tokudb_truncate_wait = 0 ; // debug
2010-11-25 04:14:15 +00:00
// for 5.5
int ha_tokudb : : truncate ( ) {
2012-04-02 18:27:34 +00:00
TOKUDB_DBUG_ENTER ( " truncate " ) ;
while ( ha_tokudb_truncate_wait ) sleep ( 1 ) ; // debug
2012-04-04 20:44:23 +00:00
int error = delete_all_rows_internal ( ) ;
2012-04-02 18:27:34 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
2010-11-25 04:14:15 +00:00
}
2008-07-21 13:27:13 +00:00
// delete all rows from a table
//
// effects: delete all of the rows in the main dictionary and all of the
// indices. this must be atomic, so we use the statement transaction
// for all of the truncate operations.
// locks: if we have an exclusive table write lock, all of the concurrency
// issues go away.
// returns: 0 if success
int ha_tokudb : : delete_all_rows ( ) {
TOKUDB_DBUG_ENTER ( " delete_all_rows " ) ;
int error = 0 ;
2012-04-04 20:44:23 +00:00
if ( thd_sql_command ( ha_thd ( ) ) ! = SQLCOM_TRUNCATE ) {
share - > try_table_lock = true ;
error = HA_ERR_WRONG_COMMAND ;
}
if ( error = = 0 )
error = delete_all_rows_internal ( ) ;
TOKUDB_DBUG_RETURN ( error ) ;
}
int ha_tokudb : : delete_all_rows_internal ( ) {
TOKUDB_DBUG_ENTER ( " delete_all_rows_internal " ) ;
int error = 0 ;
2009-06-30 12:20:06 +00:00
uint curr_num_DBs = 0 ;
2009-11-10 19:22:08 +00:00
DB_TXN * txn = NULL ;
error = db_env - > txn_begin ( db_env , 0 , & txn , 0 ) ;
if ( error ) { goto cleanup ; }
2008-07-21 13:27:13 +00:00
2009-06-30 12:20:06 +00:00
curr_num_DBs = table - > s - > keys + test ( hidden_primary_key ) ;
2010-10-28 20:36:27 +00:00
for ( uint i = 0 ; i < curr_num_DBs ; i + + ) {
error = share - > key_file [ i ] - > pre_acquire_fileops_lock (
share - > key_file [ i ] ,
txn
) ;
if ( error ) { goto cleanup ; }
2012-02-08 20:28:17 +00:00
error = share - > key_file [ i ] - > pre_acquire_table_lock (
share - > key_file [ i ] ,
txn
) ;
if ( error ) { goto cleanup ; }
2010-10-28 20:36:27 +00:00
}
2008-07-21 13:27:13 +00:00
for ( uint i = 0 ; i < curr_num_DBs ; i + + ) {
2009-11-10 19:22:08 +00:00
error = truncate_dictionary ( i , txn ) ;
if ( error ) { goto cleanup ; }
2008-07-21 13:27:13 +00:00
}
// zap the row count
2009-06-29 17:23:06 +00:00
if ( error = = 0 ) {
2008-07-21 13:27:13 +00:00
share - > rows = 0 ;
2012-11-13 21:54:58 +00:00
// update auto increment
share - > last_auto_increment = 0 ;
// calling write_to_status directly because we need to use txn
write_to_status (
share - > status_block ,
hatoku_max_ai ,
& share - > last_auto_increment ,
sizeof ( share - > last_auto_increment ) ,
txn
) ;
2009-06-29 17:23:06 +00:00
}
2009-11-10 19:22:08 +00:00
2010-03-30 00:06:10 +00:00
share - > try_table_lock = true ;
2009-06-29 17:23:06 +00:00
cleanup :
2009-11-10 19:22:08 +00:00
if ( txn ) {
if ( error ) {
abort_txn ( txn ) ;
}
else {
commit_txn ( txn , 0 ) ;
}
}
2012-03-23 15:49:27 +00:00
if ( error = = DB_LOCK_NOTGRANTED & & ( ( tokudb_debug & TOKUDB_DEBUG_HIDE_DDL_LOCK_ERRORS ) = = 0 ) ) {
sql_print_error ( " Could not truncate table %s because another transaction has accessed the \
table . To truncate the table , make sure no transactions touch the table . " ,
share - > table_name ) ;
}
2009-11-10 19:22:08 +00:00
//
// regardless of errors, need to reopen the DB's
//
for ( uint i = 0 ; i < curr_num_DBs ; i + + ) {
int r = 0 ;
if ( share - > key_file [ i ] = = NULL ) {
if ( i ! = primary_key ) {
r = open_secondary_dictionary (
& share - > key_file [ i ] ,
& table_share - > key_info [ i ] ,
share - > table_name ,
2009-12-02 14:02:47 +00:00
false , //
2009-11-10 19:22:08 +00:00
NULL
) ;
assert ( ! r ) ;
}
else {
r = open_main_dictionary (
share - > table_name ,
2009-12-02 14:02:47 +00:00
false ,
2009-11-10 19:22:08 +00:00
NULL
) ;
assert ( ! r ) ;
}
}
}
2008-07-21 13:27:13 +00:00
TOKUDB_DBUG_RETURN ( error ) ;
}
2010-03-29 02:08:34 +00:00
void ha_tokudb : : set_loader_error ( int err ) {
loader_error = err ;
}
2012-05-21 18:56:56 +00:00
2010-03-29 02:08:34 +00:00
void ha_tokudb : : set_dup_value_for_pk ( DBT * key ) {
assert ( ! hidden_primary_key ) ;
unpack_key ( table - > record [ 0 ] , key , primary_key ) ;
last_dup_key = primary_key ;
}
2008-03-19 20:21:49 +00:00
2013-02-17 00:14:14 +00:00
void ha_tokudb : : close_dsmrr ( ) {
# ifdef MARIADB_BASE_VERSION
ds_mrr . dsmrr_close ( ) ;
2013-02-17 03:44:31 +00:00
# elif 50600 <= MYSQL_VERSION_ID && MYSQL_VERSION_ID <= 50699
ds_mrr . dsmrr_close ( ) ;
# endif
}
void ha_tokudb : : reset_dsmrr ( ) {
# ifdef MARIADB_BASE_VERSION
ds_mrr . dsmrr_close ( ) ;
# elif 50600 <= MYSQL_VERSION_ID && MYSQL_VERSION_ID <= 50699
ds_mrr . reset ( ) ;
2013-02-17 00:14:14 +00:00
# endif
}
2013-02-20 20:36:28 +00:00
// we cache the information so we can do filtering ourselves,
// but as far as MySQL knows, we are not doing any filtering,
// so if we happen to miss filtering a row that does not match
// idx_cond_arg, MySQL will catch it.
// This allows us the ability to deal with only index_next and index_prev,
// and not need to worry about other index_XXX functions
Item * ha_tokudb : : idx_cond_push ( uint keyno_arg , Item * idx_cond_arg ) {
toku_pushed_idx_cond_keyno = keyno_arg ;
toku_pushed_idx_cond = idx_cond_arg ;
return idx_cond_arg ;
}
2013-02-17 00:14:14 +00:00
2012-05-24 20:47:47 +00:00
// table admin
# include "ha_tokudb_admin.cc"
2012-04-02 18:27:34 +00:00
2012-11-27 15:23:21 +00:00
// update functions
2012-06-05 00:52:30 +00:00
# include "ha_tokudb_update_fun.cc"
2012-11-27 15:23:21 +00:00
// fast updates
# include "ha_tokudb_update.cc"
// alter table code for various mysql distros
2012-05-21 18:56:56 +00:00
# include "ha_tokudb_alter_55.cc"
# include "ha_tokudb_alter_56.cc"
2012-05-23 17:51:36 +00:00
2013-02-17 00:14:14 +00:00
// maria mrr
# ifdef MARIADB_BASE_VERSION
# include "ha_tokudb_mrr_maria.cc"
# endif
2013-02-17 03:44:31 +00:00
# if !defined(MARIADB_BASE_VERSION)
# if 50600 <= MYSQL_VERSION_ID && MYSQL_VERSION_ID <= 50699
# include "ha_tokudb_mrr_mysql.cc"
# endif
# endif
2012-05-23 17:51:36 +00:00
// key comparisons
# include "hatoku_cmp.cc"
// handlerton
# include "hatoku_hton.cc"