mirror of
https://github.com/MariaDB/server.git
synced 2025-01-27 09:14:17 +01:00
571 lines
18 KiB
C++
571 lines
18 KiB
C++
/* Copyright (c) 2007, 2013, Oracle and/or its affiliates.
|
|
Copyright (c) 2008, 2022, MariaDB Corporation.
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; version 2 of the License.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; if not, write to the Free Software
|
|
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1335 USA */
|
|
|
|
#include "mariadb.h"
|
|
#include "sql_priv.h"
|
|
#include "unireg.h"
|
|
#include "rpl_rli.h"
|
|
#include "rpl_record.h"
|
|
#include "slave.h" // Need to pull in slave_print_msg
|
|
#include "rpl_utility.h"
|
|
#include "rpl_rli.h"
|
|
|
|
/**
|
|
Pack a record of data for a table into a format suitable for
|
|
transfer via the binary log.
|
|
|
|
The format for a row in transfer with N fields is the following:
|
|
|
|
ceil(N/8) null bytes:
|
|
One null bit for every column *regardless of whether it can be
|
|
null or not*. This simplifies the decoding. Observe that the
|
|
number of null bits is equal to the number of set bits in the
|
|
@c cols bitmap. The number of null bytes is the smallest number
|
|
of bytes necessary to store the null bits.
|
|
|
|
Padding bits are 1.
|
|
|
|
N packets:
|
|
Each field is stored in packed format.
|
|
|
|
|
|
@param table Table describing the format of the record
|
|
|
|
@param cols Bitmap with a set bit for each column that should
|
|
be stored in the row
|
|
|
|
@param row_data Pointer to memory where row will be written
|
|
|
|
@param record Pointer to record that should be packed. It is
|
|
assumed that the pointer refers to either @c
|
|
record[0] or @c record[1], but no such check is
|
|
made since the code does not rely on that.
|
|
|
|
@return The number of bytes written at @c row_data.
|
|
*/
|
|
#if !defined(MYSQL_CLIENT)
|
|
size_t
|
|
pack_row(TABLE *table, MY_BITMAP const* cols,
|
|
uchar *row_data, const uchar *record)
|
|
{
|
|
Field **p_field= table->field, *field;
|
|
int const null_byte_count= (bitmap_bits_set(cols) + 7) / 8;
|
|
uchar *pack_ptr = row_data + null_byte_count;
|
|
uchar *null_ptr = row_data;
|
|
my_ptrdiff_t const rec_offset= record - table->record[0];
|
|
my_ptrdiff_t const def_offset= table->s->default_values - table->record[0];
|
|
|
|
DBUG_ENTER("pack_row");
|
|
|
|
/*
|
|
We write the null bits and the packed records using one pass
|
|
through all the fields. The null bytes are written little-endian,
|
|
i.e., the first fields are in the first byte.
|
|
*/
|
|
unsigned int null_bits= (1U << 8) - 1;
|
|
// Mask to mask out the correct but among the null bits
|
|
unsigned int null_mask= 1U;
|
|
for ( ; (field= *p_field) ; p_field++)
|
|
{
|
|
if (bitmap_is_set(cols, (uint)(p_field - table->field)))
|
|
{
|
|
my_ptrdiff_t offset;
|
|
if (field->is_null(rec_offset))
|
|
{
|
|
offset= def_offset;
|
|
null_bits |= null_mask;
|
|
}
|
|
else
|
|
{
|
|
offset= rec_offset;
|
|
null_bits &= ~null_mask;
|
|
|
|
/*
|
|
We only store the data of the field if it is non-null
|
|
|
|
For big-endian machines, we have to make sure that the
|
|
length is stored in little-endian format, since this is the
|
|
format used for the binlog.
|
|
*/
|
|
#ifndef DBUG_OFF
|
|
const uchar *old_pack_ptr= pack_ptr;
|
|
#endif
|
|
pack_ptr= field->pack(pack_ptr, field->ptr + offset,
|
|
field->max_data_length());
|
|
DBUG_PRINT("debug", ("field: %s; real_type: %d, pack_ptr: %p;"
|
|
" pack_ptr':%p; bytes: %d",
|
|
field->field_name.str, field->real_type(),
|
|
old_pack_ptr,pack_ptr,
|
|
(int) (pack_ptr - old_pack_ptr)));
|
|
DBUG_DUMP("packed_data", old_pack_ptr, pack_ptr - old_pack_ptr);
|
|
}
|
|
|
|
null_mask <<= 1;
|
|
if ((null_mask & 0xFF) == 0)
|
|
{
|
|
DBUG_ASSERT(null_ptr < row_data + null_byte_count);
|
|
null_mask = 1U;
|
|
*null_ptr++ = null_bits;
|
|
null_bits= (1U << 8) - 1;
|
|
}
|
|
}
|
|
}
|
|
|
|
/*
|
|
Write the last (partial) byte, if there is one
|
|
*/
|
|
if ((null_mask & 0xFF) > 1)
|
|
{
|
|
DBUG_ASSERT(null_ptr < row_data + null_byte_count);
|
|
*null_ptr++ = null_bits;
|
|
}
|
|
|
|
/*
|
|
The null pointer should now point to the first byte of the
|
|
packed data. If it doesn't, something is very wrong.
|
|
*/
|
|
DBUG_ASSERT(null_ptr == row_data + null_byte_count);
|
|
DBUG_DUMP("row_data", row_data, pack_ptr - row_data);
|
|
DBUG_RETURN(static_cast<size_t>(pack_ptr - row_data));
|
|
}
|
|
#endif
|
|
|
|
#if !defined(MYSQL_CLIENT) && defined(HAVE_REPLICATION)
|
|
|
|
struct Unpack_record_state
|
|
{
|
|
uchar const *const row_data;
|
|
uchar const *const row_end;
|
|
size_t const master_null_byte_count;
|
|
uchar const *null_ptr;
|
|
uchar const *pack_ptr;
|
|
/** Mask to mask out the correct bit among the null bits */
|
|
unsigned int null_mask;
|
|
/** The "current" null bits */
|
|
unsigned int null_bits;
|
|
Unpack_record_state(uchar const *const row_data,
|
|
uchar const *const row_end,
|
|
size_t const master_null_byte_count)
|
|
: row_data(row_data), row_end(row_end),
|
|
master_null_byte_count(master_null_byte_count),
|
|
null_ptr(row_data), pack_ptr(row_data + master_null_byte_count)
|
|
{}
|
|
void next_null_byte()
|
|
{
|
|
DBUG_ASSERT(null_ptr < row_data + master_null_byte_count);
|
|
null_mask= 1U;
|
|
null_bits= *null_ptr++;
|
|
}
|
|
};
|
|
|
|
|
|
static bool unpack_field(const table_def *tabledef, Field *f,
|
|
Unpack_record_state *st, uint field_idx)
|
|
{
|
|
if ((st->null_mask & 0xFF) == 0)
|
|
st->next_null_byte();
|
|
|
|
DBUG_ASSERT(st->null_mask & 0xFF); // One of the 8 LSB should be set
|
|
|
|
if (st->null_bits & st->null_mask)
|
|
{
|
|
if (f->maybe_null())
|
|
{
|
|
DBUG_PRINT("debug", ("Was NULL; null mask: 0x%x; null bits: 0x%x",
|
|
st->null_mask, st->null_bits));
|
|
/**
|
|
Calling reset just in case one is unpacking on top a
|
|
record with data.
|
|
|
|
This could probably go into set_null() but doing so,
|
|
(i) triggers assertion in other parts of the code at
|
|
the moment; (ii) it would make us reset the field,
|
|
always when setting null, which right now doesn't seem
|
|
needed anywhere else except here.
|
|
|
|
TODO: maybe in the future we should consider moving
|
|
the reset to make it part of set_null. But then
|
|
the assertions triggered need to be
|
|
addressed/revisited.
|
|
*/
|
|
|
|
#ifndef DBUG_OFF
|
|
/*
|
|
f->reset() may call store_value() to reset the value, for example
|
|
Field_new_decimal. store_value() has below assertion:
|
|
|
|
DBUG_ASSERT(marked_for_write_or_computed());
|
|
|
|
It asserts write bitmap must be set. That caused an assertion
|
|
failure for row images generated by FULL_NODUP mode.
|
|
The assertion is meaningless for unpacking a row image, so
|
|
the field is marked in write_set temporarily to avoid the
|
|
assertion failure.
|
|
*/
|
|
bool was_not_set = !bitmap_is_set(f->table->write_set, f->field_index);
|
|
if (was_not_set)
|
|
bitmap_set_bit(f->table->write_set, f->field_index);
|
|
#endif
|
|
f->reset();
|
|
#ifndef DBUG_OFF
|
|
if (was_not_set)
|
|
bitmap_clear_bit(f->table->write_set, f->field_index);
|
|
#endif
|
|
f->set_null();
|
|
}
|
|
else
|
|
{
|
|
THD *thd= f->table->in_use;
|
|
|
|
f->set_default();
|
|
push_warning_printf(thd, Sql_condition::WARN_LEVEL_WARN,
|
|
ER_BAD_NULL_ERROR,
|
|
ER_THD(thd, ER_BAD_NULL_ERROR),
|
|
f->field_name.str);
|
|
}
|
|
}
|
|
else
|
|
{
|
|
f->set_notnull();
|
|
|
|
/*
|
|
We only unpack the field if it was non-null.
|
|
Use the master's size information if available else call
|
|
normal unpack operation.
|
|
*/
|
|
uint16 const metadata = tabledef->field_metadata(field_idx);
|
|
#ifdef DBUG_TRACE
|
|
uchar const *const old_pack_ptr= st->pack_ptr;
|
|
#endif
|
|
|
|
st->pack_ptr= f->unpack(f->ptr, st->pack_ptr, st->row_end, metadata);
|
|
DBUG_PRINT("debug", ("field: %s; metadata: 0x%x;"
|
|
" pack_ptr: %p; pack_ptr': %p; bytes: %d",
|
|
f->field_name.str, metadata,
|
|
old_pack_ptr, st->pack_ptr,
|
|
(int) (st->pack_ptr - old_pack_ptr)));
|
|
if (!st->pack_ptr)
|
|
return false;
|
|
}
|
|
st->null_mask <<= 1;
|
|
return true;
|
|
}
|
|
|
|
static void convert_field(Field *f, Field *result_field, Field *conv_field)
|
|
{
|
|
#ifndef DBUG_OFF
|
|
char type_buf[MAX_FIELD_WIDTH];
|
|
char value_buf[MAX_FIELD_WIDTH];
|
|
String source_type(type_buf, sizeof(type_buf), system_charset_info);
|
|
String value_string(value_buf, sizeof(value_buf), system_charset_info);
|
|
conv_field->sql_type(source_type);
|
|
conv_field->val_str(&value_string);
|
|
DBUG_PRINT("debug", ("Copying field '%s' of type '%s' with value '%s'",
|
|
result_field->field_name.str,
|
|
source_type.c_ptr_safe(), value_string.c_ptr_safe()));
|
|
#endif
|
|
|
|
Copy_field copy;
|
|
copy.set(result_field, f, TRUE);
|
|
(*copy.do_copy)(©);
|
|
|
|
#ifndef DBUG_OFF
|
|
String target_type(type_buf, sizeof(type_buf), system_charset_info);
|
|
result_field->sql_type(target_type);
|
|
result_field->val_str(&value_string);
|
|
DBUG_PRINT("debug", ("Value of field '%s' of type '%s' is now '%s'",
|
|
result_field->field_name.str,
|
|
target_type.c_ptr_safe(), value_string.c_ptr_safe()));
|
|
#endif
|
|
}
|
|
|
|
|
|
/**
|
|
Unpack a row into @c table->record[0].
|
|
|
|
The function will always unpack into the @c table->record[0]
|
|
record. This is because there are too many dependencies on where
|
|
the various member functions of Field and subclasses expect to
|
|
write.
|
|
|
|
The row is assumed to only consist of the fields for which the
|
|
corresponding bit in bitset @c cols is set; the other parts of the
|
|
record are left alone.
|
|
|
|
At most @c colcnt columns are read: if the table is larger than
|
|
that, the remaining fields are not filled in.
|
|
|
|
@note The relay log information can be NULL, which means that no
|
|
checking or comparison with the source table is done, simply
|
|
because it is not used. This feature is used by MySQL Backup to
|
|
unpack a row from from the backup image, but can be used for other
|
|
purposes as well.
|
|
|
|
@param rgi Relay group info
|
|
@param table Table to unpack into
|
|
@param colcnt Number of columns to read from record
|
|
@param row_data
|
|
Packed row datanull_ptr
|
|
@param cols Pointer to bitset describing columns to fill in
|
|
@param curr_row_end
|
|
Pointer to variable that will hold the value of the
|
|
one-after-end position for the current row
|
|
@param master_reclength
|
|
Pointer to variable that will be set to the length of the
|
|
record on the master side
|
|
@param row_end
|
|
Pointer to variable that will hold the value of the
|
|
end position for the data in the row event
|
|
|
|
@retval 0 No error
|
|
|
|
@retval HA_ERR_GENERIC
|
|
A generic, internal, error caused the unpacking to fail.
|
|
@retval HA_ERR_CORRUPT_EVENT
|
|
Found error when trying to unpack fields.
|
|
*/
|
|
|
|
int unpack_row(const rpl_group_info *rgi, TABLE *table, uint const colcnt,
|
|
uchar const *const row_data, MY_BITMAP const *cols,
|
|
uchar const **const current_row_end,
|
|
ulong *const master_reclength, uchar const *const row_end)
|
|
{
|
|
int error;
|
|
DBUG_ENTER("unpack_row");
|
|
DBUG_ASSERT(row_data);
|
|
DBUG_ASSERT(table);
|
|
DBUG_ASSERT(rgi);
|
|
|
|
Unpack_record_state st(row_data, row_end, (bitmap_bits_set(cols) + 7) / 8);
|
|
|
|
if (bitmap_is_clear_all(cols))
|
|
{
|
|
/**
|
|
There was no data sent from the master, so there is
|
|
nothing to unpack.
|
|
*/
|
|
*current_row_end= st.pack_ptr;
|
|
*master_reclength= 0;
|
|
DBUG_RETURN(0);
|
|
}
|
|
|
|
Rpl_table_data rpl_data= *(RPL_TABLE_LIST*)table->pos_in_table_list;
|
|
const table_def *tabledef= rpl_data.tabledef;
|
|
const TABLE *conv_table= rpl_data.conv_table;
|
|
DBUG_PRINT("debug", ("Table data: tabldef: %p, conv_table: %p",
|
|
tabledef, conv_table));
|
|
uint i= 0;
|
|
|
|
st.next_null_byte();
|
|
if (!rpl_data.is_online_alter())
|
|
{
|
|
Field *result_field= NULL;
|
|
for (; i < colcnt && (result_field= table->field[i]); i++)
|
|
{
|
|
/*
|
|
If there is a conversion table, we pick up the field pointer to
|
|
the conversion table. If the conversion table or the field
|
|
pointer is NULL, no conversions are necessary.
|
|
*/
|
|
Field *conv_field= conv_table ? conv_table->field[i] : NULL;
|
|
Field *const f= conv_field ? conv_field : result_field;
|
|
|
|
DBUG_PRINT("debug", ("Conversion %srequired for field '%s' (#%u)",
|
|
conv_field ? "" : "not ",
|
|
result_field->field_name.str, i));
|
|
DBUG_ASSERT(f != NULL);
|
|
|
|
/*
|
|
No need to bother about columns that does not exist: they have
|
|
gotten default values when being emptied above.
|
|
*/
|
|
if (!bitmap_is_set(cols, i))
|
|
continue;
|
|
|
|
result_field->set_has_explicit_value();
|
|
|
|
bool unpack_result= unpack_field(tabledef, f, &st, i);
|
|
if (!unpack_result)
|
|
{
|
|
rgi->rli->report(ERROR_LEVEL, ER_SLAVE_CORRUPT_EVENT,
|
|
rgi->gtid_info(),
|
|
"Could not read field '%s' of table '%s.%s'",
|
|
f->field_name.str, table->s->db.str,
|
|
table->s->table_name.str);
|
|
DBUG_RETURN(HA_ERR_CORRUPT_EVENT);
|
|
}
|
|
|
|
/*
|
|
If conv_field is set, then we are doing a conversion. In this
|
|
case, we have unpacked the master data to the conversion
|
|
table, so we need to copy the value stored in the conversion
|
|
table into the final table and do the conversion at the same time.
|
|
|
|
If copy_fields is set, it means we are doing an online alter table,
|
|
and will use copy_fields set up in copy_data_between_tables
|
|
*/
|
|
if (conv_field)
|
|
convert_field(f, result_field, conv_field);
|
|
}
|
|
|
|
/*
|
|
Throw away master's extra fields
|
|
*/
|
|
uint max_cols= MY_MIN(tabledef->size(), cols->n_bits);
|
|
for (; i < max_cols; i++)
|
|
{
|
|
if (bitmap_is_set(cols, i))
|
|
{
|
|
if ((st.null_mask & 0xFF) == 0)
|
|
st.next_null_byte();
|
|
DBUG_ASSERT(st.null_mask & 0xFF); // One of the 8 LSB should be set
|
|
|
|
if (!((st.null_bits & st.null_mask) && tabledef->maybe_null(i))) {
|
|
uint32 len= tabledef->calc_field_size(i, (uchar *) st.pack_ptr);
|
|
DBUG_DUMP("field_data", st.pack_ptr, len);
|
|
st.pack_ptr+= len;
|
|
}
|
|
st.null_mask <<= 1;
|
|
}
|
|
}
|
|
|
|
if (master_reclength)
|
|
{
|
|
if (result_field)
|
|
*master_reclength = (ulong)(result_field->ptr - table->record[0]);
|
|
else
|
|
*master_reclength = table->s->reclength;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
/*
|
|
For Online Alter, iterate through old table fields to unpack,
|
|
then iterate through copy_field array to copy to the new table's record.
|
|
*/
|
|
|
|
DBUG_ASSERT(colcnt == conv_table->s->fields);
|
|
for (;i < colcnt; i++)
|
|
{
|
|
DBUG_ASSERT(bitmap_is_set(cols, i));
|
|
Field *f= conv_table->field[i];
|
|
#ifndef DBUG_OFF
|
|
bool result=
|
|
#endif
|
|
unpack_field(tabledef, f, &st, i);
|
|
DBUG_ASSERT(result);
|
|
}
|
|
|
|
for (const auto *copy=rpl_data.copy_fields;
|
|
copy != rpl_data.copy_fields_end; copy++)
|
|
{
|
|
copy->to_field->set_has_explicit_value();
|
|
copy->do_copy(copy);
|
|
}
|
|
if (master_reclength)
|
|
*master_reclength = conv_table->s->reclength;
|
|
} // if (rpl_data.is_online_alter())
|
|
|
|
/*
|
|
We should now have read all the null bytes, otherwise something is
|
|
really wrong.
|
|
*/
|
|
DBUG_ASSERT(st.null_ptr == row_data + st.master_null_byte_count);
|
|
DBUG_DUMP("row_data", row_data, st.pack_ptr - row_data);
|
|
|
|
*current_row_end = st.pack_ptr;
|
|
|
|
if (table->default_field && (rpl_data.is_online_alter() ||
|
|
LOG_EVENT_IS_WRITE_ROW(rgi->current_event->get_type_code())))
|
|
{
|
|
error= table->update_default_fields(table->in_use->lex->ignore);
|
|
if (unlikely(error))
|
|
DBUG_RETURN(error);
|
|
}
|
|
if (table->vfield)
|
|
{
|
|
error= table->update_virtual_fields(table->file, VCOL_UPDATE_FOR_WRITE);
|
|
if (unlikely(error))
|
|
DBUG_RETURN(error);
|
|
}
|
|
|
|
if (rpl_data.is_online_alter())
|
|
{
|
|
/* we only check constraints for ALTER TABLE */
|
|
DBUG_ASSERT(table->in_use->lex->ignore == FALSE);
|
|
error = table->verify_constraints(false);
|
|
DBUG_ASSERT(error != VIEW_CHECK_SKIP);
|
|
if (error)
|
|
DBUG_RETURN(HA_ERR_GENERIC);
|
|
}
|
|
|
|
DBUG_RETURN(0);
|
|
}
|
|
|
|
/**
|
|
Fills @c table->record[0] with default values.
|
|
|
|
First @c restore_record() is called to restore the default values for
|
|
record concerning the given table. Then, if @c check is true,
|
|
a check is performed to see if fields are have default value or can
|
|
be NULL. Otherwise error is reported.
|
|
|
|
@param table Table whose record[0] buffer is prepared.
|
|
@param skip Number of columns for which default/nullable check
|
|
should be skipped.
|
|
@param check Specifies if lack of default error needs checking.
|
|
|
|
@returns 0 on success or a handler level error code
|
|
*/
|
|
int prepare_record(TABLE *const table, const uint skip, const bool check)
|
|
{
|
|
DBUG_ENTER("prepare_record");
|
|
|
|
restore_record(table, s->default_values);
|
|
|
|
/*
|
|
This skip should be revisited in 6.0, because in 6.0 RBR one
|
|
can have holes in the row (as the grain of the writeset is
|
|
the column and not the entire row).
|
|
*/
|
|
if (skip >= table->s->fields || !check)
|
|
DBUG_RETURN(0);
|
|
|
|
/*
|
|
For fields the extra fields on the slave, we check if they have a default.
|
|
The check follows the same rules as the INSERT query without specifying an
|
|
explicit value for a field not having the explicit default
|
|
(@c check_that_all_fields_are_given_values()).
|
|
*/
|
|
for (Field **field_ptr= table->field+skip; *field_ptr; ++field_ptr)
|
|
{
|
|
Field *const f= *field_ptr;
|
|
if ((f->flags & NO_DEFAULT_VALUE_FLAG) &&
|
|
(f->real_type() != MYSQL_TYPE_ENUM))
|
|
{
|
|
THD *thd= f->table->in_use;
|
|
f->set_default();
|
|
push_warning_printf(thd,
|
|
Sql_condition::WARN_LEVEL_WARN,
|
|
ER_NO_DEFAULT_FOR_FIELD,
|
|
ER_THD(thd, ER_NO_DEFAULT_FOR_FIELD),
|
|
f->field_name.str);
|
|
}
|
|
}
|
|
|
|
DBUG_RETURN(0);
|
|
}
|
|
#endif // HAVE_REPLICATION
|