2009-09-23 23:32:31 +02:00
|
|
|
#ifndef SQL_SORT_INCLUDED
|
|
|
|
#define SQL_SORT_INCLUDED
|
|
|
|
|
2011-06-30 17:46:53 +02:00
|
|
|
/* Copyright (c) 2000, 2010, Oracle and/or its affiliates. All rights reserved.
|
2020-01-21 11:56:54 +01:00
|
|
|
Copyright (c) 2020, MariaDB Corporation.
|
2001-05-23 22:47:08 +02:00
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU General Public License as published by
|
2006-12-23 20:17:15 +01:00
|
|
|
the Free Software Foundation; version 2 of the License.
|
2001-05-23 22:47:08 +02:00
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
|
|
along with this program; if not, write to the Free Software
|
2019-05-11 20:29:06 +02:00
|
|
|
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1335 USA */
|
2001-05-23 22:47:08 +02:00
|
|
|
|
2010-03-31 16:05:33 +02:00
|
|
|
#include "my_base.h" /* ha_rows */
|
2017-06-18 05:42:16 +02:00
|
|
|
#include <my_sys.h> /* qsort2_cmp */
|
2011-04-25 17:22:25 +02:00
|
|
|
#include "queues.h"
|
2010-03-31 16:05:33 +02:00
|
|
|
|
2016-01-12 14:03:29 +01:00
|
|
|
struct SORT_FIELD;
|
2010-03-31 16:05:33 +02:00
|
|
|
class Field;
|
|
|
|
struct TABLE;
|
|
|
|
|
2001-05-23 22:47:08 +02:00
|
|
|
/* Defines used by filesort and uniques */
|
|
|
|
|
|
|
|
#define MERGEBUFF 7
|
|
|
|
#define MERGEBUFF2 15
|
|
|
|
|
2003-04-24 13:33:33 +02:00
|
|
|
/*
|
|
|
|
The structure SORT_ADDON_FIELD describes a fixed layout
|
|
|
|
for field values appended to sorted values in records to be sorted
|
|
|
|
in the sort buffer.
|
|
|
|
Only fixed layout is supported now.
|
|
|
|
Null bit maps for the appended values is placed before the values
|
|
|
|
themselves. Offsets are from the last sorted field, that is from the
|
|
|
|
record referefence, which is still last component of sorted records.
|
|
|
|
It is preserved for backward compatiblility.
|
|
|
|
The structure is used tp store values of the additional fields
|
|
|
|
in the sort buffer. It is used also when these values are read
|
|
|
|
from a temporary file/buffer. As the reading procedures are beyond the
|
|
|
|
scope of the 'filesort' code the values have to be retrieved via
|
|
|
|
the callback function 'unpack_addon_fields'.
|
|
|
|
*/
|
|
|
|
|
2006-04-11 15:45:10 +02:00
|
|
|
typedef struct st_sort_addon_field
|
|
|
|
{
|
|
|
|
/* Sort addon packed field */
|
2003-04-24 13:33:33 +02:00
|
|
|
Field *field; /* Original field */
|
|
|
|
uint offset; /* Offset from the last sorted field */
|
|
|
|
uint null_offset; /* Offset to to null bit from the last sorted field */
|
|
|
|
uint length; /* Length in the sort buffer */
|
|
|
|
uint8 null_bit; /* Null bit mask for the field */
|
|
|
|
} SORT_ADDON_FIELD;
|
|
|
|
|
2007-07-02 00:33:28 +02:00
|
|
|
struct BUFFPEK_COMPARE_CONTEXT
|
|
|
|
{
|
|
|
|
qsort_cmp2 key_compare;
|
|
|
|
void *key_compare_arg;
|
|
|
|
};
|
|
|
|
|
2012-09-01 23:21:59 +02:00
|
|
|
|
2020-01-20 21:07:47 +01:00
|
|
|
/**
|
|
|
|
Descriptor for a merge chunk to be sort-merged.
|
|
|
|
A merge chunk is a sequence of pre-sorted records, written to a
|
|
|
|
temporary file. A Merge_chunk instance describes where this chunk is stored
|
|
|
|
in the file, and where it is located when it is in memory.
|
|
|
|
|
|
|
|
It is a POD because
|
|
|
|
- we read/write them from/to files.
|
|
|
|
|
|
|
|
We have accessors (getters/setters) for all struct members.
|
|
|
|
*/
|
|
|
|
|
|
|
|
struct Merge_chunk {
|
|
|
|
public:
|
|
|
|
my_off_t file_position() const { return m_file_position; }
|
|
|
|
void set_file_position(my_off_t val) { m_file_position= val; }
|
|
|
|
void advance_file_position(my_off_t val) { m_file_position+= val; }
|
|
|
|
|
|
|
|
uchar *buffer_start() { return m_buffer_start; }
|
|
|
|
const uchar *buffer_end() const { return m_buffer_end; }
|
|
|
|
|
|
|
|
void set_buffer(uchar *start, uchar *end)
|
|
|
|
{
|
|
|
|
m_buffer_start= start;
|
|
|
|
m_buffer_end= end;
|
|
|
|
}
|
|
|
|
void set_buffer_start(uchar *start)
|
|
|
|
{
|
|
|
|
m_buffer_start= start;
|
|
|
|
}
|
|
|
|
void set_buffer_end(uchar *end)
|
|
|
|
{
|
|
|
|
DBUG_ASSERT(m_buffer_end == NULL || end <= m_buffer_end);
|
|
|
|
m_buffer_end= end;
|
|
|
|
}
|
|
|
|
|
|
|
|
void init_current_key() { m_current_key= m_buffer_start; }
|
|
|
|
uchar *current_key() { return m_current_key; }
|
|
|
|
void advance_current_key(uint val) { m_current_key+= val; }
|
|
|
|
|
|
|
|
void decrement_rowcount(ha_rows val) { m_rowcount-= val; }
|
|
|
|
void set_rowcount(ha_rows val) { m_rowcount= val; }
|
|
|
|
ha_rows rowcount() const { return m_rowcount; }
|
|
|
|
|
|
|
|
ha_rows mem_count() const { return m_mem_count; }
|
|
|
|
void set_mem_count(ha_rows val) { m_mem_count= val; }
|
|
|
|
ha_rows decrement_mem_count() { return --m_mem_count; }
|
|
|
|
|
|
|
|
ha_rows max_keys() const { return m_max_keys; }
|
|
|
|
void set_max_keys(ha_rows val) { m_max_keys= val; }
|
|
|
|
|
|
|
|
size_t buffer_size() const { return m_buffer_end - m_buffer_start; }
|
|
|
|
|
|
|
|
/**
|
|
|
|
Tries to merge *this with *mc, returns true if successful.
|
|
|
|
The assumption is that *this is no longer in use,
|
|
|
|
and the space it has been allocated can be handed over to a
|
|
|
|
buffer which is adjacent to it.
|
|
|
|
*/
|
|
|
|
bool merge_freed_buff(Merge_chunk *mc) const
|
|
|
|
{
|
|
|
|
if (mc->m_buffer_end == m_buffer_start)
|
|
|
|
{
|
|
|
|
mc->m_buffer_end= m_buffer_end;
|
|
|
|
mc->m_max_keys+= m_max_keys;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
else if (mc->m_buffer_start == m_buffer_end)
|
|
|
|
{
|
|
|
|
mc->m_buffer_start= m_buffer_start;
|
|
|
|
mc->m_max_keys+= m_max_keys;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2020-01-21 11:56:54 +01:00
|
|
|
/// The current key for this chunk
|
|
|
|
uchar *m_current_key= nullptr;
|
|
|
|
/// Current position in the file to be sorted.
|
|
|
|
my_off_t m_file_position= 0;
|
|
|
|
/// Start of main-memory buffer for this chunk.
|
|
|
|
uchar *m_buffer_start= nullptr;
|
|
|
|
/// End of main-memory buffer for this chunk.
|
|
|
|
uchar *m_buffer_end= nullptr;
|
|
|
|
/// Number of unread rows in this chunk.
|
|
|
|
ha_rows m_rowcount= 0;
|
|
|
|
/// Number of rows in the main-memory buffer.
|
|
|
|
ha_rows m_mem_count= 0;
|
|
|
|
/// If we have fixed-size rows: max number of rows in buffer.
|
|
|
|
ha_rows m_max_keys= 0;
|
2020-01-20 21:07:47 +01:00
|
|
|
};
|
|
|
|
|
|
|
|
typedef Bounds_checked_array<SORT_ADDON_FIELD> Addon_fields_array;
|
|
|
|
|
|
|
|
/**
|
|
|
|
This class wraps information about usage of addon fields.
|
|
|
|
An Addon_fields object is used both during packing of data in the filesort
|
|
|
|
buffer, and later during unpacking in 'Filesort_info::unpack_addon_fields'.
|
|
|
|
|
|
|
|
@see documentation for the Sort_addon_field struct.
|
|
|
|
@see documentation for get_addon_fields()
|
|
|
|
*/
|
|
|
|
class Addon_fields {
|
|
|
|
public:
|
|
|
|
Addon_fields(Addon_fields_array arr)
|
|
|
|
: m_field_descriptors(arr),
|
|
|
|
m_addon_buf(),
|
|
|
|
m_addon_buf_length(),
|
|
|
|
m_using_packed_addons(false)
|
|
|
|
{
|
|
|
|
DBUG_ASSERT(!arr.is_null());
|
|
|
|
}
|
|
|
|
|
|
|
|
SORT_ADDON_FIELD *begin() { return m_field_descriptors.begin(); }
|
|
|
|
SORT_ADDON_FIELD *end() { return m_field_descriptors.end(); }
|
|
|
|
|
|
|
|
/// rr_unpack_from_tempfile needs an extra buffer when unpacking.
|
|
|
|
uchar *allocate_addon_buf(uint sz)
|
|
|
|
{
|
|
|
|
m_addon_buf= (uchar *)my_malloc(sz, MYF(MY_WME | MY_THREAD_SPECIFIC));
|
|
|
|
if (m_addon_buf)
|
|
|
|
m_addon_buf_length= sz;
|
|
|
|
return m_addon_buf;
|
|
|
|
}
|
|
|
|
|
|
|
|
void free_addon_buff()
|
|
|
|
{
|
|
|
|
my_free(m_addon_buf);
|
|
|
|
m_addon_buf= NULL;
|
|
|
|
m_addon_buf_length= 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
uchar *get_addon_buf() { return m_addon_buf; }
|
|
|
|
uint get_addon_buf_length() const { return m_addon_buf_length; }
|
|
|
|
|
|
|
|
void set_using_packed_addons(bool val)
|
|
|
|
{
|
|
|
|
m_using_packed_addons= val;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool using_packed_addons() const
|
|
|
|
{
|
|
|
|
return m_using_packed_addons;
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool can_pack_addon_fields(uint record_length)
|
|
|
|
{
|
|
|
|
return (record_length <= (0xFFFF));
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
@returns Total number of bytes used for packed addon fields.
|
|
|
|
the size of the length field + size of null bits + sum of field sizes.
|
|
|
|
*/
|
|
|
|
static uint read_addon_length(uchar *p)
|
|
|
|
{
|
|
|
|
return size_of_length_field + uint2korr(p);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
Stores the number of bytes used for packed addon fields.
|
|
|
|
*/
|
|
|
|
static void store_addon_length(uchar *p, uint sz)
|
|
|
|
{
|
|
|
|
// We actually store the length of everything *after* the length field.
|
|
|
|
int2store(p, sz - size_of_length_field);
|
|
|
|
}
|
|
|
|
|
|
|
|
static const uint size_of_length_field= 2;
|
|
|
|
|
|
|
|
private:
|
|
|
|
Addon_fields_array m_field_descriptors;
|
|
|
|
|
|
|
|
uchar *m_addon_buf; ///< Buffer for unpacking addon fields.
|
|
|
|
uint m_addon_buf_length; ///< Length of the buffer.
|
|
|
|
bool m_using_packed_addons; ///< Are we packing the addon fields?
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
There are two record formats for sorting:
|
|
|
|
|<key a><key b>...|<rowid>|
|
|
|
|
/ sort_length / ref_l /
|
|
|
|
|
|
|
|
or with "addon fields"
|
|
|
|
|<key a><key b>...|<null bits>|<field a><field b>...|
|
|
|
|
/ sort_length / addon_length /
|
|
|
|
|
|
|
|
The packed format for "addon fields"
|
|
|
|
|<key a><key b>...|<length>|<null bits>|<field a><field b>...|
|
|
|
|
/ sort_length / addon_length /
|
|
|
|
|
|
|
|
<key> Fields are fixed-size, specially encoded with
|
|
|
|
Field::make_sort_key() so we can do byte-by-byte compare.
|
|
|
|
<length> Contains the *actual* packed length (after packing) of
|
|
|
|
everything after the sort keys.
|
|
|
|
The size of the length field is 2 bytes,
|
|
|
|
which should cover most use cases: addon data <= 65535 bytes.
|
|
|
|
This is the same as max record size in MySQL.
|
|
|
|
<null bits> One bit for each nullable field, indicating whether the field
|
|
|
|
is null or not. May have size zero if no fields are nullable.
|
|
|
|
<field xx> Are stored with field->pack(), and retrieved with
|
|
|
|
field->unpack(). Addon fields within a record are stored
|
|
|
|
consecutively, with no "holes" or padding. They will have zero
|
|
|
|
size for NULL values.
|
|
|
|
|
|
|
|
*/
|
|
|
|
|
2012-09-01 23:21:59 +02:00
|
|
|
class Sort_param {
|
|
|
|
public:
|
|
|
|
uint rec_length; // Length of sorted records.
|
|
|
|
uint sort_length; // Length of sorted columns.
|
|
|
|
uint ref_length; // Length of record ref.
|
2020-01-20 21:07:47 +01:00
|
|
|
uint addon_length; // Length of addon_fields
|
2012-09-01 23:21:59 +02:00
|
|
|
uint res_length; // Length of records in final sorted file/buffer.
|
|
|
|
uint max_keys_per_buffer; // Max keys / buffer.
|
2011-10-19 21:45:18 +02:00
|
|
|
uint min_dupl_count;
|
2012-09-01 23:21:59 +02:00
|
|
|
ha_rows max_rows; // Select limit, or HA_POS_ERROR if unlimited.
|
|
|
|
ha_rows examined_rows; // Number of examined rows.
|
|
|
|
TABLE *sort_form; // For quicker make_sortkey.
|
2020-01-20 21:07:47 +01:00
|
|
|
/**
|
|
|
|
ORDER BY list with some precalculated info for filesort.
|
|
|
|
Array is created and owned by a Filesort instance.
|
|
|
|
*/
|
|
|
|
Bounds_checked_array<SORT_FIELD> local_sortorder;
|
|
|
|
Addon_fields *addon_fields; // Descriptors for companion fields.
|
|
|
|
bool using_pq;
|
2016-03-22 20:51:59 +01:00
|
|
|
|
2001-05-23 22:47:08 +02:00
|
|
|
uchar *unique_buff;
|
2001-07-10 14:53:08 +02:00
|
|
|
bool not_killable;
|
2001-05-23 22:47:08 +02:00
|
|
|
char* tmp_buffer;
|
2012-09-01 23:21:59 +02:00
|
|
|
// The fields below are used only by Unique class.
|
2007-07-02 00:33:28 +02:00
|
|
|
qsort2_cmp compare;
|
|
|
|
BUFFPEK_COMPARE_CONTEXT cmp_context;
|
2001-05-23 22:47:08 +02:00
|
|
|
|
2012-09-01 23:21:59 +02:00
|
|
|
Sort_param()
|
|
|
|
{
|
2020-01-22 09:06:02 +01:00
|
|
|
memset(reinterpret_cast<void*>(this), 0, sizeof(*this));
|
2012-09-01 23:21:59 +02:00
|
|
|
}
|
|
|
|
void init_for_filesort(uint sortlen, TABLE *table,
|
|
|
|
ha_rows maxrows, bool sort_positions);
|
2020-01-20 21:07:47 +01:00
|
|
|
/// Enables the packing of addons if possible.
|
|
|
|
void try_to_pack_addons(ulong max_length_for_sort_data);
|
|
|
|
|
|
|
|
/// Are we packing the "addon fields"?
|
|
|
|
bool using_packed_addons() const
|
|
|
|
{
|
|
|
|
DBUG_ASSERT(m_using_packed_addons ==
|
|
|
|
(addon_fields != NULL &&
|
|
|
|
addon_fields->using_packed_addons()));
|
|
|
|
return m_using_packed_addons;
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Are we using "addon fields"?
|
|
|
|
bool using_addon_fields() const
|
|
|
|
{
|
|
|
|
return addon_fields != NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
Getter for record length and result length.
|
|
|
|
@param record_start Pointer to record.
|
|
|
|
@param [out] recl Store record length here.
|
|
|
|
@param [out] resl Store result length here.
|
|
|
|
*/
|
|
|
|
void get_rec_and_res_len(uchar *record_start, uint *recl, uint *resl)
|
|
|
|
{
|
|
|
|
if (!using_packed_addons())
|
|
|
|
{
|
|
|
|
*recl= rec_length;
|
|
|
|
*resl= res_length;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
uchar *plen= record_start + sort_length;
|
|
|
|
*resl= Addon_fields::read_addon_length(plen);
|
|
|
|
DBUG_ASSERT(*resl <= res_length);
|
|
|
|
const uchar *record_end= plen + *resl;
|
|
|
|
*recl= static_cast<uint>(record_end - record_start);
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
uint m_packable_length;
|
|
|
|
bool m_using_packed_addons; ///< caches the value of using_packed_addons()
|
2012-09-01 23:21:59 +02:00
|
|
|
};
|
2001-05-23 22:47:08 +02:00
|
|
|
|
2020-01-20 21:07:47 +01:00
|
|
|
typedef Bounds_checked_array<uchar> Sort_buffer;
|
2012-09-01 23:21:59 +02:00
|
|
|
|
2020-01-20 21:07:47 +01:00
|
|
|
int merge_many_buff(Sort_param *param, Sort_buffer sort_buffer,
|
|
|
|
Merge_chunk *buffpek, uint *maxbuffer, IO_CACHE *t_file);
|
|
|
|
ulong read_to_buffer(IO_CACHE *fromfile, Merge_chunk *buffpek,
|
|
|
|
Sort_param *param);
|
2018-04-12 08:28:29 +02:00
|
|
|
bool merge_buffers(Sort_param *param,IO_CACHE *from_file,
|
2020-01-20 21:07:47 +01:00
|
|
|
IO_CACHE *to_file, Sort_buffer sort_buffer,
|
|
|
|
Merge_chunk *lastbuff, Merge_chunk *Fb,
|
|
|
|
Merge_chunk *Tb, int flag);
|
|
|
|
int merge_index(Sort_param *param, Sort_buffer sort_buffer,
|
|
|
|
Merge_chunk *buffpek, uint maxbuffer,
|
|
|
|
IO_CACHE *tempfile, IO_CACHE *outfile);
|
|
|
|
void reuse_freed_buff(QUEUE *queue, Merge_chunk *reuse, uint key_length);
|
2009-09-23 23:32:31 +02:00
|
|
|
|
|
|
|
#endif /* SQL_SORT_INCLUDED */
|