2001-05-23 22:47:08 +02:00
|
|
|
/* Copyright (C) 2001 MySQL AB
|
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU General Public License as published by
|
|
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
|
|
(at your option) any later version.
|
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
|
|
along with this program; if not, write to the Free Software
|
|
|
|
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */
|
|
|
|
|
|
|
|
/*
|
|
|
|
Function to handle quick removal of duplicates
|
|
|
|
This code is used when doing multi-table deletes to find the rows in
|
|
|
|
reference tables that needs to be deleted.
|
|
|
|
|
|
|
|
The basic idea is as follows:
|
|
|
|
|
|
|
|
Store first all strings in a binary tree, ignoring duplicates.
|
|
|
|
When the three uses more memory than 'max_heap_table_size',
|
|
|
|
write the tree (in sorted order) out to disk and start with a new tree.
|
|
|
|
When all data has been generated, merge the trees (removing any found
|
|
|
|
duplicates).
|
|
|
|
|
|
|
|
The unique entries will be returned in sort order, to ensure that we do the
|
|
|
|
deletes in disk order.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "mysql_priv.h"
|
|
|
|
#include "sql_sort.h"
|
|
|
|
|
These are actually two changesets. One for splitting LEX in two and
the other for multi-table delete
sql/filesort.cc:
Fixed some bugs for Unique class
sql/item.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/item_sum.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/mysql_priv.h:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_class.h:
Adding multi table delete
sql/sql_delete.cc:
Added multi-table delete
sql/sql_lex.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_lex.h:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_parse.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc, plus added multi-table delete
sql/sql_select.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_update.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_yacc.yy:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc, plus added multi-table delete
sql/uniques.cc:
Fixed some bugs in duplicate stripping
BitKeeper/etc/logging_ok:
Logging to logging@openlogging.org accepted
2001-06-03 16:07:26 +02:00
|
|
|
|
|
|
|
Unique::Unique(qsort_cmp2 comp_func, void * comp_func_fixed_arg,
|
|
|
|
uint size, ulong max_in_memory_size_arg)
|
2001-05-23 22:47:08 +02:00
|
|
|
:max_in_memory_size(max_in_memory_size_arg),elements(0)
|
|
|
|
{
|
|
|
|
my_b_clear(&file);
|
2001-07-02 21:52:22 +02:00
|
|
|
init_tree(&tree, max_in_memory_size / 16, 0, size, comp_func, 0, NULL, comp_func_fixed_arg);
|
2001-05-23 22:47:08 +02:00
|
|
|
/* If the following fail's the next add will also fail */
|
|
|
|
init_dynamic_array(&file_ptrs, sizeof(BUFFPEK), 16, 16);
|
|
|
|
max_elements= max_in_memory_size / ALIGN_SIZE(sizeof(TREE_ELEMENT)+size);
|
2001-06-15 04:03:15 +02:00
|
|
|
open_cached_file(&file, mysql_tmpdir,TEMP_PREFIX, DISK_BUFFER_SIZE,
|
|
|
|
MYF(MY_WME));
|
2001-05-23 22:47:08 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
Unique::~Unique()
|
|
|
|
{
|
|
|
|
close_cached_file(&file);
|
|
|
|
delete_tree(&tree);
|
|
|
|
delete_dynamic(&file_ptrs);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/* Write tree to disk; clear tree */
|
|
|
|
bool Unique::flush()
|
|
|
|
{
|
|
|
|
BUFFPEK file_ptr;
|
|
|
|
elements+= tree.elements_in_tree;
|
|
|
|
file_ptr.count=tree.elements_in_tree;
|
|
|
|
file_ptr.file_pos=my_b_tell(&file);
|
|
|
|
if (tree_walk(&tree, (tree_walk_action) unique_write_to_file,
|
|
|
|
(void*) this, left_root_right) ||
|
|
|
|
insert_dynamic(&file_ptrs, (gptr) &file_ptr))
|
|
|
|
return 1;
|
|
|
|
delete_tree(&tree);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
These are actually two changesets. One for splitting LEX in two and
the other for multi-table delete
sql/filesort.cc:
Fixed some bugs for Unique class
sql/item.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/item_sum.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/mysql_priv.h:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_class.h:
Adding multi table delete
sql/sql_delete.cc:
Added multi-table delete
sql/sql_lex.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_lex.h:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_parse.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc, plus added multi-table delete
sql/sql_select.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_update.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_yacc.yy:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc, plus added multi-table delete
sql/uniques.cc:
Fixed some bugs in duplicate stripping
BitKeeper/etc/logging_ok:
Logging to logging@openlogging.org accepted
2001-06-03 16:07:26 +02:00
|
|
|
int unique_write_to_file(gptr key, element_count count, Unique *unique)
|
2001-05-23 22:47:08 +02:00
|
|
|
{
|
2001-09-15 15:22:34 +02:00
|
|
|
return my_b_write(&unique->file, (byte*) key,
|
|
|
|
unique->tree.size_of_element) ? 1 : 0;
|
2001-05-23 22:47:08 +02:00
|
|
|
}
|
|
|
|
|
These are actually two changesets. One for splitting LEX in two and
the other for multi-table delete
sql/filesort.cc:
Fixed some bugs for Unique class
sql/item.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/item_sum.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/mysql_priv.h:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_class.h:
Adding multi table delete
sql/sql_delete.cc:
Added multi-table delete
sql/sql_lex.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_lex.h:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_parse.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc, plus added multi-table delete
sql/sql_select.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_update.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_yacc.yy:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc, plus added multi-table delete
sql/uniques.cc:
Fixed some bugs in duplicate stripping
BitKeeper/etc/logging_ok:
Logging to logging@openlogging.org accepted
2001-06-03 16:07:26 +02:00
|
|
|
int unique_write_to_ptrs(gptr key, element_count count, Unique *unique)
|
2001-05-23 22:47:08 +02:00
|
|
|
{
|
|
|
|
memcpy(unique->record_pointers, key, unique->tree.size_of_element);
|
|
|
|
unique->record_pointers+=unique->tree.size_of_element;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
Modify the TABLE element so that when one calls init_records()
|
|
|
|
the rows will be read in priority order.
|
|
|
|
*/
|
|
|
|
|
|
|
|
bool Unique::get(TABLE *table)
|
|
|
|
{
|
|
|
|
SORTPARAM sort_param;
|
|
|
|
table->found_records=elements+tree.elements_in_tree;
|
|
|
|
|
2001-06-15 04:03:15 +02:00
|
|
|
if (my_b_tell(&file) == 0)
|
2001-05-23 22:47:08 +02:00
|
|
|
{
|
|
|
|
/* Whole tree is in memory; Don't use disk if you don't need to */
|
|
|
|
if ((record_pointers=table->record_pointers= (byte*)
|
|
|
|
my_malloc(tree.size_of_element * tree.elements_in_tree, MYF(0))))
|
|
|
|
{
|
|
|
|
(void) tree_walk(&tree, (tree_walk_action) unique_write_to_ptrs,
|
|
|
|
this, left_root_right);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/* Not enough memory; Save the result to file */
|
|
|
|
if (flush())
|
|
|
|
return 1;
|
|
|
|
|
2001-06-15 04:03:15 +02:00
|
|
|
IO_CACHE *outfile=table->io_cache;
|
2001-05-23 22:47:08 +02:00
|
|
|
BUFFPEK *file_ptr= (BUFFPEK*) file_ptrs.buffer;
|
2001-06-07 13:10:58 +02:00
|
|
|
uint maxbuffer= file_ptrs.elements - 1;
|
2001-05-23 22:47:08 +02:00
|
|
|
uchar *sort_buffer;
|
|
|
|
my_off_t save_pos;
|
|
|
|
bool error=1;
|
|
|
|
|
|
|
|
/* Open cached file if it isn't open */
|
2001-06-15 04:03:15 +02:00
|
|
|
outfile=table->io_cache=(IO_CACHE*) my_malloc(sizeof(IO_CACHE),
|
|
|
|
MYF(MY_ZEROFILL));
|
2001-06-07 13:10:58 +02:00
|
|
|
|
|
|
|
if (!outfile || ! my_b_inited(outfile) &&
|
2001-05-23 22:47:08 +02:00
|
|
|
open_cached_file(outfile,mysql_tmpdir,TEMP_PREFIX,READ_RECORD_BUFFER,
|
|
|
|
MYF(MY_WME)))
|
|
|
|
return 1;
|
|
|
|
reinit_io_cache(outfile,WRITE_CACHE,0L,0,0);
|
These are actually two changesets. One for splitting LEX in two and
the other for multi-table delete
sql/filesort.cc:
Fixed some bugs for Unique class
sql/item.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/item_sum.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/mysql_priv.h:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_class.h:
Adding multi table delete
sql/sql_delete.cc:
Added multi-table delete
sql/sql_lex.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_lex.h:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_parse.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc, plus added multi-table delete
sql/sql_select.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_update.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_yacc.yy:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc, plus added multi-table delete
sql/uniques.cc:
Fixed some bugs in duplicate stripping
BitKeeper/etc/logging_ok:
Logging to logging@openlogging.org accepted
2001-06-03 16:07:26 +02:00
|
|
|
|
2001-07-10 14:53:08 +02:00
|
|
|
bzero((char*) &sort_param,sizeof(sort_param));
|
These are actually two changesets. One for splitting LEX in two and
the other for multi-table delete
sql/filesort.cc:
Fixed some bugs for Unique class
sql/item.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/item_sum.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/mysql_priv.h:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_class.h:
Adding multi table delete
sql/sql_delete.cc:
Added multi-table delete
sql/sql_lex.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_lex.h:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_parse.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc, plus added multi-table delete
sql/sql_select.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_update.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_yacc.yy:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc, plus added multi-table delete
sql/uniques.cc:
Fixed some bugs in duplicate stripping
BitKeeper/etc/logging_ok:
Logging to logging@openlogging.org accepted
2001-06-03 16:07:26 +02:00
|
|
|
sort_param.max_rows= elements;
|
2001-05-23 22:47:08 +02:00
|
|
|
sort_param.sort_form=table;
|
|
|
|
sort_param.sort_length=sort_param.ref_length=tree.size_of_element;
|
|
|
|
sort_param.keys= max_in_memory_size / sort_param.sort_length;
|
2001-07-10 14:53:08 +02:00
|
|
|
sort_param.not_killable=1;
|
2001-05-23 22:47:08 +02:00
|
|
|
|
These are actually two changesets. One for splitting LEX in two and
the other for multi-table delete
sql/filesort.cc:
Fixed some bugs for Unique class
sql/item.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/item_sum.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/mysql_priv.h:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_class.h:
Adding multi table delete
sql/sql_delete.cc:
Added multi-table delete
sql/sql_lex.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_lex.h:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_parse.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc, plus added multi-table delete
sql/sql_select.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_update.cc:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc
sql/sql_yacc.yy:
Changes caused by splitting lex into two parts, in order to
implement UNION's etc, plus added multi-table delete
sql/uniques.cc:
Fixed some bugs in duplicate stripping
BitKeeper/etc/logging_ok:
Logging to logging@openlogging.org accepted
2001-06-03 16:07:26 +02:00
|
|
|
if (!(sort_buffer=(uchar*) my_malloc((sort_param.keys+1) *
|
2001-06-15 04:03:15 +02:00
|
|
|
sort_param.sort_length,
|
|
|
|
MYF(0))))
|
2001-05-23 22:47:08 +02:00
|
|
|
return 1;
|
|
|
|
sort_param.unique_buff= sort_buffer+(sort_param.keys*
|
|
|
|
sort_param.sort_length);
|
|
|
|
|
|
|
|
/* Merge the buffers to one file, removing duplicates */
|
2001-06-15 04:03:15 +02:00
|
|
|
if (merge_many_buff(&sort_param,sort_buffer,file_ptr,&maxbuffer,&file))
|
2001-05-23 22:47:08 +02:00
|
|
|
goto err;
|
2001-06-15 04:03:15 +02:00
|
|
|
if (flush_io_cache(&file) ||
|
|
|
|
reinit_io_cache(&file,READ_CACHE,0L,0,0))
|
2001-05-23 22:47:08 +02:00
|
|
|
goto err;
|
2001-06-15 04:03:15 +02:00
|
|
|
if (merge_buffers(&sort_param, &file, outfile, sort_buffer, file_ptr,
|
2001-05-23 22:47:08 +02:00
|
|
|
file_ptr, file_ptr+maxbuffer,0))
|
|
|
|
goto err;
|
|
|
|
error=0;
|
|
|
|
err:
|
|
|
|
x_free((gptr) sort_buffer);
|
|
|
|
if (flush_io_cache(outfile))
|
|
|
|
error=1;
|
|
|
|
|
|
|
|
/* Setup io_cache for reading */
|
|
|
|
save_pos=outfile->pos_in_file;
|
|
|
|
if (reinit_io_cache(outfile,READ_CACHE,0L,0,0))
|
|
|
|
error=1;
|
|
|
|
outfile->end_of_file=save_pos;
|
|
|
|
return error;
|
|
|
|
}
|