mirror of
https://github.com/MariaDB/server.git
synced 2025-01-29 02:05:57 +01:00
31b9e6e03f
Fix bug in isamlog Add argument types to function declarations. Docs/manual.texi: Updated credits client/mysql.cc: Fixes for OS2 client/mysqladmin.c: Fixes for OS2 client/mysqldump.c: Fixes for OS2 client/mysqlimport.c: Fixes for OS2 client/mysqltest.c: Fixes for OS2 dbug/dbug.c: Fixes for OS2. Use new C calling convention. dbug/factorial.c: Fixes for OS2. Use new C calling convention. include/errmsg.h: Fix for OS2 include/global.h: Fixes for OS2. include/my_pthread.h: Fixes for OS2. include/my_sys.h: Fixes for OS2. include/mysql_com.h: Move defines to global.h include/thr_alarm.h: Fixes for OS2. isam/isamchk.c: Fixes for OS2. Add arguments to function declarations. isam/isamlog.c: Fixes for OS2. Fix bug in logfile handling. isam/test1.c: Add arguments to function decl isam/test2.c: Add arguments to function declarations. isam/test_all.res: Update result libmysql/get_password.c: Fixes for OS2. libmysql/libmysql.c: Fixes for OS2. libmysql/net.c: Fixes for OS2. libmysql/violite.c: Add arguments to function declarations. merge/_locking.c: Add argument types to function declarations. merge/close.c: Add argument types to function declarations. merge/create.c: Add argument types to function declarations. merge/extra.c: Add argument types to function declarations. merge/open.c: Add argument types to function declarations. merge/panic.c: Add argument types to function declarations. merge/rsame.c: Add argument types to function declarations. merge/update.c: Add argument types to function declarations. myisam/ft_eval.c: Portability fix myisam/ft_search.c: Portability fix myisam/ft_test1.c: Portability fix myisam/ftdefs.h: Portability fix myisam/mi_check.c: Portability fix myisam/mi_test1.c: Portability fix myisam/mi_test2.c: Portability fix myisam/mi_test_all.sh: Update to test for MACH variable myisam/myisamlog.c: Cleanup myisam/myisampack.c: Don't use variable 'new' myisam/sort.c: Portability fix myisammrg/myrg_delete.c: Add argument types to function declarations. 
myisammrg/myrg_locking.c: Add argument types to function declarations. myisammrg/myrg_open.c: Add argument types to function declarations. myisammrg/myrg_panic.c: Add argument types to function declarations. mysql-test/t/backup.test: Fix for OS2 mysql-test/t/show_check.test: Fix for OS2 mysys/charset.c: Dont use variable 'new' mysys/default.c: Fixes for OS2. mysys/getopt.c: Fixes for OS2. mysys/getopt1.c: Fixes for OS2. mysys/list.c: Don't use variable 'new' mysys/mf_dirname.c: Fixes for OS2. mysys/mf_format.c: Fixes for OS2. mysys/mf_path.c: Fixes for OS2. mysys/mf_qsort.c: Portability fix mysys/mf_tempfile.c: Fixes for OS2. mysys/my_clock.c: Fixes for OS2. mysys/my_copy.c: Fixes for OS2. mysys/my_create.c: Fixes for OS2. mysys/my_getwd.c: Fixes for OS2. mysys/my_init.c: Fixes for OS2. mysys/my_lib.c: Fixes for OS2. mysys/my_lock.c: Fixes for OS2. mysys/my_malloc.c: Portability fix mysys/my_mkdir.c: Fixes for OS2. mysys/my_open.c: Fixes for OS2. mysys/my_pthread.c: Fixes for OS2. mysys/my_realloc.c: Fixes for OS2. mysys/my_redel.c: Fixes for OS2. mysys/my_static.c: Fixes for OS2. mysys/my_tempnam.c: Fixes for OS2. mysys/my_thr_init.c: Fixes for OS2. mysys/my_write.c: Fixes for OS2. mysys/test_charset.c: Fixes for OS2. mysys/thr_alarm.c: Fixes for OS2. mysys/tree.c: Fixes for OS2. sql/field.cc: Fixes for OS2. sql/field.h: Fixes for OS2. sql/gen_lex_hash.cc: Fixes for OS2. sql/hostname.cc: Fixes for OS2. sql/item_func.cc: Fixes for OS2. sql/item_strfunc.cc: Fixes for OS2. sql/log_event.cc: Fixes for OS2. sql/md5.c: Fixes for OS2. sql/mini_client.cc: Fixes for OS2. sql/mysql_priv.h: Fixes for OS2. sql/mysqld.cc: Fixes for OS2. sql/net_serv.cc: Fixes for OS2. sql/slave.cc: Fixes for OS2. sql/sql_base.cc: Fixes for OS2. sql/sql_db.cc: Portability fix sql/sql_insert.cc: Fixes for OS2. sql/sql_load.cc: Fixes for OS2. sql/sql_parse.cc: Fixes for OS2. sql/sql_table.cc: Fixes for OS2. sql/sql_udf.cc: Fixes for OS2. sql/violite.c: Fixes for OS2. 
strings/ctype-big5.c: Fixes for OS2. strings/ctype-gbk.c: Fixes for OS2. strings/ctype-sjis.c: Fixes for OS2. strings/ctype-tis620.c: Fixes for OS2. strings/ctype.c: Fixes for OS2. strings/strnlen.c: Fixes for OS2.
99 lines
3.7 KiB
C
99 lines
3.7 KiB
C
/* Copyright (C) 2000 MySQL AB & MySQL Finland AB & TCX DataKonsult AB

   This program is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 2 of the License, or
   (at your option) any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program; if not, write to the Free Software
   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */

/* Written by Sergei A. Golubchik, who has a shared copyright to this code */

/* Some definitions for full-text indices */

#include "fulltext.h"
|
|
#include <m_ctype.h>
|
|
#include <my_tree.h>
|
|
|
|
/*
  Build-time switches for the full-text code.

  NOTE(review): how each switch is consumed is not visible in this header;
  the per-macro notes below are inferred from the names only and must be
  confirmed against the code that tests them.
*/

/* Presumably the shortest word length that is considered -- confirm. */
#define MIN_WORD_LEN 4

/*
  Presumably select how a '-' inside a word is treated -- confirm.
  Both switches are defined at the same time here.
*/
#define HYPHEN_IS_DELIM
#define HYPHEN_IS_CONCAT /* not used for now */

/* Presumably requests a compiled-in stopword list -- confirm. */
#define COMPILE_STOPWORDS_IN

/* Most of the formulae were shamelessly stolen from SMART distribution
   ftp://ftp.cs.cornell.edu/pub/smart/smart.11.0.tar.Z
   NORM_PIVOT was taken from the article
   A.Singhal, C.Buckley, M.Mitra, "Pivoted Document Length Normalization",
   ACM SIGIR'96, 21-29, 1996
 */

/*
  Selection of the formula used at each weighting stage.

  Each name below is a plain alias for one of the LWS_*, PRENORM_*, NORM_*
  or GWS_* formula macros defined in this header.  Because macro expansion
  is lazy, the aliases may be defined before the formulas themselves; the
  chosen formula only has to be defined at the point where the alias is used.
*/
#define LWS_FOR_QUERY   LWS_TF
#define LWS_IN_USE      LWS_LOG
#define PRENORM_IN_USE  PRENORM_AVG
#define NORM_IN_USE     NORM_PIVOT
#define GWS_IN_USE      GWS_PROB
/*==============================================================*/
/*
  LWS_* formulas.

  Every macro expands to an expression over a variable named `count`,
  which must be in scope at the point of use.  `count` is evaluated more
  than once by LWS_SQUARE and LWS_LOG, so it must be free of side effects.
  NOTE(review): `count` is presumably a per-document word occurrence
  count -- confirm at the call sites.
*/
#define LWS_TF      (count)                             /* the count itself */
#define LWS_BINARY  (count>0)                           /* 1 if count is positive, else 0 */
#define LWS_SQUARE  (count*count)                       /* count squared */
#define LWS_LOG     (count?(log( (double) count)+1):0)  /* 0 when count is 0, else ln(count)+1 */
/*--------------------------------------------------------------*/
/*
  PRENORM_* formulas.

  Every macro expands to an expression over `p->weight` and the members
  `max`, `sum` and `uniq` of an object named `docstat`; both `p` and
  `docstat` must be in scope at the point of use.
  NOTE(review): the types of these operands are not visible here; the
  divisions are floating-point only if at least one operand is -- confirm.
*/
#define PRENORM_NONE    (p->weight)                        /* weight unchanged */
#define PRENORM_MAX     (p->weight/docstat.max)            /* weight relative to docstat.max */
#define PRENORM_AUG     (0.4+0.6*p->weight/docstat.max)    /* 0.4 plus 0.6 times the PRENORM_MAX ratio */
#define PRENORM_AVG     (p->weight/docstat.sum*docstat.uniq) /* weight divided by (sum/uniq) */
#define PRENORM_AVGLOG  ((1+log(p->weight))/(1+log(docstat.sum/docstat.uniq)))
/*--------------------------------------------------------------*/
/*
  NORM_* formulas.

  The macros read members `nsum`, `nsum2` and `uniq` of an object named
  `docstat`, which must be in scope at the point of use.
*/
#define NORM_NONE (1)                       /* constant 1 */
#define NORM_SUM  (docstat.nsum)
#define NORM_COS  (sqrt(docstat.nsum2))     /* square root of docstat.nsum2 */

/*
  The section below is entirely commented out, so it contributes nothing
  even when EVAL_RUN is defined.  It records a NORM_PIVOT variant computed
  from `collstat` and `info->state->records` instead of the fixed PIVOT_VAL
  used further down.
*/
#ifdef EVAL_RUN
/*
extern ulong collstat;
#define PIVOT_STAT (docstat.uniq)
#define PIVOT_SLOPE (0.69)
#define PIVOT_PIVOT ((double)collstat/(info->state->records+1))
#define NORM_PIVOT ((1-PIVOT_SLOPE)*PIVOT_PIVOT+PIVOT_SLOPE*docstat.uniq)
*/
#endif /* EVAL_RUN */

/* Active definition: NORM_PIVOT is 1 plus PIVOT_VAL times docstat.uniq. */
#define PIVOT_VAL  (0.0115)
#define NORM_PIVOT (1+PIVOT_VAL*docstat.uniq)
/*---------------------------------------------------------------*/
/*
  GWS_* formulas.

  The macros are expressions over names that must be in scope at the point
  of use: `doc_cnt`, `sum`, `sum2`, `suml`, and `aio->info->state->records`.
  NOTE(review): the types of these names are not visible in this header.
  Where a macro has no (double) cast, the division is performed in whatever
  type the operands have (integer division if both are integers) -- confirm.
*/
#define GWS_NORM    (1/sqrt(sum2))
#define GWS_GFIDF   (sum/doc_cnt)
/* Mysterious, but w/o (double) GWS_IDF performs better :-o */
#define GWS_IDF     log(aio->info->state->records/doc_cnt)
/* Same as GWS_IDF, but the ratio is computed in double. */
#define GWS_IDF1    log((double)aio->info->state->records/doc_cnt)
/*
  log((records - doc_cnt) / doc_cnt).  The subtraction happens before the
  (double) cast; the argument of log() is 0 when doc_cnt equals records.
*/
#define GWS_PROB    log(((double)(aio->info->state->records-doc_cnt))/doc_cnt)
#define GWS_FREQ    (1.0/doc_cnt)
/* GWS_IDF1 raised to the 2nd and 3rd power respectively. */
#define GWS_SQUARED pow(log((double)aio->info->state->records/doc_cnt),2)
#define GWS_CUBIC   pow(log((double)aio->info->state->records/doc_cnt),3)
#define GWS_ENTROPY (1-(suml/sum-log(sum))/log(aio->info->state->records))
/*=================================================================*/

typedef struct st_ft_word {
|
|
byte * pos;
|
|
uint len;
|
|
double weight;
|
|
#ifdef EVAL_RUN
|
|
byte cnt;
|
|
#endif /* EVAL_RUN */
|
|
} FT_WORD;
|
|
|
|
int is_stopword(char *word, uint len);
|
|
|
|
uint _ft_make_key(MI_INFO *, uint , byte *, FT_WORD *, my_off_t);
|
|
|
|
TREE * ft_parse(TREE *, byte *, int);
|
|
FT_WORD * ft_linearize(MI_INFO *, uint, byte *, TREE *);
|