mirror of
https://github.com/MariaDB/server.git
synced 2025-01-25 08:14:18 +01:00
fd247cc21f
This patch also fixes: MDEV-33050 Built-in schemas like oracle_schema are accent insensitive MDEV-33084 LASTVAL(t1) and LASTVAL(T1) do not work well with lower-case-table-names=0 MDEV-33085 Tables T1 and t1 do not work well with ENGINE=CSV and lower-case-table-names=0 MDEV-33086 SHOW OPEN TABLES IN DB1 -- is case insensitive with lower-case-table-names=0 MDEV-33088 Cannot create triggers in the database `MYSQL` MDEV-33103 LOCK TABLE t1 AS t2 -- alias is not case sensitive with lower-case-table-names=0 MDEV-33109 DROP DATABASE MYSQL -- does not drop SP with lower-case-table-names=0 MDEV-33110 HANDLER commands are case insensitive with lower-case-table-names=0 MDEV-33119 User is case insensitive in INFORMATION_SCHEMA.VIEWS MDEV-33120 System log table names are case insensitive with lower-case-table-names=0 - Removing the virtual function strcasecmp() from MY_COLLATION_HANDLER - Adding a wrapper function CHARSET_INFO::streq(), to compare two strings for equality. For now it calls strnncoll() internally. In the future it will turn into a virtual function. - Adding new accent sensitive case insensitive collations: - utf8mb4_general1400_as_ci - utf8mb3_general1400_as_ci They implement accent sensitive case insensitive comparison. The weight of a character is equal to the code point of its upper case variant. These collations use Unicode-14.0.0 casefolding data. The result of my_charset_utf8mb3_general1400_as_ci.strcoll() is very close to the former my_charset_utf8mb3_general_ci.strcasecmp(). There is only a difference in a couple dozen rare characters, because of: - the switch from "tolower" to "toupper" comparison, to make utf8mb3_general1400_as_ci closer to utf8mb3_general_ci - the switch from Unicode-3.0.0 to Unicode-14.0.0 This difference should be tolerable. See the list of affected characters in the MDEV description. Note, utf8mb4_general1400_as_ci correctly handles non-BMP characters! Unlike utf8mb4_general_ci, it does not treat all non-BMP characters as equal.
- Adding classes representing names of the file based database objects: Lex_ident_db Lex_ident_table Lex_ident_trigger Their comparison collation depends on the underlying file system case sensitivity and on --lower-case-table-names and can be either my_charset_bin or my_charset_utf8mb3_general1400_as_ci. - Adding classes representing names of other database objects, whose names have case insensitive comparison style, using my_charset_utf8mb3_general1400_as_ci: Lex_ident_column Lex_ident_sys_var Lex_ident_user_var Lex_ident_sp_var Lex_ident_ps Lex_ident_i_s_table Lex_ident_window Lex_ident_func Lex_ident_partition Lex_ident_with_element Lex_ident_rpl_filter Lex_ident_master_info Lex_ident_host Lex_ident_locale Lex_ident_plugin Lex_ident_engine Lex_ident_server Lex_ident_savepoint Lex_ident_charset engine_option_value::Name - All the mentioned Lex_ident_xxx classes implement a method streq(): if (ident1.streq(ident2)) do_equal(); This method works as a wrapper for CHARSET_INFO::streq(). - Changing a lot of "LEX_CSTRING name" to "Lex_ident_xxx name" in class members and in function/method parameters. - Replacing all calls like system_charset_info->coll->strcasecmp(ident1, ident2) to ident1.streq(ident2) - Taking advantage of the c++11 user defined literal operator for LEX_CSTRING (see m_strings.h) and Lex_ident_xxx (see lex_ident.h) data types. Use example: const Lex_ident_column primary_key_name= "PRIMARY"_Lex_ident_column; is now a shorter version of: const Lex_ident_column primary_key_name= Lex_ident_column({STRING_WITH_LEN("PRIMARY")});
110 lines
3 KiB
C
110 lines
3 KiB
C
/* Copyright (c) 2000-2005, 2007 MySQL AB, 2009 Sun Microsystems, Inc.
|
|
Use is subject to license terms.
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; version 2 of the License.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; if not, write to the Free Software
|
|
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1335 USA */
|
|
|
|
/* Written by Sergei A. Golubchik, who has a shared copyright to this code */
|
|
|
|
/* some definitions for full-text indices */
|
|
|
|
/* #include "myisam.h" */
|
|
|
|
#ifndef _ft_global_h
|
|
#define _ft_global_h
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
#include <my_compare.h>
|
|
|
|
/*
  Length limits for a full-text word.

  HA_FT_MAXBYTELEN is the limit in bytes.  HA_FT_MAXCHARLEN is derived from
  it by integer division by 3, i.e. it evaluates to 84.
  NOTE(review): the divisor presumably reflects a worst case of 3 bytes per
  character -- confirm against the character sets this is used with.
*/
#define HA_FT_MAXBYTELEN 254
#define HA_FT_MAXCHARLEN (HA_FT_MAXBYTELEN/3)

/*
  Built-in boolean-search operator string (14 characters).
  NOTE(review): presumably the default value of ft_boolean_syntax; the
  meaning of each position is not defined in this header.
*/
#define DEFAULT_FTB_SYNTAX "+ -><()~*:\"\"&|"
|
|
|
|
typedef struct st_ft_info FT_INFO;
|
|
struct _ft_vft
|
|
{
|
|
int (*read_next)(FT_INFO *, char *);
|
|
float (*find_relevance)(FT_INFO *, uchar *, uint);
|
|
void (*close_search)(FT_INFO *);
|
|
float (*get_relevance)(FT_INFO *);
|
|
void (*reinit_search)(FT_INFO *);
|
|
};
|
|
|
|
typedef struct st_ft_info_ext FT_INFO_EXT;
|
|
struct _ft_vft_ext
|
|
{
|
|
uint (*get_version)(); // Extended API version
|
|
ulonglong (*get_flags)();
|
|
ulonglong (*get_docid)(FT_INFO_EXT *);
|
|
ulonglong (*count_matches)(FT_INFO_EXT *);
|
|
};
|
|
|
|
/*
  Flags for extended FT API.

  Each flag is a distinct single bit of type long long.  Numbering starts
  at bit 1; bit 0 is not defined here.
  NOTE(review): presumably these are the bits reported by
  _ft_vft_ext::get_flags -- confirm with the callers.
*/
#define FTS_ORDERED_RESULT  (1LL << 1)
#define FTS_DOCID_IN_RESULT (1LL << 2)
|
|
|
|
/*
  Generic layouts of the search handles.  They are compiled only when
  FT_CORE is not defined.
  NOTE(review): presumably a translation unit that defines FT_CORE supplies
  its own definition of these structures -- confirm.

  Both structures begin with the same `please` pointer, so the basic
  function table sits at offset 0 in either of them; st_ft_info_ext adds a
  second pointer to the extended table.
*/
#ifndef FT_CORE
struct st_ft_info
{
  struct _ft_vft *please; /* INTERCAL style :-) */
};

struct st_ft_info_ext
{
  struct _ft_vft *please; /* INTERCAL style :-) */
  struct _ft_vft_ext *could_you;  /* extended function table */
};
#endif
|
|
|
|
extern const char *ft_stopword_file;
|
|
extern const char *ft_precompiled_stopwords[];
|
|
|
|
extern ulong ft_min_word_len;
|
|
extern ulong ft_max_word_len;
|
|
extern ulong ft_query_expansion_limit;
|
|
extern const char *ft_boolean_syntax;
|
|
extern struct st_mysql_ftparser ft_default_parser;
|
|
|
|
/*
  Set up and tear down the stopword list.  Both take no arguments.
  ft_init_stopwords() returns an int status.
  NOTE(review): the meaning of the return value is not visible in this
  header (presumably 0 on success) -- confirm.
*/
int ft_init_stopwords(void);
void ft_free_stopwords(void);
|
|
|
|
/*
  Search-mode flags.

  FT_NL is zero, i.e. the absence of every other flag.  FT_BOOL, FT_SORTED
  and FT_EXPAND are distinct single bits and can therefore be OR-ed
  together.
  NOTE(review): presumably passed as the flags argument of
  ft_init_search() -- confirm with the callers.
*/
#define FT_NL     0
#define FT_BOOL   1
#define FT_SORTED 2
#define FT_EXPAND 4   /* query expansion */
|
|
|
|
FT_INFO *ft_init_search(uint,void *, uint, uchar *, size_t,
|
|
CHARSET_INFO *, uchar *);
|
|
my_bool ft_boolean_check_syntax_string(const uchar *, size_t length,
|
|
CHARSET_INFO *cs);
|
|
|
|
/* Internal symbols for fulltext between maria and MyISAM */

/*
  The weight key type is HA_KEYTYPE_FLOAT and its length is 4; FT_SEGS is
  the number of key segments and sizes the ft_keysegs array.
*/
#define HA_FT_WTYPE  HA_KEYTYPE_FLOAT
#define HA_FT_WLEN   4
#define FT_SEGS      2

/*
  Width-neutral aliases for the 4-byte mi_sint4korr() / mi_int4store()
  helpers.  NOTE(review): the "4" presumably has to stay in step with
  HA_FT_WLEN -- confirm before changing either.
*/
#define ft_sintXkorr(A)    mi_sint4korr(A)
#define ft_intXstore(T,A)  mi_int4store(T,A)
|
|
|
|
extern const HA_KEYSEG ft_keysegs[FT_SEGS];
|
|
|
|
typedef union {int32 i; float f;} FT_WEIGTH;
|
|
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|
|
#endif
|