mirror of
https://github.com/MariaDB/server.git
synced 2025-01-27 01:04:19 +01:00
fd247cc21f
This patch also fixes: MDEV-33050 Build-in schemas like oracle_schema are accent insensitive MDEV-33084 LASTVAL(t1) and LASTVAL(T1) do not work well with lower-case-table-names=0 MDEV-33085 Tables T1 and t1 do not work well with ENGINE=CSV and lower-case-table-names=0 MDEV-33086 SHOW OPEN TABLES IN DB1 -- is case insensitive with lower-case-table-names=0 MDEV-33088 Cannot create triggers in the database `MYSQL` MDEV-33103 LOCK TABLE t1 AS t2 -- alias is not case sensitive with lower-case-table-names=0 MDEV-33109 DROP DATABASE MYSQL -- does not drop SP with lower-case-table-names=0 MDEV-33110 HANDLER commands are case insensitive with lower-case-table-names=0 MDEV-33119 User is case insensitive in INFORMATION_SCHEMA.VIEWS MDEV-33120 System log table names are case insensitive with lower-cast-table-names=0 - Removing the virtual function strnncoll() from MY_COLLATION_HANDLER - Adding a wrapper function CHARSET_INFO::streq(), to compare two strings for equality. For now it calls strnncoll() internally. In the future it will turn into a virtual function. - Adding new accent sensitive case insensitive collations: - utf8mb4_general1400_as_ci - utf8mb3_general1400_as_ci They implement accent sensitive case insensitive comparison. The weight of a character is equal to the code point of its upper case variant. These collations use Unicode-14.0.0 casefolding data. The result of my_charset_utf8mb3_general1400_as_ci.strcoll() is very close to the former my_charset_utf8mb3_general_ci.strcasecmp() There is only a difference in a couple dozen rare characters, because: - the switch from "tolower" to "toupper" comparison, to make utf8mb3_general1400_as_ci closer to utf8mb3_general_ci - the switch from Unicode-3.0.0 to Unicode-14.0.0 This difference should be tolarable. See the list of affected characters in the MDEV description. Note, utf8mb4_general1400_as_ci correctly handles non-BMP characters! Unlike utf8mb4_general_ci, it does not treat all BMP characters as equal. - Adding classes representing names of the file based database objects: Lex_ident_db Lex_ident_table Lex_ident_trigger Their comparison collation depends on the underlying file system case sensitivity and on --lower-case-table-names and can be either my_charset_bin or my_charset_utf8mb3_general1400_as_ci. - Adding classes representing names of other database objects, whose names have case insensitive comparison style, using my_charset_utf8mb3_general1400_as_ci: Lex_ident_column Lex_ident_sys_var Lex_ident_user_var Lex_ident_sp_var Lex_ident_ps Lex_ident_i_s_table Lex_ident_window Lex_ident_func Lex_ident_partition Lex_ident_with_element Lex_ident_rpl_filter Lex_ident_master_info Lex_ident_host Lex_ident_locale Lex_ident_plugin Lex_ident_engine Lex_ident_server Lex_ident_savepoint Lex_ident_charset engine_option_value::Name - All the mentioned Lex_ident_xxx classes implement a method streq(): if (ident1.streq(ident2)) do_equal(); This method works as a wrapper for CHARSET_INFO::streq(). - Changing a lot of "LEX_CSTRING name" to "Lex_ident_xxx name" in class members and in function/method parameters. - Replacing all calls like system_charset_info->coll->strcasecmp(ident1, ident2) to ident1.streq(ident2) - Taking advantage of the c++11 user defined literal operator for LEX_CSTRING (see m_strings.h) and Lex_ident_xxx (see lex_ident.h) data types. Use example: const Lex_ident_column primary_key_name= "PRIMARY"_Lex_ident_column; is now a shorter version of: const Lex_ident_column primary_key_name= Lex_ident_column({STRING_WITH_LEN("PRIMARY")});
267 lines
7.4 KiB
C
267 lines
7.4 KiB
C
/* Copyright (c) 2000, 2012, Oracle and/or its affiliates
|
||
Copyright (c) 2012, 2014, SkySQL Ab
|
||
|
||
This program is free software; you can redistribute it and/or modify
|
||
it under the terms of the GNU General Public License as published by
|
||
the Free Software Foundation; version 2 of the License.
|
||
|
||
This program is distributed in the hope that it will be useful,
|
||
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
GNU General Public License for more details.
|
||
|
||
You should have received a copy of the GNU General Public License
|
||
along with this program; if not, write to the Free Software
|
||
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1335 USA */
|
||
|
||
#include "mysys_priv.h"
|
||
#include <m_string.h>
|
||
|
||
#ifdef _WIN32
|
||
|
||
/*
|
||
Check a file or path for accessability.
|
||
|
||
SYNOPSIS
|
||
file_access()
|
||
path Path to file
|
||
amode Access method
|
||
|
||
RETURN VALUES
|
||
0 ok
|
||
-1 error (We use -1 as my_access is mapped to access on other platforms)
|
||
*/
|
||
|
||
int my_access(const char *path, int amode)
|
||
{
|
||
DWORD attributes;
|
||
|
||
attributes = GetFileAttributes(path);
|
||
if (attributes == INVALID_FILE_ATTRIBUTES ||
|
||
((attributes & FILE_ATTRIBUTE_READONLY) && (amode & W_OK)))
|
||
{
|
||
my_errno= errno= EACCES;
|
||
return -1;
|
||
}
|
||
return 0;
|
||
}
|
||
|
||
#endif /* _WIN32 */
|
||
|
||
|
||
/*
|
||
List of file names that causes problem on windows
|
||
|
||
NOTE that one can also not have file names of type CON.TXT
|
||
|
||
NOTE: it is important to keep "CLOCK$" on the first place,
|
||
we skip it in check_if_legal_tablename.
|
||
*/
|
||
static const char *reserved_names[]=
|
||
{
|
||
"CLOCK$",
|
||
"CON", "PRN", "AUX", "NUL",
|
||
"COM1", "COM2", "COM3", "COM4", "COM5", "COM6", "COM7", "COM8", "COM9",
|
||
"LPT1", "LPT2", "LPT3", "LPT4", "LPT5", "LPT6", "LPT7", "LPT8", "LPT9",
|
||
NullS
|
||
};
|
||
|
||
#define MAX_RESERVED_NAME_LENGTH 6
|
||
|
||
|
||
/*
|
||
Looks up a null-terminated string in a list,
|
||
case insensitively.
|
||
|
||
SYNOPSIS
|
||
str_list_find()
|
||
list list of items
|
||
str item to find
|
||
|
||
RETURN
|
||
0 ok
|
||
1 reserved file name
|
||
*/
|
||
static int str_list_find(const char **list, const char *str)
|
||
{
|
||
const char **name;
|
||
for (name= list; *name; name++)
|
||
{
|
||
if (!my_strcasecmp_latin1(*name, str))
|
||
return 1;
|
||
}
|
||
return 0;
|
||
}
|
||
|
||
|
||
/*
|
||
A map for faster reserved_names lookup,
|
||
helps to avoid loops in many cases.
|
||
1 - can be the first letter
|
||
2 - can be the second letter
|
||
4 - can be the third letter
|
||
*/
|
||
static char reserved_map[256]=
|
||
{
|
||
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, /* ................ */
|
||
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, /* ................ */
|
||
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, /* !"#$%&'()*+,-./ */
|
||
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, /* 0123456789:;<=>? */
|
||
0,1,0,1,0,0,0,0,0,0,0,0,7,4,5,2, /* @ABCDEFGHIJKLMNO */
|
||
3,0,2,0,4,2,0,0,4,0,0,0,0,0,0,0, /* PQRSTUVWXYZ[\]^_ */
|
||
0,1,0,1,0,0,0,0,0,0,0,0,7,4,5,2, /* bcdefghijklmno */
|
||
3,0,2,0,4,2,0,0,4,0,0,0,0,0,0,0, /* pqrstuvwxyz{|}~. */
|
||
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, /* ................ */
|
||
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, /* ................ */
|
||
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, /* ................ */
|
||
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, /* ................ */
|
||
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, /* ................ */
|
||
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, /* ................ */
|
||
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, /* ................ */
|
||
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0 /* ................ */
|
||
};
|
||
|
||
|
||
/*
|
||
Check if a table name may cause problems
|
||
|
||
SYNOPSIS
|
||
check_if_legal_tablename
|
||
name Table name (without any extensions)
|
||
|
||
DESCRIPTION
|
||
We don't check 'CLOCK$' because dollar sign is encoded as @0024,
|
||
making table file name 'CLOCK@0024', which is safe.
|
||
This is why we start lookup from the second element
|
||
(i.e. &reserver_name[1])
|
||
|
||
RETURN
|
||
0 ok
|
||
1 reserved file name
|
||
*/
|
||
|
||
int check_if_legal_tablename(const char *name)
|
||
{
|
||
DBUG_ENTER("check_if_legal_tablename");
|
||
DBUG_RETURN((reserved_map[(uchar) name[0]] & 1) &&
|
||
(reserved_map[(uchar) name[1]] & 2) &&
|
||
(reserved_map[(uchar) name[2]] & 4) &&
|
||
str_list_find(&reserved_names[1], name));
|
||
}
|
||
|
||
|
||
#ifdef _WIN32
|
||
/**
|
||
Checks if the drive letter supplied is valid or not. Valid drive
|
||
letters are A to Z, both lower case and upper case.
|
||
|
||
@param drive_letter : The drive letter to validate.
|
||
|
||
@return TRUE if the drive exists, FALSE otherwise.
|
||
*/
|
||
static my_bool does_drive_exists(char drive_letter)
|
||
{
|
||
DWORD drive_mask= GetLogicalDrives();
|
||
drive_letter= toupper(drive_letter);
|
||
|
||
return (drive_letter >= 'A' && drive_letter <= 'Z') &&
|
||
(drive_mask & (0x1 << (drive_letter - 'A')));
|
||
}
|
||
|
||
/**
|
||
Verifies if the file name supplied is allowed or not. On Windows
|
||
file names with a colon (:) are not allowed because such file names
|
||
store data in Alternate Data Streams which can be used to hide
|
||
the data.
|
||
Apart from colon, other characters that are not allowed in filenames
|
||
on Windows are greater/less sign, double quotes, forward slash, backslash,
|
||
pipe and star characters.
|
||
|
||
See MSDN documentation on filename restrictions.
|
||
|
||
@param name contains the file name with or without path
|
||
@param length contains the length of file name
|
||
@param allow_current_dir TRUE if paths like C:foobar are allowed,
|
||
FALSE otherwise
|
||
|
||
@return TRUE if the file name is allowed, FALSE otherwise.
|
||
*/
|
||
#define ILLEGAL_FILENAME_CHARS "<>:\"/\\|?*"
|
||
|
||
my_bool is_filename_allowed(const char *name __attribute__((unused)),
|
||
size_t length __attribute__((unused)),
|
||
my_bool allow_current_dir __attribute__((unused)))
|
||
{
|
||
/*
|
||
For Windows, check if the file name contains : character.
|
||
Start from end of path and search if the file name contains :
|
||
*/
|
||
const char* ch = NULL;
|
||
for (ch= name + length - 1; ch >= name; --ch)
|
||
{
|
||
if (FN_LIBCHAR == *ch || '/' == *ch)
|
||
break;
|
||
else if (':' == *ch)
|
||
{
|
||
/*
|
||
File names like C:foobar.txt are allowed since the syntax means
|
||
file foobar.txt in current directory of C drive. However file
|
||
names likes CC:foobar are not allowed since this syntax means ADS
|
||
foobar in file CC.
|
||
*/
|
||
return (allow_current_dir && (ch - name == 1) &&
|
||
does_drive_exists(*name));
|
||
}
|
||
else if (strchr(ILLEGAL_FILENAME_CHARS, *ch))
|
||
return FALSE;
|
||
}
|
||
return TRUE;
|
||
} /* is_filename_allowed */
|
||
#endif /* _WIN32 */
|
||
|
||
#if defined(_WIN32)
|
||
|
||
/*
|
||
Check if a path will access a reserved file name that may cause problems
|
||
|
||
SYNOPSIS
|
||
check_if_legal_filename
|
||
path Path to file
|
||
|
||
RETURN
|
||
0 ok
|
||
1 reserved file name
|
||
*/
|
||
|
||
int check_if_legal_filename(const char *path)
|
||
{
|
||
const char *end;
|
||
const char **reserved_name;
|
||
DBUG_ENTER("check_if_legal_filename");
|
||
|
||
if (!is_filename_allowed(path, strlen(path), TRUE))
|
||
DBUG_RETURN(1);
|
||
|
||
path+= dirname_length(path); /* To start of filename */
|
||
if (!(end= strchr(path, FN_EXTCHAR)))
|
||
end= strend(path);
|
||
if (path == end || (uint) (end - path) > MAX_RESERVED_NAME_LENGTH)
|
||
DBUG_RETURN(0); /* Simplify inner loop */
|
||
|
||
for (reserved_name= reserved_names; *reserved_name; reserved_name++)
|
||
{
|
||
const char *reserved= *reserved_name; /* never empty */
|
||
const char *name= path;
|
||
|
||
do
|
||
{
|
||
if (*reserved != my_toupper(&my_charset_latin1, *name))
|
||
break;
|
||
if (++name == end && !reserved[1])
|
||
DBUG_RETURN(1); /* Found wrong path */
|
||
} while (*++reserved);
|
||
}
|
||
DBUG_RETURN(0);
|
||
}
|
||
|
||
#endif /* defined(_WIN32) */
|