mariadb/strings/conf_to_src.c

341 lines
7.9 KiB
C
Raw Normal View History

/* Copyright (C) 2000 MySQL AB
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */

/* can't use -lmysys because this prog is used to create -lstrings */
#include <ctype.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <fcntl.h>
#include <my_global.h>
#include <m_ctype.h>
#include <my_xml.h>

/* Charset directory path.  Not referenced anywhere else in this file. */
#define CHARSETS_SUBDIR "sql/share/charsets"

/* Number of values print_arrays_for() asks print_array() to emit per table. */
#define CTYPE_TABLE_SIZE 257
#define TO_LOWER_TABLE_SIZE 256
#define TO_UPPER_TABLE_SIZE 256
#define SORT_ORDER_TABLE_SIZE 256

/* Number of values print_array() writes on one full output row. */
#define ROW_LEN 16

/* Program name printed by print_arrays_for() in messages and output. */
char *prog;

/*
  buf is the shared line/file-name scratch buffer; p and endptr are the
  scan cursors print_array() moves through it.
*/
char buf[1024], *p, *endptr;
/*
  Read n whitespace-separated hexadecimal words from f and print them to
  stdout as the initializer of "uchar <name>_<set>[]".

  f     open stream to read from; the rest of a line starting at '#' is
        skipped as a comment
  set   character set name, used as the suffix of the array identifier
  name  table name, used as the prefix of the array identifier
  n     number of values to read and print

  Each word is parsed with strtol() in base 16 and truncated to an
  unsigned char.  Uses the global buf, p and endptr as scan state; any
  text left in buf from an earlier call is discarded.

  If f runs out of input before n values were read the function returns
  at once, without printing the closing "};".
*/
void
print_array(FILE *f, const char *set, const char *name, int n)
{
  int i;
  char val[100];

  printf("uchar %s_%s[] = {\n", name, set);

  /* Start from an empty buffer so the first word forces a read from f. */
  p= buf;
  *buf= '\0';

  for (i= 0; i < n; ++i)
  {
    size_t len= 0;

    /* get a word from f */
    endptr= p;
    for (;;)
    {
      while (isspace((unsigned char) *endptr))
        ++endptr;
      if (*endptr && *endptr != '#')    /* not comment */
        break;
      if (fgets(buf, sizeof(buf), f) == NULL)
        return;                         /* XXX: break silently */
      endptr= buf;
    }

    /*
      Copy the word into val.  Stop at the terminating NUL as well as at
      whitespace (a last line without a newline has no trailing space),
      and drop characters that do not fit instead of overflowing val.
    */
    while (*endptr && !isspace((unsigned char) *endptr))
    {
      if (len < sizeof(val) - 1)
        val[len++]= *endptr;
      ++endptr;
    }
    val[len]= '\0';
    p= endptr;

    /*
      write the value out; rows are aligned so that the last row is a
      full one, which makes the first row short when n is not a multiple
      of ROW_LEN
    */
    if (i == 0 || i % ROW_LEN == n % ROW_LEN)
      printf(" ");
    printf("%3d", (unsigned char) strtol(val, (char **) NULL, 16));
    if (i < n - 1)
      printf(",");
    if ((i + 1) % ROW_LEN == n % ROW_LEN)
      printf("\n");
  }
  printf("};\n\n");
}
/*
  Open "<set>.conf" in the current directory and print its four tables
  (ctype, to_lower, to_upper, sort_order) to stdout as C arrays, preceded
  by a header comment naming the character set and this program.

  set   character set name; also the base name of the .conf file

  Exits with EXIT_FAILURE when the file name does not fit into the global
  buf or the file cannot be opened.
*/
void
print_arrays_for(char *set)
{
  FILE *f;
  int len;
  /* No visible code assigns prog, so never hand a NULL pointer to %s. */
  const char *progname= prog ? prog : "conf_to_src";

  /* Bounded formatting: set is caller supplied and buf is only 1024 bytes. */
  len= snprintf(buf, sizeof(buf), "%s.conf", set);
  if (len < 0 || (size_t) len >= sizeof(buf) ||
      (f= fopen(buf, "r")) == NULL)
  {
    fprintf(stderr, "%s: can't read conf file for charset %s\n",
            progname, set);
    exit(EXIT_FAILURE);
  }

  printf("/* The %s character set. Generated automatically by\n"
         "* the %s program\n"
         "*/\n\n",
         set, progname);

  /* it would be nice if this used the code in mysys/charset.c, but... */
  print_array(f, set, "ctype", CTYPE_TABLE_SIZE);
  print_array(f, set, "to_lower", TO_LOWER_TABLE_SIZE);
  print_array(f, set, "to_upper", TO_UPPER_TABLE_SIZE);
  print_array(f, set, "sort_order", SORT_ORDER_TABLE_SIZE);
  printf("\n");

  fclose(f);
}
/*
  Size in bytes of the buffer my_read_charset_file() reads a file into.
  Parenthesized so the macro expands safely inside larger expressions.
*/
#define MAX_BUF (16*1024)

/* Charset table, indexed by charset number; filled in by add_collation(). */
static CHARSET_INFO all_charsets[256];
/*
  Look up a charset number by name in all_charsets.

  charset_name  name to compare against each entry's name with strcmp()

  Returns the number of the first entry whose name matches, or 0 when no
  entry matches.  Every slot of the table is examined, including the last
  one.
*/
static int get_charset_number(const char *charset_name)
{
  CHARSET_INFO *cs;
  CHARSET_INFO *end= all_charsets +
                     sizeof(all_charsets) / sizeof(all_charsets[0]);

  for (cs= all_charsets; cs < end; ++cs)
  {
    if (cs->name && !strcmp(cs->name, charset_name))
      return cs->number;
  }
  return 0;
}
/*
  Duplicate len bytes starting at src into newly malloc()ed memory.

  src   start of the bytes to copy
  len   number of bytes to copy

  Returns the new buffer, which the caller owns, or NULL when malloc()
  fails (nothing is copied in that case).
*/
char *mdup(const char *src, uint len)
{
  char *dst= malloc(len);

  if (dst != NULL)
    memcpy(dst, src, len);
  return dst;
}
/*
  Merge the fields that are set in *from into *to.

  A non-zero number replaces to->number and the state bits are OR-ed in.
  Every string or table pointer that is non-NULL in *from is duplicated
  (strdup() for the names, mdup() for the tables) and the copy is stored
  in *to; fields that are NULL in *from leave *to untouched.
*/
static void simple_cs_copy_data(CHARSET_INFO *to, CHARSET_INFO *from)
{
  if (from->number)
    to->number= from->number;
  to->state|= from->state;

  /* names */
  if (from->csname != NULL)
  {
    to->csname= strdup(from->csname);
  }
  if (from->name != NULL)
  {
    to->name= strdup(from->name);
  }

  /* byte tables */
  if (from->ctype != NULL)
  {
    to->ctype= (uchar*) mdup((char*) from->ctype, MY_CS_CTYPE_TABLE_SIZE);
  }
  if (from->to_lower != NULL)
  {
    to->to_lower= (uchar*) mdup((char*) from->to_lower,
                                MY_CS_TO_LOWER_TABLE_SIZE);
  }
  if (from->to_upper != NULL)
  {
    to->to_upper= (uchar*) mdup((char*) from->to_upper,
                                MY_CS_TO_UPPER_TABLE_SIZE);
  }
  if (from->sort_order != NULL)
  {
    /* set_max_sort_char(to) is intentionally not called here */
    to->sort_order= (uchar*) mdup((char*) from->sort_order,
                                  MY_CS_SORT_ORDER_TABLE_SIZE);
  }

  /* 16-bit table: the size is given in bytes */
  if (from->tab_to_uni != NULL)
  {
    uint to_uni_bytes= MY_CS_TO_UNI_TABLE_SIZE*sizeof(uint16);

    /* create_fromuni(to) is intentionally not called here */
    to->tab_to_uni= (uint16*) mdup((char*) from->tab_to_uni, to_uni_bytes);
  }
}
/*
  Tell whether every field this tool needs is present in *cs.

  Returns 1 when csname, tab_to_uni, ctype, to_upper, to_lower, name and
  sort_order are all non-NULL and number is non-zero; returns 0 otherwise.
*/
static my_bool simple_cs_is_full(CHARSET_INFO *cs)
{
  if (!cs->csname || !cs->tab_to_uni || !cs->ctype ||
      !cs->to_upper || !cs->to_lower)
    return 0;

  if (!cs->number || !cs->name || !cs->sort_order)
    return 0;

  return 1;
}
/*
  Callback handed to my_parse_charset_xml(): store one parsed collation
  in all_charsets.

  cs   the parsed collation.  When it has a name and a number (given
       directly or found by name through get_charset_number()) its data
       is merged into all_charsets[cs->number], unless that slot is
       already flagged MY_CS_COMPILED.  Afterwards number, name, state
       and sort_order of *cs are cleared.

  A number that does not fit the table is reported on stderr and the
  collation is skipped instead of writing outside all_charsets.

  Always returns MY_XML_OK.
*/
static int add_collation(CHARSET_INFO *cs)
{
  const size_t n_charsets= sizeof(all_charsets) / sizeof(all_charsets[0]);

  if (cs->name && (cs->number || (cs->number= get_charset_number(cs->name))))
  {
    /* The cast also rejects a negative number should the field be signed. */
    if ((size_t) cs->number >= n_charsets)
    {
      fprintf(stderr, "Collation '%s': number %lu is out of range, ignored\n",
              cs->name, (unsigned long) cs->number);
    }
    else if (!(all_charsets[cs->number].state & MY_CS_COMPILED))
    {
      simple_cs_copy_data(&all_charsets[cs->number], cs);
    }

    cs->number= 0;
    cs->name= NULL;
    cs->state= 0;
    cs->sort_order= NULL;
  }
  return MY_XML_OK;
}
static int my_read_charset_file(const char *filename)
{
char buf[MAX_BUF];
int fd;
uint len;
if ((fd=open(filename,O_RDONLY)) < 0)
{
printf("Can't open '%s'\n",filename);
return 1;
}
len=read(fd,buf,MAX_BUF);
close(fd);
if (my_parse_charset_xml(buf,len,add_collation))
{
#if 0
printf("ERROR at line %d pos %d '%s'\n",
my_xml_error_lineno(&p)+1,
my_xml_error_pos(&p),
my_xml_error_string(&p));
#endif
}
return FALSE;
}
/*
  Print one brace-enclosed CHARSET_INFO initializer for *cs to stdout.

  The number, name, csname, strxfrm_multiply and mbmaxlen fields are taken
  from *cs; the table identifiers are built from cs->name.  When cs->name
  is NULL, nine NULL entries are written in place of the names and tables.
  All remaining entries are fixed identifiers.
*/
void dispcset(CHARSET_INFO *cs)
{
  /* Entries written between strxfrm_multiply and mbmaxlen. */
  static const char *const head[]=
  {
    "my_strnncoll_simple",
    "my_strnxfrm_simple",
    "my_like_range_simple",
    "my_wild_cmp_8bit"
  };
  /* Entries written after mbmaxlen; each one is followed by a comma. */
  static const char *const tail[]=
  {
    "NULL",
    "NULL",
    "NULL",
    "my_mb_wc_8bit",
    "my_wc_mb_8bit",
    "my_caseup_str_8bit",
    "my_casedn_str_8bit",
    "my_caseup_8bit",
    "my_casedn_8bit",
    "my_tosort_8bit",
    "my_strcasecmp_8bit",
    "my_strncasecmp_8bit",
    "my_hash_caseup_simple",
    "my_hash_sort_simple",
    "0",
    "my_snprintf_8bit",
    "my_long10_to_str_8bit",
    "my_longlong10_to_str_8bit",
    "my_fill_8bit",
    "my_strntol_8bit",
    "my_strntoul_8bit",
    "my_strntoll_8bit",
    "my_strntoull_8bit",
    "my_strntod_8bit"
  };
  size_t i;

  printf("{\n");
  printf(" %d,\n", cs->number);
  printf(" MY_CS_COMPILED,\n");

  if (cs->name)
  {
    /* Prefixes of the per-charset table identifiers, in output order. */
    static const char *const tables[]=
    {
      "ctype", "to_lower", "to_upper", "sort_order", "to_uni", "from_uni"
    };

    printf(" \"%s\",\n", cs->name);
    printf(" \"%s\",\n", cs->csname);
    printf(" \"\",\n");
    for (i= 0; i < sizeof(tables) / sizeof(tables[0]); i++)
      printf(" %s_%s,\n", tables[i], cs->name);
  }
  else
  {
    /* three name slots plus six table slots */
    for (i= 0; i < 9; i++)
      printf(" NULL,\n");
  }

  printf(" %d,\n", cs->strxfrm_multiply);
  for (i= 0; i < sizeof(head) / sizeof(head[0]); i++)
    printf(" %s,\n", head[i]);

  printf(" %d,\n", cs->mbmaxlen);
  for (i= 0; i < sizeof(tail) / sizeof(tail[0]); i++)
    printf(" %s,\n", tail[i]);

  /* last entry: no trailing comma */
  printf(" my_scan_8bit\n");
  printf("}\n");
}
int
main(int argc, char **argv __attribute__((unused)))
{
CHARSET_INFO ncs;
CHARSET_INFO *cs;
char filename[256];
if (argc < 2)
{
fprintf(stderr, "usage: %s source-dir\n", argv[0]);
exit(EXIT_FAILURE);
}
bzero((void*)&ncs,sizeof(ncs));
bzero((void*)&all_charsets,sizeof(all_charsets));
sprintf(filename,"%s/%s",argv[1],"Index.xml");
my_read_charset_file(filename);
printf("CHARSET_INFO compiled_charsets[] = {\n");
for (cs=all_charsets; cs < all_charsets+256; cs++)
{
if (cs->number)
{
if ( (!simple_cs_is_full(cs)) && (cs->csname) )
{
sprintf(filename,"%s/%s.xml",argv[1],cs->csname);
my_read_charset_file(filename);
}
if (simple_cs_is_full)
{
printf("#ifdef HAVE_CHARSET_%s\n",cs->csname);
dispcset(cs);
printf(",\n");
printf("#endif\n");
}
}
}
dispcset(&ncs);
printf("};\n");
return 0;
}