~drizzle-trunk/drizzle/development

1 by brian
clean slate
1
/* Copyright (C) 2000 MySQL AB
2
3
   This program is free software; you can redistribute it and/or modify
4
   it under the terms of the GNU General Public License as published by
5
   the Free Software Foundation; version 2 of the License.
6
7
   This program is distributed in the hope that it will be useful,
8
   but WITHOUT ANY WARRANTY; without even the implied warranty of
9
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
10
   GNU General Public License for more details.
11
12
   You should have received a copy of the GNU General Public License
13
   along with this program; if not, write to the Free Software
14
   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA */
15
16
/*
17
  A better inplementation of the UNIX ctype(3) library.
264.1.12 by Monty Taylor
Fixed ref to my_global.h in mystrings/longlong2str_asm.c.
18
  Notes:   drizzled/global.h should be included before ctype.h
1 by brian
clean slate
19
*/
20
21
#ifndef _m_ctype_h
22
#define _m_ctype_h
23
24
#ifdef	__cplusplus
25
extern "C" {
26
#endif
27
28
#define MY_CS_NAME_SIZE			32
29
#define MY_CS_CTYPE_TABLE_SIZE		257
30
#define MY_CS_TO_LOWER_TABLE_SIZE	256
31
#define MY_CS_TO_UPPER_TABLE_SIZE	256
32
#define MY_CS_SORT_ORDER_TABLE_SIZE	256
33
#define MY_CS_TO_UNI_TABLE_SIZE		256
34
35
#define CHARSET_DIR	"charsets/"
36
37
#define my_wc_t ulong
38
39
typedef struct unicase_info_st
40
{
206 by Brian Aker
Removed final uint dead types.
41
  uint16_t toupper;
42
  uint16_t tolower;
43
  uint16_t sort;
1 by brian
clean slate
44
} MY_UNICASE_INFO;
45
46
47
extern MY_UNICASE_INFO *my_unicase_default[256];
48
extern MY_UNICASE_INFO *my_unicase_turkish[256];
49
50
typedef struct uni_ctype_st
51
{
52
  uchar  pctype;
53
  uchar  *ctype;
54
} MY_UNI_CTYPE;
55
56
extern MY_UNI_CTYPE my_uni_ctype[256];
57
58
/* wm_wc and wc_mb return codes */
59
#define MY_CS_ILSEQ	0     /* Wrong by sequence: wb_wc                   */
60
#define MY_CS_ILUNI	0     /* Cannot encode Unicode to charset: wc_mb    */
61
#define MY_CS_TOOSMALL  -101  /* Need at least one byte:    wc_mb and mb_wc */
62
#define MY_CS_TOOSMALL2 -102  /* Need at least two bytes:   wc_mb and mb_wc */
63
#define MY_CS_TOOSMALL3 -103  /* Need at least three bytes: wc_mb and mb_wc */
64
/* These following three are currently not really used */
65
#define MY_CS_TOOSMALL4 -104  /* Need at least 4 bytes: wc_mb and mb_wc */
66
#define MY_CS_TOOSMALL5 -105  /* Need at least 5 bytes: wc_mb and mb_wc */
67
#define MY_CS_TOOSMALL6 -106  /* Need at least 6 bytes: wc_mb and mb_wc */
68
/* A helper macros for "need at least n bytes" */
69
#define MY_CS_TOOSMALLN(n)    (-100-(n))
70
71
#define MY_SEQ_INTTAIL	1
72
#define MY_SEQ_SPACES	2
73
74
        /* My charsets_list flags */
75
#define MY_CS_COMPILED  1      /* compiled-in sets               */
76
#define MY_CS_CONFIG    2      /* sets that have a *.conf file   */
77
#define MY_CS_INDEX     4      /* sets listed in the Index file  */
78
#define MY_CS_LOADED    8      /* sets that are currently loaded */
79
#define MY_CS_BINSORT	16     /* if binary sort order           */
80
#define MY_CS_PRIMARY	32     /* if primary collation           */
81
#define MY_CS_STRNXFRM	64     /* if strnxfrm is used for sort   */
82
#define MY_CS_UNICODE	128    /* is a charset is full unicode   */
83
#define MY_CS_READY	256    /* if a charset is initialized    */
84
#define MY_CS_AVAILABLE	512    /* If either compiled-in or loaded*/
85
#define MY_CS_CSSORT	1024   /* if case sensitive sort order   */	
86
#define MY_CS_HIDDEN	2048   /* don't display in SHOW          */	
87
#define MY_CS_PUREASCII 4096   /* if a charset is pure ascii     */
88
#define MY_CS_NONASCII  8192   /* if not ASCII-compatible        */
89
#define MY_CHARSET_UNDEFINED 0
90
91
/* Character repertoire flags */
92
#define MY_REPERTOIRE_ASCII      1 /* Pure ASCII            U+0000..U+007F */
93
#define MY_REPERTOIRE_EXTENDED   2 /* Extended characters:  U+0080..U+FFFF */
94
#define MY_REPERTOIRE_UNICODE30  3 /* ASCII | EXTENDED:     U+0000..U+FFFF */
95
96
/* Flags for strxfrm */
97
#define MY_STRXFRM_LEVEL1          0x00000001 /* for primary weights   */
98
#define MY_STRXFRM_LEVEL2          0x00000002 /* for secondary weights */
99
#define MY_STRXFRM_LEVEL3          0x00000004 /* for tertiary weights  */
100
#define MY_STRXFRM_LEVEL4          0x00000008 /* fourth level weights  */
101
#define MY_STRXFRM_LEVEL5          0x00000010 /* fifth level weights   */
102
#define MY_STRXFRM_LEVEL6          0x00000020 /* sixth level weights   */
103
#define MY_STRXFRM_LEVEL_ALL       0x0000003F /* Bit OR for the above six */
104
#define MY_STRXFRM_NLEVELS         6          /* Number of possible levels*/
105
106
#define MY_STRXFRM_PAD_WITH_SPACE  0x00000040 /* if pad result with spaces */
107
#define MY_STRXFRM_UNUSED_00000080 0x00000080 /* for future extensions     */
108
109
#define MY_STRXFRM_DESC_LEVEL1     0x00000100 /* if desc order for level1 */
110
#define MY_STRXFRM_DESC_LEVEL2     0x00000200 /* if desc order for level2 */
111
#define MY_STRXFRM_DESC_LEVEL3     0x00000300 /* if desc order for level3 */
112
#define MY_STRXFRM_DESC_LEVEL4     0x00000800 /* if desc order for level4 */
113
#define MY_STRXFRM_DESC_LEVEL5     0x00001000 /* if desc order for level5 */
114
#define MY_STRXFRM_DESC_LEVEL6     0x00002000 /* if desc order for level6 */
115
#define MY_STRXFRM_DESC_SHIFT      8
116
117
#define MY_STRXFRM_UNUSED_00004000 0x00004000 /* for future extensions     */
118
#define MY_STRXFRM_UNUSED_00008000 0x00008000 /* for future extensions     */
119
120
#define MY_STRXFRM_REVERSE_LEVEL1  0x00010000 /* if reverse order for level1 */
121
#define MY_STRXFRM_REVERSE_LEVEL2  0x00020000 /* if reverse order for level2 */
122
#define MY_STRXFRM_REVERSE_LEVEL3  0x00040000 /* if reverse order for level3 */
123
#define MY_STRXFRM_REVERSE_LEVEL4  0x00080000 /* if reverse order for level4 */
124
#define MY_STRXFRM_REVERSE_LEVEL5  0x00100000 /* if reverse order for level5 */
125
#define MY_STRXFRM_REVERSE_LEVEL6  0x00200000 /* if reverse order for level6 */
126
#define MY_STRXFRM_REVERSE_SHIFT   16
127
128
129
typedef struct my_uni_idx_st
130
{
206 by Brian Aker
Removed final uint dead types.
131
  uint16_t from;
132
  uint16_t to;
1 by brian
clean slate
133
  uchar  *tab;
134
} MY_UNI_IDX;
135
136
typedef struct
137
{
138
  uint beg;
139
  uint end;
140
  uint mb_len;
141
} my_match_t;
142
143
enum my_lex_states
144
{
145
  MY_LEX_START, MY_LEX_CHAR, MY_LEX_IDENT, 
146
  MY_LEX_IDENT_SEP, MY_LEX_IDENT_START,
147
  MY_LEX_REAL, MY_LEX_HEX_NUMBER, MY_LEX_BIN_NUMBER,
148
  MY_LEX_CMP_OP, MY_LEX_LONG_CMP_OP, MY_LEX_STRING, MY_LEX_COMMENT, MY_LEX_END,
149
  MY_LEX_OPERATOR_OR_IDENT, MY_LEX_NUMBER_IDENT, MY_LEX_INT_OR_REAL,
150
  MY_LEX_REAL_OR_POINT, MY_LEX_BOOL, MY_LEX_EOL, MY_LEX_ESCAPE, 
151
  MY_LEX_LONG_COMMENT, MY_LEX_END_LONG_COMMENT, MY_LEX_SEMICOLON, 
152
  MY_LEX_SET_VAR, MY_LEX_USER_END, MY_LEX_HOSTNAME, MY_LEX_SKIP, 
153
  MY_LEX_USER_VARIABLE_DELIMITER, MY_LEX_SYSTEM_VAR,
154
  MY_LEX_IDENT_OR_KEYWORD,
235 by Brian Aker
Final bit of NCHAR removed.
155
  MY_LEX_IDENT_OR_HEX, MY_LEX_IDENT_OR_BIN,
1 by brian
clean slate
156
  MY_LEX_STRING_OR_DELIMITER
157
};
158
159
struct charset_info_st;
160
161
162
/* See strings/CHARSET_INFO.txt for information about this structure  */
163
typedef struct my_collation_handler_st
164
{
276 by Brian Aker
Cleaned out my_bool from strings.
165
  bool (*init)(struct charset_info_st *, void *(*alloc)(size_t));
1 by brian
clean slate
166
  /* Collation routines */
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
167
  int     (*strnncoll)(const struct charset_info_st * const,
276 by Brian Aker
Cleaned out my_bool from strings.
168
		       const uchar *, size_t, const uchar *, size_t, bool);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
169
  int     (*strnncollsp)(const struct charset_info_st * const,
1 by brian
clean slate
170
                         const uchar *, size_t, const uchar *, size_t,
276 by Brian Aker
Cleaned out my_bool from strings.
171
                         bool diff_if_only_endspace_difference);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
172
  size_t  (*strnxfrm)(const struct charset_info_st * const,
1 by brian
clean slate
173
                      uchar *dst, size_t dstlen, uint nweights,
174
                      const uchar *src, size_t srclen, uint flags);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
175
  size_t    (*strnxfrmlen)(const struct charset_info_st * const, size_t);
276 by Brian Aker
Cleaned out my_bool from strings.
176
  bool (*like_range)(const struct charset_info_st * const,
77.1.95 by Monty Taylor
Fixed silly my_bool==char nonsense.
177
                        const char *s, size_t s_length,
178
                        char escape, char w_one, char w_many,
179
                        size_t res_length,
180
                        char *min_str, char *max_str,
181
                        size_t *min_len, size_t *max_len);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
182
  int     (*wildcmp)(const struct charset_info_st * const,
1 by brian
clean slate
183
  		     const char *str,const char *str_end,
184
                     const char *wildstr,const char *wildend,
185
                     int escape,int w_one, int w_many);
186
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
187
  int  (*strcasecmp)(const struct charset_info_st * const, const char *, const char *);
1 by brian
clean slate
188
  
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
189
  uint (*instr)(const struct charset_info_st * const,
1 by brian
clean slate
190
                const char *b, size_t b_length,
191
                const char *s, size_t s_length,
192
                my_match_t *match, uint nmatch);
193
  
194
  /* Hash calculation */
236.3.9 by Andrey Hristov
- Fix build of exotic, mostly non-western, charsets (--with-extra-charsets)
195
  void (*hash_sort)(const struct charset_info_st *cs, const uchar *key, size_t len,
290 by Brian Aker
Update for ulong change over.
196
                    uint32_t *nr1, uint32_t *nr2); 
276 by Brian Aker
Cleaned out my_bool from strings.
197
  bool (*propagate)(const struct charset_info_st *cs, const uchar *str, size_t len);
1 by brian
clean slate
198
} MY_COLLATION_HANDLER;
199
200
extern MY_COLLATION_HANDLER my_collation_mb_bin_handler;
201
extern MY_COLLATION_HANDLER my_collation_8bit_bin_handler;
202
extern MY_COLLATION_HANDLER my_collation_8bit_simple_ci_handler;
203
extern MY_COLLATION_HANDLER my_collation_ucs2_uca_handler;
204
205
/* Some typedef to make it easy for C++ to make function pointers */
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
206
typedef int (*my_charset_conv_mb_wc)(const struct charset_info_st * const, my_wc_t *,
1 by brian
clean slate
207
                                     const uchar *, const uchar *);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
208
typedef int (*my_charset_conv_wc_mb)(const struct charset_info_st * const, my_wc_t,
1 by brian
clean slate
209
                                     uchar *, uchar *);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
210
typedef size_t (*my_charset_conv_case)(const struct charset_info_st * const,
1 by brian
clean slate
211
                                       char *, size_t, char *, size_t);
212
213
214
/* See strings/CHARSET_INFO.txt about information on this structure  */
215
typedef struct my_charset_handler_st
216
{
276 by Brian Aker
Cleaned out my_bool from strings.
217
  bool (*init)(struct charset_info_st *, void *(*alloc)(size_t));
1 by brian
clean slate
218
  /* Multibyte routines */
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
219
  uint    (*ismbchar)(const struct charset_info_st * const, const char *, const char *);
220
  uint    (*mbcharlen)(const struct charset_info_st * const, uint c);
221
  size_t  (*numchars)(const struct charset_info_st * const, const char *b, const char *e);
222
  size_t  (*charpos)(const struct charset_info_st * const, const char *b, const char *e,
1 by brian
clean slate
223
                     size_t pos);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
224
  size_t  (*well_formed_len)(const struct charset_info_st * const,
1 by brian
clean slate
225
                             const char *b,const char *e,
226
                             size_t nchars, int *error);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
227
  size_t  (*lengthsp)(const struct charset_info_st * const, const char *ptr, size_t length);
228
  size_t  (*numcells)(const struct charset_info_st * const, const char *b, const char *e);
1 by brian
clean slate
229
  
230
  /* Unicode conversion */
231
  my_charset_conv_mb_wc mb_wc;
232
  my_charset_conv_wc_mb wc_mb;
233
234
  /* CTYPE scanner */
236.3.9 by Andrey Hristov
- Fix build of exotic, mostly non-western, charsets (--with-extra-charsets)
235
  int (*ctype)(const struct charset_info_st *cs, int *ctype,
1 by brian
clean slate
236
               const uchar *s, const uchar *e);
237
  
238
  /* Functions for case and sort conversion */
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
239
  size_t  (*caseup_str)(const struct charset_info_st * const, char *);
240
  size_t  (*casedn_str)(const struct charset_info_st * const, char *);
1 by brian
clean slate
241
242
  my_charset_conv_case caseup;
243
  my_charset_conv_case casedn;
244
245
  /* Charset dependant snprintf() */
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
246
  size_t (*snprintf)(const struct charset_info_st * const, char *to, size_t n,
1 by brian
clean slate
247
                     const char *fmt,
212.5.26 by Monty Taylor
Removed my_attribute. Renaming __attribute__((format(x,y,z))) to ATTRIBUTE_FORMAT(x,y,z) is retarded. So we don't do it anymore.
248
                     ...) __attribute__((format(printf, 4, 5)));
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
249
  size_t (*long10_to_str)(const struct charset_info_st * const, char *to, size_t n,
1 by brian
clean slate
250
                          int radix, long int val);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
251
  size_t (*int64_t10_to_str)(const struct charset_info_st * const, char *to, size_t n,
152 by Brian Aker
longlong replacement
252
                              int radix, int64_t val);
1 by brian
clean slate
253
  
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
254
  void (*fill)(const struct charset_info_st * const, char *to, size_t len, int fill);
1 by brian
clean slate
255
  
256
  /* String-to-number conversion routines */
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
257
  long        (*strntol)(const struct charset_info_st * const, const char *s, size_t l,
258
			 int base, char **e, int *err);
259
  ulong      (*strntoul)(const struct charset_info_st * const, const char *s, size_t l,
260
			 int base, char **e, int *err);
261
  int64_t   (*strntoll)(const struct charset_info_st * const, const char *s, size_t l,
262
			 int base, char **e, int *err);
263
  uint64_t (*strntoull)(const struct charset_info_st * const, const char *s, size_t l,
264
			 int base, char **e, int *err);
265
  double      (*strntod)(const struct charset_info_st * const, char *s, size_t l, char **e,
1 by brian
clean slate
266
			 int *err);
236.3.9 by Andrey Hristov
- Fix build of exotic, mostly non-western, charsets (--with-extra-charsets)
267
  int64_t    (*strtoll10)(const struct charset_info_st *cs,
1 by brian
clean slate
268
                           const char *nptr, char **endptr, int *error);
236.3.9 by Andrey Hristov
- Fix build of exotic, mostly non-western, charsets (--with-extra-charsets)
269
  uint64_t   (*strntoull10rnd)(const struct charset_info_st *cs,
1 by brian
clean slate
270
                                const char *str, size_t length,
271
                                int unsigned_fl,
272
                                char **endptr, int *error);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
273
  size_t        (*scan)(const struct charset_info_st * const, const char *b, const char *e,
1 by brian
clean slate
274
                        int sq);
275
} MY_CHARSET_HANDLER;
276
277
extern MY_CHARSET_HANDLER my_charset_8bit_handler;
278
extern MY_CHARSET_HANDLER my_charset_ucs2_handler;
279
280
281
/* See strings/CHARSET_INFO.txt about information on this structure  */
282
typedef struct charset_info_st
283
{
284
  uint      number;
285
  uint      primary_number;
286
  uint      binary_number;
287
  uint      state;
288
  const char *csname;
289
  const char *name;
290
  const char *comment;
291
  const char *tailoring;
292
  uchar    *ctype;
293
  uchar    *to_lower;
294
  uchar    *to_upper;
295
  uchar    *sort_order;
206 by Brian Aker
Removed final uint dead types.
296
  uint16_t   *contractions;
297
  uint16_t   **sort_order_big;
298
  uint16_t      *tab_to_uni;
1 by brian
clean slate
299
  MY_UNI_IDX  *tab_from_uni;
300
  MY_UNICASE_INFO **caseinfo;
301
  uchar     *state_map;
302
  uchar     *ident_map;
303
  uint      strxfrm_multiply;
304
  uchar     caseup_multiply;
305
  uchar     casedn_multiply;
306
  uint      mbminlen;
307
  uint      mbmaxlen;
206 by Brian Aker
Removed final uint dead types.
308
  uint16_t    min_sort_char;
309
  uint16_t    max_sort_char; /* For LIKE optimization */
1 by brian
clean slate
310
  uchar     pad_char;
276 by Brian Aker
Cleaned out my_bool from strings.
311
  bool   escape_with_backslash_is_dangerous;
1 by brian
clean slate
312
  uchar     levels_for_compare;
313
  uchar     levels_for_order;
314
  
315
  MY_CHARSET_HANDLER *cset;
316
  MY_COLLATION_HANDLER *coll;
317
  
318
} CHARSET_INFO;
319
#define ILLEGAL_CHARSET_INFO_NUMBER (~0U)
320
321
322
extern CHARSET_INFO my_charset_bin;
323
extern CHARSET_INFO my_charset_big5_chinese_ci;
324
extern CHARSET_INFO my_charset_big5_bin;
325
extern CHARSET_INFO my_charset_cp932_japanese_ci;
326
extern CHARSET_INFO my_charset_cp932_bin;
327
extern CHARSET_INFO my_charset_cp1250_czech_ci;
328
extern CHARSET_INFO my_charset_eucjpms_japanese_ci;
329
extern CHARSET_INFO my_charset_eucjpms_bin;
330
extern CHARSET_INFO my_charset_euckr_korean_ci;
331
extern CHARSET_INFO my_charset_euckr_bin;
332
extern CHARSET_INFO my_charset_filename;
333
extern CHARSET_INFO my_charset_gb2312_chinese_ci;
334
extern CHARSET_INFO my_charset_gb2312_bin;
335
extern CHARSET_INFO my_charset_gbk_chinese_ci;
336
extern CHARSET_INFO my_charset_gbk_bin;
337
extern CHARSET_INFO my_charset_latin1;
338
extern CHARSET_INFO my_charset_latin1_german2_ci;
339
extern CHARSET_INFO my_charset_latin1_bin;
340
extern CHARSET_INFO my_charset_latin2_czech_ci;
341
extern CHARSET_INFO my_charset_sjis_japanese_ci;
342
extern CHARSET_INFO my_charset_sjis_bin;
343
extern CHARSET_INFO my_charset_tis620_thai_ci;
344
extern CHARSET_INFO my_charset_tis620_bin;
345
extern CHARSET_INFO my_charset_ucs2_general_ci;
346
extern CHARSET_INFO my_charset_ucs2_bin;
347
extern CHARSET_INFO my_charset_ucs2_unicode_ci;
348
extern CHARSET_INFO my_charset_ujis_japanese_ci;
349
extern CHARSET_INFO my_charset_ujis_bin;
350
extern CHARSET_INFO my_charset_utf16_bin;
351
extern CHARSET_INFO my_charset_utf16_general_ci;
352
extern CHARSET_INFO my_charset_utf16_unicode_ci;
353
extern CHARSET_INFO my_charset_utf32_bin;
354
extern CHARSET_INFO my_charset_utf32_general_ci;
355
extern CHARSET_INFO my_charset_utf32_unicode_ci;
356
extern CHARSET_INFO my_charset_utf8mb3_bin;
357
extern CHARSET_INFO my_charset_utf8mb3_general_ci;
358
extern CHARSET_INFO my_charset_utf8mb3_unicode_ci;
359
extern CHARSET_INFO my_charset_utf8mb4_bin;
360
extern CHARSET_INFO my_charset_utf8mb4_general_ci;
361
extern CHARSET_INFO my_charset_utf8mb4_unicode_ci;
362
363
#define MY_UTF8MB3                 "utf8mb3"
364
#define MY_UTF8MB4                 "utf8"
365
#define my_charset_utf8_general_ci my_charset_utf8mb4_general_ci
366
#define my_charset_utf8_bin        my_charset_utf8mb4_bin
367
368
369
/* declarations for simple charsets */
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
370
extern size_t my_strnxfrm_simple(const CHARSET_INFO * const,
1 by brian
clean slate
371
                                 uchar *dst, size_t dstlen, uint nweights,
372
                                 const uchar *src, size_t srclen, uint flags);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
373
size_t my_strnxfrmlen_simple(const CHARSET_INFO * const, size_t);
374
extern int  my_strnncoll_simple(const CHARSET_INFO * const, const uchar *, size_t,
276 by Brian Aker
Cleaned out my_bool from strings.
375
				const uchar *, size_t, bool);
1 by brian
clean slate
376
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
377
extern int  my_strnncollsp_simple(const CHARSET_INFO * const, const uchar *, size_t,
1 by brian
clean slate
378
                                  const uchar *, size_t,
276 by Brian Aker
Cleaned out my_bool from strings.
379
                                  bool diff_if_only_endspace_difference);
1 by brian
clean slate
380
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
381
extern void my_hash_sort_simple(const CHARSET_INFO * const cs,
1 by brian
clean slate
382
				const uchar *key, size_t len,
290 by Brian Aker
Update for ulong change over.
383
				uint32_t *nr1, uint32_t *nr2); 
1 by brian
clean slate
384
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
385
extern size_t my_lengthsp_8bit(const CHARSET_INFO * const cs, const char *ptr, size_t length);
1 by brian
clean slate
386
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
387
extern uint my_instr_simple(const CHARSET_INFO * const,
1 by brian
clean slate
388
                            const char *b, size_t b_length,
389
                            const char *s, size_t s_length,
390
                            my_match_t *match, uint nmatch);
391
392
393
/* Functions for 8bit */
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
394
extern size_t my_caseup_str_8bit(const CHARSET_INFO * const, char *);
395
extern size_t my_casedn_str_8bit(const CHARSET_INFO * const, char *);
396
extern size_t my_caseup_8bit(const CHARSET_INFO * const, char *src, size_t srclen,
397
                             char *dst, size_t dstlen);
398
extern size_t my_casedn_8bit(const CHARSET_INFO * const, char *src, size_t srclen,
399
                             char *dst, size_t dstlen);
400
401
extern int my_strcasecmp_8bit(const CHARSET_INFO * const  cs, const char *, const char *);
402
403
int my_mb_wc_8bit(const CHARSET_INFO * const cs,my_wc_t *wc, const uchar *s,const uchar *e);
404
int my_wc_mb_8bit(const CHARSET_INFO * const cs,my_wc_t wc, uchar *s, uchar *e);
405
406
int my_mb_ctype_8bit(const CHARSET_INFO * const,int *, const uchar *,const uchar *);
407
int my_mb_ctype_mb(const CHARSET_INFO * const,int *, const uchar *,const uchar *);
408
409
size_t my_scan_8bit(const CHARSET_INFO * const cs, const char *b, const char *e, int sq);
410
411
size_t my_snprintf_8bit(const CHARSET_INFO * const, char *to, size_t n,
1 by brian
clean slate
412
                        const char *fmt, ...)
212.5.26 by Monty Taylor
Removed my_attribute. Renaming __attribute__((format(x,y,z))) to ATTRIBUTE_FORMAT(x,y,z) is retarded. So we don't do it anymore.
413
  __attribute__((format(printf, 4, 5)));
1 by brian
clean slate
414
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
415
long       my_strntol_8bit(const CHARSET_INFO * const, const char *s, size_t l, int base,
1 by brian
clean slate
416
                           char **e, int *err);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
417
ulong      my_strntoul_8bit(const CHARSET_INFO * const, const char *s, size_t l, int base,
418
			    char **e, int *err);
419
int64_t   my_strntoll_8bit(const CHARSET_INFO * const, const char *s, size_t l, int base,
420
			    char **e, int *err);
421
uint64_t my_strntoull_8bit(const CHARSET_INFO * const, const char *s, size_t l, int base,
422
			    char **e, int *err);
423
double      my_strntod_8bit(const CHARSET_INFO * const, char *s, size_t l,char **e,
1 by brian
clean slate
424
			    int *err);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
425
size_t my_long10_to_str_8bit(const CHARSET_INFO * const, char *to, size_t l, int radix,
1 by brian
clean slate
426
                             long int val);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
427
size_t my_int64_t10_to_str_8bit(const CHARSET_INFO * const, char *to, size_t l, int radix,
152 by Brian Aker
longlong replacement
428
                                 int64_t val);
1 by brian
clean slate
429
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
430
int64_t my_strtoll10_8bit(const CHARSET_INFO * const cs,
1 by brian
clean slate
431
                           const char *nptr, char **endptr, int *error);
152 by Brian Aker
longlong replacement
432
int64_t my_strtoll10_ucs2(CHARSET_INFO *cs, 
1 by brian
clean slate
433
                           const char *nptr, char **endptr, int *error);
434
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
435
uint64_t my_strntoull10rnd_8bit(const CHARSET_INFO * const cs,
1 by brian
clean slate
436
                                 const char *str, size_t length, int
437
                                 unsigned_fl, char **endptr, int *error);
151 by Brian Aker
Ulonglong to uint64_t
438
uint64_t my_strntoull10rnd_ucs2(CHARSET_INFO *cs, 
1 by brian
clean slate
439
                                 const char *str, size_t length,
440
                                 int unsigned_fl, char **endptr, int *error);
441
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
442
void my_fill_8bit(const CHARSET_INFO * const cs, char* to, size_t l, int fill);
1 by brian
clean slate
443
276 by Brian Aker
Cleaned out my_bool from strings.
444
bool  my_like_range_simple(const CHARSET_INFO * const cs,
1 by brian
clean slate
445
			      const char *ptr, size_t ptr_length,
77.1.95 by Monty Taylor
Fixed silly my_bool==char nonsense.
446
			      char escape, char w_one, char w_many,
1 by brian
clean slate
447
			      size_t res_length,
448
			      char *min_str, char *max_str,
449
			      size_t *min_length, size_t *max_length);
450
276 by Brian Aker
Cleaned out my_bool from strings.
451
bool  my_like_range_mb(const CHARSET_INFO * const cs,
1 by brian
clean slate
452
			  const char *ptr, size_t ptr_length,
77.1.95 by Monty Taylor
Fixed silly my_bool==char nonsense.
453
			  char escape, char w_one, char w_many,
1 by brian
clean slate
454
			  size_t res_length,
455
			  char *min_str, char *max_str,
456
			  size_t *min_length, size_t *max_length);
457
276 by Brian Aker
Cleaned out my_bool from strings.
458
bool  my_like_range_ucs2(const CHARSET_INFO * const cs,
1 by brian
clean slate
459
			    const char *ptr, size_t ptr_length,
77.1.95 by Monty Taylor
Fixed silly my_bool==char nonsense.
460
			    char escape, char w_one, char w_many,
1 by brian
clean slate
461
			    size_t res_length,
462
			    char *min_str, char *max_str,
463
			    size_t *min_length, size_t *max_length);
464
276 by Brian Aker
Cleaned out my_bool from strings.
465
bool  my_like_range_utf16(const CHARSET_INFO * const cs,
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
466
			     const char *ptr, size_t ptr_length,
467
			     char escape, char w_one, char w_many,
468
			     size_t res_length,
469
			     char *min_str, char *max_str,
470
			     size_t *min_length, size_t *max_length);
471
276 by Brian Aker
Cleaned out my_bool from strings.
472
bool  my_like_range_utf32(const CHARSET_INFO * const cs,
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
473
			     const char *ptr, size_t ptr_length,
474
			     char escape, char w_one, char w_many,
475
			     size_t res_length,
476
			     char *min_str, char *max_str,
477
			     size_t *min_length, size_t *max_length);
478
479
480
int my_wildcmp_8bit(const CHARSET_INFO * const,
1 by brian
clean slate
481
		    const char *str,const char *str_end,
482
		    const char *wildstr,const char *wildend,
483
		    int escape, int w_one, int w_many);
484
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
485
int my_wildcmp_bin(const CHARSET_INFO * const,
1 by brian
clean slate
486
		   const char *str,const char *str_end,
487
		   const char *wildstr,const char *wildend,
488
		   int escape, int w_one, int w_many);
489
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
490
size_t my_numchars_8bit(const CHARSET_INFO * const, const char *b, const char *e);
491
size_t my_numcells_8bit(const CHARSET_INFO * const, const char *b, const char *e);
492
size_t my_charpos_8bit(const CHARSET_INFO * const, const char *b, const char *e, size_t pos);
493
size_t my_well_formed_len_8bit(const CHARSET_INFO * const, const char *b, const char *e,
1 by brian
clean slate
494
                             size_t pos, int *error);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
495
uint my_mbcharlen_8bit(const CHARSET_INFO * const, uint c);
1 by brian
clean slate
496
497
498
/* Functions for multibyte charsets */
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
499
extern size_t my_caseup_str_mb(const CHARSET_INFO * const, char *);
500
extern size_t my_casedn_str_mb(const CHARSET_INFO * const, char *);
501
extern size_t my_caseup_mb(const CHARSET_INFO * const, char *src, size_t srclen,
502
                                         char *dst, size_t dstlen);
503
extern size_t my_casedn_mb(const CHARSET_INFO * const, char *src, size_t srclen,
504
                                         char *dst, size_t dstlen);
505
extern int my_strcasecmp_mb(const CHARSET_INFO * const  cs, const char *s, const char *t);
1 by brian
clean slate
506
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
507
int my_wildcmp_mb(const CHARSET_INFO * const,
1 by brian
clean slate
508
		  const char *str,const char *str_end,
509
		  const char *wildstr,const char *wildend,
510
		  int escape, int w_one, int w_many);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
511
size_t my_numchars_mb(const CHARSET_INFO * const, const char *b, const char *e);
512
size_t my_numcells_mb(const CHARSET_INFO * const, const char *b, const char *e);
513
size_t my_charpos_mb(const CHARSET_INFO * const, const char *b, const char *e, size_t pos);
514
size_t my_well_formed_len_mb(const CHARSET_INFO * const, const char *b, const char *e,
1 by brian
clean slate
515
                             size_t pos, int *error);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
516
uint my_instr_mb(const CHARSET_INFO * const,
1 by brian
clean slate
517
                 const char *b, size_t b_length,
518
                 const char *s, size_t s_length,
519
                 my_match_t *match, uint nmatch);
520
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
521
int my_strnncoll_mb_bin(const CHARSET_INFO * const  cs,
1 by brian
clean slate
522
                        const uchar *s, size_t slen,
523
                        const uchar *t, size_t tlen,
276 by Brian Aker
Cleaned out my_bool from strings.
524
                        bool t_is_prefix);
1 by brian
clean slate
525
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
526
int my_strnncollsp_mb_bin(const CHARSET_INFO * const cs,
1 by brian
clean slate
527
                          const uchar *a, size_t a_length,
528
                          const uchar *b, size_t b_length,
276 by Brian Aker
Cleaned out my_bool from strings.
529
                          bool diff_if_only_endspace_difference);
1 by brian
clean slate
530
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
531
int my_wildcmp_mb_bin(const CHARSET_INFO * const cs,
1 by brian
clean slate
532
                      const char *str,const char *str_end,
533
                      const char *wildstr,const char *wildend,
534
                      int escape, int w_one, int w_many);
535
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
536
int my_strcasecmp_mb_bin(const CHARSET_INFO * const  cs __attribute__((unused)),
1 by brian
clean slate
537
                         const char *s, const char *t);
538
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
539
void my_hash_sort_mb_bin(const CHARSET_INFO * const cs __attribute__((unused)),
290 by Brian Aker
Update for ulong change over.
540
                         const uchar *key, size_t len, uint32_t *nr1, uint32_t *nr2);
1 by brian
clean slate
541
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
542
size_t my_strnxfrm_mb(const CHARSET_INFO * const,
1 by brian
clean slate
543
                      uchar *dst, size_t dstlen, uint nweights,
544
                      const uchar *src, size_t srclen, uint flags);
545
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
546
int my_wildcmp_unicode(const CHARSET_INFO * const cs,
1 by brian
clean slate
547
                       const char *str, const char *str_end,
548
                       const char *wildstr, const char *wildend,
549
                       int escape, int w_one, int w_many,
550
                       MY_UNICASE_INFO **weights);
551
276 by Brian Aker
Cleaned out my_bool from strings.
552
extern bool my_parse_charset_xml(const char *bug, size_t len,
1 by brian
clean slate
553
				    int (*add)(CHARSET_INFO *cs));
554
276 by Brian Aker
Cleaned out my_bool from strings.
555
bool my_propagate_simple(const CHARSET_INFO * const cs, const uchar *str, size_t len);
556
bool my_propagate_complex(const CHARSET_INFO * const cs, const uchar *str, size_t len);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
557
558
559
uint my_string_repertoire(const CHARSET_INFO * const cs, const char *str, ulong len);
276 by Brian Aker
Cleaned out my_bool from strings.
560
bool my_charset_is_ascii_based(const CHARSET_INFO * const cs);
561
bool my_charset_is_8bit_pure_ascii(const CHARSET_INFO * const cs);
1 by brian
clean slate
562
563
564
uint my_strxfrm_flag_normalize(uint flags, uint nlevels);
565
void my_strxfrm_desc_and_reverse(uchar *str, uchar *strend,
566
                                 uint flags, uint level);
264.2.6 by Andrey Hristov
Constify the usage of CHARSET_INFO almost to the last place in the code.
567
size_t my_strxfrm_pad_desc_and_reverse(const CHARSET_INFO * const cs,
1 by brian
clean slate
568
                                       uchar *str, uchar *frmend, uchar *strend,
569
                                       uint nweights, uint flags, uint level);
570
276 by Brian Aker
Cleaned out my_bool from strings.
571
bool my_charset_is_ascii_compatible(const CHARSET_INFO * const cs);
1 by brian
clean slate
572
573
#define	_MY_U	01	/* Upper case */
574
#define	_MY_L	02	/* Lower case */
575
#define	_MY_NMR	04	/* Numeral (digit) */
576
#define	_MY_SPC	010	/* Spacing character */
577
#define	_MY_PNT	020	/* Punctuation */
578
#define	_MY_CTR	040	/* Control character */
579
#define	_MY_B	0100	/* Blank */
580
#define	_MY_X	0200	/* heXadecimal digit */
581
582
583
#define	my_isascii(c)	(!((c) & ~0177))
584
#define	my_toascii(c)	((c) & 0177)
585
#define my_tocntrl(c)	((c) & 31)
586
#define my_toprint(c)	((c) | 64)
587
#define my_toupper(s,c)	(char) ((s)->to_upper[(uchar) (c)])
588
#define my_tolower(s,c)	(char) ((s)->to_lower[(uchar) (c)])
589
#define	my_isalpha(s, c)  (((s)->ctype+1)[(uchar) (c)] & (_MY_U | _MY_L))
590
#define	my_isupper(s, c)  (((s)->ctype+1)[(uchar) (c)] & _MY_U)
591
#define	my_islower(s, c)  (((s)->ctype+1)[(uchar) (c)] & _MY_L)
592
#define	my_isdigit(s, c)  (((s)->ctype+1)[(uchar) (c)] & _MY_NMR)
593
#define	my_isxdigit(s, c) (((s)->ctype+1)[(uchar) (c)] & _MY_X)
594
#define	my_isalnum(s, c)  (((s)->ctype+1)[(uchar) (c)] & (_MY_U | _MY_L | _MY_NMR))
595
#define	my_isspace(s, c)  (((s)->ctype+1)[(uchar) (c)] & _MY_SPC)
596
#define	my_ispunct(s, c)  (((s)->ctype+1)[(uchar) (c)] & _MY_PNT)
597
#define	my_isprint(s, c)  (((s)->ctype+1)[(uchar) (c)] & (_MY_PNT | _MY_U | _MY_L | _MY_NMR | _MY_B))
598
#define	my_isgraph(s, c)  (((s)->ctype+1)[(uchar) (c)] & (_MY_PNT | _MY_U | _MY_L | _MY_NMR))
599
#define	my_iscntrl(s, c)  (((s)->ctype+1)[(uchar) (c)] & _MY_CTR)
600
601
/* Some macros that should be cleaned up a little */
602
#define my_isvar(s,c)                 (my_isalnum(s,c) || (c) == '_')
603
#define my_isvar_start(s,c)           (my_isalpha(s,c) || (c) == '_')
604
605
#define my_binary_compare(s)	      ((s)->state  & MY_CS_BINSORT)
606
#define use_strnxfrm(s)               ((s)->state  & MY_CS_STRNXFRM)
607
#define my_strnxfrm(cs, d, dl, s, sl) \
608
   ((cs)->coll->strnxfrm((cs), (d), (dl), (dl), (s), (sl), MY_STRXFRM_PAD_WITH_SPACE))
609
#define my_strnncoll(s, a, b, c, d) ((s)->coll->strnncoll((s), (a), (b), (c), (d), 0))
610
#define my_like_range(s, a, b, c, d, e, f, g, h, i, j) \
611
   ((s)->coll->like_range((s), (a), (b), (c), (d), (e), (f), (g), (h), (i), (j)))
612
#define my_wildcmp(cs,s,se,w,we,e,o,m) ((cs)->coll->wildcmp((cs),(s),(se),(w),(we),(e),(o),(m)))
613
#define my_strcasecmp(s, a, b)        ((s)->coll->strcasecmp((s), (a), (b)))
614
#define my_charpos(cs, b, e, num)     (cs)->cset->charpos((cs), (const char*) (b), (const char *)(e), (num))
615
616
617
#define use_mb(s)                     ((s)->cset->ismbchar != NULL)
618
#define my_ismbchar(s, a, b)          ((s)->cset->ismbchar((s), (a), (b)))
619
#ifdef USE_MB
620
#define my_mbcharlen(s, a)            ((s)->cset->mbcharlen((s),(a)))
621
#else
622
#define my_mbcharlen(s, a)            1
623
#endif
624
625
#define my_caseup_str(s, a)           ((s)->cset->caseup_str((s), (a)))
626
#define my_casedn_str(s, a)           ((s)->cset->casedn_str((s), (a)))
627
#define my_strntol(s, a, b, c, d, e)  ((s)->cset->strntol((s),(a),(b),(c),(d),(e)))
628
#define my_strntoul(s, a, b, c, d, e) ((s)->cset->strntoul((s),(a),(b),(c),(d),(e)))
629
#define my_strntoll(s, a, b, c, d, e) ((s)->cset->strntoll((s),(a),(b),(c),(d),(e)))
630
#define my_strntoull(s, a, b, c,d, e) ((s)->cset->strntoull((s),(a),(b),(c),(d),(e)))
631
#define my_strntod(s, a, b, c, d)     ((s)->cset->strntod((s),(a),(b),(c),(d)))
632
633
634
/* XXX: still need to take care of this one */
635
#ifdef MY_CHARSET_TIS620
636
#error The TIS620 charset is broken at the moment.  Tell tim to fix it.
637
#define USE_TIS620
212.5.19 by Monty Taylor
Coupla small include cleanups.
638
#include <mystrings/t_ctype.h>
1 by brian
clean slate
639
#endif
640
641
#ifdef	__cplusplus
642
}
643
#endif
644
645
#endif /* _m_ctype_h */