1
<?xml version='1.0' encoding="utf-8"?>
6
Copyright (C) 2003 MySQL AB
8
This program is free software; you can redistribute it and/or modify
9
it under the terms of the GNU General Public License as published by
10
the Free Software Foundation; version 2 of the License.
12
This program is distributed in the hope that it will be useful,
13
but WITHOUT ANY WARRANTY; without even the implied warranty of
14
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15
GNU General Public License for more details.
17
You should have received a copy of the GNU General Public License
18
along with this program; if not, write to the Free Software
19
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23
This file lists all of the available character sets.
24
To make maintenance easier, please:
25
- keep records sorted by collation number.
26
- change charsets.max-id when adding a new collation.
30
<family>Traditional Chinese</family>
31
<description>Big5 Traditional Chinese</description>
33
<alias>bigfive</alias>
34
<alias>big-five</alias>
35
<alias>cn-big5</alias>
37
<collation name="big5_chinese_ci" id="1" order="Chinese">
41
<collation name="big5_bin" id="84" order="Binary">
47
<charset name="latin2">
48
<family>Central European</family>
49
<description>ISO 8859-2 Central European</description>
50
<alias>csisolatin2</alias>
51
<alias>iso-8859-2</alias>
52
<alias>iso-ir-101</alias>
53
<alias>iso_8859-2</alias>
54
<alias>iso_8859-2:1987</alias>
56
<collation name="latin2_czech_cs" id="2" order="Czech" flag="compiled"/>
57
<collation name="latin2_general_ci" id="9" flag="primary">
58
<order>Hungarian</order>
60
<order>Romanian</order>
61
<order>Croatian</order>
63
<order>Slovenian</order>
64
<order>Sorbian</order>
66
<collation name="latin2_hungarian_ci" id="21" order="Hungarian"/>
67
<collation name="latin2_croatian_ci" id="27" order="Croatian"/>
68
<collation name="latin2_bin" id="77" order="Binary" flag="binary"/>
72
<family>Western</family>
73
<description>DEC West European</description>
74
<collation name="dec8_bin" id="69" order="Binary" flag="binary"/>
75
<collation name="dec8_swedish_ci" id="3" flag="primary">
77
<order>English</order>
79
<order>German Duden</order>
80
<order>Italian</order>
82
<order>Portuguese</order>
83
<order>Spanish</order>
87
<charset name="cp850">
88
<family>Western</family>
89
<description>DOS West European</description>
91
<alias>cspc850multilingual</alias>
93
<collation name="cp850_general_ci" id="4" flag="primary">
95
<order>English</order>
97
<order>German Duden</order>
98
<order>Italian</order>
100
<order>Portuguese</order>
101
<order>Spanish</order>
103
<collation name="cp850_bin" id="80" order="Binary" flag="binary"/>
106
<charset name="latin1">
107
<family>Western</family>
108
<description>cp1252 West European</description>
109
<alias>csisolatin1</alias>
110
<alias>iso-8859-1</alias>
111
<alias>iso-ir-100</alias>
112
<alias>iso_8859-1</alias>
113
<alias>iso_8859-1:1987</alias>
115
<alias>latin1</alias>
116
<collation name="latin1_german1_ci" id="5" order="German Duden"/>
117
<collation name="latin1_swedish_ci" id="8" order="Finnish, Swedish">
119
<flag>compiled</flag>
121
<collation name="latin1_danish_ci" id="15" order="Danish"/>
122
<collation name="latin1_german2_ci" id="31" order="German Phonebook" flag="compiled"/>
123
<collation name="latin1_spanish_ci" id="94" order="Spanish"/>
124
<collation name="latin1_bin" id="47" order="Binary">
126
<flag>compiled</flag>
128
<collation name="latin1_general_ci" id="48">
130
<order>English</order>
131
<order>French</order>
132
<order>German Duden</order>
133
<order>Italian</order>
135
<order>Portuguese</order>
136
<order>Spanish</order>
138
<collation name="latin1_general_cs" id="49">
140
<order>English</order>
141
<order>French</order>
142
<order>German Duden</order>
143
<order>Italian</order>
145
<order>Portuguese</order>
146
<order>Spanish</order>
151
<family>Western</family>
152
<description>HP West European</description>
153
<alias>hproman8</alias>
154
<collation name="hp8_bin" id="72" order="Binary" flag="binary"/>
155
<collation name="hp8_english_ci" id="6" flag="primary">
157
<order>English</order>
158
<order>French</order>
159
<order>German Duden</order>
160
<order>Italian</order>
162
<order>Portuguese</order>
163
<order>Spanish</order>
167
<charset name="koi8r">
168
<family>Cyrillic</family>
169
<description>KOI8-R Relcom Russian</description>
170
<alias>koi8-r</alias>
171
<alias>cskoi8r</alias>
172
<collation name="koi8r_general_ci" id="7" order="Russian" flag="primary"/>
173
<collation name="koi8r_bin" id="74" order="Binary" flag="binary"/>
176
<charset name="swe7">
177
<family>Western</family>
178
<description>7bit Swedish</description>
179
<alias>iso-646-se</alias>
180
<collation name="swe7_swedish_ci" id="10" order="Swedish" flag="primary"/>
181
<collation name="swe7_bin" id="82" order="Binary" flag="binary"/>
184
<charset name="ascii">
185
<family>Western</family>
186
<description>US ASCII</description>
188
<alias>us-ascii</alias>
189
<alias>csascii</alias>
190
<alias>iso-ir-6</alias>
191
<alias>iso646-us</alias>
192
<collation name="ascii_general_ci" id="11" order="English" flag="primary"/>
193
<collation name="ascii_bin" id="65" order="Binary" flag="binary"/>
196
<charset name="ujis">
197
<family>Japanese</family>
198
<description>EUC-JP Japanese</description>
199
<alias>euc-jp</alias>
200
<collation name="ujis_japanese_ci" id="12" order="Japanese">
202
<flag>compiled</flag>
204
<collation name="ujis_bin" id="91" order="Binary">
206
<flag>compiled</flag>
210
<charset name="sjis">
211
<family>Japanese</family>
212
<description>Shift-JIS Japanese</description>
214
<alias>shift-jis</alias>
215
<alias>x-sjis</alias>
216
<collation name="sjis_japanese_ci" id="13" order="Japanese">
218
<flag>compiled</flag>
220
<collation name="sjis_bin" id="88" order="Binary">
222
<flag>compiled</flag>
226
<charset name="cp1251">
227
<family>Cyrillic</family>
228
<description>Windows Cyrillic</description>
229
<alias>windows-1251</alias>
230
<alias>ms-cyr</alias>
231
<alias>ms-cyrillic</alias>
232
<collation name="cp1251_bulgarian_ci" id="14">
233
<order>Belarusian</order>
234
<order>Bulgarian</order>
235
<order>Macedonian</order>
236
<order>Russian</order>
237
<order>Serbian</order>
238
<order>Mongolian</order>
239
<order>Ukrainian</order>
241
<collation name="cp1251_ukrainian_ci" id="23" order="Ukrainian"/>
242
<collation name="cp1251_bin" id="50" order="Binary" flag="binary"/>
243
<collation name="cp1251_general_ci" id="51" flag="primary">
244
<order>Belarusian</order>
245
<order>Bulgarian</order>
246
<order>Macedonian</order>
247
<order>Russian</order>
248
<order>Serbian</order>
249
<order>Mongolian</order>
250
<order>Ukrainian</order>
252
<collation name="cp1251_general_cs" id="52">
253
<order>Belarusian</order>
254
<order>Bulgarian</order>
255
<order>Macedonian</order>
256
<order>Russian</order>
257
<order>Serbian</order>
258
<order>Mongolian</order>
259
<order>Ukrainian</order>
263
<charset name="hebrew">
264
<family>Hebrew</family>
265
<description>ISO 8859-8 Hebrew</description>
266
<alias>csisolatinhebrew</alias>
267
<alias>iso-8859-8</alias>
268
<alias>iso-ir-138</alias>
269
<collation name="hebrew_general_ci" id="16" order="Hebrew" flag="primary"/>
270
<collation name="hebrew_bin" id="71" order="Binary" flag="binary"/>
273
<charset name="tis620">
274
<family>Thai</family>
275
<description>TIS620 Thai</description>
276
<alias>tis-620</alias>
277
<collation name="tis620_thai_ci" id="18" order="Thai">
279
<flag>compiled</flag>
281
<collation name="tis620_bin" id="89" order="Binary">
283
<flag>compiled</flag>
287
<charset name="euckr">
288
<family>Korean</family>
289
<description>EUC-KR Korean</description>
290
<alias>euc_kr</alias>
291
<alias>euc-kr</alias>
292
<collation name="euckr_korean_ci" id="19" order="Korean">
294
<flag>compiled</flag>
296
<collation name="euckr_bin" id="85">
298
<flag>compiled</flag>
302
<charset name="latin7">
303
<family>Baltic</family>
304
<description>ISO 8859-13 Baltic</description>
305
<alias>BalticRim</alias>
306
<alias>iso-8859-13</alias>
308
<collation name="latin7_estonian_cs" id="20">
309
<order>Estonian</order>
311
<collation name="latin7_general_ci" id="41">
312
<order>Latvian</order>
313
<order>Lithuanian</order>
316
<collation name="latin7_general_cs" id="42">
317
<order>Latvian</order>
318
<order>Lithuanian</order>
320
<collation name="latin7_bin" id="79" order="Binary" flag="binary"/>
323
<charset name="koi8u">
324
<family>Cyrillic</family>
325
<description>KOI8-U Ukrainian</description>
326
<alias>koi8-u</alias>
327
<collation name="koi8u_general_ci" id="22" order="Ukrainian" flag="primary"/>
328
<collation name="koi8u_bin" id="75" order="Binary" flag="binary"/>
331
<charset name="gb2312">
332
<family>Simplified Chinese</family>
333
<description>GB2312 Simplified Chinese</description>
334
<alias>chinese</alias>
335
<alias>iso-ir-58</alias>
336
<collation name="gb2312_chinese_ci" id="24" order="Chinese">
338
<flag>compiled</flag>
340
<collation name="gb2312_bin" id="86">
342
<flag>compiled</flag>
346
<charset name="greek">
347
<family>Greek</family>
348
<description>ISO 8859-7 Greek</description>
349
<alias>csisolatingreek</alias>
350
<alias>ecma-118</alias>
351
<alias>greek8</alias>
352
<alias>iso-8859-7</alias>
353
<alias>iso-ir-126</alias>
354
<collation name="greek_general_ci" id="25" order="Greek" flag="primary"/>
355
<collation name="greek_bin" id="70" order="Binary" flag="binary"/>
358
<charset name="cp1250">
359
<family>Central European</family>
360
<description>Windows Central European</description>
362
<alias>windows-1250</alias>
363
<collation name="cp1250_general_ci" id="26" flag="primary">
364
<order>Hungarian</order>
365
<order>Polish</order>
366
<order>Romanian</order>
367
<order>Croatian</order>
368
<order>Slovak</order>
369
<order>Slovenian</order>
370
<order>Sorbian</order>
372
<collation name="cp1250_croatian_ci" id="44">
373
<order>Croatian</order>
375
<collation name="cp1250_polish_ci" id="99">
376
<order>Polish</order>
378
<collation name="cp1250_czech_cs" id="34" order="Czech">
379
<flag>compiled</flag>
381
<collation name="cp1250_bin" id="66" order="Binary" flag="binary"/>
385
<family>East Asian</family>
386
<description>GBK Simplified Chinese</description>
388
<collation name="gbk_chinese_ci" id="28" order="Chinese">
390
<flag>compiled</flag>
392
<collation name="gbk_bin" id="87" order="Binary">
394
<flag>compiled</flag>
398
<charset name="cp1257">
399
<family>Baltic</family>
400
<description>Windows Baltic</description>
401
<alias>WinBaltRim</alias>
402
<alias>windows-1257</alias>
403
<collation name="cp1257_lithuanian_ci" id="29" order="Lithuanian"/>
404
<collation name="cp1257_bin" id="58" order="Binary" flag="binary"/>
405
<collation name="cp1257_general_ci" id="59" flag="primary">
406
<order>Latvian</order>
407
<order>Lithuanian</order>
409
<!--collation name="cp1257_ci" id="60"/-->
410
<!--collation name="cp1257_cs" id="61"/-->
413
<charset name="latin5">
414
<family>South Asian</family>
415
<description>ISO 8859-9 Turkish</description>
416
<alias>csisolatin5</alias>
417
<alias>iso-8859-9</alias>
418
<alias>iso-ir-148</alias>
420
<alias>latin5</alias>
421
<alias>turkish</alias>
422
<collation name="latin5_turkish_ci" id="30" order="Turkish" flag="primary"/>
423
<collation name="latin5_bin" id="78" order="Binary" flag="binary"/>
426
<charset name="armscii8">
427
<family>South Asian</family>
428
<description>ARMSCII-8 Armenian</description>
429
<alias>armscii-8</alias>
430
<collation name="armscii8_general_ci" id="32" order="Armenian" flag="primary"/>
431
<collation name="armscii8_bin" id="64" order="Binary" flag="binary"/>
434
<charset name="utf8">
435
<family>Unicode</family>
436
<description>UTF-8 Unicode</description>
438
<collation name="utf8_general_ci" id="33">
440
<flag>compiled</flag>
442
<collation name="utf8_bin" id="83">
444
<flag>compiled</flag>
448
<charset name="ucs2">
449
<family>Unicode</family>
450
<description>UCS-2 Unicode</description>
451
<collation name="ucs2_general_ci" id="35">
453
<flag>compiled</flag>
455
<collation name="ucs2_bin" id="90">
457
<flag>compiled</flag>
461
<charset name="cp866">
462
<family>Cyrillic</family>
463
<description>DOS Russian</description>
465
<alias>csibm866</alias>
466
<alias>ibm866</alias>
467
<alias>DOSCyrillicRussian</alias>
468
<collation name="cp866_general_ci" id="36" order="Russian" flag="primary"/>
469
<collation name="cp866_bin" id="68" order="Binary" flag="binary"/>
472
<charset name="keybcs2">
473
<family>Central European</family>
474
<description>DOS Kamenicky Czech-Slovak</description>
475
<collation name="keybcs2_general_ci" id="37" order="Czech" flag="primary"/>
476
<collation name="keybcs2_bin" id="73" order="Binary" flag="binary"/>
479
<charset name="macce">
480
<family>Central European</family>
481
<description>Mac Central European</description>
482
<alias>MacCentralEurope</alias>
483
<collation name="macce_general_ci" id="38" flag="primary">
484
<order>Hungarian</order>
485
<order>Polish</order>
486
<order>Romanian</order>
487
<order>Croatian</order>
488
<order>Slovak</order>
489
<order>Slovenian</order>
490
<order>Sorbian</order>
492
<collation name="macce_bin" id="43" order="Binary" flag="binary"/>
495
<charset name="macroman">
496
<family>Western</family>
497
<description>Mac West European</description>
499
<alias>Macintosh</alias>
500
<alias>csmacintosh</alias>
501
<collation name="macroman_general_ci" id="39" flag="primary">
503
<order>English</order>
504
<order>French</order>
505
<order>German Duden</order>
506
<order>Italian</order>
508
<order>Portuguese</order>
509
<order>Spanish</order>
511
<collation name="macroman_bin" id="53" order="Binary" flag="binary"/>
512
<!--collation name="macroman_ci" id="54"/-->
513
<!--collation name="macroman_ci_ai" id="55"/-->
514
<!--collation name="macroman_cs" id="56"/-->
517
<charset name="cp852">
518
<family>Central European</family>
519
<description>DOS Central European</description>
522
<alias>ibm852</alias>
523
<collation name="cp852_general_ci" id="40" flag="primary">
524
<order>Hungarian</order>
525
<order>Polish</order>
526
<order>Romanian</order>
527
<order>Croatian</order>
528
<order>Slovak</order>
529
<order>Slovenian</order>
530
<order>Sorbian</order>
532
<collation name="cp852_bin" id="81" order="Binary" flag="binary"/>
535
<charset name="cp1256">
536
<family>Arabic</family>
537
<description>Windows Arabic</description>
538
<alias>ms-arab</alias>
539
<alias>windows-1256</alias>
540
<collation name="cp1256_bin" id="67" order="Binary" flag="binary"/>
541
<collation name="cp1256_general_ci" id="57" order="Arabic" flag="primary">
542
<order>Arabic</order>
543
<order>Persian</order>
544
<order>Pakistani</order>
549
<charset name="geostd8">
550
<family>South Asian</family>
551
<description>GEOSTD8 Georgian</description>
552
<collation name="geostd8_general_ci" id="92" order="Georgian" flag="primary"/>
553
<collation name="geostd8_bin" id="93" order="Binary" flag="binary"/>
556
<charset name="binary">
557
<description>Binary pseudo charset</description>
558
<collation name="binary" id="63" order="Binary">
560
<flag>compiled</flag>
564
<charset name="cp932">
565
<family>Japanese</family>
566
<description>SJIS for Windows Japanese</description>
567
<alias>ms_cp932</alias>
568
<alias>sjis_cp932</alias>
569
<alias>sjis_ms</alias>
570
<collation name="cp932_japanese_ci" id="95" order="Japanese">
572
<flag>compiled</flag>
574
<collation name="cp932_bin" id="96" order="Binary">
576
<flag>compiled</flag>
580
<charset name="eucjpms">
581
<family>Japanese</family>
582
<description>UJIS for Windows Japanese</description>
583
<alias>eucjpms</alias>
584
<alias>eucJP_ms</alias>
585
<alias>ujis_ms</alias>
586
<alias>ujis_cp932</alias>
587
<collation name="eucjpms_japanese_ci" id="97" order="Japanese">
589
<flag>compiled</flag>
591
<collation name="eucjpms_bin" id="98" order="Binary">
593
<flag>compiled</flag>