1
<?xml version="1.0" encoding="utf-8"?>
6
Copyright (C) 2003 MySQL AB
8
This program is free software; you can redistribute it and/or modify
9
it under the terms of the GNU General Public License as published by
10
the Free Software Foundation; version 2 of the License.
12
This program is distributed in the hope that it will be useful,
13
but WITHOUT ANY WARRANTY; without even the implied warranty of
14
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15
GNU General Public License for more details.
17
You should have received a copy of the GNU General Public License
18
along with this program; if not, write to the Free Software
19
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
23
This file lists all of the available character sets.
24
To make maintenance easier, please:
25
- keep records sorted by collation number.
26
- change charsets.max-id when adding a new collation.
30
<family>Traditional Chinese</family>
31
<description>Big5 Traditional Chinese</description>
33
<alias>bigfive</alias>
34
<alias>big-five</alias>
35
<alias>cn-big5</alias>
37
<collation name="big5_chinese_ci" id="1" order="Chinese">
41
<collation name="big5_bin" id="84" order="Binary">
47
<charset name="latin2">
48
<family>Central European</family>
49
<description>ISO 8859-2 Central European</description>
50
<alias>csisolatin2</alias>
51
<alias>iso-8859-2</alias>
52
<alias>iso-ir-101</alias>
53
<alias>iso_8859-2</alias>
54
<alias>iso_8859-2:1987</alias>
56
<collation name="latin2_czech_cs" id="2" order="Czech" flag="compiled"/>
57
<collation name="latin2_general_ci" id="9" flag="primary">
58
<order>Hungarian</order>
60
<order>Romanian</order>
61
<order>Croatian</order>
63
<order>Slovenian</order>
64
<order>Sorbian</order>
66
<collation name="latin2_hungarian_ci" id="21" order="Hungarian"/>
67
<collation name="latin2_croatian_ci" id="27" order="Croatian"/>
68
<collation name="latin2_bin" id="77" order="Binary" flag="binary"/>
72
<family>Western</family>
73
<description>DEC West European</description>
74
<collation name="dec8_bin" id="69" order="Binary" flag="binary"/>
75
<collation name="dec8_swedish_ci" id="3" flag="primary">
77
<order>English</order>
79
<order>German Duden</order>
80
<order>Italian</order>
82
<order>Portuguese</order>
83
<order>Spanish</order>
87
<charset name="cp850">
88
<family>Western</family>
89
<description>DOS West European</description>
91
<alias>cspc850multilingual</alias>
93
<collation name="cp850_general_ci" id="4" flag="primary">
95
<order>English</order>
97
<order>German Duden</order>
98
<order>Italian</order>
100
<order>Portuguese</order>
101
<order>Spanish</order>
103
<collation name="cp850_bin" id="80" order="Binary" flag="binary"/>
106
<charset name="latin1">
107
<family>Western</family>
108
<description>cp1252 West European</description>
109
<alias>csisolatin1</alias>
110
<alias>iso-8859-1</alias>
111
<alias>iso-ir-100</alias>
112
<alias>iso_8859-1</alias>
113
<alias>iso_8859-1:1987</alias>
115
<alias>latin1</alias>
116
<collation name="latin1_german1_ci" id="5" order="German Duden"/>
117
<collation name="latin1_swedish_ci" id="8" order="Finnish, Swedish">
119
<flag>compiled</flag>
121
<collation name="latin1_danish_ci" id="15" order="Danish"/>
122
<collation name="latin1_german2_ci" id="31" order="German Phonebook" flag="compiled"/>
123
<collation name="latin1_spanish_ci" id="94" order="Spanish"/>
124
<collation name="latin1_bin" id="47" order="Binary">
126
<flag>compiled</flag>
128
<collation name="latin1_general_ci" id="48">
130
<order>English</order>
131
<order>French</order>
132
<order>German Duden</order>
133
<order>Italian</order>
135
<order>Portuguese</order>
136
<order>Spanish</order>
138
<collation name="latin1_general_cs" id="49">
140
<order>English</order>
141
<order>French</order>
142
<order>German Duden</order>
143
<order>Italian</order>
145
<order>Portuguese</order>
146
<order>Spanish</order>
151
<family>Western</family>
152
<description>HP West European</description>
153
<alias>hproman8</alias>
154
<collation name="hp8_bin" id="72" order="Binary" flag="binary"/>
155
<collation name="hp8_english_ci" id="6" flag="primary">
157
<order>English</order>
158
<order>French</order>
159
<order>German Duden</order>
160
<order>Italian</order>
162
<order>Portuguese</order>
163
<order>Spanish</order>
167
<charset name="koi8r">
168
<family>Cyrillic</family>
169
<description>KOI8-R Relcom Russian</description>
170
<alias>koi8-r</alias>
171
<alias>cskoi8r</alias>
172
<collation name="koi8r_general_ci" id="7" order="Russian" flag="primary"/>
173
<collation name="koi8r_bin" id="74" order="Binary" flag="binary"/>
176
<charset name="swe7">
177
<family>Western</family>
178
<description>7bit Swedish</description>
179
<alias>iso-646-se</alias>
180
<collation name="swe7_swedish_ci" id="10" order="Swedish" flag="primary"/>
181
<collation name="swe7_bin" id="82" order="Binary" flag="binary"/>
184
<charset name="ascii">
185
<family>Western</family>
186
<description>US ASCII</description>
188
<alias>us-ascii</alias>
189
<alias>csascii</alias>
190
<alias>iso-ir-6</alias>
191
<alias>iso646-us</alias>
192
<collation name="ascii_general_ci" id="11" order="English" flag="primary"/>
193
<collation name="ascii_bin" id="65" order="Binary" flag="binary"/>
196
<charset name="ujis">
197
<family>Japanese</family>
198
<description>EUC-JP Japanese</description>
199
<alias>euc-jp</alias>
200
<collation name="ujis_japanese_ci" id="12" order="Japanese">
202
<flag>compiled</flag>
204
<collation name="ujis_bin" id="91" order="Binary">
206
<flag>compiled</flag>
210
<charset name="sjis">
211
<family>Japanese</family>
212
<description>Shift-JIS Japanese</description>
214
<alias>shift-jis</alias>
215
<alias>x-sjis</alias>
216
<collation name="sjis_japanese_ci" id="13" order="Japanese">
218
<flag>compiled</flag>
220
<collation name="sjis_bin" id="88" order="Binary">
222
<flag>compiled</flag>
226
<charset name="cp1251">
227
<family>Cyrillic</family>
228
<description>Windows Cyrillic</description>
229
<alias>windows-1251</alias>
230
<alias>ms-cyr</alias>
231
<alias>ms-cyrillic</alias>
232
<collation name="cp1251_bulgarian_ci" id="14">
233
<order>Belarusian</order>
234
<order>Bulgarian</order>
235
<order>Macedonian</order>
236
<order>Russian</order>
237
<order>Serbian</order>
238
<order>Mongolian</order>
239
<order>Ukrainian</order>
241
<collation name="cp1251_ukrainian_ci" id="23" order="Ukrainian"/>
242
<collation name="cp1251_bin" id="50" order="Binary" flag="binary"/>
243
<collation name="cp1251_general_ci" id="51" flag="primary">
244
<order>Belarusian</order>
245
<order>Bulgarian</order>
246
<order>Macedonian</order>
247
<order>Russian</order>
248
<order>Serbian</order>
249
<order>Mongolian</order>
250
<order>Ukrainian</order>
252
<collation name="cp1251_general_cs" id="52">
253
<order>Belarusian</order>
254
<order>Bulgarian</order>
255
<order>Macedonian</order>
256
<order>Russian</order>
257
<order>Serbian</order>
258
<order>Mongolian</order>
259
<order>Ukrainian</order>
263
<charset name="hebrew">
264
<family>Hebrew</family>
265
<description>ISO 8859-8 Hebrew</description>
266
<alias>csisolatinhebrew</alias>
267
<alias>iso-8859-8</alias>
268
<alias>iso-ir-138</alias>
269
<collation name="hebrew_general_ci" id="16" order="Hebrew" flag="primary"/>
270
<collation name="hebrew_bin" id="71" order="Binary" flag="binary"/>
273
<charset name="tis620">
274
<family>Thai</family>
275
<description>TIS620 Thai</description>
276
<alias>tis-620</alias>
277
<collation name="tis620_thai_ci" id="18" order="Thai">
279
<flag>compiled</flag>
281
<collation name="tis620_bin" id="89" order="Binary">
283
<flag>compiled</flag>
287
<charset name="euckr">
288
<family>Korean</family>
289
<description>EUC-KR Korean</description>
290
<alias>euc_kr</alias>
291
<alias>euc-kr</alias>
292
<collation name="euckr_korean_ci" id="19" order="Korean">
294
<flag>compiled</flag>
296
<collation name="euckr_bin" id="85">
298
<flag>compiled</flag>
302
<charset name="latin7">
303
<family>Baltic</family>
304
<description>ISO 8859-13 Baltic</description>
305
<alias>BalticRim</alias>
306
<alias>iso-8859-13</alias>
308
<collation name="latin7_estonian_cs" id="20">
309
<order>Estonian</order>
311
<collation name="latin7_general_ci" id="41">
312
<order>Latvian</order>
313
<order>Lithuanian</order>
316
<collation name="latin7_general_cs" id="42">
317
<order>Latvian</order>
318
<order>Lithuanian</order>
320
<collation name="latin7_bin" id="79" order="Binary" flag="binary"/>
323
<charset name="koi8u">
324
<family>Cyrillic</family>
325
<description>KOI8-U Ukrainian</description>
326
<alias>koi8-u</alias>
327
<collation name="koi8u_general_ci" id="22" order="Ukrainian" flag="primary"/>
328
<collation name="koi8u_bin" id="75" order="Binary" flag="binary"/>
331
<charset name="gb2312">
332
<family>Simplified Chinese</family>
333
<description>GB2312 Simplified Chinese</description>
334
<alias>chinese</alias>
335
<alias>iso-ir-58</alias>
336
<collation name="gb2312_chinese_ci" id="24" order="Chinese">
338
<flag>compiled</flag>
340
<collation name="gb2312_bin" id="86">
342
<flag>compiled</flag>
346
<charset name="greek">
347
<family>Greek</family>
348
<description>ISO 8859-7 Greek</description>
349
<alias>csisolatingreek</alias>
350
<alias>ecma-118</alias>
351
<alias>greek8</alias>
352
<alias>iso-8859-7</alias>
353
<alias>iso-ir-126</alias>
354
<collation name="greek_general_ci" id="25" order="Greek" flag="primary"/>
355
<collation name="greek_bin" id="70" order="Binary" flag="binary"/>
358
<charset name="cp1250">
359
<family>Central European</family>
360
<description>Windows Central European</description>
362
<alias>windows-1250</alias>
363
<collation name="cp1250_general_ci" id="26" flag="primary">
364
<order>Hungarian</order>
365
<order>Polish</order>
366
<order>Romanian</order>
367
<order>Croatian</order>
368
<order>Slovak</order>
369
<order>Slovenian</order>
370
<order>Sorbian</order>
372
<collation name="cp1250_croatian_ci" id="44">
373
<order>Croatian</order>
375
<collation name="cp1250_czech_cs" id="34" order="Czech">
376
<flag>compiled</flag>
378
<collation name="cp1250_bin" id="66" order="Binary" flag="binary"/>
382
<family>Simplified Chinese</family>
383
<description>GBK Simplified Chinese</description>
385
<collation name="gbk_chinese_ci" id="28" order="Chinese">
387
<flag>compiled</flag>
389
<collation name="gbk_bin" id="87" order="Binary">
391
<flag>compiled</flag>
395
<charset name="cp1257">
396
<family>Baltic</family>
397
<description>Windows Baltic</description>
398
<alias>WinBaltRim</alias>
399
<alias>windows-1257</alias>
400
<collation name="cp1257_lithuanian_ci" id="29" order="Lithuanian"/>
401
<collation name="cp1257_bin" id="58" order="Binary" flag="binary"/>
402
<collation name="cp1257_general_ci" id="59" flag="primary">
403
<order>Latvian</order>
404
<order>Lithuanian</order>
406
<!--collation name="cp1257_ci" id="60"/-->
407
<!--collation name="cp1257_cs" id="61"/-->
410
<charset name="latin5">
411
<family>South Asian</family>
412
<description>ISO 8859-9 Turkish</description>
413
<alias>csisolatin5</alias>
414
<alias>iso-8859-9</alias>
415
<alias>iso-ir-148</alias>
417
<alias>latin5</alias>
418
<alias>turkish</alias>
419
<collation name="latin5_turkish_ci" id="30" order="Turkish" flag="primary"/>
420
<collation name="latin5_bin" id="78" order="Binary" flag="binary"/>
423
<charset name="armscii8">
424
<family>South Asian</family>
425
<description>ARMSCII-8 Armenian</description>
426
<alias>armscii-8</alias>
427
<collation name="armscii8_general_ci" id="32" order="Armenian" flag="primary"/>
428
<collation name="armscii8_bin" id="64" order="Binary" flag="binary"/>
431
<charset name="utf8">
432
<family>Unicode</family>
433
<description>UTF-8 Unicode</description>
435
<collation name="utf8_general_ci" id="33">
437
<flag>compiled</flag>
439
<collation name="utf8_bin" id="83">
441
<flag>compiled</flag>
445
<charset name="ucs2">
446
<family>Unicode</family>
447
<description>UCS-2 Unicode</description>
448
<collation name="ucs2_general_ci" id="35">
450
<flag>compiled</flag>
452
<collation name="ucs2_bin" id="90">
454
<flag>compiled</flag>
458
<charset name="cp866">
459
<family>Cyrillic</family>
460
<description>DOS Russian</description>
462
<alias>csibm866</alias>
463
<alias>ibm866</alias>
464
<alias>DOSCyrillicRussian</alias>
465
<collation name="cp866_general_ci" id="36" order="Russian" flag="primary"/>
466
<collation name="cp866_bin" id="68" order="Binary" flag="binary"/>
469
<charset name="keybcs2">
470
<family>Central European</family>
471
<description>DOS Kamenicky Czech-Slovak</description>
472
<collation name="keybcs2_general_ci" id="37" order="Czech" flag="primary"/>
473
<collation name="keybcs2_bin" id="73" order="Binary" flag="binary"/>
476
<charset name="macce">
477
<family>Central European</family>
478
<description>Mac Central European</description>
479
<alias>MacCentralEurope</alias>
480
<collation name="macce_general_ci" id="38" flag="primary">
481
<order>Hungarian</order>
482
<order>Polish</order>
483
<order>Romanian</order>
484
<order>Croatian</order>
485
<order>Slovak</order>
486
<order>Slovenian</order>
487
<order>Sorbian</order>
489
<collation name="macce_bin" id="43" order="Binary" flag="binary"/>
492
<charset name="macroman">
493
<family>Western</family>
494
<description>Mac West European</description>
496
<alias>Macintosh</alias>
497
<alias>csmacintosh</alias>
498
<collation name="macroman_general_ci" id="39" flag="primary">
500
<order>English</order>
501
<order>French</order>
502
<order>German Duden</order>
503
<order>Italian</order>
505
<order>Portuguese</order>
506
<order>Spanish</order>
508
<collation name="macroman_bin" id="53" order="Binary" flag="binary"/>
509
<!--collation name="macroman_ci" id="54"/-->
510
<!--collation name="macroman_ci_ai" id="55"/-->
511
<!--collation name="macroman_cs" id="56"/-->
514
<charset name="cp852">
515
<family>Central European</family>
516
<description>DOS Central European</description>
519
<alias>ibm852</alias>
520
<collation name="cp852_general_ci" id="40" flag="primary">
521
<order>Hungarian</order>
522
<order>Polish</order>
523
<order>Romanian</order>
524
<order>Croatian</order>
525
<order>Slovak</order>
526
<order>Slovenian</order>
527
<order>Sorbian</order>
529
<collation name="cp852_bin" id="81" order="Binary" flag="binary"/>
532
<charset name="cp1256">
533
<family>Arabic</family>
534
<description>Windows Arabic</description>
535
<alias>ms-arab</alias>
536
<alias>windows-1256</alias>
537
<collation name="cp1256_bin" id="67" order="Binary" flag="binary"/>
538
<collation name="cp1256_general_ci" id="57" flag="primary">
539
<order>Arabic</order>
540
<order>Persian</order>
541
<order>Pakistani</order>
546
<charset name="geostd8">
547
<family>South Asian</family>
548
<description>GEOSTD8 Georgian</description>
549
<collation name="geostd8_general_ci" id="92" order="Georgian" flag="primary"/>
550
<collation name="geostd8_bin" id="93" order="Binary" flag="binary"/>
553
<charset name="binary">
554
<description>Binary pseudo charset</description>
555
<collation name="binary" id="63" order="Binary">
557
<flag>compiled</flag>
561
<charset name="cp932">
562
<family>Japanese</family>
563
<description>SJIS for Windows Japanese</description>
564
<alias>ms_cp932</alias>
565
<alias>sjis_cp932</alias>
566
<alias>sjis_ms</alias>
567
<collation name="cp932_japanese_ci" id="95" order="Japanese">
569
<flag>compiled</flag>
571
<collation name="cp932_bin" id="96" order="Binary">
573
<flag>compiled</flag>
577
<charset name="eucjpms">
578
<family>Japanese</family>
579
<description>UJIS for Windows Japanese</description>
580
<alias>eucjpms</alias>
581
<alias>eucJP_ms</alias>
582
<alias>ujis_ms</alias>
583
<alias>ujis_cp932</alias>
584
<collation name="eucjpms_japanese_ci" id="97" order="Japanese">
586
<flag>compiled</flag>
588
<collation name="eucjpms_bin" id="98" order="Binary">
590
<flag>compiled</flag>