/
MAIN.TXT
2427 lines (2282 loc) · 125 KB
/
MAIN.TXT
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
#
# Fully supported code pages (92 code pages):
#
# 113 - Yugoslavian, Latin
# 437 - United States
# 667 - Polish, Mazovia encoding
# 668 - Polish, 852 compatible
# 737 - Greek-2
# 770 - Baltic
# 771 - Lithuanian and Russian, Cyrillic, KBL encoding
# 772 - duplicate of 1119
# 773 - Latin-7 (Baltic, old standard)
# 774 - duplicate of 1118
# 775 - Latin-7 (Baltic)
# 777 - Lithuanian, Accented (old)
# 778 - Lithuanian, Accented
# 790 - duplicate of 667
# 808 - Russian, Cyrillic, with EUR
# 848 - Ukrainian, Cyrillic, with EUR
# 849 - Belarusian, Cyrillic, with EUR
# 850 - Latin-1 (Western European)
# 851 - Greek, old encoding
# 852 - Latin-2 (Central European), with EUR
# 853 - Latin-3 (Turkish, Maltese, and Esperanto)
# 855 - South Slavic, Cyrillic
# 856 - Hebrew-2, with EUR
# 857 - Latin-5, with EUR
# 858 - Latin-1 (Western European), with EUR
# 859 - Latin-9 (Western European), with EUR
# 860 - Portuguese
# 861 - Icelandic
# 862 - Hebrew-2
# 863 - Canadian French
# 865 - Nordic
# 866 - Russian, Cyrillic
# 867 - Czech and Slovak, Kamenicky encoding
# 869 - Greek, with EUR
# 872 - South Slavic, Cyrillic, with EUR
# 895 - duplicate of 867
# 899 - Armenian, ArmSCII-8A encoding
# 991 - Polish, Mazovia encoding, with PLN (*)
# 1116 - Estonian
# 1117 - Latvian
# 1118 - Lithuanian, LST 1283 encoding
# 1119 - Lithuanian and Russian, Cyrillic, LST 1284 encoding
# 1125 - Ukrainian, Cyrillic
# 1131 - Belarusian, Cyrillic
# 3012 - Latvian and Russian, Cyrillic, RusLat encoding
# 3021 - Bulgarian, Cyrillic, MIK encoding
# 3845 - Hungarian, CWI-2 encoding
# 3846 - Turkish
# 3848 - Brazilian, ABICOMP encoding
# 30000 - Saami (NOTE: this is neither Windows 1270 code page, nor ISO-IR-197 encoding)
# 30001 - Celtic, with EUR
# 30002 - Tajik, Cyrillic, with EUR
# 30003 - Latin American, with EUR
# 30004 - Greenlandic, with EUR
# 30005 - Nigerian, with EUR
# 30006 - Vietnamese Latin
# 30007 - Latin, with EUR (**)
# 30008 - Abkhaz and Ossetian, Cyrillic, with EUR
# 30009 - Romani, with EUR
# 30010 - Gagauz and Moldovan, Cyrillic, with EUR
# 30011 - Russian Southern (Kalmyk, Karachay-Balkar, Ossetian, North Caucasian), Cyrillic, with EUR
# 30012 - Siberian (Altai, Buryat, Khakas, Tuvan, Yakut, Tungusic, Paleo-Siberian), Cyrillic, with EUR
# 30013 - Turkic (Bashkir, Chuvash, Tatar), Cyrillic, with EUR
# 30014 - Finno-ugric (Mari, Udmurt), Cyrillic, with EUR
# 30015 - Khanty, Cyrillic, with EUR
# 30016 - Mansi, Cyrillic, with EUR
# 30017 - Russian Northwestern (Cyrillic Nenets, Latin Karelian, Latin Veps), with EUR
# 30018 - Russian Cyrillic and Latin Tatar, with EUR
# 30019 - Russian Cyrillic and Latin Chechen, with EUR (*)
# 30020 - Low Saxon and Frisian, with EUR
# 30021 - Oceania, with EUR
# 30022 - Canadian First Nations, with EUR
# 30023 - Southern Africa, with EUR
# 30024 - Northern and Eastern Africa, with EUR
# 30025 - Western Africa, with EUR (*)
# 30026 - Central Africa, with EUR
# 30027 - Beninese, with EUR
# 30028 - Nigerien, with EUR
# 30029 - Mexican, with EUR
# 30030 - Mexican-2, with EUR
# 30031 - Latin-4 (Northern European), with EUR (NOTE: this is not an ISO 8859-4 encoding)
# 30032 - Latin-6, with EUR (NOTE: it seems there is no keyboard layout for this one)
# 30033 - Crimean Tatar, with UAH
# 30034 - Cherokee
# 30039 - Ukrainian, Cyrillic, with UAH
# 30040 - Russian, Cyrillic, with UAH
# 58152 - Kazakh, Cyrillic, with EUR (NOTE: this is neither Windows 1251 code page, nor KZ-1048 encoding)
# 58210 - Azeri and Russian, Cyrillic
# 58335 - Kashubian and Polish, Mazovia based, with PLN (*)
# 59234 - Tatar, Cyrillic
# 62306 - Uzbek, Cyrillic
# 60853 - Georgian, with capital letters
#
# Code pages supported by the UTF-8 engine, despite not being present in the bundled CPX files (1 code page):
# 874 - Thai, with EUR
#
# (*) The following symbols had to be worked around, as they are missing from the Unicode standard:
# - 30025 : LATIN CAPITAL LETTER D WITH HOOK AND TAIL (only the SMALL one is available)
# - 991, 58335 : PLN SYMBOL (currency)
# - 30019 : CYRILLIC LIGATURE UO (both SMALL and CAPITAL)
#
# (**) The code page contains LATIN SMALL/CAPITAL LETTER L WITH MIDDLE DOT character, which
# cannot be decomposed without creating ambiguity, see DECOMPOSITION.TXT
#
# Code pages mostly supported (3 code pages), but with unidentified characters still left (TODO):
#
# 864 - Arabic
# - 5 characters (FreeDOS specific extension) still unidentified
# 59829 - Georgian
# - 1 character still unidentified
# 60258 - Russian Cyrillic and Latin Azeri
# - dotted capital I not handled due to UTF-8 code limitation
# ****************************************************************************
# Mapping aliases to accommodate characters missing in code pages
# ****************************************************************************
# Provide pairs of code points here. Here is how the aliases work:
# - if (from code page definition) we know how to map Unicode code point,
# the aliasing information is ignored for the given code page
# - if we do not, we try mapping from the alias code point
# (ALIAS 0xAAAA 0xBBBB means it tries to display the character for 0xBBBB
# if 0xAAAA is not available)
# - every pair below may be declared bidirectional
# Alias to alias has no effect.
#
# Only the first matching alias is used; in fact, it is perfectly fine to have
# multiple aliases for a single character - this way different code pages will
# pick different ones, starting from the first (which should be the best one).
#
# It is OK to provide aliases also to characters not (yet) present in any
# supported code page, provided there aren't too many of them.
#
# In case the character you are creating aliases for is used by multiple
# languages, please try to be as generic as possible.
# The Armenian code page lacks a ligature, so instead of:
# - U+0587 - ARMENIAN SMALL LIGATURE ECH YIWN
# use:
# - U+0535 - ARMENIAN CAPITAL LETTER ECH
ALIAS 0x0587 0x0535
# Some Cyrillic code pages do not contain letters used in certain languages,
# therefore, if needed, replace them with similar/non-accented basic ones:
ALIAS 0x0401 0x0415 #CYRILLIC CAPITAL LETTER IO
ALIAS 0x0406 0x0418 #CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
ALIAS 0x040e 0x0423 #CYRILLIC CAPITAL LETTER SHORT U
ALIAS 0x045e 0x0443 #CYRILLIC SMALL LETTER SHORT U
ALIAS 0x0451 0x0435 #CYRILLIC SMALL LETTER IO
ALIAS 0x0490 0x0413 #CYRILLIC CAPITAL LETTER GHE WITH UPTURN
ALIAS 0x0491 0x0433 #CYRILLIC SMALL LETTER GHE WITH UPTURN
ALIAS 0x0404 0x0415 #CYRILLIC CAPITAL LETTER UKRAINIAN IE
ALIAS 0x0454 0x0435 #CYRILLIC SMALL LETTER UKRAINIAN IE
ALIAS 0x0456 0x0438 #CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
ALIAS 0x0492 0x0413 #CYRILLIC CAPITAL LETTER GHE WITH STROKE
ALIAS 0x0493 0x0433 #CYRILLIC SMALL LETTER GHE WITH STROKE
ALIAS 0x0494 0x0413 #CYRILLIC CAPITAL LETTER GHE WITH MIDDLE HOOK
ALIAS 0x0495 0x0433 #CYRILLIC SMALL LETTER GHE WITH MIDDLE HOOK
ALIAS 0x0496 0x0416 #CYRILLIC CAPITAL LETTER ZHE WITH DESCENDER
ALIAS 0x0497 0x0436 #CYRILLIC SMALL LETTER ZHE WITH DESCENDER
ALIAS 0x0498 0x0417 #CYRILLIC CAPITAL LETTER ZE WITH DESCENDER
ALIAS 0x0499 0x0437 #CYRILLIC SMALL LETTER ZE WITH DESCENDER
ALIAS 0x049a 0x041a #CYRILLIC CAPITAL LETTER KA WITH DESCENDER
ALIAS 0x049b 0x043a #CYRILLIC SMALL LETTER KA WITH DESCENDER
ALIAS 0x049c 0x041a #CYRILLIC CAPITAL LETTER KA WITH VERTICAL STROKE
ALIAS 0x049d 0x043a #CYRILLIC SMALL LETTER KA WITH VERTICAL STROKE
ALIAS 0x049e 0x041a #CYRILLIC CAPITAL LETTER KA WITH STROKE
ALIAS 0x049f 0x043a #CYRILLIC SMALL LETTER KA WITH STROKE
ALIAS 0x04a0 0x041a #CYRILLIC CAPITAL LETTER BASHKIR KA
ALIAS 0x04a1 0x043a #CYRILLIC SMALL LETTER BASHKIR KA
ALIAS 0x04a2 0x041d #CYRILLIC CAPITAL LETTER EN WITH DESCENDER
ALIAS 0x04a3 0x043d #CYRILLIC SMALL LETTER EN WITH DESCENDER
ALIAS 0x04a4 0x041d #CYRILLIC CAPITAL LIGATURE EN GHE
ALIAS 0x04a5 0x043d #CYRILLIC SMALL LIGATURE EN GHE
ALIAS 0x04a8 0x041e #CYRILLIC CAPITAL LETTER ABKHASIAN HA
ALIAS 0x04a9 0x043e #CYRILLIC SMALL LETTER ABKHASIAN HA
ALIAS 0x04aa 0x0421 #CYRILLIC CAPITAL LETTER ES WITH DESCENDER
ALIAS 0x04ab 0x0441 #CYRILLIC SMALL LETTER ES WITH DESCENDER
ALIAS 0x04ac 0x0422 #CYRILLIC CAPITAL LETTER TE WITH DESCENDER
ALIAS 0x04ad 0x0442 #CYRILLIC SMALL LETTER TE WITH DESCENDER
ALIAS 0x04ae 0x0423 #CYRILLIC CAPITAL LETTER STRAIGHT U
ALIAS 0x04af 0x0443 #CYRILLIC SMALL LETTER STRAIGHT U
ALIAS 0x04b0 0x04ae #CYRILLIC CAPITAL LETTER STRAIGHT U WITH STROKE
ALIAS 0x04b0 0x0423 #CYRILLIC CAPITAL LETTER STRAIGHT U WITH STROKE
ALIAS 0x04b1 0x04af #CYRILLIC SMALL LETTER STRAIGHT U WITH STROKE
ALIAS 0x04b1 0x0443 #CYRILLIC SMALL LETTER STRAIGHT U WITH STROKE
ALIAS 0x04b2 0x0425 #CYRILLIC CAPITAL LETTER HA WITH DESCENDER
ALIAS 0x04b3 0x0445 #CYRILLIC SMALL LETTER HA WITH DESCENDER
ALIAS 0x04b4 0x0426 #CYRILLIC CAPITAL LIGATURE TE TSE
ALIAS 0x04b5 0x0446 #CYRILLIC SMALL LIGATURE TE TSE
ALIAS 0x04b6 0x0427 #CYRILLIC CAPITAL LETTER CHE WITH DESCENDER
ALIAS 0x04b7 0x0447 #CYRILLIC SMALL LETTER CHE WITH DESCENDER
ALIAS 0x04b8 0x0427 #CYRILLIC CAPITAL LETTER CHE WITH VERTICAL STROKE
ALIAS 0x04b9 0x0447 #CYRILLIC SMALL LETTER CHE WITH VERTICAL STROKE
ALIAS 0x04bc 0x0427 #CYRILLIC CAPITAL LETTER ABKHASIAN CHE
ALIAS 0x04bd 0x0447 #CYRILLIC SMALL LETTER ABKHASIAN CHE
ALIAS 0x04be 0x04bc #CYRILLIC CAPITAL LETTER ABKHASIAN CHE WITH DESCENDER
ALIAS 0x04be 0x0427 #CYRILLIC CAPITAL LETTER ABKHASIAN CHE WITH DESCENDER
ALIAS 0x04bf 0x04bd #CYRILLIC SMALL LETTER ABKHASIAN CHE WITH DESCENDER
ALIAS 0x04bf 0x0447 #CYRILLIC SMALL LETTER ABKHASIAN CHE WITH DESCENDER
ALIAS 0x04e0 0x0405 #CYRILLIC CAPITAL LETTER ABKHASIAN DZE
ALIAS 0x04e1 0x0455 #CYRILLIC SMALL LETTER ABKHASIAN DZE
ALIAS 0x04c1 0x0416 #CYRILLIC CAPITAL LETTER ZHE WITH BREVE
ALIAS 0x04c2 0x0436 #CYRILLIC SMALL LETTER ZHE WITH BREVE
ALIAS 0x04c3 0x041a #CYRILLIC CAPITAL LETTER KA WITH HOOK
ALIAS 0x04c4 0x043a #CYRILLIC SMALL LETTER KA WITH HOOK
ALIAS 0x04c7 0x041d #CYRILLIC CAPITAL LETTER EN WITH HOOK
ALIAS 0x04c8 0x043d #CYRILLIC SMALL LETTER EN WITH HOOK
ALIAS 0x04d0 0x0410 #CYRILLIC CAPITAL LETTER A WITH BREVE
ALIAS 0x04d1 0x0430 #CYRILLIC SMALL LETTER A WITH BREVE
ALIAS 0x04d2 0x0410 #CYRILLIC CAPITAL LETTER A WITH DIAERESIS
ALIAS 0x04d3 0x0430 #CYRILLIC SMALL LETTER A WITH DIAERESIS
ALIAS 0x04d6 0x0415 #CYRILLIC CAPITAL LETTER IE WITH BREVE
ALIAS 0x04d7 0x0435 #CYRILLIC SMALL LETTER IE WITH BREVE
ALIAS 0x04da 0x04d8 #CYRILLIC CAPITAL LETTER SCHWA WITH DIAERESIS
ALIAS 0x04db 0x04d9 #CYRILLIC SMALL LETTER SCHWA WITH DIAERESIS
ALIAS 0x04dc 0x0416 #CYRILLIC CAPITAL LETTER ZHE WITH DIAERESIS
ALIAS 0x04dd 0x0436 #CYRILLIC SMALL LETTER ZHE WITH DIAERESIS
ALIAS 0x04de 0x0417 #CYRILLIC CAPITAL LETTER ZE WITH DIAERESIS
ALIAS 0x04df 0x0437 #CYRILLIC SMALL LETTER ZE WITH DIAERESIS
ALIAS 0x04e2 0x0418 #CYRILLIC CAPITAL LETTER I WITH MACRON
ALIAS 0x04e3 0x0438 #CYRILLIC SMALL LETTER I WITH MACRON
ALIAS 0x04e4 0x0418 #CYRILLIC CAPITAL LETTER I WITH DIAERESIS
ALIAS 0x04e5 0x0438 #CYRILLIC SMALL LETTER I WITH DIAERESIS
ALIAS 0x04e6 0x041e #CYRILLIC CAPITAL LETTER O WITH DIAERESIS
ALIAS 0x04e7 0x043e #CYRILLIC SMALL LETTER O WITH DIAERESIS
ALIAS 0x04ea 0x04e8 #CYRILLIC CAPITAL LETTER BARRED O WITH DIAERESIS
ALIAS 0x04eb 0x04e9 #CYRILLIC SMALL LETTER BARRED O WITH DIAERESIS
ALIAS 0x04ef 0x0443 #CYRILLIC SMALL LETTER U WITH MACRON
ALIAS 0x04ee 0x0423 #CYRILLIC CAPITAL LETTER U WITH MACRON
ALIAS 0x04f0 0x0423 #CYRILLIC CAPITAL LETTER U WITH DIAERESIS
ALIAS 0x04f1 0x0443 #CYRILLIC SMALL LETTER U WITH DIAERESIS
ALIAS 0x04f2 0x0423 #CYRILLIC CAPITAL LETTER U WITH DOUBLE ACUTE
ALIAS 0x04f3 0x0443 #CYRILLIC SMALL LETTER U WITH DOUBLE ACUTE
ALIAS 0x04f4 0x0427 #CYRILLIC CAPITAL LETTER CHE WITH DIAERESIS
ALIAS 0x04f5 0x0447 #CYRILLIC SMALL LETTER CHE WITH DIAERESIS
ALIAS 0x04f8 0x042b #CYRILLIC CAPITAL LETTER YERU WITH DIAERESIS
ALIAS 0x04f9 0x044b #CYRILLIC SMALL LETTER YERU WITH DIAERESIS
ALIAS 0x0524 0x041f #CYRILLIC CAPITAL LETTER PE WITH DESCENDER
ALIAS 0x0525 0x043f #CYRILLIC SMALL LETTER PE WITH DESCENDER
# For Cyrillic, additionally map 'barred O', to regular 'O', as fallback:
ALIAS 0x04e8 0x041e #CYRILLIC CAPITAL LETTER BARRED O
ALIAS 0x04ea 0x041e #CYRILLIC CAPITAL LETTER BARRED O WITH DIAERESIS
ALIAS 0x04e9 0x043e #CYRILLIC SMALL LETTER BARRED O
ALIAS 0x04e7 0x043e #CYRILLIC SMALL LETTER O WITH DIAERESIS
# The Cyrillic AE ligature or Schwa can be replaced with the Latin one, and vice versa:
ALIAS 0x04d4 0x00c6 BIDIRECTIONAL #CYRILLIC CAPITAL LIGATURE AE
ALIAS 0x04d5 0x00e6 BIDIRECTIONAL #CYRILLIC SMALL LIGATURE AE
ALIAS 0x04d8 0x018f BIDIRECTIONAL #CYRILLIC CAPITAL LETTER SCHWA
ALIAS 0x04d9 0x0259 BIDIRECTIONAL #CYRILLIC SMALL LETTER SCHWA
# If Georgian code page does not contain capital letters, replace them
# with regular ones:
ALIAS 0x10a0 0x10d0 #GEORGIAN CAPITAL LETTER AN
ALIAS 0x10a1 0x10d1 #GEORGIAN CAPITAL LETTER BAN
ALIAS 0x10a2 0x10d2 #GEORGIAN CAPITAL LETTER GAN
ALIAS 0x10a3 0x10d3 #GEORGIAN CAPITAL LETTER DON
ALIAS 0x10a4 0x10d4 #GEORGIAN CAPITAL LETTER EN
ALIAS 0x10a5 0x10d5 #GEORGIAN CAPITAL LETTER VIN
ALIAS 0x10a6 0x10d6 #GEORGIAN CAPITAL LETTER ZEN
ALIAS 0x10a7 0x10d7 #GEORGIAN CAPITAL LETTER TAN
ALIAS 0x10a8 0x10d8 #GEORGIAN CAPITAL LETTER IN
ALIAS 0x10a9 0x10d9 #GEORGIAN CAPITAL LETTER KAN
ALIAS 0x10aa 0x10da #GEORGIAN CAPITAL LETTER LAS
ALIAS 0x10ab 0x10db #GEORGIAN CAPITAL LETTER MAN
ALIAS 0x10ac 0x10dc #GEORGIAN CAPITAL LETTER NAR
ALIAS 0x10ad 0x10dd #GEORGIAN CAPITAL LETTER ON
ALIAS 0x10ae 0x10de #GEORGIAN CAPITAL LETTER PAR
ALIAS 0x10af 0x10df #GEORGIAN CAPITAL LETTER ZHAR
ALIAS 0x10b0 0x10e0 #GEORGIAN CAPITAL LETTER RAE
ALIAS 0x10b1 0x10e1 #GEORGIAN CAPITAL LETTER SAN
ALIAS 0x10b2 0x10e2 #GEORGIAN CAPITAL LETTER TAR
ALIAS 0x10b3 0x10e3 #GEORGIAN CAPITAL LETTER UN
ALIAS 0x10b4 0x10e4 #GEORGIAN CAPITAL LETTER PHAR
ALIAS 0x10b5 0x10e5 #GEORGIAN CAPITAL LETTER KHAR
ALIAS 0x10b6 0x10e6 #GEORGIAN CAPITAL LETTER GHAN
ALIAS 0x10b7 0x10e7 #GEORGIAN CAPITAL LETTER QAR
ALIAS 0x10b8 0x10e8 #GEORGIAN CAPITAL LETTER SHIN
ALIAS 0x10b9 0x10e9 #GEORGIAN CAPITAL LETTER CHIN
ALIAS 0x10ba 0x10ea #GEORGIAN CAPITAL LETTER CAN
ALIAS 0x10bb 0x10eb #GEORGIAN CAPITAL LETTER JIL
ALIAS 0x10bc 0x10ec #GEORGIAN CAPITAL LETTER CIL
ALIAS 0x10bd 0x10ed #GEORGIAN CAPITAL LETTER CHAR
ALIAS 0x10be 0x10ee #GEORGIAN CAPITAL LETTER XAN
ALIAS 0x10bf 0x10ef #GEORGIAN CAPITAL LETTER JHAN
ALIAS 0x10c0 0x10f0 #GEORGIAN CAPITAL LETTER HAE
# Greek alphabet characters are the same as, or very similar to, many
# (usually mathematical) symbols:
# - U+00DF - LATIN SMALL LETTER SHARP S
# - U+2211 - N-ARY SUMMATION
# - U+00B5 - MICRO SIGN
# - U+2126 - OHM SIGN
# - U+2208 - ELEMENT OF
# - U+025B - LATIN SMALL LETTER OPEN E
# - U+0138 - LATIN SMALL LETTER KRA
# can be substituted, respectively, by:
# - U+03B2 - GREEK SMALL LETTER BETA
# - U+03A3 - GREEK CAPITAL LETTER SIGMA
# - U+03BC - GREEK SMALL LETTER MU
# - U+03A9 - GREEK CAPITAL LETTER OMEGA
# - U+03B5 - GREEK SMALL LETTER EPSILON (for both U+2208 and U+025B)
# - U+03BA - GREEK SMALL LETTER KAPPA
ALIAS 0x00df 0x03b2 BIDIRECTIONAL
ALIAS 0x2211 0x03a3 BIDIRECTIONAL
ALIAS 0x00b5 0x03bc BIDIRECTIONAL
ALIAS 0x2126 0x03a9 BIDIRECTIONAL
ALIAS 0x2208 0x03b5 BIDIRECTIONAL
ALIAS 0x025b 0x03b5 BIDIRECTIONAL
ALIAS 0x0138 0x03ba BIDIRECTIONAL
# Some code pages with Greek letters do not have all the accented characters,
# such as CP 851, which lacks capital Iota and Upsilon with Dialytika:
ALIAS 0x0386 0x0391 #GREEK CAPITAL LETTER ALPHA WITH TONOS
ALIAS 0x0388 0x0395 #GREEK CAPITAL LETTER EPSILON WITH TONOS
ALIAS 0x0389 0x0397 #GREEK CAPITAL LETTER ETA WITH TONOS
ALIAS 0x038a 0x0399 #GREEK CAPITAL LETTER IOTA WITH TONOS
ALIAS 0x038c 0x039f #GREEK CAPITAL LETTER OMICRON WITH TONOS
ALIAS 0x038e 0x03a5 #GREEK CAPITAL LETTER UPSILON WITH TONOS
ALIAS 0x038f 0x03a9 #GREEK CAPITAL LETTER OMEGA WITH TONOS
ALIAS 0x0390 0x03b9 #GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS
ALIAS 0x03aa 0x0399 #GREEK CAPITAL LETTER IOTA WITH DIALYTIKA
ALIAS 0x03ab 0x03a5 #GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA
ALIAS 0x03ac 0x03b1 #GREEK SMALL LETTER ALPHA WITH TONOS
ALIAS 0x03ad 0x03b5 #GREEK SMALL LETTER EPSILON WITH TONOS
ALIAS 0x03ae 0x03b7 #GREEK SMALL LETTER ETA WITH TONOS
ALIAS 0x03af 0x03b9 #GREEK SMALL LETTER IOTA WITH TONOS
ALIAS 0x03b0 0x03c5 #GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS
ALIAS 0x03c2 0x03c3 #GREEK SMALL LETTER FINAL SIGMA
ALIAS 0x03ca 0x03b9 #GREEK SMALL LETTER IOTA WITH DIALYTIKA
ALIAS 0x03cb 0x03c5 #GREEK SMALL LETTER UPSILON WITH DIALYTIKA
ALIAS 0x03cc 0x03bf #GREEK SMALL LETTER OMICRON WITH TONOS
ALIAS 0x03cd 0x03c5 #GREEK SMALL LETTER UPSILON WITH TONOS
ALIAS 0x03ce 0x03c9 #GREEK SMALL LETTER OMEGA WITH TONOS
# Old English letter:
# - U+00D0 - LATIN CAPITAL LETTER ETH
# has the same appearance as the one below, found in many languages:
# - U+0110 - LATIN CAPITAL LETTER D WITH STROKE
ALIAS 0x00d0 0x0110 BIDIRECTIONAL
# Pound and Lira signs are very similar, and sometimes a two-bar style
# is used for Pound too - so if symbol:
# - U+00A3 - POUND SIGN
# is unavailable, it can be replaced with:
# - U+20A4 - LIRA SIGN
ALIAS 0x00a3 0x20a4
# Cent sign can be replaced with C with stroke - if needed substitute:
# - U+00A2 - CENT SIGN
# with:
# - U+023C - LATIN SMALL LETTER C WITH STROKE
ALIAS 0x00a2 0x023c
# Mayan tresillo is almost identical to open e, therefore if needed replace:
# - U+A72A - LATIN CAPITAL LETTER TRESILLO
# - U+A72B - LATIN SMALL LETTER TRESILLO
# with:
# - U+0190 - LATIN CAPITAL LETTER OPEN E
# - U+025B - LATIN SMALL LETTER OPEN E
ALIAS 0xa72a 0x0190 #LATIN CAPITAL LETTER TRESILLO
ALIAS 0xa72b 0x025b #LATIN SMALL LETTER TRESILLO
# Polish language has 2 characters, which are frequently omitted from
# code pages, including CP 852:
# - U+01B5 - LATIN CAPITAL LETTER Z WITH STROKE
# - U+01B6 - LATIN SMALL LETTER Z WITH STROKE
# They serve exactly the same purpose (they are just different, rarely used
# graphical representations) as the following:
# - U+017B - LATIN CAPITAL LETTER Z WITH DOT ABOVE
# - U+017C - LATIN SMALL LETTER Z WITH DOT ABOVE
# Note: Chechen Latin also uses the 'z with stroke' (and doesn't have a
# 'z with dot above'), but since this alphabet is not used any more
# (Cyrillic was later restored), this is unlikely to cause problems.
ALIAS 0x01b5 0x017b BIDIRECTIONAL
ALIAS 0x01b6 0x017c BIDIRECTIONAL
# In addition, if Polish letters are available, the missing symbols:
# - U+00A3 - POUND SIGN
# - U+20A4 - LIRA SIGN
# can be replaced with a somewhat similar character (more similar than a plain capital L):
# - U+0141 - LATIN CAPITAL LETTER L WITH STROKE
ALIAS 0x00a3 0x0141
ALIAS 0x20a4 0x0141
# Romanian language has 4 characters, which are frequently omitted from
# code pages, including CP 852:
# - U+0218 - LATIN CAPITAL LETTER S WITH COMMA BELOW
# - U+0219 - LATIN SMALL LETTER S WITH COMMA BELOW
# - U+021A - LATIN CAPITAL LETTER T WITH COMMA BELOW
# - U+021B - LATIN SMALL LETTER T WITH COMMA BELOW
# Instead, letters with cedilla are being used:
# - U+015E - LATIN CAPITAL LETTER S WITH CEDILLA
# - U+015F - LATIN SMALL LETTER S WITH CEDILLA
# - U+0162 - LATIN CAPITAL LETTER T WITH CEDILLA
# - U+0163 - LATIN SMALL LETTER T WITH CEDILLA
# For more information see:
# - https://en.wikipedia.org/wiki/ISO/IEC_8859-2
# - https://pl.wikipedia.org/wiki/CP852
# - https://www.quora.com/What-is-the-difference-between-%C8%98-and-%C5%9E-in-Romanian
ALIAS 0x0218 0x015e BIDIRECTIONAL
ALIAS 0x0219 0x015f BIDIRECTIONAL
ALIAS 0x021a 0x0162 BIDIRECTIONAL
ALIAS 0x021b 0x0163 BIDIRECTIONAL
# Accented African letters can be replaced with unaccented ones,
# if only these are available:
ALIAS 0x01ba 0x0292 #LATIN SMALL LETTER EZH WITH TAIL
ALIAS 0x01ee 0x01b7 #LATIN CAPITAL LETTER EZH WITH CARON
ALIAS 0x01ef 0x0292 #LATIN SMALL LETTER EZH WITH CARON
# Accented ligatures can be replaced with unaccented ones,
# if only these are available:
ALIAS 0x01fd 0x00e6 #LATIN SMALL LETTER AE WITH ACUTE
ALIAS 0x01fc 0x00c6 #LATIN CAPITAL LETTER AE WITH ACUTE
# Some double accented letters can be replaced with single accented ones,
# if only these are available:
ALIAS 0x01fb 0x00e5 #LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE
ALIAS 0x01fa 0x00c5 #LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE
ALIAS 0x01ff 0x00f8 #LATIN SMALL LETTER O WITH STROKE AND ACUTE
ALIAS 0x01fe 0x00d8 #LATIN CAPITAL LETTER O WITH STROKE AND ACUTE
# Handle box drawing characters, which might be missing in some code pages
ALIAS 0x2534 0x2500 #BOX DRAWINGS LIGHT UP AND HORIZONTAL
ALIAS 0x252c 0x2500 #BOX DRAWINGS LIGHT DOWN AND HORIZONTAL
ALIAS 0x2565 0x2500 #BOX DRAWINGS DOWN DOUBLE AND HORIZONTAL SINGLE
ALIAS 0x2568 0x2500 #BOX DRAWINGS UP DOUBLE AND HORIZONTAL SINGLE
ALIAS 0x251c 0x2502 #BOX DRAWINGS LIGHT VERTICAL AND RIGHT
ALIAS 0x2524 0x2502 #BOX DRAWINGS LIGHT VERTICAL AND LEFT
ALIAS 0x255e 0x2502 #BOX DRAWINGS VERTICAL SINGLE AND RIGHT DOUBLE
ALIAS 0x2561 0x2502 #BOX DRAWINGS VERTICAL SINGLE AND LEFT DOUBLE
ALIAS 0x2564 0x2550 #BOX DRAWINGS DOWN SINGLE AND HORIZONTAL DOUBLE
ALIAS 0x2566 0x2550 #BOX DRAWINGS DOUBLE DOWN AND HORIZONTAL
ALIAS 0x2567 0x2550 #BOX DRAWINGS UP SINGLE AND HORIZONTAL DOUBLE
ALIAS 0x2569 0x2550 #BOX DRAWINGS DOUBLE UP AND HORIZONTAL
ALIAS 0x256a 0x2550 #BOX DRAWINGS VERTICAL SINGLE AND HORIZONTAL DOUBLE
ALIAS 0x255f 0x2551 #BOX DRAWINGS VERTICAL DOUBLE AND RIGHT SINGLE
ALIAS 0x2560 0x2551 #BOX DRAWINGS DOUBLE VERTICAL AND RIGHT
ALIAS 0x2562 0x2551 #BOX DRAWINGS VERTICAL DOUBLE AND LEFT SINGLE
ALIAS 0x2563 0x2551 #BOX DRAWINGS DOUBLE VERTICAL AND LEFT
ALIAS 0x256b 0x2551 #BOX DRAWINGS VERTICAL DOUBLE AND HORIZONTAL SINGLE
# Aliases to aid Cyrillic romanization for certain code pages, complements transliteration in ASCII.TXT
ALIAS 0x0401 0x00cb #CYRILLIC CAPITAL LETTER IO -> LATIN CAPITAL LETTER E WITH DIAERESIS
ALIAS 0x0403 0x01f4 #CYRILLIC CAPITAL LETTER GJE -> LATIN CAPITAL LETTER G WITH ACUTE
ALIAS 0x0403 0x0110 #CYRILLIC CAPITAL LETTER GJE -> LATIN CAPITAL LETTER D WITH STROKE
ALIAS 0x0405 0x1e90 #CYRILLIC CAPITAL LETTER DZE -> LATIN CAPITAL LETTER Z WITH CIRCUMFLEX
ALIAS 0x0407 0x00cf #CYRILLIC CAPITAL LETTER YI -> LATIN CAPITAL LETTER I WITH DIAERESIS
ALIAS 0x040c 0x1e30 #CYRILLIC CAPITAL LETTER KJE -> LATIN CAPITAL LETTER K WITH ACUTE
ALIAS 0x0416 0x017d #CYRILLIC CAPITAL LETTER ZHE -> LATIN CAPITAL LETTER Z WITH CARON
ALIAS 0x0418 0x0232 #CYRILLIC CAPITAL LETTER I -> LATIN CAPITAL LETTER Y WITH MACRON
ALIAS 0x0419 0x012c #CYRILLIC CAPITAL LETTER SHORT I -> LATIN CAPITAL LETTER I WITH BREVE
ALIAS 0x0427 0x010c #CYRILLIC CAPITAL LETTER CHE -> LATIN CAPITAL LETTER C WITH CARON
ALIAS 0x0428 0x0160 #CYRILLIC CAPITAL LETTER SHA -> LATIN CAPITAL LETTER S WITH CARON
ALIAS 0x042d 0x00c8 #CYRILLIC CAPITAL LETTER E -> LATIN CAPITAL LETTER E WITH GRAVE
ALIAS 0x042d 0x0116 #CYRILLIC CAPITAL LETTER E -> LATIN CAPITAL LETTER E WITH DOT ABOVE
ALIAS 0x042f 0x00c2 #CYRILLIC CAPITAL LETTER YA -> LATIN CAPITAL LETTER A WITH CIRCUMFLEX
ALIAS 0x0436 0x017e #CYRILLIC SMALL LETTER ZHE -> LATIN SMALL LETTER Z WITH CARON
ALIAS 0x0438 0x0233 #CYRILLIC SMALL LETTER I -> LATIN SMALL LETTER Y WITH MACRON
ALIAS 0x0439 0x012d #CYRILLIC SMALL LETTER SHORT I -> LATIN SMALL LETTER I WITH BREVE
ALIAS 0x0448 0x0161 #CYRILLIC SMALL LETTER SHA -> LATIN SMALL LETTER S WITH CARON
ALIAS 0x0447 0x010d #CYRILLIC SMALL LETTER CHE -> LATIN SMALL LETTER C WITH CARON
ALIAS 0x044d 0x00e8 #CYRILLIC SMALL LETTER E -> LATIN SMALL LETTER E WITH GRAVE
ALIAS 0x044d 0x0117 #CYRILLIC SMALL LETTER E -> LATIN SMALL LETTER E WITH DOT ABOVE
ALIAS 0x044f 0x00e2 #CYRILLIC SMALL LETTER YA -> LATIN SMALL LETTER A WITH CIRCUMFLEX
ALIAS 0x0451 0x00eb #CYRILLIC SMALL LETTER IO -> LATIN SMALL LETTER E WITH DIAERESIS
ALIAS 0x0453 0x01f5 #CYRILLIC SMALL LETTER GJE -> LATIN SMALL LETTER G WITH ACUTE
ALIAS 0x0453 0x0111 #CYRILLIC SMALL LETTER GJE -> LATIN SMALL LETTER D WITH STROKE
ALIAS 0x0455 0x1e91 #CYRILLIC SMALL LETTER DZE -> LATIN SMALL LETTER Z WITH CIRCUMFLEX
ALIAS 0x0457 0x00ef #CYRILLIC SMALL LETTER YI -> LATIN SMALL LETTER I WITH DIAERESIS
ALIAS 0x045c 0x1e31 #CYRILLIC SMALL LETTER KJE -> LATIN SMALL LETTER K WITH ACUTE
ALIAS 0x0498 0x00d0 #CYRILLIC CAPITAL LETTER ZE WITH DESCENDER -> LATIN CAPITAL LETTER ETH
ALIAS 0x0498 0x0179 #CYRILLIC CAPITAL LETTER ZE WITH DESCENDER -> LATIN CAPITAL LETTER Z WITH ACUTE
ALIAS 0x0499 0x00f0 #CYRILLIC SMALL LETTER ZE WITH DESCENDER -> LATIN SMALL LETTER ETH
ALIAS 0x0499 0x017a #CYRILLIC SMALL LETTER ZE WITH DESCENDER -> LATIN SMALL LETTER Z WITH ACUTE
ALIAS 0x04a2 0x00d1 #CYRILLIC CAPITAL LETTER EN WITH DESCENDER -> LATIN CAPITAL LETTER N WITH TILDE
ALIAS 0x04a3 0x00f1 #CYRILLIC SMALL LETTER EN WITH DESCENDER -> LATIN SMALL LETTER N WITH TILDE
ALIAS 0x04a4 0x1e44 #CYRILLIC CAPITAL LIGATURE EN GHE -> LATIN CAPITAL LETTER N WITH DOT ABOVE
ALIAS 0x04a5 0x1e45 #CYRILLIC SMALL LIGATURE EN GHE -> LATIN SMALL LETTER N WITH DOT ABOVE
ALIAS 0x04a8 0x00d2 #CYRILLIC CAPITAL LETTER ABKHASIAN HA -> LATIN CAPITAL LETTER O WITH GRAVE
ALIAS 0x04a9 0x00f2 #CYRILLIC SMALL LETTER ABKHASIAN HA -> LATIN SMALL LETTER O WITH GRAVE
ALIAS 0x04aa 0x015a #CYRILLIC CAPITAL LETTER ES WITH DESCENDER -> LATIN CAPITAL LETTER S WITH ACUTE
ALIAS 0x04ab 0x015b #CYRILLIC SMALL LETTER ES WITH DESCENDER -> LATIN SMALL LETTER S WITH ACUTE
ALIAS 0x04ae 0x00dc #CYRILLIC CAPITAL LETTER STRAIGHT U -> LATIN CAPITAL LETTER U WITH DIAERESIS
ALIAS 0x04ae 0x00da #CYRILLIC CAPITAL LETTER STRAIGHT U -> LATIN CAPITAL LETTER U WITH ACUTE
ALIAS 0x04af 0x00fc #CYRILLIC SMALL LETTER STRAIGHT U -> LATIN SMALL LETTER U WITH DIAERESIS
ALIAS 0x04af 0x00fa #CYRILLIC SMALL LETTER STRAIGHT U -> LATIN SMALL LETTER U WITH ACUTE
ALIAS 0x04b0 0x016a #CYRILLIC CAPITAL LETTER STRAIGHT U WITH STROKE -> LATIN CAPITAL LETTER U WITH MACRON
ALIAS 0x04b1 0x016b #CYRILLIC SMALL LETTER STRAIGHT U WITH STROKE -> LATIN SMALL LETTER U WITH MACRON
ALIAS 0x04b6 0x00c7 #CYRILLIC CAPITAL LETTER CHE WITH DESCENDER -> LATIN CAPITAL LETTER C WITH CEDILLA
ALIAS 0x04b7 0x00e7 #CYRILLIC SMALL LETTER CHE WITH DESCENDER -> LATIN SMALL LETTER C WITH CEDILLA
ALIAS 0x04d2 0x00c4 #CYRILLIC CAPITAL LETTER A WITH DIAERESIS -> LATIN CAPITAL LETTER A WITH DIAERESIS
ALIAS 0x04d3 0x00e4 #CYRILLIC SMALL LETTER A WITH DIAERESIS -> LATIN SMALL LETTER A WITH DIAERESIS
ALIAS 0x04d6 0x018e #CYRILLIC CAPITAL LETTER IE WITH BREVE -> LATIN CAPITAL LETTER REVERSED E
ALIAS 0x04d7 0x0258 #CYRILLIC SMALL LETTER IE WITH BREVE -> LATIN SMALL LETTER REVERSED E
ALIAS 0x04da 0x018f #CYRILLIC CAPITAL LETTER SCHWA WITH DIAERESIS -> LATIN CAPITAL LETTER SCHWA
ALIAS 0x04db 0x0259 #CYRILLIC SMALL LETTER SCHWA WITH DIAERESIS -> LATIN SMALL LETTER SCHWA
ALIAS 0x04de 0x0110 #CYRILLIC CAPITAL LETTER ZE WITH DIAERESIS -> LATIN CAPITAL LETTER D WITH STROKE
ALIAS 0x04df 0x0111 #CYRILLIC SMALL LETTER ZE WITH DIAERESIS -> LATIN SMALL LETTER D WITH STROKE
ALIAS 0x04e0 0x01b7 #CYRILLIC CAPITAL LETTER ABKHASIAN DZE -> LATIN CAPITAL LETTER EZH
ALIAS 0x04e1 0x0292 #CYRILLIC SMALL LETTER ABKHASIAN DZE -> LATIN SMALL LETTER EZH
ALIAS 0x04e2 0x012a #CYRILLIC CAPITAL LETTER I WITH MACRON -> LATIN CAPITAL LETTER I WITH MACRON
ALIAS 0x04e3 0x012b #CYRILLIC SMALL LETTER I WITH MACRON -> LATIN SMALL LETTER I WITH MACRON
ALIAS 0x04e4 0x00cf #CYRILLIC CAPITAL LETTER I WITH DIAERESIS -> LATIN CAPITAL LETTER I WITH DIAERESIS
ALIAS 0x04e5 0x00ef #CYRILLIC SMALL LETTER I WITH DIAERESIS -> LATIN SMALL LETTER I WITH DIAERESIS
ALIAS 0x04e6 0x00d6 #CYRILLIC CAPITAL LETTER O WITH DIAERESIS -> LATIN CAPITAL LETTER O WITH DIAERESIS
ALIAS 0x04e7 0x00f6 #CYRILLIC SMALL LETTER O WITH DIAERESIS -> LATIN SMALL LETTER O WITH DIAERESIS
ALIAS 0x04f0 0x00dc #CYRILLIC CAPITAL LETTER U WITH DIAERESIS -> LATIN CAPITAL LETTER U WITH DIAERESIS
ALIAS 0x04f1 0x00fc #CYRILLIC SMALL LETTER U WITH DIAERESIS -> LATIN SMALL LETTER U WITH DIAERESIS
ALIAS 0x04f2 0x00dc #CYRILLIC CAPITAL LETTER U WITH DOUBLE ACUTE -> LATIN CAPITAL LETTER U WITH DIAERESIS
ALIAS 0x04f3 0x00fc #CYRILLIC SMALL LETTER U WITH DOUBLE ACUTE -> LATIN SMALL LETTER U WITH DIAERESIS
ALIAS 0x04f4 0x010c #CYRILLIC CAPITAL LETTER CHE WITH DIAERESIS -> LATIN CAPITAL LETTER C WITH CARON
ALIAS 0x04f5 0x010d #CYRILLIC SMALL LETTER CHE WITH DIAERESIS -> LATIN SMALL LETTER C WITH CARON
ALIAS 0x04f8 0x018f #CYRILLIC CAPITAL LETTER YERU WITH DIAERESIS -> LATIN CAPITAL LETTER SCHWA
ALIAS 0x04f9 0x0259 #CYRILLIC SMALL LETTER YERU WITH DIAERESIS -> LATIN SMALL LETTER SCHWA
# Aliases to aid Georgian romanization for certain code pages, complements transliteration in ASCII.TXT
ALIAS 0x10a9 0x1e30 #GEORGIAN CAPITAL LETTER KAN -> LATIN CAPITAL LETTER K WITH ACUTE
ALIAS 0x10a9 0x01e8 #GEORGIAN CAPITAL LETTER KAN -> LATIN CAPITAL LETTER K WITH CARON
ALIAS 0x10ae 0x1e54 #GEORGIAN CAPITAL LETTER PAR -> LATIN CAPITAL LETTER P WITH ACUTE
ALIAS 0x10af 0x017d #GEORGIAN CAPITAL LETTER ZHAR -> LATIN CAPITAL LETTER Z WITH CARON
ALIAS 0x10b2 0x0164 #GEORGIAN CAPITAL LETTER TAR -> LATIN CAPITAL LETTER T WITH CARON
ALIAS 0x10b5 0x1e30 #GEORGIAN CAPITAL LETTER KHAR -> LATIN CAPITAL LETTER K WITH ACUTE
ALIAS 0x10b6 0x1e20 #GEORGIAN CAPITAL LETTER GHAN -> LATIN CAPITAL LETTER G WITH MACRON
ALIAS 0x10b6 0x0120 #GEORGIAN CAPITAL LETTER GHAN -> LATIN CAPITAL LETTER G WITH DOT ABOVE
ALIAS 0x10b9 0x010c #GEORGIAN CAPITAL LETTER CHIN -> LATIN CAPITAL LETTER C WITH CARON
ALIAS 0x10b9 0x0106 #GEORGIAN CAPITAL LETTER CHIN -> LATIN CAPITAL LETTER C WITH ACUTE
ALIAS 0x10ba 0x0106 #GEORGIAN CAPITAL LETTER CAN -> LATIN CAPITAL LETTER C WITH ACUTE
ALIAS 0x10bd 0x010c #GEORGIAN CAPITAL LETTER CHAR -> LATIN CAPITAL LETTER C WITH CARON
ALIAS 0x10f1 0x0113 #GEORGIAN LETTER HE -> LATIN SMALL LETTER E WITH MACRON
ALIAS 0x10f1 0x00e9 #GEORGIAN LETTER HE -> LATIN SMALL LETTER E WITH ACUTE
ALIAS 0x10d9 0x1e31 #GEORGIAN LETTER KAN -> LATIN SMALL LETTER K WITH ACUTE
ALIAS 0x10d9 0x01e9 #GEORGIAN LETTER KAN -> LATIN SMALL LETTER K WITH CARON
ALIAS 0x10de 0x1e55 #GEORGIAN LETTER PAR -> LATIN SMALL LETTER P WITH ACUTE
ALIAS 0x10df 0x017e #GEORGIAN LETTER ZHAR -> LATIN SMALL LETTER Z WITH CARON
ALIAS 0x10e2 0x0165 #GEORGIAN LETTER TAR -> LATIN SMALL LETTER T WITH CARON
ALIAS 0x10e5 0x1e31 #GEORGIAN LETTER KHAR -> LATIN SMALL LETTER K WITH ACUTE
ALIAS 0x10e6 0x1e21 #GEORGIAN LETTER GHAN -> LATIN SMALL LETTER G WITH MACRON
ALIAS 0x10e6 0x0121 #GEORGIAN LETTER GHAN -> LATIN SMALL LETTER G WITH DOT ABOVE
ALIAS 0x10e9 0x010d #GEORGIAN LETTER CHIN -> LATIN SMALL LETTER C WITH CARON
ALIAS 0x10e9 0x0107 #GEORGIAN LETTER CHIN -> LATIN SMALL LETTER C WITH ACUTE
ALIAS 0x10ea 0x0107 #GEORGIAN LETTER CAN -> LATIN SMALL LETTER C WITH ACUTE
ALIAS 0x10ed 0x010d #GEORGIAN LETTER CHAR -> LATIN SMALL LETTER C WITH CARON
ALIAS 0x10f5 0x014d #GEORGIAN LETTER HOE -> LATIN SMALL LETTER O WITH MACRON
ALIAS 0x10f5 0x022f #GEORGIAN LETTER HOE -> LATIN SMALL LETTER O WITH DOT ABOVE
# Aliases to aid Greek romanization for certain code pages, complements transliteration in ASCII.TXT
ALIAS 0x0386 0x00c1 #GREEK CAPITAL LETTER ALPHA WITH TONOS -> LATIN CAPITAL LETTER A WITH ACUTE
ALIAS 0x0388 0x00c9 #GREEK CAPITAL LETTER EPSILON WITH TONOS -> LATIN CAPITAL LETTER E WITH ACUTE
ALIAS 0x0389 0x00c9 #GREEK CAPITAL LETTER ETA WITH TONOS -> LATIN CAPITAL LETTER E WITH ACUTE
ALIAS 0x038a 0x00cd #GREEK CAPITAL LETTER IOTA WITH TONOS -> LATIN CAPITAL LETTER I WITH ACUTE
ALIAS 0x038c 0x00d3 #GREEK CAPITAL LETTER OMICRON WITH TONOS -> LATIN CAPITAL LETTER O WITH ACUTE
ALIAS 0x038e 0x00da #GREEK CAPITAL LETTER UPSILON WITH TONOS -> LATIN CAPITAL LETTER U WITH ACUTE
ALIAS 0x038f 0x00d3 #GREEK CAPITAL LETTER OMEGA WITH TONOS -> LATIN CAPITAL LETTER O WITH ACUTE
ALIAS 0x038f 0x014c #GREEK CAPITAL LETTER OMEGA WITH TONOS -> LATIN CAPITAL LETTER O WITH MACRON
ALIAS 0x0390 0x00ef #GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS -> LATIN SMALL LETTER I WITH DIAERESIS
ALIAS 0x0390 0x00ed #GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS -> LATIN SMALL LETTER I WITH ACUTE
ALIAS 0x03a9 0x014c #GREEK CAPITAL LETTER OMEGA -> LATIN CAPITAL LETTER O WITH MACRON
ALIAS 0x03aa 0x00cf #GREEK CAPITAL LETTER IOTA WITH DIALYTIKA -> LATIN CAPITAL LETTER I WITH DIAERESIS
ALIAS 0x03ab 0x00dc #GREEK CAPITAL LETTER UPSILON WITH DIALYTIKA -> LATIN CAPITAL LETTER U WITH DIAERESIS
ALIAS 0x03ac 0x00e1 #GREEK SMALL LETTER ALPHA WITH TONOS -> LATIN SMALL LETTER A WITH ACUTE
ALIAS 0x03ad 0x00e9 #GREEK SMALL LETTER EPSILON WITH TONOS -> LATIN SMALL LETTER E WITH ACUTE
ALIAS 0x03ae 0x00e9 #GREEK SMALL LETTER ETA WITH TONOS -> LATIN SMALL LETTER E WITH ACUTE
ALIAS 0x03af 0x00ed #GREEK SMALL LETTER IOTA WITH TONOS -> LATIN SMALL LETTER I WITH ACUTE
ALIAS 0x03b0 0x00fc #GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS -> LATIN SMALL LETTER U WITH DIAERESIS
ALIAS 0x03b0 0x00fa #GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS -> LATIN SMALL LETTER U WITH ACUTE
ALIAS 0x03c9 0x014d #GREEK SMALL LETTER OMEGA -> LATIN SMALL LETTER O WITH MACRON
ALIAS 0x03ca 0x00ef #GREEK SMALL LETTER IOTA WITH DIALYTIKA -> LATIN SMALL LETTER I WITH DIAERESIS
ALIAS 0x03cb 0x00fc #GREEK SMALL LETTER UPSILON WITH DIALYTIKA -> LATIN SMALL LETTER U WITH DIAERESIS
ALIAS 0x03cc 0x00f3 #GREEK SMALL LETTER OMICRON WITH TONOS -> LATIN SMALL LETTER O WITH ACUTE
ALIAS 0x03cd 0x00fa #GREEK SMALL LETTER UPSILON WITH TONOS -> LATIN SMALL LETTER U WITH ACUTE
ALIAS 0x03ce 0x00f3 #GREEK SMALL LETTER OMEGA WITH TONOS -> LATIN SMALL LETTER O WITH ACUTE
ALIAS 0x03ce 0x014d #GREEK SMALL LETTER OMEGA WITH TONOS -> LATIN SMALL LETTER O WITH MACRON
# ****************************************************************************
# List of duplicated code pages
# ****************************************************************************
# FreeDOS CPX files contain several duplicated code pages. List them here in
# pairs; whenever the first code page is encountered, the engine will use
# the second one from the pair.
CODEPAGE 790 DUPLICATES 667 # Polish, Mazovia encoding
CODEPAGE 895 DUPLICATES 867 # Czech and Slovak, Kamenicky encoding
CODEPAGE 774 DUPLICATES 1118 # Lithuanian, LST 1283 encoding
CODEPAGE 772 DUPLICATES 1119 # Russian and Lithuanian, Cyrillic, LST 1284 encoding
# ****************************************************************************
# Recipes for constructing code page mappings
# ****************************************************************************
# For each code page, provide the list of partial mappings, starting from
# the highest priority one - if more than one mapping provides the Unicode
# code point for the given code page symbol, only the first will be used.
# Note that FreeDOS code pages sometimes differ slightly from code pages
# of the era: they often add the Euro sign, and there is often a character
# in the 'undefined' area. Please check this for each code page you add (for
# example, using the Dos Navigator built-in tool, Utilities -> ASCII table),
# as this is not always clearly documented.
# If the code page data set is particularly large, put it in a separate file,
# as a full (0x80-0xff characters, codes up to 0x7f are ignored) code page.
CODEPAGE 113 # Yugoslavian, Latin
0x85 0x00e0 #LATIN SMALL LETTER A WITH GRAVE
0x86 0x0107 #LATIN SMALL LETTER C WITH ACUTE
0x8f 0x0106 #LATIN CAPITAL LETTER C WITH ACUTE
0x90 0x00c9 #LATIN CAPITAL LETTER E WITH ACUTE
0x91 0x010d #LATIN SMALL LETTER C WITH CARON
0x92 0x010c #LATIN CAPITAL LETTER C WITH CARON
0x9b 0x0111 #LATIN SMALL LETTER D WITH STROKE
0x9d 0x0110 #LATIN CAPITAL LETTER D WITH STROKE
0xa4 0x0161 #LATIN SMALL LETTER S WITH CARON
0xa5 0x0160 #LATIN CAPITAL LETTER S WITH CARON
0xa6 0x017e #LATIN SMALL LETTER Z WITH CARON
0xa7 0x017d #LATIN CAPITAL LETTER Z WITH CARON
EXTENDS CODEPAGE 437
CODEPAGE 437 # United States
EXTENDS FILE mapping-unicode.org CP_437.TXT
CODEPAGE 667 # Polish, Mazovia encoding
# reference: https://en.wikipedia.org/wiki/Mazovia_encoding
0x86 0x0105 #LATIN SMALL LETTER A WITH OGONEK
0x8d 0x0107 #LATIN SMALL LETTER C WITH ACUTE
0x8f 0x0104 #LATIN CAPITAL LETTER A WITH OGONEK
0x90 0x0118 #LATIN CAPITAL LETTER E WITH OGONEK
0x91 0x0119 #LATIN SMALL LETTER E WITH OGONEK
0x92 0x0142 #LATIN SMALL LETTER L WITH STROKE
0x95 0x0106 #LATIN CAPITAL LETTER C WITH ACUTE
0x98 0x015a #LATIN CAPITAL LETTER S WITH ACUTE
0x9c 0x0141 #LATIN CAPITAL LETTER L WITH STROKE
0x9e 0x015b #LATIN SMALL LETTER S WITH ACUTE
0xa0 0x0179 #LATIN CAPITAL LETTER Z WITH ACUTE
0xa1 0x017b #LATIN CAPITAL LETTER Z WITH DOT ABOVE
0xa2 0x00f3 #LATIN SMALL LETTER O WITH ACUTE
0xa3 0x00d3 #LATIN CAPITAL LETTER O WITH ACUTE
0xa4 0x0144 #LATIN SMALL LETTER N WITH ACUTE
0xa5 0x0143 #LATIN CAPITAL LETTER N WITH ACUTE
0xa6 0x017a #LATIN SMALL LETTER Z WITH ACUTE
0xa7 0x017c #LATIN SMALL LETTER Z WITH DOT ABOVE
EXTENDS CODEPAGE 437
CODEPAGE 668 # Polish, 852 compatible
# Provides national characters on the same points as with CP 852, but is
# limited to Polish glyphs only, thus preserves more graphical characters
0x86 0x0107 #LATIN SMALL LETTER C WITH ACUTE
0x88 0x0142 #LATIN SMALL LETTER L WITH STROKE
0x8d 0x0179 #LATIN CAPITAL LETTER Z WITH ACUTE
0x8f 0x0106 #LATIN CAPITAL LETTER C WITH ACUTE
0x97 0x015a #LATIN CAPITAL LETTER S WITH ACUTE
0x98 0x015b #LATIN SMALL LETTER S WITH ACUTE
0x9d 0x0141 #LATIN CAPITAL LETTER L WITH STROKE
0xa2 0x00f3 #LATIN SMALL LETTER O WITH ACUTE
0xa4 0x0104 #LATIN CAPITAL LETTER A WITH OGONEK
0xa5 0x0105 #LATIN SMALL LETTER A WITH OGONEK
0xa8 0x0118 #LATIN CAPITAL LETTER E WITH OGONEK
0xa9 0x0119 #LATIN SMALL LETTER E WITH OGONEK
0xab 0x017a #LATIN SMALL LETTER Z WITH ACUTE
0xbd 0x017b #LATIN CAPITAL LETTER Z WITH DOT ABOVE
0xbe 0x017c #LATIN SMALL LETTER Z WITH DOT ABOVE
0xe0 0x00d3 #LATIN CAPITAL LETTER O WITH ACUTE
0xe3 0x0143 #LATIN CAPITAL LETTER N WITH ACUTE
0xe4 0x0144 #LATIN SMALL LETTER N WITH ACUTE
EXTENDS CODEPAGE 437
CODEPAGE 737 # Greek-2
EXTENDS FILE mapping-unicode.org CP_737.TXT
CODEPAGE 770 # Baltic
# reference: https://en.wikipedia.org/wiki/Code_page_770
0x80 0x010c #LATIN CAPITAL LETTER C WITH CARON
0x82 0x0117 #LATIN SMALL LETTER E WITH DOT ABOVE
0x83 0x0101 #LATIN SMALL LETTER A WITH MACRON
0x85 0x0105 #LATIN SMALL LETTER A WITH OGONEK
0x86 0x013c #LATIN SMALL LETTER L WITH CEDILLA
0x87 0x010d #LATIN SMALL LETTER C WITH CARON
0x88 0x0113 #LATIN SMALL LETTER E WITH MACRON
0x89 0x0112 #LATIN CAPITAL LETTER E WITH MACRON
0x8a 0x0119 #LATIN SMALL LETTER E WITH OGONEK
0x8b 0x0118 #LATIN CAPITAL LETTER E WITH OGONEK
0x8c 0x012b #LATIN SMALL LETTER I WITH MACRON
0x8d 0x012f #LATIN SMALL LETTER I WITH OGONEK
0x8e 0x00c4 #LATIN CAPITAL LETTER A WITH DIAERESIS
0x8f 0x0104 #LATIN CAPITAL LETTER A WITH OGONEK
0x90 0x0116 #LATIN CAPITAL LETTER E WITH DOT ABOVE
0x91 0x017e #LATIN SMALL LETTER Z WITH CARON
0x92 0x017d #LATIN CAPITAL LETTER Z WITH CARON
0x93 0x00f5 #LATIN SMALL LETTER O WITH TILDE
0x95 0x00d5 #LATIN CAPITAL LETTER O WITH TILDE
0x96 0x016b #LATIN SMALL LETTER U WITH MACRON
0x97 0x0173 #LATIN SMALL LETTER U WITH OGONEK
0x98 0x0123 #LATIN SMALL LETTER G WITH CEDILLA
0x9c 0x013b #LATIN CAPITAL LETTER L WITH CEDILLA
0x9d 0x201e #DOUBLE LOW-9 QUOTATION MARK
0x9e 0x0161 #LATIN SMALL LETTER S WITH CARON
0x9f 0x0160 #LATIN CAPITAL LETTER S WITH CARON
0xa0 0x0100 #LATIN CAPITAL LETTER A WITH MACRON
0xa1 0x012a #LATIN CAPITAL LETTER I WITH MACRON
0xa2 0x0137 #LATIN SMALL LETTER K WITH CEDILLA
0xa3 0x0136 #LATIN CAPITAL LETTER K WITH CEDILLA
0xa4 0x0146 #LATIN SMALL LETTER N WITH CEDILLA
0xa5 0x0145 #LATIN CAPITAL LETTER N WITH CEDILLA
0xa6 0x016a #LATIN CAPITAL LETTER U WITH MACRON
0xa7 0x0172 #LATIN CAPITAL LETTER U WITH OGONEK
0xa8 0x0122 #LATIN CAPITAL LETTER G WITH CEDILLA
0xad 0x012e #LATIN CAPITAL LETTER I WITH OGONEK
EXTENDS CODEPAGE 437
CODEPAGE 771 # Lithuanian and Russian, Cyrillic, KBL encoding
# reference: https://en.wikipedia.org/wiki/Code_page_866
0xdc 0x0104 #LATIN CAPITAL LETTER A WITH OGONEK
0xdd 0x0105 #LATIN SMALL LETTER A WITH OGONEK
0xde 0x010c #LATIN CAPITAL LETTER C WITH CARON
0xdf 0x010d #LATIN SMALL LETTER C WITH CARON
0xf0 0x0118 #LATIN CAPITAL LETTER E WITH OGONEK
0xf1 0x0119 #LATIN SMALL LETTER E WITH OGONEK
0xf2 0x0116 #LATIN CAPITAL LETTER E WITH DOT ABOVE
0xf3 0x0117 #LATIN SMALL LETTER E WITH DOT ABOVE
0xf4 0x012e #LATIN CAPITAL LETTER I WITH OGONEK
0xf5 0x012f #LATIN SMALL LETTER I WITH OGONEK
0xf6 0x0160 #LATIN CAPITAL LETTER S WITH CARON
0xf7 0x0161 #LATIN SMALL LETTER S WITH CARON
0xf8 0x0172 #LATIN CAPITAL LETTER U WITH OGONEK
0xf9 0x0173 #LATIN SMALL LETTER U WITH OGONEK
0xfa 0x016a #LATIN CAPITAL LETTER U WITH MACRON
0xfb 0x016b #LATIN SMALL LETTER U WITH MACRON
0xfc 0x017d #LATIN CAPITAL LETTER Z WITH CARON
0xfd 0x017e #LATIN SMALL LETTER Z WITH CARON
EXTENDS CODEPAGE 866
CODEPAGE 773 # Latin-7 (Baltic, old standard)
# reference: https://en.wikipedia.org/wiki/Code_page_773
EXTENDS FILE mapping-wikipedia.org CP_773.TXT
CODEPAGE 775 # Latin-7 (Baltic)
EXTENDS FILE mapping-unicode.org CP_775.TXT
CODEPAGE 777 # Lithuanian, Accented (old)
EXTENDS FILE mapping-wikipedia.org CP_777.TXT
CODEPAGE 778 # Lithuanian, Accented
# NOTE: FreeDOS definitions differ a little from official ones
0xfe 0x25a0 #BLACK SQUARE
EXTENDS FILE mapping-wikipedia.org CP_778.TXT
CODEPAGE 808 # Russian, Cyrillic, with EUR
# reference: https://en.wikipedia.org/wiki/Code_page_866
0xfd 0x20ac #EURO SIGN
EXTENDS CODEPAGE 866
CODEPAGE 848 # Ukrainian, Cyrillic, with EUR
# reference: https://en.wikipedia.org/wiki/Code_page_866
0xfd 0x20ac #EURO SIGN
EXTENDS CODEPAGE 1125
CODEPAGE 849 # Belarusian, Cyrillic, with EUR
# reference: https://en.wikipedia.org/wiki/Code_page_866
0xfb 0x20ac #EURO SIGN
EXTENDS CODEPAGE 1131
CODEPAGE 850 # Latin-1 (Western European)
EXTENDS FILE mapping-unicode.org CP_850.TXT
CODEPAGE 851 # Greek, old encoding
EXTENDS FILE mapping-wikipedia.org CP_851.TXT
CODEPAGE 852 # Latin-2 (Central European), with EUR
0xaa 0x20ac #EURO SIGN - FreeDOS specific
EXTENDS FILE mapping-unicode.org CP_852.TXT
CODEPAGE 853 # Latin-3 (Turkish, Maltese, and Esperanto)
0xaa 0x20ac #EURO SIGN - FreeDOS specific
0xd0 0x00a2 #CENT SIGN - FreeDOS specific
0xd1 0x00a5 #YEN SIGN - FreeDOS specific
0xf1 0x00b1 #PLUS-MINUS SIGN - FreeDOS specific
0xdd 0x20a4 #LIRA SIGN - FreeDOS specific
0xfb 0x20b7 #SPESMILO SIGN - FreeDOS specific
EXTENDS FILE mapping-wikipedia.org CP_853.TXT
CODEPAGE 855 # South Slavic, Cyrillic
EXTENDS FILE mapping-unicode.org CP_855.TXT
CODEPAGE 856 # Hebrew-2, with EUR
0xad 0x20ac #EURO SIGN - FreeDOS specific
EXTENDS FILE mapping-unicode.org CP_856.TXT
CODEPAGE 857 # Latin-5, with EUR
0xd5 0x20ac #EURO SIGN - FreeDOS specific
EXTENDS FILE mapping-unicode.org CP_857.TXT
CODEPAGE 858 # Latin-1 (Western European), with EUR
0xd5 0x20ac #EURO SIGN - FreeDOS specific
EXTENDS CODEPAGE 850
CODEPAGE 859 # Latin-9 (Western European), with EUR
# reference: https://en.wikipedia.org/wiki/Code_page_859
0xab 0x0153 #LATIN SMALL LIGATURE OE
0xac 0x0152 #LATIN CAPITAL LIGATURE OE
0xd5 0x20ac #EURO SIGN
0xdd 0x0160 #LATIN CAPITAL LETTER S WITH CARON
0xef 0x017d #LATIN CAPITAL LETTER Z WITH CARON
0xf3 0x0178 #LATIN CAPITAL LETTER Y WITH DIAERESIS
0xf7 0x017e #LATIN SMALL LETTER Z WITH CARON
0xf9 0x0161 #LATIN SMALL LETTER S WITH CARON
EXTENDS CODEPAGE 850
CODEPAGE 860 # Portuguese
EXTENDS FILE mapping-unicode.org CP_860.TXT
CODEPAGE 861 # Icelandic
EXTENDS FILE mapping-unicode.org CP_861.TXT
CODEPAGE 862 # Hebrew-2
EXTENDS FILE mapping-unicode.org CP_862.TXT
CODEPAGE 863 # Canadian French
EXTENDS FILE mapping-unicode.org CP_863.TXT
CODEPAGE 864 # Arabic
# 0x9b TODO: unidentified character - FreeDOS specific
# 0x9c TODO: unidentified character - FreeDOS specific
# 0x9f TODO: unidentified character - FreeDOS specific
# 0xa6 TODO: unidentified character - FreeDOS specific
# 0xa7 TODO: unidentified character - FreeDOS specific
EXTENDS FILE mapping-unicode.org CP_864.TXT
CODEPAGE 865 # Nordic
EXTENDS FILE mapping-unicode.org CP_865.TXT
CODEPAGE 866 # Russian, Cyrillic
# Note: this is NOT an alternative layout mentioned here:
# https://en.wikipedia.org/wiki/Code_page_866
EXTENDS FILE mapping-unicode.org CP_866.TXT
CODEPAGE 867 # Czech and Slovak, Kamenicky encoding
# reference: https://en.wikipedia.org/wiki/Kamenick%C3%BD_encoding
0x80 0x010c #LATIN CAPITAL LETTER C WITH CARON
0x83 0x010f #LATIN SMALL LETTER D WITH CARON
0x85 0x010e #LATIN CAPITAL LETTER D WITH CARON
0x86 0x0164 #LATIN CAPITAL LETTER T WITH CARON
0x87 0x010d #LATIN SMALL LETTER C WITH CARON
0x88 0x011b #LATIN SMALL LETTER E WITH CARON
0x89 0x011a #LATIN CAPITAL LETTER E WITH CARON
0x8a 0x0139 #LATIN CAPITAL LETTER L WITH ACUTE
0x8b 0x00cd #LATIN CAPITAL LETTER I WITH ACUTE
0x8c 0x013e #LATIN SMALL LETTER L WITH CARON
0x8d 0x013a #LATIN SMALL LETTER L WITH ACUTE
0x8f 0x00c1 #LATIN CAPITAL LETTER A WITH ACUTE
0x91 0x017e #LATIN SMALL LETTER Z WITH CARON
0x92 0x017d #LATIN CAPITAL LETTER Z WITH CARON
0x95 0x00d3 #LATIN CAPITAL LETTER O WITH ACUTE
0x96 0x016f #LATIN SMALL LETTER U WITH RING ABOVE
0x97 0x00da #LATIN CAPITAL LETTER U WITH ACUTE
0x98 0x00fd #LATIN SMALL LETTER Y WITH ACUTE
0x9b 0x0160 #LATIN CAPITAL LETTER S WITH CARON
0x9c 0x013d #LATIN CAPITAL LETTER L WITH CARON
0x9d 0x00dd #LATIN CAPITAL LETTER Y WITH ACUTE
0x9e 0x0158 #LATIN CAPITAL LETTER R WITH CARON
0x9f 0x0165 #LATIN SMALL LETTER T WITH CARON
0xa4 0x0148 #LATIN SMALL LETTER N WITH CARON
0xa5 0x0147 #LATIN CAPITAL LETTER N WITH CARON
0xa6 0x016e #LATIN CAPITAL LETTER U WITH RING ABOVE
0xa7 0x00d4 #LATIN CAPITAL LETTER O WITH CIRCUMFLEX
0xa8 0x0161 #LATIN SMALL LETTER S WITH CARON
0xa9 0x0159 #LATIN SMALL LETTER R WITH CARON
0xaa 0x0155 #LATIN SMALL LETTER R WITH ACUTE
0xab 0x0154 #LATIN CAPITAL LETTER R WITH ACUTE
0xad 0x00a7 #SECTION SIGN
EXTENDS CODEPAGE 437
CODEPAGE 869 # Greek, with EUR
0x87 0x20ac #EURO SIGN - FreeDOS specific
EXTENDS FILE mapping-unicode.org CP_869.TXT
CODEPAGE 872 # South Slavic, Cyrillic, with EUR
0xcf 0x20ac #EURO SIGN - FreeDOS specific
EXTENDS CODEPAGE 855
CODEPAGE 899 # Armenian, ArmSCII-8A encoding
0xff 0x055b #ARMENIAN EMPHASIS MARK - FreeDOS specific
EXTENDS FILE mapping-wikipedia.org CP_899.TXT
CODEPAGE 874 # Thai, with EUR
EXTENDS FILE mapping-unicode.org CP_874.TXT
CODEPAGE 991 # Polish, Mazovia encoding, with PLN
0x9b 0xfffd #replacement for PLN SYMBOL, symbol not available in Unicode
EXTENDS CODEPAGE 667
CODEPAGE 1116 # Estonian
# reference: https://en.wikipedia.org/wiki/Code_page_1116
0xd1 0x0161 #LATIN SMALL LETTER S WITH CARON
0xd2 0x0160 #LATIN CAPITAL LETTER S WITH CARON
0xe7 0x017e #LATIN SMALL LETTER Z WITH CARON
0xe8 0x017d #LATIN CAPITAL LETTER Z WITH CARON
EXTENDS CODEPAGE 850
CODEPAGE 1117 # Latvian
# reference: https://en.wikipedia.org/wiki/Code_page_1117
EXTENDS FILE mapping-wikipedia.org CP_1117.TXT
CODEPAGE 1118 # Lithuanian, LST 1283 encoding
# reference: https://en.wikipedia.org/wiki/Code_page_1118
0xb5 0x0104 #LATIN CAPITAL LETTER A WITH OGONEK
0xb6 0x010c #LATIN CAPITAL LETTER C WITH CARON
0xb7 0x0118 #LATIN CAPITAL LETTER E WITH OGONEK
0xb8 0x0116 #LATIN CAPITAL LETTER E WITH DOT ABOVE
0xbd 0x012e #LATIN CAPITAL LETTER I WITH OGONEK
0xbe 0x0160 #LATIN CAPITAL LETTER S WITH CARON
0xc6 0x0172 #LATIN CAPITAL LETTER U WITH OGONEK
0xc7 0x016a #LATIN CAPITAL LETTER U WITH MACRON
0xcf 0x017d #LATIN CAPITAL LETTER Z WITH CARON
0xd0 0x0105 #LATIN SMALL LETTER A WITH OGONEK
0xd1 0x010d #LATIN SMALL LETTER C WITH CARON
0xd2 0x0119 #LATIN SMALL LETTER E WITH OGONEK
0xd3 0x0117 #LATIN SMALL LETTER E WITH DOT ABOVE
0xd4 0x012f #LATIN SMALL LETTER I WITH OGONEK
0xd5 0x0161 #LATIN SMALL LETTER S WITH CARON
0xd6 0x0173 #LATIN SMALL LETTER U WITH OGONEK
0xd7 0x016b #LATIN SMALL LETTER U WITH MACRON
0xd8 0x017e #LATIN SMALL LETTER Z WITH CARON
0xe1 0x03b2 #GREEK SMALL LETTER BETA
0xef 0x22c2 #N-ARY INTERSECTION
0xf4 0x201e #DOUBLE LOW-9 QUOTATION MARK
0xf5 0x201c #LEFT DOUBLE QUOTATION MARK
0xfa 0x02d9 #DOT ABOVE
EXTENDS CODEPAGE 437
CODEPAGE 1119 # Lithuanian and Russian, Cyrillic, LST 1284 encoding
# reference: https://en.wikipedia.org/wiki/Code_page_866
0xb5 0x0104 #LATIN CAPITAL LETTER A WITH OGONEK
0xb6 0x010c #LATIN CAPITAL LETTER C WITH CARON
0xb7 0x0118 #LATIN CAPITAL LETTER E WITH OGONEK
0xb8 0x0116 #LATIN CAPITAL LETTER E WITH DOT ABOVE
0xbd 0x012e #LATIN CAPITAL LETTER I WITH OGONEK
0xbe 0x0160 #LATIN CAPITAL LETTER S WITH CARON
0xc6 0x0172 #LATIN CAPITAL LETTER U WITH OGONEK
0xc7 0x016a #LATIN CAPITAL LETTER U WITH MACRON
0xcf 0x017d #LATIN CAPITAL LETTER Z WITH CARON
0xd0 0x0105 #LATIN SMALL LETTER A WITH OGONEK
0xd1 0x010d #LATIN SMALL LETTER C WITH CARON
0xd2 0x0119 #LATIN SMALL LETTER E WITH OGONEK
0xd3 0x0117 #LATIN SMALL LETTER E WITH DOT ABOVE
0xd4 0x012f #LATIN SMALL LETTER I WITH OGONEK
0xd5 0x0161 #LATIN SMALL LETTER S WITH CARON
0xd6 0x0173 #LATIN SMALL LETTER U WITH OGONEK
0xd7 0x016b #LATIN SMALL LETTER U WITH MACRON
0xd8 0x017e #LATIN SMALL LETTER Z WITH CARON
0xf2 0x2265 #GREATER-THAN OR EQUAL TO
0xf3 0x2264 #LESS-THAN OR EQUAL TO
0xf4 0x201e #DOUBLE LOW-9 QUOTATION MARK
0xf5 0x201c #LEFT DOUBLE QUOTATION MARK
0xf6 0x00f7 #DIVISION SIGN
0xf7 0x2248 #ALMOST EQUAL TO
0xfc 0x207f #SUPERSCRIPT LATIN SMALL LETTER N
0xfd 0x00b2 #SUPERSCRIPT TWO
EXTENDS CODEPAGE 866
CODEPAGE 1125 # Ukrainian, Cyrillic
# reference: https://en.wikipedia.org/wiki/Code_page_866
0xf2 0x0490 #CYRILLIC CAPITAL LETTER GHE WITH UPTURN
0xf3 0x0491 #CYRILLIC SMALL LETTER GHE WITH UPTURN
0xf4 0x0404 #CYRILLIC CAPITAL LETTER UKRAINIAN IE
0xf5 0x0454 #CYRILLIC SMALL LETTER UKRAINIAN IE
0xf6 0x0406 #CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
0xf7 0x0456 #CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
0xf8 0x0407 #CYRILLIC CAPITAL LETTER YI
0xf9 0x0457 #CYRILLIC SMALL LETTER YI
0xfa 0x00f7 #DIVISION SIGN