-
-
Notifications
You must be signed in to change notification settings - Fork 1
/
transliterationTests.json
151 lines (151 loc) · 10.2 KB
/
transliterationTests.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
{
"canonical_source": "https://github.com/indic-transliteration/indic_transliteration_scala/blob/master/src/test/resources/transliterationTests.json",
"comments": "Shared transliteration tests. In each test, the dev field is compulsory.",
"TODO": [
"Add tests for ॐ, handling of .Da in kannada.",
"various fraction symbols in various scripts"
],
"devanaagarii_round_trip": [
{
"description": "A general test. Checks punctuations, OM.",
"dev": "असय औषधिः ग्रन्थः! ॡकारो नास्ति लेशोऽपि संशयः। कीलकम्? कूपिः? कष्ठं भोः। शङ्कर! ज्ञानम्। सञ्जीवय। १२३४५॥ ॐ तत्।",
"iast": "asaya auṣadhiḥ granthaḥ! ḹkāro nāsti leśo'pi saṃśayaḥ. kīlakam? kūpiḥ? kaṣṭhaṃ bhoḥ. śaṅkara! jñānam. sañjīvaya. 12345.. oṃ tat.",
"iastDcs": "asaya auṣadhiḥ granthaḥ! ḹkāro nāsti leśo'pi saṃśayaḥ/ kīlakam? kūpiḥ? kaṣṭhaṃ bhoḥ/ śaṅkara! jñānam/ sañjīvaya/ 12345// aum tat/",
"hk": "asaya auSadhiH granthaH! lRRkAro nAsti lezo'pi saMzayaH| kIlakam? kUpiH? kaSThaM bhoH| zaGkara! jJAnam| saJjIvaya| 12345|| OM tat|",
"optitrans": "asaya auShadhiH granthaH! LLIkaaro naasti lesho.api saMshayaH. kiilakam? kuupiH? kaShThaM bhoH. shankara! JNaanam. sanjiivaya. 12345.. OM tat.",
"slp": "asaya OzaDiH granTaH! XkAro nAsti leSo'pi saMSayaH. kIlakam? kUpiH? kazWaM BoH. SaNkara! jYAnam. saYjIvaya. 12345.. oM tat.",
"wx": "asaya ORaXiH granWaH! ḹkAro nAswi leSoZpi saMSayaH. kIlakam? kUpiH? kaRTaM BoH. Safkara! jFAnam. saFjIvaya. 12345.. oM waw.",
"kannada": "ಅಸಯ ಔಷಧಿಃ ಗ್ರನ್ಥಃ! ೡಕಾರೋ ನಾಸ್ತಿ ಲೇಶೋಽಪಿ ಸಂಶಯಃ। ಕೀಲಕಮ್? ಕೂಪಿಃ? ಕಷ್ಠಂ ಭೋಃ। ಶಙ್ಕರ! ಜ್ಞಾನಮ್। ಸಞ್ಜೀವಯ। ೧೨೩೪೫॥ ಓಂ ತತ್।",
"malayalam": "അസയ ഔഷധിഃ ഗ്രന്ഥഃ! ൡകാരോ നാസ്തി ലേശോഽപി സംശയഃ। കീലകമ്? കൂപിഃ? കഷ്ഠം ഭോഃ। ശങ്കര! ജ്ഞാനമ്। സഞ്ജീവയ। ൧൨൩൪൫॥ ഓം തത്।",
"telugu": "అసయ ఔషధిః గ్రన్థః! ౡకారో నాస్తి లేశోఽపి సంశయః। కీలకమ్? కూపిః? కష్ఠం భోః। శఙ్కర! జ్ఞానమ్। సఞ్జీవయ। ౧౨౩౪౫॥ ఓం తత్।",
"gujarati": "અસય ઔષધિઃ ગ્રન્થઃ! ૡકારો નાસ્તિ લેશોઽપિ સંશયઃ। કીલકમ્? કૂપિઃ? કષ્ઠં ભોઃ। શઙ્કર! જ્ઞાનમ્। સઞ્જીવય। ૧૨૩૪૫॥ ૐ તત્।",
"assamese": "অসয ঔষধিঃ গ্ৰন্থঃ! ৡকাৰো নাস্তি লেশোঽপি সংশযঃ। কীলকম্? কূপিঃ? কষ্ঠং ভোঃ। শঙ্কৰ! জ্ঞানম্। সঞ্জীবয। ১২৩৪৫॥ ॐ তত্।",
"oriya": "ଅସଯ ଔଷଧିଃ ଗ୍ରନ୍ଥଃ! ୡକାରୋ ନାସ୍ତି ଲେଶୋଽପି ସଂଶଯଃ। କୀଲକମ୍? କୂପିଃ? କଷ୍ଠଂ ଭୋଃ। ଶଙ୍କର! ଜ୍ଞାନମ୍। ସଞ୍ଜୀଵଯ। ୧୨୩୪୫॥ ଓଂ ତତ୍।",
"titus": "asaya auṣadʰiḥ grantʰaḥ! l̥̄kāro nāsti leśo'pi saṃśayaḥ. kīlakam? kūpiḥ? kaṣṭʰaṃ bʰoḥ. śaṅkara! jñānam. sañjīvaya. 12345.. oṃ tat."
},
{
"description": "Tests La",
"dev": "अग्निमीळे पुरोहितं यज्ञस्य देवमृत्विजम्",
"iast": "agnimīḻe purohitaṃ yajñasya devamṛtvijam",
"iastDcs": "agnimīḻe purohitaṃ yajñasya devamṛtvijam",
"hk": "agnimILe purohitaM yajJasya devamRtvijam",
"optitrans": "agnimiiLe purohitaM yaJNasya devamRtvijam",
"slp": "agnimILe purohitaM yajYasya devamftvijam",
"wx": "agnimIḻe purohiwaM yajFasya xevamqwvijam",
"kannada": "ಅಗ್ನಿಮೀಳೇ ಪುರೋಹಿತಂ ಯಜ್ಞಸ್ಯ ದೇವಮೃತ್ವಿಜಮ್",
"malayalam": "അഗ്നിമീളേ പുരോഹിതം യജ്ഞസ്യ ദേവമൃത്വിജമ്",
"telugu": "అగ్నిమీళే పురోహితం యజ్ఞస్య దేవమృత్విజమ్",
"sinhala": "අග්නිමීළේ පුරෝහිතං යජ්ඤස්ය දේවමෘත්විජම්",
"oriya": "ଅଗ୍ନିମୀଳେ ପୁରୋହିତଂ ଯଜ୍ଞସ୍ଯ ଦେଵମୃତ୍ଵିଜମ୍",
"gurmukhi": "ਅਗ੍ਨਿਮੀਲ਼ੇ ਪੁਰੋਹਿਤਂ ਯਜ੍ਞਸ੍ਯ ਦੇਵਮृਤ੍ਵਿਜਮ੍",
"gujarati": "અગ્નિમીળે પુરોહિતં યજ્ઞસ્ય દેવમૃત્વિજમ્",
"assamese": "অগ্নিমীळে পুৰোহিতং যজ্ঞস্য দেবমৃত্বিজম্"
},
{
"description": "Tests WX avagraha and anunAsika options",
"dev": "लेशोऽपि, साँयि",
"wx": "leSoZpi, sAzyi"
},
{
"description": "Tests glyphs with nuTka",
"TODO": "Fix assamese test",
"dev": "अंशाइ पड़िब फ़कीर ज़रूर",
"oriya": "ଅଂଶାଇ ପଡ଼ିବ ଫ଼କୀର ଜ଼ରୂର",
"gujarati": "અંશાઇ પડ઼િબ ફ઼કીર જ઼રૂર",
"assamese": "অংশাই পড়িৱ फ़কীৰ ज़ৰূৰ",
"gurmukhi": "ਅਂਸ਼ਾਇ ਪੜਿਬ ਫ਼ਕੀਰ ਜ਼ਰੂਰ",
"itrans": "aMshaai pa.Diba fakiira zaruura"
},
{
"description": "Tests ch",
"optitrans": "agnipanchiikaraNa",
"dev": "अग्निपञ्चीकरण"
},
{
"description": "Tests R RR",
"titus": "vr̥kṣyaṃ havīṃṣi gr̥hyanta r̥̄ṇamu pitr̥̄n//",
"dev": "वृक्ष्यं हवींषि गृह्यन्त ॠणमु पितॄन्॥"
},
{
"description": "Tests glyphs with nuTka - ऱ ऴ set",
"dev": "ऱ ऴ",
"malayalam": "റ ഴ",
"kannada": "ಱ ೞ"
},
{
"description": "ᳵ ᳶ",
"dev": "ᳵ ᳶ",
"kannada": "ೱ ೲ"
},
{
"description": "Tests nuTka",
"comments": "malayalam and telugu have no nuTka",
"dev": "़",
"oriya": "଼",
"gujarati": "઼",
"assamese": "়",
"bengali": "়",
"kannada": "಼",
"gurmukhi": "਼"
},
{
"description": "Tests anunAsika",
"dev": "अँअळा",
"oriya": "ଅଁଅଳା",
"kannada": "ಅಁಅಳಾ",
"malayalam": "അഁഅളാ",
"gujarati": "અઁઅળા",
"assamese": "অঁঅळা",
"bengali": "অঁঅळা",
"gurmukhi": "ਅਁਅਲ਼ਾ"
}
],
"to_devanaagarii": [
{
"description": "Tests optitrans anunAsikas",
"dev": "सङ्क्षेपः",
"optitrans": "sanxepaH"
},
{
"description": "Check aDDak and tippee",
"dev": "अब्भर अक्क मूंडा भुल्ला",
"gurmukhi": "ਅੱਭਰ ਅੱਕ ਮੂੰਡਾ ਭੁੱਲਾ"
},
{
"description": "Tests Capitalized IAST",
"dev": "असय औषधिः ग्रन्थः! ॡकारो।ऽस्ति। नास्ति लेशोऽपि संशयः। कीलकम्? कूपिः? काष्ठं भोः। शङ्कर! ज्ञानम्। सञ्जीवय। १२३४५॥ ॐ तत्।",
"iast": "Asaya Auṣadhiḥ granthaḥ! ḹkāro.'sti. nāsti leśo'pi saṃśayaḥ. kīlakam? kūpiḥ? kāṣṭhaṃ bhoḥ. Śaṅkara! jñānam. sañjīvaya. 12345|| oṃ tat."
},
{
"description": "svaras",
"dev": "तुवे꣡ असुर्यं᳡ व꣡सवो नि꣡ ऋण्वन्",
"iast": "tuvé asuryàṃ vásavo ní r̥ṇvan",
"nonSupportingPrograms": "scala/indic-transliteration"
}
],
"from_devanaagarii": [
{
"description": "A general test for scripts without equivalents for some devanAgarI letters, like gurmukhI, bengali and tamil",
"dev": "असय औषधिः ग्रन्थः! ॡकारो नास्ति लेशोऽपि संशयः। कीलकम्? कूपिः? कष्ठं भोः। शङ्कर! ज्ञानम्। सञ्जीवय। १२३४५॥ ॐ तत्। अब अव",
"bengali": "অসয ঔষধিঃ গ্রন্থঃ! ৡকারো নাস্তি লেশোঽপি সংশযঃ। কীলকম্? কূপিঃ? কষ্ঠং ভোঃ। শঙ্কর! জ্ঞানম্। সঞ্জীবয। ১২৩৪৫॥ ॐ তত্। অব অব",
"gurmukhi": "ਅਸਯ ਔਸ਼ਧਿਃ ਗ੍ਰਨ੍ਥਃ! ॡਕਾਰੋ ਨਾਸ੍ਤਿ ਲੇਸ਼ੋऽਪਿ ਸਂਸ਼ਯਃ। ਕੀਲਕਮ੍? ਕੂਪਿਃ? ਕਸ਼੍ਠਂ ਭੋਃ। ਸ਼ਙ੍ਕਰ! ਜ੍ਞਾਨਮ੍। ਸਞ੍ਜੀਵਯ। ੧੨੩੪੫॥ ੴ ਤਤ੍। ਅਬ ਅਵ"
},
{
"description": "A general test for Roman scripts without equivalents for some devanAgarI letters, like optitrans",
"dev": "पड़िब छीड़ा ऴ ऱ",
"optitrans": "pa.Diba ChI.DA .La .Rha",
"nonSupportingPrograms": "scala/indic-transliteration"
},
{
"description": "hrasva e and o",
"dev": "ऎट ऒट कॆकॊकि",
"optitrans": "ETa OTa kEkOki"
},
{
"description": "ea and oa",
"dev": "कॉफी ऍक ऑक",
"optitrans": "koaphI eaka oaka",
"nonSupportingPrograms": "scala/indic-transliteration"
}
]
}