You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
Copy file name to clipboardExpand all lines: scriptshifter/tables/data/arabic.yml
+58-54Lines changed: 58 additions & 54 deletions
Original file line number
Diff line number
Diff line change
@@ -4,7 +4,8 @@
4
4
---
5
5
general:
6
6
name: Arabic
7
-
description: Arabic R2S using a conversion table and S2R using a 3rd party library.
7
+
description: >
8
+
Arabic R2S using a conversion table and S2R using a 3rd party library.
8
9
case_sensitive: false
9
10
10
11
parents:
@@ -16,17 +17,18 @@ roman_to_script:
16
17
17
18
# Original table by David Bucknum
18
19
# Last updated 25 January 2019
19
-
# Modified by WK with testing by Arabic Cat Staff LOC-CAIRO
20
-
# Additional info from R. Vassie, [n.d.] "Marrying the Arabic and Latin Scripts Conceptually"
20
+
# Modified by WK with testing by Arabic Cat Staff LOC-CAIRO
21
+
# Additional info from R. Vassie, [n.d.] "Marrying the Arabic and Latin
22
+
# Scripts Conceptually"
21
23
22
24
23
-
# Punctuation marks:
25
+
# Punctuation marks:
24
26
"*": "\u066D"
25
27
",": "\u060C"
26
28
";": "\u061B"
27
29
"?": "\u061F"
28
30
29
-
# Exceptions for specific words
31
+
# Exceptions for specific words
30
32
# Allah
31
33
"Alla\u0304h": "\u0627\u0644\u0644\u0647"
32
34
@@ -66,19 +68,19 @@ roman_to_script:
66
68
67
69
# "sh[dot below]" as in "Ishaq"
68
70
69
-
"%sh\u0323%": "\u0633\u062D"
71
+
"sh\u0323": "\u0633\u062D"
70
72
71
73
# "s[prime]h" combos
72
74
73
-
"%s\u02B9h%": "\u0633\u0647"
75
+
"s\u02B9h": "\u0633\u0647"
74
76
75
77
# "th[dot below]"
76
78
77
-
"%th\u0323%": "\u062A\u062D"
79
+
"th\u0323": "\u062A\u062D"
78
80
79
-
# dh[dot under]
81
+
# dh[dot under]
80
82
81
-
"%dh\u0323%": "\u062F\u062D"
83
+
"dh\u0323": "\u062F\u062D"
82
84
83
85
# La-hu
84
86
@@ -96,7 +98,9 @@ roman_to_script:
96
98
"mi\u02BEat": "\u0645\u0627\u0626\u0629"
97
99
"mi\u02BCat": "\u0645\u0627\u0626\u0629"
98
100
99
-
# Numbers (I have set these to Hindi numbers. Note that Persian and Urdu will technically use \u06F0-06F9. This needs further discussion with PSD as RLIN21 used Hindi numbers, Connexion and Voyager does not.)
101
+
# Numbers (I have set these to Hindi numbers. Note that Persian and Urdu
102
+
# will technically use \u06F0-\u06F9. This needs further discussion with PSD
103
+
# as RLIN21 used Hindi numbers, Connexion and Voyager do not.)
# truncation necessary? It seems to work fine with.
165
+
# truncation necessary? It seems to work fine with.
162
166
163
-
"%i\u0304\u02BEah": "\u064A\u0626\u0629"
164
-
"%i\u0304\u02BCah": "\u064A\u0626\u0629"
167
+
"i\u0304\u02BEah%": "\u064A\u0626\u0629"
168
+
"i\u0304\u02BCah%": "\u064A\u0626\u0629"
165
169
166
-
"%i\u0304\u02BEat": "\u064A\u0626\u0629"
167
-
"%i\u0304\u02BCat": "\u064A\u0626\u0629"
170
+
"i\u0304\u02BEat%": "\u064A\u0626\u0629"
171
+
"i\u0304\u02BCat%": "\u064A\u0626\u0629"
168
172
169
-
"%i\u02BEa\u0304": "\u0626\u0627"
170
-
"%i\u02BCa\u0304": "\u0626\u0627"
173
+
"i\u02BEa\u0304%": "\u0626\u0627"
174
+
"i\u02BCa\u0304%": "\u0626\u0627"
171
175
172
-
"%i\u02BE": "\u0626"
173
-
"%i\u02BC": "\u0626"
176
+
"i\u02BE%": "\u0626"
177
+
"i\u02BC%": "\u0626"
174
178
"a\u0304\u02BEa\u0304": "\u0627\u0621\u0627"
175
179
"a\u0304\u02BCa\u0304": "\u0627\u0621\u0627"
176
-
180
+
177
181
"a\u02BE": "\u0623"
178
182
"a\u02BC": "\u0623"
179
183
"\u02BEi": "\u0626"
@@ -198,64 +202,66 @@ roman_to_script:
198
202
"a\u0304\u02BEi": "\u0627\u0626"
199
203
"a\u0304\u02BC": "\u0627\u0621"
200
204
"a\u0304\u02BE": "\u0627\u0621"
201
-
"A\u0304%": "\u0622"
202
-
"a\u0304%": "\u0622"
205
+
"%A\u0304": "\u0622"
206
+
"%a\u0304": "\u0622"
203
207
"A\u0304": "\u0627"
204
208
"a\u0304": "\u0627"
205
209
206
-
# These next two lines were intended to convert to alif-ayn when it is at the beginning of a word, definite or indefinine (i.e. al-a[ayn]ma[macron]l or [space]a[ayn]ma[macron]l"
207
-
"A\u02BB%": "\u0623\u0639"
208
-
"a\u02BB%": "\u0623\u0639"
210
+
# These next two lines were intended to convert to alif-ayn when it is at
211
+
# the beginning of a word, definite or indefinite (i.e.
212
+
# al-a[ayn]ma[macron]l or [space]a[ayn]ma[macron]l)
213
+
"%A\u02BB": "\u0623\u0639"
214
+
"%a\u02BB": "\u0623\u0639"
209
215
"a\u02BB": "\u0639"
210
216
"A\u0301": "\u0649"
211
217
"a\u0301": "\u0649"
212
218
213
219
"ayy": "\u064A"
214
-
"A%": "\u0623"
215
-
"a%": "\u0627"
220
+
"%A": "\u0623"
221
+
"%a": "\u0627"
216
222
"A": "\u0623"
217
223
"a": ""
218
224
219
225
# I - Capital I at beginning of word is usually alif hamzah-below.
0 commit comments