You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
Copy file name to clipboardExpand all lines: scriptshifter/tables/data/arabic.yml
+53-46Lines changed: 53 additions & 46 deletions
Original file line number
Diff line number
Diff line change
@@ -4,7 +4,8 @@
4
4
---
5
5
general:
6
6
name: Arabic
7
-
description: Arabic R2S using a conversion table and S2R using a 3rd party library.
7
+
description: >
8
+
Arabic R2S using a conversion table and S2R using a 3rd party library.
8
9
case_sensitive: false
9
10
10
11
parents:
@@ -17,7 +18,8 @@ roman_to_script:
17
18
# Original table by David Bucknum
18
19
# Last updated 25 January 2019
19
20
# Modified by WK with testing by Arabic Cat Staff LOC-CAIRO
20
-
# Additional info from R. Vassie, [n.d.] "Marrying the Arabic and Latin Scripts Conceptually"
21
+
# Additional info from R. Vassie, [n.d.] "Marrying the Arabic and Latin
22
+
# Scripts Conceptually"
21
23
22
24
# Punctuation marks:
23
25
"*": "\u066D"
@@ -65,19 +67,19 @@ roman_to_script:
65
67
66
68
# "sh[dot below]" as in "Ishaq"
67
69
68
-
"%sh\u0323%": "\u0633\u062D"
70
+
"sh\u0323": "\u0633\u062D"
69
71
70
72
# "s[prime]h" combos
71
73
72
-
"%s\u02B9h%": "\u0633\u0647"
74
+
"s\u02B9h": "\u0633\u0647"
73
75
74
76
# "th[dot below]"
75
77
76
-
"%th\u0323%": "\u062A\u062D"
78
+
"th\u0323": "\u062A\u062D"
77
79
78
-
# dh[dot under]
80
+
# dh[dot under]
79
81
80
-
"%dh\u0323%": "\u062F\u062D"
82
+
"dh\u0323": "\u062F\u062D"
81
83
82
84
# La-hu
83
85
@@ -95,7 +97,9 @@ roman_to_script:
95
97
"mi\u02BEat": "\u0645\u0627\u0626\u0629"
96
98
"mi\u02BCat": "\u0645\u0627\u0626\u0629"
97
99
98
-
# Numbers (I have set these to Hindi numbers. Note that Persian and Urdu will technically use \u06F0-06F9. This needs further discussion with PSD as RLIN21 used Hindi numbers, Connexion and Voyager does not.)
100
+
# Numbers (I have set these to Hindi numbers. Note that Persian and Urdu
101
+
# will technically use \u06F0-06F9. This needs further discussion with PSD
102
+
# as RLIN21 used Hindi numbers, Connexion and Voyager do not.)
# truncation necessary? It seems to work fine with.
164
+
# truncation necessary? It seems to work fine with.
161
165
162
-
"%i\u0304\u02BEah": "\u064A\u0626\u0629"
163
-
"%i\u0304\u02BCah": "\u064A\u0626\u0629"
166
+
"i\u0304\u02BEah%": "\u064A\u0626\u0629"
167
+
"i\u0304\u02BCah%": "\u064A\u0626\u0629"
164
168
165
-
"%i\u0304\u02BEat": "\u064A\u0626\u0629"
166
-
"%i\u0304\u02BCat": "\u064A\u0626\u0629"
169
+
"i\u0304\u02BEat%": "\u064A\u0626\u0629"
170
+
"i\u0304\u02BCat%": "\u064A\u0626\u0629"
167
171
168
-
"%i\u02BEa\u0304": "\u0626\u0627"
169
-
"%i\u02BCa\u0304": "\u0626\u0627"
172
+
"i\u02BEa\u0304%": "\u0626\u0627"
173
+
"i\u02BCa\u0304%": "\u0626\u0627"
170
174
171
-
"%i\u02BE": "\u0626"
172
-
"%i\u02BC": "\u0626"
175
+
"i\u02BE%": "\u0626"
176
+
"i\u02BC%": "\u0626"
173
177
"a\u0304\u02BEa\u0304": "\u0627\u0621\u0627"
174
178
"a\u0304\u02BCa\u0304": "\u0627\u0621\u0627"
175
179
@@ -197,32 +201,34 @@ roman_to_script:
197
201
"a\u0304\u02BEi": "\u0627\u0626"
198
202
"a\u0304\u02BC": "\u0627\u0621"
199
203
"a\u0304\u02BE": "\u0627\u0621"
200
-
"A\u0304%": "\u0622"
201
-
"a\u0304%": "\u0622"
204
+
"%A\u0304": "\u0622"
205
+
"%a\u0304": "\u0622"
202
206
"A\u0304": "\u0627"
203
207
"a\u0304": "\u0627"
204
208
205
-
# These next two lines were intended to convert to alif-ayn when it is at the beginning of a word, definite or indefinine (i.e. al-a[ayn]ma[macron]l or [space]a[ayn]ma[macron]l"
206
-
"A\u02BB%": "\u0623\u0639"
207
-
"a\u02BB%": "\u0623\u0639"
209
+
# These next two lines were intended to convert to alif-ayn when it is at
210
+
# the beginning of a word, definite or indefinite (i.e.
211
+
# al-a[ayn]ma[macron]l or [space]a[ayn]ma[macron]l)
212
+
"%A\u02BB": "\u0623\u0639"
213
+
"%a\u02BB": "\u0623\u0639"
208
214
"a\u02BB": "\u0639"
209
215
"A\u0301": "\u0649"
210
216
"a\u0301": "\u0649"
211
217
212
218
"ayy": "\u064A"
213
-
"A%": "\u0623"
214
-
"a%": "\u0627"
219
+
"%A": "\u0623"
220
+
"%a": "\u0627"
215
221
"A": "\u0623"
216
222
"a": ""
217
223
218
224
# I - Capital I at beginning of word is usually alif hamzah-below.
0 commit comments