diff options
Diffstat (limited to 'arabluatex_voc.lua')
-rw-r--r-- | arabluatex_voc.lua | 116 |
1 files changed, 59 insertions, 57 deletions
diff --git a/arabluatex_voc.lua b/arabluatex_voc.lua index 0097450..0331794 100644 --- a/arabluatex_voc.lua +++ b/arabluatex_voc.lua | |||
@@ -93,8 +93,9 @@ hamza = { | |||
93 | {a="'i'([^uaiUAI])", b="إI%1"}, | 93 | {a="'i'([^uaiUAI])", b="إI%1"}, |
94 | -- madda (historic writing below) | 94 | -- madda (historic writing below) |
95 | {a="'a'([^uaiUAI])", b="آ%1"}, | 95 | {a="'a'([^uaiUAI])", b="آ%1"}, |
96 | --tmp {a="'a?A([%_%^%.]?[%`%'btjghdrzsfqklmnywAY])", b="آ%1"}, | 96 | {a="([^uiUI])\'a?A([%_%^%.]?[%`%'btjghdrzsfqklmnywAY])", b="%1آ%2"}, |
97 | {a="([^UIui])'a?A([%_%^%.]?[%`%'btjghdrzsfqklmnywAY])", b="%1آ%2"}, | 97 | {a="^\'a?A([%_%^%.]?[%`%'btjghdrzsfqklmnywAY])", b="آ%1"}, |
98 | {a="(%W)\'a?A([%_%^%.]?[%`%'btjghdrzsfqklmnywAY])", b="%1آ%2"}, | ||
98 | {a="(A)(')(uN?)$", b="aآء%3"}, | 99 | {a="(A)(')(uN?)$", b="aآء%3"}, |
99 | {a="(A)(')(uN?)(%W)", b="aآء%3%4"}, | 100 | {a="(A)(')(uN?)(%W)", b="aآء%3%4"}, |
100 | {a="(A)(')(iN?)$", b="aآء%3"}, | 101 | {a="(A)(')(iN?)$", b="aآء%3"}, |
@@ -179,8 +180,9 @@ hamzaeasy = { -- differences marked below with 'easy' | |||
179 | {a="'i'([^uaiUAI])", b="إI%1"}, | 180 | {a="'i'([^uaiUAI])", b="إI%1"}, |
180 | -- madda (historic writing below) | 181 | -- madda (historic writing below) |
181 | {a="'a'([^uaiUAI])", b="آ%1"}, | 182 | {a="'a'([^uaiUAI])", b="آ%1"}, |
182 | --tmp {a="'a?A([%_%^%.]?[%`%'btjghdrzsfqklmnywAY])", b="آ%1"}, | 183 | {a="([^uiUI])\'a?A([%_%^%.]?[%`%'btjghdrzsfqklmnywAY])", b="%1آ%2"}, |
183 | {a="([^UIui])'a?A([%_%^%.]?[%`%'btjghdrzsfqklmnywAY])", b="%1آ%2"}, | 184 | {a="^\'a?A([%_%^%.]?[%`%'btjghdrzsfqklmnywAY])", b="آ%1"}, |
185 | {a="(%W)\'a?A([%_%^%.]?[%`%'btjghdrzsfqklmnywAY])", b="%1آ%2"}, | ||
184 | --easy (begin) | 186 | --easy (begin) |
185 | {a="(A)(')(uN?)$", b="aاء%3"}, | 187 | {a="(A)(')(uN?)$", b="aاء%3"}, |
186 | {a="(A)(')(uN?)(%W)", b="aاء%3%4"}, | 188 | {a="(A)(')(uN?)(%W)", b="aاء%3%4"}, |
@@ -246,69 +248,69 @@ hamzaeasy = { -- differences marked below with 'easy' | |||
246 | } | 248 | } |
247 | 249 | ||
248 | tanwin = { | 250 | tanwin = { |
249 | {a="uNU", b="ٌو"}, | 251 | {a="%-?uNU", b="ٌو"}, |
250 | {a="aNU", b="ًوا"}, | 252 | {a="%-?aNU", b="ًوا"}, |
251 | {a="iNU", b="ٍو"}, | 253 | {a="%-?iNU", b="ٍو"}, |
252 | -- assimilations (begin) | 254 | -- assimilations (begin) |
253 | {a="(uN)(%s)([rlmnwy])", b="ٌ%2%3%3"}, | 255 | {a="%-?(uN)(%s)([rlmnwy])", b="ٌ%2%3%3"}, |
254 | {a="(aN)(_A)(%s)([rlmnwy])", b="ًى%3%4%4"}, | 256 | {a="%-?(aN)(_A)(%s)([rlmnwy])", b="ًى%3%4%4"}, |
255 | {a="(aN)(Y)(%s)([rlmnwy])", b="ًى%3%4%4"}, | 257 | {a="%-?(aN)(Y)(%s)([rlmnwy])", b="ًى%3%4%4"}, |
256 | {a="(T)(aN)(%s)([rlmnwy])", b="%1ً%3%4%4"}, | 258 | {a="(T)%-?(aN)(%s)([rlmnwy])", b="%1ً%3%4%4"}, |
257 | {a="(ء)(aN)(%s)([rlmnwy])", b="%1ً%3%4%4"}, | 259 | {a="(ء)%-?(aN)(%s)([rlmnwy])", b="%1ً%3%4%4"}, |
258 | {a="([^TA])(aN)(%s)([rlmnwy])", b="%1ًا%3%4%4"}, | 260 | {a="([^TA])%-?(aN)(%s)([rlmnwy])", b="%1ًا%3%4%4"}, |
259 | {a="(iN)(%s)([rlmnwy])", b="ٍ%2%3%3"}, | 261 | {a="%-?(iNI?)(%s)([rlmnwy])", b="ٍ%2%3%3"}, |
260 | -- assimilations (end) | 262 | -- assimilations (end) |
261 | -- quoted tanwīn (begin) | 263 | -- quoted tanwīn (begin) |
262 | {a="(\"uN)", b=""}, | 264 | {a="%-?(\"uN)", b=""}, |
263 | {a="(B)(\"aN)", b="%1"}, | 265 | {a="(B)%-?(\"aN)", b="%1"}, |
264 | {a="(\"aN)(_A)", b="ى"}, | 266 | {a="%-?(\"aN)(_A)", b="ى"}, |
265 | {a="(\"aN)(Y)", b="ى"}, | 267 | {a="%-?(\"aN)(Y)", b="ى"}, |
266 | {a="(T)(\"aN)", b="%1"}, | 268 | {a="(T)%-?(\"aN)", b="%1"}, |
267 | {a="(ء)(\"aN)", b="%1"}, | 269 | {a="(ء)%-?(\"aN)", b="%1"}, |
268 | {a="([^TA])(\"aN)", b="%1ا"}, | 270 | {a="([^TA])%-?(\"aN)", b="%1ا"}, |
269 | {a="(\"iN)", b=""}, | 271 | {a="%-?(\"iNI?)", b=""}, |
270 | -- quoted tanwīn (end) | 272 | -- quoted tanwīn (end) |
271 | {a="(uN)", b="ٌ"}, | 273 | {a="%-?(uN)", b="ٌ"}, |
272 | {a="(B)(aN)", b="%1ً"}, | 274 | {a="(B)%-?(aN)", b="%1ً"}, |
273 | {a="(aN)(_A)", b="ًى"}, | 275 | {a="%-?(aN)(_A)", b="ًى"}, |
274 | {a="(aN)(Y)", b="ًى"}, | 276 | {a="%-?(aN)(Y)", b="ًى"}, |
275 | {a="(T)(aN)", b="%1ً"}, | 277 | {a="(T)%-?(aN)", b="%1ً"}, |
276 | {a="(ء)(aN)", b="%1ً"}, | 278 | {a="(ء)%-?(aN)", b="%1ً"}, |
277 | {a="([^TA])(aN)", b="%1ًا"}, | 279 | {a="([^TA])%-?(aN)", b="%1ًا"}, |
278 | {a="(iNI?)", b="ٍ"} | 280 | {a="%-?(iNI?)", b="ٍ"} |
279 | } | 281 | } |
280 | 282 | ||
281 | tanwineasy = { -- 'easy' requires some lines to be taken out: | 283 | tanwineasy = { -- 'easy' requires some lines to be taken out: |
282 | {a="uNU", b="ٌو"}, | 284 | {a="%-?uNU", b="ٌو"}, |
283 | {a="aNU", b="ًوا"}, | 285 | {a="%-?aNU", b="ًوا"}, |
284 | {a="iNU", b="ٍو"}, | 286 | {a="%-?iNU", b="ٍو"}, |
285 | -- assimilations (begin) | 287 | -- assimilations (begin) |
286 | -- {a="(uN)(%s)([rlmnwy])", b="ٌ%2%3%3"}, | 288 | -- {a="%-?(uN)(%s)([rlmnwy])", b="ٌ%2%3%3"}, |
287 | -- {a="(aN)(_A)(%s)([rlmnwy])", b="ًى%3%4%4"}, | 289 | -- {a="%-?(aN)(_A)(%s)([rlmnwy])", b="ًى%3%4%4"}, |
288 | -- {a="(aN)(Y)(%s)([rlmnwy])", b="ًى%3%4%4"}, | 290 | -- {a="%-?(aN)(Y)(%s)([rlmnwy])", b="ًى%3%4%4"}, |
289 | -- {a="(T)(aN)(%s)([rlmnwy])", b="%1ً%3%4%4"}, | 291 | -- {a="(T)%-?(aN)(%s)([rlmnwy])", b="%1ً%3%4%4"}, |
290 | -- {a="(ء)(aN)(%s)([rlmnwy])", b="%1ً%3%4%4"}, | 292 | -- {a="(ء)%-?(aN)(%s)([rlmnwy])", b="%1ً%3%4%4"}, |
291 | -- {a="([^TA])(aN)(%s)([rlmnwy])", b="%1ًا%3%4%4"}, | 293 | -- {a="([^TA])%-?(aN)(%s)([rlmnwy])", b="%1ًا%3%4%4"}, |
292 | -- {a="(iN)(%s)([rlmnwy])", b="ٍ%2%3%3"}, | 294 | -- {a="%-?(iNI?)(%s)([rlmnwy])", b="ٍ%2%3%3"}, |
293 | -- assimilations (end) | 295 | -- assimilations (end) |
294 | -- quoted tanwīn (begin) | 296 | -- quoted tanwīn (begin) |
295 | {a="(\"uN)", b=""}, | 297 | {a="%-?(\"uN)", b=""}, |
296 | {a="(B)(\"aN)", b="%1"}, | 298 | {a="(B)%-?(\"aN)", b="%1"}, |
297 | {a="(\"aN)(_A)", b="ى"}, | 299 | {a="%-?(\"aN)(_A)", b="ى"}, |
298 | {a="(\"aN)(Y)", b="ى"}, | 300 | {a="%-?(\"aN)(Y)", b="ى"}, |
299 | {a="(T)(\"aN)", b="%1"}, | 301 | {a="(T)%-?(\"aN)", b="%1"}, |
300 | {a="(ء)(\"aN)", b="%1"}, | 302 | {a="(ء)%-?(\"aN)", b="%1"}, |
301 | {a="([^TA])(\"aN)", b="%1ا"}, | 303 | {a="([^TA])%-?(\"aN)", b="%1ا"}, |
302 | {a="(\"iN)", b=""}, | 304 | {a="%-?(\"iNI?)", b=""}, |
303 | -- quoted tanwīn (end) | 305 | -- quoted tanwīn (end) |
304 | {a="(uN)", b="ٌ"}, | 306 | {a="%-?(uN)", b="ٌ"}, |
305 | {a="(B)(aN)", b="%1ً"}, | 307 | {a="(B)%-?(aN)", b="%1ً"}, |
306 | {a="(aN)(_A)", b="ًى"}, | 308 | {a="%-?(aN)(_A)", b="ًى"}, |
307 | {a="(aN)(Y)", b="ًى"}, | 309 | {a="%-?(aN)(Y)", b="ًى"}, |
308 | {a="(T)(aN)", b="%1ً"}, | 310 | {a="(T)%-?(aN)", b="%1ً"}, |
309 | {a="(ء)(aN)", b="%1ً"}, | 311 | {a="(ء)%-?(aN)", b="%1ً"}, |
310 | {a="([^TA])(aN)", b="%1ًا"}, | 312 | {a="([^TA])%-?(aN)", b="%1ًا"}, |
311 | {a="(iNI?)", b="ٍ"} | 313 | {a="%-?(iNI?)", b="ٍ"} |
312 | } | 314 | } |
313 | 315 | ||
314 | trigraphs = { -- trigraphs or more | 316 | trigraphs = { -- trigraphs or more |
@@ -452,7 +454,7 @@ digraphs = { | |||
452 | --tmp-added hyphen + initial alif without hamza: | 454 | --tmp-added hyphen + initial alif without hamza: |
453 | {a="(%-)([uai])([%^%_%.%`]?)(%a)", b="%1ا%3%4"}, | 455 | {a="(%-)([uai])([%^%_%.%`]?)(%a)", b="%1ا%3%4"}, |
454 | {a="^([uai])", b="ا%1"}, -- initial alif without hamza | 456 | {a="^([uai])", b="ا%1"}, -- initial alif without hamza |
455 | {a="(%s)([uai])", b="%1ا%2"}, -- initial alif without hamza | 457 | {a="(%s)([uai])", b="%1ا"}, -- initial alif without hamza |
456 | {a="%-%-", b="ـ"}, | 458 | {a="%-%-", b="ـ"}, |
457 | {a="ؤؤ", b="ؤّ"}, | 459 | {a="ؤؤ", b="ؤّ"}, |
458 | {a="أأ", b="أّ"}, | 460 | {a="أأ", b="أّ"}, |