Skip to content

Commit 65181b6

Browse files
committed
Arabic edeprels.
1 parent 159c442 commit 65181b6

File tree

1 file changed

+31
-0
lines changed

1 file changed

+31
-0
lines changed

udapi/block/ud/ar/fixedeprels.py

Lines changed: 31 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,36 @@ class FixEdeprels(Block):
2424
'فَ': []
2525
}
2626

27+
# Reduction and normalization of prepositions and conjunctions, including
28+
# the derived and compound ones. The Latin transliterations are not really
29+
# needed in the process. We include them here as documentation, but also
30+
# to help the editor render these mixed-direction (RTL/LTR) lines. Ideally, each line
31+
# should have left-to-right text at both the beginning and end.
32+
substitution = [
33+
{'target': ('min:gen', 'مِن:gen'),
34+
'sources':
35+
[('ibtida min', 'اِبتِدَاء_مِن')]
36+
},
37+
{'target': ('ʾiṯra:gen', 'إِثرَ:gen'), # ʾiṯra = right after
38+
'sources':
39+
[('ʾiṯra', 'إِثرَ')]
40+
},
41+
{'target': ('ʾaṯnāʾa:gen', 'أَثنَاءَ:gen'), # ʾaṯnāʾa = during
42+
'sources':
43+
[('ʾaṯnāʾa', 'أَثنَاءَ')]
44+
},
45+
{'target': ('ʾiḏ', 'إِذ'), # ʾiḏ = because
46+
'sources':
47+
[('ʾiḏ', 'إِذ'),
48+
('ʾiḏ ʾanna', 'إِذ_أَنَّ')]
49+
},
50+
{'target': ('ʾiḏā', 'إِذَا'), # ʾiḏā = if
51+
'sources':
52+
[('ʾiḏā', 'إِذَا'),
53+
('ʾiḏā', 'إِذًا')]
54+
},
55+
]
56+
2757
# Secondary prepositions sometimes have the lemma of the original part of
2858
# speech. We want the grammaticalized form instead. List even those that
2959
# will have the same lexical form, as we also want to check the morphological
@@ -481,6 +511,7 @@ class FixEdeprels(Block):
481511
'ما_دَام': 'مِمَّا',
482512
'مادامت': 'مِمَّا',
483513
'مَالَم': 'مَالَم', # mālam = unless
514+
'مَا_إِذَا': 'إِذَا',
484515
'مِثلَ': 'مِثلَ', # remove morphological case; miṯla = like
485516
'مِثلَمَا': 'مِثلَ', # miṯla = like
486517
'مَعَ': 'مَعَ:gen', # maʿa = with

0 commit comments

Comments
 (0)