@@ -24,6 +24,36 @@ class FixEdeprels(Block):
2424 'فَ' : []
2525 }
2626
27+ # Reduction and normalization of prepositions and conjunctions, including
28+ # the derived and compound ones. Each entry is a dict with one 'target' and a list of 'sources'; every form is a (Latin transliteration, Arabic string) pair. Presumably each source is rewritten to its target; the consuming code is outside this excerpt. The Latin transliterations are not really
29+ # needed in the process. We include them here as documentation, but also
30+ # to help editors render the lines (mixed right-to-left and left-to-right text is easily displayed in a confusing order). Ideally, each line
31+ # should have left-to-right text at both the beginning and end.
32+ substitution = [
33+ {'target' : ('min:gen' , 'مِن:gen' ), # min = from
34+ 'sources' :
35+ [('ibtida min' , 'اِبتِدَاء_مِن' )] # ibtidāʾ min = starting from; NOTE(review): this label lacks the diacritics used in the other entries
36+ },
37+ {'target' : ('ʾiṯra:gen' , 'إِثرَ:gen' ), # ʾiṯra = right after
38+ 'sources' :
39+ [('ʾiṯra' , 'إِثرَ' )] # same lexical form; the target only adds the :gen suffix
40+ },
41+ {'target' : ('ʾaṯnāʾa:gen' , 'أَثنَاءَ:gen' ), # ʾaṯnāʾa = during
42+ 'sources' :
43+ [('ʾaṯnāʾa' , 'أَثنَاءَ' )] # same lexical form; the target only adds the :gen suffix
44+ },
45+ {'target' : ('ʾiḏ' , 'إِذ' ), # ʾiḏ = because
46+ 'sources' :
47+ [('ʾiḏ' , 'إِذ' ), # identity entry: source and target are the same form
48+ ('ʾiḏ ʾanna' , 'إِذ_أَنَّ' )] # compound ʾiḏ ʾanna is listed under plain ʾiḏ
49+ },
50+ {'target' : ('ʾiḏā' , 'إِذَا' ), # ʾiḏā = if
51+ 'sources' :
52+ [('ʾiḏā' , 'إِذَا' ), # identity entry: source and target are the same form
53+ ('ʾiḏā' , 'إِذًا' )] # NOTE(review): the Arabic form here ends in tanwīn and would normally be transliterated ʾiḏan, not ʾiḏā; confirm whether the label should be updated
54+ },
55+ ]
56+
2757 # Secondary prepositions sometimes have the lemma of the original part of
2858 # speech. We want the grammaticalized form instead. List even those that
2959 # will have the same lexical form, as we also want to check the morphological
@@ -481,6 +511,7 @@ class FixEdeprels(Block):
481511 'ما_دَام' : 'مِمَّا' ,
482512 'مادامت' : 'مِمَّا' ,
483513 'مَالَم' : 'مَالَم' , # mālam = unless
514+ 'مَا_إِذَا' : 'إِذَا' ,
484515 'مِثلَ' : 'مِثلَ' , # remove morphological case; miṯla = like
485516 'مِثلَمَا' : 'مِثلَ' , # miṯla = like
486517 'مَعَ' : 'مَعَ:gen' , # maʿa = with
0 commit comments