commit 53780f8b0c7a66c38bbf5d85b32cca5f323e0944 Author: ruthenian8 Date: Fri Jul 2 16:43:21 2021 +0300 changes to lexd +new hfstol file diff --git a/Makefile b/Makefile index c54f16f..cef3af8 100644 --- a/Makefile +++ b/Makefile @@ -12,6 +12,8 @@ hfst-compose-intersect $^ -o $@ %.tr.hfst: %.ana.hfst hfst-compose translit/translit.hfst $< -o $@ +%.tr.hfstol: %.tr.hfst + hfst-fst2fst --optimized-lookup-unweighted -i $< -o $@ check-ana: bagval_numbers.ana.hfst gold-standart.ana.txt bash compare.sh $^ check-gen: bagval_numbers.gen.hfst gold-standart.txt diff --git a/merged.lexd b/merged.lexd index 0489488..ff21e0c 100644 --- a/merged.lexd +++ b/merged.lexd @@ -133,9 +133,9 @@ rootInit[DaNumber] end[DaNumber] rootInit[RaNumber] end[RaNumber] # ра, Кибрик et al. С. 155 PATTERN DaSuffixedNums -decimal end[DaNumber] -milli end[DaNumber] -centi end[DaNumber] +decimal end +milli end +centi end PATTERN NomNumbersAgr singles ( OblAdjSingular[OblSu] | OblAdjPlural[OblPlLu] ) @@ -236,16 +236,16 @@ PostClitic[all] RestrParticle ModalParticle UQparticle -QuestParticle -negSuffix[pst] +QuestParticle PostClitic[all]? +negSuffix[pst] QuestParticle? PostClitic[all]? PATTERN NCl # = Nominal clitics PostClitic RestrParticle ModalParticle UQparticle -QuestParticle -negSuffix[pst] +QuestParticle PostClitic? +negSuffix[pst] QuestParticle? PostClitic? # ---------------------------------------------------------------------------------------------- # ---------------------------------------------------------------------------------------------- @@ -342,6 +342,7 @@ adjSingle OblAdjSup NCl? # PerPronounStems genitiveCase[GenAgr] NCl? PerPronounStems[PrExc] CaseMain[ErgR,-RegErg,-nullNom] NCl? +PerPronounStems[PrExc] ( DatExcMin[pron] | SupExcMin[pron] ) NCl? PerPronounStems[-PrExc] CaseMain[ErgR] NCl? PerPronounExc NCl? PerPronounStems locMain directCase NCl? @@ -673,15 +674,21 @@ LEXICON TimeMarker LEXICON PostClitic :{ep.й}{ep.е}л[all] :ди[all] -:гъе[all] +:гъа[all] +:гъади[all] +:гъадила[all] :гъала[all] +:гъалади[all] +:гъаладила[all] +:гъе[all] :гъеди[all] +:гъедила[all] :дила[all] :гъаби[nom] :ла[all] # 179 :лъа[all] # 179 -:да[all] # 180 -:дала[all] # 180 +:да[all] # 180 +:дала[all] # 180 :лена[nom] :ена[nom] :гъула[all] # 180 @@ -691,8 +698,8 @@ LEXICON PostClitic # NUMBER DERIVATION # LEXICON end -:да[DaNumber] -:ра[RaNumber] +:да[DaNumber] +:ра[RaNumber] LEXICON col :ла @@ -833,7 +840,7 @@ LEXICON DatExcMin :лъа[OblLi] :ла[OblPlLu] :лла[OblPlAlu] -:ха[pron] +:гьа[pron] LEXICON SupExceptions :ща[OblSu] @@ -854,7 +861,7 @@ LEXICON SupExcMin :лъа[OblLi] :ла[OblPlLu] :лла[OblPlAlu] -:ха[pron] +:гьа[pron] LEXICON genitiveCase :лъ @@ -2661,21 +2668,30 @@ LEXICON UQparticle :хъал LEXICON ModalParticle -:гъо -:гъа -:гъасо -:гъаса -:гъабо -:гъаба +:гъо +:гъа +:гъасо +:гъаса +:гъабо +:гъаба +:або +:аба +:лъабо +:лъаба LEXICON QuestParticle :{ep.й}{ep.и}што +:йшто :{ep.й}{ep.и}шта +:йшта :{ep.й}{ep.и}шт :{ep.й}{ep.и}ш :{ep.й}{ep.и}ле +:йле :{ep.й}{ep.и}лах +:йлах :{ep.й}{ep.и} +:{ep.й}{ep.и}ᵸ LEXICON RestrParticle :тара @@ -4472,7 +4488,6 @@ LEXICON NounAbs лъер:лъер лъехъулгьар:лъехъулгьар лъеᵸ:лъеᵸ -лъеᵸ:лъеᵸ лъидир:лъидир лъилар:лъилар лъилъ:лъилъ @@ -9050,6 +9065,7 @@ LEXICON NounOblLi рекӀидалар:рекӀидалар рекӀидар:рекӀидар релгьаб:релгьаб +решен:решен рещӀар:рещӀар рижи:рижи ритӀар:ритӀар @@ -11120,8 +11136,8 @@ LEXICON VerbStem букъу:укъви[Idecl,AgrInit] # 863 cut букъу:ухъви[Idecl,AgrInit] # Gudava cut букъукъу:укъукъви[Idecl,AgrInit] -букӀуᵸ:укӀуᵸ[Idecl,AgrInit] букӀуᵸ:укӀвиᵸ[Idecl,AgrInit] # 89 +букӀуᵸ:укӀуᵸ[Idecl,AgrInit] бущущу:ущущви[Idecl,AgrInit] гвагвани:гвагвани[Idecl] гъенбелгьи:гъенбелгьи[Idecl] @@ -11135,9 +11151,16 @@ LEXICON VerbStem гьещӀи:гьещӀи[Idecl] гӀагалли:гӀагалли[Idecl] гӀаламатли:гӀаламатли[Idecl] +елъдви[Idecl,AgrInit] +етӀви[Idecl,AgrInit] +жекъви[Idecl] +жехъӀви[Idecl] +жукъви[Idecl] +жухъӀви[Idecl] зали:зали[Idecl] захӀматли:захӀматли[Idecl] игьвалъи:игьвалъи[Idecl] +ижви[Idecl,AgrInit] ичи:ичи[Idecl] ичи:ичи[Idecl] # 849 give ичичи:ичичи[Idecl] @@ -11167,8 +11190,23 @@ LEXICON VerbStem свадди:свадди[Idecl] сварди:сварди[Idecl] свари:свари[Idecl] +сусукӀви[Idecl] сӀелли:сӀелли[Idecl] +сӀухъви[Idecl] тӀоли:тӀоли[Idecl] +угъви[Idecl,AgrInit] +угьви[Idecl,AgrInit] +укви[Idecl,AgrInit] +укъви[Idecl,AgrInit] +укъукъви[Idecl,AgrInit] +укъухъӀви[Idecl,AgrInit] +укӀвиᵸ[Idecl,AgrInit] +улъви[Idecl,AgrInit] +усшви[Idecl,AgrInit] +ухъӀви[Idecl,AgrInit] +ухъӀукъви[Idecl,AgrInit] +ухъӀухъӀви[Idecl,AgrInit] +ушшви[Idecl,AgrInit] хвасарли:хвасарли[Idecl] хъвани:хъвани[Idecl] хъони:хъони[Idecl] @@ -11208,6 +11246,8 @@ LEXICON VerbStem аргъваᵸ:аргъваᵸ[IIdecl] атита:атита[IIdecl] ахбукӀва:ахбукӀва[IIdecl] +ахъваᵸ[IIdecl,AgrInit] +ачва[IIdecl,AgrInit] аша:аша[IIdecl] аща:аща[IIdecl] аᵸгьаᵸ:аᵸгьаᵸ[IIdecl] @@ -11217,7 +11257,6 @@ LEXICON VerbStem багӀари:багӀа[IIdecl] # bleat Gudava бала:ала[IIdecl,AgrInit] басаᵸ:асаᵸ[IIdecl,AgrInit] -басаᵸ:асаᵸ[IIdecl,AgrInit] басисаᵸ:асисаᵸ[IIdecl,AgrInit] бахиха:ахиха[IIdecl,AgrInit] бацӀа:ацӀа[IIdecl,AgrInit] @@ -11246,7 +11285,6 @@ LEXICON VerbStem бичӀаᵸ:ичӀаᵸ[IIdecl,AgrInit] # 849 look (irregular) бичӀичӀа:ичӀичӀа[IIdecl,AgrInit] бишаᵸ:ишаᵸ[IIdecl,AgrInit] -бишаᵸ:ишаᵸ[IIdecl,AgrInit] биъа:иъа[IIdecl,AgrInit] божа:ожа[IIdecl,AgrInit] бугъа:бугъа[IIdecl] # 89 @@ -11272,10 +11310,10 @@ LEXICON VerbStem гецӀа:гецӀа[IIdecl] гьаᵸдибугьа:гьаᵸдибугьа[IIdecl] гьекьаᵸ:гьекьаᵸ[IIdecl] -гьекьаᵸ:гьекьаᵸ[IIdecl] гьекьикьаᵸ:гьекьикьаᵸ[IIdecl] гьикьибагьа:гьикьибагьа[IIdecl] джеллаᵸ:джеллаᵸ[IIdecl] +зигьваᵸ[IIdecl] къебукӀва:къебукӀва[IIdecl] къоса:къоса[IIdecl] къосида:къосида[IIdecl] @@ -11284,20 +11322,38 @@ LEXICON VerbStem кьарашаᵸ:кьарашаᵸ[IIdecl] кьегъаᵸ:кьегъаᵸ[IIdecl] кьигьаᵸ:кьигьаᵸ[IIdecl] -ракъаᵸ:ракъаᵸ[IIdecl] +ожа[IIdecl,AgrInit] ракъаᵸ:ракъаᵸ[IIdecl] ракъи–рашваᵸ:ракъи–рашваᵸ[IIdecl] ракӀвачӀбукӀва:ракӀвачӀбукӀва[IIdecl] рахъӀаᵸ:рахъӀаᵸ[IIdecl] рекӀваᵸ:рекӀваᵸ[IIdecl] +рекӀваᵸ[IIdecl] ригьигьаᵸ:ригьигьаᵸ[IIdecl] +ругьаᵸ[IIdecl] тӀекваᵸ:тӀекваᵸ[IIdecl] +тӀекваᵸ[IIdecl] +уваᵸ[IIdecl,AgrInit] +угьа[IIdecl,AgrInit] +угьаᵸ[IIdecl,AgrInit] +угьаᵸ[IIdecl] +укаᵸ[IIdecl,AgrInit] +укӀа[IIdecl,AgrInit] +уллаᵸ[IIdecl,AgrInit] +ута[IIdecl,AgrInit] +ухӀа[IIdecl,AgrInit] +учаᵸ[IIdecl,AgrInit] +учӀаᵸ[IIdecl,AgrInit] +ушаᵸ[IIdecl,AgrInit] +ущаᵸ[IIdecl,AgrInit] хъӀочаᵸ:хъӀочаᵸ[IIdecl] хӀащӀабагьа:хӀащӀабагьа[IIdecl] чӀалгӀайна:чӀалгӀайна[IIdecl] чӀалгӀаᵸ:чӀалгӀаᵸ[IIdecl] чӀата:чӀата[IIdecl] +чӀунтӀа[IIdecl] экваᵸ:экваᵸ[IIdecl] +экваᵸ[IIdecl] экукаᵸ:экукаᵸ[IIdecl] экьаᵸ:экьаᵸ[IIdecl] эта:эта[IIdecl] @@ -11305,7 +11361,6 @@ LEXICON VerbStem эхъаᵸ:эхъаᵸ[IIdecl] эшаᵸ:эшаᵸ[IIdecl] эщаᵸ:эщаᵸ[IIdecl] -эщаᵸ:эщаᵸ[IIdecl] эщещаᵸ:эщещаᵸ[IIdecl] абатате:абатате[IIIdecl] агьецӀе:агьецӀе[IIIdecl] diff --git a/merged.tr.hfstol b/merged.tr.hfstol new file mode 100644 index 0000000..787c8d4 Binary files /dev/null and b/merged.tr.hfstol differ diff --git a/translit/translit b/translit/translit index a053c80..44287d9 100644 --- a/translit/translit +++ b/translit/translit @@ -57,6 +57,7 @@ ũ:уᵸ ū:у ō:о : +̄: =: -: : \ No newline at end of file