Skip to content

Commit

Permalink
more words and contlexes
Browse files Browse the repository at this point in the history
2833 missing unique forms in 2013
  • Loading branch information
rueter committed Nov 18, 2024
1 parent 60dd773 commit eed22ca
Show file tree
Hide file tree
Showing 20 changed files with 509 additions and 134 deletions.
3 changes: 3 additions & 0 deletions src/fst/morphology/affixes/adjectives.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,9 @@

LEXICON A_UZ1 !!≈ * **@CODE@** = uzʼ:ud, goes to NMN_NORUZ1
! No tag or surface material is added here; inflection is delegated to NMN_NORUZ1.
NMN_NORUZ1 ;
LEXICON A_NAGRIZH !nagriž:nagr
! Plain (non-comparative) path: nothing is added on either side; N_NAGRIZH continues.
N_NAGRIZH ;
! Comparative path: adds the +Comp tag on the analysis side and he>mb on the
! surface side (%> is the escaped > symbol, presumably the morpheme-boundary
! marker; confirm against the symbol declarations), then continues in N_POIG.
+Comp:he%>mb N_POIG ;

LEXICON A_RUSKED !!≈ * **@CODE@** = goes to NMN\_RUSKED
NMN_RUSKED ;
Expand Down
104 changes: 88 additions & 16 deletions src/fst/morphology/affixes/nouns.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -285,6 +285,23 @@ R ; ! xxx check
:a PL-ACC-SUF ;
: PL-OBLIQUE ;

LEXICON N_0/an/ad/ha/id ! kund:kund
! _0/an/ad/ha/id
!Sg+Nom/Sg+Gen/Sg+Par/Sg+Ill/Pl+Par
!!€gt-norm: Noun ' / '
!!€ kund: kund+N+Sg+Nom
!!€ kundan: kund+N+Sg+Gen
!!€ kundha: kund+N+Sg+Ill
!!€ kundid: kund+N+Pl+Par
! Singular
! Nominative: the bare stem goes to SG-NOM-SUF (cf. kund above).
: SG-NOM-SUF ;
! Illative singular is spelled out here as -ha and continues straight to K (cf. kundha).
+Sg+Ill:ha K ;
! The stem is extended with a before SG-OBLIQUE (cf. kundan).
:a SG-OBLIQUE ;
! Continues to R with no tag and no surface material; flagged for checking by the author.
R ; ! xxx check
! Plural
! Stem + a before PL-NOM-SUF and PL-ACC-SUF; bare stem before PL-OBLIQUE (cf. kundid).
:a PL-NOM-SUF ;
:a PL-ACC-SUF ;
: PL-OBLIQUE ;

LEXICON N_0/an/ad/aha/id ! uskonda:uskond
! _0/an/ad/aha/id
!Sg+Nom/Sg+Gen/Sg+Par/Sg+Ill/Pl+Par
Expand Down Expand Up @@ -584,7 +601,8 @@ LEXICON N_KEL1 !kelʼ:kel
:ʼ SG-NOM-SUF ;
:ʼ SG-PAR-SUF_t ;
:%>e SG-OBLIQUE ;
R ; ! xxx check
+Cmp/SgNom:ʼ R ;
+Err/Orth-no-pal+Cmp/SgNom: R ;
! Plural
:%>e PL-NOM-SUF ;
:%>e PL-ACC-SUF ;
Expand All @@ -596,9 +614,13 @@ LEXICON N_SAR1 !sarʼ:sar
!!€ n: +N+Sg+Gen
!!€ d: +N+Pl+Par
:ʼ SG-NOM-SUF ;
: SG-PAR-SUF_t ;
+Err/Orth-no-pal: SG-NOM-SUF ;
:ʼ SG-PAR-SUF_t ;
+Err/Orth-no-pal: SG-PAR-SUF_t ;
+Sg+Ill:ʼhe K ;
:%>e SG-OBLIQUE ;
R ; ! xxx check
+Cmp/SgNom:ʼ R ; !
+Cmp/SgNom+Err/Orth-no-pal: R ; !
! Plural
:%>e PL-NOM-SUF ;
:%>e PL-ACC-SUF ;
Expand Down Expand Up @@ -634,6 +656,21 @@ R ; ! xxx check
:%^PEN%^DEVOICE%^RmVow%^DEVOICE%>a PL-ACC-SUF ;
:%^PEN%^DEVOICE%^RmVow%^DEVOICE%>o PL-OBLIQUE ;

LEXICON N_IKUN !ikun:ikun
!!€gt-norm: Noun ' / '
!!€ ikun: ikun+N+Sg+Nom
!!€ iknan: ikun+N+Sg+Gen
!!€ iknoid: ikun+N+Pl+Par
!
! Nominative singular: the bare stem goes to SG-NOM-SUF.
: SG-NOM-SUF ;
!^RmVow
! Every non-nominative stem below inserts the ^RmVow trigger on the surface side.
! Per the examples above the last stem vowel is absent in those forms
! (ikun -> ikn-); presumably a rule outside this lexicon realises that - TODO confirm.
! NOTE(review): this entry has no %> between ^RmVow and a, unlike the plural
! entries below - confirm that the difference is intentional.
:%^RmVowa SG-OBLIQUE ;
! Continues to R with no tag and no surface material; flagged for checking by the author.
R ; ! xxx check
! Plural
! Stem vowel a before PL-NOM-SUF and PL-ACC-SUF, o before PL-OBLIQUE (cf. iknoid).
:%^RmVow%>a PL-NOM-SUF ;
:%^RmVow%>a PL-ACC-SUF ;
:%^RmVow%>o PL-OBLIQUE ;

LEXICON N_SAMAL !samal:samal syncope
!!€gt-norm: Noun ' / '
!!€ : +N+Sg+Nom
Expand Down Expand Up @@ -681,9 +718,9 @@ R ; ! xxx check

LEXICON N_1/en/ed/ehe/id ! apʼ:ap
!!€gt-norm: Noun ' / '
!!€ papʼ: +N+Sg+Nom
!!€ papin: +N+Sg+Gen
!!€ papid: +N+Pl+Par
!!€ apʼ: +N+Sg+Nom
!!€ apen: +N+Sg+Gen
!!€ apid: +N+Pl+Par
:ʼ SG-NOM-SUF ;
+Err/Orth-no-pal: SG-NOM-SUF ;
:e SG-OBLIQUE ;
Expand Down Expand Up @@ -720,6 +757,21 @@ R ; ! xxx check
:%>i PL-ACC-SUF ;
: PL-OBLIQUE ;

LEXICON N_GRAEHK !grähk:grähk
!!€gt-norm: Noun ' / '
!!€ grähk: grähk+N+Sg+Nom
!!€ grähkän: grähk+N+Sg+Gen
!!€ grähkid: grähk+N+Pl+Par
! Nominative singular: the bare stem goes to SG-NOM-SUF.
: SG-NOM-SUF ;
! Two stem-vowel variants (ä and a) are accepted in parallel. Neither entry adds
! a tag, so both variants receive the same analysis; the trailing comments name
! the text each variant was taken from. The examples above show only the ä variant.
:%>ä SG-OBLIQUE ;!2013 New Testament
:%>a SG-OBLIQUE ;!2010 vep-ven
! Adds the +Cmp/SgNom tag with no surface material and continues to R.
+Cmp/SgNom: R ; !
! Plural
! The same ä/a variation applies before PL-NOM-SUF and PL-ACC-SUF.
:%>ä PL-NOM-SUF ;!2013 New Testament
:%>ä PL-ACC-SUF ;!2013 New Testament
:%>a PL-NOM-SUF ;!2010 vep-ven
:%>a PL-ACC-SUF ;!2010 vep-ven
! PL-OBLIQUE takes the bare stem (cf. grähkid).
: PL-OBLIQUE ;

LEXICON N_NIMI !nimi:nim
!!€gt-norm: Noun ' / '
Expand Down Expand Up @@ -783,12 +835,30 @@ R ; ! xxx check
:že PL-ACC-SUF ;
:ž PL-OBLIQUE ;

! noruz’:norud
LEXICON N_LAPS1 !lapsʼ:la
!!€gt-norm: Noun ' / '
!!€ lapsʼ: +N+Sg+Nom
!!€ lapsen: +N+Sg+Gen
!!€ last: +N+Sg+Par
!!€ lapsid: +N+Pl+Par
! The entries below supply everything after "la", so the incoming stem is la-.
! Nominative singular with the palatalisation mark ʼ.
:psʼ SG-NOM-SUF ;
! Same form written without ʼ, accepted but tagged +Err/Orth-no-pal.
+Err/Orth-no-pal:ps SG-NOM-SUF ;
! Partitive singular drops the p: la + s before SG-PAR-SUF_t (cf. last).
:s SG-PAR-SUF_t ;
! Illative singular is spelled out here and continues straight to K.
+Sg+Ill:pshe K ;!CHECKME 2024-11-17
! Stem lapse- before SG-OBLIQUE (cf. lapsen).
:pse SG-OBLIQUE ;
! Nominative-shaped surface (with ʼ) continuing to R; flagged for checking by the author.
:psʼ R ; ! xxx check
! Plural
! Stem lapse- before PL-NOM-SUF and PL-ACC-SUF; laps- before PL-OBLIQUE (cf. lapsid).
:pse PL-NOM-SUF ;
:pse PL-ACC-SUF ;
:ps PL-OBLIQUE ;

! noruzʼ:norud
LEXICON N_NORUZ1 ! OUN-ZD_QEQ
!!€gt-norm: Noun ' / '
!!€ : +N+Sg+Nom
!!€ n: +N+Sg+Gen
!!€ d: +N+Pl+Par
!!€ noruzʼ: noruzʼ+N+Sg+Nom
!!€ noruden: noruzʼ+N+Sg+Gen
!!€ norut: noruzʼ+N+Sg+Par
!!€ noruzid: +N+Pl+Par
: NMN_NORUZ1 ;


Expand Down Expand Up @@ -889,6 +959,7 @@ LEXICON N_o/on/od/oho/oid
!!€ nadoid: nado+N+Pl+Par
!!* Yaml: __nado__
: SG-NOM-SUF ;
+Sg+Ill:ho K ;
: SG-OBLIQUE ;
R ; ! xxx check
! Plural
Expand All @@ -901,10 +972,12 @@ R ; ! xxx check
!! ## Nominals

LEXICON NMN_NORUZ1
:%^TS’ SG-NOM-SUF ;
:%^DEVOICE SG-PAR-SUF ;
:%^TSʼ SG-NOM-SUF ;
+Err/Orth-no-pal:%^TS SG-NOM-SUF ;
+Sg+Par:%^DEVOICE K ;
:e SG-OBLIQUE ;
R ; ! xxx check
:%^TSʼ R ; !
+Err/Orth-no-pal:%^TS R ; !
! Plural
:e PL-NOM-SUF ;
:e PL-ACC-SUF ;
Expand Down Expand Up @@ -1163,11 +1236,10 @@ LEXICON ILL-SUF
LEXICON SG-INE-SUF
+Sg: INE-SUF ;
LEXICON INE-SUF
+Ine:%>s K ; ! s/š kül’betiš
+Ine:%>s K ; ! s/š külʼbetiš

LEXICON SG-NOM-SUF
+Sg: NOM-SUF ;
+Cmp/SgNom: R ; !
LEXICON NOM-SUF
+Nom: K ;

Expand Down Expand Up @@ -1253,7 +1325,7 @@ LEXICON PL-ILL-SUF
+Pl+Ill:%>ihe K ; ! o-ho

LEXICON PL-INE-SUF
+Pl+Ine:%>iš K ; ! s/š kül’betiš
+Pl+Ine:%>iš K ; ! s/š külʼbetiš

LEXICON PL-NOM-SUF
+Pl+Nom:%>d K ;
Expand Down
2 changes: 1 addition & 1 deletion src/fst/morphology/affixes/numerals.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,7 @@
! [email protected] or [email protected]

! ############################## !
!! # Olonets numerals
!! # VEPS numerals
! ############################## !

!! # Numeral inflection
Expand Down
25 changes: 22 additions & 3 deletions src/fst/morphology/affixes/pronouns.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -47,11 +47,24 @@ ičeze+Pron+Refl+Pl3+Gen:ičeze K ;
ičeze+Pron+Refl+Sg3+Apr2:ičezennoks K ;
ičeze+Pron+Refl+Sg3+Egr:ičezennopäi K ;
ičeze+Pron+Refl+Pl3+Apr2:ičezennoks K ;!Do we want + OR +SP3
nece+Det:ne DET_NECE ;
nece+Det:ne DET_NECE ;! occurs also as a determiner
nece+Pron:ne DET_NECE ;
kaikutte+Pron:kaiku A_IN_TTE ;
mitte+Pron:mi PRON_IN_TTE ;
nimitte+Pron:nimi PRON_IN_TTE ;

nimi+Pron+Neg+Sg+Par:nimidä K ;
ken-ni+Pron+Indef+Sg+Nom:ken-ni K ;
ken-ni+Pron+Indef+Sg+Gen:kenen-ni K ;
ken-ni+Pron+Indef+Sg+Com:kenenke-ni K ;
ken-ni+Pron+Indef+Sg+Par:keda-ni K ;
ken-ni+Pron+Indef+Sg+Ade:kenel-ni K ;
ken-ni+Pron+Indef+Sg+All:kenele-ni K ;
ken-se+Pron+Indef+Sg+Nom:ken-se K ;
ken-se+Pron+Indef+Sg+Gen:kenen-se K ;
ken-se+Pron+Indef+Sg+Par:keda-se K ;
ken-se+Pron+Indef+Sg+Ade:kenel-se K ;
ken-se+Pron+Indef+Sg+All:kenele-se K ;
kuna+Pron+Rel:kuna K ;

LEXICON PRON_IN_TTE !mitte
N_IN_TTE ;
Expand Down Expand Up @@ -163,6 +176,11 @@ LEXICON DEM-PRON
se+Pron+Dem+Sg+Nom:se K ;
se+Pron+Dem+Sg+Gen:sen K ;
se+Pron+Dem+Sg+Par:sidä K ;
se+Pron+Dem+Sg+All:sille K ;
se+Pron+Dem+Sg+Ade:sil K ;
se+Pron+Dem+Sg+Ine:siš K ;
se+Pron+Dem+Sg+Ela:sišpäi K ;
se+Pron+Dem+Sg+Ill:sihe K ;

LEXICON NEG-PRON
!! @LEXNAME@ split in Nom Gen Par
Expand Down Expand Up @@ -195,7 +213,8 @@ LEXICON DET_NECE !nece+Pron:ne
+Dem:n PL-GEN-SUF ;
+Dem:n PL-ILL-SUF ;
+Dem:n PL-INE-SUF ;
+Dem:ne PL-NOM-SUF ;
+Dem:ne PL-NOM-SUF ;! «nened» occurs both as Det and Pron
+Dem+Pl+Nom:ne K ;!! «nene» occurs both as Det and Pron
+Dem:n PL-PAR-SUF ;
+Dem:n PL-TRA-SUF ;

Expand Down
26 changes: 23 additions & 3 deletions src/fst/morphology/affixes/quantifiers.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -15,10 +15,30 @@ LEXICON NUM_UEHESA
+Sg+Nom: K ;
+Sg: OBLIQUE_CASES_FOR_PRONOUNS ;

!LEXICON NUM_NORUZ
!!! **LEXICON @LEXNAME@**
LEXICON NUM_SEICHEME !seičeme:seičem
! Nominative singular: stem + e goes to SG-NOM-SUF.
:e SG-NOM-SUF ;
! SG-OBLIQUE gets the same e, here preceded by the %> symbol.
:%>e SG-OBLIQUE ;
! Nominative-shaped surface continuing to R; flagged for checking by the author.
:e R ; ! xxx check
! Plural
:%>e PL-NOM-SUF ;
:%>e PL-ACC-SUF ;
! NOTE(review): the noun lexica reach PL-OBLIQUE with a bare stem or a stem
! vowel, and plural endings such as +Pl+Ill:%>ihe and +Pl+Ine:%>iš already begin
! with i - confirm that the i added here is not doubled on the surface.
:%>i PL-OBLIQUE ;

LEXICON NUM_KOUME !koume:koum
!! **LEXICON @LEXNAME@**
! Nominative singular: stem + e goes to SG-NOM-SUF.
:e SG-NOM-SUF ;
! Illative singular is spelled out here as -he and continues straight to K.
+Sg+Ill:he K ;
! SG-OBLIQUE gets the same e, here preceded by the %> symbol.
:%>e SG-OBLIQUE ;
! Nominative-shaped surface continuing to R; flagged for checking by the author.
:e R ; ! xxx check
! Plural
:%>e PL-NOM-SUF ;
:%>e PL-ACC-SUF ;
! NOTE(review): the noun lexica reach PL-OBLIQUE with a bare stem or a stem
! vowel, and plural endings such as +Pl+Ill:%>ihe and +Pl+Ine:%>iš already begin
! with i - confirm that the i added here is not doubled on the surface.
:%>i PL-OBLIQUE ;

LEXICON NUM_NORUZ1
!! **LEXICON @LEXNAME@**
!+Sg+Nom:%>D1E1 K ;
!: N_NORUZ1 ; ! this applies correct case
: NMN_NORUZ1 ; ! this applies correct case

LEXICON NUM_
!! **LEXICON @LEXNAME@**
Expand Down
Loading

0 comments on commit eed22ca

Please sign in to comment.