Skip to content

Commit

Permalink
Work with nominal declension type guesser
Browse files Browse the repository at this point in the history
  • Loading branch information
rueter committed Jun 30, 2024
1 parent fec81f2 commit 6aeb8b8
Show file tree
Hide file tree
Showing 13 changed files with 429 additions and 209 deletions.
3 changes: 3 additions & 0 deletions src/fst/morphology/affixes/adjectives.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -32,6 +32,9 @@ LEXICON A_KALĀ !!= @CODE@ contains kalā:kaʼlā 18
! Adjective type 19: no adjective-specific entries here, the lexicon continues
! straight into the nominal paradigm NMN_TUBĀ.
LEXICON A_TUBĀ !!= @CODE@ tubā:tuʼbā 19
NMN_TUBĀ ;

! Adjective type 19a: continues straight into the nominal paradigm NMN_AMĀ.
LEXICON A_AMĀ !!= @CODE@ amā:aʼm 19a
NMN_AMĀ ;

LEXICON A_AIGĀ !!= @CODE@ aigā:aʼig 20
NMN_AIGĀ ;
+Comp:%^StodRM%>īm NMN_SIDĀM ;
Expand Down
112 changes: 90 additions & 22 deletions src/fst/morphology/affixes/nouns.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -63,6 +63,15 @@ LEXICON N_KALĀ-SG !!≈ * **@CODE@** contains kalā:kaʼlā 18
LEXICON N_KALĀ-PL !!≈ * **@CODE@** contains kalā:kaʼlā 18
NMN_KALĀ-PL ;

! Noun entry points for type 18a (model word irē). N_IRĒ gives the full
! paradigm; N_IRĒ-SG and N_IRĒ-PL restrict a noun to one number.
LEXICON N_IRĒ !!≈ * **@CODE@** contains irē:iʼr 18a
NMN_IRĒ ;

LEXICON N_IRĒ-SG !!≈ * **@CODE@** contains irē:iʼr 18a
NMN_IRĒ-SG ;

LEXICON N_IRĒ-PL !!≈ * **@CODE@** contains irē:iʼr 18a
NMN_IRĒ-PL ;

LEXICON N_TUBĀ !!≈ * **@CODE@** tubā:tuʼbā 19
N_TUBĀ-SG ;
N_TUBĀ-PL ;
Expand All @@ -73,6 +82,16 @@ LEXICON N_TUBĀ-SG !!≈ * **@CODE@** tubā:tuʼbā 19
LEXICON N_TUBĀ-PL !!≈ * **@CODE@** tubā:tuʼbā 19
NMN_TUBĀ-PL ;

! Noun entry points for type 19a (model word amā). N_AMĀ fans out to the
! singular-only and plural-only entries, which in turn continue into the
! shared nominal lexica NMN_AMĀ-SG and NMN_AMĀ-PL.
LEXICON N_AMĀ !!≈ * **@CODE@** amā:aʼm 19a
N_AMĀ-SG ;
N_AMĀ-PL ;

LEXICON N_AMĀ-SG !!≈ * **@CODE@** amā:aʼm 19a
NMN_AMĀ-SG ;

LEXICON N_AMĀ-PL !!≈ * **@CODE@** amā:aʼm 19a
NMN_AMĀ-PL ;

LEXICON N_AIGĀ !!≈ * **@CODE@** aigā:aigā 20
NMN_AIGĀ ;

Expand Down Expand Up @@ -1375,6 +1394,32 @@ LEXICON NMN_KALĀ-PL
:%^PalatalizeLeft PL-ILL_ži ;
:%^PalatalizeLeft PL-PAR_ḑi ;

!! 18a
LEXICON NMN_IRĒ !!≈ * **@CODE@** irē:iʼr
!!≈ * Yaml: **N-kalaa** Pass: 2014.12.12
! NOTE(review): the Yaml/Pass line above names the kalā test file and a 2014
! date; it looks carried over from NMN_KALĀ. Confirm which yaml test (if any)
! covers type 18a and update the line.
!! Stem change: Yes
!! Consonant lengthening
!! Consonant palatalization
!! Vowel change in 2nd syllable ē:õ/0
!! Stød: Yes
NMN_IRĒ-SG ;
NMN_IRĒ-PL ;

! Singular forms of type 18a. Every entry has an empty upper side; the lower
! side adds the stem tail and the continuation lexicon supplies the case ending.
! DAT, ELA/INE, GEN, INS and NOM add ^StodRM followed by the stem vowel ē;
! ILL and PAR add {XC}, the > boundary symbol and õ instead.
! NOTE(review): ^StodRM and {XC} are interpreted outside this file, presumably
! as stød removal and a consonant-lengthening archiphoneme. Confirm.
LEXICON NMN_IRĒ-SG
:%^StodRMē SG-DAT_n ;
:%^StodRMē SG-ELA/INE_st ;
:%^StodRMē SG-GEN ;
:%{XC%}%>õ SG-ILL_ZERO ;
:%^StodRMē SG-INS_ks ;
:%^StodRMē SG-NOM ;
:%{XC%}%>õ SG-PAR_ZERO ;

! Plural forms of type 18a. The plural instrumental stem keeps ^StodRM + ē;
! ELA/INE, ILL and PAR add only the ^PalatalizeLeft trigger before the ending.
LEXICON NMN_IRĒ-PL
:%^StodRMē PL-INS_DÕKS-STEM ;
:%^PalatalizeLeft PL-ELA/INE_šti ;
:%^PalatalizeLeft PL-ILL_ži ;
:%^PalatalizeLeft PL-PAR_ḑi ;

!! 19
LEXICON NMN_TUBĀ !!≈ * **@CODE@** tubā:tuʼb
!! * Yaml: **A-amaa, N-tubaa** Pass: 2014.12.12
Expand All @@ -1398,6 +1443,29 @@ LEXICON NMN_TUBĀ-PL
:%^PalatalizeLeft PL-ILL_ži ;
:%^PalatalizeLeft PL-PAR_ḑi ;

!! 19a
LEXICON NMN_AMĀ !!≈ * **@CODE@** amā:aʼm
!! * Yaml: **A-amaa, N-tubaa** Pass: 2014.12.12
! NOTE(review): the Yaml/Pass line above is identical to the one on NMN_TUBĀ;
! confirm which of the two yaml tests still applies to type 19a.
!! Stem change: Yes
!! Vowel change in word-final position a:õ/0
!! Stød
NMN_AMĀ-SG ;
NMN_AMĀ-PL ;
! Singular forms of type 19a. Every entry has an empty upper side; the lower
! side adds the stem tail and the continuation lexicon supplies the case ending.
! DAT, ELA/INE, GEN, INS and NOM add ^StodRM followed by the stem vowel ā;
! ILL and PAR add {XC}, the > boundary symbol and õ instead.
! NOTE(review): ^StodRM and {XC} are interpreted outside this file, presumably
! as stød removal and a consonant-lengthening archiphoneme. Confirm.
LEXICON NMN_AMĀ-SG
:%^StodRMā SG-DAT_n ;
:%^StodRMā SG-ELA/INE_st ;
:%^StodRMā SG-GEN ;
:%{XC%}%>õ SG-ILL_ZERO ;
:%^StodRMā SG-INS_ks ;
:%^StodRMā SG-NOM ;
:%{XC%}%>õ SG-PAR_ZERO ;

! Plural forms of type 19a. The plural instrumental stem keeps ^StodRM + ā;
! ELA/INE, ILL and PAR add only the ^PalatalizeLeft trigger before the ending.
LEXICON NMN_AMĀ-PL
:%^StodRMā PL-INS_DÕKS-STEM ;
:%^PalatalizeLeft PL-ELA/INE_šti ;
:%^PalatalizeLeft PL-ILL_ži ;
:%^PalatalizeLeft PL-PAR_ḑi ;

!! 20
LEXICON NMN_AIGĀ !!≈ * **@CODE@** aigā:aʼig
!! * Yaml: **N-aigaa**
Expand Down Expand Up @@ -1431,19 +1499,19 @@ LEXICON NMN_LĒBA !!≈ * **@CODE@** lēba:leib
NMN_LĒBA-PL ;

! Singular forms of the lēba type.
! NOTE(review): every case continuation below is listed twice: first with the
! ^VowsLI1a / empty stem tail, then with ^U2ZERO / ^VV2V^VowsRM. In the commit
! view the first seven entries appear to be the removed side and the last seven
! the added side. If both sets were live, each form would be reachable along
! two paths; confirm that only the second set is meant to remain.
LEXICON NMN_LĒBA-SG
:%^VowsLI1a SG-DAT_n ;
:%^VowsLI1a SG-ELA/INE_st ;
:%^VowsLI1a SG-GEN ;
: SG-ILL_õ ;
:%^VowsLI1a SG-INS_ks ;
:%^VowsLI1a SG-NOM ;
: SG-PAR_õ ;
:%^U2ZERO SG-DAT_n ;
:%^U2ZERO SG-ELA/INE_st ;
:%^U2ZERO SG-GEN ;
:%^VV2V%^VowsRM SG-ILL_õ ;
:%^U2ZERO SG-INS_ks ;
:%^U2ZERO SG-NOM ;
:%^VV2V%^VowsRM SG-PAR_õ ;

! Plural forms of the lēba type.
! NOTE(review): every case continuation below is listed twice: first with the
! ^VowsLI1a / empty stem tail, then with ^U2ZERO / ^VV2V^VowsRM. In the commit
! view the first four entries appear to be the removed side and the last four
! the added side; confirm that only the second set is meant to remain.
LEXICON NMN_LĒBA-PL
:%^VowsLI1a PL-INS_DÕKS-STEM ;
: PL-ELA/INE_šti ;
: PL-ILL_ži ;
: PL-PAR_ḑi ;
:%^U2ZERO PL-INS_DÕKS-STEM ;
:%^VV2V%^VowsRM PL-ELA/INE_šti ;
:%^VV2V%^VowsRM PL-ILL_ži ;
:%^VV2V%^VowsRM PL-PAR_ḑi ;

!! 21
LEXICON NMN_KŪJA !!≈ * **@CODE@** kūja:leiba
Expand Down Expand Up @@ -1661,19 +1729,19 @@ LEXICON NMN_LIEPĀ !!≈ * **@CODE@** liepā:liep 29
NMN_LIEPĀ-SG ;
NMN_LIEPĀ-PL ;
! Singular forms of type 29 (liepā).
! NOTE(review): every case continuation below is listed twice: first with a
! literal ā / {XC} stem tail, then with the ^CC2C / ^VowsRM triggers. In the
! commit view the first seven entries appear to be the removed side and the
! last seven the added side; confirm that only the second set is meant to
! remain.
LEXICON NMN_LIEPĀ-SG !!≈ * **@CODE@** liepā:lieppā 29
:ā SG-DAT_n ;
:ā SG-ELA/INE_st ;
:ā SG-GEN ;
:%{XC%} SG-ILL_õ ;
:ā SG-INS_ks ;
:ā SG-NOM ;
:%{XC%} SG-PAR_õ ;
:%^CC2C SG-DAT_n ;
:%^CC2C SG-ELA/INE_st ;
:%^CC2C SG-GEN ;
:%^VowsRM SG-ILL_õ ;
:%^CC2C SG-INS_ks ;
:%^CC2C SG-NOM ;
:%^VowsRM SG-PAR_õ ;

! Plural forms of type 29 (liepā).
! NOTE(review): every case continuation below is listed twice: first with the
! literal ā / empty / ^VV2V stem tail, then with trigger sequences built from
! ^CC2C, ^VowsRM and ^VV2V. In the commit view the first four entries appear
! to be the removed side and the last four the added side; confirm that only
! the second set is meant to remain.
LEXICON NMN_LIEPĀ-PL !!≈ * **@CODE@** liepā:lieppā 29
:ā PL-INS_DÕKS-STEM ;
: PL-ELA/INE_īst ;
: PL-ILL_īž ;
:%^VV2V PL-PAR_ți ;
:%^CC2C PL-INS_DÕKS-STEM ;
:%^CC2C%^VowsRM PL-ELA/INE_īst ;
:%^CC2C%^VowsRM PL-ILL_īž ;
:%^VV2V%^CC2C%^VowsRM PL-PAR_ți ;

LEXICON NMN_OKSĀ !!≈ * **@CODE@** oksā:oksā 30
!!≈ * Yaml: **N-oksaa** Passed:
Expand Down
6 changes: 6 additions & 0 deletions src/fst/morphology/affixes/propernouns.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -49,6 +49,12 @@ LEXICON PROP_KALĀ !!= @CODE@ contains kalā:kalā 18
LEXICON PROP_KALĀ-SG !!= @CODE@ contains kalā:kalā 18
NMN_KALĀ-SG ;

! NOTE(review): the full-paradigm entry PROP_IRĒ (singular + plural via
! NMN_IRĒ) is disabled; only the singular-only entry PROP_IRĒ-SG is active.
! Confirm this is intentional before any proper noun is pointed at PROP_IRĒ.
!LEXICON PROP_IRĒ !!= @CODE@ contains irē:iʼr 18a
! NMN_IRĒ ;

! Proper nouns of type 18a, singular forms only.
LEXICON PROP_IRĒ-SG !!= @CODE@ contains irē:iʼr 18a
NMN_IRĒ-SG ;

LEXICON PROP_TUBĀ !!= @CODE@ tubā:tubā 19
NMN_TUBĀ ;

Expand Down
98 changes: 98 additions & 0 deletions src/fst/morphology/root.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -532,6 +532,104 @@ Multichar_Symbols
%^VowsL1aToǭ !!≈ * **@CODE@** = a >> ǭ

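! Experimental tags for the nominal declension type guesser: one tag per
! declension type, named +N_<type number>_<ASCII spelling of the model word>.
! Tags that end in a bare underscore (+N_60_ … +N_98_) are placeholders that
! have no model word assigned yet.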
+N_12_puu
+N_13_rooq
+N_14_paeae
+N_15_tiiqe
+N_16_brii
+N_17_tei
+N_18_kalaa
+N_18a_iree
+N_19_tubaa
+N_19a_amaa
+N_20_aigaa
+N_21_leeba
!+N_22_puuoga only one stem
+N_23_looja
+N_24_paeaeva
+N_25_izaa
+N_25a_piezaa
+N_26_azhaa
+N_27_aaldzha
+N_28_sukaa
+N_29_liepaa

+N_30_oksaa
+N_31_voontsa
+N_32_liestaa
+N_33_aaiga
+N_33a_laanga
+N_34_siilma
+N_35_kaeaenga
+N_36_aaina
+N_37_veena ! virtually same as 38
+N_38_rooda ! virtually same as 37
+N_39_padaa

+N_40_sobraa
+N_41_kaepaa
+N_42_maksaa
+N_43_keera
+N_44_joora
!+N_45_puuola single word
+N_46_aaita
+N_47_uushka
+N_48_mooka
+N_49_dadzhaa

+N_50_sushaa
+N_51_kupshaa
+N_52_tshuurtsha
+N_53_seemda
+N_54_tiiera
+N_55_krooipa
+N_56_lilla
+N_57_kutaa
+N_58_neetsha
+N_59_kiqv

+N_60_
+N_61_
+N_62_
+N_63_
+N_64_
+N_65_
+N_66_
+N_67_
+N_68_
+N_69_

+N_70_
+N_71_
+N_72_
+N_73_
+N_74_
+N_75_
+N_76_
+N_77_
+N_78_
+N_79_

+N_80_
+N_81_
+N_82_
+N_83_
+N_84_
+N_85_
+N_86_
+N_87_
+N_88_
+N_89_

+N_90_
+N_91_
+N_92_
+N_93_
+N_94_
+N_95_
+N_96_
+N_97_
+N_98_
+N_99_ul
+N_101_täm
+N_136_tas
Expand Down
Loading

0 comments on commit 6aeb8b8

Please sign in to comment.