Skip to content

Commit

Permalink
Add more proper names
Browse files Browse the repository at this point in the history
New Testament still missing
6475 unique forms
https://www.kielipankki.fi/tools/giellalt_language_models/veps/
where unique misses were 8,439
  • Loading branch information
rueter committed Nov 11, 2024
1 parent 1f65d5f commit 1018a03
Show file tree
Hide file tree
Showing 4 changed files with 49 additions and 1 deletion.
6 changes: 6 additions & 0 deletions src/fst/morphology/affixes/nouns.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -53,6 +53,8 @@ LEXICON N_SANA
R ;

LEXICON N_MARJ
! _0/an/ad/aha/oid
!Sg+Nom/Sg+Gen/Sg+Par/Sg+Ill/Pl+Par

! The accusative singular has two forms, one is the same as the
!! nominative singular in form and the other is identical to the
Expand Down Expand Up @@ -178,6 +180,8 @@ R ; ! xxx check
:u PL-OBLIQUE ;

LEXICON N_JAUH ! jauh:jauh
! _0/on/Q/ho/oid? Q=unknown
!Sg+Nom/Sg+Gen/Sg+Par/Sg+Ill/Pl+Par
!!€gt-norm: Noun ' / '
!!€ : +N+Sg+Nom
!!€ n: +N+Sg+Gen
Expand All @@ -199,6 +203,8 @@ LEXICON N_SHAPUK ! šapuk
:U1 NMN_ ;

LEXICON N_UNI ! uni:un
! _i/en/t/Q/id Q=unknown
!Sg+Nom/Sg+Gen/Sg+Par/Sg+Ill/Pl+Par
!!€gt-norm: Noun ' / '
!!€ : +N+Sg+Nom
!!€ n: +N+Sg+Gen
Expand Down
4 changes: 4 additions & 0 deletions src/fst/morphology/affixes/propernouns.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -33,6 +33,10 @@ LEXICON PROP_SARV
N_SARV ;
LEXICON PROP_TEGII
! Proper-noun entry point: adds no tags or surface material here and
! continues directly to the common-noun continuation lexicon N_TEGII.
N_TEGII ;
LEXICON PROP_MARJ
! Proper-noun entry point: adds no tags or surface material here and
! continues directly to the common-noun continuation lexicon N_MARJ.
! The two lines below are a paradigm key: the first lists the endings,
! the second names the slot each ending belongs to, in the same order.
! _0/an/ad/aha/oid
!Sg+Nom/Sg+Gen/Sg+Par/Sg+Ill/Pl+Par
N_MARJ ;


! vim: set ft=xfst-lexc:
Expand Down
2 changes: 1 addition & 1 deletion src/fst/morphology/affixes/quantifiers.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@

LEXICON NUM_KAKS1
!! **LEXICON @LEXNAME@**
+Sg+Nom:ks' K ;
+Sg+Nom:ksʼ K ;
+Sg+Gen:hten K ;

LEXICON NUM_YKS1
Expand Down
38 changes: 38 additions & 0 deletions src/fst/morphology/stems/propernouns_newwords.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,44 @@ LEXICON PROP_NEWWORDS
test:test N_ "" ;
!! ADD NOUNS BELOW

Aaron+N+Prop:Aaron N_MARJ ;
Adam+N+Prop:Adam N_MARJ ;
Afin+N+Prop:Afin N_MARJ ;
Ahaz+N+Prop:Ahaz N_MARJ ;
Ahim+N+Prop:Ahim N_MARJ ;
Amon+N+Prop:Amon N_MARJ ;
Aram+N+Prop:Aram N_MARJ ;
Damask+N+Prop:Damask N_MARJ ;
Efes+N+Prop:Efes N_MARJ ;
Egipt+N+Prop:Egipt N_MARJ ;
Eliakim+N+Prop:Eliakim N_MARJ ;
Erast+N+Prop:Erast N_MARJ ;
Esrom+N+Prop:Esrom N_MARJ ;
Fares+N+Prop:Fares N_MARJ ;
Feliks+N+Prop:Feliks N_MARJ ;
Fest+N+Prop:Fest N_MARJ ;
Filip+N+Prop:Filip N_MARJ ;!weird _p/ppan/ppad/Q/id
Germas+N+Prop:Germas N_MARJ ;
Harran+N+Prop:Harran N_MARJ ;
Irod+N+Prop:Irod N_MARJ ;
Isak+N+Prop:Isak N_MARJ ;
Isav+N+Prop:Isav N_MARJ ;
Jakov+N+Prop:Jakov N_MARJ ;
Jason+N+Prop:Jason N_MARJ ;
Joafam+N+Prop:Joafam N_MARJ ;
Joan+N+Prop:Joan N_MARJ ;
Joram+N+Prop:Joram N_MARJ ;
Krisp+N+Prop:Krisp N_MARJ ;
Naasson+N+Prop:Naasson N_MARJ ;
Pilat+N+Prop:Pilat N_MARJ ;
Sion+N+Prop:Sion N_MARJ ;
Valaam+N+Prop:Valaam N_MARJ ;
Vavilon+N+Prop:Vavilon N_MARJ ;
Viflejem+N+Prop:Viflejem N_MARJ ;
Vooz+N+Prop:Vooz N_MARJ ;
Zevs+N+Prop:Zevs N_MARJ ;
Zilot+N+Prop:Zilot N_MARJ ;

Iisus+N+Prop:Iisus N_MARJ ;
Jumal+N+Prop:Jumal N_POIG ;
Ižand+N+Prop:Ižand N_POIG ;
Expand Down

0 comments on commit 1018a03

Please sign in to comment.