From 63caf83576d80a916c175fd260a93d9c071ebd17 Mon Sep 17 00:00:00 2001 From: Jack Rueter Date: Sat, 16 Nov 2024 15:56:04 +0200 Subject: [PATCH] Add exceptions for possessive suffixes --- src/fst/morphology/Makefile.am | 1 + src/fst/morphology/root.lexc | 2 +- src/fst/morphology/stems/exceptions.lexc | 21 +++++++++++++++++++++ 3 files changed, 23 insertions(+), 1 deletion(-) create mode 100644 src/fst/morphology/stems/exceptions.lexc diff --git a/src/fst/morphology/Makefile.am b/src/fst/morphology/Makefile.am index 5b277862..509b8d0a 100644 --- a/src/fst/morphology/Makefile.am +++ b/src/fst/morphology/Makefile.am @@ -40,6 +40,7 @@ GT_LEXC_SRCS_L1_L2=\ stems/adjectives_newwords.lexc \ stems/adpositions.lexc \ stems/adverbs.lexc \ + stems/exceptions.lexc \ stems/nouns.lexc \ stems/nouns_newwords.lexc \ stems/numerals.lexc \ diff --git a/src/fst/morphology/root.lexc b/src/fst/morphology/root.lexc index 7fbc0706..ed9042f8 100644 --- a/src/fst/morphology/root.lexc +++ b/src/fst/morphology/root.lexc @@ -506,7 +506,7 @@ LEXICON Root V_NEWWORDS ; ! SUBJUNCTION ; PRONOUN-TYPES ; - + EXCEPTIONS ; !! ### Other lexica LEXICON CC_ diff --git a/src/fst/morphology/stems/exceptions.lexc b/src/fst/morphology/stems/exceptions.lexc new file mode 100644 index 00000000..d110a012 --- /dev/null +++ b/src/fst/morphology/stems/exceptions.lexc @@ -0,0 +1,21 @@ +!! Exceptions are quite strange word-forms, the ones that do not fit anywhere +!! else. This file contains all enumerated word forms that cannot reasonably be +!! created from lexical data by regular inflection. Usually there should be next +!! to no exceptions; it is always better to have a paradigm that covers only +!! one or a few words than an exception, since exceptions will not work nicely +!! with e.g. the compounding scheme or possibly many end applications. + +LEXICON EXCEPTIONS + +! 
special nouns with possessive suffixes: each entry pairs lemma+N (upper side) with the stem (lower side) and continues into POSS_SUF + +ak+N:aka POSS_SUF ; +baba+N:baba POSS_SUF ; +emagaine+N:emagaiže POSS_SUF ; +mama+N:mama POSS_SUF ; +mezʼ+N:mehe POSS_SUF ; +poigaine+N:poigaiže POSS_SUF ; +sünduine+N:sünduiže POSS_SUF ; +tat+N:tata POSS_SUF ; + +