From 6d7d58f8795f4edee25e3c88b5ebc9b72c2421cc Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Judithe=20Denb=C3=A6k?= Date: Fri, 25 Oct 2024 23:56:53 +0000 Subject: [PATCH] =?UTF-8?q?=C3=A9g=20skil=20ekki=20=C3=BEessi=20helv=C3=AD?= =?UTF-8?q?tis=20flag=20diakrit=C3=ADskir,=20to=20be=20continued=20=C3=A1?= =?UTF-8?q?=20m=C3=A1nudaginn?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/fst/morphology/Makefile.am | 8 +-- src/fst/morphology/affixes/noun-to-noun.lexc | 4 +- src/fst/morphology/root.lexc | 14 +++++- src/fst/morphology/stems/semtagged/food.txt | 49 ++++++++++--------- .../morphology/stems/semtagged/nouns_sem.lexc | 22 +++++---- 5 files changed, 59 insertions(+), 38 deletions(-) diff --git a/src/fst/morphology/Makefile.am b/src/fst/morphology/Makefile.am index 810a6f747..d13fdaec3 100644 --- a/src/fst/morphology/Makefile.am +++ b/src/fst/morphology/Makefile.am @@ -36,14 +36,15 @@ GT_LEXC_SRCS_L1_L2=\ stems/abbreviations.lexc \ stems/acronyms.lexc \ stems/nouns.lexc \ - stems/semtagged/nouns_sem.lexc \ stems/numerals.lexc \ stems/particles.lexc \ stems/pronouns.lexc \ stems/propernouns.lexc \ stems/verbs.lexc \ + stems/semtagged/nouns_sem.lexc \ stems/semtagged/verbs_sem.lexc \ - affixes/enclitics.lexc \ + affixes/semtagged/noun-to-noun_sem.lexc \ + affixes/semtagged/pre-inflections-nouns.lexc \ affixes/loanwords.lexc \ affixes/noun-to-noun.lexc \ affixes/noun-to-verb.lexc \ @@ -56,7 +57,8 @@ GT_LEXC_SRCS_L1_L2=\ affixes/inflections-nouns.lexc \ affixes/inflections-verbs-IV.lexc \ affixes/inflections-verbs-TV.lexc \ - affixes/inflections-NUM.lexc + affixes/inflections-NUM.lexc \ + affixes/enclitics.lexc # If you are building an error-detecting L2 analyser, specify the lexc files # that differ between the regular L1 and the L2 analysers below, in L1 and diff --git a/src/fst/morphology/affixes/noun-to-noun.lexc b/src/fst/morphology/affixes/noun-to-noun.lexc index c216c9e8c..eebdef82b 100644 --- a/src/fst/morphology/affixes/noun-to-noun.lexc +++ b/src/fst/morphology/affixes/noun-to-noun.lexc @@ -272,6 +272,9 @@ LEXICON ZsaqZmorf !!= * @CODE@ derivationsmorfemer til nominer ZsaqZ ; LEXICON Z1+qaZmorf !!= * @CODE@ derivationsmorfemer til nominer +@C.Z1qaZmorf@ deflagged_Z1qaZmorf ; + +LEXICON deflagged_Z1qaZmorf Der_nn_TRUNC ; recessive_TRUNCrsuaq ; Z1+qaZ ; @@ -631,7 +634,6 @@ LEXICON Der_nn_ALL +LIRSAAR+Der/nv+UTE+Der/vn+LIAQ+Der/nn:lersaarusiaq tp ; !piviusulersaarusiaq +LIRSAAR+Der/nv+UTE+Der/vn:lersaarut tpt ; +LIUR+Der/nv+TAR+Der/vv+USIQ+Der/vn:liortaaseq ZseqZ ; -+MINIQ+Der/nn:mineq Z2+rZmorf ; @U.Num.Pl@+MINIQ+Der/nn+ALUK+Der/nn:@U.Num.Pl@%minaaluk tup- ; @U.Num.Pl@+MINIQ+Der/nn+ALUK+Der/nn:@U.Num.Pl@%minaaluk tup- ; !231019 PN. paarnaminaalunnillu +MINIQ+Der/nn+ARAQ+Der/nn+INNAQ+Der/nn:mineeraannaq tup- ; diff --git a/src/fst/morphology/root.lexc b/src/fst/morphology/root.lexc index 0981d384e..a448cafdc 100644 --- a/src/fst/morphology/root.lexc +++ b/src/fst/morphology/root.lexc @@ -89,7 +89,8 @@ TA+ !!≈ * **@CODE@** = præfiks +Sem/Unit !!≈ * **@CODE@** = Unit !Til besværlige låneord som 'time' etc., der optræder absolut +Sem/Url !!≈ * **@CODE@** tag til adresser af typen www.ccc.cc +Sem/misse !!≈ * **@CODE@** tag til at markere usikker possessor for misse - + +!####SEMANTISK LEKSIKON###! !! ### 20241022 semtag lexicon migration checklist !! ### taglist: Katersat !! Verbs @@ -103,6 +104,15 @@ TA+ !!≈ * **@CODE@** = præfiks +Sem/food-c-h +Sem/food-m-h +@U.Z1ssZmorf@ +@C.Z1ssZmorf@ + +@U.Z2rZ@ +@U.Z1qaZmorf@ +@U.Z2rZmorf@ + +@P.Z2rZmorf@ + !! ### Grammar @@ -948,4 +958,6 @@ LEXICON Root !!= ## @CODE@ pointing to main parts of speech Forkortelser ; !!≈ - **@CODE@** Akronymer ; !!≈ - **@CODE@** Pronomen ; !!≈ - **@CODE@** + sem_nouns ; !!≈ - **@CODE@** + ! Kingumoorutit ; !Testmodel sammen med Der/Test diff --git a/src/fst/morphology/stems/semtagged/food.txt b/src/fst/morphology/stems/semtagged/food.txt index 96a6c80da..811e1b457 100644 --- a/src/fst/morphology/stems/semtagged/food.txt +++ b/src/fst/morphology/stems/semtagged/food.txt @@ -1,10 +1,11 @@ list of entries tagged with food in Katersat migrated to nouns_sem.lexc file: ✅ - +nogle tilføjet i Sem/an og Sem/A, Sem/Aich ✅allaq ✅cuvette +✅gluten ✅eqaluk ✅forloren hare ✅inumineq @@ -23,6 +24,8 @@ migrated to nouns_sem.lexc file: ✅ ✅saarullik ✅tangeq ✅taquaq +✅t-bone steaki -> T-bonesteak +✅uummat @@ -74,47 +77,45 @@ tuttup qimerlua tuttup talia tuttup uummataa - - +stem:uummat +tuttup uummataa +savaaqqap uummataa moved stem aapaartoq -> jfood +aappatit +akuutissalersornagu nerisassiaq amaateeraq +amusat aqerlortigaq +assaqqoq +karrymi marinerigaq kimittussuseq mamarilluagaq mamarisaq mamartuliaq mamma -qiteqqutaq -sakiamineq -mikiarneq -uusuliaq -gluten -amusat -qajuusiassat inuussutissartaat -aappatit -akuutissalersornagu nerisassiaq -ulluinnarsiutit manniliaq +mikiarneq +neqi anaalerlugu aqilisagaq neqimineq nersussuaaqqap quttoraaneersoq - -nersuteeqqamit sakiamineq -karrymi marinerigaq neqimineq tuttup quttoraaneersoq neqimineq umimmaap quttoraaneersoq -qimerluup neqqarinnera -umimmaap quttoramerna silarleq nersussuup quttoramerna silarleq -t-bone steaki +nersuteeqqamit sakiamineq +oquutaasaq pamiallup eqqaani neqqarinneq -neqi anaalerlugu aqilisagaq pukusumineq siatassaq +qajuusiassat inuussutissartaat +qaleralilaat +qatigak qimerluk +qimerluup neqqarinnera +qiteqqutaq qungaseq -assaqqoq -qatigak -oquutaasaq -qaleralilaat \ No newline at end of file +sakiamineq +ulluinnarsiutit +umimmaap quttoramerna silarleq +uusuliaq diff --git a/src/fst/morphology/stems/semtagged/nouns_sem.lexc b/src/fst/morphology/stems/semtagged/nouns_sem.lexc index 61df40b6e..e6c88b6ab 100644 --- a/src/fst/morphology/stems/semtagged/nouns_sem.lexc +++ b/src/fst/morphology/stems/semtagged/nouns_sem.lexc @@ -28,9 +28,12 @@ ! (Sem/H OR just inuk | Sem/Hnat OR just kalaaleq, qallunaaq | Sem/f-an | Sem/an) + MINIQ = Sem/food ! kunne måske omdannes i et filter +LEXICON sem_nouns +food ; +animal ; +anatomical ; - -!LEXICON food +LEXICON food allaq+Sem/food:allaq Z1Zmorf ; !brystkødet på en fugl avaleraasartooq+Sem/food:avaleraasartooq Z1Zmorf ; eqaluk+Sem/food:eqaluk Z2-Zmorf ; @@ -57,7 +60,7 @@ qallunaaq+MINIQ+Der/nn+Sem/food:qallunaamineq Z2+rZ ; ! MINIQ qeeraq+Sem/food:qeeraq Z1+qaZmorf ; quaq+Sem/food:quaq Z1Zmorf ; quttoraq+Sem/anost+MINIQ+Der/nn:quttoramineq Z2+rZ ; ! MINIQ -sakiak+MINIQ+Der/nn+Sem/food:sakiamineq Z2+rZ ; ! MINIQ +!sakiak+MINIQ+Der/nn+Sem/food:sakiamineq Z2+rZ ; ! MINIQ saarullik+Sem/food:saarullik Z2-Zmorf ; sava+Sem/food:sava Z1VZmorf ; tangeq+Sem/food:tangeq Z2Zmorf ; @@ -76,7 +79,7 @@ ossobuco+Sem/food:ossobuco N_Loan_o ; !egentl. italiensk T-bonesteak+Sem/food:T-bonesteak N_Loan ; -!LEXICON animal +LEXICON animal allaq+Sem/A:allaq Z1Zmorf ; !bjørn, brunbjørn, landbjørn avaleraasartooq+Sem/A:avaleraasartooq Z1Zmorf ; eqaluk+Sem/Aich:eqaluk Z2-Zmorf ; @@ -100,11 +103,11 @@ tuttu+Sem/A+Orth/Alt:tuttoq Krestr ; aborre+Sem/Aich:aborre N_Loan_e ; -!LEXICON anatomical +LEXICON anatomical puku:puku SUKgemin ; !20241007 TEMPORARY SOLUTIONS delignen må fikses på anden måde! -quttoraq+Sem/anost:quttoraq Z1+qaZmorf ; -sakiak+Sem/an:sakiak Z1+ssZmorf ; -sakiak+Sem/an:sakiak Z1Zmorf ; !NN230217 sakiannilu !JD20241025 kan man ikke bare tilføje en linje/linjer med et flag i samme fleksionsleksikon som den første +quttoraq+Sem/anost:quttoraq Z1+qaZmorf ; !Z1+qaZmorf +@U.Z1ssZmorf@sakiak+Sem/an:@U.Z1ssZmorf@sakiak anatomical_pre_nn_suff ; !Z1+ssZmorf +!sakiak+Sem/an:sakiak Z1Zmorf ; !NN230217 sakiannilu !JD20241025 kan man ikke bare tilføje en linje/linjer med et flag i samme fleksionsleksikon som den første uummat+Sem/an:uummat tptmorf ; !######### !LOANWORDS @@ -116,4 +119,5 @@ uummat+Sem/an:uummat tptmorf ; !######### !LOANWORDS !######### -gluten+Sem/ch-chem:gluten N_Loan ; \ No newline at end of file +gluten+Sem/ch-chem:gluten N_Loan ; +