Skip to content

Commit

Permalink
Fjernet QATIGIIP 2. afsnit
Browse files Browse the repository at this point in the history
  • Loading branch information
planggard committed Oct 12, 2023
1 parent 09fc0b3 commit 3b8ef63
Show file tree
Hide file tree
Showing 3 changed files with 29 additions and 13 deletions.
6 changes: 4 additions & 2 deletions src/cg3/disambiguator.cg3
Original file line number Diff line number Diff line change
Expand Up @@ -1813,7 +1813,7 @@ LIST FEM = "aana" "aleqa" "anaana" "arnaq" "naja" "ningiu" "niviarsiaraq" "panik
LIST GEOOBJ = "imaq" ("naalap" VIK) "nuna" "qarmaq" "qeqertaq" "sermeq" "sineriak" "sissaq" "tungi"; # a specific set of possible objects, used to disambiguate e.g. sinip vs. siner and ersi vs. ersip
# Set of three base forms; presumably holiday names, judging by the set name — confirm.
LIST HOLIDAY = "juulli" "poorski" "piinsi" ;
LIST HUM = (/"ajor"\ Gram/IV\ TUQ/l) "angut" "arnaq" (/"atuar"\ Gram/HV\ Gram/IV\ QATE/l) ("atuar" TUQ) "ikinngut" "ila" "ilaqutaq" (/"iner"\ Gram/IV\ SIMA\ Der/vv\ Gram/IV\ TUQ/l) "innuttaq" "inuk" ("inuusup" TUQ) (/"iser"\ Gram/IV\ TUQ/l) "kalaaleq" "meeraq" "niviarsiaq" "niviarsiaraq" "nukappiaq" "nukappiaraq" "peqataasoq" (/"peqat"\ U\ Der/nv\ Gram/IV\ TUQ/l) (/"pissaq"\ U\ Der/nv\ Gram/IV\ NIQ\ Der/vn\ LIK/l) "qallunaaq" "sanileq" (/"siuaa"\ Gram/TV\ TAQ/l) "tarneq" "tarnik" "utoqqaq" ; # tarneq and tarnik are included because they are often the object of +HUM verbs; ilaqutaq because it is often used adjectivally, on a par with arnaq and others.
LIST INDERIVERENDE_SUBSTANTIV_X = (/"aki"\ [^\(Gram\/IV\)]/l SSAQ) "akiliut" "angajoqqaaq" (/"angala"\ Gram/IV\ UTE\ Der/vn/l) "aningaasartuut" "ASN" "ataatsimiititaliaq" (/"ataatsimiip"\ Gram/IV\ TIP\ Der/vv\ Gram/TV\ TAQ\ Der/vn\ LIAQ/l) "atuakkiaq" "billet" "blogger" "bloggeri" "blog" "cand.mag." "cand. mag." "direktør" "eqqaassutissaq" "ersiut" "filmiliaq" ("film" LIAQ) "igalaasartooq" "ilaqutaq" "ilassinnissut" ("iluaqut" N) "ilisimatusartoq" "inatsit" "inerteqqut" "innuttaq" "isertugaq" "isi" ("isuma" N) (/"isuma"\ QATE\ Der/nn\ GIIP\ Der/nv\ Gram/IV\ UTE/l N) (LIAQ N) "malittarisassaq" "minister" "mittarfik" (/"mip"\ Gram/IV\ TAR\ Der/vv\ Gram/IV\ VIK/l) (/"naalagaq"\ LIRSUR\ Der/nv\ Gram/TV\ HTR\ Der/vv\ Gram/IV\ TUQ/l) "naapeqatigiinneq" ("\(N|n\)akorsaaneq"r) "nalliuttorsiorneq" "nalunaarusiaq" "nassaaq" "nioqqut" "nunap inoqqaavi" "nuuttoq" "oqallissaarut" "oqaluttuaq" "oqaluttuarisaaneq" "oqartussaaffik" "oqimaassusilik" ("pasitsaap" TAQ) "peqataasoq" (/"peqat"\ GIIP\ Der/nv\ Gram/IV\ VIK\ Der/vn\ N/l) "peqqussut" "piffissaliussaq" (/"pilersaar"\ Gram/HV\ UTE\ Der/vn/l) "pineq" "piniartoq" "pisortaq" "pisortaqarfik" "pisuttuarneq" "politik" "qaartartorsuaq" "qaatigooq" "saassussineq" (/"salip"\ Gram/IV\ UTE\ Der/vn/l) "sanaaq" "sinniisoq" (/"siunnersor"\ Gram/TV\ HTR\ Der/vv\ Gram/IV\ TUQ/l) "siunnersorti" (/"suli"\ Gram/IV\ TUQ/l) "suliaqartoq" "suliassaq" "sungiusaasoq" "taaguutilik" "tigummiaq" (/"timersor"\ Gram/IV\ QATE\ Der/vn\ GIIP\ Der/nv\ Gram/Reci\ Gram/IV\ VIK/l) "toqqammavik" "tunngavilersuutige" "ujaasineq" (/"paasi"\ Gram/TV\ Gram/Refl\ Gram/IV\ UTE/l) FAM TUGAQ ;
# Mixed set of base forms, composite tags and line-match regexes (/…/l).
# The "isuma" … GIIP … UTE entry accepts the analysis both with and without Gram/Reci after
# GIIP Der/nv, in line with the "peqat" and "timersor" entries of this list, which carry Gram/Reci.
# NOTE(review): in the first entry, [^\(Gram\/IV\)] is a negated character class that consumes a
# single character; it is not "anything other than Gram/IV". Left unchanged — confirm the intent.
LIST INDERIVERENDE_SUBSTANTIV_X = (/"aki"\ [^\(Gram\/IV\)]/l SSAQ) "akiliut" "angajoqqaaq" (/"angala"\ Gram/IV\ UTE\ Der/vn/l) "aningaasartuut" "ASN" "ataatsimiititaliaq" (/"ataatsimiip"\ Gram/IV\ TIP\ Der/vv\ Gram/TV\ TAQ\ Der/vn\ LIAQ/l) "atuakkiaq" "billet" "blogger" "bloggeri" "blog" "cand.mag." "cand. mag." "direktør" "eqqaassutissaq" "ersiut" "filmiliaq" ("film" LIAQ) "igalaasartooq" "ilaqutaq" "ilassinnissut" ("iluaqut" N) "ilisimatusartoq" "inatsit" "inerteqqut" "innuttaq" "isertugaq" "isi" ("isuma" N) (/"isuma"\ QATE\ Der/nn\ GIIP\ Der/nv\ \(Gram/Reci\ \)?Gram/IV\ UTE/l N) (LIAQ N) "malittarisassaq" "minister" "mittarfik" (/"mip"\ Gram/IV\ TAR\ Der/vv\ Gram/IV\ VIK/l) (/"naalagaq"\ LIRSUR\ Der/nv\ Gram/TV\ HTR\ Der/vv\ Gram/IV\ TUQ/l) "naapeqatigiinneq" ("\(N|n\)akorsaaneq"r) "nalliuttorsiorneq" "nalunaarusiaq" "nassaaq" "nioqqut" "nunap inoqqaavi" "nuuttoq" "oqallissaarut" "oqaluttuaq" "oqaluttuarisaaneq" "oqartussaaffik" "oqimaassusilik" ("pasitsaap" TAQ) "peqataasoq" (/"peqat"\ GIIP\ Der/nv\ Gram/Reci\ Gram/IV\ VIK/l) "peqqussut" "piffissaliussaq" (/"pilersaar"\ Gram/HV\ UTE\ Der/vn/l) "pineq" "piniartoq" "pisortaq" "pisortaqarfik" "pisuttuarneq" "politik" "qaartartorsuaq" "qaatigooq" "saassussineq" (/"salip"\ Gram/IV\ UTE\ Der/vn/l) "sanaaq" "sinniisoq" (/"siunnersor"\ Gram/TV\ HTR\ Der/vv\ Gram/IV\ TUQ/l) "siunnersorti" (/"suli"\ Gram/IV\ TUQ/l) "suliaqartoq" "suliassaq" "sungiusaasoq" "taaguutilik" "tigummiaq" (/"timersor"\ Gram/IV\ QATE\ Der/vn\ GIIP\ Der/nv\ Gram/Reci\ Gram/IV\ VIK/l) "toqqammavik" "tunngavilersuutige" "ujaasineq" (/"paasi"\ Gram/TV\ Gram/Refl\ Gram/IV\ UTE/l) FAM TUGAQ ;
LIST INDERIVERENDE_UNDTAGELSE = (/LIAQ\ Der/nn\ U\ Der/nv\ Gram/IV\ TUQ/l) (/"pooq"\ SSAQ\ Der/nn\ LIAQ/l) (/"akoq"\ SSAQ\ Der/nn\ LIAQ/l); # to be able to distinguish LIAQ in a congruent-adjunct ("kongruensadled") context from LIAQ as a full noun, and to exempt lexicalizations
# Set INDERIVERENDE_TITEL: base forms and line-match regexes (/…/l).
# The "naalagaq" LIRSUR … TUQ pattern used to be listed twice verbatim; one copy is enough,
# since a LIST is a set and the duplicate added nothing.
LIST INDERIVERENDE_TITEL = "adjunkt" "bachelor" (/"ilisima"\ Gram/IV\ TUUQ/l) "lektor" "minister" (/"naalagaq"\ LIRSUR\ Der/nv\ Gram/TV\ HTR\ Der/vv\ Gram/IV\ TUQ/l) "Naalakkersuisoq" (/"oqaaseq"\ QAR\ Der/nv\ Gram/IV\ TAR\ Der/vv\ Gram/IV\ TUQ/l) "professor";
#LIST VERBALNOMEN = "isuma" "oqaluttuaq" "naapeqatigiinneq" ;
Expand Down Expand Up @@ -14619,7 +14619,7 @@ REMOVE:8599F (*) - iSem/Hprof (0 ("sakkutooq")) ; #Jude 20231010
# Drop readings whose analysis line matches "avat" ARSUK when the same cohort (position 0)
# also has a reading with base form "avataarsuaq". The trailing comment is an example sentence.
REMOVE:8599G (/"avat"\ ARSUK/l) IF (0 ("avataarsuaq")); #USA-p præsidentiata tullersortaa Mike Pence, USA-p AVATAARSUANUT tunngasunut siunnersuisoqatigiivinut, National Space Councilimut, oqalugiarnermini taama ilaatigut oqarpoq.
# Drop POSSESSUM readings analysed as "ip" + Gram/IV or Gram/TV (+ optional Gram/Pass) + TUQ
# when the same cohort also has a reading with base form "ittu" or "ittoq".
# The trailing comment is an example phrase.
REMOVE:8599H (/"ip"\ Gram/[IT]V\ \(Gram/Pass\ \)?TUQ/l) + POSSESSUM IF (0 ("ittu") OR ("ittoq")); #Politiit ITTUAT
# Drop the "ittu" reading when the same cohort also has an "ittoq" reading.
REMOVE:8599I ("ittu") IF (0 ("ittoq")) ; #PL20231010 judged to be slightly more frequent (presumably refers to "ittoq", the reading that is kept — confirm)

# Drop readings whose analysis line matches "umik" ARSUK when the same cohort (position 0)
# also has a reading whose analysis line matches "umiaq" SUAQ.
REMOVE:8599J (/"umik"\ ARSUK/l) IF (0 (/"umiaq"\ SUAQ/l));


# Nomen eller pron
Expand Down Expand Up @@ -15406,7 +15406,9 @@ REMOVE:5559B (/QATE\ Der/nn\ GIIP\ Der/nv/l) OR QATE + GIIT IF (0 (/QATE\ Der/vn
(NEGATE 0 (/QATE\ Der/nn\ GIIT\ Der/nn\ N\ Aeq\ Pl/l) LINK 1 V - 3Pl - 4Pl)#NAALAGAAFFEQATIGIITTUT suleqatigiilluarutta nukittunerussaagut, taanna oqarpoq.
(NEGATE 0 (/"isuma"\ QATE\ Der/nn\ GIIP\ Der/nv\ Gram/Reci\ Gram/IV\ \(iSem/agree\ \)?UTE\ Der/vn\ N\ Lok/l) LINK 1 (/"allap"\ Gram/HV\ \(iSem/write\ \)?SIMA/l) )#Taannali aatsaat savalimmiormiut kalaallillu oqartussaasuisa imarisaanik akuersinerisigut atuutilissasoq, ISUMAQATIGIISSUMMI allassimavoq.
(NEGATE *-1 Rel LINK 1 Rel + CONJ-C LINK *1 (/"isuma"\ QATE\ Der/nn\ GIIP\ Der/nv\ Gram/Reci\ Gram/IV\ \(iSem/agree\ \)?UTE/l) + 3PlPoss + &&IV_SUBJ& LINK *1 V + &&IV_SUBJ& BARRIER (*) - Adv)#Nunatta USA-llu siorna oktobari naalersoq ISUMAQATIGIISSUTIGISAAT aamma sammineqassasoq ilimagineqarpoq
(NEGATE 0 (/\(SIUT|UTE\)\ Der/nn\ LIK\ Der/nn\ QATE\ Der/nn/l)) # blocked when the cohort has a SIUT- or UTE- + LIK + QATE reading; \(SIUT|UTE\) is an alternation group ([SIUT|UTE] was a one-character class that also matched any tag ending in S, I, U, T or E)
;
# Drop the verbal analysis LIR Der/nv (+ optional Gram/IV or Gram/TV) QATE Der/vn GIIP
# when the same cohort also has the nominal analysis LIK Der/nn QATE Der/nn GIIP.
REMOVE:5559C (/LIR\ Der/nv\ \(Gram/[IT]V\ \)?QATE\ Der/vn\ GIIP/l) IF (0 (/LIK\ Der/nn\ QATE\ Der/nn\ GIIP/l)) ;
# Drop "ukior" + QATE readings when the same cohort also has an "ukioq" + QATE reading.
REMOVE:5560 ("ukior") + QATE IF (0 ("ukioq") + QATE) ;
# Drop "ilik" + U + USIQ readings when the same cohort also has an "ilior" + USIQ reading.
REMOVE:5561 ("ilik") + U + USIQ IF (0 ("ilior") + USIQ) ;
# Drop LIK + U readings when the same cohort also has a reading in the set LIUR.
REMOVE:5562 LIK + U IF (0 LIUR) ;
Expand Down
18 changes: 16 additions & 2 deletions src/fst/affixes/derivations-inflections.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -481,6 +481,7 @@ LEXICON Z1Zmorf !!= * @CODE@ Derivationsmorfemer til nominer, viser til **tp** o
+SIAQ+Der/nn+TUAQ+Der/nn:%>siatuaq tp ;
+SIUT+Der/nn:%>siut tpt ;
+SIUT+Der/nn+LIK+Der/nn:%>siuti Z2+lZ ;
+SIUT+Der/nn+LIK+Der/nn+QATE+Der/nn:%>siutileqat tpt ;
+SIUT+Der/nn+NNGUAQ+Der/nn:%>siutinnguaq Z1nnguaqZ ;
+SIUT+Der/[email protected]@+Der/nn:%>[email protected]@ tup- ;
+SIUT+Der/[email protected]@+Der/nn+ALUK+Der/nn:%>[email protected]@ tup- ;
Expand Down Expand Up @@ -521,6 +522,17 @@ LEXICON Z1Zmorf !!= * @CODE@ Derivationsmorfemer til nominer, viser til **tp** o
+SSAQ+Der/nn+SIAQ+Der/nn+KKAAQ+Der/nn:%>%TRUNCssarsiakkaaq tp ;
+SSAQ+Der/nn+SIAQ+Der/nn+SSAQ+Der/nn:%>%TRUNCssarsiassaq tp ;
+SSAQ+Der/nn+SIAQ+Der/nn+SSAQ+Der/nn+GALUAQ+Der/nn:%>%TRUNCssarsiassaraluaq Z2aqZ ; !liv 170130
+SSAQ+Der/nn+SIUT+Der/nn:%>%TRUNCssarsiut tpt ;
+SSAQ+Der/nn+SIUT+Der/nn+LIK+Der/nn:%>%TRUNCssarsiuti Z2+lZ ;
+SSAQ+Der/nn+SIUT+Der/nn+LIK+Der/nn+QATE+Der/nn:%>%TRUNCssarsiutileqat tpt ;
+SSAQ+Der/nn+SIUT+Der/nn+NNGUAQ+Der/nn:%>%TRUNCssarsiutinnguaq Z1nnguaqZ ;
+SSAQ+Der/nn+SIUT+Der/[email protected]@+Der/nn:%>%[email protected]@ tup- ;
+SSAQ+Der/nn+SIUT+Der/[email protected]@+Der/nn+ALUK+Der/nn:%>%[email protected]@ tup- ;
+SSAQ+Der/nn+SIUT+Der/[email protected]@+Der/nn+SUAQ+Der/nn:%>%[email protected]@ Z2aqZ ;
+SSAQ+Der/nn+SIUT+Der/nn+RUJUK+Der/nn+SUAQ+Der/nn:%>%TRUNCssarsiuterujussuaq Z2aqZ ;
+SSAQ+Der/nn+SIUT+Der/nn+SSAQ+Der/nn:%>%TRUNCssarsiutissaq tp ;
+SSAQ+Der/nn+SIUT+Der/nn+VIK+Der/nn:%>%TRUNCssarsiutivik tup- ;
+SSAQ+Der/nn+SIUT+Der/nn+VIK+Der/nn+SSAQ+Der/nn:%>%TRUNCssarsiutivissaq tp ;
+SSAQ+Der/nn+SUAQ+Der/nn:%>%TRUNCssarsuaq Z2aqZ ;
+SSAQ+Der/nn+SUNNI+Der/nn:%>%TRUNCssarsunni tp ;
+SSAQ+Der/nn+TAQ+Der/nn:%>%TRUNCssartaq tp ;
Expand Down Expand Up @@ -557,6 +569,8 @@ LEXICON Z1Zmorf !!= * @CODE@ Derivationsmorfemer til nominer, viser til **tp** o
+SUAQ+Der/nn+USAQ+Der/nn:%>%TRUNCrsuaasaq tp ;
+SUAQ+Der/nn+USAQ+Der/nn+SUAQ+Der/nn:%>%TRUNCrsuaasarsuaq Z2aqZ ;
+SUAQ+Der/nn+UTE+Der/nn:%>%TRUNCrsuaat tpt ;
+SUAQ+Der/nn+UTE+Der/nn+LIK+Der/nn:%>%TRUNCrsuaati Z2+lZ ;
+SUAQ+Der/nn+UTE+Der/nn+LIK+Der/nn+QATE+Der/nn:%>%TRUNCrsuaatileqat tpt ;
+SUAQ+Der/nn+VIK+Der/nn:%>%TRUNCrsuavik tup- ;
+SUNNI+Der/nn:%>sunni tp ;
+SUNNI+Der/nn+ALAAQ+Der/nn:%>sunnialaaq tp ;
Expand Down Expand Up @@ -8656,7 +8670,7 @@ LEXICON Z2-Zmorf !!= * @CODE@ derivationsmorfemer til tup- paa K. Jf. Z2-qZmorf
+USAQ+Der/nn+SUAQ+Der/nn:%>%TRUNCusarsuaq Z2aqZ ;
+UTE+Der/nn:%>%TRUNCut tpt ;
+UTE+Der/nn+LIK+Der/nn:%>%TRUNCuti Z2+lZ ; !05112020
+UTE+Der/nn+LIVIK+Der/nn:%>%TRUNC%ProgIusivik tup- ;
+UTE+Der/nn+LIK+Der/nn+QATE+Der/nn:%>%TRUNCutileqat tpt ;
+UTE+Der/nn+SSAQ+Der/nn:%>%TRUNCutissaq tp ;
+UTE+Der/nn+SUAQ+Der/nn:%>%TRUNCussuaq Z2aqZ ;
+UTE+Der/nn+TAAQ+Der/nn:%>%TRUNCutitaaq tp ;
Expand Down Expand Up @@ -113344,7 +113358,7 @@ LEXICON tpt !!= * @CODE@
+GIP+Der/nv:%>igip XIiXmorf_stem ;
+GISSAAR+Der/nv:%>igissaar IV_r_stem ;
!+GISSAAR+Der/nv+GI+Der/vv:%>igissaari XIgujoqX ;
[email protected]@+Der/nv:%>[email protected]@ XIiXmorf_stem ;
[email protected]@+Der/nv+Gram/Reci:%>[email protected]@ XIiXmorf_stem ;
+IAR+Der/nv:%>aajar HTR_r_GAQ_i ;
+ILATSI+Der/nv:%>ilatsi IV_voq ;
[email protected]@+Der/nv+Gram/IV:%>[email protected]@ IV_r ; !+IR+Der/nv+NIAR+Der/vv
Expand Down
18 changes: 9 additions & 9 deletions src/fst/stems/nouns.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -391,8 +391,8 @@ aataqqiut tptmorf ;
aatsar+Gram/IV+NAVIIR+Der/vv+Gram/IV+UTE+Der/vn:aatsarnaveeqqut tptmorf ;
aatsialak Z2-Zmorf ;
aatsialaq Z1Zmorf ;
aatsitaq Z1Zmorf ;
aatsitassaq Z1Zmorf ;
!aatsitaq Z1Zmorf ;
!aatsitassaq Z1Zmorf ;
aatsitassarsiuut tptmorf ;
aatsoq Z1Zmorf ;
aatsorluut tptmorf ;
Expand Down Expand Up @@ -36983,18 +36983,18 @@ umiarsuaarartaartoq Z1Zmorf ;
umiarsuaartoq Z1Zmorf ;
umiarsuaartorpaluttoq Z1Zmorf ;
umiarsuaartortoq Z1Zmorf ;
umiarsuaat tptmorf ;
umiarsuaatilik:umiarsuaati Z2+lZmorf ;
umiarsuakkoortitaq Z1Zmorf ;
umiarsualiorfik Z2-Zmorf ;
umiarsualiorneq Z2Zmorf ;
umiarsualiortoq Z1Zmorf ;
!umiarsuaat tptmorf ;
!umiarsuaatilik:umiarsuaati Z2+lZmorf ;
!umiarsuakkoortitaq Z1Zmorf ;
!umiarsualiorfik Z2-Zmorf ;
!umiarsualiorneq Z2Zmorf ;
!umiarsualiortoq Z1Zmorf ;
umiarsualiveqarfik Z2-Zmorf ;
umiarsualivik Z2-Zmorf ;
umiarsualiviliorneq Z2Zmorf ;
umiarsuapalaaq Z1Zmorf ;
umiarsuapiluk Z2-Zmorf ;
umiarsuaq Z2aqZmorf ;
!umiarsuaq Z2aqZmorf ;
umiarsuarmioq Z1Zmorf ;
umiarsuarmiu Z1VZmorf ;
umiarsuarsiortoq Z1Zmorf ;
Expand Down

0 comments on commit 3b8ef63

Please sign in to comment.