Skip to content

Commit

Permalink
morfemkombinationer + verbs + nouns
Browse files Browse the repository at this point in the history
  • Loading branch information
Juutitta committed Oct 14, 2023
1 parent dae7fe6 commit 6e5d337
Show file tree
Hide file tree
Showing 4 changed files with 40 additions and 37 deletions.
33 changes: 18 additions & 15 deletions src/cg3/disambiguator.cg3
Original file line number Diff line number Diff line change
Expand Up @@ -1595,7 +1595,7 @@ LIST OQARPOQ = (/"oqar"\ Gram/IV\ V/l) (/"oqar"\ Gram/IV\ NNGIT\ Der/vv\ Gram/IV
# 'erserpoq' as an inline match, because only the intransitive impersonal form can be an inquit
LIST ORATIOOBLVERBnOQAR = "aalajanger" "aalianger" (/"aarleqqut"\ GE/l) (/"aki"\ Gram/IV\ V/l) ("allap" USIQ GE) (/"allap"\ Gram/HV\ Gram/IV\ USIQ\ Der/vn\ GE\ Der/nv\ Gram/TV\ TAQ\ Der/vn\ QAR/l) (/"angu"\ Gram/TV\ \(NIAR\ Der/vv\ Gram/TV\ \)?TAQ\ Der/vn\ GE/l) ("apeqqut" GE) ("apeqqut" U) "apere" ("assuarliut" GE) "eqqaa" "eqqaama" "eqqartor" "erseqqissar" "erseqqissaatige" (/"erseqqissar"\ Gram/TV\ UTE\ Der/vn\ GE/l) (/"erser"\ Gram/IV\ V/l 3Sg) ("erser" QQIP TAQ UTE GE)
(/"ilimasaarut"\ \(\(i\)?Sem/predict\ \)?GE/l)
"ilimage" "ilimasup" ("ili" SIMA TIP HTR) (/"ilisima"\ Gram/IV\ TIP/l) "ilisimatitsi" "ilisimatitsissut" "ilumoor" "imaap" ("inassut" GE) "inassutige" (/"innersuup"\ Gram/TV\ UTE\ Der/vn\ GE/l) ("isuma" LIUR) ("isuma" QAR) ("isuma" QATE GIIP) "isummer" "kaammattor" "kajumissaar" "kalerrip" (/"kissar"\ UTE\ Der/vn\ GE/l) "maluge" "malunnar" "malunnarsi" "marser" (/"mianersor"\ Gram/IV\ QQU/l)
"ilimage" "ilimasup" ("ili" SIMA TIP HTR) (/"ilisima"\ Gram/IV\ TIP/l) "ilisimatitsi" "ilisimatitsissut" "ilumoor" "imaap" ("inassut" GE) "inassutige" ("isuma" LIUR) ("isuma" QAR) ("isuma" QATE GIIP) "isummer" "kaammattor" "kajumissaar" "kalerrip" (/"kissar"\ UTE\ Der/vn\ GE/l) "maluge" "malunnar" "malunnarsi" "marser" (/"mianersor"\ Gram/IV\ QQU/l)
#"misissor" #skal genovervejes. Masser af uventede konsekvenser
"missinger" "missingersuutige" "naatsorsor" "naggaser" (/"nale"\ LIR\ Der/nv\ Gram/TV/l) (/"nale"\ LIRSUR\ Der/nv/l) "nalu" "nalunaar" "nalunaarfige" "nalunaarut" "nalunaarutige" (/"nassuerut"\ GE/l) "nassuerutige" (/"nassuiar"\ Gram/TV\ UTE\ Der/vn\ GE/l) (/"nassuiar"\ Gram/TV\ V/l) "neriorsor" "neriup" "nipangiup"
(/"nillia"\ Gram/IV\ UTE\ Der/vn\ GE/l) #PL20230206
Expand Down Expand Up @@ -2427,7 +2427,7 @@ REMOVE:Arch Orth/Arch + (/\(.*\)/r) (0 (VSTR:$1) - Orth/Arch)
# Drop a reading whose tag line contains a doubled Gram/IV ("nv Gram/IV Gram/IV V")
# when the same cohort also matches the single-Gram/IV variant ("nv Gram/IV V").
# NOTE(review): the (/\(.*\)/r) capture reused via VSTR:$1 presumably requires the
# competing reading to carry the same captured tag text - confirm.
REMOVE:Gram (/nv\ Gram/IV\ Gram/IV\ V/l) + (/\(.*\)/r) (0 (/nv\ Gram/IV\ V/l) + (VSTR:$1)) ; #Jude 20231009 example: AMEERNIARPOQ

### Start of Judithe's section ### begun 20231006: filter out impossible morpheme combinations
### Der/nv
### Der/nv ###
#GASAAR
# Remove every reading that is not in the iSem/anzo set when the cohort matches GASAAR.
REMOVE:MorfGasaar0001 (*) - iSem/anzo (0 GASAAR) ; #Jude 20231006
#GE
Expand Down Expand Up @@ -2460,22 +2460,18 @@ REMOVE:MorfLoc0007 (*) - iProp (0 LocVr) ; #Jude 20231013
# Remove SEM/inst readings when the cohort matches SEM/Hprof + LocSuf + LocVr.
REMOVE:MorfLoc0008 SEM/inst (0 SEM/Hprof + LocSuf + LocVr) ; #Jude 20231013
# Remove SEM/furn or SEM/Hprof readings when the cohort matches the SEM/Lh locative expression in the context.
# NOTE(review): the context mixes OR and + without parentheses - confirm the grouping is the intended one.
REMOVE:MorfLoc0009 SEM/furn OR SEM/Hprof (0 SEM/Lh + LocVr OR SEM/Lh + LocSuf + LocVr) ; #Jude 20231013


#LIR

#LIRNGUSAATE
#LIRI
#LIRSUR
#LIRSUR
#LISAAR
#LISAAR
#LISAR
#LIUR
#LIUR
#LIUTE
#LUP
#NIP
#NNGUR
#NNGUR
#PALAAR
#PALLAP
#PALUP
Expand All @@ -2487,19 +2483,21 @@ REMOVE:MorfQatigiip (*) - iSem/Lciv (0 QATE + GIIP + (/"naalagaq"\ U\ Der/nv\ Gr
#SIUR
#SIUR#Der/nv#UTE#Der/vv
#SUNNIP
#SUNNIP
#SSAQQIP
#SSIP
#TAAR
#TU
#TUR
#U
#USAAR
### Der/nn
# Remove a reading whose tag line is "U Der/nv Gram/IV [optional (i)Sem/... tag] SAAR Der/vv"
# when the cohort also matches USAAR.
# The rule does not fire when the cohort matches ("pitsak").
REMOVE:MorfUsaar0001 (/U\ Der/nv\ Gram/IV\ \(i?Sem/.*\)?SAAR\ Der/vv/l) (0 USAAR)
(NEGATE 0 ("pitsak")) ; #Jude 20231014

### Der/nn ###

### Der/vn
### Der/vn ###

### Der/vv
### Der/vv ###
# Remove the "nipip" reading when the cohort matches RUJUUR.
# NOTE(review): unlike the neighbouring Morf* rules this one carries no rule name - confirm whether that is intentional.
REMOVE ("nipip") (0 RUJUUR) ; #Jude20231009
### End of Judithe's section ###

Expand Down Expand Up @@ -3581,15 +3579,18 @@ SUBSTITUTE:adv41lux (LU)(ADV-LU) TARGET LU IF (0 CONT + 3SgO LINK -1 (Abs Sg) LI
(NEGATE 0 TAR)
; #PL20230118 Matup tigummivia tigoriarlugu kigaatsunnguamik gangi takussallugu, tigummivik TIGULLUGULU assakkut uuvunga tupannermillu nilliavunga.
# Retag LI as CONJ-LI on readings that also carry a $$MOOD tag, provided a cohort to the left
# carries the same unified $$MOOD; the leftward scan is barred by any cohort matching (*) - KOMMA.
SUBSTITUTE:conj1li (LI)(CONJ-LI) TARGET LI + $$MOOD IF (-*1 $$MOOD BARRIER (*) - KOMMA);
SUBSTITUTE:conj2li_1 (LI)(CONJ-LI) TARGET LI IF (0 Sem/Hum) (-*1 BOS BARRIER (*) - FIRSTNAME);
# Retag LI as CONJ-LI when the cohort matches Sem/Hum and BOS is found to the left
# with the scan barred by any cohort matching (*) - FIRSTNAME.
# Blocked when a reading line in the cohort contains "LI Der/vv"
# (NOTE(review): presumably LI as a verbal derivation rather than the enclitic - confirm).
SUBSTITUTE:conj2li_1 (LI)(CONJ-LI) TARGET LI IF (0 Sem/Hum) (-*1 BOS BARRIER (*) - FIRSTNAME)
(NEGATE 0 (/LI\ Der/vv/l));
#Lars ØSTERGAARDILI oqarpoq taamaanngitsoq.
# Retag LI as CONJ-LI on a cohort matching N, Prop, Pron or Adv that directly follows BOS,
# unless the cohort matches TIME or a reading line contains "LI Der/nv".
SUBSTITUTE:conj2li_2 (LI)(CONJ-LI) TARGET LI IF (0 N OR Prop OR Pron OR Adv) (-1 BOS) (NEGATE 0 TIME)
(NEGATE 0 (/LI\ Der/nv/l))# NOTE(review): presumably excludes LI analysed as a Der/nv derivation - confirm
;
# Retag LI as CONJ-LI when the preceding cohort matches KOMMA, unless the NEGATEd chain below
# matches (a $$KASUS cohort to the left, linked rightwards to the target with "taamani",
# followed by a cohort with the same $$KASUS plus Der/vn); the example sentence shows that case.
SUBSTITUTE:conj3li (LI)(CONJ-LI) TARGET LI IF (-1 KOMMA)
(NEGATE *-1 $$KASUS LINK *1 _TARGET_ + ("taamani") BARRIER (*) - KOMMA LINK 1 $$KASUS + Der/vn) #Silassorippasigisannik naapitsigaangama titartagara siulleq, TAAMANILI toqqortarisimasara, atorlugu misilittaasarpunga.
;
SUBSTITUTE:conj4li (LI)(CONJ-LI) TARGET LI IF (*-1 VFIN BARRIER (*) - PUNCT)(0 V LINK 1 EOS);
# Retag LI as CONJ-LI on a V cohort that is directly followed by EOS, when a VFIN cohort is found
# to the left (scan barred by any cohort matching (*) - PUNCT).
# Blocked when a reading line in the cohort contains "LI Der/vv".
SUBSTITUTE:conj4li (LI)(CONJ-LI) TARGET LI IF (*-1 VFIN BARRIER (*) - PUNCT)(0 V LINK 1 EOS)
(NEGATE 0 (/LI\ Der/vv/l))
;

SUBSTITUTE:adv1lix LI ADV-LI TARGET LI (0 HUMAN + U OR TIME + QAR LINK 0 Cau OR CONT OR Par) #meeraallunili, ukioqartungali
(NEGATE *-1 Abs + Sg LINK *1 CONT + 4Sg LINK 1 _TARGET_ + Abs LINK *1 3SgO + 3Sg BARRIER V)#Præsidentissaq Barack Obama nammineq peqataanani PRÆSIDENTINNGORNIUTEQATAASIMASORLI senator John Kerry ataatsimeersuarnermi Poznanimi Polenimi pisumi peqataatippaa.
Expand Down Expand Up @@ -3682,7 +3683,8 @@ REMOVE:7254 Adv + ("kisianni") IF (-1 BOS) ; #Kisianni aramaannarniarit piffissa
# Unconditionally retag LU as CONJ-LU on any reading.
SUBSTITUTE:Sub0001 (LU) (CONJ-LU) TARGET (*) ;
# Retag LUUNNIIT as CONJ-LUUNNIIT + Gram/Conj-encl on any reading, unless the cohort
# already matches one of the CONJ-/ADV- variants listed in the NEGATE.
SUBSTITUTE:Sub0002 (LUUNNIIT) (CONJ-LUUNNIIT Gram/Conj-encl) TARGET (*) IF (NEGATE 0 CONJ-LU OR CONJ-LUUNNIIT OR ADV-LU OR ADV-LUUNNIIT) ; #PL20220926 changed from Gram/Unsafe-encl
SUBSTITUTE:Sub0003 (LI) (CONJ-LI) TARGET (*)
(NEGATE 0 (/LI\ Der/nv/l))#
(NEGATE 0 (/LI\ Der/nv/l))
(NEGATE 0 (/LI\ Der/vv/l))
;


Expand Down Expand Up @@ -9385,6 +9387,7 @@ REMOVE:5490GV ("iki") + humverb + VFIN OR ("ikip") + humverb + VFIN IF (0 (/"iki
# Remove the passive transitive "aalajanger" + SIMA reading when the cohort also matches the non-passive intransitive one.
REMOVE:5490GW ("aalajanger") + Gram/TV + SIMA + Gram/Pass IF (0 ("aalajanger") + Gram/IV + SIMA - Gram/Pass); #aalajangersimavoq
# Remove the "milup" reading when the cohort also matches "milor" and the preceding cohort matches Trm.
REMOVE:5490GX ("milup") IF (0 ("milor") LINK -1 Trm); #”Qimaaqqissanngilatit,” ataataata siniffianut MILORUJUPPAA, ”qimaaqqikkaluarna!” ingerlallunilu.
# Remove the "minguer" + SSUSIQ reading when the cohort also matches "minguip" + SSUSIQ.
REMOVE:5490GY ("minguer") + SSUSIQ IF (0 ("minguip") + SSUSIQ);
# Remove a reading whose line contains "oqip" LI Der/vv when the cohort also matches the lemma "oqili".
REMOVE:5490GZ (/"oqip"\ LI\ Der/vv/l) (0 ("oqili")) ; #Jude 20231014

# Verb or particle?
# Keep only the "aarit" reading when the cohort directly follows BOS.
SELECT:5491A ("aarit") IF (-1 BOS);
Expand Down Expand Up @@ -10113,7 +10116,7 @@ REMOVE:6000V (/"ilimmar"\ Gram/IV\ VIK/l) IF (0 ("Ilimmarfik") + Prop);
REMOVE:6000W FIRSTNAME IF (0 Sem/LastName LINK -1 FIRSTNAME); #Nersornaatisivoq Nauja BIANCO, 29-nik ukiulik, taannalu naalagaaffimmi pissutsit pillugit cand. scient. pol-itut ilinniagaqarsimavoq, maannalu Kultureqarnermut Ilinniartitaanermullu Pisortaqarfimmi sullissisutut atorfeqarluni.

#Proper noun or verb
REMOVE:6100A ("Oqi" Sem/Hum) IF (0 ("oqila") OR ("oqiliallap"));#oqiliallaqaanga
# Remove the "Oqi" Sem/Hum reading when the cohort also matches "oqila", "oqiliallap",
# or a reading line of the form "oqili" [optional Gram/IV] ALLAP Der/vv.
REMOVE:6100A ("Oqi" Sem/Hum) IF (0 ("oqila") OR ("oqiliallap") OR (/"oqili"\ \(Gram/IV\ \)?ALLAP\ Der/vv/l));#oqiliallaqaanga

#The particles
REMOVE:5860 ("taama") + Interj IF (0 ("taama") + Adv LINK 1 V) ;
Expand Down
4 changes: 2 additions & 2 deletions src/fst/affixes/derivations-inflections.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -28509,7 +28509,7 @@ LEXICON IV_voq2 !!= * @CODE@ skal få 200 medl.
!+KUTSUUR+Der/vv+SSA+Der/vv+NIRAR+Der/vv+TAR+Der/vv:%>kutsuussanerartar flex-iv ;
+KUTSUUR+Der/vv+SSAMAAR+Der/vv:%>kutsuussamaar IV-mod_C ;
+KUTSUUR+Der/vv+SSAMAAR+Der/vv+TIGE+Der/vv:%>kutsuussamaartig flex-iv_schwa ;
+KUTSUUR+Der/vv+SSAMAAR+Der/vv+Der/vv+GALUAR+Der/vv:%>kutsuussamaartigigaluar IV-mod_C ;
+KUTSUUR+Der/vv+SSAMAAR+Der/vv+TIGE+Der/vv+GALUAR+Der/vv:%>kutsuussamaartigigaluar IV-mod_C ; ! analysis side must name TIGE: the surface form contains "tigi" (cf. the kutsuussamaartig entry)
!+KUTSUUR+Der/vv+TAR+Der/vv:%>kutsoortar flex-iv ;
!+KUTSUUR+Der/vv+TAR+Der/vv+GALUAR+Der/vv:%>kutsoortaraluar IV-mod_C ;
[email protected]@+Der/vv:%>[email protected]@ flex-iv_voq ;
Expand Down Expand Up @@ -46825,7 +46825,7 @@ LEXICON XItX2 !!= * @CODE@
+INNAR+Der/vv+LLAR+Der/vv+SINNAR+Der/vv:%>%TRUNCinnallarsinnar IV-mod_C ;
+INNAR+Der/vv+LLUINNAR+Der/vv:%>%TRUNCinnarluinnar IV-mod_C ;
+INNAR+Der/vv+NGAJAP+Der/vv:%>%TRUNCinnangajap IV-mod_C ;
+INNAR+Der/vv+NGAJAP+SIMA+Der/vv+Der/vv:%>%TRUNCinnangajassima IV-mod_V ;
+INNAR+Der/vv+NGAJAP+Der/vv+SIMA+Der/vv:%>%TRUNCinnangajassima IV-mod_V ; ! every affix tag is followed by its own Der/vv, as in the sibling NGAJAP entries
+INNAR+Der/vv+NGAJAP+Der/vv+GALUAR+Der/vv:%>%TRUNCinnangajakkaluar IV-mod_C ;
!+INNAR+Der/vv+NGAJAP+Der/vv+TAR+Der/vv:%>%TRUNCinnangajattar flex-iv ;
+INNAR+Der/vv+NIAR+Der/vv:%>%TRUNCinnarniar IV-mod_C ;
Expand Down
22 changes: 11 additions & 11 deletions src/fst/stems/nouns.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -11892,10 +11892,10 @@ inupalaarsuusoq Z1Zmorf ;
inupalaasoq Z1Zmorf ;
Iñupiaq Z1Zmorf ;
iñupiaq Z1Zmorf ;
inupiluk Z2-Zmorf ;
!inupiluk Z2-Zmorf ;
inupilussiaq Z1Zmorf ;
inupilussuaq Z2aqZmorf ;
inupilussuusaartoq Z1Zmorf ;
!inupilussuaq Z2aqZmorf ;
!inupilussuusaartoq Z1Zmorf ;
inupiluuserneq Z2Zmorf ;
inupiluuserniartarneq Z2Zmorf ;
inupiluusertarneq Z2Zmorf ;
Expand Down Expand Up @@ -12547,7 +12547,7 @@ isiginnaariartoq Z1Zmorf ;
isiginnaartitsissut tptmorf ;
isiginnaartitsivik Z2-Zmorf ;
isiginnartitsinerpalaartoq Z1Zmorf ;
isiginngitsuusaartoq Z1Zmorf ;
!isiginngitsuusaartoq Z1Zmorf ;
isiginnittaaseq GEMS ;
isigisassaassuseq SEQgemin ;
isigisassiarinninneq Z2Zmorf ;
Expand Down Expand Up @@ -13151,7 +13151,7 @@ itersineq Z2Zmorf ;
itersioq Z1Zmorf ;
itersisoq Z1Zmorf ;
itersortoq Z1Zmorf ;
itertoq Z1Zmorf ;
!itertoq Z1Zmorf ;
iteruusivik Z2-Zmorf ;
iteruut tptmorf ;
iter+Gram/IV+JAALLU+Der/vv+Gram/IV+TUUQ+Der/vn:itiaallusooq Z1Zmorf ;
Expand Down Expand Up @@ -24325,9 +24325,9 @@ pinngitsaalisaaneq Z2Zmorf ;
pinngitsaalisaannginneq Z2Zmorf ;
pinngitsaalisaasoq Z1Zmorf ;
pinngitsaalisaq Z1Zmorf ;
pinngitsoq Z1Zmorf ;
!pinngitsoq Z1Zmorf ;
pinngitsuugaqanngitsoq Z1Zmorf ;
pinngitsuusaartoq Z1Zmorf ;
!pinngitsuusaartoq Z1Zmorf ;
pinngitsuusoq Z1Zmorf ;
pinngitsuussuseq SEQgemin ;
pi+Gram/IV+NNGIT+Der/vv+Gram/IV+TUQ+Der/vn+U+Der/nv+Gram/IV+TIP+Der/vv+Gram/TV+TAQ+Der/vn+U+Der/nv+Gram/IV+UTE+Der/vn:pinngitsuutitaassut tptmorf ;
Expand Down Expand Up @@ -24798,8 +24798,8 @@ piusarnertooq Z1Zmorf ;
piusoq Z1Zmorf ;
piusugittaatsoq Z1Zmorf ;
piusugittartoq Z1Zmorf ;
piusuusaartitsisoq Z1Zmorf ;
piusuusaartoq Z1Zmorf ;
!piusuusaartitsisoq Z1Zmorf ;
!piusuusaartoq Z1Zmorf ;
piut tptmorf ;
piutaasoq Z1Zmorf ;
piutserfiginninneq Z2Zmorf ;
Expand Down Expand Up @@ -34970,7 +34970,7 @@ toqussinartoq Z1Zmorf ;
toqussut tptmorf ;
toqussutaasoq Z1Zmorf ;
toqusuissoq Z1Zmorf ;
toqusuusaartoq Z1Zmorf ;
!toqusuusaartoq Z1Zmorf ;
toqu+Gram/IV+TIP+Der/vv+Gram/TV+QQU+Der/vv+Gram/TV+UTE+Der/vn:toquteqqussut tptmorf ;
toqutseqataasoq Z1Zmorf ;
toqutsivik Z2-Zmorf ;
Expand Down Expand Up @@ -35751,7 +35751,7 @@ tusaammaseq Z1Zmorf ;
tusaammasiinnarsortoq Z1Zmorf ;
tusaanngisaq Z1Zmorf ;
tusaanngitsoortoq Z1Zmorf ;
tusaanngitsoq Z1Zmorf ;
!tusaanngitsoq Z1Zmorf ;
tusaasaaruttoq Z1Zmorf ;
tusaasoq Z1Zmorf ;
tusaassut tptmorf ;
Expand Down
18 changes: 9 additions & 9 deletions src/fst/stems/verbs.lexc
Original file line number Diff line number Diff line change
Expand Up @@ -2245,7 +2245,7 @@ avalaap XIuteXmorf ;
avalaassup HTR_UTE_SSAQ_ssi ;
avammoor IV_long ;
avammoortip HTR_C_TAQ_tsi ;
avammukar IV_r_stem ;
!avammukar IV_r_stem ;
[email protected]@ IV_voq ;
[email protected]@ HTR_UTE_SSAQ_ssi ;
avannamukaar IV_long_stem ;
Expand Down Expand Up @@ -5102,7 +5102,7 @@ inupalaa IV_voq_stem ;
inupalaar IV_long_stem ;
inupalaarsuu IV_voq_stem ;
inupilussiare:inupilussiar HTR_schwa_SAQ_nnip ;
inupilussuusaar IV_long_stem ;
!inupilussuusaar IV_long_stem ;
inupiluu IV_voq_stem ;
inupiluuser XIirXmorf_stem ;
inuppalup IV_k_stem ;
Expand Down Expand Up @@ -5220,7 +5220,7 @@ inuusussi XIi_voqXmorf_stem ;
inuusussaatige:inuusussaatig HTR_schwa_SAQ_nnip ;
[email protected]@ IV_voq ;
inuusuttuaraa IV_voq_stem ;
inuusaar IV_long_stem ;
!inuusaar IV_long_stem ;
inuusaartip HTR_C_TAQ_tsi ;
inuutige:inuutig HTR_schwa_SAQ_nnip ;
inuutissarsiutigivip TV ;
Expand Down Expand Up @@ -5603,8 +5603,8 @@ isigiarsup IV_k_stem ;
isigilluariar TV ;
isiginere:isiginer HTR_schwa_SAQ_nnip ;
isiginnartitsinerpalaar IV_long_stem ;
isiginngitsuusaar IV_long_stem ;
isiginngitsuusaar HTR_longi_GAQ_nnip ;
!isiginngitsuusaar IV_long_stem ;
!isiginngitsuusaar HTR_longi_GAQ_nnip ;
isiginnittuu IV_voq_stem ;
isiginnaagassialior IV_r_stem ;
isiginnaagassiaa IV_voq_stem ;
Expand Down Expand Up @@ -15093,8 +15093,8 @@ piusartuiu IV_voq_stem ;
piusare:piusar HTR_schwa_SAQ_nnip ;
piusugittar IV_r_stem ;
piusugittaap XItsXmorf_stem ;
piusuusaar IV_long_stem ;
piusuusaartitsi XIi_voqXmorf_stem ;
!piusuusaar IV_long_stem ;
!piusuusaartitsi XIi_voqXmorf_stem ;
piusaar IV_long_stem ;
piusaartitsi XIi_voqXmorf_stem ;
piusaatigiunnaar UDEN_HTR_r_GAQ ; !Meaning unknown
Expand Down Expand Up @@ -16109,7 +16109,7 @@ qallunassi XIi_voqXmorf_stem ;
qallunneri XIi_voqXmorf_stem ;
qallunneritu IV_voq ;
qallunniaa IV_voq_stem ;
qallunaajusaar IV_long_stem ;
!qallunaajusaar IV_long_stem ;
qallunaaminertor IV_r_stem ;
qallunaaq+U+Der/nv+Orth/Arch:qallunaa IV_voq_stem ;
qallunaar+Orth/Arch:qallunaar IV_long_stem ;
Expand Down Expand Up @@ -21849,7 +21849,7 @@ toqussutaa IV_voq_stem ;
toqussaa IV_voq_stem ;
toqussaanngivip XIiXmorf_stem ;
[email protected]@ XIuteXmorf ;
toqusuusaar IV_long_stem ;
!toqusuusaar IV_long_stem ;
toqusaa IV_voq_stem ;
toqutare:toqutar HTR_schwa_SAQ_nnip ;
toqutser UDEN_HTR_r_GAQ ;
Expand Down

0 comments on commit 6e5d337

Please sign in to comment.