# Divvun & Giellatekno - open source grammars for Sámi and other languages
# Copyright © 2000-2010 The University of Tromsø & the Norwegian Sámi Parliament
# http://giellatekno.uit.no & http://divvun.no
#
# This program is free software; you can redistribute and/or modify
# this file under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version. The GNU General Public License
# is found at http://www.gnu.org/licenses/gpl.html. It is
# also available in the file $GTHOME/LICENSE.txt.
#
# Other licensing options are available upon request, please contact
# giellatekno@hum.uit.no or divvun@samediggi.no
# =================================================================== #
# =================================================================== #
# L U L E S Á M I D I S A M B I G U A T O R #
# =================================================================== #
# =================================================================== #
# =========================================== #
# Short table of contents #
# =========================================== #
# Delimiters
# Tags and sets
# Mapping rules
# Disambiguation rules
# One-cohort disambiguation - cycle 0
# Local disambiguation - cycles 1 and 2
# Cycle 2: Other local disambiguation
# Cycle 3: Global disambiguation
# Cycle 4: Syntactic disambiguation
# Cycle 5: Post-syntactic morphological disambiguation
# ========== #
# Delimiters #
# ========== #
DELIMITERS = "<.>" "" ">" "<...>" "<¶>";
# ============= #
# Tags and sets #
# ============= #
# ========
SETS
# ========
LIST BOS = (>>>) ();
LIST EOS = (<<<) (); # vislcg and CG-2 together.
# Tags declared as single-membered LISTs
# ======================================
LIST = ;
LIST = ;
LIST = ;
# Parts of speech
# ---------------
LIST N = N ;
LIST A = A ;
LIST Adv = Adv ;
LIST V = V ;
LIST Pron = Pron ;
LIST CS = CS ;
LIST CC = CC ;
LIST Po = Po ;
LIST Pr = Pr ;
LIST Pcle = Pcle ;
LIST Qst = Qst ;
LIST Num = Num ;
LIST Prop = Prop ;
# POS sub-categories
# ------------------
LIST Pers = Pers ;
LIST Dem = Dem ;
LIST Interr = Interr ;
LIST Indef = Indef ;
LIST Recipr = Recipr ;
LIST Refl = Refl ;
LIST Rel = Rel ;
LIST Interj = Interj ;
LIST Adp = Adp ;
LIST Coll = Coll ;
# Morphosyntactic properties
# --------------------------
LIST Sg = Sg ;
LIST Pl = Pl ;
LIST Nom = Nom ;
LIST Gen = Gen ;
LIST Acc = Acc ;
LIST Ill = Ill ;
LIST Ine = Ine ;
LIST Ela = Ela ;
LIST Com = Com ;
LIST Ess = Ess ;
LIST Par = Par ;
LIST Abe = Abe ;
LIST SgCmp = SgCmp ;
LIST SgNomCmp = SgNomCmp ;
LIST SgGenCmp = SgGenCmp ;
LIST PlGenCmp = PlGenCmp ;
LIST RCmpnd = RCmpnd ;
LIST PxSg1 = PxSg1 ;
LIST PxSg2 = PxSg2 ;
LIST PxSg3 = PxSg3 ;
LIST PxDu1 = PxDu1 ;
LIST PxDu2 = PxDu2 ;
LIST PxDu3 = PxDu3 ;
LIST PxPl1 = PxPl1 ;
LIST PxPl2 = PxPl2 ;
LIST PxPl3 = PxPl3 ;
LIST Comp = Comp ;
LIST Superl = Superl ;
LIST Actor = Actor ;
LIST Actio = Actio ;
LIST Clt = Clt ;
LIST Foc = Foc ;
LIST Attr = Attr ;
LIST Card = Card ;
LIST Ord = Ord ;
LIST Date = Date ;
LIST Range = Range ;
LIST Dim = Dim ;
LIST Inch = Inch ;
LIST Prs = Prs ;
LIST Prt = Prt ;
LIST Ind = Ind ;
LIST Pot = Pot ;
LIST Cond = Cond ;
LIST Imprt = Imprt ;
LIST ImprtII = ImprtII ;
LIST Sup = Sup ;
LIST IV = IV ;
LIST TV = TV ;
LIST Sg1 = Sg1 ;
LIST Sg2 = Sg2 ;
LIST Sg3 = Sg3 ;
LIST Du1 = Du1 ;
LIST Du2 = Du2 ;
LIST Du3 = Du3 ;
LIST Pl1 = Pl1 ;
LIST Pl2 = Pl2 ;
LIST Pl3 = Pl3 ;
LIST Inf = Inf ;
LIST Ger = Ger ;
LIST GerII = GerII ;
LIST ConNeg = ConNeg ;
LIST Neg = Neg ;
LIST PrsPrc = PrsPrc ;
LIST PrfPrc = PrfPrc ;
LIST VGen = VGen ;
LIST VAbess = VAbess ;
LIST CLB = CLB ;
LIST PUNCT = PUNCT ;
LIST LEFT = LEFT ;
LIST RIGHT = RIGHT ;
LIST HYPH = HYPH ;
LIST PAR = PAR ;
# Noun tags
LIST LOC = Ine Ela Loc ; # This set since we imported sme rules, all LOCs must be revised.
# Syntactic tags
# --------------
LIST @+FAUXV = @+FAUXV ;
LIST @+FMAINV = @+FMAINV ;
LIST @-FAUXV = @-FAUXV ;
LIST @-FMAINV = @-FMAINV ;
LIST @-FSUBJ = @-FSUBJ ;
SET FMAINV = @-FMAINV OR @+FMAINV ;
LIST @ADVL = @ADVL ;
LIST @>ADVL = @>ADVL ;
LIST @ADVL< = @ADVL< ;
LIST @ = @ADVL> ;
LIST @-FADVL = @-FADVL ;
LIST @A< = @A< ;
LIST @>A = @>A ;
LIST @ActioN> = @ActioN> ;
LIST @APP = @APP ;
LIST @APP-N< = @APP-N< ;
LIST @APP-Pron< = @APP-Pron< ;
LIST @APP>Pron = @APP>Pron ;
LIST @APP-Num< = @APP-Num< ;
LIST @APP-ADVL< = @APP-ADVL< ;
LIST @CVP = @CVP ;
LIST @CNP = @CNP ;
LIST @CMPND = @CMPND ;
LIST @COMP-CS< = @COMP-CS< ;
LIST @HAB = @HAB ;
LIST @HNOUN = @HNOUN ;
LIST @INTERJ = @INTERJ ;
LIST @MEASURE = @MEASURE ;
LIST @>N = @>N ;
LIST @N< = @N< ;
LIST @NNum> = @NNum>;
LIST @NumN< = @NumN<;
LIST @>Num = @>Num;
LIST @Num< = @Num< ;
LIST @NPron< = @NPron< ;
LIST @NQ< = @NQ< ;
LIST @NUM-PRON = @NUM-PRON ;
#LIST @NUMBER = @NUMBER ;
LIST @OBJ = @OBJ ;
LIST @ = @OBJ> ;
LIST @OPRED = @OPRED ;
LIST @ = @OPRED> ;
LIST @PCLE = @PCLE ;
LIST @PrcN> = @PrcN> ;
LIST @PronN< = @PronN< ;
LIST @PronN> = @PronN> ;
LIST @Pron< = @Pron< ;
LIST @>Pron = @>Pron ;
LIST @P< = @P< ;
LIST @>P = @>P ;
LIST @SPRED = @SPRED ;
LIST @ = @SPRED> ;
LIST @SUBJ = @SUBJ ;
LIST @ = @SUBJ> ;
LIST @SUBJ-QH = @SUBJ-QH ;
LIST @TITLE = @TITLE ;
LIST @VOC = @VOC ;
LIST @X = @X ;
# Semantic tags
# -------------
LIST Ani = Ani ;
LIST Fem = Fem ;
LIST Mal = Mal ;
LIST Obj = Obj ;
List Org = Org ;
LIST Plc = Plc ;
LIST Sur = Sur ;
LIST Tit = Tit ;
LIST HUM-PROP = Fem Mal Sur Tit ;
# Other tags
# ----------
LIST ABBR = ABBR ;
LIST ACR = ACR ;
# Single-word sets
# ----------------
LIST COMMA = "," ;
LIST ¶ = ¶;
# ======== #
# Tag sets #
# ======== #
SETS #
# ======== #
SECTION
LIST WORD = N A Adv V Pron CS CC Adp Po Pr Interj Pcle Pers Dem Interr Refl Recipr Rel Indef ; # any word
# Case sets
# ---------
LIST ADVLCASE = Ill Ine Ela Com Ess Loc ;
LIST OBLCASE = Acc Gen Ill Ine Ela Com Ess Par Loc ;
LIST CASE = Nom Acc Gen Ill Ine Ela Com Ess Par Loc ;
SET NOT-GEN = CASE - Gen ;
# Verb sets
# ---------
SET VERB = V - (V N); # V is all readings with a V tag in them, VERB should
# be the ones without an N tag following the V
# Finiteness and mood
# - - - - - - - - - -
SET V-IND-FIN = Prs OR Prt ; # Problem: "In boahtán" is an invisible indicative
SET V-MOOD = Prs OR Prt OR Pot OR Imprt OR ImprtII OR Cond ;
SET VFIN = V-MOOD - ConNeg ;
SET VFIN-POS = V-MOOD - ConNeg - Neg ;
SET VFIN-NOT-IMP = VFIN - Imprt - ImprtII ;
SET NOT-VFIN = VERB - VFIN ;
# Person
# - - - -
LIST V-SG1 = (V Ind Prs Sg1) (V Ind Prt Sg1) (V Cond Prs Sg1)
(V Cond Prt Sg1) (V Pot Prs Sg1) (V Neg Ind Sg1);
LIST V-SG2 = (V Ind Prs Sg2) (V Ind Prt Sg2) (V Cond Prs Sg2)
(V Cond Prt Sg2) (V Pot Prs Sg2) (V Neg Ind Sg2);
LIST V-SG3 = (V Ind Prs Sg3) (V Ind Prt Sg3) (V Cond Prs Sg3)
(V Cond Prt Sg3) (V Pot Prs Sg3) (V Neg Ind Sg3);
LIST V-DU1 = (V Ind Prs Du1) (V Ind Prt Du1) (V Cond Prs Du1)
(V Cond Prt Du1) (V Pot Prs Du1) (V Neg Ind Du1);
LIST V-DU2 = (V Ind Prs Du2) (V Ind Prt Du2) (V Cond Prs Du2)
(V Cond Prt Du2) (V Pot Prs Du2) (V Neg Ind Du2);
LIST V-DU3 = (V Ind Prs Du3) (V Ind Prt Du3) (V Cond Prs Du3)
(V Cond Prt Du3) (V Pot Prs Du3) (V Neg Ind Du3);
LIST V-PL1 = (V Ind Prs Pl1) (V Ind Prt Pl1) (V Cond Prs Pl1)
(V Cond Prt Pl1) (V Pot Prs Pl1) (V Neg Ind Pl1);
LIST V-PL2 = (V Ind Prs Pl2) (V Ind Prt Pl2) (V Cond Prs Pl2)
(V Cond Prt Pl2) (V Pot Prs Pl2) (V Neg Ind Pl2);
LIST V-PL3 = (V Ind Prs Pl3) (V Ind Prt Pl3) (V Cond Prs Pl3)
(V Cond Prt Pl3) (V Pot Prs Pl3) (V Neg Ind Pl3);
# Some subsets of the VFIN sets
# - - - - - - - - - - - - - - -
SET V-DU = V-DU1 OR V-DU2 OR V-DU3 ;
SET V-PL = V-PL1 OR V-PL2 OR V-PL3 ;
SET V-DU-PL = V-DU1 OR V-DU2 OR V-DU3 OR V-PL1 OR V-PL2 OR V-PL3 ;
SET V-NOT-SG1 = VFIN-NOT-IMP - V-SG1 ;
SET V-NOT-SG3 = V-SG1 OR V-SG2 OR V-DU1 OR V-DU2 OR V-DU3 OR
V-PL1 OR V-PL2 OR V-PL3 ;
SET V-1-2 = V-SG1 OR V-SG2 OR V-DU1 OR V-DU2 OR V-PL1 OR V-PL2 ;
SET V-3 = V-SG3 OR V-DU3 OR V-PL3 ;
# Pronoun sets
# ------------
SETS
LIST MUN = (Pron Pers Sg1 Nom) ;
LIST DON = (Pron Pers Sg2 Nom) ;
LIST SON = ("son" Pron Pers Sg3 Nom) ("sån" Pron Pers Sg3 Nom) ;
LIST MÅJ = (Pron Pers Du1 Nom) ;
LIST DÅJ = (Pron Pers Du2 Nom) ;
LIST SÅJ = (Pron Pers Du3 Nom) ;
LIST MIJPERS = (Pron Pers Pl1 Nom) ;
LIST DIJ = (Pron Pers Pl2 Nom) ;
LIST SIJ = ("son" Pron Pers Pl3 Nom) ("sån" Pron Pers Pl3 Nom) ;
SET PPRON-NOM-NOT-DAT = MUN OR DON OR SON OR MÅJ OR DÅJ OR SÅJ OR MIJPERS OR DIJ OR SIJ ;
SET PPRON-DU-PL = MÅJ OR DÅJ OR SÅJ OR MIJPERS OR DIJ OR SIJ ;
SET PPRON-NOT-SIJ = MUN OR DON OR SON OR MÅJ OR DÅJ OR SÅJ OR MIJPERS OR DIJ ;
LIST PPRON-GEN = (Sg1 Gen) (Sg2 Gen) (Sg3 Gen) (Du1 Gen) (Du2 Gen) (Du3 Gen)
(Pl1 Gen) (Pl2 Gen) (Pl3 Gen);
SET PPRON-NOT-GEN = (Pron Pers) - PPRON-GEN ;
LIST DEM-SG = (Pron Dem Sg Nom);
LIST DEM-PL = (Pron Dem Pl Nom);
SET NOT-DEM = WORD - Dem ;
# Adjectival sets and their complements
# -------------------------------------
SET A-CASE = A - Attr - Adv ;
SET NOT-ADJ = WORD - A ;
SET NOT-Attr = WORD - Attr ;
SET NOT-AA = WORD - A - Adv ;
SET NOT-AAPCLE = WORD - A - Adv - Pcle ;
# Adverbial sets and their complements
# ------------------------------------
SET NOT-ADJ-PCLE = WORD - A - Pcle ;
SET NOT-ADJ-CC = WORD - A - CC ;
SET NOT-ADV = WORD - Adv ;
SET NOT-ADV-PCLE = WORD - Adv - Pcle ;
SET NOT-ADV-PCLE-VFIN = WORD - Adv - Pcle - VFIN ;
SET LEX-ADV = Adv - (A*) ;
SET ADVERBIAL = Adv OR Ill OR Ine OR Ela OR Com OR Ess ;
SET NOT-ADV-N = WORD - Adv - N;
SET NOT-ADV-INDEF = WORD - Adv - Indef ;
SET NOT-ADV-PCLE-ILL = WORD - Adv - Pcle - Ill ;
SET NOT-ADV-PCLE-INDEF = WORD - Adv - Pcle - Indef ;
SET NOT-ADV-PCLE-NEG = WORD - Adv - Pcle - Neg ;
SET NOT-ADVL-PCLE-NEG = WORD - @ADVL - @P< - Pcle - Neg ;
# Coordinators
# - - - - - - -
LIST NEGFOC = (Neg Foc) ;
LIST XGU = "dagu" "degu" ;
# compounds
SET CRD = COMMA OR CC OR ("/") OR XGU ;
# coordinators
# Sets of elements with common syntactic behaviour
# ================================================
LIST COPULAS = "bissot" "liehket" "sjaddat" "soajttet" "viedjet" "årrot" "dáidit" "gártat" "leahkit" "leat" "orrut" "soaitit" "šaddat" "veadjit" ;
#"dáidit" "gártat" ;
# 'Dáidit' can appear without 'leat'.
LIST REALCOPULAS = "liehket" "dáidit" "leat" ;
LIST GerII-V = "ájttsat" "gullat" "gullát" "mannat" "tjuodtjot" "tjåhkkåhit" "vuojnnet" "vællahit" ;
SET V-TRANS-ACT = TV - (Der/Pass) ;
# All active verbs with a TV tag, including AUX-OR-MAIN.
SET V-TRANS-ACT-NOT-ACT = V-TRANS-ACT - Actio - Actor - PrsPrc ;
# Sets for verbs choosing oblique objects or adverbials
# - - - - - - - - - - - - - - - - - - - - - - - - - - -
LIST OPREDV = "adnet" "gåhttjot" "válldet" "atnit" "dadjat" "dahkat" "dulkot" "geavahit" "geahččat" "gohčodit" "gohččut" "meroštallat" "navdit" "váldit" "válljet" ;
LIST ESSV = "aneduvvat" "boahtet" "sjaddat";
# NOUNS
# -----
# NP sets defined according to their morphosyntactic features
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
LIST N-SG-NOM = (N Sg Nom); LIST N-PL-NOM = (N Pl Nom);
SET NOT-ACTOR = N - Actor ;
LIST PROP = (N Prop);
SET CNOUN = N - Prop;
SET CNOUN-PL-NOM = (N Pl Nom) - Prop ;
SET HNOUN = N - RCmpnd ;
SET HNOUN-NOM = (N Nom) - RCmpnd ;
SET N-NOT-GEN = N - (N Gen) ;
SET NP-HEAD = Pron OR HNOUN ;
SET NP-HEAD-SG = (Pron Sg1) OR (Pron Sg2) OR (Pron Sg3) OR (N Sg) - RCmpnd;
SET NP-HEAD-PL = (Pron Pl1) OR (Pron Pl2) OR (Pron Pl3) OR (N Pl) - RCmpnd;
SET NP-HEAD-SG-NOM = (Pron Sg1 Nom) OR (Pron Sg2 Nom) OR (Pron Sg3 Nom) OR (N Sg Nom) - RCmpnd;
SET NP-HEAD-PL-NOM = (Pron Pl1 Nom) OR (Pron Pl2 Nom) OR (Pron Pl3 Nom) OR (N Pl Nom) - RCmpnd;
SET NP-HEAD-NOM = NP-HEAD-SG-NOM OR NP-HEAD-PL-NOM;
SET NP-HEAD-ACC = (Pron Acc) OR (N Acc) - RCmpnd;
SET NP-HEAD-GEN = (Pron Gen) OR (N Gen) - RCmpnd;
# The PRE-NP-HEAD family of sets
# - - - - - - - - - - - - - - - -
SET PRE-NP-HEAD = (Prop Attr) OR (Prop @>N) OR (A Attr) OR ("buorre") OR (Pron Pers Gen) OR (N Gen) OR
Num OR RCmpnd OR CC OR (Pron Dem) OR (Pron Refl Gen) OR (Pron Indef) OR
(PrfPrc @>N) OR (PrfPrc @PrcN>) OR PrsPrc OR (A Ord) ;
# OR (Ill LINK 1 (PrfPrc @AN>)) OR (Com LINK 1 (PrfPrc @AN>)) OR (LOC LINK 1 (PrfPrc @AN>))
# The strict version of items that can only be premodifiers, not parts of the predicate
SET V-PRE-NP = PrfPrc OR PrsPrc OR Actor OR Actio OR (V A) OR (Ind Prs Sg3) OR (Ind Prs Sg1) OR (Imprt Prs Du2) OR (ImprtII Prs Du2) ;
# to be used together with PRE-NP-HEAD before @PrcN> is disambiguated
SET NP-MEMBER = PRE-NP-HEAD OR N ;
SET PRE-A-N = (Pron Pers Gen) OR (Pron Indef) OR Num OR (A Ord) OR (Pron Dem) OR (Pron Refl Gen) ;
SET NOT-PRE-A-N = WORD - PRE-A-N ;
LIST PUNCT-LEFT = (PUNCT LEFT) ;
LIST PUNCT-RIGHT = (PUNCT RIGHT) ;
SET PRE-APP = COMMA OR PUNCT-LEFT OR PRE-NP-HEAD ; # This set ist not only for what can
# stand in front of appositions but also
# postmodifiers.
# There must be a sensible naming convention for these sets...
# Most strict BARRIERs...
SET NPNH = WORD - PRE-NP-HEAD OR ABBR ; # NPNH = "NOT-PRE-NP-HEAD"
SET NPNHV = WORD - PRE-NP-HEAD - V-PRE-NP ; # including possible verbal premodifiers
SET NPNHA = WORD - PRE-NP-HEAD - Adv ; # NPNHA = "NOT-PRE-NP-HEAD-OR-ADV"
SET NPNHAV = WORD - PRE-NP-HEAD - Adv - V-PRE-NP ; # including possible verbal premodifiers
SET NPNHAI = WORD - PRE-NP-HEAD - Adv - Indef ; # NPNHAI = " ...-OR-INDEF"
SET NPNHAII = WORD - PRE-NP-HEAD - Adv - Indef - Ill ; # Illative indir.obj.
SET NPNHAIIP = WORD - PRE-NP-HEAD - Adv - Indef - Ill - Pcle ; # <== is this our NPNH set?
SET NPNHC = WORD - PRE-NP-HEAD - Com ; # "njaŋggofirpmiiguin bivdin"
SET NPNHCCC = WORD - PRE-NP-HEAD - COMMA ;
SET NAPP = WORD - PRE-APP ;
# ... Most sloppy BARRIERs
# Set for NP with participle premodifier
# LocComIll are ok, but only with a PrfPcc to the right
# Other negatively defined sets
# - - - - - - - - - - - - - - -
SET NOT-N = WORD - N ;
SET NOT-NA = WORD - N - A ;
SET NOT-NP = ConNeg OR Inf OR Pcle OR Interj OR CS ; # The set NP-BOUNDARY is bigger.
SET NPROP = N - PROP ;
SET NOT-COMMA = CLB - COMMA OR PUNCT-LEFT OR PUNCT-RIGHT ;
# Nominal sets defined according to their semantical properties
# - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
LIST TITLE = "gånågis" "profehta" "profehtta" ("gásttašit" Der/eaddji) "justitiarius" "majestehta" "prof" "cand.mag" "cand.oecon" "cand.philol" "cand.real" "cand.scient" "cand.theol" "cand" "dr.art" "eksp.hoavd" "eksp.sj" "fenr" "fig" "fil.tri" "gen.lt" "genr" "genr.lt" "h.r.adv" "hr" "kapt" "korp" "lekt" "lic" "ltn" "mag.art" "mag" "majestehta" "merc" "miss" "Miss" "Mr" "Mrs" "odont" "oecon" "ordf" "ossod.dir" "stud.phil." "res.kap" "stud.philol" "vit.ass" "dr" "dr.med" "dr.philos" "dr.theol" ;
LIST ESS-ADVL-N = "bäjvádahka" "biegga" "dálkke" "dulvve" "njáhsto" "rássjo" "sjievnnjet" "arvi" "árga" "baika" ("bassi" N) ("báhkka" N) "beaivvádat" "biegga" "bievla" ("buolaš" N) "čuoika" "čuovga" (".*dálki"r) "dulvi" "mánoheahpi" "muohta" "njáhcu" ("seavdnjat" N) "veaigi" ;
# Time sets
# - - - - -
LIST AIGODAT = "ájge" "gávdda" "ájge#gávdda" "válgga#gávdda" "sámedikke#gávdda" "áigi" (".*áigodat"r) "álgo#áigi" "bargo#áigi" "soahte#áigi" "soahte#gaska#áigi" ;
LIST VAHKKU = "biejvve" "b" "gidá" "giesse" "tijmma" "jánndur" "båddå" "tjaktja" "tjaktja#giesse" "tjaktja#sjievnnjet" "tjuohte#jahke" "dálvve" "kloahkka" "kloahkko" "kl" "doajmma#jahke" "gierdde" "giesse" "gidá" "bálle" "idja" "jahke" "jahke#tjuohte" "mánno" "mihttsamárra" "riegádim#biejve" "vahkko" "stuorradigge#gávdda" "1700-#låhko" "1700-#jahke#låhko" "beaivi" "jándor" "bodda" "čakča" "čakča#geassi" "čakča#seavdnjat" "čuohte#jahki" "dálvi" "diibmu" "eahket" "eahket#bodda" "geassi" "giđđa" "idja" "iđit" "iđit#bodda" "jahki" "jahke#bealle" "jahke#čuohti" "kaleanddar#jahki" "loahppa#jahki" "mánnu" "minukta" "njealjádas#jahki" "skuvla#jahki" "tiibma" "vahkko#loahppa" "vahkku" "b" "bievla#jahki" "bivdo#áigi" (".*#beaivi"r) "D-#beaivi" "dienas#jahki" "doaibma#jahki" "eamiálbmot#jahki" "earre#jahki" "gaska#idja" "geardi" "juovla#bassi" "luome#jahki" "luopmo#jahki" "mihcamárra" "muorje#jahki" "nisson#jahki" "vuoito#jahki" "vuođđo#skuvla#vahkku" ("[0-9]*#-jahki"r) ("[0-9]*-#jahki"r) "[0-9]*-[0-9]*-#jahki" "[0-9]*-[0-9]*-#lohku" ("[0-9]*-#lohku"r) ("[0-9]*#-lohku"r) ;
# The quoteless jahki here is since the preprocessor is not fine-tuned
# yet, it still gives '"1870-" # jahki N Sg Com'. # lets see if "dbm" works
LIST AJGGI = "ájgge" (".*#ájgge"r) "áigi" (".*#áigi"r) ;
LIST MANNU = "ådå-jak-#mánno" "ådåjakmánno" "guovvamánno" "snjuktjamánno" "vuoratjismánno" "moarmesmánno" "biehtsemánno" "snjilltjamánno" "bårggemánno" "ragátmánno" "gålgådismánno" "basádismánno" "javllamánno" "ođđa#jage#mánnu" "ođđa#jagi#mánnu" "guovva#mánnu" "njukča#mánnu" "njuvčča#mánnu" "márs#mánnu" "cuoŋo#mánnu" "cuoŋos#mánnu" "cuoŋu#mánnu" "gáranas#mánnu" "miesse#mánnu" "mái#mánnu" "geasse#mánnu" "suoidne#mánnu" "borge#mánnu" "šnjilča#mánnu" "šnjilža#mánnu" "čakča#mánnu" "golggot#mánnu" "skábma#mánnu" "november#mánnu" "ritne#mánnu" "juovla#mánnu" ;
LIST BEAIVI = "mánnodak" "dijstak" "gasskavak" "duorastak" "bierjjedak" "lávvodak" "ájllek" "basse" "albmái#mannan#beaivi" "bargočoahkkin#beaivi" "beassáš#beaivi" "mánnodat" "vuoss#árga" "disdat" "maŋŋeb#árga" "gaska#vahkku" "duorastat" "bearjadat" "juovla#beaivi" "lávvardat" "lávvordat" "sotna#beaivi" "sábbát" "skille#duorastat" "álbmot#beaivi" "árga#beaivi" "bargo#beaivi" "beaivi" "duopmo#beaivi" "riegádan#beaivi" "skuvla#beaivi";
SET TIME = MANNU OR VAHKKU OR BEAIVI OR AJGGI ;
# Do not add AIGODAT, it has some other characteristics in some cases.
LIST GIESSEK = "dálvvek" "gidak" "giessek" ("giessek" Adv) "tjaktjak" "dálvet" "dálvit" "giđđat" "geasset" ("geassit" Adv) "čakčat" ;
# Amount sets
# - - - - - -
LIST MEASURE = "mijlla" "kilo#mehter" "mehtar" "mehter" "senti#mehter" "sm" "milli#mehter" "stihkko" "salla" "lihttar" "kilo" "unnánasj" "cl" "lihtar" (".*#lihtter"r) "dl" "lihtter" "ml" "mg" "kg" "kilo" "kilu" "gilo" "tonna" "čuolda#badji" "dumá" "fierbme#badji" "gaska" "miila" (".*#mehtar"r) (".*#mehter"r) "mehtar" "mehter" "sente" "cm" "tumá" "állan" "salla" "buolaš#ceahkki" "buolaš#gráda" "liegga#ceahkki" "liegga#gráda" "uhcánaš" "unnánaš" "jahki" "minukta" "sekunda" "vahkku" "mánnu" "diibmu" ;
LIST CURRENCY = "kråvnnå" "kr" "¢" "€" "$" "denara" "dollár" "euro" "kruvdnu" "ru" "rubel" "ruvdno" "ruvdnu" ;
LIST NUMUNIT = "tjuohte" "tuvsán" "millijåvnnå" "milijåvnnå" "mill" "mil" "milliárdda" "mrd" "čuohti" "duhát" "miljon" "millijovdna" "milliovdna" "milj" "miljo" "miljarda" ;
LIST KLASS = "ássje" "bálkká#tsiehkke" "s" "sijddo" "§" "§§" "páragráffa" "oasse" "kap" "kapihtal" "ášši" "bálká#ceahkki" "čuokkis" "siidu" "paragráfa" "oassi" "kapihttal" ;
LIST AKTA = "akta" "okta" ;
SET NUMERALS = Num - AKTA ;
# this set does not contain ordinals, I am not sure if that is necessary.
SET CARDINALS = Num - Ord ;
LIST ALU = ("allu" Gen)("assu" Gen)("čiekŋu" Gen)("gassu" Gen)("govdu" Gen)
("guhkku" Gen)("lossu" Gen)("stuorru" Gen)("viidu" Gen);
# Those are words that only appear in one form, which Nickel calls A/G.
# They are only in a predicative position.
# needs to be translated . Are they translatable, do these forms exist in Julev (TO)?
# Semantic noun-sets
# -------------------
LIST HUMAN-smj = "áddjá" "áhkká" "áhkko" "áhttje" "áhttje#bielle" "ájttek" "bárne#bárnne" "bárne#niejdda" "bárnne" "bárnne#bielle" "biebbmo#bárnne" "biddno#moarsse" "boaddnje" "gájmme" "gállasj#guojmme" "gállasj#ålmåj" "gálojinitja" "goasske" "goasske" "gieruk" "guolle#bivdde" "ibme" "ieddne" "ieddne#bielle" "iemet" "irgge" "iset" "násste#dåbdde" "niejdda" "næjttso" "næjttso#riehko" "oarbben#bielle" "oarbben" "siessá" "siessal" "sirram#nissun" "svilli" "mannje" "moarsse" "muohtá" "muohtal" "niehpe" "oabbá" "oabbá#bielle" "sijdda" "stáhta#ministar" "tjiehtje" "tjiehtjev" "vehka" "vieljasj" "viellja" "viellja#gieres" "viellja#bielle" "vilpástalle" "æddnul" "ænoj" "årro" ;
LIST HUMAN-sme = "Bergen#-soalddát" "Enodat#sápmelaš" "Guovda#geain#sápmelaš" "Maya#-indiána" "Norgga#-ustit" "Ruošša-#Sápmelaš" "Suonjil#sápmelaš" "Sáme#demokráhtta" "Sámedigge#presideanta" "Sápmi" "Várjjat#sápmelaš" "almennet" "almmolašvuohta" "almmái#olmmoš" "arkeologa" "badje#sápmelaš" "bajit#báhppa" "bargo#veahka" "bassaleaddji" "bassi" "beahtu" "bearaš" "bearaš#minister" "beargalat" "bearre#mánni" "bibliotekára" "biebmo#ministtar" "biila#divvu" "birasgáhtten#ministtar" "birasgáhttenráđđe#addi" "bisma" "bismá" "bispa" "boadnji" "boanda" "boaris" "boazo#doalli" "boazo#eaiggát" "boazo#sápmelaš" "boazo#sápmi" "boazodoallo#hoavda" "boles#meašttir" "buvttadeaddji" "báhkkár" "báhppa" "bálvalan#guoibmi" "bálvaleaddji" "bárdne#mánná" "bárdni" "bártnáš" "davvi#sápmi" "dearvvašvuođa#ministtar" "dekana" "delegašuvdna" "dievdo#olmmoš" "divššohas" "duiskkalaš" "dulka" "duojár" "dáiddár" "dáidár" "dállo#doalli" "dálon" "dálu#eamit" "dálu#isit" "dánskalaš" "dárkkisteaddji" "dáčča" ("duodje#oahpahallat" Actor) "eadni" "eahki" "eaiggát" "eallo#doalli" "ealáhus#doalli" "eamit" "eammi" "eanadoallo#minister" "eanan#doalli" "eanan#eaiggát" "eanan#hearrá" "eanu" "eatnan#doalli" "eatnigiel#hálli" "eaŋkil#olmmoš" "eŋgel" "farao" "fitnodat#doaibmi" "fitnodat#oamasteaddji" "fylkka#ráđđi" "fáldi" "fásta#ássi" "geavaheaddji" "gieldda#minister" "giella#ráđđi" "gili#almennet" "gili#ássi" "girdi" "girko#bálvaleaddji" "girko#dulka" "goaski" "golle#rávdi" "gonagas" "govva#dáiddár" "govva#dáidár" "govvedeaddji" "govvejeaddji" "guoibmi" "guolásteaddji" "guolástus#minister" "guossi" "guovdageaidnolaš" "guođoheaddji" "gáktehas" "gánda" "gávpejas" "gázzi" "hearrá" "hollándalaš" "háldi" "hárjeheaddji" "indiána" "informánta" "ipmil" "irgi" "isit" "israellaš" "johtti#sápmelaš" "johtti#sápmi" "judálaš" "julev#sápmelaš" "julev#sápmi" "justis#ministtar" "juvddálaš" "kandidáhta" "kandidáhtta" "keaisár" "kirurga" "koahkka" "korefereanta" "kránnjá" "kultur#minister" "kursa#oahppi" "lagamuš" "leans#mánni" "leanut" "lestadiánalaš" "logopeda" "luhkkár" "lulli#sápmelaš" "lulli#sápmi" "lunta" "lágideaddji" "láibu" "lávlu" "mannji" "mearra#almmái" "mearra#olmmái" "mearra#sápmi" "ministtar" "mišuneara" "moarsi" "muitaleaddji" "muoŧŧa" "muoŧŧal" "museá#bargi" "musihkka#dahkki" "musihkkár" "máhttájeaddji" "máilmme#meašttir" "mánná" "mánáid#mánná" "mánáš" "mátta#sápmi" "máttar#áddjá" "máttar#áhkku" "neahpi" "neavttár" "nieida" "nieiddaš" "nisson" "nisson#olmmoš" "nisson#áirras" "nisu" "njunuš#jurista" "njávdán#sápmelaš" "noaidi" "nomáda" "nuorra" "nuorta#sápmi" "nuortalaš" "náittos#guoibmi" "návet#vázzi" "oabbá" "oabbá#bealli" "oahpahalli" "oahppan#olmmoš" "oahppi" "oaivadeaddji" "oaivámuš" "oambealli" "oapmahaš" "oappáš" "oarje#sápmelaš" "oarje#sápmi" "oarpmealli" "oktavuođa#olmmoš" "olbmo#bárdni" "olgo#riikkalaš" "olles#olmmoš" "olmmoš" "olmmái" "osku#guoibmi" "osku#viellja" "ossodat#direktevra" "ossodat#direktøra" "ovda#olmmoš" "ovttas#ássi" "ođas#hoavda" "ođas#lohkki" "palestinalaš" "parkeren#fákta" "pasienta" "pedagoga" "plánejeaddji" "poliisa" "politihkar" "politihkkár" "politiija" "prentejeaddji" "presideanta" "profehta" "professor" "reaŋga" "redaktevra" "rehket#doalli" "rehketdoallo#dárkkisteaddji" "rektor" "riika#vuloš" "riikka#ássi" "rist#vánhen" "romalaš" "romer" "ruhttejeaddji" "ruota#suopmelaš" "ruvdna#prinsa" "ruvvejeaddji" "rádje#fákta" "rádje#soalddat" "ráidu" "ránnjá" "rávdi" "rávis#olmmoš" "ráđđe#addi" "ráđđe#almmái" "ráđđe#olmmái" "ráđđi" "samarialaš" "sealge#eadni" "sester" "siessal" "siessá" "siida#guoibme#nisu" "siida#guoibmi" "silba#rávdi" "sis#eatnan#sápmelaš" "skibir" "skihpár" "skohter#vuoddji" "smávva#gánda" "snihkkár" "soahte#olmmái" "soalddat" "sohka" "sohka#goddi" "sosionoma" "sosiála#ministtar" "spábba#čiekči" "spábbačiekčan#hárjeheaddji" "stipendiáhta" "stivra#lahttu" "studeanta" "stáhta#almennet" "stáhta#boargár" "stáhta#ministtar" "stáhta#ráđđi" "stállu" "sundi" "suodjalus#eŋgel" "suodjalus#minister" "suohkan#báhppa" "suohkan#plánejeaddji" "sága#doalli" "sáme#demokráhtta" "sáme#dikke#ráđđi" "sáme#duojár" "sáme#gielat" "sáme#mánná" "sáme#nisson" "sáme#nisu" "sáme#nuorra" "sámedigge#presideanta" "sámedikke#áirras" "sápmi" "sárdnideaddji" "sátne#jođiheaddji" "sávza#doalli" "taksi#vuoddji" "telefon#vástideaddji" "tuollár" "turista" "turista#ofelaš" "uksa#fákta" "ulda" "universitehta#lektor" "unnit#lohku" "ustit" "veahka" "verdde" "vieljaš" "viellja" "viellja#bealli" "viesso#hoiddár" "viissis" "vilbealli" "virge#guoibmi" "virge#olmmoš" "vuohppa" "vuokta#čuohppi" "vuon#áhkku" "vuoni" "vuoras#olmmoš" "vuoste#bealli" "vuoste#belle" "vuotna#sápmelaš" "vuotna#ássi" "váhnen" "váldo#doaimmaheaddji" "várre#presideanta" "áddjut" "áddjá" "áhkku" "áhkkut" "áhkká" "áhčči" "áirras" "ákšo#álmmái" "álbmot" "álbmot#guoibmi" "ámmát#olmmoš" "ámmát#olmmái" "ámta#mánni" "ássi" "čalbme#eadni" "čalbme#áhkku" "čeahci" "čeahcit" "šibit#doalli" "čiekči" "čorgejeaddji" "čála#oahppavaš" (".*#geahčči"r) (".*#guovttis"r) (".*#guovttos"r) (".*#mánni"r) (".*#vuoddji"r) (".*#vuovdi"r) (".*#álbmot"r) (".*advokahta"r) (".*artista"r) (".*assisteanta"r) (".*bagadalli"r) (".*bagadeaddji"r) (".*bargi"r) (".*bearaš"r) (".*biigá"r) (".*bivdi"r) (".*dikšu"r) (".*direktevra"r) (".*dirigeanta"r) (".*divššár"r) (".*doaimmaheaddji"r) (".*doavttir"r) (".*duopmar"r) (".*duopmár"r) (".*dutki"r) (".*hoavda"r) (".*hábmejeaddji"r) (".*joavku"r) (".*journalista"r) (".*jođiheaddji"r) (".*komiteá"r) (".*kommišuvdna"r) (".*konsuleanta"r) (".*meannudeaddji"r) (".*oahpaheaddji"r) (".*sadjásaš"r) ("sápmi" N Pl) (".*sássa"r) ("suddu" Der/laš) (".*teknihkar"r) (".*terapeuta"r) (".*terapevta"r) (".*veahka"r) (".*veahkki"r) (".*áittardeaddji"r) (".*čearda"r) (".*čuojaheaddji"r) (".*čálli"r) ;
LIST HUMAN-sma = "maana" ;
SET HUMAN = HUMAN-sma OR HUMAN-sme OR HUMAN-smj ;
LIST ANIMAL-smj = "boatsoj" "guokkardiddje" "guolle" "judos" "rievsak" "sávttsa" "vierttsa" ;
LIST ANIMAL-sme = "ábe#gáhttu" "ásen" "beana" "bohkká" "bussá" "čeavrris" "ciiku" "čivga" "dámmá" "ealit" "fuođđu" "gáhttu" "gáica" "gálbi" "gihcci" "guigu" "gussa" "heasta" "horti" "láppis" "loddi" "máhtu" "njiŋŋálas" "ore" "sávza" "sávza#beana" "smávva#fuođđu" "spiinne#čivga" "spiidni" "vársá" "vársi" "vielppis" "vierca" "vuoksá" "vuoncá#varis" "vuonccis" "ealga" "rievssat" "áldu" "boazu" "čearpmat" "čora" "eallu" "heargi" "miessi" "sarvvis" "vierro#boazu" "vuonjal" "bálddis" "čuska" "dápmot" "diddi" "diksu" "dorske#guolli" "dorski" "duovvi" "gilot" "guolli" "hávga" "juksu" "luos#juolgi" "luossa" "luossa#guolli" "luossa#nálli" "muortu" "sallit" "sáidi" "sáiva#guolli" "šákša#dorski" "stábbasáidi" "stáinnir" "stuora#sáidi" "rutnot" "veajet" "čora" "eallu" "hearge#ráidu" "ákta" "báiski" "bovttáš" "cagan" "čearret" "gádde#loddi" "gáiru" "meara#loddi" "skávli" "skuolfi" "šuoršu" "albatrossa" "alit#bađuš" "alit#gaccet" "alit#oai#gaccet" "bakku" "baste#suorsi" "bađoš#gaccet" "beahce#báhcat#loddi" "beahce#loddi" "bealdo#cihci" "bealdo#garjá" "bealdo#vuorra" "bealge#loddi" "beallje#loađgu" "beallje#rásttis" "bearal#skuolfi" "beaste#rages" "beibboš" "beibboš#cihci" "beibboš#cizáš" "belddoš#vizar" "beškkoš" "beštor" "biegga#fálli" "biehkan" "bigán" "bihcabas#čáihni" "bihcebas#gáski" "bihcebas#čáihni" "bisse#hávka" "bižus" "boaimmáš" "boallo#njukča" "boađđo#civkkán" "borjjastit" "borse#njunni" "bovttáš" "bulddogas" "bumbá" "buoide#gaccet" "buokčat" "buokči" "bupmálaš" "bursa#njunni" "bussá#skuolfi" "buvvedat" "báiski" "bákte#duvvá" "bárbmo#fálli" "bávgoš" "cagan" "cagán" "cielláš" "cihce#skuolfi" "cihrre#lasta#vizar" "civka#leivvoš" "cizaš#fálli" "cizopaš" "cizot" "davve#lasta#vizar" "davve#loddi" "davve#vizar" "deagga#čáihni" "deagge#báiski" "deagge#cihci" "dearbme#rásttis" "derpmoš" "dieldá" "dielko#duvvá" "dihtti" "dikso#báhppa" "dirre#lihká" "doadjo#suorsi" "dokta" "dovtta" "duoršu" "duottar#bižus" "duottar#civka#leivvoš" "duvvá" "duvvá#rásttis" "dálve#beštor" "dálve#ruoivil" "dálvi" "dáža#boaimmáš" "dáža#suorsi" "fasána" "fiehta" "fiervá#vierru" "fiervá#viroš" "fiskes#beštor" "fiskes#cihci" "fiskes#cižáš" "fiskes#gaccet" "fiskes#jievžžan" "fiskes#njun#gáhkkor" "fiskes#vizar" "fiŋka" "gaccepaš" "gaccet" "gahper#báiski" "gahper#vizar" "garjá" "gassa#njunni" "gazza#loddi" "gazze#biehtár" "geađge#jorgu" "geađge#rásttis" "giega#biigá" "giehka" "giehpa#vuonccis" "giella#vealgu" "gierdo#duvvá" "gierdo#rásttis" "gierdo#suorsi" "gierdo#čuonjá" "gierra" "giljobaš" "gilljobaš" "gilva#beštor" "girje#báhcat#loddi" "girje#livkkár" "giron" "goahcce#loddi" "goahppil" "goahppil#gálli" "goahte#goljaš" "goalsi" "goalso#ruoššehas" "goalšo#vizar" "goarga" "goarga#loddi" "goargŋo#haŋŋá" "goaski" "goaskin" "gollaš" "golle#beibboš" "golle#cihci" "golle#gahpir" "golli" "golláš" "gorges#hávda" "gorges#lihkká" "govu#skuolfi" "gođa#loddi" "gožu#vuoražas" "guoik#gáhrit" "guoik#gárri" "guoksa" "guolbba#vierru" "guolbba#viroš" "guolbba#čoavžžu" "guolle#fálli" "guolle#čearret" "guorga" "guossa#báhcat#loddi" "guossa#gaccet" "guossa#ruossa#njunni" "guossa#vizar" "guovssat" "guovsso#loddi" "gussa#goalsi" "guškil#vierru" "guškil#viroš" "guškkástat" "gádde#buvvet" "gádde#skirvi" "gádde#vierru" "gádde#viroš" "gáhkkor" "gáiru" "gállat" "gálli" "gállit" "gáranas" "gáranas#loddi" "gárggo#goalsi" "gárgo#goalsi" "gávla#čuonjá" "hálka#loddi" "haŋŋá" "hearta#vizar" "hoašša#cihci" "hurrat" "hurri" "hurri#goahppil" "hurri#čukčá" "háigir" "háigir#loddi" "hálka" "hálka#gonagas" "hálka#čielkkis" "háskil" "hávda" "idja#skuolfi" "jeagge#fálli" "jeagge#meahkástat" "jeagge#čoavžžu" "jeaggehávut" "kanária#loddi" "keaisár#pingviidna" "jiekŋa#čielkkis" "jiesmi" "jievja#skuolfi" "jievže#loddi" "jávre#sopmir" "leahtto#fálli" "leahtto#spálfu" "leaibe#loddi" "leivvoš" "lidnu" "liidn-elláš" "liin-elláš" "litnut" "livkkár" "loađgu" "loddi" "lodde#gonagas" "lodde#jievži" "luhkka#loddi" "láfol" "láhto#spálfu" "látte#guoksa" "látte#guovssat" "látto#vuonccis" "láŋgá" "meahkástat" "mearra#goaski" "mearra#goaskin" "mearra#gáiru" "mearra#čuonji" "mearra#čuonjá" "mielle#spálfu" "miestta#cihci" "miestta#rásttis" "miestta#vizar" "miestta#šurre#vizar" "molde#cizáš" "muhkke#cizáš" "muogir" "muorra#civkkán" "muorra#gakcu" "mákrealla#čearret" "niehtte#garjá" "niito#civkkán" "njukča" "njurggu" "njurgut" "noaide#loddi" "nuorta#cihci" "nuorta#lasta#vizar" "nuorti" "náhkke#soadjá" "oanehis#njun#čuonjá" "paradiisa#loddi" "pelikan#loddi" "pingviidna" "ribe#skáiti" "riddo#civka#leivvoš" "riddo#vierru" "riddo#viroš" "rievssat" "rievssat#cižáš" "rievssat#fálli" "roavgo#gonagas" "rohto#gaccet" "rohto#vizar" "rohto#čoavžu" "rohto#čoavžžu" "rukses#bađoš" "rukses#beibboš" "rukses#civka#leivvoš" "rukses#fiehta" "rukses#guškil" "rukses#juol#čoavžžu" "rukses#ruivil" "rukses#ruoivil" "rukses#rásttis" "rukses#soadjá" "rukses#suorre#hávut" "ruoivil" "ruoná#beibboš" "ruoná#cihci" "ruoná#cizáš" "ruoná#juol#čoavžžu" "ruoná#čáihni" "ruossalas#njunni" "ruovddagas" "ruovde#cihci" "ruovde#cizáš" "ruođa" "ruošša#boaimmáš" "ruošša#skire" "ruošša#skirri" "ruošša#állat" "ránes#cihci" "ránes#cizáš" "ránes#háigir" "ránes#livkkár" "ránes#rásttis" "ránes#skuolfi" "ránes#skávli" "ránes#snárttal" "ránes#čuonjá" "ránes#čáihni" "rásttis" "rávgoš" "sallet#gáiru" "sallit#gáiru" "sealle#cižáš" "siesse#mohkki" "sieđga#civkkán" "silde#gáiru" "silke#buokča" "sitron#beštor" "skierru" "skilke#skálka" "skire" "skirri" "skiŋge#gaccet" "skoarra" "skuolfi" "skutnja#loddi" "skáhpe#loddi" "skáiti" "skárfa" "skárfa#čielkkis" "skávli" "snárttal" "soadja#njálla" "sopmir" "spoađđo#duoršu" "spálfu" "stoarbma#loddi" "stoarbma#spálfu" "stohkke#gaccet" "stohkke#rievdu" "stohkke#spálfu" "stohpo#háigir" "stohpo#spálfu" "struhcca" "struhcca#loddi" "stuorra#fiehta" "stuorra#giljobaš" "stuorra#guškil" "stuorra#guškkástat" "stuorra#meahkástat" "stuorra#skáiti" "stuorra#skávli" "stuorra#vuodja" "stuorra#vuojaš" "stuorra#čarkkus" "stuorra#čoavžu" "stuorra#čoavžžu" "stuorra#čuonjá" "stálo#beibboš" "stárra" "suoidne#suorsi" "suoidne#čiksa" "suola#skáiti" "suorre#spálfu" "suorsi" "suotnjo#liráš" "suotnjo#čoavžžu" "suovka#cihci" "suvlá" "sáhco#meahkástat" "sáhpán#boaimmáš" "sáhpán#skuolfi" "sáiva#hávda" "sávja#hávda" "sávza#loddi" "toardna#garjá" "toardna#gájon" "uhca#buokča" "uhca#buvvedat" "uhca#báiski" "uhca#ciellá" "uhca#cihci" "uhca#meahkástat" "uhca#njukča" "uhca#saddi" "uhca#vierru" "uhca#viroš" "uhca#čoavžžu" "uhca#čáihni" "ummol#cizáš" "upmol#cizáš" "unduláhtta" "uvlo#hávut" "varra#loddi" "veastareaddji" "viglá#čoavžžu" "vilges#nier#čuonjá" "vilges#soadja#skávli" "vilges#ummol#cizáš" "vilges#vierru" "vilges#viroš" "vilges#čoavžu" "vilges#čoavžžu" "vilgessealčáihni" "vintán" "vuoncá#čivga" "vuoncá#varis" "vizardit" "vuodja" "vuojaš" "vuokta#fiehta" "vuokta#gaccet" "vuokta#goalsi" "vuokta#láfol" "vuokta#skárfa" "vuonccis" "vuonccis#loddi" "vuoražas" "vuorččis" "vuovda#duvvá" "vuovde#civka#leivvoš" "vuovde#gaccet" "vuovde#loddi" "vuovde#meahkástat" "vuovde#rásttis" "vuovde#vizar" "vuovde#vuorččis" "vuovde#čoavžu" "vuovde#čoavžžu" "ábi#rievssat" "áhpe#dokta" "áhpe#dovtta" "áhpe#háskil" "áhpe#hávda" "áhpe#lihkká" "áhpe#spálfu" "ákta" "állat" "čarkkus" "čearret" "čiekčá" "čielkkis" "čiergges#rásttis" "čiksa" "čoađgi" "čukčá" "čuohte#gielas" "čuohte#giella" "čuonji" "čuonjá" "čuonjá#fálli" "čáhce#bávgoš" "čáhce#vuonccis" "čáhppes#bađoš#guškil" "čáhppes#buokča" "čáhppes#seal#beštor" "čáhppes#gaccet" "čáhppes#rásttis" "čáhppes#čoavji" "čáhppes#čoavžu" "čáhppes#čoavžžu" "čáihne#cizáš" "čáihne#gaccet" "čáihni" "šilljo#cihci" ;
#LIST ANIMAL-sma ;
SET ANIMAL = ANIMAL-sme OR ANIMAL-smj ;
SET ANIMATE = HUMAN OR ANIMAL ;
LIST CONCRETE-ROUTE = "gahttun" "njálmme#rájgge" "uksa#rájgge" "væddja" "Álttá-Kárášjoga-#máđidja" "Álttá-Kárášjoga-#máđii" "bálggis" "bievla#geaidnu" "dálve#luodda" "dálve#máđidja" "dálve#máđii" "eanadat#luodda" "E6#-bálggis" "gáhta" "gávpot#gáhta" "geaidnu" "guorra" "johttin#geaidnu" "kultur#luodda" "láhttu" "luodda" "luonddu#bálggis" "máđidja" "máđii" "meahcce#luodda" "ráidu" "reahpen#ráigi" "spáiddar#ráidu" "suohkan#luodda" "váldo#geaidnu" ;
LIST ABSTR-ROUTE = "mijlla" "gaska" "mátki" "miila" "mohkki" "tuvra" ;
SET ROUTE = CONCRETE-ROUTE OR ABSTR-ROUTE ;
LIST ORGANIZATION = (Prop Org) "giddagas" "girku" ;
LIST INSTITUTION = "instituhtta" ;
LIST INDUSTRY = "æládus#tjærdda" ;
LIST EDUCATION = "skåvlla" "vuodo#skåvllå" ;
SET ACTOR = ANIMATE OR INSTITUTION OR ORGANIZATION ;
SET HAB-ACTOR = ACTOR OR INDUSTRY OR EDUCATION OR ("guhti") OR ("guhtis") OR ("guhtimusj") OR ("galles") OR ("gii") OR ("eará") OR Coll OR Pers OR Mal OR Fem OR Sur ;
LIST HAB-CASE = Loc ( Ine) ( Gen) ;
LIST HEADOFPARTS = "oassi" "oajvve#oasse" "bielle" "guhtimusj" "goappátjagá" "proseanta" "%" "nisson#oassi" "váldo#oassi" "bealli" "guhtemuš" "goappašat" "proseanta" "%" ;
# This may be a better partitive set.
# Miscellaneous sets
# ------------------
LIST Px = PxSg1 PxSg2 PxSg3 PxDu1 PxDu2 PxDu3 PxPl1 PxPl2 PxPl3 ;
LIST PX1 = PxSg1 PxDu1 PxPl1 ;
LIST PX2 = PxSg2 PxDu2 PxPl2 ;
LIST PX3 = PxSg3 PxDu3 PxPl3 ;
SET PXNOTSG1 = Px - PxSg1 ; SET PXNOTSG2 = Px - PxSg2 ; SET PXNOTSG3 = Px - PxSg3 ;
SET PXNOTDU1 = Px - PxDu1 ; SET PXNOTDU2 = Px - PxDu2 ; SET PXNOTDU3 = Px - PxDu3 ;
SET PXNOTPL1 = Px - PxPl1 ; SET PXNOTPL2 = Px - PxPl2 ; SET PXNOTPL3 = Px - PxPl3 ;
LIST GASKAL = "gaskal" "gaskii" "gaska" "gaskas" ;
# p-positions that like coordination
SET REALCLB = CLB - COMMA ;
# Border sets and their complements
# ---------------------------------
SET CP = (Pron Interr) OR (Pron Rel) ;
LIST MO-MANge = "gåktu" "gåktus" "gånnå" "gåsstå" "gåsstås" "manen" "goas" "gokko" "gos" "gosa" "govt" "makkár" "man" "manne" "mo" "mot" "mov" "movt" ("nugo" @CVP) (V Qst);
SET MO = MO-MANge - ("man" Foc/ge) ;
LIST SEMICOL = "\;" ;
LIST COL = ":" ;
SET S-BOUNDARY2 = (Pron Interr) OR (Pron Rel) OR ("\;") OR (":") OR ("-") OR ("–") OR (@CVP) ;
SET BOC2 = S-BOUNDARY2 OR BOS ;
SET EOC2 = S-BOUNDARY2 OR EOS ;
SET NP-BOUNDARY = BOS OR EOS OR REALCLB OR VFIN OR Inf OR GerII OR ConNeg OR VGen OR Sup OR PPRON-NOT-GEN OR Recipr OR Po OR Pr OR Pcle OR ("jed") OR Interj OR CS OR CP ;
SET SV-BOUNDARY2 = S-BOUNDARY2 OR FMAINV ;
# Syntactic sets
# --------------
LIST ALLSYNTAG = (@+FAUXV) (@+FMAINV) (@-FAUXV) (@-FMAINV) (@-FSUBJ)
(@ADV-A) (@ADV-ADV) (@ADVL) (@ActioN>) (@CC)
(@CMPND) (@CS) (@P<) (@>P)
(@HNOUN) (@INTERJ) (@MEASURE) (@NPron<) (@NQ<)
(@NUM-PRON) (@OBJ) (@OPRED) (@PCLE)
(@PCLE-COMPL) (@PrcN>) (@PronN<) (@PronN>)
(@N<) (@>N) (@SPRED)
(@SUBJ) (@SUBJ-QH) (@VOC) (@X);
# =================================== #
# =================================== #
SECTION #
# =================================== #
# Determiner mappings
# -------------------
MAP (@>N) TARGET (Dem Nom) IF (*1 Num OR A OR N BARRIER NP-BOUNDARY LINK 0 Nom) (NEGATE 1 Interr OR COMMA OR Dem);
## Mannit åhpatjit majt dá bágo mierkkiji...
MAP (@>N) TARGET (Dem Par) IF (*1 Num OR A OR N BARRIER NP-BOUNDARY LINK 0 Ela) (NEGATE 1 Interr OR COMMA OR Dem);
MAP (@>N) TARGET (Dem Sg Gen) IF (*1 Num OR A OR N BARRIER NP-BOUNDARY LINK 0 (Sg Gen) OR (Sg Ill) OR LOC + Sg)(NEGATE 1 Po);
## Gáhtjada vuossteguojmijnat såbadittjat gå ájn manojn lihppe, vaják duv ij duobmára åvddåj giese ja duobmár vávta åvddåj ja dån fáŋŋgagoahtáj bálkestuvá.
MAP (@>N) TARGET (Dem Sg Acc) IF (*1 Num OR A BARRIER NP-BOUNDARY OR (N Sg Acc) LINK 0 Acc)(NEGATE *1 CC BARRIER WORD);
## Mun lean oastán ja klipsen dáid njiŋŋelasaid.
MAP (@>N) TARGET (Dem Acc) IF (*1 (N Acc) BARRIER ADVLCASE OR VFIN);
## Jus le Jubmela Bárnne, de gåhtjo dájt giergijt lájbben sjaddat.
MAP (@>N) TARGET (Dem Attr) IF (*1 N BARRIER NP-BOUNDARY);
## Josiaj riegádij Joakin vieljatjij dan áige gå álmmugav vuolgadin Babylonaj.
MAP (@>N) TARGET (Dem Sg Par) IF (*1 (N Sg Ela) BARRIER NP-BOUNDARY);
## Dat rájes Jesus sárnnedatjáj...
## Nissun dát bájkes suv tjuorvo suostoj..
MAP (@>N) TARGET (Dem Sg Com) IF (*1 (N Sg Com) BARRIER NP-BOUNDARY);
## Duobbmobiejven Nineve almatja tjuodtjeli aktan dájna vierregijn ja sijá duobbmon sjaddá, dajna gå buorádusáv Jon sárnnedattijn dahkin...
MAP (@>N) TARGET (Dem Pl Nom) IF (*1C (N Pl Nom) BARRIER NP-BOUNDARY);
## Váidalusas galgá leat namahuvvon dat dilálašvuohta.
MAP (@>N) TARGET (Dem Pl Gen) IF (*1 (N Pl Gen) BARRIER NP-BOUNDARY);
## Bärggal de alla várráj suv doalvoj ja vuosedij sunji gájkka värálda rijkajt ja daj herlukvuodav ja javlaj.
MAP (@>N) TARGET (Dem Pl Acc) IF (*1 (N Pl Acc) BARRIER NP-BOUNDARY);
## Dat ásahuvvojedje aiddo dainna ulbmiliin, ahte...
MAP (@>N) TARGET (Dem Pl Ill) IF (*1 (N Pl Ill) BARRIER NP-BOUNDARY);
## Dat ásahuvvojedje aiddo dainna ulbmiliin, ahte...
MAP (@>N) TARGET (Dem Pl Ine) IF (*1 (N Pl Ine) BARRIER NP-BOUNDARY);
## Dat ásahuvvojedje aiddo dainna ulbmiliin, ahte...
MAP (@>N) TARGET (Dem Pl Ill) IF (*1 (N Pl Ill) BARRIER NP-BOUNDARY);
## De lassánii maid sisafárren dáidda guovlluide.
MAP (@>N) TARGET (Dem Pl Ine) IF (*1 (N Pl Ine) BARRIER NP-BOUNDARY);
## ...ahte eamiálbmotriekti sáhttá leat okta dain speadjaliin,...
MAP (@>N) TARGET (Dem Pl Ela) IF (*1 (N Pl Ela) BARRIER NP-BOUNDARY);
## ...ahte eamiálbmotriekti sáhttá leat okta dain speadjaliin,...
MAP (@>N) TARGET (Dem Pl Com) IF (*1 (N Pl Com) BARRIER NP-BOUNDARY);
## Daj ájgij Jesus javlaj..
MAP (@>N) TARGET (Dem Pl Com) IF (*1 (N Pl Com) BARRIER NOT-AA);
## Ain ferte joatkit daiguin sierra doaibmabijuiguin.
# Attribute mappings
# ------------------
# MAP (@PronN>)
MAP (@>N) TARGET (A Attr) ;
# MAP (@PrcN>)
# MAP (@ActioN>)
#MAP (@ADV-ADV) TARGET Date IF (-1 BEAIVI);
LIST JUOHKE = "juohkka" "juohke" ;
MAP (@>N) TARGET JUOHKE ;
## Galgá gávdnot divššohasbearráigeahčči juohke fylkkas.
MAP (@>N) TARGET (Pron Attr) ;
## Härrá, Härrá, ep gus mij le duv namán åvddålijsárnnum, bahás vuojŋŋanisájit duv namán vuodjelam ja edna oavddodagov duv namán dahkam?
## Gå muhtem ájgev sijá lunna lijga årrum, de...
MAP (@>Pron) TARGET Gen (1 Indef) ;
## Diján le ienep árvvo gå vájk man edna tsitsátjin.
MAP (@Pron<) TARGET (Indef Pl Nom) IF (*-1 PPRON-DU-PL OR (N Pl) LINK 0 Nom BARRIER S-BOUNDARY2)(NEGATE -1 CC OR CLB)(NEGATE 1 Rel);
##
MAP (@Pron<) TARGET (Refl Sg Nom) IF (*-1 MUN OR DON OR (Pron Sg3 Nom) OR (Pron Sg Nom) OR (N Sg Nom) BARRIER S-BOUNDARY2);
## Mån iesj lev alep åjvij vuollálasj ja doarroålmmå li muv vuollálattja.
MAP (@Pron<) TARGET (Refl Sg Nom) IF (*1C MUN OR DON OR (Pron Sg3 Nom) OR (Pron Sg Nom) OR (N Sg Nom) BARRIER NOT-ADV-PCLE);
## Gájkajis de iesj guhtik sijddasis vuolgij, valla Jesus Olijvavárráj manáj.
MAP (@Pron<) TARGET (Refl Pl Nom) IF (*-1 PPRON-DU-PL OR (N Pl) BARRIER S-BOUNDARY2 LINK 0 Nom);
## ...ja ehpit dij ietja håla, ájnat áhtjáda Vuoiŋŋanis dijá baktu.
MAP (@>Pron) TARGET (Refl Pl Nom) IF (*1 PPRON-DU-PL OR (N Pl) BARRIER NOT-ADV-PCLE LINK 0 Nom)(NEGATE *1 VFIN OR Inf BARRIER NOT-ADV-PCLE);
## Na, manen val ietja Jubmela budájit doadjebihtit ietjada njuolgadusáj diehti?
MAP (@>Pron) TARGET Recipr IF (1 Recipr);
##
MAP (@>N) TARGET Indef IF (*1 N BARRIER NPNH OR Indef)(NEGATE 0 Nom LINK 1 Acc) (NEGATE 0 ADVLCASE OR ("juoga")) (NEGATE 1 (N Sg Gen) LINK NOT 0 Px LINK *1 N BARRIER NPNH OR CC)(NEGATE 1 (N Sg Gen PxSg2) LINK *-1 (V-SG2) LINK *1 N BARRIER NPNH OR CC)(NEGATE 1 VFIN OR Ess OR ("veara"));
## Gå Jesus lij riegádam Betleheman, Judean, gånågis Herodesa ájgen, de lullet muhtem násstedåbdde Jerusalemij båhtin ja gahtjin...
#MAP (@PronN>) TARGET Indef IF (1 ("ietjá") OR Dem)(NEGATE 0 Nom LINK 1 Acc) (NEGATE 0 ADVLCASE);
## Divna dát sjattaj vaj luluj ålliduvvat mav Härrá lij profehta baktu javllam...
# The partitive construction would have been máŋggain earáin and ollu daid earáin
LIST OLLU = "ollu" "ållo" ;
LIST EARA = "ietjá" "eará" "iežá" ;
MAP (@ADVL>) TARGET Indef IF (0 OLLU)(1 EARA LINK 0 LOC + Pl OR LOC + (Dem Pl LOC))(*2 V-SG3 BARRIER NOT-ADJ-PCLE)(NEGATE 0 Nom LINK 1 Acc)(NEGATE 0 ADVLCASE);
MAP (@>ADVL) TARGET Indef IF (*-1 V-SG3 BARRIER S-BOUNDARY2 OR VFIN)(0 OLLU)(1 EARA LINK 0 LOC + Pl OR LOC + (Dem pl))(NEGATE 0 Nom LINK 1 Acc)(NEGATE 0 ADVLCASE);
## Ollu earáin lea hávski. # for habeo-constructions where ollu modifies eará+Loc
MAP (@>Pron) TARGET Indef IF (NEGATE *-1 V-SG3 BARRIER S-BOUNDARY2 OR VFIN)(0 OLLU)(1 EARA LINK 0 LOC + Pl OR LOC + (Dem Pl)) (NEGATE *2 V-SG3 BARRIER NOT-ADJ-PCLE)(NEGATE 0 Nom LINK 1 Acc)(NEGATE 0 ADVLCASE);
##
MAP (@>N) TARGET Indef IF (0 Nom)(*1 (N Nom) BARRIER NPNH) (NEGATE 0 Pl LINK 1 Inf);
## Gå dal Herodes árvvedij sån lij násstedåbddija bähtádallam, de harmmat moarádij ja gåhtjoj gåddet gájkka guovtejahkásaj ja nuorap bárnnemánájit Betleheman...
MAP (@>N) TARGET Indef IF (1 A-CASE)(NEGATE 1 ("veara"));
##
MAP (@>Num) TARGET Indef IF (NEGATE 0 ("iešguhtet") OR ADVLCASE)(1 Num);
##
LIST GAJKA = "buot" "gájka" ;
MAP (@>Pron) TARGET GAJKA IF (1 Dem OR Indef);
##
MAP (@>N) TARGET GAJKA + Pron IF (*1 N BARRIER NPNH);
##
#MAP (@PronN>) TARGET Indef IF (*1 N BARRIER NP-BOUNDARY OR REALCLB) (NEGATE *-1 ("leat") BARRIER NOT-ADV-PCLE LINK *1 Indef LINK *1 PrfPrc BARRIER VERB) (NEGATE *-1 INFV BARRIER NOT-ADV-PCLE LINK *1 Indef LINK *1 Inf BARRIER VERB)(NEGATE 0 ADVLCASE)(NEGATE 1 (Pers Gen) LINK *1 N BARRIER NOT-NP OR CLB LINK NOT 0 LOC)(NEGATE 1 Adv LINK 1 N) (NEGATE 1 (N Sg Gen) LINK *1 N BARRIER NPNH)(NEGATE 1 VFIN OR Ess OR ("veara"));
##
LIST MIJ = "mij" "mii" ;
MAP (@>SPRED) TARGET MIJ + (Interr Pl Nom) IF (*1C (N Pl Nom) BARRIER NP-BOUNDARY);
MAP (@>SPRED) TARGET MIJ + (Rel Pl Nom) IF (*1C (N Pl Nom) BARRIER NP-BOUNDARY);
##
#MAP (@PronN>) TARGET Interr IF (NEGATE 0 ("guhti"))(1 N) (NEGATE 0 ("mij") LINK NOT 1 (Pl Gen))(NEGATE 0 (Sg Nom) LINK 1 V-SG3) (NEGATE 1 Gen LINK *1 N BARRIER NPNH);
#MAP (@PronN>) TARGET Rel IF (NEGATE 0 ("guhti"))(1 N) (NEGATE 0 ("mij") LINK NOT 1 (Pl Gen))(NEGATE 0 (Sg Nom) LINK 1 V-SG3) (NEGATE 1 Gen LINK *1 N BARRIER NPNH);
## Galg anodit mav Härráj le vuornnán dahkam.
#MAP (@>N) TARGET Interr IF (0 ("guhtimusj"))(*1 LOC + Pers BARRIER NOT-PCLE);
#MAP (@>N) TARGET Rel IF (0 ("guhtimusj"))(*1 LOC + Pers BARRIER NOT-PCLE);
##
MAP (@>N) TARGET GAJKA IF (*1 (N Pl Nom) OR (N Pl Acc) BARRIER NP-BOUNDARY);
##
# Quantifier mappings
# -------------------
# MAP (QN<)
MAP (@>N) TARGET (Actio Nom) IF (-1 Gen)(1 N)(NEGATE 1 PrfPrc);
## Mannit bus Israela álmmuga láhppum sávtsaj lusi.
MAP (@Num<) TARGET MEASURE IF (-1 Num)(0 Gen);
## 5 kr.
MAP (@Num<) TARGET MEASURE IF (-1 Num)(1 ALU OR A);
##
MAP (@Num<) TARGET MEASURE IF (-1 Num)(1 Adv OR Pr);
##
MAP (@Num<) TARGET TIME IF (-1 Num)(1 ("boaris") OR ("nuorra") OR ("boares") );
##
MAP (@Num<) TARGET TIME IF (-1 Num)(1 ("maŋil") OR ("maŋis"));
##
MAP (@Num<) TARGET N IF (-1 Num)(1 ("velggolaš") OR ("velgulasj"));
##
MAP (@Num<) TARGET (N Sg Acc) IF (-1 (Num Acc))(0 MEASURE)(1 (N Acc));
##
MAP (@>N) TARGET CASE - Gen IF (0 Num LINK NOT 0 Acc LINK *1 N BARRIER NPNH) ;
MAP (@Num<) TARGET (N Gen) IF (*-1 (Num Acc) BARRIER NPNH LINK NOT 0 AKTA) ;
MAP (@>N) TARGET TITLE + Nom IF (0 Attr OR Nom)(1 Prop LINK 0 Fem OR Mal OR Sur);
# A title is nominative if it has a Nom reading at all.
SELECT (Sg Nom) IF (0 TITLE LINK NOT 0 ABBR LINK 1 Mal OR Fem OR Sur LINK NEGATE 1 CC LINK 1 Mal OR Fem OR Sur);
## Suv birra profehta Jesaja le hållam gå javlaj :
SELECT Nom IF (0 TITLE LINK NOT 0 ABBR LINK 1 Mal OR Fem OR Sur);
# Genitive mappings
# -----------------
# N Sg Gen = N Pl Nom
# N Sg Nom = N Sg Gen = N Pl Nom
# Pron Sg3 Acc = Gen
# N Sg Ela = N Sg Nom PxSg3 = N Sg Acc PxSg3 = N Sg Gen PxSg3
# N Pl Gen = N Pl Com
# N Pl Gen = N Sg Ill = N Pl Com
# Pron Pers Sg3 Gen = Pron Pers Sg3 Acc
# possible syntactic tags for Gen: @GN>, @GP>, @QN>, @ADVL, @NQ<, @GP<, @-FSUBJ?, @SPRED, @NNum>
# D: @DN>
# Indef: @PronN>
# A: @AN>
# Actio: @ActioN>
# Pronouns
# - - - - -
MAP (@>N) TARGET (Pron Sg1 Gen) IF (1 (Refl PxSg1));
##
MAP (@>N) TARGET (Pron Sg2 Gen) IF (1 (Refl PxSg2));
##
MAP (@>N) TARGET (Pron Sg3 Gen) IF (1 (Refl PxSg3));
##
MAP (@>N) TARGET (N Sg Gen) IF (1 (Refl PxSg3));
##
MAP (@>N) TARGET (Pron Du1 Gen) IF (1 (Refl PxDu1));
##
MAP (@>N) TARGET (Pron Du2 Gen) IF (1 (Refl PxDu2));
##
MAP (@>N) TARGET (Pron Du3 Gen) IF (1 (Refl PxDu3));
##
MAP (@>N) TARGET (Pron Pl1 Gen) IF (1 (Refl PxPl1));
##
MAP (@>N) TARGET (Pron Pl2 Gen) IF (1 (Refl PxPl2));
##
MAP (@>N) TARGET (Pron Pl3 Gen) IF (1 (Refl PxPl3));
##
# Nouns (mostly)
# - - - - - - - -
MAP (@>P) TARGET Gen IF (1C Po OR (Po ADVLCASE) LINK NOT *1 Gen BARRIER NPNH);
## ..., lågenanniellja buolva Davida rájes Babylona fáŋŋgavuoda rádjáj ja lågenanniellja buolva fáŋŋgavuoda rájes Kristusa rádjáj.
MAP (@>N) TARGET Gen IF (0 (N Pl))(NEGATE 0 Px OR TIME)(1 Nom);
MAP (@>P) TARGET Gen IF (NEGATE 0 Num LINK 1 Ill)(1 Po);
##
LIST DIHTE = "diehti" "dihte" ;
MAP (@>P) TARGET Gen IF (NEGATE 0 Num LINK 1 Ill) (NEGATE 0 (V Actio) LINK 1 DIHTE)(1 PUNCT-LEFT LINK *1 PUNCT-RIGHT LINK 1 Po);
##
MAP (@>P) TARGET Gen IF (NEGATE 0 RCmpnd)(1 CC)(*2 Gen BARRIER NPNHA LINK 1 Po) (NEGATE 0 (V Actio) LINK 1 CC LINK 1 (V Actio) LINK 1 DIHTE);
##
MAP (@>P) TARGET Gen IF (NEGATE 0 RCmpnd)(1 COMMA)(*2 Gen BARRIER NPNHA LINK 1 CC LINK *1 Gen BARRIER NPNHA LINK 1 Po) (NEGATE 0 (V Actio) LINK 1 CC LINK 1 (V Actio) LINK 1 DIHTE);
##
MAP (@>P) TARGET Gen IF (1 (Neg Foc))(2 Gen)(3 Po);
##
MAP (@>P) TARGET Gen IF (0 TIME OR AIGODAT)(1 Num)(2 Po);
##
MAP (@P<) TARGET Gen IF (*-1 Pr BARRIER NOT-NP OR CLB)(NEGATE 1 (N Gen)) (NEGATE 0 TIME LINK *-1 Po BARRIER NP-BOUNDARY LINK -1 Gen);
## Sån ham biejves buorij ja baháj badjel mårijdahttá ja rievtesferdugij ja vádnarievtesferdugij nal rássjodahttá.
MAP (@P<) TARGET Gen IF (*-1 CC BARRIER S-BOUNDARY2 LINK *-1 GASKAL BARRIER S-BOUNDARY2)(1 NP-BOUNDARY);
##
MAP (@P<) TARGET (Pl Gen) IF (*-1 GASKAL BARRIER NOT-NP LINK NOT -1 (Pl Gen)) (1 NP-BOUNDARY);
##
MAP (@>N) TARGET Gen IF (0 MANNU)(1 Ord);
##
#MAP (@>N) TARGET Gen IF (0 TIME OR AIGODAT OR ROUTE)(NEGATE 1 CC)(NEGATE 0 VAHKKU LINK 1 CARDINALS) (*1 N BARRIER NP-BOUNDARY OR REALCLB OR Po OR Pr);
##
LIST BIEJVVE = "biejvve" "beaivi" "b" ;
MAP (@ADVL @>N) TARGET Gen IF (-2 Gen LINK 0 MANNU)(-1 Ord)(0 BIEJVVE);
##
MAP (@ADVL>) TARGET Gen IF (0 TIME OR ROUTE)(*1 FMAINV BARRIER S-BOUNDARY2);
MAP (@) TARGET Gen IF (1 (Actio Gen))(NEGATE 1 N)(2 N) ;
##
MAP (@-FSUBJ>) TARGET Gen IF (1 Ger);
## Valla Petrus gájkaj guládijn vuornoj ja javlaj.
MAP (@-FSUBJ>) TARGET Gen IF (NEGATE 0 TIME OR ROUTE)(1 VAbess);
##
MAP (@-FSUBJ>) TARGET Gen IF (*-1 REALCOPULAS BARRIER NPNHA)(1 (V Actio Ela));
##
MAP (@>A) TARGET Gen IF (*-1 COPULAS BARRIER S-BOUNDARY2 OR VERB)(1 (A Comp)) (NEGATE 1 N);
## ... nåv sjaddá avtat ájnna buorádusdahkke suddáris stuoráp ávvo almen, gå aktselåkavtset rievtesferdugis gudi e buorádusáv dárbaha dahkat.
MAP (@>A) TARGET Gen IF (1 (A Comp))(*2 COPULAS BARRIER S-BOUNDARY2 OR VERB OR CC LINK NOT *1 FMAINV BARRIER S-BOUNDARY2);
##
MAP (@>A) TARGET Gen IF (1 (A Comp))(NEGATE 1 VERB OR Adv)(NEGATE *2 N BARRIER NP-BOUNDARY);
##
MAP (@>A) TARGET Gen IF (0 MEASURE)(1 A);
##
MAP (@>A) TARGET ("mierre" Gen) IF (-1 (Pron Dem Sg Gen))(1 A);
##
# Habitive mappings
MAP (@HAB) TARGET HAB-ACTOR ((0 HAB-CASE LINK 1 REALCOPULAS LINK *1 (N Nom) OR (Indef Nom) BARRIER NPNHAI) OR (0 HAB-CASE + LINK *1 (N Nom) OR (Indef Nom) BARRIER NPNHAI)) ;
MAP (@>N) TARGET Gen IF (NEGATE -1 NUMERALS LINK 0 Nom) (NEGATE 0C ALU OR RCmpnd OR Num)(*1 N OR Actio BARRIER NOT-NP OR REALCLB OR Indef LINK NOT 0 GerII) (NEGATE 1 PUNCT LINK 1 CC)(NEGATE 1 Inf) (NEGATE 1 CC LINK *1 Gen BARRIER NOT-NP LINK 1 Po) (NEGATE 1 COMMA LINK 1 Gen LINK 1 CC LINK 1 Gen LINK 1 Po) (NEGATE 1 CARDINALS LINK 0 ADVLCASE) (NEGATE 0 Actio LINK 1 DIHTE);
###
MAP (@>N) TARGET Gen IF (NEGATE -1 NUMERALS LINK 0 Nom) (NEGATE 0 ALU OR RCmpnd OR Num) (1 COMMA)(2 Rel LINK *1 COMMA LINK *1 N BARRIER NOT-NP OR REALCLB) (NEGATE 1 PUNCT LINK 1 CC) (NEGATE 1 CC LINK *1 Gen BARRIER NOT-NP LINK 1 Po) (NEGATE 1 COMMA LINK 1 Gen LINK 1 CC LINK 1 Gen LINK 1 Po) (NEGATE 0 Actio LINK 1 DIHTE);
##
MAP (@>N) TARGET Gen IF (-2 ("s") OR ("siidu") OR ("sijddo") OR ("paragráfa") OR ("paragráffa") OR ("kapihttal") OR ("kapihtal") OR HEADOFPARTS OR ("jahki") OR ("jahke") OR GIESSEK LINK 1 CARDINALS)(*1 N BARRIER NOT-ADJ);
## 8
MAP (@>N) TARGET Gen IF (NEGATE -1 NUMERALS LINK 0 Num) (NEGATE 0 ALU OR Num OR RCmpnd)(*1 N BARRIER NOT-AA OR CLB)(NEGATE 1 Inf);
##
MAP (@>A) TARGET Gen IF (1C A)(1 (Sg LOC))(2C NP-BOUNDARY); # (NEGATE 0 Interr OR ALU)
##
MAP (@Pron<) TARGET (N Pl Gen) IF (-1 MIJ + Interr OR ("mihkkege") OR ("guhti"));
## Maid ipmašiid doppe dagat?
# Appositions
# -----------
SET APP-BOUNDARY = REALCLB OR VFIN OR Inf OR GerII OR ConNeg OR VGen OR Sup OR Recipr OR Po OR Pr OR Pcle OR Interj OR CS OR CP ;
LIST DÅPPE = "dáppe" "dåppe" "ålggon" "badjin" "bajil" "dakko" "dá" "dákko" "dáppe" "diekko" "dieppe" "do" "dokko" "doppe" "duo" "duokko" "duoppe" "olgun" ;
# Adverbs with a inessive form, but don´t get Ine or Loc as a tag.
LIST DÅHKU = "diehki" "dåhku" "ålgus" "bajás" "deike" "diehke" "diehko" "dohko" "duohko" "lulás" "olggos" "ruoktot" "sisa" "vuovdimassii" ;
LIST PAST-MARKER = "iektu" "uddni" ("mánná" Ess) "dalle" "diibmá" "dolin" "dološ" "dovle" "duvle" "eske" "gieskat" "ikte" ("nuorra" Ess) "ovdal" ("ovddit#beaivi" Gen) ("vássán#áigi" Loc) ("boares#áigi" Gen) ;
LIST PRESENT-MARKER = "dálla" "dálle" "ådnå" "dál" "ihttin" "odne" "otne" ("boahtte#áigi" Loc) ("boahtte#áigi" Gen) ;
SET TIME-MARKER = PAST-MARKER OR PRESENT-MARKER ;
LIST OTHER-TIME-ADV = "árabuš" "árrat" "easkka" "guhká" ("guhkit" Adv) "maŋemustá" "maŋŋel" "maŋŋelaš" "maŋŋeleappos" "maŋŋit" "muhtumin" "ovdal" ;
SET TIME-ADV = TIME-MARKER OR OTHER-TIME-ADV OR GIESSEK;
MAP (@APP-N<) TARGET (Num Nom) IF (-1 (Prop Sur Nom) LINK -1 ("\("))(1 COMMA LINK 1 ("s") LINK 1 CARDINALS LINK 1 ("\)"));
#Simonsen 1959, s. 45)
MAP (@APP-N<) TARGET Num IF (-1 BIEJVVE LINK -1 Ord LINK -1 MANNU);
## Mun boađán geassemánu 16. b. 2002.
MAP (@APP-N<) TARGET Num IF (-2 Ord)(-1 MANNU);
## 23. cuoŋománu 1728 dovddus geaskkus lea ee. celkon ahte mearraguollebivdu lea luđolaš earret"
MAP (@APP-N<) TARGET (Num Nom) IF (-1 Nom LINK 0 MANNU)(0 CARDINALS);
MAP (@APP-N<) TARGET (Num Nom) IF (-1 LOC LINK 0 MANNU)(0 CARDINALS);
## Guovdageaidnu / Kautokeino, skábmamánnu 2002.
## Bargojoavkku čoahkkima árvalus ovddiduvvo konvenšuvnna oktasaščoahkkimis guovvamánus 2004.
MAP (@APP-N<) TARGET (Num Nom) IF (-1 Gen LINK 0 MANNU)(0 CARDINALS)(1 Po);
## Mun oaivvildan leat liiggás oanehis áiggi árvvoštallat klieantalávdegotti ođđajagimánus čakčamánu 1999 rádjái, (9 mánu).
MAP (@APP-N< @SUBJ @SPRED @HNOUN) TARGET (Num Nom) IF (-1 MANNU LINK NOT 0 Nom)(0 CARDINALS);
MAP (@APP-N<) TARGET (Num Nom) IF (-2 BOS OR (PUNCT LEFT))(-1 KLASS LINK 0 Nom);
## Ášši 07/00 Sámedikki 1999 jahkedieđáhus.
MAP (@APP-N<) TARGET Acc IF (-1 MEASURE LINK -1 Num LINK *-1 V-TRANS-ACT-NOT-ACT BARRIER S-BOUNDARY2 OR VERB) ;
## Juohke heasta borrá sullii 6 kilu suinniid beaivái.
MAP (@APP-N<) TARGET (N Gen) IF (*-1 COMMA BARRIER APP-BOUNDARY OR ADVLCASE LINK -1 Gen)(1 COMMA LINK 1 N LINK NOT 0 Gen) ;
MAP (@APP-N<) TARGET (N Gen) IF (*-1 COMMA BARRIER APP-BOUNDARY OR ADVLCASE LINK -1 Gen)(1 CC LINK **1 Gen BARRIER VERB LINK 1 COMMA LINK 1 N LINK NOT 0 Gen) ;
## Dát lea Jesus Kristusa, Dávveda bártni ja Abrahama bártni, sohka.
MAP (@APP-ADVL<) TARGET LOC + N IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE LINK -1 DÅPPE)(1 EOS) ;
MAP (@APP-ADVL<) TARGET (N Ill) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 DÅHKU LINK *-1 BOS BARRIER APP-BOUNDARY)(1 COMMA) ;
MAP (@APP-ADVL<) TARGET (N Gen) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 TIME-MARKER OR TIME-ADV OR BEAIVI)(0 TIME LINK 0 Gen)(1 EOS);
## Mun vuolggán ihttin, bearjadaga.
## Doppe son orui guhká, vihtta jagi.
MAP (@APP-ADVL<) TARGET Pr IF (*-1 COMMA BARRIER NOT-ADV LINK -1 TIME-ADV OR TIME-MARKER OR TIME)(*1 (N Gen) OR (Pers Gen) BARRIER NPNH LINK 1 EOS);
MAP (@APP-ADVL<) TARGET Pr IF (*-1 COMMA BARRIER NOT-ADV LINK -1 TIME-ADV OR TIME-MARKER OR TIME LINK -1 BOS)(*1 (N Gen) OR (Pers Gen) BARRIER APP-BOUNDARY OR CC LINK 1 COMMA);
## Dolin, ovdal soađi, olbmot lávejedje vuovdit joŋaid.
MAP (@APP-ADVL<) TARGET Po IF (-1 Gen LINK *-1 COMMA BARRIER NOT-ADV LINK -1 TIME-ADV OR TIME-MARKER OR TIME LINK -1 BOS)(1 COMMA);
MAP (@APP-ADVL<) TARGET (Po) IF (-1 Gen LINK *-1 COMMA BARRIER NOT-ADV LINK -1 TIME-ADV OR TIME-MARKER OR TIME)(1 EOS);
## Maid sii geavahedje guhkit, gitta 1960-logu rádjai.
MAP (@APP-N<) TARGET (N Nom) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE OR Ess LINK -1 (N Nom))(1 EOS) ;
MAP (@APP-N<) TARGET (N Nom) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE OR Ess LINK -1 (N Nom))(1 COMMA LINK 1 S-BOUNDARY2) ;
MAP (@APP-Pron<) TARGET (N Nom) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE OR Ess LINK -1 (Pron Nom))(1 EOS) ;
MAP (@APP-Pron<) TARGET (N Nom) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE OR Ess LINK -1 (Pron Nom))(1 COMMA LINK 1 S-BOUNDARY2) ;
## Mon lean Will Turner, Sáppatbátti Turnera bárdni!
MAP (@APP-N<) TARGET (Prop Nom) IF (-1 HUMAN + Nom LINK -1 BOC2)(1 VFIN);
MAP (@APP-N<) TARGET (N Acc) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR (N Nom) LINK -1 (N Acc) LINK NOT *-1 COMMA BARRIER APP-BOUNDARY OR CC)(1 EOS) ;
MAP (@APP-N<) TARGET (N Acc) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR (N Nom) LINK -1 (N Acc) LINK NOT *-1 COMMA BARRIER APP-BOUNDARY OR CC)(1 COMMA LINK 1 S-BOUNDARY2) ;
MAP (@APP-Pron<) TARGET (N Acc) IF (*-1 COMMA BARRIER APP-BOUNDARY OR @CVP OR (N Nom) LINK -1 (Pron Acc) LINK NOT *-1 COMMA BARRIER APP-BOUNDARY OR CC)(1 EOS) ;
MAP (@APP-Pron<) TARGET (N Acc) IF (*-1 COMMA BARRIER APP-BOUNDARY OR @CVP OR (N Nom) LINK -1 (Pron Acc) LINK NOT *-1 COMMA BARRIER APP-BOUNDARY OR CC)(1 COMMA LINK 1 S-BOUNDARY2 OR ("dan_diehti") OR ("dan_dihte")) ;
## Oidnet go Mihkkala, min nuoramus bártni?
## Mon oainnán fierpmi, su mearkka, ja dieđán ahte Spider-Man lea leamaš das.
MAP (@APP-N<) TARGET LOC + N IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE LINK -1 LOC + N)(1 EOS) ;
MAP (@APP-N<) TARGET LOC + N IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE LINK -1 LOC + N)(1 COMMA LINK 1 S-BOUNDARY2 OR Adv) ;
MAP (@APP-N<) TARGET (N Ela) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE LINK -1 (N Ela))(1 EOS) ;
MAP (@APP-N<) TARGET (N Ela) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE LINK -1 (N Ela))(1 COMMA LINK 1 S-BOUNDARY2 OR Adv) ;
MAP (@APP-Pron<) TARGET LOC + N IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE LINK -1 LOC + Pron)(1 EOS) ;
MAP (@APP-Pron<) TARGET LOC + N IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE LINK -1 LOC + Pron)(1 COMMA LINK 1 S-BOUNDARY2 OR Adv) ;
MAP (@APP-Pron<) TARGET (N Ela) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE LINK -1 (Pron Ela))(1 EOS) ;
MAP (@APP-Pron<) TARGET (N Ela) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC OR ADVLCASE LINK -1 (Pron Ela))(1 COMMA LINK 1 S-BOUNDARY2 OR Adv) ;
## Ánde orru Oslos, Norgga oaivegávpogis.
MAP (@APP-N<) TARGET (N Ill) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (N Ill))((1 EOS) OR (*1 LOC LINK 1 EOS)) ;
MAP (@APP-N<) TARGET (N Ill) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (N Ill))(1 COMMA LINK 1 S-BOUNDARY2) ;
MAP (@APP-Pron<) TARGET (N Ill) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (Pers Ill))(1 EOC2 OR COMMA) ;
#MAP:1 (@APP-Pron<) TARGET (N Ill) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (Pers Ill))(*1 COMMA BARRIER NOT-QMARK LINK *1 S-BOUNDARY2 BARRIER NOT-QMARK) ;
## Dan mun muitalan dušše dutnje, mu buoremus olbmái.
MAP (@APP-N<) TARGET (N Ill) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (N Ill) LINK *-1 BOS BARRIER APP-BOUNDARY)(1 COMMA) ;
MAP (@APP-Pron<) TARGET (N Ill) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (Pron Ill) LINK *-1 BOS BARRIER APP-BOUNDARY)(1 COMMA) ;
## Dutnje, mu buori ustibii, mun muitalan buot.
MAP (@APP-N<) TARGET (N Com) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (N Com))(1 EOS) ;
MAP (@APP-N<) TARGET (N Com) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (N Com))(1 COMMA LINK 1 S-BOUNDARY2 OR Adv) ;
## Mun hupmen Máhte-Iŋggáin, Niillas-Máhte eamidiin.
MAP (@APP-Pron<) TARGET (N Com) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (Pron Com))(1 EOS) ;
MAP (@APP-Pron<) TARGET (N Com) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (Pron Com))(1 COMMA LINK 1 S-BOUNDARY2 OR Adv) ;
MAP (@APP-N<) TARGET (N Nom) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (N Nom) LINK *-1 BOC2 BARRIER APP-BOUNDARY)(1 COMMA LINK 1 VFIN) ;
MAP (@APP-Pron<) TARGET (N Nom) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (Pron Nom) LINK *-1 BOS BARRIER APP-BOUNDARY)(1 COMMA LINK 1 VFIN) ;
## Will Turner, Sáppatbátti Turnera bárdni, lea boahtán.
MAP (@APP-N<) TARGET LOC + N IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 LOC + N LINK *-1 BOS BARRIER APP-BOUNDARY)(1 COMMA LINK 1 VFIN) ;
MAP (@APP-Pron<) TARGET LOC + N IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 LOC + Pron LINK *-1 BOS BARRIER APP-BOUNDARY)(1 COMMA LINK 1 VFIN) ;
MAP (@APP-N<) TARGET (N Ela) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (N Ela) LINK *-1 BOS BARRIER APP-BOUNDARY)(1 COMMA LINK 1 VFIN) ;
MAP (@APP-Pron<) TARGET (N Ela) IF (*-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (Pron Ela) LINK *-1 BOS BARRIER APP-BOUNDARY)(1 COMMA LINK 1 VFIN) ;
## Romssas, Davvi-Norgga stuorimus gávpogis, leat vaikko man ollu studeanttat.
MAP (@APP-N<) TARGET (N Nom) IF (-1 (N Gen) OR (Pers Gen) LINK *-1 CC BARRIER APP-BOUNDARY LINK -1 (N Gen) OR (Pers Gen) LINK *-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (N Nom))(1 EOS) ;
MAP (@APP-N<) TARGET (N Nom) IF (-1 (N Gen) OR (Pers Gen) LINK *-1 CC BARRIER APP-BOUNDARY LINK -1 (N Gen) OR (Pers Gen) LINK *-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (N Nom))(1 COMMA BARRIER S-BOUNDARY2) ;
MAP (@APP-Pron<) TARGET (N Nom) IF (-1 (N Gen) OR (Pers Gen) LINK *-1 CC BARRIER APP-BOUNDARY LINK -1 (N Gen) OR (Pers Gen) LINK *-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (Pron Nom))(1 EOS) ;
MAP (@APP-Pron<) TARGET (N Nom) IF (-1 (N Gen) OR (Pers Gen) LINK *-1 CC BARRIER APP-BOUNDARY LINK -1 (N Gen) OR (Pers Gen) LINK *-1 COMMA BARRIER APP-BOUNDARY OR CC LINK -1 (Pron Nom))(1 COMMA LINK 1 S-BOUNDARY2 OR ("dan_diehti") OR ("dan_dihte")) ;
#MAP (@APP-N<) TARGET (N Nom) IF (*-1 ("nugo") OR ("sihke") BARRIER APP-BOUNDARY LINK -1 COMMA LINK -1 (N Nom))(1 EOS) ;
#MAP (@APP-Pron<) TARGET (N Nom) IF (*-1 ("nugo") OR ("sihke") BARRIER APP-BOUNDARY LINK -1 COMMA LINK -1 (Pron Nom))(*1 EOS BARRIER APP-BOUNDARY) ;
## Návetgoađis ledje ealut, nugo sávzzat, gáiccat ja gusat.
#MAP (@APP-N<) TARGET (N Nom) IF (*-1 ("nugo") OR ("sihke") BARRIER APP-BOUNDARY LINK -1 COMMA LINK -1 (N Nom) LINK *-1 BOS BARRIER APP-BOUNDARY)(*1 COMMA BARRIER APP-BOUNDARY LINK 1 VFIN) ;
#MAP (@APP-Pron<) TARGET (N Nom) IF (*-1 ("nugo") OR ("sihke") BARRIER APP-BOUNDARY LINK -1 COMMA LINK -1 (Pron Nom) LINK *-1 BOS BARRIER APP-BOUNDARY)(*1 COMMA BARRIER APP-BOUNDARY LINK 1 VFIN) ;
## Mu vánhemat, sihke áhčči ja eadni, leaba jápmán.
#MAP (@APP-N<) TARGET (N Acc) IF (*-1 ("nugo") OR ("sihke") BARRIER APP-BOUNDARY LINK -1 COMMA LINK -1 (N Acc) LINK *-1 BOS BARRIER APP-BOUNDARY)(*1 COMMA BARRIER APP-BOUNDARY) ;
#MAP (@APP-Pron<) TARGET (N Acc) IF (*-1 ("nugo") OR ("sihke") BARRIER APP-BOUNDARY LINK -1 COMMA LINK -1 (Pron Acc) LINK *-1 BOS BARRIER APP-BOUNDARY)(*1 COMMA BARRIER APP-BOUNDARY) ;
## Muhtun sámi biktasiid, nugo gápmagiid ja vuoddagiid, sii geavahedje guhkit, gitta 1960-logu rádjai.
#SELECT (@APP-N<) IF (*-1 COMMA BARRIER APP-BOUNDARY LINK -1 SUBJ OR SPRED)(1 COMMA OR EOS)(NEGATE *-1 ("sihke") OR ("nugo") LINK -1 VERB) ;
#SELECT (@APP-Pron<) IF (*-1 COMMA BARRIER APP-BOUNDARY LINK -1 SUBJ OR SPRED)(1 COMMA OR EOS)(NEGATE *-1 ("sihke") OR ("nugo") LINK -1 VERB) ;
## Mu viellja, Tore, sáhttá boahtit deike.
## Mon lean Will Turner, Sáppatbátti Turnera bárdni!
SELECT:r3306 (@APP-N<) IF (-1 MEASURE LINK -1 Num LINK *-1 V-TRANS-ACT-NOT-ACT BARRIER SV-BOUNDARY2) ;
## Juohke heasta borrá sullii 6 kilu suinniid beaivái.
MAP (@HNOUN) TARGET (N Nom) IF (*-1 BOS BARRIER V)(NOT 0 )(*1 EOS BARRIER V);
MAP (@OPRED>) TARGET Ess IF (NOT 0 ESS-ADVL-N LINK *1 OPREDV BARRIER S-BOUNDARY2);
MAP (@ BARRIER NOT-ADV-PCLE)) ;
MAP (@) TARGET (Interr Nom) (*1 COPULAS BARRIER NOT-ADV-PCLE LINK 0 FMAINV LINK *1 NP-HEAD-NOM BARRIER NPNH) ;
## Guhtis le muv ieddne ja gudi li muv vielja?
MAP (@SPRED>) TARGET (A Nom) (*1 REALCOPULAS BARRIER NOT-ADV-PCLE LINK 0 FMAINV LINK 1 NP-HEAD-NOM) ;
MAP (@SPRED>) TARGET (A Nom) (1 REALCOPULAS LINK 0 VFIN LINK *1 Inf BARRIER NOT-ADV); #XX
MAP (@SPRED>) TARGET Ess IF (NOT 0 ESS-ADVL-N LINK *1 FMAINV BARRIER S-BOUNDARY2);
MAP (@) TARGET (Indef Nom) (NOT 0 ESS-ADVL-N LINK *1 ESSV BARRIER S-BOUNDARY2);
MAP (@) TARGET (N Nom)(*-1 COMMA OR S-BOUNDARY2 BARRIER NPNH)(*1 VFIN BARRIER NOT-ADV-PCLE LINK 0 REALCOPULAS LINK 1 EOC2);
MAP (@) TARGET (Sg Nom) IF (*1 (V Sg3) BARRIER VFIN OR S-BOUNDARY2);
MAP (@SUBJ>) TARGET (Pl Nom) IF (*1 (V Pl3) BARRIER VFIN OR S-BOUNDARY2);
MAP (@) TARGET (Sg Nom) IF (*1 Rel BARRIER WORD LINK *1 VFIN LINK *1 (V Sg3) BARRIER VFIN OR S-BOUNDARY2 OR Nom);
MAP (@SUBJ>) TARGET $$PERSONNUMBER + (Pers Nom) IF (*1 $$PERSONNUMBER + V BARRIER VFIN OR S-BOUNDARY2 LINK NOT 0 ConNeg);
MAP (@) TARGET (Rel Nom) (*-1 BOS BARRIER VFIN) ;
#MAP (@SUBJ) TARGET (N Nom) (NEGATE *-1 COPULAS BARRIER SV-BOUNDARY2)(NEGATE 0 Gen OR Px)(1 (":") LINK *1C Nom);
# ## Jesus Kristusa, Davida bárne, Abrahama bárne máddo: Abrahamaj riegádij Isak, Isakij Jakob,...
#
#SELECT (@SUBJ) IF (NEGATE *-1 COPULAS BARRIER SV-BOUNDARY2)(*-1C VFIN BARRIER SV-BOUNDARY2 LINK 0 Sg3)(0 (N Sg Nom))(NEGATE 0 Gen OR Px)(NEGATE *1 COPULAS BARRIER SV-BOUNDARY2);
# ## Elihudaj riegádij Elasar, Elasaraj Mattan, Mattanij Jakob, ja Jakobij riegádij Josef, Maria ålmåj.
#
#SELECT (@SUBJ) IF (-1 (@CNP) LINK -1C (@SUBJ))(0 N)(NEGATE 0 Gen OR Px);
# ## De dal gádjusibme ja fábmo ja rijkka Jubmelij gullu ja viellde sunji gev le vuojddam.
#
## subject coordination/appositions
## - - - - - - - - - - - - - - - - -
#
#SELECT (@SUBJ) IF (*-1 COMMA BARRIER NPNH LINK -1C (@SUBJ))(1 COMMA)(2C (Rel @SUBJ));
# ## Josef, suv ålmåj, guhti lij rievtesmielak, ittjij sidá suv hehpaduhttet ja áigoj sujsta suolev sirádit.
#
## object predicate
## ----------------
#
#SELECT (@OPRED) IF (*-1 (@OBJ) BARRIER S-BOUNDARY2 OR PUNCT LINK NOT 0 Dem)(*-1 OPREDV BARRIER SV-BOUNDARY2)(NEGATE 0 Gen LINK *1 N BARRIER NPNH)(NEGATE 0 Interr OR TIME OR ROUTE) (NEGATE 0 Num LINK 1 ROUTE OR TIME)(NEGATE 1 (TV Actio) LINK NOT *1 (@OBJ) BARRIER S-BOUNDARY2);
# ## Sån gåhttju suv Jesusin.
#
#SELECT (@OPRED) IF (*-1 (@OBJ) BARRIER S-BOUNDARY2 OR Nom)(0 Ess);
# ## Dån galga suv Jesusin gåhttjot.
#
#SELECT (@SPRED) IF (*-1 COPULAS BARRIER VERB LINK 0 Sg3 LINK NOT *-1 Ine BARRIER NOT-ADV-PCLE)(0 A)(NEGATE 0 Attr LINK 1 N)(NEGATE 0 Gen OR Px)(NEGATE *1 PrfPrc BARRIER NOT-ADV-PCLE);
# ## Josef, suv ålmåj, guhti lij rievtesmielak, ittjij sidá suv hehpaduhttet ja ájgoj sjsta suolev sirádit.
#
##REMOVE (@SPRED) IF (*-1 REALCOPULAS BARRIER NOT-ADV-PCLE OR ("degu"))(*1 PrfPrc BARRIER NOT-ADV-PCLE LINK NOT 0 Pass);
# ##
#SELECT (@SPRED) IF (*-1 BOS OR CLB OR PUNCT BARRIER NOT-CC)(0 A)(1 (Pers Nom) OR (Rel Nom));
#SELECT (@SPRED) IF (*-1 BOS OR CLB OR PUNCT BARRIER NOT-CC)(0 ("sáluk"))(1 (N Nom));
# ## Sálugin gudi rievtesferdukvuodav nälggu ja gåjkki, sij galliduvvi.
# ## Sálugin ármmogisá, sij ármmogisvuodav oadtju.
#
#MAP (@SPRED) TARGET Nom IF (NEGATE 0 ("tijmma") OR Adv LINK *1 Num BARRIER NP-BOUNDARY OR COMMA LINK 1 Num LINK *1 MEASURE LINK 1 ALU) (NEGATE 0 Num LINK *-1 ("tijmma") BARRIER NP-BOUNDARY) (NEGATE 0 (Prop Nom) LINK 1 ORGANIZATION)(NEGATE 0 GerII OR ESS-ADVL-N OR Num);
MAP (@ADVL>) TARGET TIME OR ROUTE (0 Gen OR Acc)(*1 FMAINV BARRIER S-BOUNDARY2) ;
MAP (@) TARGET (Num Acc)(*1 TIME OR ROUTE BARRIER NPNH LINK 0 Gen LINK *1 FMAINV BARRIER S-BOUNDARY2) ;
MAP (@) TARGET Acc IF (*1 (Actio Ela) BARRIER NP-BOUNDARY)(0 NP-HEAD-ACC);
MAP (@-FOBJ>) TARGET Acc IF (1 Inf OR Sup OR Ger LINK NOT 0 @-FMAINV);
MAP (@OBJ>) TARGET Acc (NOT 0 TIME OR ROUTE)(*1 FMAINV + TV BARRIER S-BOUNDARY2 OR COMMA) ;
MAP (@) TARGET Acc (NOT 1 EOS) ;
MAP (@CS) TARGET ("dan_diehti") OR ("dan_dihte") (1 CS) ;
MAP (@) TARGET ADVLMAPPING IF (NOT *-1 FMAINV BARRIER S-BOUNDARY2);
MAP (@ADVL>) TARGET ADVLMAPPING IF (*1 FMAINV BARRIER S-BOUNDARY2);
MAP (@) TARGET Actio IF (0 Ill OR LOC OR Ela OR Com LINK *1 FMAINV BARRIER S-BOUNDARY2);
MAP (@ADVL) TARGET Ess IF (0 Num) ;
MAP (@ADVL) TARGET Ess IF (0 ESS-ADVL-N);
# Other mappings
# --------------
# Default mapping
# ---------------
MAP (@X) TARGET WORD ;
# Cleaning up gerunds
SELECT VAbess (-1 TIME + Gen)(1 COPULAS LINK 1 PrfPrc) ;
## Gå nielljalåk biejve ja nielljalåk ijá båråk lij viessum, de vijmak nälggáj.
SELECT VFIN (-1 COMMA LINK -1 @VOC)(*1 EOS BARRIER VFIN) ;
## Man huohppelasj la dån, Tore, javlaj Ámmá munji.
REMOVE (@X) ;
# ===================== #
# Global rules: cycle 4 #
# ===================== #
SECTION #
# ===================== #
# Here we have some rules that scan the whole domain.
# We must consider whether they should be integrated earlier or not.
# P complements
# -------------
REMOVE (@P<) IF (NEGATE *-1 Pr BARRIER NPNH);
# Q complements
# -------------
REMOVE (@NQ<) IF (NEGATE *-1 Num BARRIER VFIN);
#Incomplete barrier.
REMOVE (@>N) IF (*-1 Num BARRIER NPNH)(0 (@Num<))(NEGATE *1 N BARRIER NPNH);
## Muhtem nissun, lågenanguokta jage varddemijs bijnástuvvam, ...
# Late rules
SELECT VFIN IF (NEGATE *-1 VFIN BARRIER CLB)(NEGATE *1 VFIN BARRIER CLB OR @CVP);
## - Vuorde dal ájn.
## Åro sjávot desik lav tjielggim.
SECTION #
SECTION #
REMOVE (@X) ;
#=====#
END #
#=====#