-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathapertium-fao-isl.isl-fao.rlx
607 lines (443 loc) · 25.5 KB
/
apertium-fao-isl.isl-fao.rlx
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
###############################################################################
#
# This is a partial conversion of the rule file from the IceTagger
# part-of-speech tagger for Icelandic by Hrafn Loftsson, along with
# some hacked up rules from Trond Trosterud's Faroese CG and some of
# our very own home-brew crack.
#
###############################################################################
SOFT-DELIMITERS = "<,>" ;
DELIMITERS = "<.>" "<:>" "<!>" "<?>" "<|>" "<$.>" "<$:>" "<$!>" "<$?>" "<$|>";
LIST BOS = (>>>) (<s>) (sent) sent ;
LIST EOS = (<<<) (</s>) (sent) sent ;
LIST CLB = (sent) (cnjsub) (cm) (rel) (cnjcoo);
LIST Coma = (cm);
LIST N = (n) ;
LIST Num = (num) ("þúsund" n) ("milljón" n) ("milljarður" n) ("hundrað" n);
LIST ProperNom = (np) ;
LIST Adj = (adj) ;
LIST Weak = (vei) ;
LIST Strong = (sta) ;
LIST Adv = (adv) ;
LIST PersPron = (prn p1) (prn p2) (prn p3) ;
LIST IndefPron = (prn ind);
LIST DemPron = (prn dem) ;
LIST Refl = (prn ref) ;
LIST InterrPron = (prn itg) ;
LIST PossPron = (prn pos) ;
LIST Pron = (prn);
LIST Prep = (pr) ;
LIST Participle = (pp) (supn);
LIST PP = (actv pp) ;
LIST Inf = (inf) ;
LIST VerbInf = (vblex inf) ;
LIST VerbSpecAux = (vaux) ;
LIST VerbAux = (vaux) (vbhaver) (vbser) ("verða" vblex) ("geta" vblex); ## check verða = aux ?
LIST VerbSupine = (vblex supn) ;
LIST VerbBe = (vbser) ;
LIST Verb = (vblex) (vbser) (vbhaver) (vaux);
LIST TempsFin = (pri) (past) (prs) (pss);
LIST TempsIrreal = (prs) (pss);
LIST Rel = (rel) ;
LIST Conj = (cnjcoo) (cnjadv) (cnjsub) ;
LIST CC = (cnjcoo) ;
LIST CS = (cnjsub) ;
LIST Exclamation = (ij) ;
LIST Article = (def) ;
LIST Det = (det) ;
LIST Interj = (itg) ;
LIST Def = (def) ;
LIST Indef = (ind) ;
LIST Fem = (f);
LIST Msc = (m);
LIST Neu = (nt);
LIST Sg = (sg);
LIST Pl = (pl);
LIST Nom = (nom);
LIST Gen = (gen);
LIST Acc = (acc);
LIST Dat = (dat);
LIST Inf = (inf);
LIST GenPrep = "án"ri "auk"ri "austan"ri "innan"ri "í staö"ri "meðal"ri "megin"ri "milli"ri "millum"ri
"neðan"ri "norðan"ri "ofan"ri "sakir"ri "sunnan"ri "sökum"ri "til"ri "utan"ri "vegna"ri "vestan"ri ;
LIST AccPrep = "fyrir ofan"ri "gegnum"ri "kringum"ri "um"ri "umfram"ri "umhverfis"ri ;
LIST DatPrep = "að"ri "af"ri "andspænis"ri "ásamt"ri "frá"ri "gagn"ri "gagnvart"ri "gegnt"ri "handa"ri
"hjá"ri "meðfram"ri "mót"ri "móti"ri "nálægt"ri "undan"ri "úr"ri ;
LIST AccDatPrep = "á"ri "eftir"ri "fyrir"ri "í"ri "með"ri "undir"ri "við"ri "yfir"ri ;
LIST MODV = "ætla" "kunna" "láta" "skula" "vilja" "munu" "mega" "vera" ; #todo: translate fao to icelandic
LIST ACCSUBJVERB = "bresta" "dreyma" "fýsir" "greinir" "grípa" "gruna" "hrylla" "hungra" "kitla" "klígja" "klæja" "kreppa" "langa" "lengja" "lengja# eftir" "lysta" "lægja" "misminnir" "minnir" "muna" "órar" "raga" "ráma" "reka" "saka" "setur" "skefur" "skipta" "skorta" "stoða" "sundla" "svengja" "svima" "svíða" "syfja" "undra" "vanhagar" "vanta" "varðar" "verkjar" "þrjóta" "þverra" ;
LIST DATSUBJVERB = "auðnast" "áskotnast" "batna" "ber" "berast" "birtast" "bjóða" "blandast" "blæða" "blæða# út" "blöskra" "bragðast" "bregða" "brenna" "búa" "bætast" "daprast" "dáma" "dettta" "drjúpa" "duga" "dveljast" "dyljast" "elna" "endast" "fara" "feila" "festast" "fjölga" "fljúga" "fylgja" "fyrirgefa" "fæðast" "fækka" "förla" "gagnast" "ganga" "geðjast" "gefast" "gremjast" "greypast" "græðast" "haldast" "hefnast" "heilsast" "henta" "heppnast" "heyrast" "henta" "hlaupa" "hlekkjast" "hlotnast" "hlýnar" "hnignar" "hrakar" "hrjósa" "hugkvæmast" "hugnast" "hæfa" "hægja" "hættir" "kemur" "kólna" "kyngir" "lánast" "lást" "leiðast" "leyfast" "ljúka" "ljósta" "lærast" "misfarast" "misheppnast" "misheyrast" "nægja" "ofbjóða" "óa" "ratast" "reiknast" "réna" "rigna" "rísa" "sárna" "seinka" "sinnast" "sjatna" "sjást" "skána" "skeika" "skiljast" "skjátlast" "skola" "skrika" "snúast" "sortna" "stafa" "standa" "stígur" "stekkur" "súrna" "svelgjast" "svipa" "svíða" "sýnast" "sækjast" "sæma" "takast" "teljast" "mér" "vefjast" "vegna" "veita" "versna" "viðkoma" "viðvíkja" "vinnast" "vinnast" "vitnast" "volgna" "vökna" "yfirsjást" "ylna" "þoka" "þóknast" "líða" ("finna" midv) ("skilja" midv) "líka" "mislíka"; ## TODO: CHECK 'líða' and 'finnst'
LIST WANTINGVERB = "vilja";
LIST REPORTINGVERB = "segja";
LIST SADV = "aldrei" "ekki" "alltaf" ; # complete
LIST NAGD = nom acc gen dat;
LIST GENDER = m f nt;
LIST NUMBER = sg pl;
LIST PERSON = p1 p2 p3;
LIST COMMA = (",") ;
SET VerbFin = Verb + TempsFin;
SET NomMscFem = (n m) OR (n f) ;
SET NomMscNeu = (n m) OR (n nt) ;
SET NomFemNeu = (n f) OR (n nt) ;
SET NOTDAT = Nom | Gen | Acc ;
SET NOTACC = Nom | Gen | Dat ;
SET NOTACCDAT = Nom | Gen ;
SET OBL = Acc | Dat | Gen ;
SET POST-DET = Adj | Det | N | Num | Adv ;
SET PRE-N = Adj | Det | (N Gen) | Num | (Pron Gen) | (Pron Dem) | CC ; # Det???
SET WORD = N | Verb | Adj | Prep | Pron | Det | Adv | CC | CS | Interj | Num | ("\?") ;
SET MARK = COMMA | ("\\") | ("\;") ; #"
SET WORDMARK = WORD | MARK ;
SET NPNHA = WORDMARK - PRE-N - Adv ;
SECTION
#################################################################################
# Specific lexemes
#################################################################################
REMOVE N IF (-1C N OR ProperNom) (0 ("<á>"));
REMOVE N IF (1 PP | VerbSupine) (0 ("hafa"));
#Finnland er í Evrópusambandinu og er eina Norðurlandaþjóðin sem hefur tekið upp evruna sem gjaldmiðil.
REMOVE Rel IF (0 ("sem")) (NOT 1* VerbFin BARRIER CLB);
REMOVE Conj IF (0 ("er")) (-1 Conj);
#Ekki er búið að boða hvenær það hefst.
REMOVE Rel IF (0 ("er")) (NOT -1 COMMA) ;
#Töldu margir þingmenn að skýrslan gæti verið gott innlegg í umræðuna og gæti aukið jöfnuð á ný meðal Kínverja.
REMOVE ("gæta") IF (0 ("gæta")) (0 ("geta")) (1 Adj | PP | VerbSupine);
#################################################################################
# Proper nouns
#################################################################################
# hús Láru
SELECT ProperNom IF (-1C N) (1 Gen) ; # !tag.isCase(GENITIVE) ;
SELECT ProperNom IF (-1C GenPrep) (1 Gen) ;
SELECT ProperNom IF (-1C AccPrep) (1 Acc) ;
SELECT ProperNom IF (-1C DatPrep) (1 Dat) ;
# Hildar Guðmundsdóttur
SELECT ProperNom IF (-1C ProperNom) (-1C Gen) (0 ("<.*dóttur>"r)) (0 Gen) ; # !tag.isCase(GENITIVE) ;
SELECT ProperNom IF (-1C ProperNom) (-1C Fem) ; # !tag.isGender(FEMININE) ;
SELECT ProperNom IF (-1C ProperNom) (-1C Msc) ; # !tag.isGender(MASCULINE) ;
REMOVE ProperNom + Acc IF (1C* Acc BARRIER CLB);
#################################################################################
# Noms
#################################################################################
# hann sýnir but stakk hún hendi is ok, það sýnir aldrei
# CEx. Þessi íslenska kona
#SELECT Nom IF ((-1C PersPron) OR (-1C PersPron LINK -1C DemPron) OR (-1C ("<við>"ri)));
# CEx. um nýja samkomulagið
#SELECT N IF (-1C GenPrep) (1 Gen) ;
#SELECT N IF (-1C AccPrep) (1 Acc) ;
#SELECT N IF (-1C DatPrep) (1 Dat) ;
# að (cn/aa) beina (sgn/n*) mér
# Íslendingar munu boða að
REMOVE N IF (-1 Inf) (0 VerbInf) (NOT -1 MODV) ;
# einhvern sem sæti
# sem steðjar að heiminum
REMOVE N IF (-1 ("<sem>"ri)) (0 Verb) (NOT 1 ("að"ri));
# choose the verb
# CEx. Ísland á dagskrá eftir viku
# CEx. Fundi Íslendinga með Bretum og Hollendingum um Icesave málið lauk í dag án niðurstöðu.
#REMOVE N IF (-1C ProperNom) (0 Verb) ;
# Disallow two nouns in a row unless the latter is in the genitive case
REMOVE N IF (-1C N) (NOT -1 Gen) ((NOT -2 ProperNom) OR (-2 BOS));
# select the possessive pronoun, "pabbi sinn"
SELECT PossPron IF (-1C N);
SELECT ("á"ri) IF (-1 Adv);
# skal (ekki) hita
SELECT VerbInf IF ((-1 VerbSpecAux) OR (-1C Adv LINK NOT -2 BOS LINK -2 VerbSpecAux));
# hafði talið, velja sagnbót
# þetta kerfi get ekki þýtt neitt.
SELECT VerbSupine IF ((-1 VerbAux) OR (-2 VerbAux));
# select the adjective, but ok is "fyrir framan X", and ok is "bara verð markaðarins"
SELECT Adv IF (0 Adj) (-1 BOS OR (NOT -1 Prep)) (1 EOS OR (NOT 1 N LINK 1 Gen));
# sú líkn
# CEx. að í því hefðu fyrirvararnir
#SELECT DemPron IF (-1 N) (NOT 0 N);
#SELECT VerbBe IF (NOT 0 N);
# select the adjective, "hann er lasinn",
SELECT Adj IF (-1 VerbBe) (NOT -2 BOS) (-2 PersPron);
#Auðvitað brá okkur við þetta
REMOVE N IF (NOT -1* VerbFin BARRIER BOS) (NOT 1* VerbFin BARRIER EOS) (0 VerbFin) (0 N);
#Bandaríkin heita aðstoð
REMOVE Adj IF (NOT -1* VerbFin BARRIER BOS) (NOT 1* VerbFin BARRIER EOS) (0 VerbFin) (0 Adj);
#Finnland er í Evrópusambandinu og er eina Norðurlandaþjóðin sem hefur tekið upp evruna sem gjaldmiðil.
REMOVE Conj IF (NOT -1* VerbFin BARRIER BOS) (NOT 1* VerbFin BARRIER EOS) (0 VerbFin) (0 Conj);
REMOVE Conj IF (NOT -1* VerbFin BARRIER BOS) (NOT 1* VerbFin BARRIER Conj LINK 1 VerbFin) (0 VerbFin) (0 Conj);
#Að því loknu verður málið rætt á þingi.
REMOVE N + Acc IF (0 Nom) (0 Acc) (NOT -1* N + Nom BARRIER CLB) (NOT 1* N + Nom BARRIER CLB) (NOT 1* ACCSUBJVERB BARRIER CLB) (NOT -1* ACCSUBJVERB BARRIER CLB);
#Þór býr í höll sem heitir Bilskirnir
REMOVE Adj IF (-1C Prep) (1 Conj | Rel);
#################################################################################
# Adverbs
#################################################################################
#Hin íslenska Wikipedia fór í gang 5. desember 2003 og inniheldur núna 27.671 greinar.
REMOVE ("núa") + PP IF (0 ("núna") + Adv) (NOT -1C* VerbAux BARRIER CLB) (NOT 1C* VerbAux BARRIER CLB);
#Rouston Benoit, 10 ára, var á gangi með ömmu sinni þegar skjálftinn reið yfir.
REMOVE ("þegar") + Adv IF (-1* VerbFin BARRIER BOS) (1* VerbFin BARRIER EOS);
#################################################################################
# Adjectives
#################################################################################
# Hann borðar mjög heita súpu en hún hleypur.
REMOVE N IF (-1C ("<mjög>"));
REMOVE VerbInf IF (-1C ("<mjög>"));
REMOVE VerbFin IF (-1C ("<mjög>"));
# norska ríkisstjórnin
REMOVE N IF (0 N) (0 Nom) (0 Adj) (0 (vei)) (1C N) (1C Def);
# íslenskan almenning
REMOVE N IF (0 N) (0 Nom) (0 Adj) (0 (sta)) (1C N) (1C Indef);
# kröfurnar voru skýrar;
REMOVE Adv IF (0 Adv) (0 Adj) (-1C VerbBe) (1C CLB);
# Fallega rauða rósin
REMOVE Adv IF (NOT -1C* VerbFin BARRIER CLB) (0 Adv) (0 Adj) (1 Adj);
# Ég er að flytja frá Akureyri til Reykjavíkur í eitt ár.
REMOVE Adj IF (-1 Prep) (0 Adj) (0 Num) (1 N) (1 Sg);
#Bankarnir stóru.
REMOVE Adj + Strong IF (-1C N + Def);
#################################################################################
# Advs
#################################################################################
SELECT Adv IF (-1C VerbFin) (1C Verb) (1 Participle);
#################################################################################
# Personal pronouns
#################################################################################
#ég gerði það sjálfur
SELECT PersPron + Acc IF (-1 VerbFin) (-1C* PersPron + Nom BARRIER VerbFin | CLB);
#Við gerðum það sjálf.
SELECT:r53p $$PERSON IF (1C VerbFin + $$PERSON)(0 PersPron) ;
#þá auðveldustu
REMOVE ("<þá>"ri) + PersPron IF (1 Verb OR Adv OR N); # was + Conj
REMOVE ("<þá>"ri) + PersPron IF (-1 VerbBe OR Adv OR N); # was + Conj
REMOVE ("<þá>"ri) + PersPron IF ((-1C Refl) OR (-1 VerbBe OR PersPron)); # væri þá and réði sig þá
REMOVE PersPron + Nom IF (-1C* PersPron + Nom BARRIER VerbFin | CLB);
REMOVE PersPron + Nom IF (-1C* PersPron + Nom BARRIER VerbFin | CLB);
#sem hann sá í gær.
REMOVE PersPron + Acc IF (-1 ("sem")) (1 VerbFin) (0 PersPron + Nom) (0 PersPron + Acc) (NOT 1* Nom BARRIER CLB | EOS);
#Ég veit ekki hvort það hafa einhverjir nemendur ekki lokið verkefninu
REMOVE InterrPron + Nom IF (-1C* PersPron + Nom BARRIER CLB);
#################################################################################
# Indefinite pronouns
#################################################################################
#Hvað ert þú að gera ?
REMOVE Pron + Nom IF (1C* PersPron + Nom BARRIER CLB);
REMOVE IndefPron + Nom IF (-1 BOS | EOS) (0 IndefPron) (0 InterrPron);
REMOVE IndefPron IF (-1 BOS | EOS) (0 IndefPron) (0 InterrPron) ;
#################################################################################
# Demonstrative pronouns
#################################################################################
# Ég sá ekki
# finnst þér þá
#ég þakka þeim kærlega fyrir
#Fá þeir íbúar, sem ekki geta eða vilja snúa aftur í íbúðirnar yfir nóttina, aðstoð með gistingu ef þörf krefur.
REMOVE DemPron + Nom IF (0 DemPron) (0 PersPron); ## this needs fixing
#SELECT DemPron + $$GENDER + $$NUMBER + $$NAGD IF (1C N + $$GENDER + $$NUMBER + $$NAGD);
REMOVE DemPron IF (-1C PersPron) ;
REMOVE ("<þá>"ri) + DemPron IF (1 VerbFin) (NOT 1 Rel); # þá sem ...
REMOVE ("<þá>"ri) + DemPron IF (1 Conj OR Adv) (-1 BOS); # Þá þegar ...
REMOVE ("<þá>"ri) + DemPron IF (1C N OR ProperNom) (-1 Verb); # gekk þá maðurinn
# En mér leið ekki vel eftir þetta.
REMOVE Det IF (0 Det) (0 Pron) (NOT 1 POST-DET);
# Við gerðum það sjálf.
REMOVE DemPron IF (-1C VerbFin) (1C Refl);
# í gær sá stelpan.
REMOVE DemPron IF (0 DemPron) (0 VerbFin) (NOT -1* VerbFin BARRIER CLB) (NOT 1 VerbFin BARRIER CLB);
#Þetta er borgin, er hann kom frá.
SELECT Rel IF (-1C Coma) (0 ("er")) (1C* VerbFin BARRIER CLB);
#################################################################################
# Reflexive pronouns
#################################################################################
# sem hann sér í dag.
REMOVE Refl IF (0 Refl) (0 VerbFin) (NOT -1* VerbFin BARRIER CLB) (NOT 1 VerbFin BARRIER CLB);
#################################################################################
# Interrogative pronouns
#################################################################################
# Ég veit ekki hvort Jón læsi aldrei bókina
REMOVE ("hvor"ri) + InterrPron IF (1 N + Nom) ;
REMOVE ("hvor"ri) + InterrPron IF (1 ProperNom + Nom) ;
#################################################################################
# Possessive pronouns
#################################################################################
#################################################################################
# Prepositions
#################################################################################
#að styðja
SELECT Prep IF (0 ("að"ri)) (1 VerbInf);
#sem leggja fram kæru á hendur ríkinu.
SELECT Prep IF (0 ("[Áá]"ri)) (1C N OR ProperNom) (NOT 1C Gen);
#Þeir eru undir rúminu
SELECT Prep IF (0 Prep) (0 Adv) (1C PRE-N);
#Ég talaði aldrei við Súsönnu.
REMOVE PersPron + Nom IF (-1C* PersPron BARRIER CLB);
#################################################################################
# NPs
#################################################################################
# 15 milljörðum dollara
# um 1.950 milljörðum íslenskra króna.
# This is a hack because we don't want to do unification with 'billion' etc. perhaps there
# is a better way of doing it .
SELECT (n pl gen) IF (-1C Num + (pl));
REMOVE:ufc_f PP + Fem IF (0 $$NAGD) (*1 NomMscNeu + $$NAGD BARRIER NPNHA LINK NOT 0 Fem);
REMOVE:ufc_m PP + Msc IF (0 $$NAGD) (*1 NomFemNeu + $$NAGD BARRIER NPNHA LINK NOT 0 Msc);
REMOVE:ufc_nt PP + Neu IF (0 $$NAGD) (*1 NomMscFem + $$NAGD BARRIER NPNHA LINK NOT 0 Neu);
REMOVE:ufc_f Adj + Fem IF (0 $$NAGD) (*1 NomMscNeu + $$NAGD BARRIER NPNHA LINK NOT 0 Fem);
REMOVE:ufc_m Adj + Msc IF (0 $$NAGD) (*1 NomFemNeu + $$NAGD BARRIER NPNHA LINK NOT 0 Msc);
REMOVE:ufc_nt Adj + Neu IF (0 $$NAGD) (*1 NomMscFem + $$NAGD BARRIER NPNHA LINK NOT 0 Neu);
REMOVE:ufc_f_p Adj + Fem IF (0 $$NAGD) (*-1 NomMscNeu + $$NAGD BARRIER NPNHA LINK NOT 0 Fem) (NOT 1* Nom + Fem BARRIER NPNHA);
REMOVE:ufc_m_p Adj + Msc IF (0 $$NAGD) (*-1 NomFemNeu + $$NAGD BARRIER NPNHA LINK NOT 0 Msc) (NOT 1* Nom + Msc BARRIER NPNHA);
REMOVE:ufc_nt_p Adj + Neu IF (0 $$NAGD) (*-1 NomMscFem + $$NAGD BARRIER NPNHA LINK NOT 0 Neu) (NOT 1* Nom + Neu BARRIER NPNHA);
REMOVE:d_ufc_f Det + Fem IF (0 $$NAGD) (*1 NomMscNeu + $$NAGD BARRIER NPNHA LINK NOT 0 Fem);
REMOVE:d_ufc_m Det + Msc IF (0 $$NAGD) (*1 NomFemNeu + $$NAGD BARRIER NPNHA LINK NOT 0 Msc);
REMOVE:d_ufc_nt Det + Neu IF (0 $$NAGD) (*1 NomMscFem + $$NAGD BARRIER NPNHA LINK NOT 0 Neu);
SELECT:r30 $$GENDER IF (-1C Num + $$GENDER)(0 N);
SELECT:r28 $$GENDER IF (-1C Adj + $$GENDER)(0 N);
SELECT:r28b $$GENDER IF (-1C Det + $$GENDER)(0 N);
SELECT:r28c $$GENDER IF (-1C IndefPron + $$GENDER)(0 N);
SELECT:r28d $$GENDER IF (-1C PP + $$GENDER)(0 N);
SELECT:r30 $$NAGD IF (-1C Num + $$NAGD)(0 N);
SELECT:r29 $$NAGD IF (-1C Adj + $$NAGD)(0 N);
SELECT:r29b $$NAGD IF (-1C Det + $$NAGD)(0 N);
SELECT:r29c $$NAGD IF (-1C IndefPron + $$NAGD)(0 N);
SELECT:r29d $$NAGD IF (-1C PP + $$NAGD)(0 N);
SELECT:r30 $$NUMBER IF (-1C Num + $$NUMBER)(0 N);
SELECT:r30 $$NUMBER IF (-1C Adj + $$NUMBER)(0 N);
SELECT:r30b $$NUMBER IF (-1C Det + $$NUMBER)(0 N);
SELECT:r30c $$NUMBER IF (-1C IndefPron + $$NUMBER)(0 N);
SELECT:r30d $$NUMBER IF (-1C PP + $$NUMBER)(0 N);
# enga bók
SELECT:r31 Det IF (1C PRE-N) (0 Det) (0 IndefPron);
#Nánast allir Íslendingar nota nú netið með ADSL.
SELECT Det IF (0 $$NAGD) (0 Det OR Pron) (1C* N) (1C* $$NAGD);
#Hundur systur minnar
SELECT Gen IF (-1C Nom) (0 NAGD) (1C PossPron)
#á mati lögreglu
SELECT Gen IF (-1C N) (-1C Nom OR Acc OR Dat) (NOT 0 VerbFin);
#Einungis þriðjungur Norðmanna vill að landið gangi í Evrópusambandið
#REMOVE Nom IF (-1C VerbFin) (0 Nom) (0 Acc) (NOT -1 DATSUBJVERB | ACCSUBJVERB);
#################################################################################
# Verbs
#################################################################################
REMOVE (imp) (NOT -1 CLB);
#Fá þeir íbúar, sem ekki geta eða vilja snúa aftur í íbúðirnar yfir nóttina, aðstoð með gistingu ef þörf krefur.
REMOVE Inf IF (-1 BOS) (NOT 1* VerbFin BARRIER CLB);
SELECT Inf IF (-1 ("að"ri)) (-2 ("við"ri));
# Ég sé hesta
#Ennfremur sé málið mjög viðkvæmt í Hollandi.
#Tjónið gæti verið meira en 15 milljörðum dollara eða um 1.950 milljörðum íslenskra króna.
REMOVE TempsIrreal + VerbAux IF (NOT -1* CS) (NOT -1 BOS) (NOT -1 Adv LINK -1 BOS) (NOT 0 VerbAux);
SELECT:r51 Inf IF (*-1 MODV BARRIER Verb);
# María mun koma
SELECT:r52 MODV IF (1C Inf);
# Íslendingar munu boða að þeir ætli að draga úr losun
SELECT MODV + TempsFin IF (1C Inf);
# Ég las bókina
# #á morgun í Kaupmannahöfn, að því er Ríkisútvarpið greindi frá.
SELECT:r53 $$PERSON IF (-1 PersPron + $$PERSON)(0 VerbFin) (NOT 1 ("er"ri));
SELECT:r53a $$PERSON IF (1C PersPron + $$PERSON + Nom)(0 VerbFin) (NOT 1 ("er"ri)) (NOT 0 ("sem"ri) OR ("er"ri));
SELECT:r53b VerbFin + $$NUMBER IF (-1 N + $$NUMBER + Nom) (0 VerbFin) (NOT 1 ("er"ri)) (NOT 0 ("sem"ri));
# The modals munu and skulu can never be preceded by another auxiliary. (p.10)
REMOVE:r54 VerbAux IF (1C ("munu") OR ("skulu"));
REMOVE:r55 VerbFin IF (-1C* VerbFin BARRIER CLB) (0 VerbFin) ;
# *NATO sendi 7.000 hermenn
REMOVE VerbFin + (p1) IF (NOT -1* (prn p1) BARRIER CLB) (NOT 1* (prn p1) BARRIER CLB) ;
REMOVE VerbFin + (p2) IF (NOT -1* (prn p2) BARRIER CLB) (NOT 1* (prn p2) BARRIER CLB) ;
#Bandaríkin hafa beðið þær 43 þjóðir sem eru með hermenn í Afganistan að senda 10.000 hermenn
SELECT ("hafa"ri) + VerbFin IF (1C* Participle BARRIER PRE-N);
#100 breskir hermenn hafa fallið í Afganistan
#Við vorum að vakna og nú tekur við fundur þar sem farið verður yfir verkefni dagsins
SELECT Participle IF (-1C VerbAux);
SELECT Participle IF (1C VerbAux);
#Himinninn er blár
REMOVE Rel IF (0 ("<er>"ri)) (NOT -1* VerbFin BARRIER CLB) (NOT 1* VerbFin BARRIER CLB);
#mátt þú ekki eta
SELECT MODV + $$PERSON IF (1C PersPron + $$PERSON) (NOT 0 ("er"));
# Í gær borðuðu allir stóru strákarnir góðu súpuna.
REMOVE PP IF (NOT -1* VerbFin BARRIER BOS) (NOT 1* VerbFin BARRIER EOS) (0 VerbFin) (0 PP);
# Þetta er besti árangur minn.
REMOVE ("er"ri) + Conj IF (NOT -1* VerbFin BARRIER BOS) (NOT 1* VerbFin BARRIER EOS) (0 VerbFin) (0 Conj);
# Haítí, Port-au-Prince, er rústir einar.
REMOVE ("er"ri) + Conj IF (-1C Coma LINK -1 N | ProperNom LINK -1C Coma);
# en fjölskylda hans tilkynnti ekki um hvarfið fyrr en í nóvember þar sem hún hélt að hann væri á sólarströnd við Karabíska hafið.
REMOVE Verb IF (-1C Adj) (0 N) (0 Verb) (1 EOS);
##
# Specific pre-disambiguation lexical selection
#
SELECT ("stig"ri) IF (0 ("<stiga>"ri)) (1 ("frost"ri) OR ("hiti"ri));
#################################################################################
# Syntax
#################################################################################
## Todo:
## Disambiguate co-ordinators, find objects, predicates, adverbials, just
## enough to let us write transfer rules more easily.
SECTION
LIST @X = @X;
LIST @←ADVL = @←ADVL;
LIST @ADVL→ = @ADVL→;
LIST @←SUBJ = @←SUBJ;
LIST @SUBJ→ = @SUBJ→;
LIST @-FMAINV = @-FMAINV;
LIST @+FMAINV = @+FMAINV;
LIST @-FAUXV = @-FAUXV;
LIST @+FAUXV = @FAUXV;
LIST @←N = @←N;
LIST @N→ = @N→;
LIST @CS→ = @CS→;
LIST @CNP = @CNP; # SN co-ordinator
LIST @CVP = @CVP; # SV co-ordinator
MAP (@←SUBJ) TARGET PersPron + Nom + $$PERSON + $$NUMBER (-1C* VerbFin + $$PERSON + $$NUMBER BARRIER CLB) (0C PersPron) (NOT 0 PossPron);
MAP (@SUBJ→) TARGET DemPron + Nom (1C* VerbFin BARRIER CLB) (0C DemPron) (NOT 0 PossPron);
MAP (@SUBJ→) TARGET PersPron + Nom (1C* VerbFin BARRIER CLB) (0C PersPron) (NOT 0 PossPron);
MAP (@SUBJ→) TARGET PersPron + Dat (1C* VerbFin + DATSUBJVERB BARRIER CLB) (0C PersPron) (NOT 0 PossPron);
MAP (@SUBJ→) TARGET PersPron + Acc (1C* VerbFin + ACCSUBJVERB BARRIER CLB) (0C PersPron) (NOT 0 PossPron);
MAP (@←SUBJ) TARGET PersPron + Nom + $$PERSON + $$NUMBER (-1C* VerbFin BARRIER CLB) (-1* VerbFin + $$PERSON + $$NUMBER BARRIER CLB) (0 PersPron + Nom) (NOT 0 PossPron) (NOT -1C* PersPron + Nom) (1 EOS);
MAP (@←SUBJ) TARGET PersPron + Dat (-1C* VerbFin + DATSUBJVERB BARRIER CLB) (0C PersPron) (NOT 0 PossPron);
MAP (@←SUBJ) TARGET PersPron + Acc (-1C* VerbFin + ACCSUBJVERB BARRIER CLB) (0C PersPron) (NOT 0 PossPron);
#MAP (@←SUBJ) TARGET N + Nom + $$NUMBER (-1C* VerbFin + $$NUMBER + (p3) BARRIER CLB) (0 N + Nom + $$NUMBER);
MAP (@←SUBJ) TARGET N + Nom + $$NUMBER (-1* VerbFin + $$NUMBER + (p3) BARRIER CLB)
(0 N + Nom + $$NUMBER)
(NOT -1* @←SUBJ OR @SUBJ→ BARRIER CLB);
MAP (@SUBJ→) TARGET N + Nom (1C VerbFin) (0 N + Nom);
MAP (@SUBJ→) TARGET N + Nom (1C* VerbFin BARRIER CLB) (0 N + Nom);
MAP (@SUBJ→) TARGET ProperNom + Nom (1 VerbFin) (0 ProperNom + Nom) (NOT -1* Nom BARRIER CLB) (NOT 1C* Nom BARRIER CLB);
MAP (@SUBJ→) TARGET ProperNom + Nom (1C VerbFin) (0C ProperNom + Nom);
MAP (@←SUBJ) TARGET ProperNom + Nom (-1C VerbFin) (0C ProperNom + Nom) (NOT -1C* @SUBJ→ BARRIER CLB);
#Litlu músina hafði stóra uglan étið í gær
MAP (@OBJ→) TARGET N + Acc (1C VerbFin) (0C N + Acc);
MAP (@←OBJ) TARGET N + Acc (-1C VerbFin) (0C N + Acc);
# Check these 'auxv' with pp/supn and 'modv' with 'inf' ?
MAP (@+FAUXV) TARGET VerbAux + TempsFin (NOT 1C* VerbAux + TempsFin BARRIER CLB)
(NOT -1C* VerbAux + TempsFin BARRIER CLB)
(0C VerbAux + TempsFin)
(1C* Participle OR Inf OR VerbSupine BARRIER CLB | PRE-N);
MAP (@+FAUXV) TARGET MODV + TempsFin (NOT 1C* MODV + TempsFin BARRIER CLB)
(NOT -1C* MODV + TempsFin BARRIER CLB | Conj)
(0C MODV + TempsFin)
(1C* Participle OR Inf OR VerbSupine BARRIER CLB | PRE-N);
MAP (@+FMAINV) TARGET VerbFin + (p3) + $$NUMBER (1* @←SUBJ + $$NUMBER BARRIER CLB) (0 VerbFin LINK -1 Adv);
MAP (@+FMAINV) TARGET VerbFin + (p3) + $$NUMBER (-1* @SUBJ→ + $$NUMBER BARRIER CLB);
MAP (@+FMAINV) TARGET VerbFin + $$PERSON + $$NUMBER (-1C* @SUBJ→ + $$PERSON + $$NUMBER BARRIER CLB);
MAP (@+FMAINV) TARGET VerbFin + $$PERSON + $$NUMBER (1C* @←SUBJ + $$PERSON + $$NUMBER BARRIER CLB);
MAP (@+FMAINV) TARGET VerbFin + $$PERSON + $$NUMBER (NOT 1* @+FMAINV BARRIER CLB) (NOT -1* @+FMAINV BARRIER CLB);
# sem leikað var ...
MAP (@-FMAINV) TARGET VerbSupine | Participle (-1 Rel) (1C VerbAux + TempsFin);
MAP (@-FMAINV) TARGET VerbSupine | Participle (-1C* VerbAux + TempsFin BARRIER CLB);
MAP (@-FMAINV) TARGET Inf (-1C* MODV + TempsFin BARRIER CLB + PRE-N);
MAP (@←N) TARGET Adj + $$NAGD + $$NUMBER (0C Adj) (-1C N + $$NAGD + $$NUMBER);
SELECT Adj + @←N (0C Adj) (NOT 1* N + $$NAGD + $$NUMBER) (-1C N + $$NAGD + $$NUMBER); ## ugly hack.
MAP (@N→) TARGET Num + Gen (0C Num) (1C N + Gen);
MAP (@N→) TARGET Num (0C Num) (1C* N BARRIER CLB | VerbFin);
MAP (@N→) TARGET (det) (0C (det)) (1C N);
MAP (@←N) TARGET Num + Gen (0C Num + $$NUMBER) (-1C N + $$NUMBER);
MAP (@←N) TARGET Num + Gen (0C Num) (-1C N + Gen);
MAP (@CS→) TARGET (cnjsub) (0C (cnjsub));
MAP (@ADVL→) TARGET Adv (1* @+FMAINV | @-FMAINV BARRIER CLB) ;
MAP (@←ADVL) TARGET Adv (-1* @+FMAINV | @-FMAINV BARRIER CLB) ;
AFTER-SECTIONS
#Okkur fannst hún grunsamleg er hún kom hingað fyrst og keypti sprautur og nálar.
SELECT @SUBJ→ IF (1C @+FMAINV);
MAP (@X) TARGET VerbFin;
MAP (@X) TARGET N;
MAP (@X) TARGET ProperNom;
MAP (@X) TARGET Det;
# ganga# í vs. ganga+í
#SUBSTITUTE (pr @X) (pr) Verb (0 (+í));
#SUBSTITUTE (pr @+FMAINV) (pr) Verb (0 (+í));
#SUBSTITUTE (pr @-FMAINV) (pr) Verb (0 (+í));
#
#SUBSTITUTE (sg pr) (sg) Verb;
#SUBSTITUTE (+í) (+í pr) Verb (0 (+í));