-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathhbo-with.cg3
1033 lines (789 loc) · 36.4 KB
/
hbo-with.cg3
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
DELIMITERS = "<svb>" ;
OPTIONS += safe-setparent ;
####################
# Boundaries
####################
LIST PB = pb ;
LIST CB = cb ;
LIST SB = sb ;
LIST SVB = svb ;
LIST BD = pb cb sb svb ;
####################
# POS
####################
LIST Det = art ;
LIST Pr = prep ;
LIST Noun = subs nmpr (verb ptcp) (verb ptca) ;
LIST RelMark = ("אשׁר" conj @mark) ("ה" conj CP Rela) ("שׁ" conj) ;
LIST Number = card ordn ;
LIST PRON = prde prps prn ;
LIST ADJ = adjv ;
LIST ADV = advb nega ;
LIST SCONJ = "כי" "פן" "אשׁר" "אם" "שׁ" "ה" "לולא" "לו" (conj retag:prep) (conj retag:subs ppre) ;
LIST NonMarkingSCONJ = "לו" ;
####################
# Subcategories
####################
LIST Participle = ptca ptcp ;
####################
# Text-Fabric labels
####################
# Complete
LIST ClauseType = AjCl CPen Defc Ellp InfA InfC MSyn NmCl Ptcp Reop Unkn Voct Way0 WayX WIm0 WImX WQt0 WQtX WxI0 WXIm WxIX WxQ0 WXQt WxQX WxY0 WXYq WxYX WYq0 WYqX xIm0 XImp xImX XPos xQt0 XQtl xQtX xYq0 XYqt xYqX ZIm0 ZImX ZQt0 ZQtX ZYq0 ZYqX ; # feature typ
LIST AGen = m f ;
LIST ANum = sg du pl ;
LIST ADet = det und ;
LIST Domain = N D Q ? QQ ;
# Subsets
LIST NonQuote = N D ? ;
####################
# Helper labels
####################
LIST HasConj = HasConj ;
LIST HasMark = HasMark ;
LIST HasRel = HasRel ;
LIST PPHead = PPHead ;
LIST NPHead = NPHead ;
LIST CR = ClauseRoot ; # is root of clause
LIST FullClauseRoot = FullClauseRoot ; # is root of non-relative clause
SET PlainC = CR - HasMark - HasRel - (@nsubj:outer) ;
SET PlainNC = PlainC - HasConj ;
LIST Lemma = ".*"r ;
LIST Lemma2 = ".*"r ;
LIST Q = Q ;
LIST QQ = QQ ;
LIST NQ = NQ ;
LIST QuoteLevel = NQ Q QQ ;
LIST VerbArgs = @nsubj @obj @obl @vocative (@xcomp adjv) (@advcl infa) (@advcl infc) @advmod ;
####################
# Word lists
####################
LIST AdvclObl = ("בלי" subs CP) ;
LIST NegObl = ("בלת" subs InfC) ;
LIST QMark = ("לאמר" SCONJ verb) ;
LIST CaseAbleAdv = "כן" "שׁם" "פה" "שׁם" "הלאה" "הנה" "עתה" "אז" "כה" ;
LIST FamilyOrTitle = "בן" "בת" "אב" "כלה" "אשׁה" "מלך" "גברת" "שׂר" "אחות" "כהן" "אח" "שׁפחה" "אדון" "אלוף" ;
LIST CcompVerb = "ראה" "ירא" "ידע" "נחם" "נגד" ;
LIST XcompVerb = "שׁחת" "קרא" "מלא" "לבשׁ" "שׁחת" "מהר" "יכל" "חדל" "אמץ" "כלה" ;
LIST AdvclMarkVerb = "קרא" ;
LIST PrAdvcl = "עד" ;
LIST XcompInf = "יסף" "יכל" "חפץ" "מהר" "אמץ" "חדל" "כלה" "ירא" "מלא" "חלל" "קרב" "יאל" "לאה" "צוה" "נתן" ;
LIST SpeakingVerb = quot "ברך" "צוה" "נגד" "דבר" "ענה" "שׁמע" ;
LIST ConjAblePrep = "כמו" "למען" "עד" ;
LIST ConjAbleSubsPrep = "בלת" ;
LIST SubsToPrep = "אחר" "בין" "אצל" "בעד" ;
LIST Masculine = "מכיר" "אשׁר" "בצע" "בקר" ;
# TODO: BDB says sometimes masculine
LIST FeminineMixed = "ארץ" "יד" "צאן" "אשׁ" "גן" "גפן" ;
# TODO: BDB says sometimes feminine
LIST MasculineMixed = "לחם" "דרך" "אור" "אות" "ארון" "גמל" ;
SET GeneologyTitle = ("אלוף" Genesis) - (w20123) ;
####################
# Special-case words
####################
LIST PPHeadOverride = (Ruth w575) (Ruth w580) ;
# Apposition and NP conjunction
LIST FamilyOrTitleSkip = (Genesis w14663) ;
LIST ApposToLastGen = w265 w297 w307 w640 w648 w734 w1129 w1257 w1338 w1966 w2993 w3000 w5450 w7733 w11294 w12466 w12610 w12711 w13874 w14590 w14649 w18761 w18788 w19072 w3308 w3314 w3331 w5402 w4106 w4185 w6817 w6820 w2672 w8520 w8578 w9563 w24352 w24349 w6459 w27627 w27629 w7423 w10681 w10987 w11356 ;
LIST ApposToLastRut = w19 w50 w93 w1528 ;
SET ApposToLast = ApposToLastGen + (Genesis) OR ApposToLastRut + (Ruth) ;
LIST ApposOverAcl = (Genesis w3325) (Genesis w12858) (Genesis w14778) (Genesis w10252) ;
LIST ApposOverride = (w93 Ruth) (w189 Genesis) (Genesis w14323) (Genesis w4544) ;
LIST ConjToAppos = w36714 (w7950 Exodus) (w95 Ruth) (w215 Genesis) (w313 Genesis) (Genesis w303) (Genesis w5424) (Genesis w6462) (Genesis w7517) (Genesis w7793) (Genesis w11149) ;
LIST ConjToSmixut = (Genesis w734) (Genesis w6582) (Genesis w6628) (Genesis w8154) ;
# prn doesn't have w###, so use preceding prep
LIST PrnNmodToSublist = (Genesis w2960) (Genesis w3165) (Genesis w3871) (Genesis w3921) (Genesis w4172) (Genesis w3298) (Genesis w26108) ;
# @acl and @advcl
LIST NonAclOverride = (Genesis w2676) (Ruth w1682) (Genesis w10555) ;
LIST MarkOverride = (Genesis w1508) (Genesis w1561) (Genesis w2064) (Genesis w2072) (Genesis w14455) (Genesis w15341) (Ruth w319) (Genesis w8867) ;
LIST NonMarkOverride = (Genesis w1243) (Genesis w11173) ;
LIST NonRelOverride = (Genesis w2676) (Genesis w10555) ;
LIST PreMark = (Genesis w1774) (Genesis w6030) (Genesis w6036) (Genesis w11906) (Genesis w16927) (Genesis w17650) (Genesis w28321) (Ruth w1212) (Ruth w1206) (Ruth w1412) (Genesis w6169) (Genesis w9388) (Genesis w8176) (Genesis w11268) (Genesis w25408) ;
LIST PostMark = (Genesis w1035) (Genesis w1231) (Genesis w2977) (Ruth w948) (Ruth w1301) (Ruth w1467) (Genesis w5736) (Genesis w17852) (Genesis w7273) (Genesis w8069) (Genesis w28587) (Genesis w17852) (Genesis w28587) ;
LIST NestMark = (Genesis w2099) (Genesis w2760) (Genesis w13723) (Genesis w16271) (Genesis prn c32626) (Genesis w21741) (Genesis w25551) (Ruth w122) (Ruth w127) (Ruth w266) (Ruth w1161) (Ruth w1181) (Ruth w1325) (Genesis w8239) ;
LIST MarkToAcl = (Genesis w1848) (Genesis w19068) (Genesis w26087) (Ruth w714) (Genesis w12378) (Genesis w5084) ;
LIST ActuallyCcomp = (w351 Genesis) (Genesis w1037) (Genesis w1251) (Genesis w7129) (Genesis w3697) (Genesis w10561) ;
LIST ActuallyAdvcl = (Genesis w26044) (Genesis w28625) (Ruth w1161) (Ruth w1187) (Ruth w1418) (Genesis w8318) (Genesis w15305) (Genesis w7576) (Genesis w15883) (Genesis w25513) (Genesis w23318) (Genesis w23300) (Genesis w18024) (Genesis w9388) (Genesis w8176) (Genesis w9841) (Genesis w9928) (Genesis w13245) (Genesis w10555) ;
LIST DontConjTo = (Genesis w4993) ;
LIST HasConjOverride = (Genesis w4584) ;
####################
# Universal Dependencies
####################
LIST @root = @root ; # The root of the sentence, often a finite verb
LIST @nsubj = @nsubj ; # The nominal subject of the sentence
LIST @nsubj:outer = @nsubj:outer ;
LIST @amod = @amod ; #
LIST @advmod = @advmod ; # An adverbial modifier
LIST @case = @case ; # The relation of an adposition to its head
LIST @acl = @acl ; # A clause which modifies a nominal
LIST @nmod = @nmod ; # Nominal modifier
LIST @cop = @cop ; #
LIST @nmod:poss = @nmod:poss ;
LIST @obl = @obl ;
LIST @obj = @obj ;
LIST @advcl = @advcl ;
LIST @parataxis = @parataxis ;
LIST @det = @det ;
LIST @csubj = @csubj ;
LIST @nummod = @nummod ;
LIST @compound:smixut = @compound:smixut ;
LIST @cc = @cc ;
LIST @conj = @conj ;
LIST @ccomp = @ccomp ;
LIST @mark = @mark ;
LIST @discourse = @discourse ;
LIST @vocative = @vocative ;
LIST @appos = @appos ;
LIST @dislocated = @dislocated ;
LIST @xcomp = @xcomp ;
LIST @flat = @flat ;
LIST @flat:name = @flat:name ;
LIST @orphan = @orphan ;
LIST @fixed = @fixed ;
LIST @obl:npmod = @obl:npmod ;
LIST DepLabel = @acl @advcl @advmod @amod @appos @case @cc @ccomp @compound:smixut @conj @cop @csubj @det @discourse @dislocated @fixed @flat @flat:name @mark @nmod @nmod:poss @nsubj @nsubj:outer @nummod @obj @obl @obl:npmod @orphan @parataxis @root @vocative @xcomp ;
####################
# Special-case words
####################
LIST etNotAcc = NonAcc (Genesis w2857) (Genesis w2946) (Genesis w3165) (Genesis w3529) (Genesis w3560) (Genesis w3693) (Genesis w4172) (Genesis w4221) (Genesis w13880) (Ruth w897) (Ruth w901) (Genesis w25257) ;
####################
# Unsorted lists
####################
LIST NPish = NP PP ;
LIST SubsOverride = (Genesis w20500) (Ruth w1233) (Genesis w13703) (Genesis w14216) ; # actually nouns, don't retag as prep
LIST ItgAdv = "מתי" "איפה" "איך" "אן" "מדוע" ;
LIST VoctNonCROverride = (Genesis s81570) (Genesis s81725) (Genesis s85145) (Genesis s82809) (Genesis w9312) ;
LIST NsubjPrn = ExsS ModS NCoS PrcS PreS (InjP IntS ClausePhraseRoot) ;
LIST ObjPrn = PreO PtcO ;
LIST BigNumber = "עשׂרה" "מאה" "עשׂר" ;
LIST NumberedOverride = (Genesis w3094) ; # should have @nummod child but normally wouldn't
LIST PrnMaybeDet = prde (prps p3) ;
LIST BetterHeads = Pred Subj Objc PreC PreO ;
LIST AdvIsh = (advb AdvP) (nega NegP) ;
LIST NumberLabel = @nummod @conj @flat ;
LIST ConjHeadOverride = (Genesis w3284) (Genesis w3292) (Genesis w3327) (Genesis w4544) (Genesis w6216) ;
LIST NPIsh = NP PPrP PP PrNP PreO ;
LIST Titles = "בכר" ;
LIST NmodOverridePrep = (Genesis w17245) (Genesis w15328) ; # prep whose prn should get @nmod
LIST ApposToConjHead = (Genesis w3289) (Genesis w3332) ;
LIST YesApposAble = subs nmpr prn (adjv NPHead) (adjv PPHead) ;
LIST NoApposAble = wp2 @nmod:poss ;
SET ApposAble = YesApposAble - NoApposAble ;
LIST NorP = NPHead PPHead ;
LIST ConjSkipClause = (Genesis w1771) (Genesis w11903) (Ruth w1409) (Genesis w9386) (Genesis w8174) (Genesis w6737) (Genesis w6738) ; # conjunction to clause after next clause
LIST NoGlom = prep ;
LIST SubjIsh = Subj (IntS prn) ;
LIST OblIsh = Time Cmpl Loca Modi Adju Supp (Conj PPHead) ;
LIST PredIsh = PreC PrcS PrAd PreO PreS PtcO ;
LIST CopIsh = (Pred vbcp) NCop NCoS ;
LIST NonCopIsh = (Genesis w1955) ;
LIST OrphanPrepVerb = (Genesis w18716) ;
LIST ObjcXcomp = "יסף" "יכל" ;
LIST AdjuXcomp = "מהר" "נתן" ("אמץ" hit) "חדל" "צוה" "כלה" "חפץ" "יסף" "חלל" "קרב" "ירא" "מלא" "לאה" "יאל" "אבה" ;
LIST Ptc = ptcp ptca infc ;
LIST AdvclAble = ("כי" conj @mark) ("אם" conj @mark) ;
LIST ActuallyAcl = (Genesis ClauseRoot ph47742) ;
LIST OrphanInfc = (Genesis w18716) ;
LIST NonFCROverride = (Genesis w5072) ;
LIST FCRSkip = @csubj @acl @advcl rela:Attr ;
LIST SmallQstQ = inrg prin ;
LIST SmallQstPrn = prde prn ;
LIST AdjNonAcl = (Genesis w23609) ;
LIST SubjAble = subs prps nmpr prde prn prin ;
LIST CsubjOverride = (Genesis w1006) (Genesis w5072) ;
LIST ObjAble = subs prn nmpr prin prde ;
LIST XcompOverride = (Genesis w17124) (Genesis w26289) ;
LIST AclChain = (Genesis w603) ;
LIST RelSkip = (Ruth w550) ;
LIST RelToPrn = (Ruth w1714) ;
LIST ConjTypes = CPen NmCl MSyn ;
LIST AclAble = subs adjv ptcp ptca nmpr ;
LIST AclCompNotOk = (Genesis w1179) (Genesis w12528) (Genesis w12613) (Ruth w712) (Genesis w26221) (Genesis w26340) (Genesis w26404) (Genesis w24882) (Genesis w11227) ;
LIST AclMultiTarget = (Genesis w391) (Genesis w9660) (Genesis w9740) ;
LIST XorO = (@xcomp ProbablyObj) @obj ;
LIST CRconj = @ccomp @root @parataxis ;
LIST CcompAble = "חלל" "נתן" "מהר" "צוה" "שׁמע" ;
LIST AttrSkipAcl = (Genesis w22880) ;
LIST ClauseCon = @conj @parataxis @xcomp ;
LIST ConjToAdvcl = (Genesis w772) ;
LIST DontConj = @conj @acl @nmod @xcomp @appos @advcl @nmod:poss (@ccomp N) @obl @mark HasConj @csubj skipconj (@ccomp rela:Objc) ;
SET DetAble = Noun OR ADJ OR PRON ;
SET ProbablyNumber = Number + NumberLabel ;
SET CaseAble = Noun - ProbablyNumber OR PRON OR (verb infc) - QMark OR (verb infa) OR CaseAbleAdv + ADV OR (prin) OR (inrg);
SET AfterPrep = @case OR @nummod OR @cc OR ProbablyNumber ;
SET NonAppos = NPHead - @appos ;
SET SpecialMark = MarkToAcl OR NestMark OR PreMark OR PostMark ;
SET CorR = (conj CP) OR RelMark ;
SET CorM = CR OR (nmcp) - @cop ;
SET MSynIsh = CorR + @cc OR @advmod ;
LIST ActuallyParataxis = (Genesis w888) (Genesis w921) (Genesis w935) (Genesis w2979) (Genesis w4072) (Genesis w4208) (Genesis w12675) (Genesis w12530) (Genesis w7997) (Genesis w23609) ;
LIST ActuallyCsubj = (Genesis w5072) ;
LIST ActuallyObl = (Genesis ph57618) ;
LIST QuoteSkipAcl = (Genesis w7270) ;
LIST ParenSent = (Genesis s82236) ;
LIST ActuallyInf = (Genesis w13111) ;
########################################
# INDIVIDUAL WORDS
########################################
BEFORE-SECTIONS
####################
# Hide Punctuation
####################
REMCOHORT IGNORED (punct) ;
####################
# Corrections
####################
LIST MislabeledAsNarrative = w1404 w1405 w1423 w1424 w14251 w14252 w14253 (Genesis s80885) (Ruth s5672) (Ruth s5673) (Genesis s83562) (Ruth s5647) (Ruth s5650) (Ruth s5651) (Genesis s85072) (Genesis s83308) (Genesis s83309) (Genesis s84608) (Genesis s83116) (Genesis s83082) (Genesis s81615) (Genesis s81616) (Genesis s81881) ;
SUBSTITUTE (N) (Q) MislabeledAsNarrative ;
LIST UnknownShouldBeNarrative = (Genesis w2137) ;
SUBSTITUTE (?) (N) UnknownShouldBeNarrative ;
SUBSTITUTE (infc) (infa) (Ruth w797) ;
ADD (m) Noun - AGen IF (0 Masculine OR MasculineMixed) ;
ADD (f) Noun - AGen IF (0 FeminineMixed) ;
####################
# Nested Quotations
####################
LIST DoubleQuoteGen = s80831 s80834 s80836 s80837 s80886 s81424 s81443 s81543 s81737 s81766 s81767 s81785 s81829 s81933 s81999 s82001 s82028 s82037 s82159 s82295 s82315 s82367 s82380 s82382 s82410 s82412 s82413 s82446 s82450 s82599 s82626 s82629 s82776 s82946 s83252 s83255 s83285 s83303 s83318 s83319 s83327 s83431 s83432 s83449 s83459 s83470 s83474 s83479 s83480 s83482 s83510 s83626 s83628 s83906 s83919 s84071 s84283 s84313 s84382 s84435 s84464 s84492 s84537 s84545 s84551 s84552 s84555 s84638 s84673 s84681 s84708 s84709 s84719 s84722 s84765 s84804 s84805 s84828 s84934 s84941 s84943 s85134 s85229 s85230 s85261 s85262
c29820 ; # TODO: handle rela:Objc properly
LIST DoubleQuoteRuth = s5648 s5649 s5720 s5825 ;
SET DoubleQuote = (Genesis) + DoubleQuoteGen OR (Ruth) + DoubleQuoteRuth ;
SUBSTITUTE (Q) (QQ) DoubleQuote ;
ADD NQ (*) - QuoteLevel - BD ;
####################
# MWE names
####################
SUBSTITUTE (nmpr a) (subs c m retag:nmpr) ("בית" wp1) ;
SUBSTITUTE (nmpr a) (subs c m retag:nmpr) ("בן" wp1) ;
SUBSTITUTE (nmpr) (subs retag:nmpr m) ("אל" wp2) ;
SUBSTITUTE (nmpr) (subs retag:nmpr) ("לחם" wp2) ;
SUBSTITUTE (nmpr) (subs retag:nmpr) ("צדק" wp2) ;
SUBSTITUTE ("מלכי" nmpr) ("מלך" subs c retag:nmpr) (wp1 Genesis w6557) ;
SUBSTITUTE ("עמי" nmpr) ("עם" subs retag:nmpr has_prn) ("עמי" wp2) ;
SUBSTITUTE ("אוני" nmpr) ("און" subs retag:nmpr has_prn) ("אוני" wp2) ;
ADDCOHORT ("<prn>" "אני" prn p1 sg) AFTER ("עם" subs retag:nmpr) ;
ADDCOHORT ("<prn>" "אני" prn p1 sg) AFTER ("און" subs retag:nmpr) ;
MAP @flat:name (nmpr wp2) IF (-1 (nmpr wp1)) ;
SETPARENT @flat:name TO (-1* (nmpr wp1)) ;
####################
# MWE conjunctions
####################
WITH ("אם" conj) OR ("כי" conj) IF (-1 ("עד" prep)) {
SETPARENT (*) TO (jC1 (*)) ;
MAP @fixed (*) ;
SUBSTITUTE (prep) (conj retag:prep) _C1_ ;
} ;
####################
# Retagging
####################
# quotation
MERGECOHORTS ("<le'emor>" "$2$1"v SCONJ *) ("(אמר)"r verb infc) - ActuallyInf WITH (-1 ("(ל)"r prep)) ;
# Substantivized adjectives
SUBSTITUTE (adjv) (subs retag:adjv) (c) ;
SUBSTITUTE (adjv) (subs retag:adjv) (a) (1 BD) (-1* Noun + (c) BARRIER (*) - Det) ;
SUBSTITUTE (adjv) (subs retag:adjv) (adjv a) (1 (prn)) ;
# TODO: does this really apply to all gentillics?
SUBSTITUTE (adjv) (subs retag:adjv) (adjv gntl pl) ;
SUBSTITUTE (adjv) (subs retag:adjv) (adjv gntl) (-1* Noun + (c) BARRIER (*) - Det) ;
SUBSTITUTE (adjv) (subs retag:adjv) (adjv gntl) (NEGATE 0* (subs) - (retag:adjv gntl) OR (nmpr) BARRIER PB) ;
# Participles in smixut
SUBSTITUTE (verb) (subs retag:verb) Participle + NPish ;
# Adverbs tagged subs
SET AdvOk = (*) - (prn ModS) - ("מאד" padv) ;
SUBSTITUTE (subs) (advb retag:subs) (padv) - (NP) (-1* BD BARRIER AdvOk) (1* BD BARRIER AdvOk) ;
# Determiner on clause participles
SUBSTITUTE (art) (conj retag:art) (CP Rela) ;
# Prepositions tagged as nouns
SUBSTITUTE (subs) (conj retag:subs) ConjAbleSubsPrep + (CP) ;
SUBSTITUTE (subs) (advb retag:subs) ("אחר" subs ppre AdvP) (1 BD) ;
SUBSTITUTE (subs) (prep retag:subs) SubsToPrep + (subs ppre) ;
SUBSTITUTE (subs) (prep retag:subs) (ppre CP Conj)
IF (NOT 0 SubsOverride)
(NEGATE 0 ("טרם" subs) LINK -1 ("ב" prep))
(NEGATE 0 ("בלי" subs CP) LINK -1* ("על" prep) BARRIER PB) ;
SUBSTITUTE (prep) (conj retag:prep) ConjAblePrep + (CP)
IF (NOT 1 ("אשׁר" conj)) ;
# yesh and ein
SUBSTITUTE (subs) (verb retag:subs ClauseRoot) (nmcp) ;
# interrogative adverbs
SUBSTITUTE (inrg) (advb retag:inrg) ItgAdv ;
####################
# Helper labels
####################
ADD (NonAcc) ("את" prep Cmpl) + $$ClauseType - (NonAcc)
IF (0* ("את" prep Objc) + $$ClauseType BARRIER SB) ;
ADD PPHead PPHeadOverride - PPHead ;
SUBSTITUTE (ClausePhraseRoot) (WhyAreVocativesTheirOwnClause) VoctNonCROverride ;
SUBSTITUTE (ClausePhraseRoot) (WhyAreVocativesTheirOwnClause) (Voct) IF (0* (ClausePhraseRoot) - (Voct) BARRIER SB) ;
ADD (ClausePhraseRoot) ("חלילה" intj) - (ClausePhraseRoot) ;
SUBSTITUTE (ClausePhraseRoot) (InterjectionOverride) (!intj)
IF (0* ("חלילה" intj) BARRIER CB) ;
ADD (skipconj) DontConjTo - (skipconj) ;
ADD HasConj HasConjOverride - HasConj ;
####################
# Consistent labels
####################
MAP @det Det ;
MAP @mark SCONJ + (conj CP) ;
MAP @mark ("ה" inrg) ;
MAP @obj ("את") + Pr IF (1 RelMark) ;
MAP @obl Pr IF (1 RelMark) ;
MAP @case Pr ;
MAP @cc (conj) - (Rela) ;
MAP @advmod ADV - (ClausePhraseRoot) - PPHead ;
MAP @advmod ADV + (MSyn) ;
MAP @advmod ADV + (ClausePhraseRoot) IF (0* PRON BARRIER BD) ;
MAP @advmod ("למה" inrg) ;
MAP @discourse (intj) - (ClausePhraseRoot) ; # TODO: is there a better way to handle הנה?
####################
# Pronoun suffixes
####################
SUBSTITUTE ("prn") ("אני") ("prn" prn p1 sg) ;
SUBSTITUTE ("prn") ("אנחנו") ("prn" prn p1 pl) ;
SUBSTITUTE ("prn") ("אתה") ("prn" prn p2 m sg) ;
SUBSTITUTE ("prn") ("את") ("prn" prn p2 f sg) ;
SUBSTITUTE ("prn") ("אתם") ("prn" prn p2 m pl) ;
SUBSTITUTE ("prn") ("אתן") ("prn" prn p2 f pl) ;
SUBSTITUTE ("prn") ("הוא") ("prn" prn p3 m sg) ;
SUBSTITUTE ("prn") ("היא") ("prn" prn p3 f sg) ;
SUBSTITUTE ("prn") ("הם") ("prn" prn p3 m pl) ;
SUBSTITUTE ("prn") ("הן") ("prn" prn p3 f pl) ;
########################################
# PHRASES
########################################
SECTION
####################
# Pronoun suffixes
####################
MAP @nsubj (prn) + NsubjPrn ;
MAP @obj (prn) + ObjPrn ;
MAP (NPHead @obj) (prn Objc) IF (-1 Pr + ("את") - etNotAcc) ;
SETPARENT (prn @obj) OR (prn @nsubj) (NOT p (*)) TO (-1 (verb) OR (intj ClausePhraseRoot)) ;
WITH (prn) - DepLabel IF (-1 Noun - (verb)) (NOT p (*)) {
MAP @nmod (*) IF (jC1 Number) ;
MAP @nmod:poss (*) ;
SETPARENT (*) TO (jC1 (*)) ;
} ;
####################
# Determiners
####################
SETPARENT Det TO (1 DetAble) ;
MAP @det PrnMaybeDet IF (-1 Det LINK -1 Noun) ;
SETPARENT @det TO (-1* Noun BARRIER (*) - Det) ;
MAP @det PrnMaybeDet IF (-1 Number) ;
SETPARENT @det + PrnMaybeDet TO (-1 Number) ;
REMCOHORT IGNORED WITHCHILD (*) @det ;
####################
# Numbers
####################
WITH BigNumber + Number - DepLabel IF (-1 Number) (NOT p (*)) {
MAP @flat (*) ;
SETPARENT (*) TO (jC1 (*)) ;
REMCOHORT IGNORED (*) ;
} ;
WITH Number - DepLabel IF (-1 @cc) (-2 Number) (NOT p (*)) {
MAP @conj (*) ;
SETCHILD (*) TO (jC1 (*)) ;
SETPARENT (*) TO (-1* Number) ; # TODO: this doesn't run if we put jC2
REMCOHORT IGNORED WITHCHILD (*) (*) ;
} ;
SETPARENT Number + (c) TO (1 Noun - Number) ;
SETPARENT Number (-1 Noun + (c)) TO (1 Noun) ;
SETPARENT Number TO (-1 Noun - Number) ;
SETPARENT Number
TO (1* Noun - Number OR NumberedOverride BARRIER (*) - Number - @cc) ;
SETPARENT Number
TO (0* Noun - Number BARRIER (*) - Number - @cc) ;
MAP @nummod Number IF (p Noun OR (prn) OR NumberedOverride) (NEGATE c @nmod) ;
####################
# Smixut
####################
# conjunction within smixut
# (kinda weird, but arg structure doesn't make sense otherwise)
WITH $$Lemma + (subs) - DepLabel
IF (-1* (*) LINK 0 @cc LINK -1* (*) - (prn) LINK 0 $$Lemma + (subs))
(NOT p (*))
(NEGATE 1* PrnNmodToSublist BARRIER BD)
{
MAP @conj (*) ;
SETPARENT (*) TO (jC1 (*)) ;
} ;
SETPARENT @cc TO (1 (subs @conj)) ;
MAP @compound:smixut Noun OR ADJ OR (prin) IF (-1* Noun + (c) - Number BARRIER (*) - @nummod - @cc - (card @conj)) ;
SETPARENT @compound:smixut TO (-1* Noun - @nummod) ;
####################
# Adjectives
####################
WITH (nega) IF (1 ADJ) {
SETPARENT (*) TO (jC1 (*)) ;
REMCOHORT IGNORED (*) ;
} ;
MAP @conj ADJ IF (-1 @cc) (-2 ADJ) ;
MAP @conj ADJ IF (-1 ADJ) (1 @cc) (2 ADJ) ;
SETPARENT ADJ + @conj
TO (-1* ADJ - @conj BARRIER (*) - @cc) ;
SETPARENT @cc (-1 ADJ) TO (1 ADJ) ;
SETPARENT ADJ + $$AGen + $$ANum + $$ADet
TO (-1* Noun + $$AGen + $$ANum + $$ADet BARRIER PB OR Pr) ;
SETPARENT ADJ + $$ANum + $$ADet
TO (-1* Noun + $$ANum + $$ADet - AGen BARRIER PB OR Pr) ;
MAP @amod ADJ IF (p Noun) ;
UNMAP @advmod IF (NOT 0 (MSyn)) (NEGATE 0* BetterHeads BARRIER SB) ;
ADD CR AdvIsh - CR ;
SETPARENT ("מאד" @advmod) TO (-1 ADV) ;
####################
# Prepositions
####################
SETPARENT @case TO (1* CaseAble BARRIER (*) - AfterPrep) ;
SETPARENT @case TO (1*A ADJ BARRIER (*) - AfterPrep LINK NOT p (*)) ;
####################
# Weird List Behavior
####################
MAP (@nmod prn_sub) (prn) IF (c PrnNmodToSublist) ;
SETPARENT (@nmod prn_sub) TO (-1* ConjHeadOverride BARRIER PB) ;
SETPARENT (@nmod prn_sub)
TO (-1* BD LINK 1* @cc LINK 1* Noun BARRIER (*) - Pr) ;
ADD (conjhead) ConjHeadOverride IF (NOT 0 (conjhead)) ;
ADD (conjhead) (*) - (conjhead) IF (c (@nmod prn_sub)) ;
####################
# Label NP heads
####################
ADD PPHead Noun OR PRON OR ADJ OR ADV IF (NOT p (*)) (NOT 0 PPHead) (c @case - ("את") OR etNotAcc) ;
ADD NPHead Noun OR PRON OR ADJ IF (NOT p (*)) (NOT 0 PPHead OR NPHead) ;
####################
# NP/PP conjunctions
####################
SETPARENT REPEAT @cc TO (1* NPHead OR PPHead BARRIER PB) ;
ADD REPEAT HasConj NPHead OR PPHead IF (NOT 0 HasConj) (c @cc) ;
####################
# NP/PP adverbs
####################
SETPARENT @advmod + NPIsh TO (1* NPHead OR PPHead OR ADJ BARRIER PB) ;
####################
# Apposition
####################
MAP @nmod (*) IF (c NmodOverridePrep) ;
MAP @conj GeneologyTitle IF (-1* GeneologyTitle BARRIER SB) ;
SETPARENT GeneologyTitle + @conj TO (-1* GeneologyTitle - @conj) ;
MAP REPEAT @appos NPHead - HasConj - (nmpr) IF (-1* NPHead OR PPHead BARRIER BD) ;
MAP REPEAT @appos NPHead - HasConj + (nmpr) IF (-1* NPHead + Titles BARRIER BD OR NPHead OR PPHead) ;
####################
# VP
####################
MAP @obl NegObl IF (1 (infc)) ;
SETPARENT NegObl TO (1 (infc)) ;
MAP @acl (verb infc VP) IF (-1 (subs c) - NegObl) ;
SETPARENT (verb infc VP @acl) TO (-1 (subs c)) ;
WITH (infa) IF (-1 @cc) (-2 (infa)) {
MAP @advcl _C2_ IF (NOT 0 (ClausePhraseRoot)) ;
MAP @conj (*) ;
SETCHILD (*) TO (jC1 (*)) ;
SETPARENT (*) TO (-2 _C2_) ; #(jC2 (*)) ;
REMCOHORT IGNORED WITHCHILD (*) (*) ;
} ;
####################
# Connect NPs
####################
MAP REPEAT @conj PPHead + HasConj + (/^\(ph\\d+\)$/r)
IF (-1* PPHead + (VSTR:$1)) ;
MAP REPEAT @conj PPHead IF (-1* PPHead BARRIER BD OR NonAppos)
(1* PPHead + HasConj BARRIER BD OR NonAppos) ;
SECTION
SETPARENT PPHead + @conj
TO (-1* PPHead - @conj BARRIER BD OR NonAppos) ;
SECTION
# TODO: any better way to do this?
SETPARENT (w189 Genesis) TO (-1* (w185)) ;
SETPARENT (Genesis w3459) TO (-1* NPHead - (verb)) ;
SETPARENT (Genesis w14323) TO (-1* (prn)) ;
SETPARENT (Genesis w4544) OR (Genesis w2674) OR (Genesis w7425)
TO (-1* (subs)) ;
MAP @conj (Genesis w2674) OR (Genesis w6219) ;
SETPARENT (Genesis w2671) OR (Genesis w2672)
TO (1* (Genesis w2674)) ;
SETPARENT (Genesis w6219) OR (Genesis w6222) OR (Genesis w6226)
TO (-1* (Genesis w6216)) ;
MAP @appos ApposOverride;
SETPARENT CaseAble + ConjToAppos TO (-1* @appos) ;
SETPARENT CaseAble + ConjToSmixut TO (-1* @compound:smixut) ;
MAP REPEAT @conj NPHead + HasConj + (/^\(ph\\d+\)$/r)
IF (-1* NPHead + (VSTR:$1)) ;
MAP @conj NPHead IF (-1* NonAppos BARRIER BD) (1* NPHead + HasConj BARRIER BD) ;
SETPARENT NPHead + @conj + (/^\(ph\\d+\)$/r)
TO (-1* (conjhead VSTR:$1) OR NonAppos - @conj + (VSTR:$1)) ;
SETPARENT ApposToConjHead TO (-1* (conjhead)) ;
SETPARENT FamilyOrTitle + (subs) - FamilyOrTitleSkip + $$AGen
TO (-1* (nmpr a) - (topo) - @flat:name + $$AGen BARRIER (*) - @flat:name) ;
SETPARENT (nmpr) TO (-1* FamilyOrTitle BARRIER (*) - (prn)) ;
SETPARENT ApposOverAcl + (/^\(ph\\d+\)$/r)
TO (-1* ApposAble + (VSTR:$1)) ;
SETPARENT ApposOverAcl
TO (-1* (rela:Attr) LINK -1* CB LINK -1* ApposAble) ;
SETPARENT CaseAble + ApposToLast TO (-1* ApposAble) ;
SETPARENT (prn) (c Pr + ApposToLast) TO (-1* ApposAble) ;
SETPARENT CaseAble - ApposToLast - ConjToAppos - (prn ModS)
TO (-1* BD LINK 1*A CaseAble - @compound:smixut BARRIER BD LINK NOT p (*)) ;
MAP @conj CaseAble IF (c @cc) (p CaseAble) ;
MAP KEEPORDER @appos CaseAble IF (c @case + $$Lemma) (p CaseAble LINK c @case + $$Lemma) ;
MAP @nmod CaseAble IF (c @case - ("את")) (p CaseAble) ;
MAP @appos CaseAble - (verb infc) IF (p CaseAble - CR) ;
SETPARENT PPHead TO (-1* NPHead BARRIER PB) ;
MAP @nmod PPHead IF (p NPHead OR PPHead) ;
SETPARENT NPHead + @appos TO (-1* NorP - @appos BARRIER BD) ;
SETPARENT UNSAFE (nmpr @appos) TO (p ("אלהים") LINK c (@compound:smixut)) ;
####################
# Other labels
####################
MAP @cop (vbcp) + $$ClauseType OR (aux nmcp) IF (0* (PreC) + $$ClauseType BARRIER SB) ;
SETPARENT @cop + $$ClauseType TO (0* (PreC) + $$ClauseType + NorP - @conj BARRIER SB) ;
SECTION # conjunction
SETPARENT (conj PP) TO (1* (subs PP)) ;
MAP @conj (subs PP) - (PreC) - CR IF (0 (subs) LINK c @cc) (NOT c @cop) ;
SETPARENT (subs PPHead @conj /^\(ph\\d+\)$/r) - CR
TO (-1* CaseAble + (VSTR:$1) - @conj - @compound:smixut) ;
SETPARENT (subs PPHead @conj) - CR TO (-1* (subs PP) - @conj - @compound:smixut) ;
SETPARENT (conj NP) TO (1* (subs NP)) ;
SECTION # helper labels
TEMPLATE CRp = (NOT 0 CR LINK NEGATE 0* CR BARRIER CB) ;
ADD CR (ClausePhraseRoot) - CR + (/^(c\\d+\)$/r) - QMark IF (NEGATE -1* (VSTR:$1) + CR) ;
# irregular conjunction attachment
SETPARENT ConjSkipClause TO (1* CR LINK 1* CR) ;
####################
# Blah
####################
SETPARENT (Genesis w1251) TO (-1* CR LINK -1* CR) ;
SETPARENT (Genesis w1256) TO (-1* CR) ;
SETPARENT (Genesis w21545) TO (-1* NPHead) ;
SETPARENT (Genesis w8857) TO (-1* (Genesis w8839)) ;
MAP @nmod (Genesis w21545) ;
SETPARENT (Genesis w11587) TO (-1* (w11585)) ;
####################
# Attach by clause label
####################
SETPARENT (/^\(c\\d+\)$/r) - CR - NoGlom TO (0* (VSTR:$1) + CR) ;
MAP @obl ActuallyObl ;
MAP @nsubj SubjIsh - CR IF (p CR LINK NEGATE c @nsubj) ;
MAP @dislocated (Subj) - CR IF (p CR) ;
MAP @obj (Objc) - CR - (Ellp) IF (p CR LINK NEGATE c @obj) ;
MAP @xcomp (Objc) - CR - (Ellp) OR (PrAd) - CR IF (p CR) ;
MAP @obj (ProbablyObj InrP) - CR - (Ellp) IF (p CR LINK NEGATE c @obj) ;
MAP @advcl (infa AdvP) IF (NEGATE 1* (*) LINK 0 BD) (NEGATE c @cop) ;
MAP @obl:npmod (verb infa) + $$Lemma - CR IF (p CR + $$Lemma) ;
MAP @advmod (verb infa AdvP) - CR IF (p NPHead) ;
MAP @orphan OblIsh + (Ellp) - CR OR (Objc Ellp) - CR IF (p CR + (Ellp)) ;
MAP @obl OblIsh - CR IF (p CR) ;
ADD CR (Pred) - (vbcp) - CR - QMark ;
ADD CR PredIsh IF (T:CRp) ;
ADD CR CopIsh - NonCopIsh IF (T:CRp) ;
ADD (PrepVerb) (verb) - (PrepVerb) - OrphanPrepVerb IF (c @case OR ("בלת" @obl)) ;
ADD (PrepVerb) (*) - (PrepVerb) IF (c @cop LINK c @case) ;
SECTION # clause con
ADD HasRel CR - HasRel - NonRelOverride IF (c @mark + (Rela) OR RelMark) ;
ADD HasConj CR - HasConj IF (c @cc) ;
ADD HasMark CR - HasMark + (infc) IF (c @case) ;
ADD HasMark CR + (PrepVerb) - HasMark ;
ADD HasMark CR - HasMark - HasRel - NonMarkOverride IF (c @mark - (inrg ques) - QMark - (Rela) - RelMark - NonMarkingSCONJ) ;
ADD HasMark CR + MarkOverride - HasMark ;
SECTION
SETCHILD REPEAT CR + (/^par:\(c\\d+\)$/r rela:PreC) - ActuallyCsubj
TO (-1*A CR + (VSTR:$1 Subj) LINK NOT p (*)) ;
MAP REPEAT @nsubj:outer CR + (Subj) IF (p CR + (rela:PreC)) ;
MAP @ccomp ActuallyCcomp ;
MAP @advcl ActuallyAdvcl ;
MAP @parataxis ActuallyParataxis ;
SETPARENT CR TO (c RelMark LINK -1 Pr) ;
MAP @acl CR IF (p Pr) ;
SETPARENT Pr + (/^par:\(c\\d+\)$/r) (c CR) TO (0* CR + (VSTR:$1)) ;
SETPARENT CR + (/^par:\(c\\d+\)$/r) TO (0* CR + (VSTR:$1)) ;
SETPARENT UNSAFE CR + (rela:Coor) (NOT p Pr) TO (p (rela:Coor) LINK p (*)) ;
MAP @xcomp CR + (rela:Objc) IF (p CR + ObjcXcomp) ;
MAP @xcomp CR + (rela:Adju) IF (p CR + AdjuXcomp) ;
MAP @parataxis CR + (rela:Adju Ellp Subj) IF (p CR) ;
MAP @acl CR + (rela:Adju) - (PrepVerb) IF (p CR + (subs)) ;
MAP @appos CR + (rela:Coor) - HasConj IF (p CR) (NEGATE 0* (ClauseRoot rela:Coor HasConj) BARRIER SB) ;
MAP @advcl CR IF (-1* CR) (c AdvclObl) ;
MAP @ccomp CR + (rela:Objc) IF (p CR) ;
MAP @advcl CR + (rela:Adju) IF (p CR) ;
MAP @conj CR + (rela:Coor) IF (p CR) ;
MAP @csubj CR + (rela:Subj) IF (p CR) ;
SECTION
SETPARENT (HasMark HasConj)
TO (-1* HasMark - HasConj BARRIER PlainC) ;
MAP @conj (HasMark HasConj) - NestMark IF (p HasMark) ;
SETPARENT (verb) + Ptc - QMark - NonAclOverride
TO (-1* Noun - @compound:smixut BARRIER (*) - BD - @compound:smixut) ;
MAP @acl (verb) + Ptc - QMark IF (p Noun) ;
MAP @xcomp (verb infc InfC) - QMark IF (-1* XcompInf + (verb) BARRIER SB OR @mark) ;
SETPARENT (@xcomp InfC) TO (-1* XcompInf + (verb) BARRIER SB) ;
WITH (vbcp) - DepLabel
IF (1* Participle OR (infc) BARRIER (*) - BD - ("ל" prep))
{
MAP @cop (*) ;
SETPARENT (*) TO (jC1 (*)) ;
} ;
MAP @xcomp Participle - (Subj) - HasRel IF (-1* (verb nmcp) BARRIER SB) ;
SETPARENT @advcl OR @xcomp TO (-1* (verb nmcp) BARRIER SB) ;
SECTION
SETPARENT NestMark TO (0* CR + HasMark) ;
SETPARENT PreMark TO (1* CR - HasMark) ;
SETPARENT PostMark + $$QuoteLevel TO (-1* CR + $$QuoteLevel - HasMark - HasRel) ;
SETPARENT HasMark
TO (0* PlainC - @csubj - (rela:Subj) BARRIER CR - HasMark - HasRel OR SB OR ("ה" inrg)) ;
MAP @csubj CR + (rela:Cmpl) IF (p ("חלילה" intj)) ;
SETPARENT QMark
TO (1* (FullClauseRoot Q) OR (FullClauseRoot QQ)) ;
SETPARENT CR + $$Domain - SpecialMark - HasRel (c AdvclAble)
TO (-1* PlainC + $$Domain BARRIER Domain - $$Domain) ;
SETPARENT (verb infc) + $$Domain - QMark (NEGATE c @cc)
TO (-1* CR + $$Domain - @csubj - (rela:Subj) BARRIER Domain - $$Domain) ;
MAP @acl ActuallyAcl ;
MAP @advcl CR IF (c AdvclAble) (p AdvclMarkVerb) ;
MAP @xcomp CR IF (c AdvclAble) (p XcompVerb) ;
MAP @ccomp CR IF (c AdvclAble) (p CcompVerb) ;
MAP @advcl CR IF (c AdvclAble) (p (*)) ;
MAP @advcl (PrepVerb) IF (p (*)) ;
MAP @advcl CR + HasMark - OrphanInfc IF (p CR) ;
SETPARENT @ccomp TO (0* CcompVerb BARRIER SB) ;
ADD FullClauseRoot PlainC - @acl - FullClauseRoot - NonFCROverride ;
SECTION
SETPARENT FullClauseRoot + HasConj + $$Domain
TO (-1* FullClauseRoot - HasConj + $$Domain - FCRSkip - ParenSent BARRIER FullClauseRoot - $$Domain - ParenSent) ;
MAP @conj FullClauseRoot + HasConj IF (p FullClauseRoot) ;
SECTION # adjacent words
MAP @nsubj SmallQstQ - CR IF (-1 BD) (1 SmallQstPrn LINK 1 BD) ;
SECTION # phrase-internal structure
MAP @acl (ClauseRoot AjCl) - AdjNonAcl
IF (-1* CB BARRIER SB OR @mark LINK -1* NPHead BARRIER BD) ;
####################
# Label verb arguments
####################
SECTION
### SUBJECTS
WITH SubjAble + (Subj NmCl ClausePhraseRoot) - DepLabel
IF (1* CR + HasRel BARRIER CR)
{
MAP @nsubj (*) ;
SETPARENT (*) TO (jC1 (*)) ;
} ;
MAP @dislocated CR + (rela:Subj) IF (1* (prps Subj rela:Resu)) ;
MAP @csubj CsubjOverride ;
SETPARENT @csubj OR CR + @dislocated TO (0* CR BARRIER SB) ;
### OBJECTS
LIST AddProbObj = Objc InrP !ProbablyObj ;
ADD REPEAT (ProbablyObj) ObjAble + AddProbObj ;
MAP @xcomp XcompOverride ;
### OBLIQUES
MAP @obl PPHead + (PreC) IF (-1* (nmcp) BARRIER SB) ;
MAP @obl (PreC) - CR ;
MAP @vocative Noun + (Voct) - CR ;
####################
# Attach verb arguments
####################
SECTION
SETPARENT CR + (rela:Attr /^par:\(w\\d+\)$/r) TO (-1* (VSTR:$1)) ;
MAP (@conj rel_conj) (ClauseRoot NmCl rela:Coor) IF (-1* RelMark BARRIER CB) ;
MAP @acl (ClauseRoot NmCl) IF (-1* RelMark BARRIER CB) ;
MAP @acl CR + (rela:Attr) IF (c RelMark) (p (*)) ;
SETPARENT @acl + AclChain TO (-1* @acl LINK p (*)) ;
SETPARENT (subs @acl) - AclChain TO (-1* Noun - (verb) - @flat:name OR Pr + @obj OR Pr + @obl) ;
SETPARENT @acl + RelToPrn TO (c RelMark LINK -1* (prn)) ;
SETPARENT @acl OR CR + @conj + (rela:Coor rel_conj)
TO (-1* NorP - RelSkip BARRIER SB) ;
SECTION
SETPARENT VerbArgs + $$ClauseType - Pr
TO (0* CR + $$ClauseType BARRIER SB) ;
SECTION
SETPARENT (conj CP) TO (1 PB LINK 1 @cop LINK p (*)) ;
MAP @acl CR - NonAclOverride
IF (c RelMark) (NEGATE c (@nsubj NmCl)) (NEGATE c @nsubj:outer) ;
SETPARENT @acl TO (-1* AclMultiTarget BARRIER SB) ;
SETPARENT @acl TO (c @mark LINK -1 Pr) ;
SETPARENT @acl + AclCompNotOk
TO (-1* CB LINK -1* AclAble - @compound:smixut BARRIER BD) ;
SETPARENT @acl - AclCompNotOk - AclChain
TO (-1* CB LINK -1* AclAble - @nummod - @amod BARRIER BD) ;
SETPARENT UNSAFE (verb /^par:\(ph\\d+\)$/r) + Ptc (p (*) - (VSTR:$1)) TO (-1* NPHead + (VSTR:$1)) ;
MAP @ccomp QMark IF (NEGATE 1* CR) ;
MAP @mark QMark ;
SECTION
SETPARENT CR TO (c RelMark LINK -1* CB BARRIER Pr LINK -1* NorP BARRIER PB) ;
MAP @acl CR IF (p NorP) (c RelMark) ;
SETPARENT XorO + $$ClauseType
TO (0* CR + $$ClauseType BARRIER SB) ;
SECTION
SETPARENT CorR + ConjTypes + @mark TO (1* CorM - @acl) ;
MAP @advcl (ClauseRoot Q HasMark)
IF (c @mark - (inrg ques) - QMark) (1* (ClauseRoot Q) BARRIER NonQuote LINK NEGATE c @mark) ;
SETPARENT MSynIsh + ConjTypes TO (1* CorM - @advcl - @acl) ;
MAP @conj (ClauseRoot Q)
IF (c @cc) (-1* (ClauseRoot Q) - @acl - @advcl - @xcomp - HasMark BARRIER (N)) ;
MAP @parataxis (ClauseRoot Q) - (infc) - HasMark - HasConj
IF (NEGATE c @cc) (NEGATE c @mark)
(-1* (ClauseRoot Q) - @acl - @advcl - @csubj - (HasMark @conj) BARRIER (N)) ;
MAP @ccomp (ClauseRoot Q)
IF (NEGATE c @mark) (-1* CR + NonQuote)
(NOT -1* (ClauseRoot Q) - @acl BARRIER NonQuote) ;
SETPARENT (ClauseRoot Q HasConj) - HasMark
TO (-1* PlainNC + (Q) BARRIER CR + NonQuote) ;
SETPARENT (ClauseRoot Q @conj)
TO (-1* (ClauseRoot Q) + CRconj) ;
MAP @root CR IF (NOT -1* CR - @advcl - @acl - @csubj) ;
SETPARENT @advcl + $$Domain (NEGATE 0* CR BARRIER SB) TO (1* CR + $$Domain - @advcl) ;
SETPARENT (@ccomp Q) + QuoteSkipAcl TO (-1* CR - @mark - @acl) ;
SETPARENT (@ccomp Q) TO (-1* (quot ClauseRoot) - @mark) ;
SETPARENT @ccomp TO (-1* CcompAble + CR) ;
SETPARENT CR + (rela:Attr) - AttrSkipAcl TO (-1* CB LINK -1* ApposAble) ;
MAP @acl CR + (rela:Attr) IF (p ApposAble) ;
MAP (@conj ClauseRoot) CR + $$NonQuote IF (-1* CR + $$NonQuote) (c @cc) ;
MAP (@parataxis ClauseRoot) CR + $$NonQuote - (PrepVerb) IF (-1* CR + $$NonQuote) ;
SETPARENT ConjToAdvcl TO (-1* CR + @advcl) ;
SETPARENT CR + ClauseCon + $$Domain
TO (-1* CR + $$Domain - DontConj - ParenSent) ;
SECTION
MAP @dislocated SubjAble + (CPen) ;
SETPARENT (@dislocated Frnt) TO (-1* @mark BARRIER (*) - BD LINK p (*)) ;
SETPARENT (@dislocated Frnt) + $$Domain TO (1* CR + $$Domain - @advcl) ;
SECTION
MAP @obl PPHead - CR ;
SETPARENT Pr + VerbArgs TO (-1* (verb) BARRIER SB) ;
SETPARENT Pr + VerbArgs TO (1* (verb) BARRIER SB) ;
SETPARENT Pr + VerbArgs TO (-1* (verb)) ;
SETPARENT VerbArgs
TO (c @acl LINK 1* CB LINK 1* CR BARRIER CB OR SB) ;
SETPARENT @mark TO (1* CR) ;
SECTION
SETPARENT UNSAFE @root TO (@0 (*)) ;
SETPARENT @vocative + (Q) TO (0* CR + (Q) BARRIER SB) ;
SETPARENT @vocative + $$Domain TO (0* CR + $$Domain) ;
SETPARENT @vocative TO (-1* CR) ;
SETPARENT @discourse
TO (1* @nsubj BARRIER (*) - BD LINK p (*)) ;
SECTION
SETPARENT ParenSent TO (-1* NPHead OR PPHead) ;
SETPARENT CR + (Q) + @advcl TO (0* CR + (Q) - @xcomp - @advcl BARRIER CR - (Q)) ;
SETPARENT CR + (Q) TO (-1* SpeakingVerb + (verb N) - QMark BARRIER PlainC + (N) - QMark OR PlainC + (Q)) ;
SETPARENT CR + (Q) (c QMark) TO (-1* PlainC + (N)) ;