-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathlassy_stats.py
6002 lines (5987 loc) · 378 KB
/
lassy_stats.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
mcatcat= {('np', 'conj'): 2648, ('smain', 'pp'): 12294, ('oti',
'ti'): 2264, ('ap', 'oti'): 103, ('du', 'vz'): 3, ('du', 'adj'):
114, ('oti', 'adj'): 1, ('ti', 'conj'): 7, ('du', 'vg'): 761,
('pp', 'ap'): 40, ('conj', 'vg'): 16972, ('ppart', 'sv1'): 5,
('ppres', 'mwu'): 10, ('advp', 'du'): 1, ('du', 'whq'): 65, ('top',
'bw'): 22, ('advp', 'ww'): 7, ('mwu', 'lid'): 1717, ('np', 'bw'):
2525, ('cp', 'ap'): 27, ('conj', 'whq'): 24, ('np', 'tsw'): 1,
('ti', 'du'): 2, ('detp', 'ww'): 1, ('whq', 'ppart'): 1, ('smain',
'detp'): 1, ('inf', 'tw'): 16, ('detp', 'bw'): 112, ('inf',
'conj'): 845, ('sv1', 'oti'): 16, ('advp', 'bw'): 1888, ('sv1',
'whrel'): 5, ('conj', 'cp'): 412, ('du', 'spec'): 525, ('whsub',
'ssub'): 456, ('ssub', 'whrel'): 30, ('conj', 'smain'): 7608,
('pp', 'oti'): 58, ('mwu', 'ww'): 516, ('np', 'ppres'): 260,
('top', 'whq'): 279, ('ppart', 'ssub'): 1, ('conj', 'vnw'): 232,
('smain', 'vg'): 12, ('ppart', 'cp'): 1049, ('rel', 'np'): 84,
('whrel', 'ap'): 22, ('whrel', 'vg'): 1, ('du', 'bw'): 323,
('ppart', 'ppres'): 11, ('smain', 'ap'): 1678, ('top', 'adj'): 55,
('pp', 'ppart'): 6, ('detp', 'spec'): 5, ('ppres', 'ppart'): 2,
('sv1', 'cp'): 134, ('whsub', 'vnw'): 160, ('whq', 'sv1'): 349,
('sv1', 'inf'): 224, ('ap', 'ww'): 475, ('ppres', 'vz'): 5,
('svan', 'whq'): 1, ('inf', 'ppres'): 9, ('smain', 'ww'): 31320,
('cp', 'np'): 1387, ('whrel', 'np'): 12, ('np', 'rel'): 5690,
('detp', 'np'): 3, ('conj', 'ssub'): 1327, ('ppart', 'whrel'): 74,
('smain', 'vnw'): 10354, ('top', 'spec'): 316, ('np', 'ap'): 1666,
('pp', 'n'): 10299, ('detp', 'adj'): 140, ('inf', 'ahi'): 3, ('pp',
'whrel'): 127, ('ppres', 'n'): 19, ('oti', 'conj'): 148, ('ppart',
'vnw'): 3762, ('ap', 'vg'): 1, ('top', 'np'): 3094, ('cp',
'ppart'): 22, ('sv1', 'ap'): 50, ('rel', 'du'): 9, ('whsub', 'vg'):
1, ('ppres', 'conj'): 7, ('smain', 'mwu'): 1526, ('detp', 'detp'):
3, ('np', 'ssub'): 2, ('ssub', 'ww'): 13271, ('ssub', 'du'): 10,
('smain', 'vz'): 2021, ('ap', 'mwu'): 341, ('pp', 'mwu'): 4061,
('ppres', 'ww'): 366, ('pp', 'tw'): 2072, ('ap', 'sv1'): 2, ('du',
'ppres'): 5, ('cp', 'cp'): 24, ('cp', 'pp'): 186, ('inf', 'smain'):
13, ('smain', 'tsw'): 6, ('cp', 'bw'): 435, ('du', 'vnw'): 91,
('sv1', 'ppres'): 1, ('sv1', 'pp'): 500, ('ppart', 'oti'): 407,
('inf', 'pp'): 5726, ('advp', 'np'): 99, ('pp', 'advp'): 94,
('ppres', 'ap'): 3, ('top', 'ssub'): 24, ('ppart', 'vg'): 7,
('ppres', 'ti'): 2, ('ssub', 'sv1'): 1, ('rel', 'pp'): 65, ('ssub',
'mwu'): 387, ('rel', 'mwu'): 5, ('cp', 'advp'): 8, ('mwu', 'vz'):
5450, ('smain', 'du'): 25, ('advp', 'n'): 272, ('np', 'oti'): 668,
('smain', 'lid'): 1, ('ap', 'ti'): 68, ('ppart', 'tw'): 18, ('inf',
'spec'): 7, ('du', 'whsub'): 7, ('conj', 'adj'): 2127, ('sv1',
'spec'): 17, ('du', 'conj'): 1042, ('ssub', 'np'): 6755, ('ap',
'smain'): 2, ('conj', 'conj'): 490, ('detp', 'oti'): 11, ('mwu',
'let'): 697, ('detp', 'vnw'): 316, ('rel', 'advp'): 1, ('mwu',
'n'): 10827, ('ap', 'rel'): 1, ('smain', 'sv1'): 9, ('ti', 'ww'):
115, ('whrel', 'sv1'): 6, ('smain', 'advp'): 437, ('mwu', 'vg'):
731, ('top', 'cp'): 63, ('ap', 'ssub'): 2, ('inf', 'vg'): 8,
('sv1', 'bw'): 532, ('inf', 'adj'): 1188, ('oti', 'vz'): 2414,
('conj', 'spec'): 605, ('sv1', 'adj'): 115, ('conj', 'mwu'): 1476,
('du', 'smain'): 4156, ('conj', 'tw'): 907, ('ssub', 'ppart'):
3010, ('ppart', 'whsub'): 30, ('whq', 'ap'): 6, ('smain', 'np'):
25183, ('ssub', 'vz'): 62, ('ppres', 'cp'): 13, ('advp', 'vg'): 5,
('conj', 'whrel'): 32, ('np', 'smain'): 85, ('whq', 'ssub'): 9,
('whrel', 'du'): 5, ('ppres', 'adj'): 116, ('advp', 'cp'): 76,
('conj', 'inf'): 403, ('detp', 'cp'): 56, ('pp', 'rel'): 6, ('sv1',
'smain'): 1, ('ssub', 'ahi'): 13, ('conj', 'oti'): 107, ('rel',
'ppart'): 1, ('top', 'tsw'): 37, ('pp', 'smain'): 1, ('np', 'vnw'):
13527, ('ssub', 'n'): 1336, ('ppart', 'rel'): 14, ('advp', 'pp'):
80, ('conj', 'ti'): 578, ('sv1', 'np'): 767, ('ppart', 'ww'):
11790, ('whq', 'du'): 2, ('advp', 'ap'): 1, ('ssub', 'spec'): 21,
('np', 'np'): 3072, ('pp', 'sv1'): 4, ('conj', 'let'): 7, ('ppres',
'spec'): 2, ('inf', 'vz'): 1041, ('ssub', 'whsub'): 26, ('top',
'lid'): 20, ('ppres', 'oti'): 1, ('conj', 'tsw'): 3, ('du', 'np'):
1831, ('ap', 'cp'): 634, ('top', 'pp'): 152, ('np', 'tw'): 7729,
('ppres', 'advp'): 3, ('du', 'advp'): 42, ('np', 'ti'): 208,
('detp', 'tw'): 239, ('inf', 'ti'): 116, ('np', 'sv1'): 42, ('sv1',
'ti'): 46, ('pp', 'bw'): 1278, ('rel', 'conj'): 279, ('top', 'vz'):
30, ('top', 'oti'): 7, ('ap', 'tw'): 23, ('svan', 'np'): 1, ('top',
'tw'): 459, ('pp', 'whsub'): 19, ('detp', 'vg'): 1, ('du', 'oti'):
23, ('rel', 'vnw'): 4641, ('np', 'adj'): 27434, ('ap', 'n'): 71,
('pp', 'pp'): 290, ('mwu', 'adj'): 2480, ('cp', 'vz'): 1950,
('top', 'ap'): 55, ('inf', 'whsub'): 116, ('smain', 'ahi'): 11,
('np', 'du'): 334, ('whq', 'bw'): 155, ('ssub', 'ap'): 742, ('rel',
'vg'): 3, ('np', 'n'): 98504, ('whsub', 'pp'): 42, ('inf', 'mwu'):
452, ('np', 'lid'): 64122, ('inf', 'sv1'): 7, ('top', 'ppres'): 3,
('smain', 'ppart'): 6061, ('smain', 'ppres'): 64, ('ppart',
'smain'): 9, ('detp', 'rel'): 1, ('cp', 'n'): 569, ('du', 'pp'):
556, ('ahi', 'vz'): 1, ('sv1', 'ww'): 1889, ('mwu', 'spec'): 21459,
('du', 'ppart'): 46, ('top', 'vnw'): 18, ('np', 'whsub'): 17,
('conj', 'ppres'): 27, ('rel', 'sv1'): 1, ('np', 'vz'): 31, ('ap',
'vnw'): 853, ('ssub', 'cp'): 577, ('np', 'ppart'): 872, ('svan',
'vz'): 5, ('np', 'pp'): 30888, ('conj', 'sv1'): 289, ('inf',
'oti'): 284, ('ppart', 'np'): 7130, ('cp', 'du'): 29, ('smain',
'inf'): 3785, ('smain', 'n'): 4399, ('du', 'sv1'): 512, ('whq',
'np'): 43, ('inf', 'du'): 13, ('advp', 'vz'): 11, ('top', 'smain'):
19196, ('ap', 'spec'): 11, ('np', 'whq'): 2, ('oti', 'inf'): 2,
('cp', 'sv1'): 74, ('whq', 'pp'): 13, ('top', 'ti'): 18, ('ppart',
'ppart'): 50, ('smain', 'spec'): 46, ('sv1', 'vz'): 191, ('cp',
'vnw'): 31, ('np', 'cp'): 1250, ('advp', 'spec'): 2, ('whsub',
'du'): 1, ('mwu', 'tw'): 3469, ('smain', 'ssub'): 3, ('du', 'inf'):
41, ('whsub', 'np'): 68, ('top', 'mwu'): 594, ('advp', 'oti'): 28,
('pp', 'vnw'): 1556, ('whsub', 'conj'): 16, ('ap', 'adj'): 5159,
('rel', 'ssub'): 5349, ('ppart', 'vz'): 38, ('advp', 'advp'): 3,
('ppart', 'n'): 1117, ('du', 'ap'): 86, ('np', 'mwu'): 8103, ('ap',
'conj'): 55, ('ppart', 'bw'): 3538, ('np', 'whrel'): 4, ('whsub',
'ap'): 25, ('ppart', 'du'): 11, ('conj', 'ppart'): 449, ('inf',
'np'): 8784, ('smain', 'ti'): 1048, ('smain', 'bw'): 6251, ('conj',
'vz'): 139, ('ap', 'du'): 2, ('pp', 'lid'): 1, ('advp', 'mwu'): 17,
('whrel', 'bw'): 205, ('ap', 'bw'): 2134, ('whrel', 'pp'): 2,
('top', 'conj'): 3812, ('whq', 'tw'): 2, ('top', 'du'): 5583,
('np', 'detp'): 520, ('top', 'advp'): 7, ('ti', 'inf'): 5108,
('cp', 'inf'): 9, ('sv1', 'tw'): 5, ('ssub', 'advp'): 147, ('du',
'ssub'): 18, ('ppart', 'ap'): 460, ('rel', 'inf'): 3, ('ap',
'advp'): 235, ('conj', 'n'): 7603, ('advp', 'vnw'): 255, ('advp',
'conj'): 2, ('ahi', 'inf'): 27, ('ap', 'ppres'): 2, ('ssub', 'ti'):
319, ('mwu', 'bw'): 671, ('pp', 'tsw'): 2, ('whq', 'conj'): 4,
('sv1', 'vg'): 1, ('top', 'sv1'): 577, ('conj', 'detp'): 25, ('np',
'advp'): 71, ('whq', 'vnw'): 149, ('np', 'vg'): 7, ('inf',
'whrel'): 95, ('whsub', 'advp'): 1, ('smain', 'cp'): 3160, ('cp',
'mwu'): 197, ('pp', 'inf'): 2, ('sv1', 'whsub'): 29, ('cp',
'ssub'): 5384, ('np', 'spec'): 1944, ('ppart', 'inf'): 1, ('du',
'tsw'): 57, ('ppres', 'np'): 25, ('advp', 'rel'): 9, ('conj',
'advp'): 37, ('smain', 'oti'): 588, ('sv1', 'n'): 257, ('top',
'ww'): 53, ('cp', 'vg'): 6810, ('ppres', 'vnw'): 35, ('inf', 'n'):
1700, ('whsub', 'ppart'): 2, ('conj', 'lid'): 1, ('whq', 'inf'): 7,
('smain', 'whsub'): 130, ('ssub', 'ppres'): 20, ('ppart', 'pp'):
9980, ('mwu', 'pp'): 1, ('cp', 'tw'): 24, ('pp', 'adj'): 392,
('top', 'rel'): 10, ('smain', 'conj'): 2694, ('whrel', 'vnw'): 413,
('cp', 'ww'): 33, ('whrel', 'ppres'): 1, ('pp', 'conj'): 4587,
('smain', 'smain'): 14, ('whq', 'ti'): 2, ('sv1', 'ppart'): 158,
('whsub', 'tw'): 6, ('whsub', 'ppres'): 1, ('inf', 'ppart'): 1286,
('ppres', 'bw'): 72, ('top', 'whrel'): 5, ('np', 'svan'): 5,
('ssub', 'vnw'): 8993, ('ssub', 'bw'): 2177, ('ppart', 'ti'): 155,
('cp', 'whrel'): 9, ('inf', 'ap'): 441, ('detp', 'mwu'): 137,
('pp', 'spec'): 332, ('whrel', 'conj'): 27, ('detp', 'du'): 2,
('smain', 'tw'): 32, ('sv1', 'conj'): 87, ('ssub', 'conj'): 687,
('detp', 'advp'): 6, ('inf', 'inf'): 834, ('oti', 'bw'): 17,
('inf', 'ww'): 12719, ('whsub', 'bw'): 155, ('du', 'cp'): 338,
('ppart', 'advp'): 226, ('whsub', 'ti'): 2, ('detp', 'n'): 12,
('ap', 'ap'): 154, ('du', 'rel'): 6, ('advp', 'adj'): 226, ('sv1',
'vnw'): 736, ('mwu', 'vnw'): 603, ('conj', 'rel'): 209, ('inf',
'vnw'): 5075, ('ppart', 'mwu'): 555, ('sv1', 'mwu'): 102, ('conj',
'du'): 270, ('inf', 'cp'): 1090, ('ap', 'np'): 423, ('conj', 'bw'):
379, ('du', 'du'): 692, ('advp', 'tw'): 84, ('inf', 'ssub'): 1,
('ppres', 'pp'): 181, ('pp', 'ti'): 103, ('du', 'ww'): 52, ('ssub',
'smain'): 4, ('ssub', 'pp'): 3796, ('conj', 'ww'): 249, ('top',
'ppart'): 51, ('ppart', 'spec'): 13, ('smain', 'whrel'): 268,
('svan', 'inf'): 2, ('advp', 'smain'): 1, ('ssub', 'inf'): 2093,
('ppart', 'conj'): 698, ('cp', 'ti'): 301, ('np', 'ww'): 4491,
('whrel', 'mwu'): 3, ('top', 'whsub'): 14, ('ssub', 'oti'): 143,
('detp', 'vz'): 1, ('sv1', 'du'): 1, ('mwu', 'tsw'): 11, ('ppart',
'adj'): 1654, ('whrel', 'advp'): 1, ('du', 'ti'): 8, ('conj',
'ap'): 470, ('pp', 'vg'): 15, ('ap', 'whsub'): 1, ('inf', 'bw'):
2861, ('ssub', 'adj'): 1063, ('top', 'let'): 69726, ('ti', 'vz'):
5232, ('cp', 'conj'): 768, ('ap', 'pp'): 1635, ('cp', 'smain'): 1,
('top', 'inf'): 83, ('top', 'n'): 1266, ('np', 'let'): 5, ('detp',
'lid'): 27, ('svan', 'n'): 1, ('np', 'inf'): 8, ('conj', 'np'):
13040, ('conj', 'whsub'): 78, ('rel', 'bw'): 982, ('pp', 'vz'):
65376, ('top', 'vg'): 14, ('pp', 'np'): 44495, ('du', 'whrel'): 46,
('pp', 'cp'): 360, ('conj', 'pp'): 2072, ('whrel', 'ssub'): 621,
('smain', 'adj'): 2693, ('ssub', 'vg'): 6, ('cp', 'spec'): 29,
('cp', 'ppres'): 1, ('ppres', 'whsub'): 2, ('du', 'mwu'): 1038,
('oti', 'pp'): 2, ('ap', 'vz'): 21, ('du', 'n'): 1153, ('pp',
'du'): 12, ('du', 'let'): 50, ('sv1', 'advp'): 9, ('ssub', 'tw'):
32, ('inf', 'advp'): 200, ('cp', 'oti'): 5, ('du', 'tw'): 800,
('ssub', 'tsw'): 2, ('inf', 'tsw'): 4, ('pp', 'ww'): 126, ('ahi',
'mwu'): 26, ('cp', 'adj'): 144}
# Cut-off value that goes with the mcatcat pair counts.
# NOTE(review): presumably a minimum-frequency threshold; the code that
# applies it is not in this part of the file -- confirm against its use.
mcatcatTheta = 10

# Manual additions: every pair listed here gets the count mcatcatTheta + 1.
# A pair that already has an entry in the mcatcat literal is overwritten;
# a pair that does not is appended as a new entry.
mcatcat.update(
    dict.fromkeys(
        [
            ('sv1', 'ahi'),
            ('sv1', 'advp'),
            ('sv1', 'ppres'),
            ('top', 'whrel'),
        ],
        mcatcatTheta + 1
    )
)

# Separate cut-off; its consumer is not visible in this section.
catTheta = 10
relposcat= {('crd', 'bw'): 292, ('--', 'mwu'): 594, ('dp', 'ti'):
3, ('--', 'let'): 69726, ('predm', 'n'): 2, ('mod', 'mwu'): 1737,
('--', 'cp'): 63, ('sat', 'np'): 333, ('body', 'n'): 569, ('hd',
'tw'): 1187, ('nucl', 'np'): 410, ('svp', 'adj'): 365, ('mod',
'ti'): 72, ('predc', 'ppart'): 418, ('obj1', 'vz'): 54, ('mod',
'ppart'): 1000, ('predc', 'vg'): 1, ('app', 'n'): 1765, ('cnj',
'advp'): 37, ('cmp', 'vg'): 6809, ('nucl', 'spec'): 15, ('predm',
'advp'): 10, ('dp', 'du'): 272, ('dp', 'pp'): 445, ('mod', 'let'):
1, ('hd', 'vg'): 27, ('svp', 'np'): 1, ('body', 'mwu'): 89, ('cmp',
'conj'): 1, ('predc', 'tsw'): 3, ('mod', 'ww'): 2804, ('obj1',
'vnw'): 5273, ('sat', 'mwu'): 44, ('nucl', 'sv1'): 111, ('su',
'mwu'): 1111, ('body', 'cp'): 23, ('ld', 'adj'): 12, ('mwp',
'let'): 697, ('crd', 'vg'): 16964, ('dp', 'sv1'): 80, ('mod',
'ap'): 2800, ('nucl', 'adj'): 11, ('--', 'conj'): 3812, ('hd',
'lid'): 24, ('sat', 'bw'): 5, ('body', 'smain'): 1, ('cmp', 'mwu'):
128, ('dp', 'vz'): 3, ('sat', 'du'): 146, ('nucl', 'pp'): 42,
('nucl', 'du'): 266, ('crd', 'tw'): 5, ('mwp', 'ww'): 516, ('dp',
'smain'): 1667, ('nucl', 'vg'): 1, ('body', 'ww'): 144, ('--',
'whsub'): 14, ('ld', 'pp'): 3579, ('su', 'advp'): 3, ('cnj', 'tw'):
902, ('mod', 'whrel'): 316, ('crd', 'n'): 1, ('obj2', 'bw'): 5,
('--', 'advp'): 7, ('nucl', 'vnw'): 1, ('--', 'vg'): 14, ('me',
'pp'): 3, ('tag', 'bw'): 34, ('sat', 'ap'): 12, ('obj2', 'n'): 109,
('whd', 'vnw'): 309, ('obcomp', 'ti'): 1, ('dp', 'rel'): 1, ('tag',
'cp'): 9, ('det', 'mwu'): 129, ('app', 'vnw'): 2, ('cnj', 'vg'): 8,
('--', 'ppres'): 3, ('obj1', 'du'): 11, ('su', 'pp'): 2, ('whd',
'vg'): 1, ('sat', 'ww'): 1, ('crd', 'vz'): 128, ('predm', 'conj'):
24, ('svp', 'vz'): 3228, ('predc', 'cp'): 626, ('mwp', 'vz'): 5450,
('tag', 'pp'): 21, ('dlink', 'bw'): 34, ('vc', 'conj'): 511,
('tag', 'ppart'): 1, ('predc', 'bw'): 93, ('nucl', 'rel'): 5,
('su', 'detp'): 1, ('svp', 'ww'): 96, ('rhd', 'vg'): 4, ('rhd',
'advp'): 2, ('cnj', 'oti'): 107, ('--', 'whrel'): 5, ('obj1',
'inf'): 2, ('hd', 'bw'): 1955, ('predm', 'mwu'): 3, ('cnj', 'du'):
270, ('body', 'oti'): 5, ('whd', 'bw'): 308, ('cnj', 'ap'): 470,
('det', 'vnw'): 12135, ('predm', 'ap'): 153, ('predm', 'cp'): 418,
('--', 'smain'): 19196, ('vc', 'vnw'): 2, ('mod', 'sv1'): 65,
('obj1', 'ap'): 32, ('su', 'vg'): 14, ('tag', 'inf'): 1, ('tag',
'n'): 79, ('obj2', 'vnw'): 354, ('cnj', 'vnw'): 231, ('hd', 'vz'):
65225, ('mod', 'tw'): 2382, ('rhd', 'conj'): 2, ('mwp', 'adj'):
2480, ('crd', 'mwu'): 93, ('mod', 'spec'): 544, ('su', 'conj'):
1895, ('vc', 'du'): 1, ('body', 'ssub'): 11819, ('dp', 'oti'): 10,
('obj2', 'conj'): 39, ('obj1', 'ww'): 120, ('svp', 'mwu'): 801,
('body', 'sv1'): 430, ('mod', 'advp'): 1333, ('dp', 'ap'): 56,
('se', 'n'): 1, ('cnj', 'ppart'): 449, ('sat', 'ti'): 5, ('vc',
'oti'): 896, ('nucl', 'tw'): 6, ('me', 'np'): 509, ('obj1',
'conj'): 5747, ('mod', 'conj'): 2584, ('mwp', 'tw'): 3469, ('obj2',
'mwu'): 9, ('cnj', 'smain'): 7608, ('hd', 'let'): 3, ('predc',
'inf'): 1, ('vc', 'bw'): 11, ('dp', 'tw'): 657, ('whd', 'ppres'):
1, ('vc', 'ti'): 1823, ('dp', 'ww'): 30, ('cnj', 'whrel'): 32,
('tag', 'ap'): 9, ('body', 'np'): 1442, ('body', 'pp'): 184,
('obj1', 'lid'): 2, ('det', 'pp'): 8, ('--', 'rel'): 10, ('sat',
'ppres'): 2, ('hd', 'spec'): 1224, ('det', 'n'): 335, ('mwp',
'vg'): 731, ('--', 'sv1'): 577, ('--', 'ssub'): 24, ('body',
'inf'): 5158, ('cnj', 'n'): 7602, ('tag', 'mwu'): 97, ('vc',
'ahi'): 27, ('mod', 'vz'): 91, ('dp', 'whsub'): 2, ('svp', 'ti'):
46, ('pc', 'bw'): 323, ('su', 'adj'): 84, ('obj1', 'tw'): 2093,
('whd', 'advp'): 1, ('tag', 'ssub'): 9, ('cnj', 'bw'): 87, ('app',
'bw'): 2, ('nucl', 'conj'): 275, ('det', 'tw'): 3883, ('obj2',
'adj'): 5, ('predc', 'vnw'): 122, ('hd', 'adj'): 5568, ('whd',
'conj'): 11, ('mod', 'np'): 2464, ('rhd', 'ap'): 22, ('dp',
'ppres'): 2, ('sat', 'vnw'): 4, ('su', 'oti'): 153, ('--', 'n'):
1266, ('dp', 'ssub'): 3, ('--', 'lid'): 20, ('dp', 'whrel'): 19,
('su', 'spec'): 31, ('sat', 'conj'): 368, ('nucl', 'tsw'): 5,
('vc', 'inf'): 6933, ('nucl', 'ww'): 17, ('body', 'ap'): 24,
('sat', 'adj'): 2, ('su', 'whsub'): 40, ('dp', 'mwu'): 774, ('mod',
'rel'): 5721, ('pc', 'conj'): 160, ('cnj', 'conj'): 490, ('predm',
'vnw'): 56, ('nucl', 'ap'): 9, ('me', 'conj'): 15, ('svp', 'vnw'):
26, ('mod', 'vnw'): 3879, ('--', 'vz'): 30, ('predm', 'adj'): 96,
('vc', 'ssub'): 6, ('cmp', 'ww'): 4, ('--', 'ppart'): 51, ('det',
'ap'): 194, ('obj1', 'advp'): 63, ('vc', 'ww'): 17, ('mwp', 'pp'):
1, ('dp', 'conj'): 387, ('ld', 'np'): 98, ('sat', 'spec'): 40,
('su', 'ti'): 122, ('hd', 'np'): 5, ('--', 'np'): 3094, ('dp',
'advp'): 37, ('su', 'np'): 25998, ('--', 'inf'): 83, ('dp', 'whq'):
14, ('ld', 'n'): 9, ('obj2', 'vz'): 1, ('tag', 'conj'): 12, ('tag',
'tsw'): 48, ('pobj1', 'vnw'): 269, ('dp', 'ppart'): 31, ('obj1',
'mwu'): 2937, ('nucl', 'ppres'): 1, ('body', 'advp'): 3, ('obcomp',
'adj'): 88, ('vc', 'whsub'): 330, ('app', 'conj'): 582, ('whd',
'tw'): 8, ('nucl', 'bw'): 15, ('dp', 'spec'): 134, ('tag', 'advp'):
2, ('predc', 'pp'): 597, ('sat', 'n'): 36, ('cnj', 'ww'): 249,
('mod', 'pp'): 52260, ('dp', 'n'): 846, ('predc', 'tw'): 27, ('dp',
'tsw'): 4, ('hd', 'ww'): 73136, ('sat', 'ssub'): 1, ('ld', 'bw'):
142, ('rhd', 'mwu'): 5, ('nucl', 'ssub'): 5, ('dp', 'let'): 23,
('svp', 'bw'): 520, ('su', 'cp'): 504, ('predm', 'ppart'): 54,
('sat', 'sv1'): 102, ('svp', 'conj'): 2, ('hdf', 'vz'): 149,
('svp', 'n'): 342, ('crd', 'spec'): 87, ('mwp', 'n'): 10827,
('cmp', 'bw'): 165, ('cnj', 'ti'): 578, ('rhd', 'vnw'): 5054,
('cnj', 'ppres'): 27, ('det', 'np'): 186, ('cnj', 'tsw'): 3,
('cmp', 'adj'): 30, ('mod', 'ssub'): 3, ('body', 'whrel'): 9,
('su', 'vnw'): 20136, ('app', 'let'): 1, ('dp', 'np'): 1056, ('dp',
'vg'): 10, ('crd', 'adj'): 21, ('nucl', 'inf'): 16, ('sat', 'cp'):
200, ('det', 'lid'): 64121, ('tag', 'tw'): 89, ('rhd', 'bw'): 1184,
('tag', 'ww'): 4, ('me', 'vnw'): 44, ('su', 'du'): 1, ('cnj',
'lid'): 1, ('sat', 'whq'): 8, ('app', 'ww'): 5, ('vc', 'advp'): 1,
('mod', 'inf'): 4, ('body', 'bw'): 35, ('tag', 'vg'): 6, ('obj1',
'np'): 62166, ('obj1', 'vg'): 10, ('me', 'bw'): 3, ('sat', 'inf'):
10, ('--', 'whq'): 279, ('mod', 'lid'): 4, ('mod', 'smain'): 107,
('mod', 'detp'): 3, ('dlink', 'mwu'): 16, ('me', 'tw'): 9, ('cnj',
'detp'): 25, ('sat', 'whrel'): 25, ('cnj', 'whsub'): 78, ('dp',
'cp'): 92, ('body', 'conj'): 1235, ('mwp', 'vnw'): 603, ('dp',
'bw'): 235, ('det', 'conj'): 149, ('sat', 'ppart'): 7, ('ld',
'advp'): 25, ('vc', 'ppart'): 9973, ('obj1', 'tsw'): 9, ('me',
'adj'): 8, ('hd', 'tsw'): 1, ('tag', 'let'): 27, ('--', 'pp'): 152,
('body', 'whq'): 1, ('cmp', 'spec'): 18, ('obcomp', 'cp'): 754,
('rhd', 'pp'): 65, ('rhd', 'ppres'): 1, ('whd', 'pp'): 55, ('tag',
'spec'): 333, ('mod', 'adj'): 31538, ('dp', 'adj'): 94, ('cnj',
'cp'): 412, ('obj1', 'bw'): 157, ('me', 'mwu'): 2, ('cnj', 'let'):
4, ('whd', 'np'): 111, ('obj1', 'pp'): 167, ('cnj', 'inf'): 403,
('sat', 'oti'): 6, ('whd', 'ap'): 31, ('cmp', 'vnw'): 6, ('cnj',
'pp'): 2072, ('det', 'bw'): 16, ('me', 'spec'): 8, ('predc',
'oti'): 8, ('hd', 'vnw'): 1548, ('su', 'whrel'): 104, ('obj1',
'sv1'): 3, ('obcomp', 'oti'): 50, ('predc', 'ap'): 2021, ('obj1',
'whrel'): 149, ('nucl', 'whsub'): 2, ('predc', 'np'): 3537, ('app',
'du'): 11, ('sat', 'tw'): 48, ('app', 'tw'): 642, ('crd', 'vnw'):
1, ('hdf', 'mwu'): 5, ('tag', 'oti'): 2, ('dp', 'inf'): 14, ('cnj',
'np'): 13040, ('app', 'adj'): 24, ('--', 'bw'): 22, ('predc',
'ww'): 209, ('tag', 'adj'): 7, ('tag', 'du'): 8, ('ld', 'vz'): 12,
('crd', 'let'): 3, ('mod', 'ppres'): 291, ('su', 'bw'): 4, ('ld',
'mwu'): 11, ('pc', 'vz'): 26, ('hd', 'mwu'): 7009, ('predm', 'pp'):
56, ('predm', 'du'): 7, ('predm', 'bw'): 317, ('--', 'spec'): 316,
('app', 'sv1'): 2, ('predc', 'vz'): 12, ('sat', 'pp'): 48, ('me',
'ap'): 10, ('mwp', 'spec'): 21459, ('body', 'ppres'): 1, ('obj1',
'adj'): 186, ('tag', 'sv1'): 219, ('app', 'spec'): 232, ('sat',
'advp'): 1, ('ld', 'ap'): 26, ('--', 'vnw'): 18, ('sup', 'vnw'):
493, ('body', 'tw'): 24, ('nucl', 'n'): 192, ('mod', 'tsw'): 2,
('sat', 'whsub'): 3, ('cnj', 'mwu'): 1383, ('det', 'detp'): 520,
('me', 'n'): 13, ('cnj', 'ssub'): 1327, ('svp', 'pp'): 77,
('predc', 'ppres'): 25, ('ld', 'conj'): 76, ('--', 'adj'): 55,
('nucl', 'smain'): 2088, ('obj2', 'pp'): 507, ('hd', 'n'): 94459,
('--', 'oti'): 7, ('tag', 'np'): 32, ('body', 'du'): 48, ('obj1',
'spec'): 299, ('mwp', 'bw'): 671, ('tag', 'smain'): 147, ('predm',
'np'): 7, ('predm', 'ppres'): 51, ('nucl', 'ppart'): 7, ('--',
'tw'): 459, ('dlink', 'vg'): 744, ('whd', 'ppart'): 2, ('obj2',
'np'): 324, ('su', 'inf'): 7, ('su', 'n'): 5595, ('app', 'smain'):
23, ('det', 'adj'): 305, ('mwp', 'lid'): 1717, ('cmp', 'vz'): 9602,
('cnj', 'adj'): 2106, ('body', 'adj'): 96, ('nucl', 'whq'): 43,
('predc', 'ti'): 1, ('nucl', 'oti'): 5, ('cnj', 'sv1'): 289,
('rhd', 'np'): 29, ('mod', 'n'): 2338, ('mod', 'bw'): 20077,
('nucl', 'cp'): 37, ('mod', 'du'): 380, ('app', 'mwu'): 1718,
('app', 'np'): 1454, ('dp', 'vnw'): 86, ('mod', 'oti'): 1200,
('predc', 'advp'): 1, ('cnj', 'spec'): 518, ('body', 'spec'): 10,
('predc', 'whrel'): 34, ('se', 'vnw'): 1015, ('nucl', 'mwu'): 107,
('nucl', 'advp'): 2, ('--', 'ti'): 18, ('pc', 'pp'): 8120, ('app',
'cp'): 1, ('det', 'spec'): 43, ('--', 'ap'): 55, ('predc', 'mwu'):
228, ('body', 'vnw'): 25, ('predc', 'spec'): 20, ('predm', 'ww'):
22, ('nucl', 'whrel'): 2, ('--', 'tsw'): 37, ('mwp', 'tsw'): 11,
('dlink', 'spec'): 3, ('su', 'tw'): 27, ('app', 'whq'): 2, ('su',
'ww'): 46, ('app', 'ap'): 2, ('mod', 'vg'): 12, ('cnj', 'rel'):
209, ('body', 'ppart'): 24, ('--', 'ww'): 53, ('vc', 'svan'): 5,
('sat', 'smain'): 254, ('predc', 'n'): 284, ('cnj', 'vz'): 11,
('mod', 'cp'): 4200, ('ld', 'vnw'): 108, ('predc', 'conj'): 526,
('--', 'du'): 5583, ('obj1', 'n'): 12735, ('body', 'ti'): 2569,
('predc', 'adj'): 1920, ('cnj', 'whq'): 24, ('vc', 'cp'): 1897}
# Cut-off value that goes with the mcatrel pair counts defined below.
# NOTE(review): presumably a minimum-frequency threshold -- confirm at the
# place where it is applied.
mcatrelTheta = 10
mcatrel={('cp', 'cmp'): 9085, ('ssub', 'sup'): 47, ('ssub', 'ld'):
777, ('mwu', 'mwp'): 48632, ('whrel', 'mod'): 5, ('sv1', 'predc'):
184, ('detp', 'mod'): 461, ('top', '--'): 105643, ('smain', 'se'):
445, ('np', 'me'): 18, ('np', 'obcomp'): 80, ('inf', 'me'): 26,
('du', 'tag'): 1196, ('inf', 'vc'): 2656, ('ap', 'hd'): 5805,
('ap', 'se'): 11, ('np', 'obj1'): 114, ('du', 'nucl'): 3696, ('np',
'ld'): 48, ('ppart', 'predm'): 11, ('ap', 'mod'): 4470, ('ssub',
'mod'): 5780, ('inf', 'pc'): 1612, ('ap', 'obj1'): 76, ('np',
'det'): 82021, ('detp', 'obcomp'): 79, ('smain', 'su'): 30673,
('oti', 'cmp'): 2414, ('rel', 'rhd'): 5711, ('rel', 'mod'): 1,
('whq', 'whd'): 371, ('du', 'dp'): 7087, ('ppart', 'obj2'): 365,
('ppart', 'svp'): 257, ('ppart', 'pobj1'): 16, ('detp', 'det'): 3,
('ppart', 'predc'): 767, ('ap', 'obcomp'): 568, ('smain', 'me'):
117, ('du', 'dlink'): 797, ('ssub', 'predm'): 292, ('inf', 'se'):
236, ('ti', 'body'): 5232, ('pp', 'hd'): 66950, ('smain', 'sup'):
380, ('sv1', 'ld'): 89, ('cp', 'body'): 9084, ('ssub', 'predc'):
2115, ('inf', 'ld'): 813, ('pp', 'obj1'): 66393, ('pp', 'mod'):
1426, ('ppres', 'hd'): 395, ('smain', 'predc'): 6539, ('smain',
'pc'): 2797, ('svan', 'body'): 5, ('ppres', 'svp'): 5, ('advp',
'hd'): 1500, ('pp', 'se'): 32, ('ppart', 'me'): 6, ('sv1', 'mod'):
996, ('np', 'su'): 18, ('ap', 'obj2'): 16, ('ahi', 'body'): 27,
('inf', 'mod'): 8904, ('ppart', 'pc'): 1848, ('np', 'mod'): 81428,
('inf', 'predm'): 108, ('ppres', 'me'): 11, ('ap', 'me'): 385,
('sv1', 'predm'): 30, ('ppart', 'vc'): 498, ('sv1', 'su'): 1107,
('pp', 'predc'): 92, ('sv1', 'me'): 3, ('np', 'predm'): 18, ('ap',
'vc'): 178, ('ppres', 'se'): 6, ('smain', 'ld'): 1592, ('ppres',
'obj1'): 34, ('ssub', 'obj1'): 3107, ('ppres', 'predc'): 19,
('whsub', 'body'): 467, ('smain', 'pobj1'): 39, ('ppart', 'sup'):
7, ('detp', 'me'): 1, ('smain', 'vc'): 11586, ('ssub', 'hd'):
13195, ('ti', 'cmp'): 5232, ('ppart', 'su'): 2610, ('inf',
'predc'): 959, ('sv1', 'vc'): 501, ('cp', 'hd'): 1, ('smain',
'mod'): 19782, ('ap', 'ld'): 2, ('whsub', 'mod'): 2, ('ppart',
'hd'): 11984, ('smain', 'predm'): 816, ('detp', 'hd'): 529, ('sv1',
'pc'): 184, ('ap', 'pc'): 888, ('ppart', 'mod'): 15014, ('np',
'pc'): 65, ('sv1', 'svp'): 222, ('ahi', 'cmp'): 27, ('ap',
'pobj1'): 2, ('whq', 'body'): 371, ('rel', 'body'): 5711, ('advp',
'me'): 29, ('inf', 'su'): 8447, ('conj', 'cnj'): 41052, ('smain',
'obj2'): 402, ('ssub', 'obj2'): 150, ('ssub', 'svp'): 306,
('ppres', 'vc'): 12, ('sv1', 'obj1'): 619, ('np', 'app'): 6468,
('conj', 'crd'): 17595, ('ppart', 'ld'): 759, ('ssub', 'vc'): 5547,
('pp', 'hdf'): 154, ('smain', 'hd'): 31090, ('inf', 'sup'): 45,
('inf', 'pobj1'): 11, ('ppart', 'se'): 63, ('sv1', 'se'): 15,
('cp', 'mod'): 287, ('np', 'vc'): 974, ('pp', 'pobj1'): 185,
('advp', 'mod'): 1371, ('smain', 'obj1'): 6681, ('sv1', 'obj2'):
33, ('inf', 'obj2'): 381, ('inf', 'svp'): 1519, ('ppres', 'su'): 1,
('ssub', 'me'): 28, ('oti', 'body'): 2414, ('np', 'svp'): 20,
('ppres', 'pc'): 98, ('ssub', 'su'): 13022, ('np', 'obj2'): 6,
('ap', 'predm'): 1, ('ssub', 'se'): 207, ('ssub', 'pc'): 1135,
('whsub', 'whd'): 467, ('smain', 'svp'): 3175, ('ap', 'predc'): 6,
('sv1', 'pobj1'): 1, ('ppres', 'mod'): 265, ('sv1', 'sup'): 14,
('inf', 'hd'): 12624, ('ppart', 'obj1'): 8598, ('ssub', 'pobj1'):
15, ('whrel', 'rhd'): 657, ('sv1', 'hd'): 1875, ('du', 'sat'):
1711, ('oti', 'mod'): 20, ('advp', 'obcomp'): 166, ('pp', 'pc'): 1,
('inf', 'obj1'): 6593, ('np', 'hd'): 105423, ('np', 'se'): 1,
('np', 'predc'): 33, ('whrel', 'body'): 657, ('ppres', 'ld'): 18,
('pp', 'vc'): 481, ('svan', 'cmp'): 5, ('advp', 'pc'): 1}
# Additions: manual adjustments applied on top of the mcatrel literal above.
# Both 'svan' entries are set to mcatrelTheta + 1; for ('svan', 'cmp') this
# replaces the count of 5 given in the literal.
# NOTE(review): presumably this lifts both pairs just over a frequency
# cut-off -- confirm against the code that reads mcatrelTheta.
mcatrel[('svan', 'cmp')] = mcatrel[('svan', 'body')] = mcatrelTheta + 1
# NOTE(review): presumably the matching cut-off for the mcatrelcat table
# defined right below -- confirm against its consumers.
mcatrelcatTheta = 10
mcatrelcat= {('sv1', 'svp', 'mwu'): 8, ('ppres', 'vc', 'ti'): 1,
('cp', 'mod', 'ap'): 3, ('sv1', 'ld', 'bw'): 2, ('detp', 'mod',
'mwu'): 132, ('inf', 'predc', 'pp'): 82, ('np', 'vc', 'ssub'): 1,
('ppart', 'svp', 'vz'): 21, ('ssub', 'su', 'cp'): 37, ('top', '--',
'mwu'): 594, ('smain', 'svp', 'bw'): 325, ('inf', 'obj1', 'n'):
718, ('rel', 'rhd', 'bw'): 981, ('advp', 'hd', 'tw'): 15, ('du',
'dp', 'pp'): 445, ('mwu', 'mwp', 'let'): 697, ('cp', 'body',
'smain'): 1, ('cp', 'body', 'ppart'): 22, ('ppres', 'mod', 'mwu'):
4, ('smain', 'mod', 'spec'): 8, ('cp', 'body', 'tw'): 24, ('whsub',
'whd', 'conj'): 8, ('advp', 'mod', 'ap'): 1, ('advp', 'hd', 'vz'):
10, ('inf', 'obj1', 'vnw'): 859, ('conj', 'cnj', 'ti'): 578,
('detp', 'mod', 'tw'): 1, ('ssub', 'vc', 'vnw'): 1, ('ppres',
'predc', 'cp'): 2, ('pp', 'mod', 'vg'): 1, ('ssub', 'mod', 'bw'):
1923, ('du', 'dlink', 'bw'): 34, ('detp', 'mod', 'np'): 3, ('sv1',
'obj1', 'spec'): 12, ('smain', 'sup', 'vnw'): 380, ('du', 'dp',
'ti'): 3, ('ap', 'mod', 'spec'): 4, ('detp', 'hd', 'vg'): 1,
('ssub', 'predm', 'advp'): 3, ('du', 'dp', 'ssub'): 3, ('pp',
'mod', 'du'): 3, ('smain', 'su', 'pp'): 2, ('np', 'det', 'tw'):
3883, ('pp', 'obj1', 'conj'): 4557, ('ssub', 'obj2', 'vnw'): 45,
('smain', 'obj2', 'vnw'): 107, ('ppart', 'vc', 'oti'): 119,
('ppart', 'se', 'vnw'): 63, ('np', 'mod', 'ssub'): 1, ('pp', 'vc',
'whsub'): 19, ('smain', 'vc', 'bw'): 7, ('ppart', 'mod', 'pp'):
7260, ('ti', 'body', 'ww'): 115, ('np', 'mod', 'mwu'): 830, ('ap',
'obcomp', 'ti'): 1, ('sv1', 'obj1', 'vnw'): 85, ('pp', 'pobj1',
'vnw'): 185, ('sv1', 'me', 'vnw'): 1, ('oti', 'mod', 'pp'): 2,
('ppart', 'obj2', 'n'): 30, ('inf', 'predm', 'pp'): 7, ('ssub',
'obj2', 'n'): 10, ('detp', 'mod', 'rel'): 1, ('du', 'tag', 'conj'):
12, ('top', '--', 'tw'): 459, ('inf', 'su', 'spec'): 2, ('whsub',
'whd', 'ap'): 25, ('sv1', 'obj2', 'conj'): 1, ('np', 'vc', 'oti'):
441, ('np', 'app', 'tw'): 642, ('inf', 'su', 'tw'): 3, ('pp',
'mod', 'n'): 6, ('smain', 'su', 'detp'): 1, ('smain', 'predc',
'ap'): 1143, ('pp', 'vc', 'ti'): 102, ('pp', 'hd', 'bw'): 288,
('ap', 'mod', 'du'): 2, ('ap', 'pobj1', 'vnw'): 2, ('np', 'app',
'smain'): 23, ('inf', 'mod', 'ww'): 20, ('du', 'dp', 'let'): 23,
('smain', 'svp', 'n'): 220, ('sv1', 'mod', 'pp'): 238, ('du', 'dp',
'mwu'): 774, ('cp', 'cmp', 'conj'): 1, ('smain', 'obj2', 'conj'):
14, ('du', 'nucl', 'tw'): 6, ('ssub', 'mod', 'oti'): 86, ('ssub',
'ld', 'mwu'): 3, ('sv1', 'pc', 'conj'): 4, ('smain', 'vc', 'ssub'):
3, ('cp', 'cmp', 'spec'): 18, ('ppres', 'vc', 'cp'): 7, ('np',
'mod', 'ap'): 1466, ('conj', 'cnj', 'ppres'): 27, ('pp', 'vc',
'cp'): 276, ('ssub', 'mod', 'spec'): 8, ('ssub', 'svp', 'adj'): 28,
('ap', 'obj1', 'conj'): 7, ('inf', 'su', 'np'): 3636, ('du', 'sat',
'inf'): 10, ('smain', 'pc', 'pp'): 2667, ('inf', 'predm', 'ww'): 4,
('np', 'mod', 'rel'): 5690, ('pp', 'predc', 'ppart'): 2, ('sv1',
'su', 'whrel'): 4, ('advp', 'mod', 'pp'): 79, ('smain', 'predm',
'ww'): 12, ('smain', 'su', 'whsub'): 35, ('smain', 'predm',
'conj'): 15, ('pp', 'mod', 'mwu'): 99, ('ppart', 'mod', 'tw'): 4,
('rel', 'rhd', 'pp'): 63, ('ppart', 'mod', 'spec'): 3, ('sv1',
'ld', 'conj'): 1, ('inf', 'obj1', 'np'): 4649, ('smain', 'mod',
'smain'): 14, ('conj', 'crd', 'n'): 1, ('smain', 'mod', 'whrel'):
162, ('inf', 'svp', 'vz'): 994, ('sv1', 'svp', 'vz'): 184, ('inf',
'svp', 'pp'): 22, ('smain', 'obj1', 'vnw'): 537, ('np', 'det',
'vnw'): 12132, ('inf', 'mod', 'np'): 150, ('detp', 'hd', 'bw'): 5,
('sv1', 'obj2', 'vnw'): 14, ('sv1', 'vc', 'ww'): 3, ('sv1',
'predc', 'vnw'): 37, ('du', 'dp', 'advp'): 37, ('ssub', 'mod',
'pp'): 1942, ('top', '--', 'inf'): 83, ('conj', 'crd', 'vz'): 128,
('ssub', 'me', 'tw'): 4, ('smain', 'me', 'mwu'): 2, ('du', 'dp',
'du'): 272, ('sv1', 'obj1', 'whrel'): 1, ('ssub', 'predm', 'ww'):
6, ('ssub', 'obj1', 'ap'): 2, ('np', 'mod', 'cp'): 831, ('du',
'dp', 'n'): 846, ('ssub', 'predc', 'tsw'): 1, ('conj', 'cnj',
'conj'): 490, ('whsub', 'body', 'ssub'): 456, ('ppart', 'ld',
'mwu'): 3, ('ssub', 'vc', 'conj'): 81, ('ppart', 'mod', 'sv1'): 5,
('ap', 'me', 'tw'): 1, ('ap', 'vc', 'ti'): 67, ('inf', 'ld', 'vz'):
2, ('sv1', 'predc', 'conj'): 6, ('smain', 'su', 'tw'): 17,
('smain', 'predc', 'spec'): 13, ('conj', 'crd', 'tw'): 5, ('ssub',
'su', 'np'): 4170, ('smain', 'predm', 'du'): 6, ('np', 'mod',
'ww'): 2678, ('du', 'nucl', 'oti'): 5, ('advp', 'me', 'bw'): 1,
('ppart', 'predc', 'np'): 120, ('smain', 'su', 'du'): 1, ('sv1',
'obj1', 'np'): 370, ('ap', 'vc', 'cp'): 23, ('conj', 'cnj',
'whrel'): 32, ('du', 'dlink', 'vg'): 744, ('ap', 'hd', 'spec'): 6,
('inf', 'me', 'vnw'): 2, ('inf', 'predc', 'n'): 28, ('inf', 'su',
'oti'): 10, ('ti', 'body', 'du'): 2, ('du', 'sat', 'spec'): 40,
('ssub', 'predm', 'mwu'): 1, ('ssub', 'obj1', 'conj'): 133,
('ppart', 'su', 'oti'): 3, ('np', 'det', 'n'): 335, ('du', 'tag',
'inf'): 1, ('inf', 'obj2', 'mwu'): 2, ('smain', 'mod', 'tw'): 2,
('sv1', 'su', 'n'): 153, ('rel', 'body', 'conj'): 279, ('sv1',
'pc', 'vz'): 1, ('ppart', 'obj2', 'pp'): 175, ('ssub', 'mod',
'inf'): 1, ('inf', 'mod', 'adj'): 824, ('whq', 'whd', 'tw'): 2,
('ssub', 'ld', 'vz'): 4, ('ap', 'vc', 'ssub'): 1, ('inf', 'obj1',
'adj'): 8, ('smain', 'obj2', 'pp'): 133, ('inf', 'vc', 'conj'): 64,
('advp', 'obcomp', 'adj'): 73, ('detp', 'mod', 'spec'): 2, ('np',
'det', 'ap'): 194, ('smain', 'predm', 'ppres'): 35, ('ppart',
'mod', 'vnw'): 712, ('inf', 'vc', 'whsub'): 116, ('cp', 'body',
'ti'): 301, ('mwu', 'mwp', 'vg'): 731, ('sv1', 'mod', 'n'): 1,
('ppart', 'mod', 'advp'): 222, ('smain', 'hd', 'np'): 4, ('ppres',
'vc', 'whsub'): 2, ('smain', 'se', 'vnw'): 444, ('ssub', 'predc',
'tw'): 14, ('pp', 'obj1', 'tsw'): 2, ('inf', 'svp', 'adj'): 80,
('ap', 'me', 'n'): 9, ('ppart', 'ld', 'conj'): 10, ('np', 'mod',
'ppres'): 260, ('inf', 'predc', 'mwu'): 17, ('smain', 'mod',
'conj'): 245, ('np', 'hd', 'let'): 3, ('ppart', 'predc', 'vnw'): 1,
('ssub', 'su', 'advp'): 1, ('pp', 'mod', 'np'): 73, ('conj', 'cnj',
'oti'): 107, ('ppart', 'hd', 'bw'): 5, ('smain', 'svp', 'adj'):
219, ('inf', 'predm', 'n'): 1, ('du', 'dp', 'tw'): 657, ('np',
'predc', 'ww'): 4, ('sv1', 'ld', 'vnw'): 8, ('smain', 'su', 'vnw'):
7655, ('detp', 'hd', 'mwu'): 5, ('du', 'sat', 'ap'): 12, ('inf',
'me', 'ap'): 3, ('oti', 'body', 'ti'): 2264, ('ap', 'me', 'vnw'):
18, ('np', 'app', 'spec'): 232, ('advp', 'mod', 'n'): 69, ('top',
'--', 'oti'): 7, ('detp', 'obcomp', 'cp'): 56, ('du', 'tag',
'smain'): 147, ('pp', 'mod', 'cp'): 5, ('pp', 'mod', 'vnw'): 10,
('conj', 'cnj', 'mwu'): 1383, ('ppart', 'vc', 'ti'): 152, ('conj',
'cnj', 'inf'): 403, ('np', 'app', 'ww'): 5, ('sv1', 'predc',
'spec'): 2, ('ssub', 'pobj1', 'vnw'): 15, ('du', 'nucl', 'conj'):
275, ('smain', 'predc', 'cp'): 175, ('ppres', 'hd', 'vz'): 3,
('smain', 'ld', 'adj'): 6, ('smain', 'vc', 'oti'): 116, ('np',
'pc', 'vz'): 1, ('np', 'predm', 'mwu'): 1, ('cp', 'body', 'du'):
29, ('inf', 'svp', 'vnw'): 5, ('ppart', 'ld', 'ap'): 2, ('sv1',
'su', 'np'): 344, ('detp', 'mod', 'detp'): 3, ('pp', 'predc',
'pp'): 1, ('sv1', 'predc', 'np'): 37, ('ssub', 'mod', 'sv1'): 1,
('smain', 'mod', 'bw'): 5603, ('smain', 'svp', 'conj'): 1, ('ap',
'hd', 'bw'): 495, ('conj', 'cnj', 'vz'): 11, ('np', 'vc', 'cp'):
342, ('ap', 'hd', 'ww'): 453, ('advp', 'mod', 'conj'): 2, ('whrel',
'body', 'du'): 5, ('ap', 'hd', 'tw'): 19, ('sv1', 'svp', 'adj'): 7,
('sv1', 'predc', 'tw'): 2, ('np', 'app', 'np'): 1454, ('ppart',
'svp', 'ww'): 5, ('smain', 'su', 'advp'): 1, ('ssub', 'vc', 'ti'):
287, ('smain', 'mod', 'ppres'): 11, ('sv1', 'predc', 'cp'): 2,
('np', 'obj1', 'mwu'): 1, ('sv1', 'obj2', 'pp'): 9, ('ap', 'hd',
'mwu'): 269, ('whsub', 'whd', 'vg'): 1, ('smain', 'mod', 'ap'):
411, ('inf', 'ld', 'n'): 2, ('smain', 'obj1', 'vg'): 5, ('sv1',
'vc', 'bw'): 1, ('np', 'app', 'bw'): 2, ('ppart', 'mod', 'adj'):
1286, ('ppres', 'obj1', 'np'): 12, ('du', 'dp', 'tsw'): 4, ('whq',
'body', 'ppart'): 1, ('smain', 'predc', 'oti'): 6, ('whsub', 'whd',
'tw'): 6, ('inf', 'obj1', 'whrel'): 7, ('sv1', 'mod', 'mwu'): 5,
('smain', 'vc', 'conj'): 278, ('du', 'sat', 'tw'): 48, ('smain',
'su', 'adj'): 59, ('du', 'sat', 'ppart'): 7, ('np', 'obcomp',
'cp'): 71, ('ppart', 'su', 'conj'): 85, ('ap', 'mod', 'ap'): 153,
('ahi', 'cmp', 'mwu'): 26, ('ap', 'me', 'adj'): 2, ('ssub',
'predc', 'spec'): 2, ('sv1', 'mod', 'ap'): 16, ('inf', 'su', 'vg'):
2, ('cp', 'body', 'cp'): 23, ('pp', 'obj1', 'mwu'): 2639, ('du',
'dp', 'inf'): 14, ('sv1', 'mod', 'smain'): 1, ('du', 'nucl', 'ap'):
9, ('sv1', 'me', 'np'): 1, ('inf', 'mod', 'sv1'): 7, ('sv1', 'vc',
'ti'): 44, ('oti', 'cmp', 'vz'): 2414, ('inf', 'su', 'mwu'): 121,
('ap', 'obj1', 'ap'): 1, ('smain', 'me', 'n'): 3, ('sv1', 'su',
'cp'): 8, ('advp', 'pc', 'pp'): 1, ('du', 'tag', 'ssub'): 9,
('ssub', 'mod', 'du'): 9, ('du', 'dp', 'adj'): 94, ('ssub', 'ld',
'ap'): 7, ('conj', 'crd', 'vnw'): 1, ('ppart', 'vc', 'inf'): 1,
('du', 'sat', 'mwu'): 44, ('pp', 'obj1', 'tw'): 2071, ('whrel',
'body', 'conj'): 25, ('smain', 'me', 'ap'): 4, ('du', 'dp',
'spec'): 134, ('inf', 'predc', 'adj'): 251, ('smain', 'svp',
'vnw'): 13, ('inf', 'predm', 'ap'): 12, ('inf', 'mod', 'advp'):
192, ('np', 'det', 'adj'): 305, ('sv1', 'obj2', 'np'): 7, ('sv1',
'predm', 'cp'): 6, ('ssub', 'mod', 'vg'): 3, ('ppart', 'predc',
'ww'): 26, ('advp', 'mod', 'np'): 89, ('smain', 'predc', 'bw'): 36,
('np', 'ld', 'np'): 1, ('top', '--', 'conj'): 3812, ('np', 'mod',
'inf'): 3, ('ssub', 'su', 'spec'): 9, ('inf', 'vc', 'oti'): 40,
('ssub', 'obj2', 'np'): 41, ('np', 'det', 'pp'): 8, ('sv1', 'obj1',
'ww'): 1, ('whq', 'whd', 'conj'): 3, ('inf', 'vc', 'ppart'): 1243,
('ppres', 'mod', 'ppart'): 1, ('ppart', 'predm', 'pp'): 2,
('ppart', 'predc', 'oti'): 2, ('rel', 'rhd', 'mwu'): 5, ('advp',
'mod', 'bw'): 770, ('sv1', 'se', 'vnw'): 15, ('sv1', 'predc',
'pp'): 4, ('detp', 'hd', 'lid'): 24, ('pp', 'mod', 'spec'): 14,
('ssub', 'predm', 'conj'): 7, ('sv1', 'mod', 'tw'): 2, ('advp',
'mod', 'du'): 1, ('pp', 'se', 'vnw'): 32, ('du', 'nucl', 'tsw'): 5,
('ppart', 'svp', 'pp'): 16, ('ap', 'obj1', 'n'): 6, ('np', 'mod',
'bw'): 2451, ('mwu', 'mwp', 'vz'): 5450, ('smain', 'predc', 'vnw'):
19, ('np', 'mod', 'whrel'): 4, ('advp', 'hd', 'vg'): 5, ('ap',
'mod', 'ppres'): 1, ('ti', 'body', 'conj'): 7, ('oti', 'mod',
'adj'): 1, ('np', 'vc', 'conj'): 18, ('ssub', 'svp', 'mwu'): 136,
('du', 'tag', 'cp'): 9, ('mwu', 'mwp', 'vnw'): 603, ('du', 'nucl',
'whsub'): 2, ('inf', 'su', 'whrel'): 20, ('np', 'svp', 'pp'): 2,
('smain', 'obj2', 'adj'): 1, ('np', 'mod', 'ppart'): 865, ('ssub',
'vc', 'ww'): 1, ('smain', 'pc', 'vz'): 5, ('smain', 'predm', 'bw'):
172, ('ap', 'me', 'pp'): 2, ('inf', 'predm', 'np'): 1, ('smain',
'mod', 'tsw'): 1, ('sv1', 'svp', 'pp'): 2, ('pp', 'mod', 'pp'):
123, ('np', 'obcomp', 'oti'): 7, ('top', '--', 'ssub'): 24,
('ppart', 'predc', 'advp'): 1, ('advp', 'hd', 'vnw'): 87, ('mwu',
'mwp', 'lid'): 1717, ('smain', 'me', 'conj'): 8, ('sv1', 'su',
'whsub'): 1, ('top', '--', 'ppres'): 3, ('whsub', 'body', 'du'): 1,
('sv1', 'ld', 'vz'): 1, ('pp', 'predc', 'n'): 1, ('ssub', 'mod',
'vz'): 11, ('cp', 'body', 'ww'): 29, ('smain', 'svp', 'vz'): 1984,
('ppart', 'me', 'adj'): 1, ('inf', 'predm', 'ppart'): 2, ('np',
'mod', 'smain'): 62, ('ppres', 'predc', 'ppart'): 1, ('sv1', 'su',
'ti'): 1, ('sv1', 'obj2', 'n'): 2, ('sv1', 'obj1', 'n'): 95, ('pp',
'hdf', 'vz'): 149, ('ssub', 'pc', 'bw'): 74, ('smain', 'predc',
'ppres'): 18, ('cp', 'cmp', 'mwu'): 102, ('inf', 'mod', 'du'): 12,
('ssub', 'svp', 'ti'): 18, ('detp', 'hd', 'spec'): 3, ('ppres',
'hd', 'adj'): 32, ('ssub', 'ld', 'conj'): 11, ('np', 'vc', 'inf'):
5, ('smain', 'obj2', 'np'): 102, ('ssub', 'svp', 'n'): 28, ('inf',
'me', 'n'): 1, ('ssub', 'obj1', 'mwu'): 19, ('conj', 'cnj', 'lid'):
1, ('ppart', 'obj2', 'np'): 66, ('du', 'tag', 'let'): 27, ('np',
'mod', 'vg'): 3, ('ppart', 'su', 'tw'): 2, ('du', 'dp', 'np'):
1056, ('ppart', 'pc', 'pp'): 1730, ('smain', 'ld', 'pp'): 1418,
('np', 'se', 'vnw'): 1, ('cp', 'mod', 'n'): 1, ('np', 'ld', 'pp'):
47, ('smain', 'obj1', 'adj'): 15, ('cp', 'cmp', 'ww'): 4, ('sv1',
'vc', 'conj'): 12, ('du', 'nucl', 'bw'): 15, ('ppres', 'mod',
'ap'): 2, ('rel', 'body', 'ssub'): 5349, ('sv1', 'mod', 'oti'): 8,
('ppart', 'mod', 'oti'): 283, ('np', 'su', 'mwu'): 3, ('smain',
'su', 'spec'): 19, ('advp', 'hd', 'mwu'): 11, ('whsub', 'whd',
'pp'): 42, ('ppres', 'ld', 'pp'): 18, ('ssub', 'ld', 'bw'): 50,
('smain', 'me', 'bw'): 1, ('ppart', 'predc', 'spec'): 2, ('svan',
'body', 'whq'): 1, ('ppart', 'hd', 'ww'): 11722, ('advp', 'hd',
'n'): 203, ('sv1', 'ld', 'pp'): 76, ('detp', 'mod', 'vz'): 1,
('inf', 'mod', 'spec'): 1, ('inf', 'mod', 'vz'): 27, ('ssub', 'vc',
'oti'): 35, ('ssub', 'su', 'oti'): 22, ('ap', 'predm', 'adj'): 1,
('ssub', 'predc', 'conj'): 73, ('sv1', 'me', 'ap'): 1, ('np',
'mod', 'vz'): 10, ('ap', 'mod', 'mwu'): 72, ('smain', 'predm',
'mwu'): 1, ('sv1', 'su', 'vnw'): 495, ('ppart', 'obj1', 'np'):
5536, ('pp', 'obj1', 'lid'): 1, ('smain', 'se', 'n'): 1, ('ppart',
'hd', 'vz'): 2, ('inf', 'su', 'conj'): 258, ('cp', 'body', 'inf'):
9, ('top', '--', 'bw'): 22, ('ppart', 'predc', 'bw'): 8, ('ppres',
'predc', 'conj'): 4, ('ppart', 'pc', 'conj'): 28, ('ssub', 'su',
'whsub'): 3, ('ppart', 'vc', 'whsub'): 29, ('smain', 'mod', 'mwu'):
250, ('whsub', 'body', 'conj'): 8, ('sv1', 'mod', 'bw'): 481,
('smain', 'predm', 'np'): 5, ('smain', 'ld', 'bw'): 43, ('sv1',
'predc', 'n'): 3, ('cp', 'body', 'advp'): 3, ('inf', 'mod', 'cp'):
727, ('ppart', 'predm', 'bw'): 3, ('detp', 'me', 'vnw'): 1,
('smain', 'obj1', 'ap'): 3, ('inf', 'mod', 'pp'): 3265, ('smain',
'obj1', 'bw'): 1, ('du', 'nucl', 'ppres'): 1, ('sv1', 'su', 'oti'):
4, ('advp', 'obcomp', 'cp'): 65, ('ssub', 'mod', 'ww'): 7, ('ssub',
'su', 'bw'): 1, ('ppart', 'mod', 'bw'): 3397, ('np', 'app', 'adj'):
24, ('np', 'hd', 'vg'): 4, ('du', 'nucl', 'whq'): 43, ('cp', 'mod',
'bw'): 235, ('conj', 'crd', 'vg'): 16964, ('inf', 'predc', 'ap'):
194, ('smain', 'obj1', 'np'): 5121, ('np', 'mod', 'conj'): 1890,
('smain', 'obj1', 'mwu'): 58, ('du', 'dp', 'ap'): 56, ('ssub',
'pc', 'pp'): 1046, ('svan', 'cmp', 'vz'): 5, ('ssub', 'su',
'whrel'): 7, ('ppart', 'predc', 'mwu'): 23, ('ppart', 'predc',
'tw'): 2, ('inf', 'obj2', 'conj'): 14, ('smain', 'svp', 'ww'): 51,
('inf', 'su', 'ti'): 8, ('ssub', 'hd', 'ww'): 13195, ('ap', 'hd',
'adj'): 4099, ('ssub', 'predc', 'ap'): 568, ('ppart', 'mod', 'np'):
255, ('conj', 'cnj', 'np'): 13040, ('du', 'tag', 'sv1'): 219,
('ppres', 'vc', 'oti'): 1, ('inf', 'obj1', 'vg'): 2, ('ssub', 'su',
'vnw'): 7394, ('ap', 'me', 'np'): 349, ('ap', 'pc', 'pp'): 851,
('smain', 'su', 'np'): 16711, ('ppart', 'su', 'whrel'): 1,
('smain', 'obj1', 'whrel'): 2, ('ppart', 'vc', 'conj'): 27, ('ap',
'ld', 'pp'): 2, ('inf', 'vc', 'ww'): 12, ('ppart', 'mod', 'whrel'):
61, ('np', 'hd', 'vz'): 20, ('cp', 'body', 'ssub'): 5384, ('ppart',
'obj1', 'pp'): 2, ('mwu', 'mwp', 'tsw'): 11, ('du', 'sat',
'whsub'): 3, ('ap', 'me', 'spec'): 1, ('du', 'sat', 'pp'): 48,
('ssub', 'ld', 'vnw'): 50, ('smain', 'ld', 'vnw'): 24, ('inf',
'mod', 'smain'): 13, ('detp', 'obcomp', 'oti'): 11, ('np', 'obj1',
'n'): 44, ('ssub', 'predc', 'ppres'): 6, ('mwu', 'mwp', 'ww'): 516,
('pp', 'mod', 'sv1'): 1, ('smain', 'mod', 'np'): 374, ('du', 'tag',
'ppart'): 1, ('mwu', 'mwp', 'spec'): 21459, ('smain', 'predc',
'conj'): 390, ('smain', 'ld', 'n'): 5, ('np', 'det', 'np'): 186,
('inf', 'vc', 'bw'): 2, ('inf', 'ld', 'mwu'): 2, ('ssub', 'predm',
'pp'): 17, ('inf', 'svp', 'mwu'): 175, ('du', 'dp', 'vg'): 10,
('detp', 'mod', 'lid'): 3, ('ssub', 'predc', 'ww'): 39, ('du',
'nucl', 'vnw'): 1, ('ppart', 'obj1', 'mwu'): 157, ('ap', 'vc',
'whsub'): 1, ('advp', 'mod', 'adj'): 106, ('whrel', 'rhd', 'conj'):
2, ('ppart', 'mod', 'cp'): 646, ('ssub', 'predm', 'ap'): 33,
('ssub', 'predc', 'ppart'): 112, ('inf', 'predc', 'ww'): 29,
('ssub', 'su', 'n'): 919, ('inf', 'me', 'conj'): 3, ('inf',
'predc', 'ppart'): 26, ('ssub', 'svp', 'pp'): 11, ('smain', 'obj2',
'n'): 38, ('smain', 'predc', 'pp'): 283, ('ppart', 'mod', 'ap'):
375, ('smain', 'su', 'cp'): 421, ('du', 'dp', 'smain'): 1667,
('inf', 'predc', 'spec'): 1, ('sv1', 'su', 'conj'): 25, ('np',
'obj1', 'np'): 52, ('pp', 'predc', 'np'): 2, ('cp', 'body', 'sv1'):
74, ('cp', 'body', 'adj'): 96, ('pp', 'obj1', 'ww'): 105, ('np',
'det', 'spec'): 43, ('np', 'pc', 'pp'): 58, ('cp', 'mod', 'pp'): 4,
('top', '--', 'pp'): 152, ('cp', 'body', 'ap'): 24, ('inf', 'obj1',
'mwu'): 45, ('sv1', 'mod', 'adj'): 66, ('pp', 'mod', 'tw'): 1,
('inf', 'obj1', 'spec'): 3, ('inf', 'predc', 'np'): 201, ('inf',
'svp', 'ti'): 3, ('np', 'svp', 'mwu'): 14, ('ssub', 'mod', 'np'):
101, ('np', 'mod', 'sv1'): 40, ('np', 'app', 'let'): 1, ('ppart',
'su', 'mwu'): 47, ('du', 'dp', 'cp'): 92, ('ppart', 'predc', 'n'):
31, ('top', '--', 'whq'): 279, ('detp', 'mod', 'n'): 11, ('smain',
'svp', 'ti'): 22, ('np', 'me', 'vnw'): 3, ('ssub', 'predm', 'cp'):
88, ('ppart', 'svp', 'adj'): 26, ('ssub', 'predm', 'vnw'): 16,
('du', 'sat', 'sv1'): 102, ('inf', 'predm', 'adj'): 10, ('inf',
'predc', 'cp'): 65, ('sv1', 'su', 'vg'): 1, ('whrel', 'rhd', 'vg'):
1, ('rel', 'rhd', 'np'): 17, ('sv1', 'mod', 'conj'): 4, ('np',
'predc', 'adj'): 9, ('smain', 'predc', 'tw'): 9, ('ppart', 'su',
'np'): 1132, ('sv1', 'vc', 'ppart'): 147, ('inf', 'ld', 'advp'): 6,
('whrel', 'rhd', 'ppres'): 1, ('np', 'hd', 'bw'): 45, ('sv1',
'predm', 'ppres'): 1, ('ppart', 'mod', 'ssub'): 1, ('ppart',
'obj1', 'ww'): 8, ('np', 'mod', 'let'): 1, ('ppart', 'mod', 'ti'):
1, ('inf', 'ld', 'vnw'): 15, ('ssub', 'obj1', 'tw'): 1, ('np',
'mod', 'n'): 2187, ('inf', 'su', 'n'): 842, ('inf', 'obj2', 'bw'):
3, ('np', 'det', 'mwu'): 129, ('smain', 'svp', 'pp'): 24, ('smain',
'predc', 'mwu'): 144, ('inf', 'svp', 'ww'): 22, ('du', 'sat',
'vnw'): 4, ('du', 'sat', 'conj'): 368, ('conj', 'cnj', 'ww'): 249,
('advp', 'mod', 'mwu'): 6, ('whq', 'whd', 'pp'): 13, ('np', 'det',
'lid'): 64121, ('sv1', 'svp', 'bw'): 11, ('inf', 'su', 'vnw'):
3495, ('ppres', 'obj1', 'spec'): 1, ('sv1', 'obj1', 'adj'): 2,
('rel', 'rhd', 'vg'): 3, ('inf', 'predc', 'vz'): 1, ('conj', 'cnj',
'sv1'): 289, ('du', 'sat', 'smain'): 254, ('top', '--', 'whsub'):
14, ('ssub', 'obj2', 'conj'): 5, ('du', 'tag', 'adj'): 7, ('ppres',
'hd', 'ww'): 360, ('whsub', 'whd', 'bw'): 153, ('ppart', 'su',
'vnw'): 1091, ('smain', 'predc', 'whrel'): 32, ('ap', 'mod',
'advp'): 235, ('np', 'app', 'sv1'): 2, ('sv1', 'svp', 'ti'): 1,
('du', 'sat', 'bw'): 5, ('inf', 'vc', 'cp'): 237, ('detp', 'hd',
'adj'): 53, ('ppres', 'mod', 'bw'): 59, ('pp', 'mod', 'rel'): 6,
('inf', 'mod', 'vnw'): 297, ('ap', 'mod', 'vnw'): 377, ('conj',
'cnj', 'spec'): 518, ('ssub', 'svp', 'bw'): 20, ('du', 'nucl',
'advp'): 2, ('ssub', 'predm', 'ppres'): 11, ('ppart', 'ld', 'pp'):
695, ('smain', 'predc', 'vz'): 7, ('cp', 'body', 'whrel'): 9,
('smain', 'hd', 'ww'): 31085, ('du', 'nucl', 'sv1'): 111, ('ppres',
'me', 'spec'): 1, ('ssub', 'ld', 'pp'): 615, ('whsub', 'whd',
'np'): 68, ('ppart', 'obj1', 'whrel'): 12, ('inf', 'mod', 'whrel'):
68, ('oti', 'mod', 'bw'): 17, ('np', 'predm', 'cp'): 5, ('smain',
'obj1', 'spec'): 2, ('inf', 'me', 'pp'): 1, ('pp', 'mod', 'vz'): 2,
('du', 'tag', 'vg'): 6, ('inf', 'su', 'advp'): 1, ('np', 'app',
'whq'): 2, ('smain', 'mod', 'ww'): 29, ('ssub', 'vc', 'inf'): 2092,
('du', 'nucl', 'n'): 192, ('whq', 'body', 'inf'): 7, ('pp', 'obj1',
'np'): 44420, ('conj', 'crd', 'bw'): 292, ('inf', 'mod', 'ap'):
222, ('ppart', 'me', 'np'): 5, ('ppres', 'pc', 'vz'): 2, ('sv1',
'obj1', 'tw'): 1, ('ppart', 'obj1', 'ap'): 4, ('conj', 'cnj',
'rel'): 209, ('ssub', 'me', 'np'): 19, ('ap', 'mod', 'ww'): 22,
('ssub', 'mod', 'mwu'): 66, ('sv1', 'vc', 'oti'): 4, ('pp', 'hd',
'n'): 33, ('pp', 'mod', 'whrel'): 1, ('top', '--', 'ti'): 18,
('du', 'dp', 'oti'): 10, ('conj', 'crd', 'mwu'): 93, ('pp', 'hd',
'spec'): 46, ('smain', 'obj1', 'lid'): 1, ('top', '--', 'n'): 1266,
('smain', 'predm', 'ppart'): 45, ('smain', 'su', 'ww'): 32,
('ppres', 'predc', 'mwu'): 4, ('sv1', 'vc', 'inf'): 224, ('ppres',
'predc', 'adj'): 4, ('conj', 'cnj', 'ap'): 470, ('np', 'app',
'ap'): 2, ('inf', 'mod', 'bw'): 2577, ('pp', 'hd', 'ww'): 16,
('np', 'hd', 'np'): 1, ('inf', 'obj2', 'vz'): 1, ('pp', 'hd',
'vnw'): 1, ('ahi', 'cmp', 'vz'): 1, ('np', 'det', 'bw'): 16,
('ppart', 'predc', 'pp'): 100, ('advp', 'mod', 'vz'): 1, ('inf',
'vc', 'ahi'): 3, ('ssub', 'obj1', 'tsw'): 1, ('pp', 'obj1', 'vz'):
54, ('top', '--', 'ap'): 55, ('ssub', 'obj1', 'adj'): 5, ('rel',
'body', 'sv1'): 1, ('smain', 'predc', 'n'): 161, ('np', 'mod',
'oti'): 220, ('ppres', 'mod', 'adj'): 77, ('inf', 'pc', 'conj'):
31, ('du', 'dp', 'ww'): 30, ('detp', 'det', 'vnw'): 3, ('du',
'sat', 'whq'): 8, ('ppres', 'mod', 'n'): 2, ('whsub', 'whd',
'advp'): 1, ('inf', 'ld', 'conj'): 16, ('ppres', 'mod', 'conj'): 1,
('top', '--', 'sv1'): 577, ('du', 'tag', 'bw'): 34, ('ap', 'obj2',
'pp'): 9, ('ssub', 'pc', 'conj'): 15, ('pp', 'mod', 'advp'): 31,
('ap', 'predc', 'pp'): 3, ('ssub', 'svp', 'vnw'): 5, ('ppart',
'obj1', 'conj'): 319, ('ap', 'pc', 'bw'): 22, ('inf', 'obj2',
'pp'): 129, ('np', 'su', 'vnw'): 6, ('ppres', 'mod', 'vnw'): 25,
('du', 'dp', 'rel'): 1, ('inf', 'obj2', 'adj'): 4, ('du', 'tag',
'np'): 32, ('ap', 'vc', 'conj'): 3, ('ppres', 'predc', 'pp'): 3,
('pp', 'mod', 'ppart'): 4, ('smain', 'vc', 'ahi'): 11, ('pp',
'predc', 'ti'): 1, ('inf', 'predc', 'bw'): 13, ('top', '--', 'cp'):
63, ('top', '--', 'vnw'): 18, ('mwu', 'mwp', 'tw'): 3469, ('ap',
'obj1', 'vnw'): 29, ('np', 'app', 'cp'): 1, ('ssub', 'predc',
'pp'): 118, ('inf', 'pobj1', 'vnw'): 11, ('ssub', 'predc', 'vz'):
2, ('pp', 'mod', 'smain'): 1, ('ppart', 'obj1', 'spec'): 7,
('ssub', 'predm', 'du'): 1, ('conj', 'crd', 'let'): 3, ('sv1',
'predc', 'mwu'): 2, ('ppres', 'vc', 'conj'): 1, ('conj', 'cnj',
'cp'): 412, ('ppart', 'svp', 'mwu'): 151, ('np', 'hd', 'adj'):
1044, ('advp', 'hd', 'spec'): 2, ('ppart', 'mod', 'vg'): 2, ('ap',
'mod', 'conj'): 28, ('advp', 'obcomp', 'oti'): 28, ('ap', 'predc',
'ppres'): 1, ('smain', 'ld', 'mwu'): 3, ('np', 'mod', 'spec'): 500,
('ssub', 'obj1', 'np'): 1973, ('np', 'mod', 'pp'): 30765, ('conj',
'cnj', 'du'): 270, ('np', 'hd', 'tsw'): 1, ('du', 'dp', 'whsub'):
2, ('advp', 'hd', 'ww'): 3, ('ppart', 'svp', 'bw'): 17, ('sv1',
'predm', 'advp'): 1, ('ppres', 'mod', 'advp'): 3, ('du', 'tag',
'ap'): 9, ('ssub', 'ld', 'n'): 2, ('du', 'sat', 'ww'): 1, ('conj',
'cnj', 'smain'): 7608, ('pp', 'hd', 'mwu'): 1318, ('sv1', 'pobj1',
'vnw'): 1, ('top', '--', 'ww'): 53, ('ap', 'mod', 'cp'): 47, ('pp',
'predc', 'adj'): 3, ('sv1', 'vc', 'whsub'): 28, ('ssub', 'predc',
'np'): 425, ('sv1', 'obj1', 'conj'): 33, ('du', 'nucl', 'ssub'): 5,
('inf', 'pc', 'vz'): 16, ('du', 'dp', 'sv1'): 80, ('pp', 'obj1',
'inf'): 2, ('pp', 'mod', 'bw'): 836, ('conj', 'cnj', 'ppart'): 449,
('cp', 'body', 'oti'): 5, ('smain', 'obj1', 'conj'): 405, ('ap',
'obcomp', 'oti'): 4, ('np', 'obj2', 'pp'): 5, ('sv1', 'mod', 'np'):
7, ('smain', 'predc', 'inf'): 1, ('ap', 'mod', 'ssub'): 1, ('ap',
'mod', 'sv1'): 2, ('whq', 'whd', 'vnw'): 149, ('smain', 'mod',
'du'): 17, ('sv1', 'predm', 'ppart'): 1, ('ssub', 'vc', 'ppart'):
2884, ('sv1', 'predc', 'ap'): 32, ('inf', 'obj2', 'np'): 107,
('np', 'mod', 'tw'): 2286, ('ppres', 'svp', 'mwu'): 2, ('ppart',
'su', 'vg'): 1, ('ppart', 'mod', 'conj'): 205, ('top', '--',
'spec'): 316, ('smain', 'ld', 'conj'): 38, ('ssub', 'vc', 'whsub'):
23, ('np', 'pc', 'conj'): 2, ('ppart', 'mod', 'ppart'): 22, ('du',
'nucl', 'cp'): 37, ('sv1', 'mod', 'advp'): 8, ('ppres', 'me',
'np'): 10, ('inf', 'ld', 'pp'): 708, ('sv1', 'mod', 'spec'): 3,
('np', 'svp', 'ww'): 1, ('inf', 'se', 'vnw'): 236, ('np', 'su',
'np'): 5, ('inf', 'pc', 'pp'): 1512, ('advp', 'mod', 'cp'): 11,
('ap', 'mod', 'vz'): 1, ('conj', 'crd', 'adj'): 21, ('inf', 'mod',
'vg'): 3, ('ppart', 'obj1', 'tw'): 10, ('du', 'nucl', 'pp'): 42,
('ppart', 'pc', 'bw'): 89, ('du', 'nucl', 'np'): 410, ('ssub',
'su', 'conj'): 292, ('ahi', 'body', 'inf'): 27, ('ap', 'obj2',
'vnw'): 7, ('ssub', 'ld', 'advp'): 6, ('ppart', 'predm', 'vnw'): 1,
('ppart', 'mod', 'du'): 11, ('ssub', 'vc', 'cp'): 130, ('sv1',
'predm', 'bw'): 16, ('smain', 'predc', 'ww'): 107, ('np', 'predc',
'n'): 6, ('du', 'sat', 'ppres'): 2, ('pp', 'mod', 'conj'): 3,
('ppres', 'pc', 'bw'): 13, ('detp', 'hd', 'vnw'): 199, ('conj',
'cnj', 'tw'): 902, ('inf', 'me', 'adj'): 1, ('sv1', 'predc',
'ppart'): 5, ('svan', 'body', 'np'): 1, ('pp', 'obj1', 'sv1'): 3,
('whq', 'body', 'ssub'): 9, ('np', 'mod', 'np'): 1355, ('advp',
'mod', 'smain'): 1, ('whrel', 'rhd', 'vnw'): 413, ('np', 'obj1',
'adj'): 1, ('smain', 'pobj1', 'vnw'): 39, ('ppart', 'mod', 'vz'):
14, ('sv1', 'pc', 'bw'): 8, ('smain', 'su', 'conj'): 1235, ('np',
'mod', 'ti'): 68, ('inf', 'obj2', 'n'): 29, ('advp', 'me', 'np'):
10, ('rel', 'body', 'np'): 67, ('whq', 'whd', 'bw'): 155, ('ap',
'mod', 'pp'): 768, ('sv1', 'predm', 'adj'): 4, ('np', 'obj2',
'np'): 1, ('du', 'sat', 'ssub'): 1, ('pp', 'obj1', 'n'): 10259,
('ppart', 'ld', 'vnw'): 11, ('top', '--', 'vz'): 30, ('ssub',
'predm', 'adj'): 20, ('inf', 'predm', 'ppres'): 4, ('inf', 'predm',
'cp'): 28, ('smain', 'ld', 'ap'): 11, ('smain', 'predm', 'adj'):
56, ('ppart', 'ld', 'advp'): 3, ('ssub', 'mod', 'ap'): 130, ('np',
'su', 'n'): 4, ('smain', 'ld', 'advp'): 10, ('np', 'mod', 'vnw'):
523, ('sv1', 'su', 'mwu'): 69, ('np', 'vc', 'ti'): 140, ('pp',
'obj1', 'advp'): 63, ('ti', 'body', 'inf'): 5108, ('ppres', 'mod',
'pp'): 77, ('ppart', 'obj1', 'vg'): 2, ('sv1', 'predc', 'ww'): 4,
('pp', 'vc', 'oti'): 57, ('ssub', 'svp', 'vz'): 45, ('ssub', 'me',
'conj'): 2, ('cp', 'mod', 'advp'): 5, ('du', 'sat', 'n'): 36,
('inf', 'hd', 'ww'): 12624, ('inf', 'obj1', 'conj'): 285, ('conj',
'cnj', 'pp'): 2072, ('rel', 'rhd', 'advp'): 1, ('np', 'app',
'conj'): 582, ('smain', 'obj1', 'tw'): 2, ('ssub', 'mod', 'ppres'):
3, ('ap', 'hd', 'vnw'): 409, ('ssub', 'predc', 'cp'): 69, ('ssub',
'predc', 'vnw'): 49, ('whrel', 'rhd', 'advp'): 1, ('cp', 'mod',
'cp'): 1, ('whq', 'body', 'sv1'): 349, ('np', 'hd', 'mwu'): 5405,
('sv1', 'predc', 'bw'): 13, ('ppart', 'mod', 'ppres'): 11, ('du',
'sat', 'advp'): 1, ('ppart', 'predm', 'adj'): 3, ('inf', 'mod',
'mwu'): 90, ('inf', 'sup', 'vnw'): 45, ('inf', 'mod', 'tw'): 6,
('oti', 'body', 'conj'): 148, ('np', 'mod', 'lid'): 1, ('mwu',
'mwp', 'adj'): 2480, ('ti', 'cmp', 'vz'): 5232, ('cp', 'body',
'n'): 568, ('pp', 'mod', 'ap'): 21, ('sv1', 'predc', 'vz'): 1,
('smain', 'mod', 'adj'): 1335, ('pp', 'vc', 'conj'): 27, ('inf',
'obj2', 'vnw'): 92, ('inf', 'predm', 'bw'): 35, ('sv1', 'svp',
'n'): 3, ('ap', 'mod', 'smain'): 2, ('inf', 'vc', 'vnw'): 1,
('whq', 'whd', 'np'): 43, ('inf', 'mod', 'tsw'): 1, ('du', 'sat',
'cp'): 200, ('detp', 'mod', 'vnw'): 113, ('ppres', 'obj1', 'conj'):
1, ('du', 'nucl', 'ppart'): 7, ('inf', 'predc', 'vg'): 1, ('whq',
'body', 'du'): 2, ('cp', 'body', 'vnw'): 25, ('whrel', 'rhd',
'ap'): 22, ('smain', 'predm', 'pp'): 30, ('ppart', 'vc', 'cp'):
164, ('ssub', 'me', 'ap'): 2, ('ssub', 'mod', 'conj'): 68,
('whsub', 'whd', 'ppres'): 1, ('ap', 'se', 'vnw'): 11, ('ssub',
'obj1', 'bw'): 1, ('np', 'vc', 'whsub'): 17, ('top', '--', 'vg'):
14, ('ppart', 'hd', 'vg'): 2, ('whq', 'body', 'conj'): 1, ('inf',
'obj1', 'tsw'): 3, ('np', 'predc', 'np'): 5, ('cp', 'body', 'bw'):
35, ('ssub', 'ld', 'adj'): 3, ('pp', 'obj1', 'adj'): 145, ('ppres',
'mod', 'cp'): 4, ('ppart', 'predc', 'cp'): 232, ('detp', 'mod',
'bw'): 107, ('du', 'sat', 'oti'): 6, ('top', '--', 'ppart'): 51,
('np', 'predm', 'adj'): 2, ('ppart', 'ld', 'adj'): 2, ('ap',
'predc', 'cp'): 2, ('smain', 'svp', 'mwu'): 315, ('ap', 'hd', 'n'):
34, ('ssub', 'su', 'ti'): 14, ('cp', 'body', 'np'): 1374, ('pp',
'obj1', 'du'): 9, ('inf', 'obj1', 'ap'): 4, ('cp', 'body', 'mwu'):
89, ('ssub', 'me', 'vnw'): 1, ('cp', 'cmp', 'vz'): 1950, ('sv1',
'vc', 'cp'): 38, ('oti', 'body', 'inf'): 2, ('inf', 'mod', 'n'): 8,
('sv1', 'svp', 'conj'): 1, ('whsub', 'body', 'ti'): 2, ('du',
'sat', 'whrel'): 25, ('ppart', 'svp', 'ti'): 2, ('inf', 'ld',
'ap'): 6, ('smain', 'mod', 'pp'): 7737, ('du', 'tag', 'pp'): 21,
('ssub', 'obj1', 'spec'): 2, ('inf', 'predm', 'vnw'): 1, ('smain',
'predc', 'ppart'): 248, ('ssub', 'mod', 'tw'): 8, ('ppart',
'predc', 'conj'): 19, ('np', 'mod', 'advp'): 71, ('whsub', 'whd',
'ppart'): 2, ('top', '--', 'np'): 3094, ('smain', 'ld', 'vz'): 5,
('smain', 'me', 'np'): 89, ('cp', 'cmp', 'adj'): 30, ('du', 'sat',
'np'): 333, ('ssub', 'su', 'ww'): 6, ('smain', 'vc', 'du'): 1,
('ppres', 'obj1', 'adj'): 1, ('ppres', 'svp', 'n'): 1, ('inf',
'mod', 'ppart'): 15, ('inf', 'vc', 'ssub'): 1, ('np', 'hd', 'vnw'):
852, ('ssub', 'obj2', 'bw'): 2, ('advp', 'me', 'vnw'): 18,
('smain', 'mod', 'vz'): 20, ('ap', 'mod', 'n'): 22, ('sv1', 'mod',
'vz'): 4, ('smain', 'predc', 'np'): 2747, ('pp', 'mod', 'ww'): 5,
('du', 'tag', 'tw'): 89, ('pp', 'obj1', 'pp'): 165, ('ap',
'obcomp', 'cp'): 562, ('ssub', 'obj1', 'ww'): 2, ('np', 'predc',
'ppart'): 1, ('cp', 'body', 'spec'): 10, ('inf', 'mod', 'ppres'):
5, ('ssub', 'mod', 'whrel'): 20, ('sv1', 'pc', 'pp'): 171, ('np',
'hd', 'n'): 94163, ('whrel', 'rhd', 'pp'): 2, ('ssub', 'mod',
'ppart'): 9, ('sv1', 'mod', 'ppart'): 5, ('smain', 'vc', 'ppart'):
5689, ('np', 'predc', 'pp'): 3, ('ap', 'mod', 'np'): 41, ('ssub',
'se', 'vnw'): 207, ('ssub', 'su', 'vg'): 3, ('inf', 'obj1', 'du'):
1, ('ppart', 'su', 'whsub'): 1, ('inf', 'vc', 'inf'): 834, ('advp',
'hd', 'bw'): 1117, ('smain', 'vc', 'whsub'): 95, ('sv1', 'su',
'adj'): 2, ('advp', 'hd', 'adj'): 47, ('ssub', 'predc', 'mwu'): 36,
('smain', 'vc', 'advp'): 1, ('conj', 'cnj', 'ssub'): 1327, ('du',
'dlink', 'mwu'): 16, ('ppres', 'obj1', 'vnw'): 4, ('du', 'tag',
'ww'): 4, ('smain', 'mod', 'ppart'): 79, ('detp', 'mod', 'advp'):
6, ('ppres', 'mod', 'ti'): 1, ('du', 'dp', 'whrel'): 19, ('du',
'tag', 'mwu'): 97, ('whsub', 'whd', 'vnw'): 160, ('smain', 'su',
'vg'): 7, ('du', 'tag', 'spec'): 333, ('pp', 'predc', 'bw'): 1,
('top', '--', 'adj'): 55, ('cp', 'mod', 'adj'): 18, ('ssub', 'mod',
'smain'): 4, ('ap', 'hd', 'vg'): 1, ('ppres', 'obj1', 'n'): 15,
('cp', 'body', 'pp'): 182, ('du', 'dp', 'ppart'): 31, ('ppart',
'vc', 'bw'): 1, ('inf', 'mod', 'ti'): 2, ('smain', 'su', 'oti'):
114, ('smain', 'pc', 'bw'): 60, ('np', 'hd', 'tw'): 915, ('conj',
'cnj', 'adj'): 2106, ('du', 'dp', 'conj'): 387, ('inf', 'ld',
'np'): 25, ('ssub', 'ld', 'np'): 26, ('ap', 'pc', 'conj'): 15,
('conj', 'cnj', 'n'): 7602, ('whrel', 'body', 'sv1'): 6, ('np',
'app', 'du'): 11, ('cp', 'cmp', 'bw'): 165, ('ppart', 'obj1',
'vnw'): 1771, ('ppart', 'mod', 'rel'): 14, ('smain', 'predm',
'ap'): 106, ('ap', 'obj1', 'np'): 33, ('inf', 'ld', 'bw'): 30,
('du', 'nucl', 'inf'): 16, ('ssub', 'obj1', 'n'): 315, ('conj',
'cnj', 'advp'): 37, ('smain', 'vc', 'ti'): 927, ('inf', 'pc',
'bw'): 53, ('du', 'dp', 'bw'): 235, ('smain', 'obj1', 'n'): 523,
('inf', 'obj1', 'tw'): 7, ('ppart', 'su', 'spec'): 1, ('ppart',
'obj1', 'n'): 760, ('inf', 'me', 'np'): 15, ('rel', 'mod', 'bw'):
1, ('ap', 'mod', 'rel'): 1, ('ap', 'mod', 'adj'): 1056, ('pp',
'predc', 'cp'): 79, ('pp', 'hdf', 'mwu'): 5, ('top', '--', 'advp'):
7, ('ssub', 'obj1', 'vnw'): 652, ('np', 'me', 'np'): 11, ('du',
'tag', 'du'): 8, ('ppart', 'ld', 'bw'): 17, ('ppart', 'obj2',
'conj'): 5, ('smain', 'me', 'adj'): 4, ('conj', 'crd', 'spec'): 87,
('ppart', 'svp', 'n'): 19, ('ppres', 'pc', 'pp'): 83, ('np', 'app',
'n'): 1765, ('ap', 'me', 'bw'): 1, ('pp', 'hd', 'adj'): 65, ('du',
'dp', 'vnw'): 86, ('du', 'dlink', 'spec'): 3, ('ssub', 'sup',
'vnw'): 47, ('smain', 'predm', 'n'): 1, ('ppart', 'sup', 'vnw'): 7,
('smain', 'su', 'bw'): 3, ('du', 'nucl', 'smain'): 2088, ('ppart',
'su', 'adj'): 1, ('smain', 'su', 'whrel'): 72, ('pp', 'predc',
'vz'): 1, ('whrel', 'rhd', 'bw'): 203, ('np', 'obj1', 'tw'): 1,
('np', 'vc', 'ppart'): 5, ('cp', 'mod', 'np'): 13, ('inf', 'obj1',
'bw'): 1, ('ap', 'mod', 'bw'): 1616, ('cp', 'cmp', 'vnw'): 6,
('du', 'nucl', 'adj'): 11, ('smain', 'predm', 'advp'): 5, ('smain',
'vc', 'inf'): 3777, ('ppart', 'pc', 'vz'): 1, ('conj', 'cnj',
'vnw'): 231, ('smain', 'su', 'mwu'): 745, ('ppart', 'predc',
'ppart'): 23, ('ppart', 'su', 'cp'): 5, ('ssub', 'predm', 'ppart'):
5, ('advp', 'mod', 'advp'): 3, ('inf', 'su', 'ww'): 7, ('advp',
'mod', 'rel'): 9, ('sv1', 'obj1', 'mwu'): 18, ('inf', 'ld', 'adj'):
1, ('inf', 'su', 'cp'): 33, ('du', 'sat', 'ti'): 5, ('inf',
'predc', 'vnw'): 16, ('conj', 'cnj', 'let'): 4, ('detp', 'hd',
'n'): 1, ('np', 'det', 'detp'): 520, ('ppart', 'mod', 'smain'): 9,
('du', 'dp', 'vz'): 3, ('smain', 'predc', 'adj'): 998, ('sv1',
'hd', 'ww'): 1875, ('ssub', 'predc', 'n'): 54, ('sv1', 'svp',
'ww'): 2, ('np', 'predc', 'mwu'): 2, ('du', 'tag', 'n'): 79,
('inf', 'su', 'adj'): 9, ('ap', 'vc', 'oti'): 83, ('ap', 'hd',
'vz'): 20, ('conj', 'cnj', 'bw'): 87, ('ppart', 'vc', 'ppart'): 5,
('du', 'nucl', 'vg'): 1, ('inf', 'predm', 'conj'): 2, ('np',
'obj1', 'vnw'): 8, ('ppart', 'mod', 'mwu'): 174, ('inf', 'mod',
'oti'): 234, ('smain', 'pc', 'conj'): 65, ('ssub', 'svp', 'ww'):
15, ('cp', 'mod', 'mwu'): 6, ('smain', 'ld', 'np'): 29, ('np',
'mod', 'du'): 323, ('smain', 'obj2', 'mwu'): 7, ('ppres', 'mod',
'ww'): 6, ('rel', 'body', 'du'): 9, ('ppres', 'su', 'n'): 1,
('smain', 'mod', 'n'): 10, ('sv1', 'predm', 'ap'): 1, ('smain',
'predm', 'vnw'): 38, ('smain', 'hd', 'mwu'): 1, ('ppres', 'se',
'vnw'): 6, ('du', 'dp', 'whq'): 14, ('du', 'tag', 'advp'): 2,
('np', 'hd', 'ww'): 1803, ('mwu', 'mwp', 'n'): 10827, ('advp',
'mod', 'ww'): 4, ('ap', 'mod', 'oti'): 16, ('conj', 'cnj',
'whsub'): 78, ('ppres', 'predc', 'ap'): 1, ('whrel', 'rhd', 'np'):
12, ('smain', 'obj1', 'tsw'): 3, ('ssub', 'su', 'mwu'): 126,
('ssub', 'mod', 'adj'): 471, ('np', 'hd', 'spec'): 1167, ('np',
'predc', 'ap'): 3, ('ssub', 'predm', 'bw'): 84, ('smain', 'su',
'inf'): 7, ('whq', 'whd', 'ap'): 6, ('np', 'mod', 'adj'): 26044,
('np', 'vc', 'svan'): 5, ('np', 'predm', 'np'): 1, ('inf', 'svp',
'bw'): 147, ('smain', 'vc', 'ww'): 1, ('sv1', 'obj1', 'du'): 1,
('smain', 'su', 'n'): 3437, ('np', 'pc', 'bw'): 4, ('ssub', 'su',
'tw'): 5, ('ssub', 'predc', 'whrel'): 2, ('pp', 'pc', 'pp'): 1,
('np', 'predm', 'ap'): 1, ('advp', 'mod', 'vnw'): 150, ('ppart',
'ld', 'np'): 16, ('ssub', 'vc', 'ahi'): 13, ('pp', 'hd', 'vz'):
65170, ('inf', 'predc', 'conj'): 34, ('ssub', 'predc', 'adj'): 523,
('ppart', 'obj1', 'bw'): 1, ('cp', 'hd', 'vg'): 1, ('du', 'nucl',
'du'): 266, ('ap', 'me', 'conj'): 2, ('ppart', 'predm', 'cp'): 2,
('whsub', 'mod', 'bw'): 2, ('du', 'tag', 'oti'): 2, ('top', '--',
'lid'): 20, ('smain', 'mod', 'advp'): 420, ('sv1', 'sup', 'vnw'):
14, ('inf', 'predm', 'advp'): 1, ('inf', 'obj1', 'ww'): 1, ('pp',
'obj1', 'spec'): 272, ('mwu', 'mwp', 'pp'): 1, ('smain', 'mod',
'cp'): 1595, ('ssub', 'mod', 'vnw'): 511, ('smain', 'mod', 'vnw'):
1098, ('ssub', 'mod', 'cp'): 253, ('smain', 'vc', 'cp'): 680,
('ppart', 'pobj1', 'vnw'): 16, ('du', 'nucl', 'rel'): 5, ('np',
'obj1', 'conj'): 7, ('ppres', 'svp', 'adj'): 2, ('ppart', 'predc',
'ap'): 79, ('np', 'me', 'tw'): 2, ('du', 'sat', 'adj'): 2, ('pp',
'obj1', 'vnw'): 1328, ('smain', 'me', 'tw'): 2, ('conj', 'cnj',
'whq'): 24, ('smain', 'mod', 'sv1'): 9, ('top', '--', 'tsw'): 37,
('np', 'app', 'mwu'): 1718, ('conj', 'cnj', 'detp'): 25, ('ppart',
'mod', 'n'): 13, ('pp', 'hd', 'vg'): 13, ('rel', 'rhd', 'vnw'):
4641, ('rel', 'body', 'pp'): 2, ('sv1', 'mod', 'vnw'): 63,
('ppart', 'hd', 'adj'): 228, ('ssub', 'obj2', 'pp'): 47, ('np',
'det', 'conj'): 149, ('cp', 'body', 'ppres'): 1, ('ssub', 'su',
'adj'): 13, ('np', 'predm', 'bw'): 7, ('conj', 'cnj', 'tsw'): 3,
('detp', 'mod', 'adj'): 75, ('ppart', 'predc', 'adj'): 98,
('smain', 'su', 'ti'): 99, ('np', 'me', 'spec'): 2, ('pp', 'obj1',
'bw'): 153, ('du', 'dp', 'ppres'): 2, ('smain', 'predc', 'tsw'): 2,
('top', '--', 'rel'): 10, ('detp', 'obcomp', 'adj'): 12, ('ppart',
'su', 'n'): 239, ('pp', 'mod', 'adj'): 179, ('smain', 'mod',
'oti'): 352, ('du', 'nucl', 'whrel'): 2, ('du', 'nucl', 'spec'):
15, ('ap', 'mod', 'tw'): 3, ('sv1', 'ld', 'np'): 1, ('detp', 'mod',
'du'): 2, ('ssub', 'predc', 'bw'): 22, ('np', 'app', 'vnw'): 2,
('ssub', 'mod', 'advp'): 137, ('ppart', 'obj1', 'adj'): 9, ('sv1',
'svp', 'vnw'): 3, ('du', 'tag', 'tsw'): 48, ('inf', 'svp', 'n'):
71, ('pp', 'obj1', 'ap'): 18, ('ppart', 'su', 'ww'): 1, ('np',
'svp', 'adj'): 3, ('ppart', 'hd', 'n'): 25, ('detp', 'hd', 'tw'):
238, ('sv1', 'mod', 'ww'): 4, ('svan', 'body', 'inf'): 2, ('whrel',
'mod', 'mwu'): 3, ('whq', 'body', 'ti'): 2, ('cp', 'cmp', 'vg'):
6809, ('ssub', 'mod', 'n'): 8, ('top', '--', 'du'): 5583, ('whrel',
'body', 'ssub'): 621, ('ap', 'obcomp', 'adj'): 1, ('np', 'predm',
'ppart'): 1, ('du', 'sat', 'du'): 146, ('conj', 'cnj', 'vg'): 8,
('pp', 'mod', 'oti'): 1, ('mwu', 'mwp', 'bw'): 671, ('svan',
'body', 'n'): 1, ('rel', 'body', 'inf'): 3, ('top', '--', 'let'):
69726, ('pp', 'obj1', 'whrel'): 126, ('cp', 'mod', 'spec'): 1,
('whrel', 'mod', 'bw'): 2, ('inf', 'vc', 'ti'): 103, ('sv1',
'predc', 'adj'): 34, ('ppres', 'mod', 'np'): 3, ('ssub', 'obj1',
'whrel'): 1, ('pp', 'obj1', 'vg'): 1, ('inf', 'mod', 'conj'): 138,
('sv1', 'mod', 'cp'): 80, ('np', 'obcomp', 'adj'): 2, ('cp',
'body', 'conj'): 767, ('du', 'nucl', 'mwu'): 107, ('advp', 'mod',
'tw'): 69, ('rel', 'body', 'ppart'): 1, ('ppart', 'mod', 'ww'): 28,
('detp', 'mod', 'ww'): 1, ('top', '--', 'smain'): 19196, ('smain',
'me', 'spec'): 4, ('top', '--', 'whrel'): 5, ('smain', 'svp',
'np'): 1, ('smain', 'obj1', 'ww'): 3, ('pp', 'predc', 'ap'): 1,
('smain', 'predm', 'cp'): 289, ('ppart', 'obj2', 'vnw'): 89, ('du',
'nucl', 'ww'): 17}
# Additions: every (mother category, relation, category) triple listed below
# is set to mcatrelcatTheta + 1, regardless of any count it had before.
# NOTE(review): at least ('smain', 'vc', 'ww') and ('top', '--', 'whrel')
# also occur, with small counts, in the dict literal that ends just above;
# assuming that literal is mcatrelcat, those counts are replaced here.
# NOTE(review): mcatrelcatTheta is defined elsewhere in this file; presumably
# a frequency threshold these entries are meant to exceed -- confirm.
_mcatrelcat_additions = (
    ('sv1', 'vc', 'ahi'),
    ('sv1', 'predc', 'ppres'),
    ('sv1', 'predc', 'ppart'),
    ('sv1', 'mod', 'np'),
    ('sv1', 'mod', 'advp'),
    ('sv1', 'predm', 'adj'),
    ('sv1', 'predc', 'n'),
    ('sv1', 'vc', 'svan'),
    ('sv1', 'vc', 'ww'),
    ('sv1', 'predc', 'detp'),
    ('sv1', 'obj1', 'detp'),
    ('sv1', 'predc', 'conj'),
    ('sv1', 'mod', 'conj'),
    ('sv1', 'ld', 'ap'),
    ('smain', 'vc', 'svan'),
    ('smain', 'ld', 'ap'),
    ('smain', 'vc', 'ww'),
    ('smain', 'predc', 'detp'),
    ('smain', 'obj1', 'detp'),
    ('sv1', 'predc', 'advp'),
    ('sv1', 'ld', 'bw'),
    ('du', 'sat', 'vnw'),
    ('du', 'nucl', 'ap'),
    ('du', 'tag', 'adj'),
    ('top', '--', 'whrel'),
)
# Assign in the listed order so new keys are inserted in the same sequence
# as the original one-statement-per-key form.
for _triple in _mcatrelcat_additions:
    mcatrelcat[_triple] = mcatrelcatTheta + 1
# Drop the temporaries so the module namespace is unchanged by this block.
del _mcatrelcat_additions, _triple
siblings= {('ssub', ('ww', 'mwu', 'n', 'np')): 1, ('top', ('smain',
'lid', 'let')): 10, ('ppart', ('ww', 'bw', 'vnw', 'np', 'adj')): 9,
('ppart', ('adj',)): 12, ('ssub', ('ap', 'ww', 'conj', 'vnw',
'pp')): 1, ('inf', ('ww', 'n', 'conj', 'vnw', 'vz')): 1, ('pp',
('cp', 'adj')): 1, ('ww', ()): 77473, ('ssub', ('ww', 'bw', 'n',
'adj')): 4, ('inf', ('pp', 'ti', 'ww', 'vnw', 'whrel')): 1,
('ssub', ('pp', 'oti', 'ww', 'n', 'np')): 1, ('ssub', ('inf', 'ww',
'n')): 145, ('conj', ('vg', 'ppart', 'ppres')): 4, ('inf', ('ww',
'bw', 'np')): 244, ('ssub', ('ww', 'tw', 'np')): 2, ('ppart',
('advp', 'ww', 'bw', 'np', 'cp')): 2, ('inf', ('cp', 'ww', 'ap',
'adj')): 1, ('ppart', ('ww', 'bw', 'np', 'whrel')): 3, ('ap',
('advp', 'oti', 'mwu')): 1, ('smain', ('advp', 'ww', 'n', 'vnw',
'pp')): 2, ('pp', ('conj', 'vz', 'cp')): 11, ('smain', ('ww',