1 <?xml version=
"1.0" encoding=
"UTF-8"?> <!-- -*- nxml -*- -->
6 <cat-item tags=
"SN.*"/>
10 <cat-item tags=
"SV.*"/>
11 <cat-item tags=
"SVneg.*"/>
14 <def-cat n=
"SV_pers"><!--Formes personals. Exclou inf i ger (i alguns imperatius per ara) -->
15 <cat-item lemma=
"verbcj" tags=
"SV.*"/>
16 <cat-item lemma=
"verbcj" tags=
"SVneg.*"/>
17 <cat-item lemma=
"aux_verb" tags=
"SV.*"/>
18 <cat-item lemma=
"aux_verb" tags=
"SVneg.*"/>
19 <cat-item lemma=
"haver_pp" tags=
"SV.*"/>
20 <cat-item lemma=
"haver_pp" tags=
"SVneg.*"/>
21 <cat-item lemma=
"haver_pp_enc" tags=
"SV.*"/>
22 <cat-item lemma=
"haver_pp_enc" tags=
"SVneg.*"/>
23 <cat-item lemma=
"aux_haver_pp" tags=
"SV.*"/>
24 <cat-item lemma=
"aux_haver_pp" tags=
"SVneg.*"/>
25 <cat-item lemma=
"aux_haver_pp_enc" tags=
"SV.*"/>
26 <cat-item lemma=
"aux_haver_pp_enc" tags=
"SVneg.*"/>
27 <cat-item lemma=
"verbcj_enc" tags=
"SV.*"/>
28 <cat-item lemma=
"verbcj_enc" tags=
"SVneg.*"/>
29 <!-- <cat-item lemma="be_adj" tags="SV.*"/>-->
33 <cat-item tags=
"SV.vblex.inf"/>
34 <cat-item tags=
"SVneg.vblex.inf"/>
35 <cat-item tags=
"SV.vbhaver.inf"/>
36 <cat-item tags=
"SVneg.vbhaver.inf"/>
37 <cat-item tags=
"SV.vbser.inf"/>
38 <cat-item tags=
"SVneg.vbser.inf"/>
39 <cat-item tags=
"SV.vbmod.inf"/>
40 <cat-item tags=
"SVneg.vbmod.inf"/>
44 <cat-item tags=
"SV.vbser.*"/>
45 <cat-item tags=
"SVneg.vbser.*"/>
49 <cat-item tags=
"cnjsub"/>
50 <cat-item tags=
"cnjadv"/>
54 <cat-item lemma=
"de" tags=
"PREP"/>
58 <cat-item lemma=
"haverhi" tags=
"SV.*"/>
59 <cat-item lemma=
"haverhi" tags=
"SVneg.*"/>
60 <cat-item lemma=
"haverhi_pp" tags=
"SV.*"/>
61 <cat-item lemma=
"haverhi_pp" tags=
"SVneg.*"/>
65 <cat-item tags=
"SA.*"/>
69 <cat-item tags=
"sent"/>
77 <attr-item tags=
"p1"/>
78 <attr-item tags=
"p2"/>
79 <attr-item tags=
"p3"/>
80 <attr-item tags=
"PD"/>
86 <attr-item tags=
"mf"/>
87 <attr-item tags=
"GD"/>
88 <attr-item tags=
"nt"/>
92 <attr-item tags=
"sg"/>
93 <attr-item tags=
"pl"/>
94 <attr-item tags=
"sp"/>
95 <attr-item tags=
"ND"/>
99 <attr-item tags=
"inf"/>
100 <attr-item tags=
"pres"/>
101 <attr-item tags=
"past"/>
102 <attr-item tags=
"pri"/>
103 <attr-item tags=
"ifip"/>
104 <attr-item tags=
"cni"/>
105 <attr-item tags=
"fti"/>
106 <attr-item tags=
"pp"/>
107 <attr-item tags=
"ger"/>
108 <attr-item tags=
"pprs"/>
109 <attr-item tags=
"subs"/>
110 <attr-item tags=
"imp"/>
111 <attr-item tags=
"ifi"/>
112 <attr-item tags=
"pii"/>
113 <attr-item tags=
"pis"/>
114 <attr-item tags=
"prs"/>
119 <def-attr n=
"a_verb">
120 <attr-item tags=
"vblex"/>
121 <attr-item tags=
"vbser"/>
122 <attr-item tags=
"vbhaver"/>
123 <attr-item tags=
"vbmod"/>
124 <attr-item tags=
"vaux"/>
132 <def-var n=
"paraula"/>
137 <def-macro n=
"f_bcond" npar=
"1"><!--Per mirar si el blanc conté o no format. Cal posar aquesta funció en les regles en què desaparegui alguna paraula, per tal de decidir si el blanc de la paraula eliminada s'ha d'eliminar o conservar. Si conté format cal conservar-lo, si no en conté cal eliminar-lo perquè no apareguin dos espais seguits. -->
155 </section-def-macros>
165 <!--Regles per a sintagmes sols que han pogut quedar-se amb GD, ND o PD -->
167 <rule comment=
"REGLA: SN (per assignar gènere i nombre si hi ha GD i ND que no s'han pogut determinar, com passa en alguns pronoms: both, etc.)">
169 <pattern-item n=
"SN"/>
176 <clip pos=
"1" part=
"gen"/>
181 <clip pos=
"1" part=
"gen"/>
190 <clip pos=
"1" part=
"nbr"/>
195 <clip pos=
"1" part=
"nbr"/>
202 <clip pos=
"1" part=
"lem"/>
203 <clip pos=
"1" part=
"tags"/>
204 <clip pos=
"1" part=
"chcontent"/>
210 <rule comment=
"REGLA: haverhi SN">
212 <pattern-item n=
"haverhi"/>
213 <pattern-item n=
"SN"/>
222 <clip pos=
"2" part=
"nbr"/>
226 <clip pos=
"2" part=
"nbr"/>
233 <clip pos=
"1" part=
"nbr"/>
234 <clip pos=
"2" part=
"nbr"/>
239 <clip pos=
"1" part=
"nbr"/>
244 <choose><!--això no sé si fa falta però ho poso per si de cas, estudiar-ho i treure-ho si cal -->
248 <clip pos=
"2" part=
"nbr"/>
253 <clip pos=
"2" part=
"nbr"/>
258 <choose><!--això no sé si fa falta però ho poso per si de cas, estudiar-ho i treure-ho si cal -->
262 <clip pos=
"2" part=
"gen"/>
267 <clip pos=
"2" part=
"nbr"/>
274 <clip pos=
"1" part=
"whole"/>
278 <clip pos=
"2" part=
"whole"/>
286 <rule comment=
"REGLA: SN haverhi SN (per a frases com 'al seu país no hi ha dubte que', pq no entrin per 'SN SV')">
288 <pattern-item n=
"SN"/>
289 <pattern-item n=
"haverhi"/>
290 <pattern-item n=
"SN"/>
297 <clip pos=
"1" part=
"gen"/>
302 <clip pos=
"1" part=
"gen"/>
311 <clip pos=
"1" part=
"nbr"/>
316 <clip pos=
"1" part=
"nbr"/>
327 <clip pos=
"3" part=
"nbr"/>
331 <clip pos=
"3" part=
"nbr"/>
338 <clip pos=
"2" part=
"nbr"/>
339 <clip pos=
"3" part=
"nbr"/>
344 <clip pos=
"2" part=
"nbr"/>
349 <choose><!--això no sé si fa falta però ho poso per si de cas, estudiar-ho i treure-ho si cal -->
353 <clip pos=
"3" part=
"nbr"/>
358 <clip pos=
"3" part=
"nbr"/>
363 <choose><!--això no sé si fa falta però ho poso per si de cas, estudiar-ho i treure-ho si cal -->
367 <clip pos=
"3" part=
"gen"/>
372 <clip pos=
"3" part=
"nbr"/>
379 <clip pos=
"1" part=
"whole"/>
383 <clip pos=
"2" part=
"whole"/>
387 <clip pos=
"3" part=
"whole"/>
394 <rule comment=
"REGLA: haverhi (per quan no va seguit de SN, assignar-li nombre per defecte)">
396 <pattern-item n=
"haverhi"/>
403 <clip pos=
"1" part=
"nbr"/>
408 <clip pos=
"1" part=
"nbr"/>
415 <clip pos=
"1" part=
"whole"/>
426 <rule comment=
"REGLA: SN SV">
428 <pattern-item n=
"SN"/>
429 <pattern-item n=
"SV"/>
436 <clip pos=
"1" part=
"gen"/>
441 <clip pos=
"1" part=
"gen"/>
450 <clip pos=
"1" part=
"nbr"/>
455 <clip pos=
"1" part=
"nbr"/>
462 <clip pos=
"1" part=
"lem"/>
463 <clip pos=
"1" part=
"tags"/>
464 <clip pos=
"1" part=
"chcontent"/>
468 <clip pos=
"2" part=
"lem"/>
469 <clip pos=
"2" part=
"tags"/>
470 <clip pos=
"2" part=
"chcontent"/>
478 <rule comment=
"REGLA: SN SV inf (SN han decidit venir -> SN have decided TO come)" >
480 <pattern-item n=
"SN"/>
481 <pattern-item n=
"SV_pers"/>
482 <pattern-item n=
"inf"/>
489 <clip pos=
"1" part=
"gen"/>
494 <clip pos=
"1" part=
"gen"/>
503 <clip pos=
"1" part=
"nbr"/>
508 <clip pos=
"1" part=
"nbr"/>
515 <clip pos=
"1" part=
"whole"/>
519 <clip pos=
"2" part=
"whole"/>
524 <when><!--si és vbmod (o vaux: "can") no posis el "to" pq no cal ("can") o ja el té incorporat ("have to"). -->
529 <clip pos=
"2" part=
"a_verb"/>
533 <clip pos=
"2" part=
"a_verb"/>
541 <get-case-from pos=
"3">
546 <get-case-from pos=
"3">
558 <clip pos=
"3" part=
"whole"/>
564 <rule comment=
"REGLA: SV inf (han decidit venir -> have decided TO come) (caldria generar aquí subjecte? estudiar)" >
566 <pattern-item n=
"SV_pers"/>
567 <pattern-item n=
"inf"/>
572 <clip pos=
"1" part=
"whole"/>
577 <when><!--si és vbmod (o vaux: "can") no posis el "to" pq no cal ("can") o ja el té incorporat ("have to"). -->
582 <clip pos=
"1" part=
"a_verb"/>
586 <clip pos=
"1" part=
"a_verb"/>
594 <get-case-from pos=
"2">
599 <get-case-from pos=
"2">
611 <clip pos=
"2" part=
"whole"/>
620 <rule comment=
"REGLA: SV SA inf (és/considera difícil entendre -> is/considers difficult TO understand)" >
622 <pattern-item n=
"SV"/>
623 <pattern-item n=
"SA"/>
624 <pattern-item n=
"inf"/>
629 <clip pos=
"1" part=
"whole"/>
633 <clip pos=
"2" part=
"whole"/>
637 <get-case-from pos=
"3">
642 <get-case-from pos=
"3">
650 <clip pos=
"3" part=
"whole"/>
657 <rule comment=
"REGLA: SV SA de inf (és/considera difícil d'entendre -> is/considers difficult TO understand) MG: treure-ho? es fa ja tot en el t1x?" >
659 <pattern-item n=
"SV"/>
660 <pattern-item n=
"SA"/>
661 <pattern-item n=
"de"/>
662 <pattern-item n=
"inf"/>
667 <clip pos=
"1" part=
"whole"/>
671 <clip pos=
"2" part=
"whole"/>
675 <get-case-from pos=
"3">
680 <get-case-from pos=
"3">
688 <clip pos=
"4" part=
"whole"/>
695 <rule comment=
"REGLA: SN SV SA inf (això és/considera difícil entendre -> is/considers difficult TO understand)" >
697 <pattern-item n=
"SN"/>
698 <pattern-item n=
"SV"/>
699 <pattern-item n=
"SA"/>
700 <pattern-item n=
"inf"/>
707 <clip pos=
"1" part=
"gen"/>
712 <clip pos=
"1" part=
"gen"/>
721 <clip pos=
"1" part=
"nbr"/>
726 <clip pos=
"1" part=
"nbr"/>
733 <clip pos=
"1" part=
"whole"/>
737 <clip pos=
"2" part=
"whole"/>
741 <clip pos=
"3" part=
"whole"/>
745 <get-case-from pos=
"4">
750 <get-case-from pos=
"4">
758 <clip pos=
"4" part=
"whole"/>
765 <rule comment=
"REGLA: SN SV SA de inf (és/considera difícil d'entendre -> is/considers difficult TO understand) MG: treure-ho? es fa ja tot en el t1x?" >
767 <pattern-item n=
"SN"/>
768 <pattern-item n=
"SV"/>
769 <pattern-item n=
"SA"/>
770 <pattern-item n=
"de"/>
771 <pattern-item n=
"inf"/>
778 <clip pos=
"1" part=
"gen"/>
783 <clip pos=
"1" part=
"gen"/>
792 <clip pos=
"1" part=
"nbr"/>
797 <clip pos=
"1" part=
"nbr"/>
804 <clip pos=
"1" part=
"whole"/>
808 <clip pos=
"2" part=
"whole"/>
812 <clip pos=
"3" part=
"whole"/>
816 <get-case-from pos=
"4">
821 <get-case-from pos=
"4">
829 <clip pos=
"5" part=
"whole"/>
838 <rule comment="REGLA: SN ADV SV">
840 <pattern-item n="SN"/>
841 <pattern-item n="ADV"/>
842 <pattern-item n="SV"/>
849 <clip pos="1" part="gen"/>
854 <clip pos="1" part="gen"/>
863 <clip pos="1" part="nbr"/>
868 <clip pos="1" part="nbr"/>
877 <clip pos="1" part="lem"/>
878 <clip pos="1" part="tags"/>
879 <clip pos="1" part="chcontent"/>
883 <clip pos="2" part="lem"/>
884 <clip pos="2" part="tags"/>
885 <clip pos="2" part="chcontent"/>
889 <clip pos="3" part="lem"/>
890 <clip pos="3" part="tags"/>
891 <clip pos="3" part="chcontent"/>
897 <!--Regles per a afegir pronom subjecte -->
899 <rule comment=
"REGLA: punt SV (. Significava -> IT meant)">
901 <pattern-item n=
"punt"/>
902 <pattern-item n=
"SV_pers"/>
907 <clip pos=
"1" part=
"whole"/>
916 <clip pos=
"2" part=
"temps"/>
923 <get-case-from pos=
"2">
926 <lit-tag v=
"prn.subj"/>
927 <clip pos=
"2" part=
"pers"/>
929 <clip pos=
"2" part=
"nbr"/>
931 <get-case-from pos=
"2">
934 <lit-tag v=
"prn.subj.3.4.5"/>
943 <case-of pos=
"2" part=
"lem"/>
948 <clip pos=
"2" part=
"lem"/>
957 <clip pos=
"2" part=
"lem"/>
958 <clip pos=
"2" part=
"tags"/>
959 <clip pos=
"2" part=
"chcontent"/>
965 <rule comment=
"REGLA: punt SV inf (. Intentava venir -> IT tried TO come)">
967 <pattern-item n=
"punt"/>
968 <pattern-item n=
"SV_pers"/>
969 <pattern-item n=
"inf"/>
974 <clip pos=
"1" part=
"whole"/>
983 <clip pos=
"2" part=
"temps"/>
990 <get-case-from pos=
"2">
993 <lit-tag v=
"prn.subj"/>
994 <clip pos=
"2" part=
"pers"/>
996 <clip pos=
"2" part=
"nbr"/>
998 <get-case-from pos=
"2">
1001 <lit-tag v=
"prn.subj.3.4.5"/>
1010 <case-of pos=
"2" part=
"lem"/>
1015 <clip pos=
"2" part=
"lem"/>
1024 <clip pos=
"2" part=
"lem"/>
1025 <clip pos=
"2" part=
"tags"/>
1026 <clip pos=
"2" part=
"chcontent"/>
1031 <when><!--si és vbmod (o vaux: "can") no posis el "to" pq no cal ("can") o ja el té incorporat ("have to"). -->
1036 <clip pos=
"2" part=
"a_verb"/>
1037 <lit-tag v=
"vbmod"/>
1040 <clip pos=
"2" part=
"a_verb"/>
1048 <get-case-from pos=
"3">
1053 <get-case-from pos=
"3">
1065 <clip pos=
"3" part=
"whole"/>
1072 <rule comment=
"REGLA: punt SV SA inf (. Era difícil ajudar -> IT was difficult TO help)">
1074 <pattern-item n=
"punt"/>
1075 <pattern-item n=
"SV_pers"/>
1076 <pattern-item n=
"SA"/>
1077 <pattern-item n=
"inf"/>
1082 <clip pos=
"1" part=
"whole"/>
1091 <clip pos=
"2" part=
"temps"/>
1098 <get-case-from pos=
"2">
1101 <lit-tag v=
"prn.subj"/>
1102 <clip pos=
"2" part=
"pers"/>
1104 <clip pos=
"2" part=
"nbr"/>
1106 <get-case-from pos=
"2">
1109 <lit-tag v=
"prn.subj.3.4.5"/>
1118 <case-of pos=
"2" part=
"lem"/>
1123 <clip pos=
"2" part=
"lem"/>
1132 <clip pos=
"2" part=
"lem"/>
1133 <clip pos=
"2" part=
"tags"/>
1134 <clip pos=
"2" part=
"chcontent"/>
1138 <clip pos=
"3" part=
"whole"/>
1142 <get-case-from pos=
"4">
1147 <get-case-from pos=
"4">
1155 <clip pos=
"4" part=
"whole"/>
1164 <rule comment=
"REGLA: punt SV SA de inf (. Era difícil d'ajudar -> IT was difficult TO help) MG: treure-ho? es fa ja tot en el t1x?">
1166 <pattern-item n=
"punt"/>
1167 <pattern-item n=
"SV_pers"/>
1168 <pattern-item n=
"SA"/>
1169 <pattern-item n=
"de"/>
1170 <pattern-item n=
"inf"/>
1175 <clip pos=
"1" part=
"whole"/>
1184 <clip pos=
"2" part=
"temps"/>
1191 <get-case-from pos=
"2">
1194 <lit-tag v=
"prn.subj"/>
1195 <clip pos=
"2" part=
"pers"/>
1197 <clip pos=
"2" part=
"nbr"/>
1199 <get-case-from pos=
"2">
1202 <lit-tag v=
"prn.subj.3.4.5"/>
1211 <case-of pos=
"2" part=
"lem"/>
1216 <clip pos=
"2" part=
"lem"/>
1225 <clip pos=
"2" part=
"lem"/>
1226 <clip pos=
"2" part=
"tags"/>
1227 <clip pos=
"2" part=
"chcontent"/>
1231 <clip pos=
"3" part=
"whole"/>
1235 <get-case-from pos=
"4">
1240 <get-case-from pos=
"4">
1248 <clip pos=
"5" part=
"whole"/>
1255 <rule comment=
"REGLA: cnjsub SV ( que vinguis -> that YOU come)">
1257 <pattern-item n=
"cnjsub"/>
1258 <pattern-item n=
"SV_pers"/>
1263 <clip pos=
"1" part=
"whole"/>
1267 <get-case-from pos=
"2">
1270 <lit-tag v=
"prn.subj"/>
1271 <clip pos=
"2" part=
"pers"/>
1273 <clip pos=
"2" part=
"nbr"/>
1275 <get-case-from pos=
"2">
1278 <lit-tag v=
"prn.subj.3.4.5"/>
1283 <clip pos=
"2" part=
"whole"/>
1289 <rule comment=
"REGLA: cnjsub SV inf ( que intentis venir -> that YOU try TO come)">
1291 <pattern-item n=
"cnjsub"/>
1292 <pattern-item n=
"SV_pers"/>
1293 <pattern-item n=
"inf"/>
1298 <clip pos=
"1" part=
"whole"/>
1302 <get-case-from pos=
"2">
1305 <lit-tag v=
"prn.subj"/>
1306 <clip pos=
"2" part=
"pers"/>
1308 <clip pos=
"2" part=
"nbr"/>
1310 <get-case-from pos=
"2">
1313 <lit-tag v=
"prn.subj.3.4.5"/>
1318 <clip pos=
"2" part=
"whole"/>
1323 <when><!--si és vbmod (o vaux: "can") no posis el "to" pq no cal ("can") o ja el té incorporat ("have to"). -->
1328 <clip pos=
"2" part=
"a_verb"/>
1329 <lit-tag v=
"vbmod"/>
1332 <clip pos=
"2" part=
"a_verb"/>
1340 <get-case-from pos=
"3">
1345 <get-case-from pos=
"3">
1357 <clip pos=
"3" part=
"whole"/>
1364 <rule comment=
"REGLA: cnjsub SV SA inf ( que és difícil venir -> that IT is difficult TO come)">
1366 <pattern-item n=
"cnjsub"/>
1367 <pattern-item n=
"SV_pers"/>
1368 <pattern-item n=
"SA"/>
1369 <pattern-item n=
"inf"/>
1374 <clip pos=
"1" part=
"whole"/>
1378 <get-case-from pos=
"2">
1381 <lit-tag v=
"prn.subj"/>
1382 <clip pos=
"2" part=
"pers"/>
1384 <clip pos=
"2" part=
"nbr"/>
1386 <get-case-from pos=
"2">
1389 <lit-tag v=
"prn.subj.3.4.5"/>
1394 <clip pos=
"2" part=
"whole"/>
1398 <clip pos=
"3" part=
"whole"/>
1402 <get-case-from pos=
"4">
1407 <get-case-from pos=
"4">
1415 <clip pos=
"4" part=
"whole"/>
1421 <rule comment=
"REGLA: cnjsub SV SA de inf ( que és difícil d'entendre -> that IT is difficult TO understand) MG: treure-ho? es fa ja tot en el t1x?">
1423 <pattern-item n=
"cnjsub"/>
1424 <pattern-item n=
"SV_pers"/>
1425 <pattern-item n=
"SA"/>
1426 <pattern-item n=
"de"/>
1427 <pattern-item n=
"inf"/>
1432 <clip pos=
"1" part=
"whole"/>
1436 <get-case-from pos=
"2">
1439 <lit-tag v=
"prn.subj"/>
1440 <clip pos=
"2" part=
"pers"/>
1442 <clip pos=
"2" part=
"nbr"/>
1444 <get-case-from pos=
"2">
1447 <lit-tag v=
"prn.subj.3.4.5"/>
1452 <clip pos=
"2" part=
"whole"/>
1456 <clip pos=
"3" part=
"whole"/>
1460 <get-case-from pos=
"4">
1465 <get-case-from pos=
"4">
1473 <clip pos=
"5" part=
"whole"/>