1 <?xml version=
"1.0" encoding=
"UTF-8"?> <!-- -*- nxml -*- -->
<!-- Chunk-category definitions. Each cat-item names a chunk; rule patterns further down
     refer to the enclosing def-cat through its n attribute (e.g. pattern-item n="pottenirpronom").
     NOTE(review): several def-cat opening and closing tags are not visible in this excerpt. -->
8 <cat-item name=
"inf_enc"/>
9 <cat-item name=
"subs_enc"/>
10 <cat-item name=
"inf_enc_enc"/>
13 <cat-item name=
"inf_inf"/>
16 <def-cat n=
"ger"> <!-- BCN -->
17 <cat-item name=
"ger"/>
21 <cat-item name=
"ger_enc"/>
24 <def-cat n=
"ger_enc_enc">
25 <cat-item name=
"ger_enc_enc"/>
33 <cat-item name=
"nom"/>
37 <cat-item name=
"nom_nom"/>
41 <cat-item name=
"adj_nom"/>
44 <def-cat n=
"adj_adj_nom">
45 <cat-item name=
"adj_adj_nom"/>
48 <def-cat n=
"nom_i_nom">
49 <cat-item name=
"nom_conj_nom"/>
54 <def-cat n=
"pottenirpronom">
55 <cat-item name=
"verbcj"/>
56 <cat-item name=
"verbcj_perif"/>
57 <cat-item name=
"pro_verbcj"/>
58 <cat-item name=
"pro_verbcj_perif"/>
59 <cat-item name=
"auxmod_inf"/>
60 <cat-item name=
"mod_inf"/>
61 <cat-item name=
"have_pp"/>
62 <cat-item name=
"be_ger"/>
63 <cat-item name=
"auxmod_mod_inf"/>
64 <cat-item name=
"mod_inf_perif"/>
65 <cat-item name=
"pro_be_ger"/>
66 <cat-item name=
"pro_auxmod_inf"/>
67 <cat-item name=
"pro_mod_inf"/>
68 <cat-item name=
"pro_have_pp"/>
69 <cat-item name=
"pro_do_inf"/>
70 <cat-item name=
"pro_mod_inf_perif"/>
71 <cat-item name=
"pro_auxmod_mod_inf"/>
72 <cat-item name=
"pro_auxmod_have_pp"/>
75 <def-cat n=
"pottenirenclitic"><!-- MG: switch all of this to the new mechanism, with no mlu in the t1x, and build the mlu here -->
76 <cat-item name=
"verbcj_inf_perif"/>
77 <cat-item name=
"verbcj_inf"/>
78 <cat-item name=
"auxmod_inf_inf"/>
79 <cat-item name=
"have_pp_inf"/>
80 <cat-item name=
"be_inf_inf"/>
86 <def-cat n=
"pro_vblike">
87 <cat-item name=
"pro_vblike"/>
89 <def-cat n=
"pro_vblike2">
90 <cat-item name=
"pro_vblike2"/>
92 <def-cat n=
"pro_vblike3">
93 <cat-item name=
"pro_vblike3"/>
<!-- Attribute definitions. Each attr-item lists one tag (or dotted tag sequence). The def-attr
     names visible here (tipus_verb, a_preadv, a_verb, a_prnpro, a_prnenc) are referenced by
     clip part="..." in the rules.
     NOTE(review): some def-attr opening and closing tags are not visible in this excerpt. -->
105 <attr-item tags=
"p1"/>
106 <attr-item tags=
"p2"/>
107 <attr-item tags=
"p3"/>
108 <attr-item tags=
"PD"/>
112 <attr-item tags=
"m"/>
113 <attr-item tags=
"f"/>
114 <attr-item tags=
"mf"/>
115 <attr-item tags=
"GD"/>
116 <attr-item tags=
"nt"/>
120 <attr-item tags=
"sg"/>
121 <attr-item tags=
"pl"/>
122 <attr-item tags=
"sp"/>
123 <attr-item tags=
"ND"/>
126 <def-attr n=
"tipus_verb">
127 <attr-item tags=
"SV.pron"/>
128 <attr-item tags=
"SV"/>
132 <attr-item tags=
"inf"/>
133 <attr-item tags=
"pres"/>
134 <attr-item tags=
"past"/>
135 <attr-item tags=
"pri"/>
136 <attr-item tags=
"pp"/>
137 <attr-item tags=
"ger"/>
138 <attr-item tags=
"pprs"/>
139 <attr-item tags=
"subs"/>
143 <attr-item tags=
"DET"/>
144 <attr-item tags=
"UNDET"/>
145 <attr-item tags=
"NUM"/>
146 <attr-item tags=
"PDET"/><!-- 'Per determinar' (to be determined): for UNDET noun phrases (SN) that must become determined; the postchunk performs this transformation when it detects PDET. -->
150 <def-attr n=
"a_preadv"><!-- BCN: needed to generate adj_nom correctly when there are comparatives/superlatives -->
151 <attr-item tags=
"preadv"/>
155 <def-attr n=
"a_verb">
156 <attr-item tags=
"vblex"/>
157 <attr-item tags=
"vblex.pron"/>
158 <attr-item tags=
"vbhaver"/>
159 <attr-item tags=
"vbser"/>
160 <attr-item tags=
"vbmod"/>
161 <attr-item tags=
"HAVER"/>
165 <attr-item tags=
"n"/>
166 <attr-item tags=
"np"/>
170 <attr-item tags=
"np.ant"/>
171 <attr-item tags=
"np.cog"/>
172 <attr-item tags=
"np.al"/>
175 <def-attr n=
"a_prnpro">
176 <attr-item tags=
"prn.pro"/>
179 <def-attr n=
"a_prnenc">
180 <attr-item tags=
"prn.enc"/>
184 <attr-item tags=
"ref"/>
<!-- Declares the variable "paraula" and the macro f_bcond, which takes one parameter
     (npar="1") and is invoked by several rules through call-macro.
     NOTE(review): the macro body is not visible in this excerpt. -->
189 <def-var n=
"paraula"/>
195 <def-macro n=
"f_bcond" npar=
"1">
213 </section-def-macros>
<!-- Rule for a single "nom" chunk. It reads a_SN from pos 0 (presumably the chunk itself)
     and a_nom, gen, nbr, the case and the whole form of word 1, together with a literal
     det.def tag.
     NOTE(review): the test/let/out structure around these references is not visible here. -->
217 <rule comment=
"CHUNK: nom">
219 <pattern-item n=
"nom"/>
227 <clip pos=
"0" part=
"a_SN"/>
232 <clip pos=
"1" part=
"a_nom"/>
240 <get-case-from pos=
"1">
243 <lit-tag v=
"det.def"/>
244 <clip pos=
"1" part=
"gen"/>
245 <clip pos=
"1" part=
"nbr"/>
253 <clip pos=
"1" part=
"whole"/>
<!-- Rule for an "adj_nom" chunk. It reads a_SN from pos 0, takes case, gen and nbr from
     word 1 next to a literal det.def tag, and references the whole forms of words 1, 2 and 3.
     The choose compares word 2's a_preadv with the preadv tag.
     NOTE(review): the test/let/out structure around these references is not visible here. -->
259 <rule comment=
"CHUNK: adj nom">
261 <pattern-item n=
"adj_nom"/>
268 <clip pos=
"0" part=
"a_SN"/>
274 <get-case-from pos=
"1">
277 <lit-tag v=
"det.def"/>
278 <clip pos=
"1" part=
"gen"/>
279 <clip pos=
"1" part=
"nbr"/>
287 <clip pos=
"1" part=
"whole"/>
291 <clip pos=
"2" part=
"whole"/>
294 <choose> <!-- BCN: if the adverb 'més' has been added, the adjective is not generated -->
298 <clip pos=
"2" part=
"a_preadv"/>
299 <lit-tag v=
"preadv"/>
305 <clip pos=
"3" part=
"whole"/>
<!-- Rule for the "nom_i_nom" category (chunk name nom_conj_nom). It reads a_SN from pos 0
     and a_nom from word 1. A literal det.def tag with case, gen and nbr appears once for
     word 1 and once for word 3, and the whole forms of words 1, 2 and 3 are referenced twice.
     NOTE(review): the branching that selects between the two output sequences is not visible here. -->
313 <rule comment=
"CHUNK: nom conj nom">
315 <pattern-item n=
"nom_i_nom"/>
323 <clip pos=
"0" part=
"a_SN"/>
328 <clip pos=
"1" part=
"a_nom"/>
336 <get-case-from pos=
"1">
339 <lit-tag v=
"det.def"/>
340 <clip pos=
"1" part=
"gen"/>
341 <clip pos=
"1" part=
"nbr"/>
345 <clip pos=
"1" part=
"whole"/>
349 <clip pos=
"2" part=
"whole"/>
353 <get-case-from pos=
"3">
356 <lit-tag v=
"det.def"/>
357 <clip pos=
"3" part=
"gen"/>
358 <clip pos=
"3" part=
"nbr"/>
362 <clip pos=
"3" part=
"whole"/>
369 <clip pos=
"1" part=
"whole"/>
373 <clip pos=
"2" part=
"whole"/>
377 <clip pos=
"3" part=
"whole"/>
<!-- Rule for an "adj_adj_nom" chunk. It reads a_SN from pos 0, takes case, gen and nbr from
     word 1 next to a literal det.def tag, and references the whole forms of words 1, 2 and 3.
     NOTE(review): the test/let/out structure around these references is not visible here. -->
386 <rule comment=
"CHUNK: adj adj nom">
388 <pattern-item n=
"adj_adj_nom"/>
395 <clip pos=
"0" part=
"a_SN"/>
401 <get-case-from pos=
"1">
404 <lit-tag v=
"det.def"/>
405 <clip pos=
"1" part=
"gen"/>
406 <clip pos=
"1" part=
"nbr"/>
414 <clip pos=
"1" part=
"whole"/>
418 <clip pos=
"2" part=
"whole"/>
422 <clip pos=
"3" part=
"whole"/>
<!-- Rule for an "inf" chunk. The test inspects pers and temps of pos 0. One output sequence is
     built from word 1's lemh and tags, pos 0's pers and nbr, and word 1's lemq; another
     reference uses word 1's whole form.
     NOTE(review): the operands compared in the test and the when/otherwise split are not visible here. -->
431 <rule comment=
"CHUNK: INF">
433 <pattern-item n=
"inf"/>
438 <test><!-- Check whether it has stopped being 'inf' and has received person and number. If it is not PD it should not be ND either, in principle -->
442 <clip pos=
"0" part=
"pers"/>
448 <clip pos=
"0" part=
"temps"/>
456 <clip pos=
"1" part=
"lemh"/>
457 <clip pos=
"1" part=
"tags"/>
458 <clip pos=
"0" part=
"pers"/>
459 <clip pos=
"0" part=
"nbr"/>
460 <clip pos=
"1" part=
"lemq"/>
467 <clip pos=
"1" part=
"whole"/>
<!-- Rule for an "inf_2" chunk (infinitive plus a second word). It makes the same references
     as the single-word INF rule (pers and temps of pos 0 in the test; lemh, tags and lemq of
     word 1 with pers and nbr of pos 0; word 1 whole) and additionally references word 2 whole.
     NOTE(review): the when/otherwise split is not visible here. -->
478 <rule comment=
"CHUNK: INF + 2a paraula">
480 <pattern-item n=
"inf_2"/>
485 <test><!-- Check whether it has stopped being 'inf' and has received person and number. If it is not PD it should not be ND either, in principle -->
489 <clip pos=
"0" part=
"pers"/>
495 <clip pos=
"0" part=
"temps"/>
503 <clip pos=
"1" part=
"lemh"/>
504 <clip pos=
"1" part=
"tags"/>
505 <clip pos=
"0" part=
"pers"/>
506 <clip pos=
"0" part=
"nbr"/>
507 <clip pos=
"1" part=
"lemq"/>
514 <clip pos=
"1" part=
"whole"/>
522 <clip pos=
"2" part=
"whole"/>
<!-- Rule for a "ger" chunk. The test inspects pers and temps of pos 0. One output sequence is
     built from word 1's lemh and tags, pos 0's pers and nbr, and word 1's lemq; another
     reference uses word 1's whole form.
     NOTE(review): the operands compared in the test and the when/otherwise split are not visible here. -->
533 <rule comment=
"CHUNK: GER (BCN)">
535 <pattern-item n=
"ger"/>
540 <test><!-- If it is not PD it should not be ND either, in principle -->
544 <clip pos=
"0" part=
"pers"/>
550 <clip pos=
"0" part=
"temps"/>
558 <clip pos=
"1" part=
"lemh"/>
559 <clip pos=
"1" part=
"tags"/>
560 <clip pos=
"0" part=
"pers"/>
561 <clip pos=
"0" part=
"nbr"/>
562 <clip pos=
"1" part=
"lemq"/>
569 <clip pos=
"1" part=
"whole"/>
<!-- Rule for a "ger_enc" chunk (gerund plus one pronoun). The test inspects pers and temps of
     pos 0. In the first branch the pronoun is rebuilt from word 2 (lem, literal prn.pro tag,
     a_ref, pers, gen, nbr) and the verb from word 1 (lemh, tags) with pos 0's pers and nbr and
     word 2's lemq. The otherwise branch references the whole forms of words 1 and 2.
     The rule then calls f_bcond with position 1. -->
577 <rule comment=
"CHUNK: GER ENC">
579 <pattern-item n=
"ger_enc"/>
584 <test><!-- If it is not PD it should not be ND either, in principle -->
588 <clip pos=
"0" part=
"pers"/>
594 <clip pos=
"0" part=
"temps"/>
602 <clip pos=
"2" part=
"lem"/>
603 <lit-tag v=
"prn.pro"/>
604 <clip pos=
"2" part=
"a_ref"/><!-- only has a value if the pronoun is reflexive -->
605 <clip pos=
"2" part=
"pers"/>
606 <clip pos=
"2" part=
"gen"/>
607 <clip pos=
"2" part=
"nbr"/>
611 <clip pos=
"1" part=
"lemh"/>
612 <clip pos=
"1" part=
"tags"/>
613 <clip pos=
"0" part=
"pers"/>
614 <clip pos=
"0" part=
"nbr"/>
615 <clip pos=
"2" part=
"lemq"/><!-- note: lemq is taken from position 2 even though it belongs to the verb, because the t1x operations made it the queue of the pronoun rather than of the verb; it has to be put back in place here -->
619 <otherwise><!-- if they have no pers or nbr, the 'mlu' must be created. Here the queue is already fine as it is -->
623 <clip pos=
"1" part=
"whole"/>
626 <clip pos=
"2" part=
"whole"/>
632 <call-macro n=
"f_bcond">
633 <with-param pos=
"1"/>
<!-- Rule for a "ger_enc_enc" chunk (gerund plus two pronouns). The test inspects pers and
     temps of pos 0. In the first branch two pronouns are rebuilt, from word 2 (lem, literal
     prn.pro tag, a_ref, pers, gen, nbr) and from word 3 (lem, literal prn.pro tag, pers, gen,
     nbr), followed by the verb from word 1 (lemh, tags) with pos 0's pers and nbr and word 2's
     lemq. The otherwise branch references the whole forms of words 1, 2 and 3.
     The rule then calls f_bcond with position 1.
     The comment label below used to read "CHUNK: GER ENC", identical to the label of the
     ger_enc rule; it now names the pattern this rule actually matches. -->
639 <rule comment=
"CHUNK: GER ENC ENC">
641 <pattern-item n=
"ger_enc_enc"/>
646 <test><!-- If it is not PD it should not be ND either, in principle -->
650 <clip pos=
"0" part=
"pers"/>
656 <clip pos=
"0" part=
"temps"/>
664 <clip pos=
"2" part=
"lem"/>
665 <lit-tag v=
"prn.pro"/>
666 <clip pos=
"2" part=
"a_ref"/><!-- only has a value if the pronoun is reflexive -->
667 <clip pos=
"2" part=
"pers"/>
668 <clip pos=
"2" part=
"gen"/>
669 <clip pos=
"2" part=
"nbr"/>
673 <clip pos=
"3" part=
"lem"/>
674 <lit-tag v=
"prn.pro"/>
675 <clip pos=
"3" part=
"pers"/>
676 <clip pos=
"3" part=
"gen"/>
677 <clip pos=
"3" part=
"nbr"/>
681 <clip pos=
"1" part=
"lemh"/>
682 <clip pos=
"1" part=
"tags"/>
683 <clip pos=
"0" part=
"pers"/>
684 <clip pos=
"0" part=
"nbr"/>
685 <clip pos=
"2" part=
"lemq"/><!-- note: lemq is taken from position 2 even though it belongs to the verb, because the t1x operations made it the queue of the pronoun rather than of the verb; it has to be put back in place here -->
689 <otherwise><!-- if they have no pers or nbr, the 'mlu' must be created. Here the queue is already fine as it is -->
693 <clip pos=
"1" part=
"whole"/>
696 <clip pos=
"2" part=
"whole"/>
699 <clip pos=
"3" part=
"whole"/>
705 <call-macro n=
"f_bcond">
706 <with-param pos=
"1"/>
<!-- Rule for a "be" chunk ("there is"). It reads a_verb from pos 0. The first choose compares
     word 1's lem case-insensitively and then touches either word 2 (lem, a_verb with a literal
     vbhaver tag) or word 1 (lem, a_verb with a literal vbhaver tag). The second choose repeats
     the comparison on word 1's lem and references either words 1 and 2 or word 1 alone.
     NOTE(review): the literal that word 1's lem is compared with, and the values assigned to
     lem, are not visible in this excerpt. -->
712 <rule comment=
"CHUNK: BE (there is)">
714 <pattern-item n=
"be"/>
721 <clip pos=
"0" part=
"a_verb"/>
725 <choose><!-- in this rule the chunk name does not distinguish periphrastic from synthetic forms: check whether the first word is 'anar' and, if so, modify the lemma of the 2nd word; otherwise, that of the first. -->
728 <equal caseless=
"yes">
729 <clip pos=
"1" part=
"lem"/>
734 <clip pos=
"2" part=
"lem"/>
738 <clip pos=
"2" part=
"a_verb"/>
739 <lit-tag v=
"vbhaver"/>
744 <clip pos=
"1" part=
"lem"/>
748 <clip pos=
"1" part=
"a_verb"/>
749 <lit-tag v=
"vbhaver"/>
755 <choose><!-- outputs 1 or 2 chunks depending on whether it is periphrastic or not -->
758 <equal caseless=
"yes">
759 <clip pos=
"1" part=
"lem"/>
765 <clip pos=
"1" part=
"whole"/>
769 <clip pos=
"2" part=
"whole"/>
776 <clip pos=
"1" part=
"whole"/>
785 <!-- rules to fix "like"-type verbs ("like" -> "m'agrada") -->
<!-- Rule for a "pro_vblike" chunk (LIKE-type verb with pronoun). It pairs word 2's pers with
     word 1's pers and word 2's nbr with word 1's nbr, references word 2's whole form, and
     calls f_bcond with position 1.
     NOTE(review): the elements wrapping each pers/nbr pair are not visible; presumably they are
     let assignments copying word 1's values onto word 2 (confirm against the full file). -->
787 <rule comment=
"assigna persona i nombre als verbs tipus LIKE amb pronom">
789 <pattern-item n=
"pro_vblike"/>
793 <clip pos=
"2" part=
"pers"/>
794 <clip pos=
"1" part=
"pers"/>
797 <clip pos=
"2" part=
"nbr"/>
798 <clip pos=
"1" part=
"nbr"/>
802 <clip pos=
"2" part=
"whole"/>
805 <call-macro n=
"f_bcond">
806 <with-param pos=
"1"/>
<!-- Rule for a "pro_vblike2" chunk. Same pers/nbr pairing between words 2 and 1 as the
     pro_vblike rule, but it references the whole forms of words 2 and 3 and calls f_bcond
     with position 2.
     NOTE(review): the elements wrapping each pers/nbr pair are not visible; presumably they are
     let assignments (confirm against the full file). -->
811 <rule comment=
"assigna persona i nombre als verbs tipus LIKE amb pronom">
813 <pattern-item n=
"pro_vblike2"/>
817 <clip pos=
"2" part=
"pers"/>
818 <clip pos=
"1" part=
"pers"/>
821 <clip pos=
"2" part=
"nbr"/>
822 <clip pos=
"1" part=
"nbr"/>
826 <clip pos=
"2" part=
"whole"/>
830 <clip pos=
"3" part=
"whole"/>
833 <call-macro n=
"f_bcond">
834 <with-param pos=
"2"/>
<!-- Rule for a "pro_vblike3" chunk. Same pers/nbr pairing between words 2 and 1 as the
     pro_vblike rule, but it references the whole forms of words 2, 3 and 4 and calls f_bcond
     with position 3.
     NOTE(review): the elements wrapping each pers/nbr pair are not visible; presumably they are
     let assignments (confirm against the full file). -->
839 <rule comment=
"assigna persona i nombre als verbs tipus LIKE amb pronom">
841 <pattern-item n=
"pro_vblike3"/>
845 <clip pos=
"2" part=
"pers"/>
846 <clip pos=
"1" part=
"pers"/>
849 <clip pos=
"2" part=
"nbr"/>
850 <clip pos=
"1" part=
"nbr"/>
854 <clip pos=
"2" part=
"whole"/>
858 <clip pos=
"3" part=
"whole"/>
862 <clip pos=
"4" part=
"whole"/>
865 <call-macro n=
"f_bcond">
866 <with-param pos=
"3"/>
871 <!-- rules to fix the third-person reflexive pronoun (li -> se) -->
<!-- Rule for the "pottenirpronom" category (verb chunks that may carry a proclitic pronoun).
     First part: compares pos 0's tipus_verb with the SV.pron tag, reads pos 0's pers, and
     touches word 1's lem, a_prnpro (next to a literal prn.pro.ref tag) and nbr. It then
     compares the chunk name (pos 0 lem, case-insensitive) against lists of chunk names and
     references the whole forms of words 1-2, 1-3, 1-4 or 1-5 accordingly.
     Second part: compares pos 0's a_verb with the HAVER tag and, depending on the chunk name,
     touches lem and a_verb (next to a literal vbhaver tag) of word 1, 2 or 3; the final out
     references word 1 followed by words 2, 2-3 or 2-4 depending on the chunk name.
     NOTE(review): the when/otherwise/or/let wrappers and some lit operands are not visible in
     this excerpt, so the exact branch boundaries should be confirmed against the full file. -->
873 <rule comment=
"arregla el pron reflexiu de tercera persona, quan és proclític">
875 <pattern-item n=
"pottenirpronom"/>
882 <clip pos=
"0" part=
"tipus_verb"/>
883 <lit-tag v=
"SV.pron"/>
890 <clip pos=
"0" part=
"pers"/>
895 <clip pos=
"1" part=
"lem"/>
899 <clip pos=
"1" part=
"a_prnpro"/>
900 <lit-tag v=
"prn.pro.ref"/>
903 <clip pos=
"1" part=
"nbr"/>
910 <clip pos=
"1" part=
"whole"/>
914 <clip pos=
"2" part=
"whole"/>
921 <equal caseless=
"yes">
922 <clip pos=
"0" part=
"lem"/>
923 <lit v=
"verbcj_perif"/>
925 <equal caseless=
"yes">
926 <clip pos=
"0" part=
"lem"/>
927 <lit v=
"pro_verbcj"/>
929 <equal caseless=
"yes">
930 <clip pos=
"0" part=
"lem"/>
931 <lit v=
"auxmod_inf"/>
933 <equal caseless=
"yes">
934 <clip pos=
"0" part=
"lem"/>
937 <equal caseless=
"yes">
938 <clip pos=
"0" part=
"lem"/>
941 <equal caseless=
"yes">
942 <clip pos=
"0" part=
"lem"/>
950 <clip pos=
"3" part=
"whole"/>
959 <equal caseless=
"yes">
960 <clip pos=
"0" part=
"lem"/>
961 <lit v=
"pro_verbcj_perif"/>
963 <equal caseless=
"yes">
964 <clip pos=
"0" part=
"lem"/>
965 <lit v=
"auxmod_mod_inf"/>
967 <equal caseless=
"yes">
968 <clip pos=
"0" part=
"lem"/>
969 <lit v=
"mod_inf_perif"/>
971 <equal caseless=
"yes">
972 <clip pos=
"0" part=
"lem"/>
973 <lit v=
"pro_be_ger"/>
975 <equal caseless=
"yes">
976 <clip pos=
"0" part=
"lem"/>
977 <lit v=
"pro_auxmod_inf"/>
979 <equal caseless=
"yes">
980 <clip pos=
"0" part=
"lem"/>
981 <lit v=
"pro_mod_inf"/>
983 <equal caseless=
"yes">
984 <clip pos=
"0" part=
"lem"/>
985 <lit v=
"pro_have_pp"/>
987 <equal caseless=
"yes">
988 <clip pos=
"0" part=
"lem"/>
989 <lit v=
"pro_do_inf"/>
996 <clip pos=
"3" part=
"whole"/>
1000 <clip pos=
"4" part=
"whole"/>
1009 <equal caseless=
"yes">
1010 <clip pos=
"0" part=
"lem"/>
1011 <lit v=
"pro_mod_inf_perif"/>
1013 <equal caseless=
"yes">
1014 <clip pos=
"0" part=
"lem"/>
1015 <lit v=
"pro_auxmod_mod_inf"/>
1017 <equal caseless=
"yes">
1018 <clip pos=
"0" part=
"lem"/>
1019 <lit v=
"pro_auxmod_have_pp"/>
1026 <clip pos=
"3" part=
"whole"/>
1030 <clip pos=
"4" part=
"whole"/>
1034 <clip pos=
"5" part=
"whole"/>
1041 <choose><!-- Check whether any verb is HAVER (from 'haver-hi'); if so, the lemmas and tags of the main verb must be changed ('ser' becomes 'haver') -->
1045 <clip pos=
"0" part=
"a_verb"/>
1046 <lit-tag v=
"HAVER"/>
1052 <equal caseless=
"yes">
1053 <clip pos=
"0" part=
"lem"/>
1058 <clip pos=
"1" part=
"lem"/>
1062 <clip pos=
"1" part=
"a_verb"/>
1063 <lit-tag v=
"vbhaver"/>
1069 <equal caseless=
"yes">
1070 <clip pos=
"0" part=
"lem"/>
1071 <lit v=
"auxmod_inf"/>
1073 <equal caseless=
"yes">
1074 <clip pos=
"0" part=
"lem"/>
1077 <equal caseless=
"yes">
1078 <clip pos=
"0" part=
"lem"/>
1081 <equal caseless=
"yes">
1082 <clip pos=
"0" part=
"lem"/>
1083 <lit v=
"verbcj_perif"/>
1088 <clip pos=
"2" part=
"lem"/>
1092 <clip pos=
"2" part=
"a_verb"/>
1093 <lit-tag v=
"vbhaver"/>
1099 <equal caseless=
"yes">
1100 <clip pos=
"0" part=
"lem"/>
1101 <lit v=
"auxmod_mod_inf"/>
1103 <equal caseless=
"yes">
1104 <clip pos=
"0" part=
"lem"/>
1105 <lit v=
"mod_inf_perif"/>
1110 <clip pos=
"3" part=
"lem"/>
1114 <clip pos=
"3" part=
"a_verb"/>
1115 <lit-tag v=
"vbhaver"/>
1122 <out><!-- And now output the result of everything -->
1124 <clip pos=
"1" part=
"whole"/>
1131 <equal caseless=
"yes">
1132 <clip pos=
"0" part=
"lem"/>
1133 <lit v=
"verbcj_perif"/>
1135 <equal caseless=
"yes">
1136 <clip pos=
"0" part=
"lem"/>
1137 <lit v=
"pro_verbcj"/>
1139 <equal caseless=
"yes">
1140 <clip pos=
"0" part=
"lem"/>
1141 <lit v=
"auxmod_inf"/>
1143 <equal caseless=
"yes">
1144 <clip pos=
"0" part=
"lem"/>
1147 <equal caseless=
"yes">
1148 <clip pos=
"0" part=
"lem"/>
1151 <equal caseless=
"yes">
1152 <clip pos=
"0" part=
"lem"/>
1160 <clip pos=
"2" part=
"whole"/>
1169 <equal caseless=
"yes">
1170 <clip pos=
"0" part=
"lem"/>
1171 <lit v=
"pro_verbcj_perif"/>
1173 <equal caseless=
"yes">
1174 <clip pos=
"0" part=
"lem"/>
1175 <lit v=
"auxmod_mod_inf"/>
1177 <equal caseless=
"yes">
1178 <clip pos=
"0" part=
"lem"/>
1179 <lit v=
"mod_inf_perif"/>
1181 <equal caseless=
"yes">
1182 <clip pos=
"0" part=
"lem"/>
1183 <lit v=
"pro_be_ger"/>
1185 <equal caseless=
"yes">
1186 <clip pos=
"0" part=
"lem"/>
1187 <lit v=
"pro_auxmod_inf"/>
1189 <equal caseless=
"yes">
1190 <clip pos=
"0" part=
"lem"/>
1191 <lit v=
"pro_mod_inf"/>
1193 <equal caseless=
"yes">
1194 <clip pos=
"0" part=
"lem"/>
1195 <lit v=
"pro_have_pp"/>
<!-- NOTE(review): "pro_be_ger" is already tested a few comparisons above in this same run; this second test appears redundant (the matching list earlier in the rule has no such repeat). -->
1197 <equal caseless=
"yes">
1198 <clip pos=
"0" part=
"lem"/>
1199 <lit v=
"pro_be_ger"/>
1201 <equal caseless=
"yes">
1202 <clip pos=
"0" part=
"lem"/>
1203 <lit v=
"pro_do_inf"/>
1210 <clip pos=
"2" part=
"whole"/>
1214 <clip pos=
"3" part=
"whole"/>
1223 <equal caseless=
"yes">
1224 <clip pos=
"0" part=
"lem"/>
1225 <lit v=
"pro_mod_inf_perif"/>
1227 <equal caseless=
"yes">
1228 <clip pos=
"0" part=
"lem"/>
1229 <lit v=
"pro_auxmod_mod_inf"/>
1231 <equal caseless=
"yes">
1232 <clip pos=
"0" part=
"lem"/>
1233 <lit v=
"pro_auxmod_have_pp"/>
1240 <clip pos=
"2" part=
"whole"/>
1244 <clip pos=
"3" part=
"whole"/>
1248 <clip pos=
"4" part=
"whole"/>
1259 <!--<rule comment="arregla el pron reflexiu de tercera persona quan és enclític. No es pot accedir el lema del pronom enclític i per ara no es pot fer la regla">
1261 <pattern-item n="pottenirenclitic"/>
1268 <clip pos="3" part="a_prnenc"/>
1269 <lit-tag v="prn.enc"/>
<!-- Rule for a "hi" chunk. It touches word 1's lem and tags (the latter next to a literal
     prn.pro.adv tag) and references word 1's whole form.
     NOTE(review): the wrapping elements are not visible; presumably lem and tags are assigned
     before word 1 is output (confirm against the full file). -->
1290 <rule comment=
"CHUNK: HI">
1292 <pattern-item n=
"hi"/>
1296 <clip pos=
"1" part=
"lem"/>
1300 <clip pos=
"1" part=
"tags"/>
1301 <lit-tag v=
"prn.pro.adv"/>
1305 <clip pos=
"1" part=
"whole"/>