1 <?xml version=
"1.0" encoding=
"UTF-8"?> <!-- -*- nxml -*- -->
10 <cat-item name=
"inf_inf"/>
12 <def-cat n=
"ger"> <!-- BCN -->
13 <cat-item name=
"ger"/>
17 <cat-item name=
"ger_enc"/>
26 <cat-item name=
"nom"/>
30 <cat-item name=
"nom_nom"/>
34 <cat-item name=
"adj_nom"/>
37 <def-cat n=
"adj_adj_nom">
38 <cat-item name=
"adj_adj_nom"/>
41 <def-cat n=
"nom_i_nom">
42 <cat-item name=
"nom_conj_nom"/>
45 <def-cat n=
"pottenirpronom">
46 <cat-item name=
"verbcj"/>
47 <cat-item name=
"verbcj_perif"/>
48 <cat-item name=
"pro_verbcj"/>
49 <cat-item name=
"pro_verbcj_perif"/>
50 <cat-item name=
"auxmod_inf"/>
51 <cat-item name=
"mod_inf"/>
52 <cat-item name=
"have_pp"/>
53 <cat-item name=
"be_ger"/>
54 <cat-item name=
"auxmod_mod_inf"/>
55 <cat-item name=
"mod_inf_perif"/>
56 <cat-item name=
"pro_be_ger"/>
57 <cat-item name=
"pro_auxmod_inf"/>
58 <cat-item name=
"pro_mod_inf"/>
59 <cat-item name=
"pro_have_pp"/>
60 <cat-item name=
"pro_do_inf"/>
61 <cat-item name=
"pro_mod_inf_perif"/>
62 <cat-item name=
"pro_auxmod_mod_inf"/>
63 <cat-item name=
"pro_auxmod_have_pp"/>
66 <def-cat n=
"pottenirenclitic">
67 <cat-item name=
"verbcj_inf_perif"/>
68 <cat-item name=
"verbcj_inf"/>
69 <cat-item name=
"auxmod_inf_inf"/>
70 <cat-item name=
"have_pp_inf"/>
71 <cat-item name=
"be_inf_inf"/>
77 <def-cat n=
"pro_vblike">
78 <cat-item name=
"pro_vblike"/>
80 <def-cat n=
"pro_vblike2">
81 <cat-item name=
"pro_vblike2"/>
83 <def-cat n=
"pro_vblike3">
84 <cat-item name=
"pro_vblike3"/>
96 <attr-item tags=
"p1"/>
97 <attr-item tags=
"p2"/>
98 <attr-item tags=
"p3"/>
99 <attr-item tags=
"PD"/>
103 <attr-item tags=
"m"/>
104 <attr-item tags=
"f"/>
105 <attr-item tags=
"mf"/>
106 <attr-item tags=
"GD"/>
107 <attr-item tags=
"nt"/>
111 <attr-item tags=
"sg"/>
112 <attr-item tags=
"pl"/>
113 <attr-item tags=
"sp"/>
114 <attr-item tags=
"ND"/>
117 <def-attr n=
"tipus_verb">
118 <attr-item tags=
"SV.pron"/>
119 <attr-item tags=
"SV"/>
123 <attr-item tags=
"inf"/>
124 <attr-item tags=
"pres"/>
125 <attr-item tags=
"past"/>
126 <attr-item tags=
"pri"/>
127 <attr-item tags=
"pp"/>
128 <attr-item tags=
"ger"/>
129 <attr-item tags=
"pprs"/>
130 <attr-item tags=
"subs"/>
134 <attr-item tags=
"DET"/>
135 <attr-item tags=
"UNDET"/>
136 <attr-item tags=
"NUM"/>
137 <attr-item tags=
"PDET"/><!-- 'To be determined': for UNDET noun phrases (SN) that must become determined; the postchunk stage performs that transformation by detecting PDET. -->
141 <def-attr n=
"a_preadv"><!-- BCN: used to generate adj_nom correctly when there are comparatives/superlatives -->
142 <attr-item tags=
"preadv"/>
146 <def-attr n=
"a_verb">
147 <attr-item tags=
"vblex"/>
148 <attr-item tags=
"vblex.pron"/>
149 <attr-item tags=
"vbhaver"/>
150 <attr-item tags=
"vbser"/>
151 <attr-item tags=
"vbmod"/>
152 <attr-item tags=
"HAVER"/>
156 <attr-item tags=
"n"/>
157 <attr-item tags=
"np"/>
161 <attr-item tags=
"np.ant"/>
162 <attr-item tags=
"np.cog"/>
163 <attr-item tags=
"np.al"/>
166 <def-attr n=
"a_prnpro">
167 <attr-item tags=
"prn.pro"/>
170 <def-attr n=
"a_prnenc">
171 <attr-item tags=
"prn.enc"/>
177 <def-var n=
"paraula"/>
183 <def-macro n=
"f_bcond" npar=
"1">
201 </section-def-macros>
205 <rule comment=
"CHUNK: nom">
207 <pattern-item n=
"nom"/>
215 <clip pos=
"0" part=
"a_SN"/>
220 <clip pos=
"1" part=
"a_nom"/>
228 <get-case-from pos=
"1">
231 <lit-tag v=
"det.def"/>
232 <clip pos=
"1" part=
"gen"/>
233 <clip pos=
"1" part=
"nbr"/>
241 <clip pos=
"1" part=
"whole"/>
247 <rule comment=
"CHUNK: adj nom">
249 <pattern-item n=
"adj_nom"/>
256 <clip pos=
"0" part=
"a_SN"/>
262 <get-case-from pos=
"1">
265 <lit-tag v=
"det.def"/>
266 <clip pos=
"1" part=
"gen"/>
267 <clip pos=
"1" part=
"nbr"/>
275 <clip pos=
"1" part=
"whole"/>
279 <clip pos=
"2" part=
"whole"/>
282 <choose> <!-- BCN: if the adverb 'més' has been added, the adjective is not generated -->
286 <clip pos=
"2" part=
"a_preadv"/>
287 <lit-tag v=
"preadv"/>
293 <clip pos=
"3" part=
"whole"/>
301 <rule comment=
"CHUNK: nom conj nom">
303 <pattern-item n=
"nom_i_nom"/>
311 <clip pos=
"0" part=
"a_SN"/>
316 <clip pos=
"1" part=
"a_nom"/>
324 <get-case-from pos=
"1">
327 <lit-tag v=
"det.def"/>
328 <clip pos=
"1" part=
"gen"/>
329 <clip pos=
"1" part=
"nbr"/>
333 <clip pos=
"1" part=
"whole"/>
337 <clip pos=
"2" part=
"whole"/>
341 <get-case-from pos=
"3">
344 <lit-tag v=
"det.def"/>
345 <clip pos=
"3" part=
"gen"/>
346 <clip pos=
"3" part=
"nbr"/>
350 <clip pos=
"3" part=
"whole"/>
357 <clip pos=
"1" part=
"whole"/>
361 <clip pos=
"2" part=
"whole"/>
365 <clip pos=
"3" part=
"whole"/>
374 <rule comment=
"CHUNK: adj adj nom">
376 <pattern-item n=
"adj_adj_nom"/>
383 <clip pos=
"0" part=
"a_SN"/>
389 <get-case-from pos=
"1">
392 <lit-tag v=
"det.def"/>
393 <clip pos=
"1" part=
"gen"/>
394 <clip pos=
"1" part=
"nbr"/>
402 <clip pos=
"1" part=
"whole"/>
406 <clip pos=
"2" part=
"whole"/>
410 <clip pos=
"3" part=
"whole"/>
417 <rule comment=
"CHUNK: nom nom">
419 <pattern-item n=
"nom_nom"/>
427 <clip pos=
"0" part=
"a_SN"/>
432 <clip pos=
"2" part=
"a_nom"/>
440 <get-case-from pos=
"1">
443 <lit-tag v=
"det.def"/>
444 <clip pos=
"1" part=
"gen"/>
445 <clip pos=
"1" part=
"nbr"/>
453 <clip pos=
"1" part=
"whole"/>
457 <clip pos=
"2" part=
"whole"/>
466 <clip pos=
"2" part=
"a_np"/>
467 <lit-tag v=
"np.ant"/>
470 <clip pos=
"2" part=
"a_np"/>
471 <lit-tag v=
"np.cog"/>
479 <clip pos=
"3" part=
"whole"/>
488 <rule comment=
"CHUNK: INF">
490 <pattern-item n=
"inf"/>
495 <test><!-- If it is not PD it will not be ND either, in principle -->
498 <clip pos=
"0" part=
"pers"/>
505 <clip pos=
"1" part=
"lemh"/>
506 <clip pos=
"1" part=
"tags"/>
507 <clip pos=
"0" part=
"pers"/>
508 <clip pos=
"0" part=
"nbr"/>
509 <clip pos=
"1" part=
"lemq"/>
516 <clip pos=
"1" part=
"whole"/>
525 <rule comment=
"CHUNK: INF INF">
527 <pattern-item n=
"inf_inf"/>
532 <test><!-- If it is not PD it will not be ND either, in principle -->
535 <clip pos=
"0" part=
"pers"/>
542 <clip pos=
"1" part=
"lemh"/>
543 <clip pos=
"1" part=
"tags"/>
544 <clip pos=
"0" part=
"pers"/>
545 <clip pos=
"0" part=
"nbr"/>
546 <clip pos=
"1" part=
"lemq"/>
553 <clip pos=
"1" part=
"whole"/>
561 <clip pos=
"2" part=
"whole"/>
567 <rule comment=
"CHUNK: GER (BCN)">
569 <pattern-item n=
"ger"/>
574 <test><!-- If it is not PD it will not be ND either, in principle -->
577 <clip pos=
"0" part=
"pers"/>
584 <clip pos=
"1" part=
"lemh"/>
585 <clip pos=
"1" part=
"tags"/>
586 <clip pos=
"0" part=
"pers"/>
587 <clip pos=
"0" part=
"nbr"/>
588 <clip pos=
"1" part=
"lemq"/>
595 <clip pos=
"1" part=
"whole"/>
603 <rule comment=
"CHUNK: GER ENC">
605 <pattern-item n=
"ger_enc"/>
610 <test><!-- If it is not PD it will not be ND either, in principle -->
613 <clip pos=
"0" part=
"pers"/>
622 <clip pos=
"0" part=
"tipus_verb"/>
623 <lit-tag v=
"SV.pron"/>
628 <clip pos=
"2" part=
"lem"/>
629 <lit-tag v=
"prn.pro.ref"/>
630 <clip pos=
"2" part=
"pers"/>
631 <clip pos=
"2" part=
"gen"/>
632 <clip pos=
"2" part=
"nbr"/>
636 <clip pos=
"3" part=
"lem"/>
637 <lit-tag v=
"prn.pro"/>
638 <clip pos=
"3" part=
"pers"/>
639 <clip pos=
"3" part=
"gen"/>
640 <clip pos=
"3" part=
"nbr"/>
644 <clip pos=
"1" part=
"lemh"/>
645 <clip pos=
"1" part=
"tags"/>
646 <clip pos=
"0" part=
"pers"/>
647 <clip pos=
"0" part=
"nbr"/>
648 <clip pos=
"1" part=
"lemq"/>
655 <clip pos=
"2" part=
"lem"/>
656 <lit-tag v=
"prn.pro"/>
657 <clip pos=
"2" part=
"pers"/>
658 <clip pos=
"2" part=
"gen"/>
659 <clip pos=
"2" part=
"nbr"/>
663 <clip pos=
"1" part=
"lemh"/>
664 <clip pos=
"1" part=
"tags"/>
665 <clip pos=
"0" part=
"pers"/>
666 <clip pos=
"0" part=
"nbr"/>
667 <clip pos=
"1" part=
"lemq"/>
678 <clip pos=
"0" part=
"tipus_verb"/>
679 <lit-tag v=
"SV.pron"/>
685 <clip pos=
"1" part=
"whole"/>
688 <clip pos=
"2" part=
"whole"/>
691 <clip pos=
"3" part=
"whole"/>
700 <clip pos=
"1" part=
"whole"/>
703 <clip pos=
"2" part=
"whole"/>
709 <call-macro n=
"f_bcond">
710 <with-param pos=
"1"/>
717 <rule comment=
"CHUNK: BE (there is)">
719 <pattern-item n=
"be"/>
726 <clip pos=
"0" part=
"a_verb"/>
730 <choose><!-- In this rule the chunk name does not distinguish the periphrastic form from the synthetic one: check whether the first word is 'anar' and, if so, modify the lemma of the 2nd word; otherwise, that of the first. -->
733 <equal caseless=
"yes">
734 <clip pos=
"1" part=
"lem"/>
739 <clip pos=
"2" part=
"lem"/>
743 <clip pos=
"2" part=
"a_verb"/>
744 <lit-tag v=
"vbhaver"/>
749 <clip pos=
"1" part=
"lem"/>
753 <clip pos=
"1" part=
"a_verb"/>
754 <lit-tag v=
"vbhaver"/>
760 <choose><!-- Outputs 1 or 2 chunks depending on whether the form is periphrastic or not -->
763 <equal caseless=
"yes">
764 <clip pos=
"1" part=
"lem"/>
770 <clip pos=
"1" part=
"whole"/>
774 <clip pos=
"2" part=
"whole"/>
781 <clip pos=
"1" part=
"whole"/>
790 <!-- rules to fix "like"-type verbs (like -> m'agrada) -->
792 <rule comment=
"assigna persona i nombre als verbs tipus LIKE amb pronom">
794 <pattern-item n=
"pro_vblike"/>
798 <clip pos=
"2" part=
"pers"/>
799 <clip pos=
"1" part=
"pers"/>
802 <clip pos=
"2" part=
"nbr"/>
803 <clip pos=
"1" part=
"nbr"/>
807 <clip pos=
"2" part=
"whole"/>
810 <call-macro n=
"f_bcond">
811 <with-param pos=
"1"/>
816 <rule comment=
"assigna persona i nombre als verbs tipus LIKE amb pronom">
818 <pattern-item n=
"pro_vblike2"/>
822 <clip pos=
"2" part=
"pers"/>
823 <clip pos=
"1" part=
"pers"/>
826 <clip pos=
"2" part=
"nbr"/>
827 <clip pos=
"1" part=
"nbr"/>
831 <clip pos=
"2" part=
"whole"/>
835 <clip pos=
"3" part=
"whole"/>
838 <call-macro n=
"f_bcond">
839 <with-param pos=
"2"/>
844 <rule comment=
"assigna persona i nombre als verbs tipus LIKE amb pronom">
846 <pattern-item n=
"pro_vblike3"/>
850 <clip pos=
"2" part=
"pers"/>
851 <clip pos=
"1" part=
"pers"/>
854 <clip pos=
"2" part=
"nbr"/>
855 <clip pos=
"1" part=
"nbr"/>
859 <clip pos=
"2" part=
"whole"/>
863 <clip pos=
"3" part=
"whole"/>
867 <clip pos=
"4" part=
"whole"/>
870 <call-macro n=
"f_bcond">
871 <with-param pos=
"3"/>
876 <!-- rules to fix the third-person reflexive pronoun (li -> se) -->
878 <rule comment=
"arregla el pron reflexiu de tercera persona, quan és proclític">
880 <pattern-item n=
"pottenirpronom"/>
887 <clip pos=
"0" part=
"tipus_verb"/>
888 <lit-tag v=
"SV.pron"/>
895 <clip pos=
"0" part=
"pers"/>
900 <clip pos=
"1" part=
"lem"/>
904 <clip pos=
"1" part=
"a_prnpro"/>
905 <lit-tag v=
"prn.pro.ref"/>
908 <clip pos=
"1" part=
"nbr"/>
915 <clip pos=
"1" part=
"whole"/>
919 <clip pos=
"2" part=
"whole"/>
926 <equal caseless=
"yes">
927 <clip pos=
"0" part=
"lem"/>
928 <lit v=
"verbcj_perif"/>
930 <equal caseless=
"yes">
931 <clip pos=
"0" part=
"lem"/>
932 <lit v=
"pro_verbcj"/>
934 <equal caseless=
"yes">
935 <clip pos=
"0" part=
"lem"/>
936 <lit v=
"auxmod_inf"/>
938 <equal caseless=
"yes">
939 <clip pos=
"0" part=
"lem"/>
942 <equal caseless=
"yes">
943 <clip pos=
"0" part=
"lem"/>
946 <equal caseless=
"yes">
947 <clip pos=
"0" part=
"lem"/>
955 <clip pos=
"3" part=
"whole"/>
964 <equal caseless=
"yes">
965 <clip pos=
"0" part=
"lem"/>
966 <lit v=
"pro_verbcj_perif"/>
968 <equal caseless=
"yes">
969 <clip pos=
"0" part=
"lem"/>
970 <lit v=
"auxmod_mod_inf"/>
972 <equal caseless=
"yes">
973 <clip pos=
"0" part=
"lem"/>
974 <lit v=
"mod_inf_perif"/>
976 <equal caseless=
"yes">
977 <clip pos=
"0" part=
"lem"/>
978 <lit v=
"pro_be_ger"/>
980 <equal caseless=
"yes">
981 <clip pos=
"0" part=
"lem"/>
982 <lit v=
"pro_auxmod_inf"/>
984 <equal caseless=
"yes">
985 <clip pos=
"0" part=
"lem"/>
986 <lit v=
"pro_mod_inf"/>
988 <equal caseless=
"yes">
989 <clip pos=
"0" part=
"lem"/>
990 <lit v=
"pro_have_pp"/>
992 <equal caseless=
"yes">
993 <clip pos=
"0" part=
"lem"/>
994 <lit v=
"pro_do_inf"/>
1001 <clip pos=
"3" part=
"whole"/>
1005 <clip pos=
"4" part=
"whole"/>
1014 <equal caseless=
"yes">
1015 <clip pos=
"0" part=
"lem"/>
1016 <lit v=
"pro_mod_inf_perif"/>
1018 <equal caseless=
"yes">
1019 <clip pos=
"0" part=
"lem"/>
1020 <lit v=
"pro_auxmod_mod_inf"/>
1022 <equal caseless=
"yes">
1023 <clip pos=
"0" part=
"lem"/>
1024 <lit v=
"pro_auxmod_have_pp"/>
1031 <clip pos=
"3" part=
"whole"/>
1035 <clip pos=
"4" part=
"whole"/>
1039 <clip pos=
"5" part=
"whole"/>
1046 <choose><!-- Check whether any verb is HAVER (from 'haver-hi'); if so, the lemmas and tags of the main verb must be changed ('ser' becomes 'haver') -->
1050 <clip pos=
"0" part=
"a_verb"/>
1051 <lit-tag v=
"HAVER"/>
1057 <equal caseless=
"yes">
1058 <clip pos=
"0" part=
"lem"/>
1063 <clip pos=
"1" part=
"lem"/>
1067 <clip pos=
"1" part=
"a_verb"/>
1068 <lit-tag v=
"vbhaver"/>
1074 <equal caseless=
"yes">
1075 <clip pos=
"0" part=
"lem"/>
1076 <lit v=
"auxmod_inf"/>
1078 <equal caseless=
"yes">
1079 <clip pos=
"0" part=
"lem"/>
1082 <equal caseless=
"yes">
1083 <clip pos=
"0" part=
"lem"/>
1086 <equal caseless=
"yes">
1087 <clip pos=
"0" part=
"lem"/>
1088 <lit v=
"verbcj_perif"/>
1093 <clip pos=
"2" part=
"lem"/>
1097 <clip pos=
"2" part=
"a_verb"/>
1098 <lit-tag v=
"vbhaver"/>
1104 <equal caseless=
"yes">
1105 <clip pos=
"0" part=
"lem"/>
1106 <lit v=
"auxmod_mod_inf"/>
1108 <equal caseless=
"yes">
1109 <clip pos=
"0" part=
"lem"/>
1110 <lit v=
"mod_inf_perif"/>
1115 <clip pos=
"3" part=
"lem"/>
1119 <clip pos=
"3" part=
"a_verb"/>
1120 <lit-tag v=
"vbhaver"/>
1127 <out><!-- And now output the result of everything -->
1129 <clip pos=
"1" part=
"whole"/>
1136 <equal caseless=
"yes">
1137 <clip pos=
"0" part=
"lem"/>
1138 <lit v=
"verbcj_perif"/>
1140 <equal caseless=
"yes">
1141 <clip pos=
"0" part=
"lem"/>
1142 <lit v=
"pro_verbcj"/>
1144 <equal caseless=
"yes">
1145 <clip pos=
"0" part=
"lem"/>
1146 <lit v=
"auxmod_inf"/>
1148 <equal caseless=
"yes">
1149 <clip pos=
"0" part=
"lem"/>
1152 <equal caseless=
"yes">
1153 <clip pos=
"0" part=
"lem"/>
1156 <equal caseless=
"yes">
1157 <clip pos=
"0" part=
"lem"/>
1165 <clip pos=
"2" part=
"whole"/>
1174 <equal caseless=
"yes">
1175 <clip pos=
"0" part=
"lem"/>
1176 <lit v=
"pro_verbcj_perif"/>
1178 <equal caseless=
"yes">
1179 <clip pos=
"0" part=
"lem"/>
1180 <lit v=
"auxmod_mod_inf"/>
1182 <equal caseless=
"yes">
1183 <clip pos=
"0" part=
"lem"/>
1184 <lit v=
"mod_inf_perif"/>
1186 <equal caseless=
"yes">
1187 <clip pos=
"0" part=
"lem"/>
1188 <lit v=
"pro_be_ger"/>
1190 <equal caseless=
"yes">
1191 <clip pos=
"0" part=
"lem"/>
1192 <lit v=
"pro_auxmod_inf"/>
1194 <equal caseless=
"yes">
1195 <clip pos=
"0" part=
"lem"/>
1196 <lit v=
"pro_mod_inf"/>
1198 <equal caseless=
"yes">
1199 <clip pos=
"0" part=
"lem"/>
1200 <lit v=
"pro_have_pp"/>
1202 <equal caseless=
"yes">
1203 <clip pos=
"0" part=
"lem"/>
1204 <lit v=
"pro_be_ger"/> <!-- NOTE(review): this repeats the pro_be_ger comparison made a few tests earlier (same clip and lit); if both sit in the same <or>, this one is redundant. Confirm and remove. -->
1206 <equal caseless=
"yes">
1207 <clip pos=
"0" part=
"lem"/>
1208 <lit v=
"pro_do_inf"/>
1215 <clip pos=
"2" part=
"whole"/>
1219 <clip pos=
"3" part=
"whole"/>
1228 <equal caseless=
"yes">
1229 <clip pos=
"0" part=
"lem"/>
1230 <lit v=
"pro_mod_inf_perif"/>
1232 <equal caseless=
"yes">
1233 <clip pos=
"0" part=
"lem"/>
1234 <lit v=
"pro_auxmod_mod_inf"/>
1236 <equal caseless=
"yes">
1237 <clip pos=
"0" part=
"lem"/>
1238 <lit v=
"pro_auxmod_have_pp"/>
1245 <clip pos=
"2" part=
"whole"/>
1249 <clip pos=
"3" part=
"whole"/>
1253 <clip pos=
"4" part=
"whole"/>
1264 <!--<rule comment="arregla el pron reflexiu de tercera persona quan és enclític. No es pot accedir el lema del pronom enclític i per ara no es pot fer la regla">
1266 <pattern-item n="pottenirenclitic"/>
1273 <clip pos="3" part="a_prnenc"/>
1274 <lit-tag v="prn.enc"/>
1295 <rule comment=
"CHUNK: HI">
1297 <pattern-item n=
"hi"/>
1301 <clip pos=
"1" part=
"lem"/>
1305 <clip pos=
"1" part=
"tags"/>
1306 <lit-tag v=
"prn.pro.adv"/>
1310 <clip pos=
"1" part=
"whole"/>