1 <?xml version=
"1.0" encoding=
"UTF-8"?> <!-- -*- nxml -*- -->
3 <transfer default=
"chunk">
<!-- Category items for the first lexical categories of the file. The <def-cat>
     elements that name each group are not visible in this excerpt, so the group
     labels below are inferred from the tags only. -->
<!-- Conjunctions: adverbial, coordinating and subordinating, with or without further tags. -->
6 <cat-item tags=
"cnjadv"/>
7 <cat-item tags=
"cnjcoo"/>
8 <cat-item tags=
"cnjsub"/>
9 <cat-item tags=
"cnjcoo.*"/>
10 <cat-item tags=
"cnjadv.*"/>
11 <cat-item tags=
"cnjsub.*"/>
<!-- Relatives: anything whose tags start with rel. -->
14 <cat-item tags=
"rel.*"/>
<!-- Adjectives: plain adj, adj.sint and adj.sint.comp, each with and without trailing tags. -->
17 <cat-item tags=
"adj"/>
18 <cat-item tags=
"adj.*"/>
19 <cat-item tags=
"adj.sint"/>
20 <cat-item tags=
"adj.sint.*"/>
21 <cat-item tags=
"adj.sint.comp"/>
22 <cat-item tags=
"adj.sint.comp.*"/>
<!-- Nouns and proper nouns (np.ant, np.top); presumably the "nom" category used by the rules - TODO confirm. -->
25 <cat-item tags=
"n.*"/>
26 <cat-item tags=
"np.ant.*"/>
27 <cat-item tags=
"np.top.*"/>
<!-- Category "genitive": a lexical unit whose only tag is gen. The rules use it
     between two nouns (e.g. "brother's dog"), so it is presumably the English
     possessive marker - TODO confirm against the analyser. -->
29 <def-cat n=
"genitive">
30 <cat-item tags=
"gen"/>
<!-- Matches a lexical unit tagged exactly sent; its <def-cat> opener is not visible
     here (the last rule of the file uses a pattern item named "sent"). -->
33 <cat-item tags=
"sent"/>
<!-- Category "det_ignore": the indefinite determiner with lemma "a" and every
     definite determiner. Used by the "Drop the/a" rule and as the optional
     determiner slot in the "PR (a/the) NOM" rules. -->
35 <def-cat n=
"det_ignore">
36 <cat-item lemma=
"a" tags=
"det.ind.*"/>
37 <cat-item tags=
"det.def.*"/>
<!-- Category items whose <def-cat> openers are not visible in this excerpt:
     indefinite and demonstrative determiners (any lemma), then pronouns with
     the lemma "prpers". -->
40 <cat-item tags=
"det.ind.*"/>
41 <cat-item tags=
"det.dem.*"/>
44 <cat-item lemma=
"prpers" tags=
"prn.*"/>
<!-- Category "verbnm": lexical verbs (vblex), vbser and vbhaver; vbmod is not listed. -->
46 <def-cat n=
"verbnm"><!-- verbs other than modals -->
47 <cat-item tags=
"vblex.*"/>
48 <cat-item tags=
"vbser.*"/>
49 <cat-item tags=
"vbhaver.*"/>
<!-- Category "prep": any lexical unit whose tags start with pr. It is the first
     pattern item of every "PR ..." rule. -->
51 <def-cat n=
"prep"> <!-- preposition -->
53 <cat-item tags=
"pr.*"/>
<!-- Category "number": numerals tagged num, with or without further tags.
     First pattern item of the "NUM NOM" rule. -->
55 <def-cat n=
"number"> <!-- number -->
56 <cat-item tags=
"num"/>
57 <cat-item tags=
"num.*"/>
<!-- Category "num_234w": the numerals two, three and four, written either as
     words or as digits, tagged exactly num. Presumably kept apart because these
     numerals need different noun agreement than 5 and above (the NUM NOM rule
     has a branch marked "5+") - TODO confirm. No visible rule references this
     category in the excerpt. -->
59 <def-cat n=
"num_234w">
60 <cat-item lemma=
"two" tags=
"num"/>
61 <cat-item lemma=
"three" tags=
"num"/>
62 <cat-item lemma=
"four" tags=
"num"/>
<!-- Same numerals written as digits. -->
65 <cat-item lemma=
"2" tags=
"num"/>
66 <cat-item lemma=
"3" tags=
"num"/>
67 <cat-item lemma=
"4" tags=
"num"/>
<!-- Attribute "nbr": the number tag of a word (sg, pl or sp). The rules clip it
     both for chunk tags and for the word output. -->
72 <def-attr n=
"nbr"> <!-- Number -->
73 <attr-item tags=
"sg"/>
74 <attr-item tags=
"pl"/>
75 <attr-item tags=
"sp"/>
<!-- Attribute "gen": the gender tag of a word. Values visible here are m1, m2,
     m3, nt and mf; further values may exist outside this excerpt. -->
77 <def-attr n=
"gen"> <!-- Gender -->
78 <attr-item tags=
"m1"/>
79 <attr-item tags=
"m2"/>
80 <attr-item tags=
"m3"/>
82 <attr-item tags=
"nt"/>
83 <attr-item tags=
"mf"/>
<!-- Attribute items whose <def-attr> openers are not visible in this excerpt.
     Grouping below is inferred from the tags only. -->
<!-- Conjunction types. -->
86 <attr-item tags=
"cnjadv"/>
87 <attr-item tags=
"cnjsub"/>
88 <attr-item tags=
"cnjcoo"/>
<!-- Noun types; presumably part of the "a_nom" attribute clipped by the rules - TODO confirm. -->
92 <attr-item tags=
"n.acr"/>
93 <attr-item tags=
"n.unc"/>
94 <attr-item tags=
"np.top"/>
<!-- Adjective types and degrees; presumably "a_adj" and a degree attribute - TODO confirm. -->
97 <attr-item tags=
"adj.sint"/>
98 <attr-item tags=
"adj"/>
99 <attr-item tags=
"comp"/>
100 <attr-item tags=
"sup"/>
<!-- Attribute "stress": the only visible value is the tag uns. -->
102 <def-attr n=
"stress">
103 <attr-item tags=
"uns"/>
<!-- Attribute items whose <def-attr> openers are not visible in this excerpt:
     determiner types, the numeral tag, and relative types. -->
106 <attr-item tags=
"det.ind"/>
107 <attr-item tags=
"det.def"/>
110 <attr-item tags=
"num"/>
113 <attr-item tags=
"rel"/>
114 <attr-item tags=
"rel.nn"/>
115 <attr-item tags=
"rel.an"/>
<!-- Attribute "tipus_prn": pronoun type, either prn.subj or prn.obj. -->
117 <def-attr n=
"tipus_prn">
118 <attr-item tags=
"prn.subj"/>
119 <attr-item tags=
"prn.obj"/>
<!-- Case tags. The <def-attr> openers are not visible in this excerpt; the
     first group (seven cases) is presumably the "caso" attribute that the
     prepositional rules clip - TODO confirm. -->
122 <attr-item tags=
"nom"/>
123 <attr-item tags=
"acc"/>
124 <attr-item tags=
"dat"/>
125 <attr-item tags=
"gen"/>
126 <attr-item tags=
"loc"/>
127 <attr-item tags=
"ins"/>
128 <attr-item tags=
"voc"/>
<!-- Second, shorter case set (nom, acc, voc) belonging to a separate attribute whose name is not visible. -->
131 <attr-item tags=
"nom"/>
132 <attr-item tags=
"acc"/>
133 <attr-item tags=
"voc"/>
<!-- Attribute "pers": grammatical person tag (p1, p2 or p3). -->
135 <def-attr n=
"pers"> <!-- Person -->
136 <attr-item tags=
"p1"/>
137 <attr-item tags=
"p2"/>
138 <attr-item tags=
"p3"/>
<!-- Attribute "a_verb": the verb-type part of a word's tags (vblex, vblex.uns,
     vbser, vbhaver, vbmod or vaux). -->
140 <def-attr n=
"a_verb">
141 <attr-item tags=
"vblex"/>
142 <attr-item tags=
"vblex.uns"/>
143 <attr-item tags=
"vbser"/>
144 <attr-item tags=
"vbhaver"/>
145 <attr-item tags=
"vbmod"/>
146 <attr-item tags=
"vaux"/>
<!-- Verb form tags (pp, pii, pis, pri, past, pres, inf). The <def-attr> opener
     is not visible in this excerpt; presumably a tense/verb-form attribute. -->
149 <attr-item tags=
"pp"/>
150 <attr-item tags=
"pii"/>
151 <attr-item tags=
"pis"/>
152 <attr-item tags=
"pri"/>
153 <attr-item tags=
"past"/>
154 <attr-item tags=
"pres"/>
155 <attr-item tags=
"inf"/>
<!-- Global variables shared by the rules. Only caseFirstWord is used in the
     visible code (as the case attribute of the "nom" and "nom-gen" chunks);
     the uses of the others are outside this excerpt. -->
160 <def-var n=
"numero"/>
161 <def-var n=
"caseFirstWord"/>
162 <def-var n=
"nombre"/>
163 <def-var n=
"group_gender"/>
164 <def-var n=
"nn_num"/>
165 <def-var n=
"nn_nom"/>
166 <def-var n=
"lastVerb"/>
<!-- List "nad_locative" of source-language lemmas (bodies of water in the
     visible items). The name suggests nouns that take the preposition "nad"
     with the locative - unconfirmed; no visible rule reads this list. -->
170 <def-list n=
"nad_locative">
171 <list-item v=
"river"/>
173 <list-item v=
"ocean"/>
<!-- List "months": English month names, capitalised as lemmas. Not every entry
     is visible in this excerpt; no visible rule reads this list. -->
175 <def-list n=
"months">
176 <list-item v=
"January"/>
177 <list-item v=
"February"/>
178 <list-item v=
"March"/>
179 <list-item v=
"April"/>
181 <list-item v=
"June"/>
182 <list-item v=
"July"/>
183 <list-item v=
"August"/>
184 <list-item v=
"September"/>
185 <list-item v=
"October"/>
186 <list-item v=
"November"/>
187 <list-item v=
"December"/>
<!-- English weekday names; the <def-list> opener that names this list is not
     visible in this excerpt. -->
190 <list-item v=
"Monday"/>
191 <list-item v=
"Tuesday"/>
192 <list-item v=
"Wednesday"/>
193 <list-item v=
"Thursday"/>
194 <list-item v=
"Friday"/>
195 <list-item v=
"Saturday"/>
196 <list-item v=
"Sunday"/>
<!-- List "titles": English forms of address used as lemmas. Some entries may
     lie outside this excerpt; no visible rule reads this list. -->
198 <def-list n=
"titles">
199 <list-item v=
"Mister"/>
201 <list-item v=
"Miss"/>
202 <list-item v=
"Mrs."/>
<!-- List "na_accusative" of source-language noun lemmas. The name suggests
     nouns that take the preposition "na" with the accusative - unconfirmed;
     no visible rule reads this list. -->
206 <def-list n=
"na_accusative">
207 <list-item v=
"concert"/>
208 <list-item v=
"airport"/>
<!-- Matches a single determiner from "det_ignore" (lemma "a" or any definite
     determiner). No output is visible for this rule in the excerpt, which is
     consistent with its comment: the determiner is dropped. -->
214 <rule comment=
"Drop the/a">
216 <pattern-item n=
"det_ignore"/>
<!-- Single noun. Emits one chunk named "nom" whose case comes from the variable
     caseFirstWord. Chunk tags: the literal NP plus the noun's target-language
     number. Chunk content: the noun's target-language lemma, a_nom, gen and nbr,
     all clipped from position 1. -->
227 <rule comment=
"REGLA: NOM">
229 <pattern-item n=
"nom"/>
233 <chunk name=
"nom" case=
"caseFirstWord">
235 <tag><lit-tag v=
"NP"/></tag>
236 <tag><clip pos=
"1" side=
"tl" part=
"nbr"/></tag>
239 <clip pos=
"1" side=
"tl" part=
"lem"/>
240 <clip pos=
"1" side=
"tl" part=
"a_nom"/>
241 <clip pos=
"1" side=
"tl" part=
"gen"/>
242 <clip pos=
"1" side=
"tl" part=
"nbr"/>
<!-- Noun followed by the genitive marker (positions 1 and 2). Emits one chunk
     named "nom-gen" tagged NP plus the noun's number. Only the noun (position 1)
     is clipped into the chunk content; no clip of position 2 is visible here. -->
249 <rule comment=
"REGLA: NOM genitive">
251 <pattern-item n=
"nom"/>
252 <pattern-item n=
"genitive"/>
256 <chunk name=
"nom-gen" case=
"caseFirstWord">
258 <tag><lit-tag v=
"NP"/></tag>
259 <tag><clip pos=
"1" side=
"tl" part=
"nbr"/></tag>
262 <clip pos=
"1" side=
"tl" part=
"lem"/>
263 <clip pos=
"1" side=
"tl" part=
"a_nom"/>
264 <clip pos=
"1" side=
"tl" part=
"gen"/>
265 <clip pos=
"1" side=
"tl" part=
"nbr"/>
273 <!-- FIXME: there are more complicated cases to be handled with prepositions -->
<!-- Preposition followed by a noun (positions 1 and 2). Emits two chunks, both
     named "prep-nom": the first is tagged PR and holds the preposition's
     target-language lemma; the second is tagged NOM and holds the noun's lemma,
     a_nom, gen and nbr followed by the "caso" part clipped from the preposition
     (position 1), so the noun presumably carries the case required by the
     translated preposition. -->
274 <rule comment=
"REGLA: PR NOM">
276 <pattern-item n=
"prep"/>
277 <pattern-item n=
"nom"/>
281 <chunk name=
"prep-nom">
283 <tag><lit-tag v=
"PR"/></tag>
286 <clip pos=
"1" side=
"tl" part=
"lem"/>
291 <chunk name=
"prep-nom">
293 <tag><lit-tag v=
"NOM"/></tag>
296 <clip pos=
"2" side=
"tl" part=
"lem"/>
297 <clip pos=
"2" side=
"tl" part=
"a_nom"/>
298 <clip pos=
"2" side=
"tl" part=
"gen"/>
299 <clip pos=
"2" side=
"tl" part=
"nbr"/>
300 <clip pos=
"1" side=
"tl" part=
"caso"/>
<!-- Preposition, ignorable determiner, noun (positions 1, 2 and 3). Same output
     as the "PR NOM" rule, with the noun taken from position 3; nothing is
     clipped from the determiner at position 2, so it is not output. -->
306 <rule comment=
"REGLA: PR (a/the) NOM">
308 <pattern-item n=
"prep"/>
309 <pattern-item n=
"det_ignore"/>
310 <pattern-item n=
"nom"/>
314 <chunk name=
"prep-nom">
316 <tag><lit-tag v=
"PR"/></tag>
319 <clip pos=
"1" side=
"tl" part=
"lem"/>
324 <chunk name=
"prep-nom">
326 <tag><lit-tag v=
"NOM"/></tag>
329 <clip pos=
"3" side=
"tl" part=
"lem"/>
330 <clip pos=
"3" side=
"tl" part=
"a_nom"/>
331 <clip pos=
"3" side=
"tl" part=
"gen"/>
332 <clip pos=
"3" side=
"tl" part=
"nbr"/>
333 <clip pos=
"1" side=
"tl" part=
"caso"/>
340 <!-- This rule reorders the words so that the word inflected to match the preposition is beside the preposition -->
<!-- Positions: 1 = preposition, 2 = possessor noun, 3 = genitive marker,
     4 = head noun. Output order: the preposition chunk, then the head noun
     (position 4) carrying the "caso" part clipped from the preposition, then
     the possessor as a "nom-gen" chunk. -->
341 <rule comment=
"REGLA: PR NOM genitive NOM ~~ e.g. with brother's dog - z psem brata">
343 <pattern-item n=
"prep"/>
344 <pattern-item n=
"nom"/>
345 <pattern-item n=
"genitive"/>
346 <pattern-item n=
"nom"/>
350 <chunk name=
"prep-nom">
352 <tag><lit-tag v=
"PR"/></tag>
355 <clip pos=
"1" side=
"tl" part=
"lem"/>
360 <chunk name=
"prep-nom" case=
"Aa">
362 <tag><lit-tag v=
"NOM"/></tag>
365 <clip pos=
"4" side=
"tl" part=
"lem"/>
366 <clip pos=
"4" side=
"tl" part=
"a_nom"/>
367 <clip pos=
"4" side=
"tl" part=
"gen"/>
368 <clip pos=
"4" side=
"tl" part=
"nbr"/>
369 <clip pos=
"1" side=
"tl" part=
"caso"/>
<!-- Possessor chunk. Its number tag is clipped from the possessor noun
     (position 2), the same word that fills the chunk, as the two-word
     "REGLA: NOM genitive" rule does. Position 1 is the preposition here,
     so clipping nbr from it did not describe the noun in this chunk. -->
373 <chunk name=
"nom-gen" case=
"Aa">
375 <tag><lit-tag v=
"NP"/></tag>
376 <tag><clip pos=
"2" side=
"tl" part=
"nbr"/></tag>
379 <clip pos=
"2" side=
"tl" part=
"lem"/>
380 <clip pos=
"2" side=
"tl" part=
"a_nom"/>
381 <clip pos=
"2" side=
"tl" part=
"gen"/>
382 <clip pos=
"2" side=
"tl" part=
"nbr"/>
<!-- Positions: 1 = preposition, 2 = ignorable determiner, 3 = possessor noun,
     4 = genitive marker, 5 = head noun. Output order: the preposition chunk,
     then the head noun (position 5) carrying the "caso" part clipped from the
     preposition, then the possessor as a "nom-gen" chunk. Nothing is clipped
     from the determiner, so it is not output. -->
390 <rule comment=
"REGLA: PR (a/the) NOM genitive NOM ~~ e.g. with a brother's dog - z psem brata">
392 <pattern-item n=
"prep"/>
393 <pattern-item n=
"det_ignore"/>
394 <pattern-item n=
"nom"/>
395 <pattern-item n=
"genitive"/>
396 <pattern-item n=
"nom"/>
400 <chunk name=
"prep-nom">
402 <tag><lit-tag v=
"PR"/></tag>
405 <clip pos=
"1" side=
"tl" part=
"lem"/>
410 <chunk name=
"prep-nom" case=
"Aa">
412 <tag><lit-tag v=
"NOM"/></tag>
415 <clip pos=
"5" side=
"tl" part=
"lem"/>
416 <clip pos=
"5" side=
"tl" part=
"a_nom"/>
417 <clip pos=
"5" side=
"tl" part=
"gen"/>
418 <clip pos=
"5" side=
"tl" part=
"nbr"/>
419 <clip pos=
"1" side=
"tl" part=
"caso"/>
<!-- Possessor chunk. Its number tag is clipped from the possessor noun
     (position 3), the same word that fills the chunk, as the two-word
     "REGLA: NOM genitive" rule does. Position 1 is the preposition here,
     so clipping nbr from it did not describe the noun in this chunk. -->
423 <chunk name=
"nom-gen" case=
"Aa">
425 <tag><lit-tag v=
"NP"/></tag>
426 <tag><clip pos=
"3" side=
"tl" part=
"nbr"/></tag>
429 <clip pos=
"3" side=
"tl" part=
"lem"/>
430 <clip pos=
"3" side=
"tl" part=
"a_nom"/>
431 <clip pos=
"3" side=
"tl" part=
"gen"/>
432 <clip pos=
"3" side=
"tl" part=
"nbr"/>
<!-- Lone preposition: output tagged PR containing the preposition's
     target-language lemma. The <chunk> opener is not visible in this excerpt. -->
440 <rule comment=
"REGLA: PR">
442 <pattern-item n=
"prep"/>
448 <tag><lit-tag v=
"PR"/></tag>
451 <clip pos=
"1" side=
"tl" part=
"lem"/>
<!-- Lone adjective: output tagged ADJ containing the adjective's target-language
     lemma and its a_adj part. The <chunk> opener and any further clips are not
     visible in this excerpt. -->
459 <rule comment=
"REGLA: ADJ">
461 <pattern-item n=
"adj"/>
467 <tag><lit-tag v=
"ADJ"/></tag>
470 <clip pos=
"1" side=
"tl" part=
"lem"/>
471 <clip pos=
"1" side=
"tl" part=
"a_adj"/>
<!-- Numeral followed by a noun (positions 1 and 2). The visible fragments show
     a chain of <equal> tests that read the numeral's source-language lemma
     (later branches also read its source-language gen and caso) and the noun's
     target-language nbr, ending in an <otherwise> branch marked "5+". In each
     branch the visible clips are the numeral's target-language lemma followed
     by the noun's target-language lemma and gen; the output tags NUM and NOM
     appear at the end. The values compared against and any case/number
     assignments are outside this excerpt, so read the complete rule before
     editing a branch. -->
481 <rule comment=
"REGLA: NUM NOM">
483 <pattern-item n=
"number"/>
484 <pattern-item n=
"nom"/>
491 <equal> <!-- nom, if no verb yet -->
496 <clip pos=
"1" side=
"sl" part=
"lem"/>
501 <clip pos=
"2" side=
"tl" part=
"nbr"/>
509 <clip pos=
"1" side=
"tl" part=
"lem"/>
513 <clip pos=
"2" side=
"tl" part=
"gen"/>
519 <clip pos=
"2" side=
"tl" part=
"lem"/>
523 <clip pos=
"2" side=
"tl" part=
"gen"/>
531 <equal> <!-- nom, if no verb yet -->
536 <clip pos=
"1" side=
"sl" part=
"lem"/>
540 <clip pos=
"2" side=
"tl" part=
"nbr"/>
547 <clip pos=
"1" side=
"tl" part=
"lem"/>
551 <clip pos=
"2" side=
"tl" part=
"gen"/>
557 <clip pos=
"2" side=
"tl" part=
"lem"/>
561 <clip pos=
"2" side=
"tl" part=
"gen"/>
570 <equal> <!-- nom, if no verb yet -->
575 <clip pos=
"1" side=
"sl" part=
"lem"/>
582 <clip pos=
"1" side=
"tl" part=
"lem"/>
586 <clip pos=
"2" side=
"tl" part=
"gen"/>
592 <clip pos=
"2" side=
"tl" part=
"lem"/>
596 <clip pos=
"2" side=
"tl" part=
"gen"/>
605 <equal> <!-- nom, if no verb yet -->
611 <clip pos=
"1" side=
"sl" part=
"lem"/>
615 <clip pos=
"1" side=
"sl" part=
"lem"/>
620 <clip pos=
"1" side=
"sl" part=
"gen"/>
627 <clip pos=
"1" side=
"tl" part=
"lem"/>
631 <clip pos=
"2" side=
"tl" part=
"gen"/>
637 <clip pos=
"2" side=
"tl" part=
"lem"/>
641 <clip pos=
"2" side=
"tl" part=
"gen"/>
649 <equal> <!-- nom, if no verb yet -->
655 <clip pos=
"1" side=
"sl" part=
"lem"/>
659 <clip pos=
"1" side=
"sl" part=
"lem"/>
665 <clip pos=
"1" side=
"sl" part=
"gen"/>
673 <clip pos=
"1" side=
"tl" part=
"lem"/>
682 <clip pos=
"2" side=
"tl" part=
"lem"/>
686 <clip pos=
"2" side=
"tl" part=
"gen"/>
694 <equal> <!-- nom, if no verb yet -->
699 <clip pos=
"1" side=
"sl" part=
"caso"/>
703 <clip pos=
"1" side=
"sl" part=
"gen"/>
710 <clip pos=
"1" side=
"tl" part=
"lem"/>
714 <clip pos=
"2" side=
"tl" part=
"gen"/>
720 <clip pos=
"2" side=
"tl" part=
"lem"/>
724 <clip pos=
"2" side=
"tl" part=
"gen"/>
729 <otherwise> <!-- 5+ -->
732 <clip pos=
"1" side=
"tl" part=
"lem"/>
741 <clip pos=
"2" side=
"tl" part=
"lem"/>
745 <clip pos=
"2" side=
"tl" part=
"gen"/>
755 <tag><lit-tag v=
"NUM"/></tag>
764 <tag><lit-tag v=
"NOM"/></tag>
<!-- Sentence-boundary rule: matches a "sent" lexical unit and outputs it whole,
     tagged sent. The statements that reset the variables are not visible in
     this excerpt. -->
774 <rule> <!-- RULE: reset variables -->
776 <pattern-item n=
"sent"/>
790 <tag><lit-tag v=
"sent"/></tag>
793 <clip pos=
"1" side=
"tl" part=
"whole"/>