357 fix license on strptime.c
[illumos-gate.git] / usr / src / cmd / localedef / parser.y
blob485430b8d1e08a3a42c87ed8829edf7e96a42afb
1 %{
2 /*
3 * This file and its contents are supplied under the terms of the
4 * Common Development and Distribution License ("CDDL"), version 1.0.
5 * You may only use this file in accordance with the terms of version
6 * 1.0 of the CDDL.
8 * A full copy of the text of the CDDL should have accompanied this
9 * source. A copy of the CDDL is also available via the Internet at
10 * http://www.illumos.org/license/CDDL.
14 * Copyright 2010 Nexenta Systems, Inc. All rights reserved.
18 * POSIX localedef grammar.
21 #include <wchar.h>
22 #include <stdio.h>
23 #include <limits.h>
24 #include "localedef.h"
27 %union {
28 int num;
29 wchar_t wc;
30 char *token;
31 collsym_t *collsym;
32 collelem_t *collelem;
35 %token T_CODE_SET
36 %token T_MB_CUR_MAX
37 %token T_MB_CUR_MIN
38 %token T_COM_CHAR
39 %token T_ESC_CHAR
40 %token T_LT
41 %token T_GT
42 %token T_NL
43 %token T_SEMI
44 %token T_COMMA
45 %token T_ELLIPSIS
46 %token T_RPAREN
47 %token T_LPAREN
48 %token T_QUOTE
49 %token T_NULL
50 %token T_WS
51 %token T_END
52 %token T_COPY
53 %token T_CHARMAP
54 %token T_WIDTH
55 %token T_WIDTH_DEFAULT
56 %token T_CTYPE
57 %token T_ISUPPER
58 %token T_ISLOWER
59 %token T_ISALPHA
60 %token T_ISDIGIT
61 %token T_ISPUNCT
62 %token T_ISXDIGIT
63 %token T_ISSPACE
64 %token T_ISPRINT
65 %token T_ISGRAPH
66 %token T_ISBLANK
67 %token T_ISCNTRL
68 %token T_ISALNUM
69 %token T_ISSPECIAL
70 %token T_ISPHONOGRAM
71 %token T_ISIDEOGRAM
72 %token T_ISENGLISH
73 %token T_ISNUMBER
74 %token T_TOUPPER
75 %token T_TOLOWER
76 %token T_COLLATE
77 %token T_COLLATING_SYMBOL
78 %token T_COLLATING_ELEMENT
79 %token T_ORDER_START
80 %token T_ORDER_END
81 %token T_FORWARD
82 %token T_BACKWARD
83 %token T_POSITION
84 %token T_FROM
85 %token T_UNDEFINED
86 %token T_IGNORE
87 %token T_MESSAGES
88 %token T_YESSTR
89 %token T_NOSTR
90 %token T_YESEXPR
91 %token T_NOEXPR
92 %token T_MONETARY
93 %token T_INT_CURR_SYMBOL
94 %token T_CURRENCY_SYMBOL
95 %token T_MON_DECIMAL_POINT
96 %token T_MON_THOUSANDS_SEP
97 %token T_POSITIVE_SIGN
98 %token T_NEGATIVE_SIGN
99 %token T_MON_GROUPING
100 %token T_INT_FRAC_DIGITS
101 %token T_FRAC_DIGITS
102 %token T_P_CS_PRECEDES
103 %token T_P_SEP_BY_SPACE
104 %token T_N_CS_PRECEDES
105 %token T_N_SEP_BY_SPACE
106 %token T_P_SIGN_POSN
107 %token T_N_SIGN_POSN
108 %token T_INT_P_CS_PRECEDES
109 %token T_INT_N_CS_PRECEDES
110 %token T_INT_P_SEP_BY_SPACE
111 %token T_INT_N_SEP_BY_SPACE
112 %token T_INT_P_SIGN_POSN
113 %token T_INT_N_SIGN_POSN
114 %token T_NUMERIC
115 %token T_DECIMAL_POINT
116 %token T_THOUSANDS_SEP
117 %token T_GROUPING
118 %token T_TIME
119 %token T_ABDAY
120 %token T_DAY
121 %token T_ABMON
122 %token T_MON
123 %token T_ERA
124 %token T_ERA_D_FMT
125 %token T_ERA_T_FMT
126 %token T_ERA_D_T_FMT
127 %token T_ALT_DIGITS
128 %token T_D_T_FMT
129 %token T_D_FMT
130 %token T_T_FMT
131 %token T_AM_PM
132 %token T_T_FMT_AMPM
133 %token T_DATE_FMT
134 %token <wc> T_CHAR
135 %token <token> T_NAME
136 %token <num> T_NUMBER
137 %token <token> T_SYMBOL
138 %token <collsym> T_COLLSYM
139 %token <collelem> T_COLLELEM
143 localedef : setting_list categories
144 | categories
147 string : T_QUOTE charlist T_QUOTE
148 | T_QUOTE T_QUOTE
151 charlist : charlist T_CHAR
153 add_wcs($2);
155 | T_CHAR
157 add_wcs($1);
161 setting_list : setting_list setting
162 | setting
166 setting : T_COM_CHAR T_CHAR T_NL
168 com_char = $2;
170 | T_ESC_CHAR T_CHAR T_NL
172 esc_char = $2;
174 | T_MB_CUR_MAX T_NUMBER T_NL
176 mb_cur_max = $2;
178 | T_MB_CUR_MIN T_NUMBER T_NL
180 mb_cur_min = $2;
182 | T_CODE_SET string T_NL
184 wchar_t *w = get_wcs();
185 set_wide_encoding(to_mb_string(w));
186 free(w);
188 | T_CODE_SET T_NAME T_NL
190 set_wide_encoding($2);
194 copycat : T_COPY T_NAME T_NL
196 copy_category($2);
198 | T_COPY string T_NL
200 wchar_t *w = get_wcs();
201 copy_category(to_mb_string(w));
202 free(w);
206 categories : categories category
207 | category
211 category : charmap
212 | messages
213 | monetary
214 | ctype
215 | collate
216 | numeric
217 | time
221 charmap : T_CHARMAP T_NL charmap_list T_END T_CHARMAP T_NL
224 charmap_list : charmap_list charmap_entry
225 | charmap_entry
229 charmap_entry : T_SYMBOL T_CHAR
231 add_charmap($1, $2);
232 scan_to_eol();
234 | T_SYMBOL T_ELLIPSIS T_SYMBOL T_CHAR
236 add_charmap_range($1, $3, $4);
237 scan_to_eol();
239 | T_NL
242 ctype : T_CTYPE T_NL ctype_list T_END T_CTYPE T_NL
244 dump_ctype();
246 | T_CTYPE T_NL copycat T_END T_CTYPE T_NL
249 ctype_list : ctype_list ctype_kw
250 | ctype_kw
253 ctype_kw : T_ISUPPER cc_list T_NL
254 | T_ISLOWER cc_list T_NL
255 | T_ISALPHA cc_list T_NL
256 | T_ISDIGIT cc_list T_NL
257 | T_ISPUNCT cc_list T_NL
258 | T_ISXDIGIT cc_list T_NL
259 | T_ISSPACE cc_list T_NL
260 | T_ISPRINT cc_list T_NL
261 | T_ISGRAPH cc_list T_NL
262 | T_ISBLANK cc_list T_NL
263 | T_ISCNTRL cc_list T_NL
264 | T_ISALNUM cc_list T_NL
265 | T_ISSPECIAL cc_list T_NL
266 | T_ISENGLISH cc_list T_NL
267 | T_ISNUMBER cc_list T_NL
268 | T_ISIDEOGRAM cc_list T_NL
269 | T_ISPHONOGRAM cc_list T_NL
270 | T_TOUPPER conv_list T_NL
271 | T_TOLOWER conv_list T_NL
275 cc_list : cc_list T_SEMI T_CHAR
277 add_ctype($3);
279 | cc_list T_SEMI T_SYMBOL
281 add_charmap_undefined($3);
283 | cc_list T_SEMI T_ELLIPSIS T_SEMI T_CHAR
285 /* note that the endpoints *must* be characters */
286 add_ctype_range($5);
288 | T_CHAR
290 add_ctype($1);
292 | T_SYMBOL
294 add_charmap_undefined($1);
298 conv_list : conv_list T_SEMI conv_pair
299 | conv_pair
303 conv_pair : T_LPAREN T_CHAR T_COMMA T_CHAR T_RPAREN
305 add_caseconv($2, $4);
307 | T_LPAREN T_SYMBOL T_COMMA T_CHAR T_RPAREN
309 add_charmap_undefined($2);
311 | T_LPAREN T_SYMBOL T_COMMA T_SYMBOL T_RPAREN
313 add_charmap_undefined($2);
314 add_charmap_undefined($4);
316 | T_LPAREN T_CHAR T_COMMA T_SYMBOL T_RPAREN
318 add_charmap_undefined($4);
322 collate : T_COLLATE T_NL coll_order T_END T_COLLATE T_NL
324 dump_collate();
326 | T_COLLATE T_NL coll_optional coll_order T_END T_COLLATE T_NL
328 dump_collate();
330 | T_COLLATE T_NL copycat T_END T_COLLATE T_NL
334 coll_optional : coll_optional coll_symbols
335 | coll_optional coll_elements
336 | coll_symbols
337 | coll_elements
341 coll_symbols : T_COLLATING_SYMBOL T_SYMBOL T_NL
343 define_collsym($2);
348 coll_elements : T_COLLATING_ELEMENT T_SYMBOL T_FROM string T_NL
350 define_collelem($2, get_wcs());
354 coll_order : T_ORDER_START T_NL order_list T_ORDER_END T_NL
356 /* If no order list supplied default to one forward */
357 add_order_bit(T_FORWARD);
358 add_order_directive();
360 | T_ORDER_START order_args T_NL order_list T_ORDER_END T_NL
364 order_args : order_args T_SEMI order_arg
366 add_order_directive();
368 | order_arg
370 add_order_directive();
374 order_arg : order_arg T_COMMA order_dir
375 | order_dir
378 order_dir : T_FORWARD
380 add_order_bit(T_FORWARD);
382 | T_BACKWARD
384 add_order_bit(T_BACKWARD);
386 | T_POSITION
388 add_order_bit(T_POSITION);
392 order_list : order_list order_item
393 | order_item
396 order_item : T_COLLSYM T_NL
398 end_order_collsym($1);
400 | order_itemkw T_NL
402 end_order();
404 | order_itemkw order_weights T_NL
406 end_order();
410 order_itemkw : T_CHAR
412 start_order_char($1);
414 | T_ELLIPSIS
416 start_order_ellipsis();
418 | T_COLLELEM
420 start_order_collelem($1);
422 | T_UNDEFINED
424 start_order_undefined();
426 | T_SYMBOL
428 start_order_symbol($1);
432 order_weights : order_weights T_SEMI order_weight
433 | order_weights T_SEMI
434 | order_weight
437 order_weight : T_COLLELEM
439 add_order_collelem($1);
441 | T_COLLSYM
443 add_order_collsym($1);
445 | T_CHAR
447 add_order_char($1);
449 | T_ELLIPSIS
451 add_order_ellipsis();
453 | T_IGNORE
455 add_order_ignore();
457 | T_SYMBOL
459 add_order_symbol($1);
461 | T_QUOTE order_str T_QUOTE
463 add_order_subst();
467 order_str : order_str order_stritem
468 | order_stritem
471 order_stritem : T_CHAR
473 add_subst_char($1);
475 | T_COLLSYM
477 add_subst_collsym($1);
479 | T_COLLELEM
481 add_subst_collelem($1);
483 | T_SYMBOL
485 add_subst_symbol($1);
489 messages : T_MESSAGES T_NL messages_list T_END T_MESSAGES T_NL
491 dump_messages();
493 | T_MESSAGES T_NL copycat T_END T_MESSAGES T_NL
496 messages_list : messages_list messages_item
497 | messages_item
500 messages_kw : T_YESSTR
501 | T_NOSTR
502 | T_YESEXPR
503 | T_NOEXPR
506 messages_item : messages_kw string T_NL
508 add_message(get_wcs());
512 monetary : T_MONETARY T_NL monetary_list T_END T_MONETARY T_NL
514 dump_monetary();
516 | T_MONETARY T_NL copycat T_END T_MONETARY T_NL
519 monetary_list : monetary_list monetary_kw
520 | monetary_kw
523 monetary_strkw : T_INT_CURR_SYMBOL
524 | T_CURRENCY_SYMBOL
525 | T_MON_DECIMAL_POINT
526 | T_MON_THOUSANDS_SEP
527 | T_POSITIVE_SIGN
528 | T_NEGATIVE_SIGN
531 monetary_numkw : T_INT_FRAC_DIGITS
532 | T_FRAC_DIGITS
533 | T_P_CS_PRECEDES
534 | T_P_SEP_BY_SPACE
535 | T_N_CS_PRECEDES
536 | T_N_SEP_BY_SPACE
537 | T_P_SIGN_POSN
538 | T_N_SIGN_POSN
539 | T_INT_P_CS_PRECEDES
540 | T_INT_N_CS_PRECEDES
541 | T_INT_P_SEP_BY_SPACE
542 | T_INT_N_SEP_BY_SPACE
543 | T_INT_P_SIGN_POSN
544 | T_INT_N_SIGN_POSN
547 monetary_kw : monetary_strkw string T_NL
549 add_monetary_str(get_wcs());
551 | monetary_numkw T_NUMBER T_NL
553 add_monetary_num($2);
555 | T_MON_GROUPING mon_group_list T_NL
558 mon_group_list : T_NUMBER
560 reset_monetary_group();
561 add_monetary_group($1);
563 | mon_group_list T_SEMI T_NUMBER
565 add_monetary_group($3);
570 numeric : T_NUMERIC T_NL numeric_list T_END T_NUMERIC T_NL
572 dump_numeric();
574 | T_NUMERIC T_NL copycat T_END T_NUMERIC T_NL
578 numeric_list : numeric_list numeric_item
579 | numeric_item
583 numeric_item : numeric_strkw string T_NL
585 add_numeric_str(get_wcs());
587 | T_GROUPING group_list T_NL
590 numeric_strkw : T_DECIMAL_POINT
591 | T_THOUSANDS_SEP
595 group_list : T_NUMBER
597 reset_numeric_group();
598 add_numeric_group($1);
600 | group_list T_SEMI T_NUMBER
602 add_numeric_group($3);
607 time : T_TIME T_NL time_kwlist T_END T_TIME T_NL
609 dump_time();
611 | T_TIME T_NL copycat T_END T_NUMERIC T_NL
614 time_kwlist : time_kwlist time_kw
615 | time_kw
618 time_kw : time_strkw string T_NL
620 add_time_str(get_wcs());
622 | time_listkw time_list T_NL
624 check_time_list();
628 time_listkw : T_ABDAY
629 | T_DAY
630 | T_ABMON
631 | T_MON
632 | T_ERA
633 | T_ALT_DIGITS
634 | T_AM_PM
637 time_strkw : T_ERA_D_T_FMT
638 | T_ERA_T_FMT
639 | T_ERA_D_FMT
640 | T_D_T_FMT
641 | T_D_FMT
642 | T_T_FMT
643 | T_T_FMT_AMPM
644 | T_DATE_FMT
647 time_list : time_list T_SEMI string
649 add_time_list(get_wcs());
651 | string
653 reset_time_list();
654 add_time_list(get_wcs());