/*
 * Copyright 2008-2009 Katholieke Universiteit Leuven
 *
 * Use of this software is governed by the GNU LGPLv2.1 license
 *
 * Written by Sven Verdoolaege, K.U.Leuven, Departement
 * Computerwetenschappen, Celestijnenlaan 200A, B-3001 Leuven, Belgium
 */
14 #include <isl/stream.h>
18 enum isl_token_type type
;
21 static int same_name(const void *entry
, const void *val
)
23 const struct isl_keyword
*keyword
= (const struct isl_keyword
*)entry
;
25 return !strcmp(keyword
->name
, val
);
/* Register the keyword "name" with stream "s".
 *
 * The visible statements create the s->keywords hash table, hash "name",
 * look the name up in that table, allocate a struct isl_keyword, give it
 * the next free token type (s->next_type++), duplicate the name into it
 * and store it in the hash table entry.
 * Several paths return ISL_TOKEN_ERROR.
 *
 * NOTE(review): this extract is missing lines (the rest of the parameter
 * list, the conditions guarding each return, and the final return), so
 * the exact success/failure conditions should be confirmed against the
 * complete file.
 */
28 enum isl_token_type
isl_stream_register_keyword(struct isl_stream
*s
,
31 struct isl_hash_table_entry
*entry
;
32 struct isl_keyword
*keyword
;
/* Allocate the keyword table; 10 is the size argument passed to
 * isl_hash_table_alloc.
 */
36 s
->keywords
= isl_hash_table_alloc(s
->ctx
, 10);
38 return ISL_TOKEN_ERROR
;
/* Token types handed out to keywords start at ISL_TOKEN_LAST. */
39 s
->next_type
= ISL_TOKEN_LAST
;
42 name_hash
= isl_hash_string(isl_hash_init(), name
);
/* Look up the entry for this hash; the remaining arguments of the
 * call are on a line that is not part of this extract.
 */
44 entry
= isl_hash_table_find(s
->ctx
, s
->keywords
, name_hash
,
47 return ISL_TOKEN_ERROR
;
/* Presumably the "already registered" case: reuse the stored keyword
 * (the guarding condition is not visible here).
 */
49 keyword
= entry
->data
;
/* Create a fresh keyword record. */
53 keyword
= isl_calloc_type(s
->ctx
, struct isl_keyword
);
55 return ISL_TOKEN_ERROR
;
56 keyword
->type
= s
->next_type
++;
/* The keyword keeps its own copy of the name. */
57 keyword
->name
= strdup(name
);
60 return ISL_TOKEN_ERROR
;
62 entry
->data
= keyword
;
/* Allocate a new struct isl_token using isl_alloc_type on "ctx" and
 * record whether it is the first token on a new line ("on_new_line").
 *
 * NOTE(review): the lines that presumably store "line" and "col" and
 * return the token are not part of this extract.
 */
67 static struct isl_token
*isl_token_new(struct isl_ctx
*ctx
,
68 int line
, int col
, unsigned on_new_line
)
70 struct isl_token
*tok
= isl_alloc_type(ctx
, struct isl_token
);
75 tok
->on_new_line
= on_new_line
;
/* Release token "tok".
 *
 * A token of type ISL_TOKEN_VALUE holds an isl_int in tok->u.v, which is
 * cleared with isl_int_clear.
 *
 * NOTE(review): the handling of other token types and the release of
 * the token itself are on lines missing from this extract.
 */
81 void isl_token_free(struct isl_token
*tok
)
85 if (tok
->type
== ISL_TOKEN_VALUE
)
86 isl_int_clear(tok
->u
.v
);
/* Print a syntax error message "msg" to stderr.
 *
 * The reported position is taken from "tok" if it is non-NULL and from
 * the current position of stream "s" otherwise.
 * After the message, a description of the token is printed, in a form
 * that depends on the kind of token.
 *
 * NOTE(review): some of the conditions selecting between the "got ..."
 * messages (including, presumably, a check that "tok" is non-NULL) are
 * on lines missing from this extract.
 */
92 void isl_stream_error(struct isl_stream
*s
, struct isl_token
*tok
, char *msg
)
/* Position of the error: the token's if available, else the stream's. */
94 int line
= tok
? tok
->line
: s
->line
;
95 int col
= tok
? tok
->col
: s
->col
;
96 fprintf(stderr
, "syntax error (%d, %d): %s\n", line
, col
, msg
);
/* The token type is printed as a character here. */
99 fprintf(stderr
, "got '%c'\n", tok
->type
);
100 else if (tok
->type
== ISL_TOKEN_IDENT
)
101 fprintf(stderr
, "got ident '%s'\n", tok
->u
.s
);
102 else if (tok
->is_keyword
)
103 fprintf(stderr
, "got keyword '%s'\n", tok
->u
.s
);
104 else if (tok
->type
== ISL_TOKEN_VALUE
) {
/* Integer values are printed through isl_int_print. */
105 fprintf(stderr
, "got value '");
106 isl_int_print(stderr
, tok
->u
.v
, 0);
107 fprintf(stderr
, "'\n");
/* Token printed through its string representation tok->u.s. */
109 fprintf(stderr
, "got token '%s'\n", tok
->u
.s
);
/* Only the numeric token type is printed. */
111 fprintf(stderr
, "got token type %d\n", tok
->type
);
/* Allocate a struct isl_stream on "ctx" and its character buffer of
 * s->size chars.
 *
 * NOTE(review): the initialisation of the remaining fields and the body
 * of the five-iteration loop are not part of this extract; the bound 5
 * matches the limit asserted in isl_stream_push_token, so the loop
 * presumably clears the pushed-back token slots - confirm.
 */
115 static struct isl_stream
* isl_stream_new(struct isl_ctx
*ctx
)
118 struct isl_stream
*s
= isl_alloc_type(ctx
, struct isl_stream
);
130 for (i
= 0; i
< 5; ++i
)
135 s
->buffer
= isl_alloc_array(ctx
, char, s
->size
);
/* Create a stream on "ctx" for the input "file".
 * The stream itself is obtained from isl_stream_new.
 *
 * NOTE(review): the lines attaching "file" to the stream and returning
 * it are not part of this extract.
 */
144 struct isl_stream
* isl_stream_new_file(struct isl_ctx
*ctx
, FILE *file
)
146 struct isl_stream
*s
= isl_stream_new(ctx
);
/* Create a stream on "ctx" for the input string "str".
 * The stream itself is obtained from isl_stream_new.
 *
 * NOTE(review): the lines attaching "str" to the stream and returning
 * it are not part of this extract.
 */
153 struct isl_stream
* isl_stream_new_str(struct isl_ctx
*ctx
, const char *str
)
155 struct isl_stream
*s
= isl_stream_new(ctx
);
/* Read the next character from stream "s".
 * Callers in this file compare the result against -1 to detect that no
 * further character is available.
 *
 * NOTE(review): the body of this function is not part of this extract.
 */
162 static int isl_stream_getc(struct isl_stream
*s
)
/* Hand character "c" back to stream "s".
 * Callers in this file use it after reading one character beyond the
 * end of a token.
 *
 * NOTE(review): the body of this function is not part of this extract.
 */
187 static void isl_stream_ungetc(struct isl_stream
*s
, int c
)
/* Append character "c" to the token buffer of stream "s", growing the
 * buffer first if it is full.
 * Callers treat a non-zero return value as failure.
 *
 * NOTE(review): the failure check after the reallocation and the return
 * statements are on lines missing from this extract.
 */
196 static int isl_stream_push_char(struct isl_stream
*s
, int c
)
198 if (s
->len
>= s
->size
) {
/* Grow the capacity by a factor of 3/2 (integer arithmetic). */
199 s
->size
= (3*s
->size
)/2;
/* NOTE(review): the result is stored directly in s->buffer; if
 * isl_realloc_array can return NULL while leaving the old block
 * allocated, the old pointer is lost here - confirm.
 */
200 s
->buffer
= isl_realloc_array(s
->ctx
, s
->buffer
, char, s
->size
);
204 s
->buffer
[s
->len
++] = c
;
208 void isl_stream_push_token(struct isl_stream
*s
, struct isl_token
*tok
)
210 isl_assert(s
->ctx
, s
->n_token
< 5, return);
211 s
->tokens
[s
->n_token
++] = tok
;
/* Determine the token type of the identifier currently held in
 * s->buffer.
 *
 * The buffer is first compared, ignoring case, against a fixed list of
 * built-in keywords.  It is then looked up (by hash of the buffer
 * contents, using same_name) in the s->keywords table, and the type of
 * the keyword found there is returned.
 * ISL_TOKEN_IDENT is returned on the remaining paths.
 *
 * NOTE(review): the return for "or", the condition before the first
 * ISL_TOKEN_IDENT return and the check on the lookup result are on
 * lines missing from this extract.
 */
214 static enum isl_token_type
check_keywords(struct isl_stream
*s
)
216 struct isl_hash_table_entry
*entry
;
217 struct isl_keyword
*keyword
;
/* Built-in keywords, matched case-insensitively. */
220 if (!strcasecmp(s
->buffer
, "exists"))
221 return ISL_TOKEN_EXISTS
;
222 if (!strcasecmp(s
->buffer
, "and"))
223 return ISL_TOKEN_AND
;
224 if (!strcasecmp(s
->buffer
, "or"))
/* "infty" and "infinity" map to the same token type. */
226 if (!strcasecmp(s
->buffer
, "infty"))
227 return ISL_TOKEN_INFTY
;
228 if (!strcasecmp(s
->buffer
, "infinity"))
229 return ISL_TOKEN_INFTY
;
230 if (!strcasecmp(s
->buffer
, "NaN"))
231 return ISL_TOKEN_NAN
;
232 if (!strcasecmp(s
->buffer
, "max"))
233 return ISL_TOKEN_MAX
;
236 return ISL_TOKEN_IDENT
;
/* Look the buffer up in the s->keywords table. */
238 name_hash
= isl_hash_string(isl_hash_init(), s
->buffer
);
239 entry
= isl_hash_table_find(s
->ctx
, s
->keywords
, name_hash
, same_name
,
242 keyword
= entry
->data
;
243 return keyword
->type
;
/* Not a keyword: plain identifier. */
246 return ISL_TOKEN_IDENT
;
/* Read characters from stream "s" until a newline has been read or
 * isl_stream_getc returns -1.
 * Returns -1 if reading stopped because isl_stream_getc returned -1
 * and 0 if it stopped at a newline.
 *
 * NOTE(review): the declaration of "c" and the loop body are on lines
 * missing from this extract.
 */
249 int isl_stream_skip_line(struct isl_stream
*s
)
253 while ((c
= isl_stream_getc(s
)) != -1 && c
!= '\n')
257 return c
== -1 ? -1 : 0;
/* Return the next token from stream "s".
 *
 * Tokens that were pushed back (s->tokens) are returned first.
 * Otherwise characters are read with isl_stream_getc and assembled
 * into a token; the text of multi-character tokens is collected in
 * s->buffer through isl_stream_push_char.
 * If "same_line" is set, a newline is treated specially in several of
 * the checks below, presumably so that no token from a later line is
 * returned.
 *
 * Each token is created with isl_token_new, passing "old_line != line"
 * as its on_new_line flag.
 *
 * NOTE(review): this extract is missing many lines of the function
 * (declarations, the conditions selecting most branches, error paths
 * and return statements).  The comments below only describe the
 * statements that are visible.
 */
260 static struct isl_token
*next_token(struct isl_stream
*s
, int same_line
)
263 struct isl_token
*tok
= NULL
;
/* Line number before any input is consumed for this token. */
265 int old_line
= s
->line
;
/* Pushed-back tokens.
 * NOTE(review): s->n_token - 1 is used as an index; the check that
 * s->n_token is non-zero is presumably on a missing line - confirm.
 */
268 if (same_line
&& s
->tokens
[s
->n_token
- 1]->on_new_line
)
270 return s
->tokens
[--s
->n_token
];
273 if (same_line
&& s
->c
== '\n')
278 /* skip spaces and comment lines */
279 while ((c
= isl_stream_getc(s
)) != -1) {
281 if (isl_stream_skip_line(s
) < 0)
286 } else if (!isspace(c
) || (same_line
&& c
== '\n'))
293 if (c
== -1 || (same_line
&& c
== '\n'))
/* Token whose type is the character itself. */
311 tok
= isl_token_new(s
->ctx
, line
, col
, old_line
!= line
);
314 tok
->type
= (enum isl_token_type
)c
;
/* "->" */
319 if ((c
= isl_stream_getc(s
)) == '>') {
320 tok
= isl_token_new(s
->ctx
, line
, col
, old_line
!= line
);
323 tok
->u
.s
= strdup("->");
324 tok
->type
= ISL_TOKEN_TO
;
328 isl_stream_ungetc(s
, c
);
/* A '-' token on its own. */
330 tok
= isl_token_new(s
->ctx
, line
, col
, old_line
!= line
);
333 tok
->type
= (enum isl_token_type
) '-';
/* Integer value: an optional leading '-' followed by digits.
 * The digits are collected in s->buffer and converted with
 * isl_int_read.
 */
337 if (c
== '-' || isdigit(c
)) {
338 tok
= isl_token_new(s
->ctx
, line
, col
, old_line
!= line
);
341 tok
->type
= ISL_TOKEN_VALUE
;
342 isl_int_init(tok
->u
.v
);
343 if (isl_stream_push_char(s
, c
))
345 while ((c
= isl_stream_getc(s
)) != -1 && isdigit(c
))
346 if (isl_stream_push_char(s
, c
))
349 isl_stream_ungetc(s
, c
);
350 isl_stream_push_char(s
, '\0');
351 isl_int_read(tok
->u
.v
, s
->buffer
);
/* Identifier or keyword: a letter or '_' followed by letters, digits
 * and '_', and then any number of trailing single quotes.
 * check_keywords decides the final token type.
 */
354 if (isalpha(c
) || c
== '_') {
355 tok
= isl_token_new(s
->ctx
, line
, col
, old_line
!= line
);
358 isl_stream_push_char(s
, c
);
359 while ((c
= isl_stream_getc(s
)) != -1 &&
360 (isalnum(c
) || c
== '_'))
361 isl_stream_push_char(s
, c
);
363 isl_stream_ungetc(s
, c
);
364 while ((c
= isl_stream_getc(s
)) != -1 && c
== '\'')
365 isl_stream_push_char(s
, c
);
367 isl_stream_ungetc(s
, c
);
368 isl_stream_push_char(s
, '\0');
369 tok
->type
= check_keywords(s
);
370 if (tok
->type
!= ISL_TOKEN_IDENT
)
372 tok
->u
.s
= strdup(s
->buffer
);
/* String: characters are collected until a double quote, a newline
 * or -1 is read.
 */
378 tok
= isl_token_new(s
->ctx
, line
, col
, old_line
!= line
);
381 tok
->type
= ISL_TOKEN_STRING
;
383 while ((c
= isl_stream_getc(s
)) != -1 && c
!= '"' && c
!= '\n')
384 isl_stream_push_char(s
, c
);
386 isl_stream_error(s
, NULL
, "unterminated string");
389 isl_stream_push_char(s
, '\0');
390 tok
->u
.s
= strdup(s
->buffer
);
/* ":=" or a single ':'. */
395 tok
= isl_token_new(s
->ctx
, line
, col
, old_line
!= line
);
398 if ((c
= isl_stream_getc(s
)) == '=') {
399 tok
->u
.s
= strdup(":=");
400 tok
->type
= ISL_TOKEN_DEF
;
404 isl_stream_ungetc(s
, c
);
405 tok
->type
= (enum isl_token_type
) ':';
/* ">=", ">>=", ">>" or ">". */
410 tok
= isl_token_new(s
->ctx
, line
, col
, old_line
!= line
);
413 if ((c
= isl_stream_getc(s
)) == '=') {
414 tok
->u
.s
= strdup(">=");
415 tok
->type
= ISL_TOKEN_GE
;
417 } else if (c
== '>') {
418 if ((c
= isl_stream_getc(s
)) == '=') {
419 tok
->u
.s
= strdup(">>=");
420 tok
->type
= ISL_TOKEN_LEX_GE
;
423 tok
->u
.s
= strdup(">>");
424 tok
->type
= ISL_TOKEN_LEX_GT
;
426 tok
->u
.s
= strdup(">");
427 tok
->type
= ISL_TOKEN_GT
;
430 isl_stream_ungetc(s
, c
);
/* "<=", "<<=", "<<" or "<". */
435 tok
= isl_token_new(s
->ctx
, line
, col
, old_line
!= line
);
438 if ((c
= isl_stream_getc(s
)) == '=') {
439 tok
->u
.s
= strdup("<=");
440 tok
->type
= ISL_TOKEN_LE
;
442 } else if (c
== '<') {
443 if ((c
= isl_stream_getc(s
)) == '=') {
444 tok
->u
.s
= strdup("<<=");
445 tok
->type
= ISL_TOKEN_LEX_LE
;
448 tok
->u
.s
= strdup("<<");
449 tok
->type
= ISL_TOKEN_LEX_LT
;
451 tok
->u
.s
= strdup("<");
452 tok
->type
= ISL_TOKEN_LT
;
455 isl_stream_ungetc(s
, c
);
/* "&" and "&&" both yield ISL_TOKEN_AND; only the stored string
 * differs.
 */
459 tok
= isl_token_new(s
->ctx
, line
, col
, old_line
!= line
);
462 tok
->type
= ISL_TOKEN_AND
;
463 if ((c
= isl_stream_getc(s
)) != '&' && c
!= -1) {
464 tok
->u
.s
= strdup("&");
465 isl_stream_ungetc(s
, c
);
467 tok
->u
.s
= strdup("&&");
/* "|" and "||" both yield ISL_TOKEN_OR; only the stored string
 * differs.
 */
471 tok
= isl_token_new(s
->ctx
, line
, col
, old_line
!= line
);
474 tok
->type
= ISL_TOKEN_OR
;
475 if ((c
= isl_stream_getc(s
)) != '|' && c
!= -1) {
476 tok
->u
.s
= strdup("|");
477 isl_stream_ungetc(s
, c
);
479 tok
->u
.s
= strdup("||");
/* Anything else is reported as an unknown token. */
483 tok
= isl_token_new(s
->ctx
, line
, col
, old_line
!= line
);
486 tok
->type
= ISL_TOKEN_UNKNOWN
;
/* Return the next token of stream "s", regardless of the line on
 * which it appears (next_token is called with same_line equal to 0).
 */
struct isl_token *isl_stream_next_token(struct isl_stream *s)
{
	struct isl_token *tok;

	tok = next_token(s, 0);
	return tok;
}
/* Return the next token of stream "s" in "same line" mode
 * (next_token is called with same_line equal to 1).
 */
struct isl_token *isl_stream_next_token_on_same_line(struct isl_stream *s)
{
	struct isl_token *tok;

	tok = next_token(s, 1);
	return tok;
}
/* Read the next token of stream "s" and compare its type to "type".
 * The token is pushed back onto the stream on one of the paths.
 *
 * NOTE(review): the body of the matching branch, the check of "tok"
 * and the return statements are on lines missing from this extract;
 * presumably a matching token is consumed and a non-matching one is
 * pushed back - confirm.
 */
503 int isl_stream_eat_if_available(struct isl_stream
*s
, int type
)
505 struct isl_token
*tok
;
507 tok
= isl_stream_next_token(s
);
510 if (tok
->type
== type
) {
514 isl_stream_push_token(s
, tok
);
/* Check whether the next token of stream "s" has type "type".
 * The token is read, its type is compared to "type" and the token is
 * pushed back onto the stream, so the stream keeps the token.
 *
 * NOTE(review): the declaration of "r", the check of "tok" and the
 * return statements are on lines missing from this extract.
 */
518 int isl_stream_next_token_is(struct isl_stream
*s
, int type
)
520 struct isl_token
*tok
;
523 tok
= isl_stream_next_token(s
);
526 r
= tok
->type
== type
;
527 isl_stream_push_token(s
, tok
);
/* Read the next token of stream "s"; if it is an identifier
 * (ISL_TOKEN_IDENT), make a copy of its name with strdup.
 * The token is pushed back onto the stream on one of the paths.
 *
 * NOTE(review): the rest of the identifier branch, the check of "tok"
 * and the return statements are on lines missing from this extract;
 * presumably the copy is returned and must be freed by the caller -
 * confirm.
 */
531 char *isl_stream_read_ident_if_available(struct isl_stream
*s
)
533 struct isl_token
*tok
;
535 tok
= isl_stream_next_token(s
);
538 if (tok
->type
== ISL_TOKEN_IDENT
) {
539 char *ident
= strdup(tok
->u
.s
);
543 isl_stream_push_token(s
, tok
);
/* Read the next token of stream "s" and compare its type to "type".
 * The visible error path reports "expecting other token" through
 * isl_stream_error and pushes the token back onto the stream.
 *
 * NOTE(review): the body of the matching branch, the check of "tok"
 * and the return statements are on lines missing from this extract.
 */
547 int isl_stream_eat(struct isl_stream
*s
, int type
)
549 struct isl_token
*tok
;
551 tok
= isl_stream_next_token(s
);
554 if (tok
->type
== type
) {
558 isl_stream_error(s
, tok
, "expecting other token");
559 isl_stream_push_token(s
, tok
);
/* Probe stream "s" for a further token: the next token is read and
 * then pushed back onto the stream.
 *
 * NOTE(review): the check of "tok" and the return statements are on
 * lines missing from this extract; presumably a missing token means
 * the stream is empty - confirm.
 */
563 int isl_stream_is_empty(struct isl_stream
*s
)
565 struct isl_token
*tok
;
567 tok
= isl_stream_next_token(s
);
572 isl_stream_push_token(s
, tok
);
/* Callback passed to isl_hash_table_foreach by isl_stream_free.
 * "*p" is interpreted as a struct isl_keyword.
 *
 * NOTE(review): the statements operating on "keyword" and the return
 * value are on lines missing from this extract; given the name, it
 * presumably frees the keyword - confirm.
 */
576 static int free_keyword(void **p
, void *user
)
578 struct isl_keyword
*keyword
= *p
;
/* Free every token currently stored in the s->tokens array of
 * stream "s" (entries 0 up to s->n_token - 1) using isl_token_free.
 *
 * NOTE(review): the declaration of "i" and any statements before and
 * after the loop (such as resetting s->n_token) are on lines missing
 * from this extract.
 */
586 void isl_stream_flush_tokens(struct isl_stream
*s
)
592 for (i
= 0; i
< s
->n_token
; ++i
)
593 isl_token_free(s
->tokens
[i
]);
/* Release stream "s".
 *
 * If tokens are still pending on the stream (s->n_token != 0), the
 * next one is reported through isl_stream_error as "unexpected token".
 * The keywords in s->keywords are visited with free_keyword, the hash
 * table is freed and the reference to s->ctx is dropped.
 *
 * NOTE(review): several lines of this function (including its end and
 * any guards around the statements below) are missing from this
 * extract.
 */
597 void isl_stream_free(struct isl_stream
*s
)
/* Left-over tokens indicate input that was never consumed. */
602 if (s
->n_token
!= 0) {
603 struct isl_token
*tok
= isl_stream_next_token(s
);
604 isl_stream_error(s
, tok
, "unexpected token");
/* Release the registered keywords and the table holding them. */
608 isl_hash_table_foreach(s
->ctx
, s
->keywords
, &free_keyword
, NULL
);
609 isl_hash_table_free(s
->ctx
, s
->keywords
);
611 isl_ctx_deref(s
->ctx
);