/* * Copyright 2008-2009 Katholieke Universiteit Leuven * * Use of this software is governed by the MIT license * * Written by Sven Verdoolaege, K.U.Leuven, Departement * Computerwetenschappen, Celestijnenlaan 200A, B-3001 Leuven, Belgium */ #include #include #include #include #include #include #include #include struct isl_keyword { char *name; enum isl_token_type type; }; static int same_name(const void *entry, const void *val) { const struct isl_keyword *keyword = (const struct isl_keyword *)entry; return !strcmp(keyword->name, val); } enum isl_token_type isl_stream_register_keyword(struct isl_stream *s, const char *name) { struct isl_hash_table_entry *entry; struct isl_keyword *keyword; uint32_t name_hash; if (!s->keywords) { s->keywords = isl_hash_table_alloc(s->ctx, 10); if (!s->keywords) return ISL_TOKEN_ERROR; s->next_type = ISL_TOKEN_LAST; } name_hash = isl_hash_string(isl_hash_init(), name); entry = isl_hash_table_find(s->ctx, s->keywords, name_hash, same_name, name, 1); if (!entry) return ISL_TOKEN_ERROR; if (entry->data) { keyword = entry->data; return keyword->type; } keyword = isl_calloc_type(s->ctx, struct isl_keyword); if (!keyword) return ISL_TOKEN_ERROR; keyword->type = s->next_type++; keyword->name = strdup(name); if (!keyword->name) { free(keyword); return ISL_TOKEN_ERROR; } entry->data = keyword; return keyword->type; } struct isl_token *isl_token_new(isl_ctx *ctx, int line, int col, unsigned on_new_line) { struct isl_token *tok = isl_alloc_type(ctx, struct isl_token); if (!tok) return NULL; tok->line = line; tok->col = col; tok->on_new_line = on_new_line; tok->is_keyword = 0; tok->u.s = NULL; return tok; } /* Return the type of "tok". */ int isl_token_get_type(struct isl_token *tok) { return tok ? tok->type : ISL_TOKEN_ERROR; } /* Given a token of type ISL_TOKEN_VALUE, return the value it represents. */ __isl_give isl_val *isl_token_get_val(isl_ctx *ctx, struct isl_token *tok) { if (!tok) return NULL; if (tok->type != ISL_TOKEN_VALUE) isl_die(ctx, isl_error_invalid, "not a value token", return NULL); return isl_val_int_from_isl_int(ctx, tok->u.v); } /* Given a token of type ISL_TOKEN_STRING, return the string it represents. */ __isl_give char *isl_token_get_str(isl_ctx *ctx, struct isl_token *tok) { if (!tok) return NULL; if (tok->type != ISL_TOKEN_STRING) isl_die(ctx, isl_error_invalid, "not a string token", return NULL); return strdup(tok->u.s); } void isl_token_free(struct isl_token *tok) { if (!tok) return; if (tok->type == ISL_TOKEN_VALUE) isl_int_clear(tok->u.v); else if (tok->type == ISL_TOKEN_MAP) isl_map_free(tok->u.map); else if (tok->type == ISL_TOKEN_AFF) isl_pw_aff_free(tok->u.pwaff); else free(tok->u.s); free(tok); } void isl_stream_error(struct isl_stream *s, struct isl_token *tok, char *msg) { int line = tok ? tok->line : s->line; int col = tok ? tok->col : s->col; fprintf(stderr, "syntax error (%d, %d): %s\n", line, col, msg); if (tok) { if (tok->type < 256) fprintf(stderr, "got '%c'\n", tok->type); else if (tok->type == ISL_TOKEN_IDENT) fprintf(stderr, "got ident '%s'\n", tok->u.s); else if (tok->is_keyword) fprintf(stderr, "got keyword '%s'\n", tok->u.s); else if (tok->type == ISL_TOKEN_VALUE) { fprintf(stderr, "got value '"); isl_int_print(stderr, tok->u.v, 0); fprintf(stderr, "'\n"); } else if (tok->type == ISL_TOKEN_MAP) { isl_printer *p; fprintf(stderr, "got map '"); p = isl_printer_to_file(s->ctx, stderr); p = isl_printer_print_map(p, tok->u.map); isl_printer_free(p); fprintf(stderr, "'\n"); } else if (tok->type == ISL_TOKEN_AFF) { isl_printer *p; fprintf(stderr, "got affine expression '"); p = isl_printer_to_file(s->ctx, stderr); p = isl_printer_print_pw_aff(p, tok->u.pwaff); isl_printer_free(p); fprintf(stderr, "'\n"); } else if (tok->u.s) fprintf(stderr, "got token '%s'\n", tok->u.s); else fprintf(stderr, "got token type %d\n", tok->type); } } static struct isl_stream* isl_stream_new(struct isl_ctx *ctx) { int i; struct isl_stream *s = isl_alloc_type(ctx, struct isl_stream); if (!s) return NULL; s->ctx = ctx; isl_ctx_ref(s->ctx); s->file = NULL; s->str = NULL; s->len = 0; s->line = 1; s->col = 0; s->eof = 0; s->c = -1; s->n_un = 0; for (i = 0; i < 5; ++i) s->tokens[i] = NULL; s->n_token = 0; s->keywords = NULL; s->size = 256; s->buffer = isl_alloc_array(ctx, char, s->size); if (!s->buffer) goto error; return s; error: isl_stream_free(s); return NULL; } struct isl_stream* isl_stream_new_file(struct isl_ctx *ctx, FILE *file) { struct isl_stream *s = isl_stream_new(ctx); if (!s) return NULL; s->file = file; return s; } struct isl_stream* isl_stream_new_str(struct isl_ctx *ctx, const char *str) { struct isl_stream *s; if (!str) return NULL; s = isl_stream_new(ctx); if (!s) return NULL; s->str = str; return s; } static int stream_getc(struct isl_stream *s) { int c; if (s->eof) return -1; if (s->n_un) return s->c = s->un[--s->n_un]; if (s->file) c = fgetc(s->file); else { c = *s->str++; if (c == '\0') c = -1; } if (c == -1) s->eof = 1; if (!s->eof) { if (s->c == '\n') { s->line++; s->col = 0; } else s->col++; } s->c = c; return c; } static void isl_stream_ungetc(struct isl_stream *s, int c) { isl_assert(s->ctx, s->n_un < 5, return); s->un[s->n_un++] = c; s->c = -1; } static int isl_stream_getc(struct isl_stream *s) { int c; do { c = stream_getc(s); if (c != '\\') return c; c = stream_getc(s); } while (c == '\n'); isl_stream_ungetc(s, c); return '\\'; } static int isl_stream_push_char(struct isl_stream *s, int c) { if (s->len >= s->size) { char *buffer; s->size = (3*s->size)/2; buffer = isl_realloc_array(s->ctx, s->buffer, char, s->size); if (!buffer) return -1; s->buffer = buffer; } s->buffer[s->len++] = c; return 0; } void isl_stream_push_token(struct isl_stream *s, struct isl_token *tok) { isl_assert(s->ctx, s->n_token < 5, return); s->tokens[s->n_token++] = tok; } static enum isl_token_type check_keywords(struct isl_stream *s) { struct isl_hash_table_entry *entry; struct isl_keyword *keyword; uint32_t name_hash; if (!strcasecmp(s->buffer, "exists")) return ISL_TOKEN_EXISTS; if (!strcasecmp(s->buffer, "and")) return ISL_TOKEN_AND; if (!strcasecmp(s->buffer, "or")) return ISL_TOKEN_OR; if (!strcasecmp(s->buffer, "implies")) return ISL_TOKEN_IMPLIES; if (!strcasecmp(s->buffer, "not")) return ISL_TOKEN_NOT; if (!strcasecmp(s->buffer, "infty")) return ISL_TOKEN_INFTY; if (!strcasecmp(s->buffer, "infinity")) return ISL_TOKEN_INFTY; if (!strcasecmp(s->buffer, "NaN")) return ISL_TOKEN_NAN; if (!strcasecmp(s->buffer, "min")) return ISL_TOKEN_MIN; if (!strcasecmp(s->buffer, "max")) return ISL_TOKEN_MAX; if (!strcasecmp(s->buffer, "rat")) return ISL_TOKEN_RAT; if (!strcasecmp(s->buffer, "true")) return ISL_TOKEN_TRUE; if (!strcasecmp(s->buffer, "false")) return ISL_TOKEN_FALSE; if (!strcasecmp(s->buffer, "ceild")) return ISL_TOKEN_CEILD; if (!strcasecmp(s->buffer, "floord")) return ISL_TOKEN_FLOORD; if (!strcasecmp(s->buffer, "mod")) return ISL_TOKEN_MOD; if (!strcasecmp(s->buffer, "ceil")) return ISL_TOKEN_CEIL; if (!strcasecmp(s->buffer, "floor")) return ISL_TOKEN_FLOOR; if (!s->keywords) return ISL_TOKEN_IDENT; name_hash = isl_hash_string(isl_hash_init(), s->buffer); entry = isl_hash_table_find(s->ctx, s->keywords, name_hash, same_name, s->buffer, 0); if (entry) { keyword = entry->data; return keyword->type; } return ISL_TOKEN_IDENT; } int isl_stream_skip_line(struct isl_stream *s) { int c; while ((c = isl_stream_getc(s)) != -1 && c != '\n') /* nothing */ ; return c == -1 ? -1 : 0; } static struct isl_token *next_token(struct isl_stream *s, int same_line) { int c; struct isl_token *tok = NULL; int line, col; int old_line = s->line; if (s->n_token) { if (same_line && s->tokens[s->n_token - 1]->on_new_line) return NULL; return s->tokens[--s->n_token]; } if (same_line && s->c == '\n') return NULL; s->len = 0; /* skip spaces and comment lines */ while ((c = isl_stream_getc(s)) != -1) { if (c == '#') { if (isl_stream_skip_line(s) < 0) break; c = '\n'; if (same_line) break; } else if (!isspace(c) || (same_line && c == '\n')) break; } line = s->line; col = s->col; if (c == -1 || (same_line && c == '\n')) return NULL; if (c == '(' || c == ')' || c == '+' || c == '*' || c == '%' || c == '?' || c == '^' || c == '@' || c == '$' || c == ',' || c == '.' || c == ';' || c == '[' || c == ']' || c == '{' || c == '}') { tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; tok->type = (enum isl_token_type)c; return tok; } if (c == '-') { int c; if ((c = isl_stream_getc(s)) == '>') { tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; tok->u.s = strdup("->"); tok->type = ISL_TOKEN_TO; return tok; } if (c != -1) isl_stream_ungetc(s, c); if (!isdigit(c)) { tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; tok->type = (enum isl_token_type) '-'; return tok; } } if (c == '-' || isdigit(c)) { int minus = c == '-'; tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; tok->type = ISL_TOKEN_VALUE; isl_int_init(tok->u.v); if (isl_stream_push_char(s, c)) goto error; while ((c = isl_stream_getc(s)) != -1 && isdigit(c)) if (isl_stream_push_char(s, c)) goto error; if (c != -1) isl_stream_ungetc(s, c); isl_stream_push_char(s, '\0'); isl_int_read(tok->u.v, s->buffer); if (minus && isl_int_is_zero(tok->u.v)) { tok->col++; tok->on_new_line = 0; isl_stream_push_token(s, tok); tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; tok->type = (enum isl_token_type) '-'; } return tok; } if (isalpha(c) || c == '_') { tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; isl_stream_push_char(s, c); while ((c = isl_stream_getc(s)) != -1 && (isalnum(c) || c == '_')) isl_stream_push_char(s, c); if (c != -1) isl_stream_ungetc(s, c); while ((c = isl_stream_getc(s)) != -1 && c == '\'') isl_stream_push_char(s, c); if (c != -1) isl_stream_ungetc(s, c); isl_stream_push_char(s, '\0'); tok->type = check_keywords(s); if (tok->type != ISL_TOKEN_IDENT) tok->is_keyword = 1; tok->u.s = strdup(s->buffer); if (!tok->u.s) goto error; return tok; } if (c == '"') { tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; tok->type = ISL_TOKEN_STRING; tok->u.s = NULL; while ((c = isl_stream_getc(s)) != -1 && c != '"' && c != '\n') isl_stream_push_char(s, c); if (c != '"') { isl_stream_error(s, NULL, "unterminated string"); goto error; } isl_stream_push_char(s, '\0'); tok->u.s = strdup(s->buffer); return tok; } if (c == '=') { int c; tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; if ((c = isl_stream_getc(s)) == '=') { tok->u.s = strdup("=="); tok->type = ISL_TOKEN_EQ_EQ; return tok; } if (c != -1) isl_stream_ungetc(s, c); tok->type = (enum isl_token_type) '='; return tok; } if (c == ':') { int c; tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; if ((c = isl_stream_getc(s)) == '=') { tok->u.s = strdup(":="); tok->type = ISL_TOKEN_DEF; return tok; } if (c != -1) isl_stream_ungetc(s, c); tok->type = (enum isl_token_type) ':'; return tok; } if (c == '>') { int c; tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; if ((c = isl_stream_getc(s)) == '=') { tok->u.s = strdup(">="); tok->type = ISL_TOKEN_GE; return tok; } else if (c == '>') { if ((c = isl_stream_getc(s)) == '=') { tok->u.s = strdup(">>="); tok->type = ISL_TOKEN_LEX_GE; return tok; } tok->u.s = strdup(">>"); tok->type = ISL_TOKEN_LEX_GT; } else { tok->u.s = strdup(">"); tok->type = ISL_TOKEN_GT; } if (c != -1) isl_stream_ungetc(s, c); return tok; } if (c == '<') { int c; tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; if ((c = isl_stream_getc(s)) == '=') { tok->u.s = strdup("<="); tok->type = ISL_TOKEN_LE; return tok; } else if (c == '<') { if ((c = isl_stream_getc(s)) == '=') { tok->u.s = strdup("<<="); tok->type = ISL_TOKEN_LEX_LE; return tok; } tok->u.s = strdup("<<"); tok->type = ISL_TOKEN_LEX_LT; } else { tok->u.s = strdup("<"); tok->type = ISL_TOKEN_LT; } if (c != -1) isl_stream_ungetc(s, c); return tok; } if (c == '&') { tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; tok->type = ISL_TOKEN_AND; if ((c = isl_stream_getc(s)) != '&' && c != -1) { tok->u.s = strdup("&"); isl_stream_ungetc(s, c); } else tok->u.s = strdup("&&"); return tok; } if (c == '|') { tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; tok->type = ISL_TOKEN_OR; if ((c = isl_stream_getc(s)) != '|' && c != -1) { tok->u.s = strdup("|"); isl_stream_ungetc(s, c); } else tok->u.s = strdup("||"); return tok; } if (c == '/') { tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; if ((c = isl_stream_getc(s)) != '\\' && c != -1) { tok->type = (enum isl_token_type) '/'; isl_stream_ungetc(s, c); } else { tok->u.s = strdup("/\\"); tok->type = ISL_TOKEN_AND; } return tok; } if (c == '\\') { tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; if ((c = isl_stream_getc(s)) != '/' && c != -1) { tok->type = (enum isl_token_type) '\\'; isl_stream_ungetc(s, c); } else { tok->u.s = strdup("\\/"); tok->type = ISL_TOKEN_OR; } return tok; } if (c == '!') { tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; if ((c = isl_stream_getc(s)) == '=') { tok->u.s = strdup("!="); tok->type = ISL_TOKEN_NE; return tok; } else { tok->type = ISL_TOKEN_NOT; tok->u.s = strdup("!"); } if (c != -1) isl_stream_ungetc(s, c); return tok; } tok = isl_token_new(s->ctx, line, col, old_line != line); if (!tok) return NULL; tok->type = ISL_TOKEN_UNKNOWN; return tok; error: isl_token_free(tok); return NULL; } struct isl_token *isl_stream_next_token(struct isl_stream *s) { return next_token(s, 0); } struct isl_token *isl_stream_next_token_on_same_line(struct isl_stream *s) { return next_token(s, 1); } int isl_stream_eat_if_available(struct isl_stream *s, int type) { struct isl_token *tok; tok = isl_stream_next_token(s); if (!tok) return 0; if (tok->type == type) { isl_token_free(tok); return 1; } isl_stream_push_token(s, tok); return 0; } int isl_stream_next_token_is(struct isl_stream *s, int type) { struct isl_token *tok; int r; tok = isl_stream_next_token(s); if (!tok) return 0; r = tok->type == type; isl_stream_push_token(s, tok); return r; } char *isl_stream_read_ident_if_available(struct isl_stream *s) { struct isl_token *tok; tok = isl_stream_next_token(s); if (!tok) return NULL; if (tok->type == ISL_TOKEN_IDENT) { char *ident = strdup(tok->u.s); isl_token_free(tok); return ident; } isl_stream_push_token(s, tok); return NULL; } int isl_stream_eat(struct isl_stream *s, int type) { struct isl_token *tok; tok = isl_stream_next_token(s); if (!tok) return -1; if (tok->type == type) { isl_token_free(tok); return 0; } isl_stream_error(s, tok, "expecting other token"); isl_stream_push_token(s, tok); return -1; } int isl_stream_is_empty(struct isl_stream *s) { struct isl_token *tok; tok = isl_stream_next_token(s); if (!tok) return 1; isl_stream_push_token(s, tok); return 0; } static int free_keyword(void **p, void *user) { struct isl_keyword *keyword = *p; free(keyword->name); free(keyword); return 0; } void isl_stream_flush_tokens(struct isl_stream *s) { int i; if (!s) return; for (i = 0; i < s->n_token; ++i) isl_token_free(s->tokens[i]); s->n_token = 0; } void isl_stream_free(struct isl_stream *s) { if (!s) return; free(s->buffer); if (s->n_token != 0) { struct isl_token *tok = isl_stream_next_token(s); isl_stream_error(s, tok, "unexpected token"); isl_token_free(tok); } if (s->keywords) { isl_hash_table_foreach(s->ctx, s->keywords, &free_keyword, NULL); isl_hash_table_free(s->ctx, s->keywords); } isl_ctx_deref(s->ctx); free(s); }