diff options
author | Tavian Barnes <tavianator@gmail.com> | 2009-10-28 18:57:31 -0400 |
---|---|---|
committer | Tavian Barnes <tavianator@gmail.com> | 2009-10-28 18:57:31 -0400 |
commit | 8ce6029a6a14c0ef003c88cb9fb29e522c022f9c (patch) | |
tree | 4720666135b504097ba49644612b53bbd106bb7f /dimension | |
parent | 9335c34a93f66318c5d4aaaca4b11595d349421d (diff) | |
download | dimension-8ce6029a6a14c0ef003c88cb9fb29e522c022f9c.tar.xz |
Tokenize strings and language directives.
Diffstat (limited to 'dimension')
-rw-r--r-- | dimension/tokenize.c | 143 | ||||
-rw-r--r-- | dimension/tokenize.h | 7 |
2 files changed, 147 insertions, 3 deletions
diff --git a/dimension/tokenize.c b/dimension/tokenize.c index 8401dc7..97b26be 100644 --- a/dimension/tokenize.c +++ b/dimension/tokenize.c @@ -121,7 +121,7 @@ dmnsn_tokenize_label(char *map, size_t size, dmnsn_token *token, ++i; ++*col; ++*next; - } while (*next - map < size && (isalnum(**next) || **next == '_')); + } while (*next - map < size && (isalnum(**next) || **next == '_')); token->value[i] = '\0'; @@ -146,6 +146,113 @@ dmnsn_tokenize_label(char *map, size_t size, dmnsn_token *token, return 0; } +/* Tokenize a language directive (#include, #declare, etc.). Returns 1 at once unless **next is a hash character; otherwise copies the hash plus any following alphanumeric or underscore characters into a temporary heap buffer (32 bytes, doubled on demand), advancing *next and *col once per character. Returns 0 with token->type set when the word is #include or #declare, else 1; in that case *next and *col stay advanced past the word. The line parameter is not used and token->value is not assigned here. NOTE(review): malloc/realloc results are used unchecked, and isalnum() is given a plain char; confirm the input cannot contain bytes that are negative as char. */ +static int +dmnsn_tokenize_directive(char *map, size_t size, dmnsn_token *token, + char **next, unsigned int *line, unsigned int *col) +{ + unsigned int i = 0, alloc = 32; + + if (**next != '#') { + return 1; + } + + char *directive = malloc(alloc); + + do { + if (i + 1 >= alloc) { + alloc *= 2; + directive = realloc(directive, alloc); + } + + directive[i] = **next; + + ++i; + ++*col; + ++*next; + } while (*next - map < size && (isalnum(**next) || **next == '_')); + + directive[i] = '\0'; + + /* Now check if we really found a directive: each dmnsn_directive() use below frees the buffer, sets token->type and returns 0 on an exact strcmp() match */ + +#define dmnsn_directive(str, tp) \ + do { \ + if (strcmp(directive, str) == 0) { \ + free(directive); \ + token->type = tp; \ + return 0; \ + } \ + } while (0) + + dmnsn_directive("#include", DMNSN_INCLUDE); + dmnsn_directive("#declare", DMNSN_DECLARE); + + free(directive); + return 1; +} + +/* Tokenize a double-quoted string. Returns 1 at once unless **next is a double quote; otherwise sets token->type to DMNSN_STRING and stores the decoded, NUL-terminated contents in a malloc()ed token->value (32 bytes, doubled on demand). Backslash escapes for backslash, double quote and n (newline) are decoded; any other escaped character is copied as-is after a warning on stderr. Always returns 0 once the opening quote is seen. NOTE(review): the loop also stops at the end of the map, so an unterminated string is still reported as success and *next is stepped one past the stopping point; the character after a backslash is read without re-checking the size bound; *col is not advanced for the opening or closing quote; malloc/realloc results are used unchecked. NOTE(review): nothing visible here frees token->value; presumably the caller owns it, confirm. */ +static int +dmnsn_tokenize_string(char *map, size_t size, dmnsn_token *token, + char **next, unsigned int *line, unsigned int *col) +{ + unsigned int i = 0, alloc = 32; + + if (**next != '"') { + return 1; + } + + token->type = DMNSN_STRING; + token->value = malloc(alloc); + + ++*next; /* step over the opening quote */ + while (*next - map < size && **next != '"') { + if (i + 1 >= alloc) { + alloc *= 2; + token->value = realloc(token->value, alloc); + } + + if (**next == '\\') { + ++*col; + ++*next; + + switch (**next) { + case '\\': + token->value[i] = '\\'; + break; + + case '"': + 
token->value[i] = '"'; + break; + + case 'n': + token->value[i] = '\n'; + break; + + default: + fprintf(stderr, + "Warning: unrecognised escape sequence '\\%c'" + " on line %u, column %u\n", + (int)**next, *line, *col); + token->value[i] = **next; + break; + } + } else { + token->value[i] = **next; + } + + ++i; + ++*col; + ++*next; + } + ++*next; /* step over the closing quote, or past the end of the map if none was found */ + + token->value[i] = '\0'; + + return 0; +} + dmnsn_array * dmnsn_tokenize(FILE *file) { @@ -250,14 +357,37 @@ dmnsn_tokenize(FILE *file) } break; + case '#': + /* Language directive; the DMNSN_INCLUDE branch below is an empty placeholder. NOTE(review): dmnsn_tokenize_directive() leaves token.value untouched, confirm it is initialised before this switch */ + if (dmnsn_tokenize_directive(map, size, &token, + &next, &line, &col) == 0) { + if (token.type == DMNSN_INCLUDE) { + } + } else { + fprintf(stderr, "Invalid directive on line %u, column %u.\n", + line, col); + goto bailout; + } + break; + + case '"': + if (dmnsn_tokenize_string(map, size, &token, &next, &line, &col) != 0) { + fprintf(stderr, "Invalid string on line %u, column %u.\n", + line, col); + goto bailout; + } + break; + default: if (dmnsn_tokenize_label(map, size, &token, &next, &line, &col) != 0) { /* Unrecognised character */ fprintf(stderr, - "Unrecognized character 0x%X in input at line %u, column %u.\n", - (unsigned int)*next, line, col); + "Unrecognized character '%c' (0x%X) in input at line %u," + " column %u.\n", + (int)*next, (unsigned int)*next, line, col); goto bailout; } + break; } dmnsn_array_push(tokens, &token); @@ -351,6 +481,13 @@ dmnsn_token_name(dmnsn_token_type token_type) dmnsn_token_map(DMNSN_SPHERE, "sphere"); dmnsn_token_map(DMNSN_BOX, "box"); + /* Directives */ + dmnsn_token_map(DMNSN_INCLUDE, "#include"); + dmnsn_token_map(DMNSN_DECLARE, "#declare"); + + /* Strings */ + dmnsn_token_map(DMNSN_STRING, "string"); + /* Identifiers */ dmnsn_token_map(DMNSN_IDENTIFIER, "identifier"); diff --git a/dimension/tokenize.h b/dimension/tokenize.h index 2e82f98..cc8148f 100644 --- a/dimension/tokenize.h +++ b/dimension/tokenize.h @@ -45,8 +45,15 @@ typedef enum { DMNSN_SPHERE, DMNSN_BOX, + /* Directives (#declare, 
etc.) */ + DMNSN_INCLUDE, /* Only used internally */ + DMNSN_DECLARE, + /* Identifiers */ DMNSN_IDENTIFIER, + + /* Strings; the tokenizer stores the unescaped contents in the token value */ + DMNSN_STRING, } dmnsn_token_type; typedef struct dmnsn_token dmnsn_token; |