#include #include #include #include #include #include #include // NEVER, EVER HAVE TO CALL FREE (EVER) AGAIN (YES, REALLY) #define malloc(n) GC_MALLOC(n) #define realloc(o, n) GC_REALLOC(o, n) typedef enum { Undefined, Integer, Symbol } type_t; union object; typedef union object *oop; struct Undefined { type_t type; }; struct Integer { type_t type; int value; }; struct Symbol { type_t type; char *name; int defined; oop value; // NULL }; union object { type_t type; struct Undefined Undefined; struct Integer Integer; struct Symbol Symbol; }; union object _null = { .Undefined = { Undefined } }; oop null = &_null; oop _checkType(oop ptr, type_t type) { assert(ptr->type == type); return ptr; } #define get(PTR, TYPE, FIELD) _checkType(PTR, TYPE)->TYPE.FIELD #define set(PTR, TYPE, FIELD, VALUE) _checkType(PTR, TYPE)->TYPE.FIELD = VALUE void *memcheck(void *ptr) { if (NULL == ptr) { fprintf(stderr, "Error: out of memory\n"); exit(EX_OSERR); // this is as close as we have for 'resource unavailable' } return ptr; } oop makeInteger(int value) { oop newInt = memcheck(malloc(sizeof(union object))); newInt->type = Integer; newInt->Integer.value = value; return newInt; } oop makeSymbol(char *name) { oop newSymb = memcheck(malloc(sizeof(union object))); newSymb->type = Symbol; newSymb->Symbol.name = name; newSymb->Symbol.defined = 0; newSymb->Symbol.value = null; return newSymb; } void print(oop ast) { switch (ast->type) { case Undefined: printf("null"); return; case Integer: printf("%i", get(ast, Integer, value)); return; case Symbol: printf("%s=", get(ast, Symbol, name)); print(get(ast, Symbol, value)); return; } assert(0); } void println(oop ast) { print(ast); printf("\n"); } #define SYMBOL_TABLE_CHUNK 4 typedef struct table_t { oop *array; size_t size; size_t capacity; } table_t; #define TABLE_INITIALISER { NULL, 0, 0 } // first call to table_insert() will initialise storage table_t table = TABLE_INITIALISER; // safe but not strictly needed on Unix because BSS segment is initialised to all zeroes ssize_t table_search(table_t *table, char *ident) { ssize_t l = 0, r = table->size - 1; while (l <= r) { ssize_t mid = (l + r) / 2; int cmpres = strcmp(get(table->array[mid], Symbol, name), ident); if (cmpres > 0) r = mid - 1; else if (cmpres < 0) l = mid + 1; else return mid; // non-negative result => element found at this index } return -1 - l; // negative result => 'not found', reflected around -1 instead of 0 to allow 'not found' at index 0 } // ssize_t result because -1 means 'error' ssize_t table_insert(table_t *table, oop object, size_t pos) { // Should I use in my code a function starting with _ or is it a convention to prevent its usage ? _checkType(object, Symbol); if (pos > table->size) { // don't need to check for pos < 0 because size_t is unsigned return -1; } if (table->size >= table->capacity) { // on the first call table->array will be NULL and realloc() will behave like malloc() table->array = memcheck(realloc(table->array, sizeof(oop) * (table->capacity + SYMBOL_TABLE_CHUNK))); table->capacity += SYMBOL_TABLE_CHUNK; } memmove(table->array + pos + 1, table->array + pos, sizeof(*table->array) * (table->size - pos)); table->array[pos] = object; return ++(table->size); } oop intern(char *ident) { ssize_t res= table_search(&table, ident); // < 0 => not found if (res >= 0) return table.array[res]; res= -1 - res; // 'un-negate' the result by reflecting it around X=-1 oop new_symbol = makeSymbol(memcheck(strdup(ident))); table_insert(&table, new_symbol, res); return new_symbol; } oop update_symbol_value(oop symbol, oop integer) { _checkType(symbol, Symbol); _checkType(integer, Integer); symbol->Symbol.value = integer; return symbol; } int main() { char *line= 0; // this and size_t linecap= 0; // this are needed for getline() intern("chaussure"); // identifiers will have no trailing newline so let's test with no trailing newline printf("Enter identifier names!\n"); for (;;) { // using an infinite loop simplifies the break/continue logic in the body ssize_t len= getline(&line, &linecap, stdin); // use getline() to auto-grow the buffer when necessary if (len < 0) break; // stop at EOF while ((len > 0) && ('\n' == line[len-1])) line[--len]= 0; // trim newlines from the end if (len < 1) continue; // ignore empty lines printf("intern : %p\n", intern(line)); printf("after size : %zi\n", table.size); printf("after capacity : %zi\n", table.capacity); printf("\n"); for (int i = 0; i < table.size; i++) { printf("%i %s\n", i, get(table.array[i], Symbol, name)); } printf("\n"); } }