summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--allocator.c18
-rw-r--r--archive/arr.c69
-rw-r--r--arr.c110
-rw-r--r--blockarr.c13
-rw-r--r--eval.c22
-rw-r--r--identifiers.c31
-rw-r--r--location.c7
-rw-r--r--parse.c242
-rw-r--r--toc.c23
-rw-r--r--tokenizer.c110
-rw-r--r--types.h471
11 files changed, 584 insertions, 532 deletions
diff --git a/allocator.c b/allocator.c
index 2b6b0b3..6add3cf 100644
--- a/allocator.c
+++ b/allocator.c
@@ -1,21 +1,3 @@
-typedef struct Page {
- struct Page *next;
- size_t used;
- max_align_t data[];
-} Page;
-
-typedef struct DynPage {
- struct DynPage **self;
- max_align_t data[];
-} DynPage;
-
-typedef struct {
- Page *first;
- Page *last;
- DynPage **dyn;
- size_t dyn_len;
- size_t dyn_cap;
-} Allocator;
/* number of bytes a page hold, not including the header */
#define PAGE_SIZE (16384 - sizeof(Page))
diff --git a/archive/arr.c b/archive/arr.c
new file mode 100644
index 0000000..2a055b1
--- /dev/null
+++ b/archive/arr.c
@@ -0,0 +1,69 @@
+
+static void arr_create(Array *arr, size_t item_sz) {
+ arr->len = arr->cap = 0;
+ arr->item_sz = item_sz;
+ arr->data = NULL;
+}
+
+static inline void arr_reserve(Array *arr, size_t n) {
+ arr->cap = n;
+ arr->data = err_realloc(arr->data, arr->item_sz * arr->cap);
+}
+
+static inline void arr_reservea(Array *arr, size_t n, Allocator *a) {
+ arr->cap = n;
+ arr->data = allocr_realloc(a, arr->data, arr->item_sz * arr->cap);
+}
+
+/* like arr_reserve, but sets the length of the array too */
+static inline void arr_set_len(Array *arr, size_t n) {
+ arr_reserve(arr, n);
+ arr->len = n;
+}
+
+static inline void arr_set_lena(Array *arr, size_t n, Allocator *a) {
+ arr_reservea(arr, n, a);
+ arr->len = n;
+}
+
+static inline void *arr_last(Array *arr) {
+ if (arr->data)
+ return (void*)((char*)arr->data + arr->item_sz * (arr->len - 1));
+ else
+ return NULL;
+}
+
+static void *arr_add(Array *arr) {
+ if (arr->len >= arr->cap) {
+ arr_reserve(arr, (arr->cap + 1) * 2);
+ }
+ arr->len++;
+ return (void*)((char*)arr->data + arr->item_sz * (arr->len - 1));
+}
+
+static void *arr_adda(Array *arr, Allocator *a) {
+ if (arr->len >= arr->cap) {
+ arr_reservea(arr, (arr->cap + 1) * 2, a);
+ }
+ arr->len++;
+ return (void*)((char*)arr->data + arr->item_sz * (arr->len - 1));
+}
+
+static void arr_clear(Array *arr) {
+ free(arr->data);
+ arr->len = arr->cap = 0;
+ arr->data = NULL;
+}
+
+static void arr_remove_last(Array *arr) {
+ /* OPTIM (memory): Shorten array. */
+ arr->len--;
+}
+
+static void arr_free(Array *arr) {
+ free(arr->data);
+}
+
+/* NOTE: this will not work if type is a pointer! */
+#define arr_foreach(arr, type, var) for (type *var = (arr)->data, *var##_foreach_last = arr_last(arr); var; var == var##_foreach_last ? var = NULL : var++)
+#define arr_foreach_reverse(arr, type, var) for (type *var = arr_last(arr); var; var == (arr)->data ? var = NULL : var--)
diff --git a/arr.c b/arr.c
index ff94377..6ec7db2 100644
--- a/arr.c
+++ b/arr.c
@@ -1,75 +1,49 @@
+/* OPTIM: is it faster to store void *end? */
typedef struct {
- void *data;
size_t len;
size_t cap;
- size_t item_sz;
-} Array;
-
-static void arr_create(Array *arr, size_t item_sz) {
- arr->len = arr->cap = 0;
- arr->item_sz = item_sz;
- arr->data = NULL;
-}
-
-static inline void arr_reserve(Array *arr, size_t n) {
- arr->cap = n;
- arr->data = err_realloc(arr->data, arr->item_sz * arr->cap);
-}
-
-static inline void arr_reservea(Array *arr, size_t n, Allocator *a) {
- arr->cap = n;
- arr->data = allocr_realloc(a, arr->data, arr->item_sz * arr->cap);
-}
-
-/* like arr_reserve, but sets the length of the array too */
-static inline void arr_set_len(Array *arr, size_t n) {
- arr_reserve(arr, n);
- arr->len = n;
-}
-
-static inline void arr_set_lena(Array *arr, size_t n, Allocator *a) {
- arr_reservea(arr, n, a);
- arr->len = n;
-}
-
-static inline void *arr_last(Array *arr) {
- if (arr->data)
- return (void*)((char*)arr->data + arr->item_sz * (arr->len - 1));
- else
- return NULL;
-}
-
-static void *arr_add(Array *arr) {
- if (arr->len >= arr->cap) {
- arr_reserve(arr, (arr->cap + 1) * 2);
+ max_align_t data[];
+} ArrHeader;
+
+static inline ArrHeader *arr_hdr(void *arr) {
+ ArrHeader *hdr = (ArrHeader *)((char *)arr - offsetof(ArrHeader, data));
+ return hdr;
+}
+
+static inline size_t arr_len(void *arr) {
+ if (arr == NULL) return 0;
+ return arr_hdr(arr)->len;
+}
+
+static void arr_resv_(void **arr, size_t n, size_t item_sz) {
+ if (*arr == NULL) {
+ ArrHeader *hdr = err_malloc(item_sz * n + sizeof(ArrHeader));
+ hdr->len = 0;
+ hdr->cap = n;
+ *arr = hdr->data;
+ } else {
+ ArrHeader *hdr = arr_hdr(*arr);
+ hdr->cap = n;
+ hdr = realloc(hdr, item_sz * n + sizeof(ArrHeader));
+ if (hdr->len > hdr->cap) hdr->len = hdr->cap;
+ *arr = hdr->data;
}
- arr->len++;
- return (void*)((char*)arr->data + arr->item_sz * (arr->len - 1));
-}
-
-static void *arr_adda(Array *arr, Allocator *a) {
- if (arr->len >= arr->cap) {
- arr_reservea(arr, (arr->cap + 1) * 2, a);
+
+}
+
+static void *arr_add_(void **arr, size_t item_sz) {
+ ArrHeader *hdr;
+ if (*arr == NULL) {
+ arr_resv_(*arr, 10, item_sz);
+ hdr = arr_hdr(*arr);
+ } else {
+ hdr = arr_hdr(*arr);
+ if (hdr->len >= hdr->cap) {
+ arr_resv_(*arr, hdr->len * 2, item_sz);
+ hdr = arr_hdr(*arr);
+ }
}
- arr->len++;
- return (void*)((char*)arr->data + arr->item_sz * (arr->len - 1));
-}
-
-static void arr_clear(Array *arr) {
- free(arr->data);
- arr->len = arr->cap = 0;
- arr->data = NULL;
-}
-
-static void arr_remove_last(Array *arr) {
- /* OPTIM (memory): Shorten array. */
- arr->len--;
-}
-
-static void arr_free(Array *arr) {
- free(arr->data);
+ return &(((char *)hdr->data)[(hdr->len++) * item_sz]);
}
-/* NOTE: this will not work if type is a pointer! */
-#define arr_foreach(arr, type, var) for (type *var = (arr)->data, *var##_foreach_last = arr_last(arr); var; var == var##_foreach_last ? var = NULL : var++)
-#define arr_foreach_reverse(arr, type, var) for (type *var = arr_last(arr); var; var == (arr)->data ? var = NULL : var--)
+#define arr_add(arr) arr_add_((void **)arr, sizeof **arr)
diff --git a/blockarr.c b/blockarr.c
index 38bbf1b..40e2edc 100644
--- a/blockarr.c
+++ b/blockarr.c
@@ -4,19 +4,6 @@ They ensure that pointers to values in the array are not invalidated
when something is added to the array.
*/
-typedef struct {
- void *data;
- size_t n; /* number of things in this block so far */
- void *last; /* last one of them */
-} ArrBlock;
-
-typedef struct {
- size_t item_sz;
- int lg_block_sz;
- /* NOTE: dynamic array tends to over-allocate, so we're using our own */
- Array blocks;
-} BlockArr;
-
/*
Note: the block size must be a power of 2, to use right shifting instead of division
(for optimization)!
diff --git a/eval.c b/eval.c
index ee52f92..337b7e8 100644
--- a/eval.c
+++ b/eval.c
@@ -1,7 +1,3 @@
-typedef struct {
- Allocator allocr;
-} Evaluator;
-
static void evalr_create(Evaluator *ev) {
allocr_create(&ev->allocr);
}
@@ -14,24 +10,6 @@ static inline void *evalr_malloc(Evaluator *ev, size_t bytes) {
return allocr_malloc(&ev->allocr, bytes);
}
-typedef union Value {
- U8 u8;
- U16 u16;
- U32 u32;
- U64 u64;
- I8 i8;
- I16 i16;
- I32 i32;
- I64 i64;
- bool boolv;
- char charv;
- float f32;
- double f64;
- FnExpr *fn;
- void *arr;
- void *ptr;
-} Value;
-
static bool builtin_truthiness(Value *v, BuiltinType b) {
switch (b) {
case BUILTIN_I8: return v->i8 != 0;
diff --git a/identifiers.c b/identifiers.c
index 1ff225c..104894b 100644
--- a/identifiers.c
+++ b/identifiers.c
@@ -1,32 +1,3 @@
-typedef struct {
- struct Block *scope; /* NULL for file scope */
- struct Declaration *decl;
-} IdentDecl;
-
-/*
-The way you search an identifier in a tree is:
-root.children[low part of 1st char].children[high part of 1st char]
-.children[low part of 2nd char]...
-
-*/
-
-#define TREE_NCHILDREN 16
-typedef struct IdentTree {
- /* zero value is an empty trie */
- uint16_t depth;
- unsigned char index_in_parent; /* index of this in .parent.children */
- struct IdentTree *parent;
- struct IdentTree *children[TREE_NCHILDREN];
- Array decls; /* array of declarations of this identifier */
-} IdentTree;
-
-typedef IdentTree *Identifier;
-
-typedef struct {
- BlockArr trees;
- IdentTree *root;
-} Identifiers;
-
#if CHAR_MAX - CHAR_MIN > 255
#error "Currently only systems with 8-bit characters can compile toc."
/* TODO: maybe do a run-time error for large characters? */
@@ -35,7 +6,7 @@ typedef struct {
/* can this character be used in an identifier? */
static int isident(int c) {
if (c >= 'a' && c <= 'z')
- return 1;
+ return 1;
if (c >= 'A' && c <= 'Z')
return 1;
if (c >= '0' && c <= '9')
diff --git a/location.c b/location.c
index 8e68ca3..74b032c 100644
--- a/location.c
+++ b/location.c
@@ -1,10 +1,3 @@
-typedef uint32_t LineNo;
-typedef struct {
- LineNo line;
- char *code;
- const char *filename;
-} Location;
-
static bool location_after(Location a, Location b) { /* a is after b? */
return a.code > b.code;
}
diff --git a/parse.c b/parse.c
index a52ac83..0ead4da 100644
--- a/parse.c
+++ b/parse.c
@@ -1,245 +1,3 @@
-/* TODO: stmt_parse -> parse_stmt, etc. */
-typedef enum {
- TYPE_VOID,
- TYPE_UNKNOWN,
- TYPE_BUILTIN,
- TYPE_FN,
- TYPE_TUPLE,
- TYPE_ARR,
- TYPE_PTR
-} TypeKind;
-
-typedef enum {
- BUILTIN_I8,
- BUILTIN_I16,
- BUILTIN_I32,
- BUILTIN_I64,
- BUILTIN_U8,
- BUILTIN_U16,
- BUILTIN_U32,
- BUILTIN_U64,
- BUILTIN_F32,
- BUILTIN_F64,
- BUILTIN_CHAR,
- BUILTIN_BOOL,
- BUILTIN_TYPE_COUNT
-} BuiltinType;
-
-#define TYPE_FLAG_FLEXIBLE 0x01
-#define TYPE_FLAG_RESOLVED 0x02
-
-typedef struct Type {
- Location where;
- TypeKind kind;
- uint16_t flags;
- union {
- BuiltinType builtin;
- struct {
- Array types; /* [0] = ret_type, [1..] = param_types */
- } fn;
- Array tuple;
- struct {
- struct Type *of;
- union {
- UInteger n; /* this is NOT set by parse_type; it will be handled by types.c */
- struct Expression *n_expr;
- };
- } arr;
- struct {
- struct Type *of;
- } ptr;
- };
-} Type;
-
-#define BLOCK_FLAG_FN 0x01
-
-typedef struct Block {
- uint16_t flags;
- Location start;
- Location end;
- Array stmts;
- struct Block *parent;
- struct Expression *ret_expr; /* the return expression of this block, e.g. {foo(); 3} => 3 NULL for no expression. */
-} Block;
-
-typedef enum {
- EXPR_LITERAL_FLOAT,
- EXPR_LITERAL_INT,
- EXPR_LITERAL_STR,
- EXPR_LITERAL_BOOL,
- EXPR_LITERAL_CHAR,
- EXPR_IDENT, /* variable or constant */
- EXPR_BINARY_OP,
- EXPR_UNARY_OP,
- EXPR_IF,
- EXPR_WHILE,
- EXPR_FN,
- EXPR_CAST,
- EXPR_NEW,
- EXPR_CALL,
- EXPR_BLOCK,
- EXPR_DIRECT
-} ExprKind;
-
-typedef enum {
- UNARY_MINUS,
- UNARY_ADDRESS, /* &x */
- UNARY_DEREF, /* *x */
- UNARY_NOT, /* !x */
- UNARY_DEL
-} UnaryOp;
-
-typedef enum {
- BINARY_SET, /* e.g. x = y */
- BINARY_ADD,
- BINARY_SUB,
- BINARY_MUL,
- BINARY_DIV,
- BINARY_COMMA,
- BINARY_GT,
- BINARY_LT,
- BINARY_GE,
- BINARY_LE,
- BINARY_EQ,
- BINARY_NE,
- BINARY_AT_INDEX /* e.g. x[i] */
-} BinaryOp;
-
-typedef struct {
- Directive which;
- Array args; /* of Argument */
-} DirectExpr;
-
-
-typedef struct {
- struct Expression *fn;
- Array args; /* of Argument; after typing, becomes of Expression */
-} CallExpr;
-
-typedef struct {
- struct Expression *cond; /* NULL = this is an else */
- struct Expression *next_elif; /* next elif/else of this statement */
- Block body;
-} IfExpr;
-
-typedef struct {
- struct Expression *cond;
- Block body;
-} WhileExpr;
-
-typedef struct {
- Array params; /* declarations of the parameters to this function */
- Array ret_decls; /* array of decls, if this has named return values. otherwise, len & data will be 0. */
- Type ret_type;
- Block body;
-} FnExpr; /* an expression such as fn(x: int) int { 2 * x } */
-
-typedef struct {
- Type type;
- struct Expression *expr;
-} CastExpr;
-
-#define EXPR_FLAG_FOUND_TYPE 0x01
-
-typedef struct Expression {
- Location where;
- ExprKind kind;
- uint16_t flags;
- Type type;
- union {
- Floating floatl;
- UInteger intl;
- StrLiteral strl;
- bool booll;
- char charl;
- struct {
- UnaryOp op;
- struct Expression *of;
- } unary;
- struct {
- BinaryOp op;
- struct Expression *lhs;
- struct Expression *rhs;
- } binary;
- CallExpr call;
- DirectExpr direct;
- Identifier ident;
- struct {
- Type type;
- } new;
- struct {
- Type type;
- } del;
- IfExpr if_;
- WhileExpr while_;
- FnExpr fn;
- CastExpr cast;
- Block block;
- };
-} Expression;
-
-typedef struct {
- Location where;
- Identifier name; /* NULL = no name */
- Expression val;
-} Argument;
-
-#define DECL_FLAG_ANNOTATES_TYPE 0x01
-#define DECL_FLAG_CONST 0x02
-#define DECL_FLAG_HAS_EXPR 0x04
-#define DECL_FLAG_FOUND_TYPE 0x08
-#define DECL_FLAG_ERRORED_ABOUT_SELF_REFERENCE 0x10 /* has there been an error about this decl referencing itself? */
-
-/* OPTIM: Instead of using dynamic arrays, do two passes. */
-typedef struct Declaration {
- Location where;
- Array idents;
- Type type;
- uint16_t flags;
- Expression expr;
- union Value *val; /* only for constant decls. set to NULL here, and to actual value by types.c. */
-} Declaration;
-
-typedef enum {
- STMT_DECL,
- STMT_EXPR,
- STMT_RET
-} StatementKind;
-
-#define RET_FLAG_EXPR 0x01
-typedef struct {
- uint16_t flags;
- Expression expr;
-} Return;
-
-#define STMT_FLAG_VOIDED_EXPR 0x01 /* the "4;" in fn () { 4; } is a voided expression, but the "4" in fn () int { 4 } is not */
-typedef struct {
- Location where;
- StatementKind kind;
- unsigned short flags;
- union {
- Declaration decl;
- Expression expr;
- Return ret;
- };
-} Statement;
-
-typedef struct {
- Array stmts;
-} ParsedFile;
-
-typedef struct {
- Tokenizer *tokr;
- Allocator allocr;
- Block *block; /* which block are we in? NULL = file scope */
-} Parser;
-
-typedef enum {
- DECL_END_SEMICOLON,
- DECL_END_RPAREN_COMMA,
- DECL_END_LBRACE_COMMA
-} DeclEndKind;
-
static bool parse_expr(Parser *p, Expression *e, Token *end);
#define PARSE_DECL_ALLOW_CONST_WITH_NO_EXPR 0x01
diff --git a/toc.c b/toc.c
index dc8204d..94e74a8 100644
--- a/toc.c
+++ b/toc.c
@@ -10,28 +10,7 @@
#include <inttypes.h>
#include <stdbool.h>
-typedef int64_t Integer;
-typedef uint64_t UInteger;
-typedef long double Floating; /* OPTIM: Switch to double, but make sure floating-point literals are right */
-
-#define INTEGER_MAX INT64_MAX
-#define UINTEGER_MAX UINT64_MAX
-#define INTEGER_FMT "%"PRId64
-#define UINTEGER_FMT "%"PRIu64
-
-typedef uint8_t U8;
-typedef uint16_t U16;
-typedef uint32_t U32;
-typedef uint64_t U64;
-
-typedef int8_t I8;
-typedef int16_t I16;
-typedef int32_t I32;
-typedef int64_t I64;
-
-typedef float F32;
-typedef double F64;
-
+#include "types.h"
#include "location.c"
#include "err.c"
diff --git a/tokenizer.c b/tokenizer.c
index 520edd0..3393e0d 100644
--- a/tokenizer.c
+++ b/tokenizer.c
@@ -1,71 +1,3 @@
-typedef enum {
- TOKEN_KW,
- TOKEN_IDENT,
- TOKEN_DIRECT,
- TOKEN_NUM_LITERAL,
- TOKEN_CHAR_LITERAL,
- TOKEN_STR_LITERAL,
- TOKEN_EOF
-} TokenKind;
-
-typedef enum {
- DIRECT_C,
- DIRECT_COUNT
-} Directive;
-
-typedef enum {
- KW_SEMICOLON,
- KW_COLON,
- KW_AT,
- KW_COMMA,
- KW_LPAREN,
- KW_RPAREN,
- KW_LBRACE,
- KW_RBRACE,
- KW_LSQUARE,
- KW_RSQUARE,
- KW_EQEQ,
- KW_NE,
- KW_LT,
- KW_LE,
- KW_GT,
- KW_GE,
- KW_PLUS,
- KW_MINUS,
- KW_ASTERISK,
- KW_EXCLAMATION,
- KW_AMPERSAND,
- KW_SLASH,
- KW_EQ,
- KW_LAST_SYMBOL = KW_EQ, /* last one entirely consisting of symbols */
- KW_IF,
- KW_ELIF,
- KW_ELSE,
- KW_WHILE,
- KW_RETURN,
- KW_FN,
- KW_AS,
- KW_NEW,
- KW_DEL,
- KW_INT,
- KW_I8,
- KW_I16,
- KW_I32,
- KW_I64,
- KW_U8,
- KW_U16,
- KW_U32,
- KW_U64,
- KW_FLOAT,
- KW_F32,
- KW_F64,
- KW_CHAR,
- KW_BOOL,
- KW_TRUE,
- KW_FALSE,
- KW_COUNT
-} Keyword;
-
static const char *keywords[KW_COUNT] =
{";", ":", "@", ",", "(", ")", "{", "}", "[", "]", "==", "!=", "<", "<=", ">", ">=",
"+", "-", "*", "!", "&", "/",
@@ -120,48 +52,6 @@ static Directive tokenize_direct(char **s) {
return DIRECT_COUNT;
}
-typedef enum {
- NUM_LITERAL_INT,
- NUM_LITERAL_FLOAT
-} NumLiteralKind;
-
-typedef struct {
- NumLiteralKind kind;
- union {
- UInteger intval;
- Floating floatval;
- };
-} NumLiteral;
-
-typedef struct {
- char *str;
- size_t len;
-} StrLiteral;
-
-/* NOTE: Location is typedef'd in util/err.c */
-typedef struct {
- TokenKind kind;
- Location where;
- union {
- Keyword kw;
- Directive direct;
- Identifier ident;
- NumLiteral num;
- char chr;
- StrLiteral str;
- };
-} Token;
-
-typedef struct {
- Allocator allocr;
- Array tokens;
- char *s; /* string being parsed */
- const char *filename;
- LineNo line;
- Token *token; /* token currently being processed */
- Identifiers *idents;
-} Tokenizer;
-
static inline bool token_is_kw(Token *t, Keyword kw) {
return t->kind == TOKEN_KW && t->kw == kw;
}
diff --git a/types.h b/types.h
new file mode 100644
index 0000000..5960e27
--- /dev/null
+++ b/types.h
@@ -0,0 +1,471 @@
+typedef int64_t Integer;
+typedef uint64_t UInteger;
+typedef long double Floating; /* OPTIM: Switch to double, but make sure floating-point literals are right */
+
+#define INTEGER_MAX INT64_MAX
+#define UINTEGER_MAX UINT64_MAX
+#define INTEGER_FMT "%"PRId64
+#define UINTEGER_FMT "%"PRIu64
+
+typedef uint8_t U8;
+typedef uint16_t U16;
+typedef uint32_t U32;
+typedef uint64_t U64;
+
+typedef int8_t I8;
+typedef int16_t I16;
+typedef int32_t I32;
+typedef int64_t I64;
+
+typedef float F32;
+typedef double F64;
+
+typedef uint32_t LineNo;
+typedef struct {
+ LineNo line;
+ char *code;
+ const char *filename;
+} Location;
+
+typedef struct Page {
+ struct Page *next;
+ size_t used;
+ max_align_t data[];
+} Page;
+
+typedef struct DynPage {
+ struct DynPage **self;
+ max_align_t data[];
+} DynPage;
+
+typedef struct {
+ Page *first;
+ Page *last;
+ DynPage **dyn;
+ size_t dyn_len;
+ size_t dyn_cap;
+} Allocator;
+
+typedef struct {
+ void *data;
+ size_t len;
+ size_t cap;
+ size_t item_sz;
+} Array;
+
+typedef struct {
+ void *data;
+ size_t n; /* number of things in this block so far */
+ void *last; /* last one of them */
+} ArrBlock;
+
+typedef struct {
+ size_t item_sz;
+ int lg_block_sz;
+ /* NOTE: dynamic array tends to over-allocate, so we're using our own */
+ Array blocks;
+} BlockArr;
+
+typedef struct {
+ struct Block *scope; /* NULL for file scope */
+ struct Declaration *decl;
+} IdentDecl;
+
+/*
+The way you search an identifier in a tree is:
+root.children[low part of 1st char].children[high part of 1st char]
+.children[low part of 2nd char]...
+
+*/
+
+#define TREE_NCHILDREN 16
+typedef struct IdentTree {
+ /* zero value is an empty trie */
+ uint16_t depth;
+ unsigned char index_in_parent; /* index of this in .parent.children */
+ struct IdentTree *parent;
+ struct IdentTree *children[TREE_NCHILDREN];
+ Array decls; /* array of declarations of this identifier */
+} IdentTree;
+
+typedef IdentTree *Identifier;
+
+typedef struct {
+ BlockArr trees;
+ IdentTree *root;
+} Identifiers;
+
+typedef enum {
+ TOKEN_KW,
+ TOKEN_IDENT,
+ TOKEN_DIRECT,
+ TOKEN_NUM_LITERAL,
+ TOKEN_CHAR_LITERAL,
+ TOKEN_STR_LITERAL,
+ TOKEN_EOF
+} TokenKind;
+
+typedef enum {
+ DIRECT_C,
+ DIRECT_COUNT
+} Directive;
+
+typedef enum {
+ KW_SEMICOLON,
+ KW_COLON,
+ KW_AT,
+ KW_COMMA,
+ KW_LPAREN,
+ KW_RPAREN,
+ KW_LBRACE,
+ KW_RBRACE,
+ KW_LSQUARE,
+ KW_RSQUARE,
+ KW_EQEQ,
+ KW_NE,
+ KW_LT,
+ KW_LE,
+ KW_GT,
+ KW_GE,
+ KW_PLUS,
+ KW_MINUS,
+ KW_ASTERISK,
+ KW_EXCLAMATION,
+ KW_AMPERSAND,
+ KW_SLASH,
+ KW_EQ,
+ KW_LAST_SYMBOL = KW_EQ, /* last one entirely consisting of symbols */
+ KW_IF,
+ KW_ELIF,
+ KW_ELSE,
+ KW_WHILE,
+ KW_RETURN,
+ KW_FN,
+ KW_AS,
+ KW_NEW,
+ KW_DEL,
+ KW_INT,
+ KW_I8,
+ KW_I16,
+ KW_I32,
+ KW_I64,
+ KW_U8,
+ KW_U16,
+ KW_U32,
+ KW_U64,
+ KW_FLOAT,
+ KW_F32,
+ KW_F64,
+ KW_CHAR,
+ KW_BOOL,
+ KW_TRUE,
+ KW_FALSE,
+ KW_COUNT
+} Keyword;
+
+
+typedef enum {
+ NUM_LITERAL_INT,
+ NUM_LITERAL_FLOAT
+} NumLiteralKind;
+
+typedef struct {
+ NumLiteralKind kind;
+ union {
+ UInteger intval;
+ Floating floatval;
+ };
+} NumLiteral;
+
+typedef struct {
+ char *str;
+ size_t len;
+} StrLiteral;
+
+/* NOTE: Location is typedef'd in util/err.c */
+typedef struct {
+ TokenKind kind;
+ Location where;
+ union {
+ Keyword kw;
+ Directive direct;
+ Identifier ident;
+ NumLiteral num;
+ char chr;
+ StrLiteral str;
+ };
+} Token;
+
+typedef struct {
+ Allocator allocr;
+ Array tokens;
+ char *s; /* string being parsed */
+ const char *filename;
+ LineNo line;
+ Token *token; /* token currently being processed */
+ Identifiers *idents;
+} Tokenizer;
+
+
+typedef enum {
+ TYPE_VOID,
+ TYPE_UNKNOWN,
+ TYPE_BUILTIN,
+ TYPE_FN,
+ TYPE_TUPLE,
+ TYPE_ARR,
+ TYPE_PTR
+} TypeKind;
+
+typedef enum {
+ BUILTIN_I8,
+ BUILTIN_I16,
+ BUILTIN_I32,
+ BUILTIN_I64,
+ BUILTIN_U8,
+ BUILTIN_U16,
+ BUILTIN_U32,
+ BUILTIN_U64,
+ BUILTIN_F32,
+ BUILTIN_F64,
+ BUILTIN_CHAR,
+ BUILTIN_BOOL,
+ BUILTIN_TYPE_COUNT
+} BuiltinType;
+
+#define TYPE_FLAG_FLEXIBLE 0x01
+#define TYPE_FLAG_RESOLVED 0x02
+
+typedef struct Type {
+ Location where;
+ TypeKind kind;
+ uint16_t flags;
+ union {
+ BuiltinType builtin;
+ struct {
+ Array types; /* [0] = ret_type, [1..] = param_types */
+ } fn;
+ Array tuple;
+ struct {
+ struct Type *of;
+ union {
+ UInteger n; /* this is NOT set by parse_type; it will be handled by types.c */
+ struct Expression *n_expr;
+ };
+ } arr;
+ struct {
+ struct Type *of;
+ } ptr;
+ };
+} Type;
+
+#define BLOCK_FLAG_FN 0x01
+
+typedef struct Block {
+ uint16_t flags;
+ Location start;
+ Location end;
+ Array stmts;
+ struct Block *parent;
+ struct Expression *ret_expr; /* the return expression of this block, e.g. {foo(); 3} => 3 NULL for no expression. */
+} Block;
+
+typedef enum {
+ EXPR_LITERAL_FLOAT,
+ EXPR_LITERAL_INT,
+ EXPR_LITERAL_STR,
+ EXPR_LITERAL_BOOL,
+ EXPR_LITERAL_CHAR,
+ EXPR_IDENT, /* variable or constant */
+ EXPR_BINARY_OP,
+ EXPR_UNARY_OP,
+ EXPR_IF,
+ EXPR_WHILE,
+ EXPR_FN,
+ EXPR_CAST,
+ EXPR_NEW,
+ EXPR_CALL,
+ EXPR_BLOCK,
+ EXPR_DIRECT
+} ExprKind;
+
+typedef enum {
+ UNARY_MINUS,
+ UNARY_ADDRESS, /* &x */
+ UNARY_DEREF, /* *x */
+ UNARY_NOT, /* !x */
+ UNARY_DEL
+} UnaryOp;
+
+typedef enum {
+ BINARY_SET, /* e.g. x = y */
+ BINARY_ADD,
+ BINARY_SUB,
+ BINARY_MUL,
+ BINARY_DIV,
+ BINARY_COMMA,
+ BINARY_GT,
+ BINARY_LT,
+ BINARY_GE,
+ BINARY_LE,
+ BINARY_EQ,
+ BINARY_NE,
+ BINARY_AT_INDEX /* e.g. x[i] */
+} BinaryOp;
+
+typedef struct {
+ Directive which;
+ Array args; /* of Argument */
+} DirectExpr;
+
+
+typedef struct {
+ struct Expression *fn;
+ Array args; /* of Argument; after typing, becomes of Expression */
+} CallExpr;
+
+typedef struct {
+ struct Expression *cond; /* NULL = this is an else */
+ struct Expression *next_elif; /* next elif/else of this statement */
+ Block body;
+} IfExpr;
+
+typedef struct {
+ struct Expression *cond;
+ Block body;
+} WhileExpr;
+
+typedef struct {
+ Array params; /* declarations of the parameters to this function */
+ Array ret_decls; /* array of decls, if this has named return values. otherwise, len & data will be 0. */
+ Type ret_type;
+ Block body;
+} FnExpr; /* an expression such as fn(x: int) int { 2 * x } */
+
+typedef struct {
+ Type type;
+ struct Expression *expr;
+} CastExpr;
+
+#define EXPR_FLAG_FOUND_TYPE 0x01
+
+typedef struct Expression {
+ Location where;
+ ExprKind kind;
+ uint16_t flags;
+ Type type;
+ union {
+ Floating floatl;
+ UInteger intl;
+ StrLiteral strl;
+ bool booll;
+ char charl;
+ struct {
+ UnaryOp op;
+ struct Expression *of;
+ } unary;
+ struct {
+ BinaryOp op;
+ struct Expression *lhs;
+ struct Expression *rhs;
+ } binary;
+ CallExpr call;
+ DirectExpr direct;
+ Identifier ident;
+ struct {
+ Type type;
+ } new;
+ struct {
+ Type type;
+ } del;
+ IfExpr if_;
+ WhileExpr while_;
+ FnExpr fn;
+ CastExpr cast;
+ Block block;
+ };
+} Expression;
+
+typedef struct {
+ Location where;
+ Identifier name; /* NULL = no name */
+ Expression val;
+} Argument;
+
+#define DECL_FLAG_ANNOTATES_TYPE 0x01
+#define DECL_FLAG_CONST 0x02
+#define DECL_FLAG_HAS_EXPR 0x04
+#define DECL_FLAG_FOUND_TYPE 0x08
+#define DECL_FLAG_ERRORED_ABOUT_SELF_REFERENCE 0x10 /* has there been an error about this decl referencing itself? */
+
+/* OPTIM: Instead of using dynamic arrays, do two passes. */
+typedef struct Declaration {
+ Location where;
+ Array idents;
+ Type type;
+ uint16_t flags;
+ Expression expr;
+ union Value *val; /* only for constant decls. set to NULL here, and to actual value by types.c. */
+} Declaration;
+
+typedef enum {
+ STMT_DECL,
+ STMT_EXPR,
+ STMT_RET
+} StatementKind;
+
+#define RET_FLAG_EXPR 0x01
+typedef struct {
+ uint16_t flags;
+ Expression expr;
+} Return;
+
+#define STMT_FLAG_VOIDED_EXPR 0x01 /* the "4;" in fn () { 4; } is a voided expression, but the "4" in fn () int { 4 } is not */
+typedef struct {
+ Location where;
+ StatementKind kind;
+ unsigned short flags;
+ union {
+ Declaration decl;
+ Expression expr;
+ Return ret;
+ };
+} Statement;
+
+typedef struct {
+ Array stmts;
+} ParsedFile;
+
+typedef struct {
+ Tokenizer *tokr;
+ Allocator allocr;
+ Block *block; /* which block are we in? NULL = file scope */
+} Parser;
+
+typedef enum {
+ DECL_END_SEMICOLON,
+ DECL_END_RPAREN_COMMA,
+ DECL_END_LBRACE_COMMA
+} DeclEndKind;
+
+typedef struct {
+ Allocator allocr;
+} Evaluator;
+
+typedef union Value {
+ U8 u8;
+ U16 u16;
+ U32 u32;
+ U64 u64;
+ I8 i8;
+ I16 i16;
+ I32 i32;
+ I64 i64;
+ bool boolv;
+ char charv;
+ float f32;
+ double f64;
+ FnExpr *fn;
+ void *arr;
+ void *ptr;
+} Value;