diff options
-rw-r--r-- | abbrevs.txt | 1 | ||||
-rwxr-xr-x | build.sh | 10 | ||||
-rw-r--r-- | cgen.c | 16 | ||||
-rw-r--r-- | eval.c | 4 | ||||
-rw-r--r-- | main.c | 1 | ||||
-rw-r--r-- | out.c | 45 | ||||
-rw-r--r-- | parse.c | 33 | ||||
-rw-r--r-- | test.toc | 37 | ||||
-rw-r--r-- | tokenizer.c | 4 | ||||
-rw-r--r-- | types.c | 90 | ||||
-rw-r--r-- | types.h | 28 |
11 files changed, 175 insertions, 94 deletions
diff --git a/abbrevs.txt b/abbrevs.txt index d907681..49d29ce 100644 --- a/abbrevs.txt +++ b/abbrevs.txt @@ -11,6 +11,7 @@ expr - expression fn - function ident - identifier kw - keyword +mut - mutable num - number op - operator param - parameter @@ -1,5 +1,5 @@ -#!/bin/bash -if [[ $CC == "" ]]; then +#!/bin/sh +if [ "$CC" = "" ]; then CC=gcc fi @@ -12,10 +12,10 @@ fi ADDITIONAL_FLAGS='-Wno-unused-function' -if [[ $CC == "clang" ]]; then - WARNINGS='-Wall -Wextra -Wpedantic -Wshadow -Wimplicit-fallthrough -Wno-unused-parameter' +if [ "$CC" = "clang" ]; then + WARNINGS='-Wall -Wextra -Wpedantic -Wshadow -Wconversion -Wimplicit-fallthrough -Wno-unused-parameter' else - WARNINGS='-Wall -Wextra -Wpedantic -Wshadow -Wno-pointer-to-int-cast -Wno-unused-parameter' + WARNINGS='-Wall -Wextra -Wpedantic -Wshadow -Wconversion -Wno-pointer-to-int-cast -Wno-unused-parameter' fi DEBUG_FLAGS="-O0 -g3 $WARNINGS -std=c11 -DTOC_DEBUG" @@ -1,13 +1,3 @@ -typedef struct { - FILE *outc; - unsigned long ident_counter; - ParsedFile *file; - Block *block; - FnExpr *fn; /* which function are we in? (NULL for none) - not used during decls */ - Evaluator *evalr; - Identifier main_ident; -} CGenerator; - static bool cgen_stmt(CGenerator *g, Statement *s); static bool cgen_block(CGenerator *g, Block *b); static bool cgen_expr(CGenerator *g, Expression *e); @@ -89,8 +79,8 @@ static void cgen_ident(CGenerator *g, Identifier i) { } } -static void cgen_ident_id(CGenerator *g, unsigned long id) { - cgen_write(g, "a%lu_", id); +static void cgen_ident_id(CGenerator *g, IdentID id) { + cgen_write(g, "a%lu_", (unsigned long)id); } static bool cgen_type_post(CGenerator *g, Type *t, Location where); @@ -522,7 +512,7 @@ static bool cgen_decl(CGenerator *g, Declaration *d) { cgen_write(g, "{"); cgen_nl(g); if (!cgen_type_pre(g, &d->expr.type, d->expr.where)) return false; - cgen_write(g, "expr__"); + cgen_write(g, " expr__"); if (!cgen_type_post(g, &d->expr.type, d->expr.where)) return false; cgen_write(g, "; "); if (!cgen_set(g, NULL, "expr__", &d->expr, NULL)) @@ -436,7 +436,7 @@ static bool eval_expr(Evaluator *ev, Expression *e, Value *v) { /* WARNING: macros ahead */ #define eval_unary_op_one(low, up, op) \ case BUILTIN_##up: \ - v->low = op of.low; break + v->low = (up)(op of.low); break #define eval_unary_op_nums(builtin, op) \ eval_unary_op_one(i8, I8, op); \ eval_unary_op_one(i16, I16, op); \ @@ -457,7 +457,7 @@ static bool eval_expr(Evaluator *ev, Expression *e, Value *v) { #define eval_binary_op_one(low, up, op) \ case BUILTIN_##up: \ - v->low = lhs.low op rhs.low; break + v->low = (up)(lhs.low op rhs.low); break #define eval_binary_op_nums(builtin, op) \ eval_binary_op_one(i8, I8, op); \ @@ -3,6 +3,7 @@ TODO: re-do cgen arrs are pointers make sure initializers for global variables are compile-time constants +allow, e.g.: x := "foo"; x[0] = 'g'; any odd number of "s for a string */ #include "toc.c" @@ -16,8 +16,8 @@ typedef unsigned char bool; /* declarations */ -void puti(i64 i); -void asdf(i64 i, i64( (*ret__)[3])); +i64 puti(i64 i); +void dbl(i64((* x)[3])); void main__(); /* code */ int main() { @@ -25,43 +25,20 @@ int main() { return 0; } -void puti(i64 i) { +i64 puti(i64 i) { printf("%ld\n", i); } -void asdf(i64 i, i64( (*ret__)[3])) { -i64( ret[3]) = {0}; -i64( asdf[3]) = {0}; -(ret[0]) = (0*i);; -(ret[1]) = (1*i);; -(ret[2]) = (2*i);; -{ -size_t i;i64(*arr__in) = asdf; i64(*arr__out) = ret; -for (i = 0; i < 3; i++) arr__out[i] = arr__in[i]; -}; -{ -size_t i;i64(*arr__in) = *ret__; i64(*arr__out) = asdf; -for (i = 0; i < 3; i++) arr__out[i] = arr__in[i]; -}return; +void dbl(i64((* x)[3])) { +((*x)[0]) = (((*x)[0])*2);; +((*x)[1]) = (((*x)[1])*2);; +((*x)[2]) = (((*x)[2])*2);; } void main__() { -i64(* x); { -i64(*expr__); expr__ = ((i64(*))calloc(1, sizeof(i64)));x = expr__;} -(*x) = 17;; -if (((*x)==0)) { -(*x) = ((1+2)+(3-(5/62)));; -} else { -(*x) = ((4+5)+6);; -}; -(puti((*x))); -(free(x)); -void (* fptr)(i64, i64((*)[3])); { -void (*expr__)(i64, i64((*)[3])); expr__ = asdf;fptr = expr__;} +i64( a[3]) = {0}; +(a[0]) = 1;; +(dbl((&a))); +(puti((a[0]))); } -i64 foo = 5; -char( bar[5]) = "\x48\x65\x6c\x6c\x6f"; -i64 a = 123; i64 b = 123; -char x = ((char)97); -i64 sadkfj = (-1293812); @@ -3,6 +3,30 @@ static bool parse_expr(Parser *p, Expression *e, Token *end); #define PARSE_DECL_ALLOW_CONST_WITH_NO_EXPR 0x01 static bool parse_decl(Parser *p, Declaration *d, DeclEndKind ends_with, uint16_t flags); +static const char *expr_kind_to_str(ExprKind k) { + switch (k) { + case EXPR_LITERAL_FLOAT: return "float literal"; + case EXPR_LITERAL_INT: return "integer literal"; + case EXPR_LITERAL_STR: return "string literal"; + case EXPR_LITERAL_BOOL: return "boolean literal"; + case EXPR_LITERAL_CHAR: return "character literal"; + case EXPR_IF: return "if expression"; + case EXPR_WHILE: return "while expression"; + case EXPR_CALL: return "function call"; + case EXPR_DIRECT: return "directive"; + case EXPR_NEW: return "new expression"; + case EXPR_CAST: return "cast expression"; + case EXPR_UNARY_OP: return "unary operator"; + case EXPR_BINARY_OP: return "binary operator"; + case EXPR_FN: return "function expression"; + case EXPR_TUPLE: return "tuple"; + case EXPR_BLOCK: return "block"; + case EXPR_IDENT: return "identifier"; + } + assert(0); + return ""; +} + static const char *unary_op_to_str(UnaryOp u) { switch (u) { case UNARY_MINUS: return "-"; @@ -459,7 +483,8 @@ static bool parse_block(Parser *p, Block *b) { } static bool is_decl(Tokenizer *t); - +static inline bool ends_decl(Token *t, DeclEndKind ends_with); + static bool parse_decl_list(Parser *p, Declaration **decls, DeclEndKind decl_end) { Tokenizer *t = p->tokr; bool ret = true; @@ -472,8 +497,8 @@ static bool parse_decl_list(Parser *p, Declaration **decls, DeclEndKind decl_end Declaration *decl = parser_arr_add(p, decls); if (!parse_decl(p, decl, decl_end, PARSE_DECL_ALLOW_CONST_WITH_NO_EXPR)) { ret = false; - /* skip to end of param list */ - while (t->token->kind != TOKEN_EOF && !token_is_kw(t->token, KW_RPAREN)) + /* skip to end of list */ + while (t->token->kind != TOKEN_EOF && !ends_decl(t->token, decl_end)) t->token++; break; } @@ -499,6 +524,8 @@ static bool parse_fn_expr(Parser *p, FnExpr *f) { } else { if (!parse_decl_list(p, &f->params, DECL_END_RPAREN_COMMA)) return false; + arr_foreach(f->params, Declaration, pdecl) + pdecl->flags |= DECL_FLAG_PARAM; } if (t->token->kind == TOKEN_EOF) { @@ -1,33 +1,18 @@ -puti @= fn(i: int) { +puti @= fn(i: int) int { #C("printf(\"%ld\\n\", i)"); + i }; -asdf @= fn(i: int) [3]int { - ret : [3]int; - asdf : [3]int; - ret[0] = 0*i; - ret[1] = 1*i; - ret[2] = 2*i; - asdf = ret; - return asdf; +dbl @= fn(x: &[3]int) { + (*x)[0] = (*x)[0] * 2; + (*x)[1] = (*x)[1] * 2; + (*x)[2] = (*x)[2] * 2; }; main @= fn() { - x := new int; - *x = 17; - if *x == 0 { - *x = 1+2+3-5/62; - } else { - *x = 4+5+6; - } - puti(*x); -del x; - fptr := asdf; -}; - -foo := 5; -bar := "Hello"; -a, b := 123; -x := 'a'; -sadkfj := -1293812; + a : [3]int; + a[0] = 1; + dbl(&a); + puti(a[0]); +};
\ No newline at end of file diff --git a/tokenizer.c b/tokenizer.c index a665ca5..1a4f5dd 100644 --- a/tokenizer.c +++ b/tokenizer.c @@ -374,7 +374,7 @@ static bool tokenize_string(Tokenizer *t, char *str) { switch (n.kind) { case NUM_LITERAL_INT: if (n.intval > UINTEGER_MAX / (UInteger)base || - n.intval * (UInteger)base > ULLONG_MAX - (UInteger)digit) { + n.intval * (UInteger)base > UINT_MAX - (UInteger)digit) { /* too big! */ tokenization_err(t, "Number too big to fit in a numeric literal."); goto err; @@ -464,7 +464,7 @@ static bool tokenize_string(Tokenizer *t, char *str) { } *strptr = 0; token->kind = TOKEN_STR_LITERAL; - token->str.len = strptr - strlit; + token->str.len = (size_t)(strptr - strlit); token->str.str = strlit; tokr_nextchar(t); /* move past closing " */ continue; @@ -80,7 +80,61 @@ static bool type_must_eq(Location where, Type *expected, Type *got) { return true; } -/* sometimes prints an error and returns false if the given expression is not an l-value */ + +/* +this expression, which is an array, must be mutable (otherwise print an error, +return false)! +*/ +static bool expr_arr_must_mut(Expression *e) { + switch (e->kind) { + case EXPR_IDENT: { + IdentDecl *idecl = ident_decl(e->ident); + Declaration *d = idecl->decl; + if (d->flags & DECL_FLAG_CONST) { + err_print(e->where, "Cannot modify a constant array."); + return false; + } + if (d->flags & DECL_FLAG_PARAM) { + err_print(e->where, "Parameters are immutable."); + return false; + } + } return true; + case EXPR_CAST: + case EXPR_CALL: + case EXPR_NEW: + case EXPR_UNARY_OP: + return true; + case EXPR_WHILE: + assert(e->while_.body.ret_expr); + return expr_arr_must_mut(e->while_.body.ret_expr); + case EXPR_IF: + for (IfExpr *i = &e->if_; i; i->next_elif ? i = &i->next_elif->if_ : (i = NULL)) { + assert(i->body.ret_expr); + if (!expr_arr_must_mut(i->body.ret_expr)) + return false; + } + return true; + case EXPR_BLOCK: + assert(e->block.ret_expr); + return expr_arr_must_mut(e->block.ret_expr); + case EXPR_LITERAL_STR: + err_print(e->where, "String constants are immutable."); + return false; + case EXPR_LITERAL_BOOL: + case EXPR_FN: + case EXPR_TUPLE: + case EXPR_LITERAL_FLOAT: + case EXPR_LITERAL_CHAR: + case EXPR_LITERAL_INT: + case EXPR_BINARY_OP: + case EXPR_DIRECT: + break; + } + assert(0); + return false; +} + +/* prints an error and returns false if the given expression is not an l-value */ static bool expr_must_lval(Expression *e) { /* NOTE: make sure you update eval when you change this */ switch (e->kind) { @@ -94,6 +148,11 @@ static bool expr_must_lval(Expression *e) { info_print(d->where, "%s was declared here.", istr); return false; } + if (d->flags & DECL_FLAG_PARAM) { + char *istr = ident_to_str(e->ident); + err_print(e->where, "You cannot modify or take the address of a parameter (%s).", istr); + return false; + } return true; } @@ -102,7 +161,7 @@ static bool expr_must_lval(Expression *e) { break; case EXPR_BINARY_OP: switch (e->binary.op) { - case BINARY_AT_INDEX: return true; + case BINARY_AT_INDEX: return expr_arr_must_mut(e->binary.lhs); default: break; } break; @@ -114,9 +173,24 @@ static bool expr_must_lval(Expression *e) { } return true; } break; - default: - break; + case EXPR_CAST: + case EXPR_NEW: + case EXPR_FN: + case EXPR_LITERAL_FLOAT: + case EXPR_LITERAL_CHAR: + case EXPR_LITERAL_STR: + case EXPR_LITERAL_INT: + case EXPR_LITERAL_BOOL: + case EXPR_IF: + case EXPR_WHILE: + case EXPR_CALL: + case EXPR_DIRECT: + case EXPR_BLOCK: { + err_print(e->where, "Cannot use %s as l-value.", expr_kind_to_str(e->kind)); + return false; } + } + assert(0); return false; } @@ -622,11 +696,16 @@ static bool types_expr(Typer *tr, Expression *e) { if (!types_expr(tr, &arg->val)) return false; } + if (f->type.kind == TYPE_UNKNOWN) { + e->type.kind = TYPE_UNKNOWN; + return true; + } if (f->type.kind != TYPE_FN) { char *type = type_to_str(&f->type); err_print(e->where, "Calling non-function (type %s).", type); return false; } + Type *ret_type = f->type.fn.types; Type *param_types = ret_type + 1; Argument *args = c->args; @@ -831,7 +910,6 @@ static bool types_expr(Typer *tr, Expression *e) { switch (e->binary.op) { case BINARY_SET: if (!expr_must_lval(e->binary.lhs)) { - err_print(e->where, "You can only assign to an lvalue."); /* FEATURE: better err */ return false; } /* fallthrough */ @@ -988,7 +1066,7 @@ static bool types_decl(Typer *tr, Declaration *d) { goto ret; } d->type = d->expr.type; - d->type.flags &= ~TYPE_FLAG_FLEXIBLE; /* x := 5; => x is not flexible */ + d->type.flags &= (uint16_t)~(uint16_t)TYPE_FLAG_FLEXIBLE; /* x := 5; => x is not flexible */ } if (d->flags & DECL_FLAG_CONST) { if (!(d->flags & DECL_FLAG_FOUND_VAL)) { @@ -25,6 +25,8 @@ typedef int64_t I64; typedef float F32; typedef double F64; +typedef U32 IdentID; /* identifier ID for cgen (anonymous variables) */ + typedef uint32_t LineNo; typedef struct { LineNo line; @@ -342,11 +344,17 @@ typedef struct { typedef struct { struct Expression *cond; /* NULL = this is an else */ struct Expression *next_elif; /* next elif/else of this statement */ + struct { + IdentID id; + } c; Block body; } IfExpr; typedef struct { struct Expression *cond; + struct { + IdentID id; + } c; Block body; } WhileExpr; @@ -358,7 +366,7 @@ typedef struct FnExpr { struct { /* if name = NULL, this is an anonymous function, and id will be the ID of the fn. */ Identifier name; - unsigned long id; + IdentID id; } c; } FnExpr; /* an expression such as fn(x: int) int { 2 * x } */ @@ -370,12 +378,13 @@ typedef struct { #define EXPR_FLAG_FOUND_TYPE 0x01 typedef struct Expression { + Type type; Location where; ExprKind kind; uint16_t flags; - Type type; union { Floating floatl; + /* Floating floatl; */ UInteger intl; StrLiteral strl; bool booll; @@ -402,7 +411,10 @@ typedef struct Expression { WhileExpr while_; FnExpr fn; CastExpr cast; - Block block; + struct { + Block block; + IdentID block_ret_id; + }; struct Expression *tuple; }; } Expression; @@ -419,6 +431,7 @@ typedef struct Argument { #define DECL_FLAG_FOUND_TYPE 0x08 #define DECL_FLAG_ERRORED_ABOUT_SELF_REFERENCE 0x10 /* has there been an error about this decl referencing itself? */ #define DECL_FLAG_FOUND_VAL 0x20 +#define DECL_FLAG_PARAM 0x40 /* is this a parameter declaration? (needed because parameters are immutable) */ /* OPTIM: Instead of using dynamic arrays, do two passes. */ typedef struct Declaration { @@ -483,3 +496,12 @@ typedef struct Typer { Type ret_type; /* the return type of the function we're currently parsing. */ } Typer; +typedef struct { + FILE *outc; + IdentID ident_counter; + ParsedFile *file; + Block *block; + FnExpr *fn; /* which function are we in? (NULL for none) - not used during decls */ + Evaluator *evalr; + Identifier main_ident; +} CGenerator; |