// Lexer::interns::map::allocator - array allocator, resizing // Lexer::tokens - array allocator, resizing // // Parser::ast_arena - arena for asts // Lexer::interns::string_allocator - arena for interns // Intern_String keyword_struct; Intern_String keyword_union; Intern_String keyword_return; Intern_String keyword_if; Intern_String keyword_else; Intern_String keyword_for; Intern_String keyword_cast; Intern_String keyword_enum; Intern_String intern_void; Intern_String intern_int; Intern_String intern_str; Intern_String intern_unsigned; struct Ast_Package; struct Sym; struct Parse_Ctx:Lexer{ Allocator *perm; // Stores: AST, tokens, interns Allocator *heap; U64 unique_ids; Map type_map; Ast_Package *resolving_package; Map resolved; Map syms; S32 scope; Array local_syms; Token empty_token; S64 indent; String_Builder gen; Intern_String intern(String string){ return intern_string(&interns, string); } void init(Allocator *perm_allocator, Allocator *heap_allocator){ perm = perm_allocator; heap = heap_allocator; gen = {perm}; resolved = {heap}; syms = {heap}; type_map = {heap}; local_syms = {heap}; lex_init(perm, heap, this); keyword_struct= intern("struct"_s); keyword_union = intern("union"_s); keyword_cast = intern("cast"_s); keyword_return = intern("return"_s); keyword_if = intern("if"_s); keyword_else = intern("else"_s); keyword_for = intern("for"_s); keyword_enum = intern_string(&interns, "enum"_s); interns.first_keyword = keyword_struct.str; interns.last_keyword = keyword_enum.str; intern_void = intern_string(&interns, "void"_s); intern_int = intern_string(&interns, "int"_s); intern_str = intern_string(&interns, "String"_s); intern_unsigned = intern_string(&interns, "unsigned"_s); } }; thread_local Parse_Ctx *pctx; //----------------------------------------------------------------------------- // AST //----------------------------------------------------------------------------- enum Ast_Kind: U32{ AST_NONE, AST_PACKAGE, AST_STR, AST_INT, AST_CAST, AST_IDENT, AST_INDEX, AST_UNARY, AST_BINARY, AST_CALL_ITEM, AST_CALL, AST_POINTER, AST_ARRAY, AST_INIT, AST_IF, AST_IF_NODE, AST_RETURN, AST_BLOCK, AST_LAMBDA, AST_LAMBDA_ARG, AST_STRUCT, AST_CONST, AST_VAR, }; typedef U32 Ast_Flag; enum{ AST_EXPR = 1, AST_STMT = 2, AST_BINDING = 4, AST_AGGREGATE = 8, AST_ATOM = 16, AST_ITEM_INCLUDED = 32, }; struct Ast{ U64 id; Token *pos; Ast_Kind kind; Ast *parent; Ast_Flag flags; }; struct Ast_Resolved_Type; struct Ast_Expr:Ast{}; struct Ast_Atom: Ast_Expr{ union{ Intern_String intern_val; U64 int_val; }; }; struct Ast_Call_Item: Ast_Expr{ Ast_Atom *name; // index | name Ast_Expr *index; Ast_Expr *item; }; struct Ast_Call: Ast_Expr{ Ast_Resolved_Type *type; // @todo: to map Ast_Expr *name; Array exprs; }; struct Ast_Unary: Ast_Expr{ Token_Kind op; Ast_Expr *expr; }; struct Ast_Cast: Ast_Expr{ Ast_Expr *expr; Ast_Expr *typespec; }; struct Ast_Index: Ast_Expr{ Ast_Expr *expr; Ast_Expr *index; }; struct Ast_Binary: Ast_Expr{ Token_Kind op; Ast_Expr *left; Ast_Expr *right; }; struct Ast_Block : Ast { Array stmts; }; struct Ast_Return: Ast{ Ast_Expr *expr; }; struct Ast_Init: Ast{ Token_Kind op; Ast_Atom *ident; Ast_Expr *expr; }; struct Ast_If_Node: Ast{ Ast_Expr *expr ; Ast_Block *block; Ast_Init *init; }; struct Ast_If: Ast{ Array ifs; }; struct Ast_Enum : Ast{ Ast_Expr *typespec; Array children; }; struct Ast_Lambda_Arg: Ast_Expr{ Intern_String name; Ast_Expr *typespec; Ast_Expr *default_value; }; struct Ast_Lambda : Ast_Expr { Array args; Ast_Expr *ret; Ast_Block *block; }; struct Ast_Array: Ast_Expr{ Ast_Expr *base; Ast_Expr *expr; }; struct Ast_Named:Ast{ Intern_String name; }; struct Ast_Resolved_Type; struct Ast_Struct: Ast_Expr{ // Required to be Ast_Struct or Ast_Var or Ast_Const Array members; Ast_Resolved_Type *type; }; struct Ast_Var: Ast_Named{ Ast_Expr *typespec; Ast_Expr *expr; }; struct Ast_Const: Ast_Named{ union{ Ast *ast; Ast_Expr *value; Ast_Struct *agg; }; }; struct Ast_Package:Ast{ Intern_String name; Array decls; Array ordered; }; //----------------------------------------------------------------------------- // AST Constructors beginning with expressions //----------------------------------------------------------------------------- #define AST_NEW(T,ikind,ipos,iflags) \ Ast_##T *result = exp_alloc_type(pctx->perm, Ast_##T, AF_ZeroMemory);\ result->flags = iflags; \ result->kind = AST_##ikind; \ result->pos = ipos; \ result->id = ++pctx->unique_ids function Ast_Atom * ast_str(Token *pos, Intern_String string, Ast_Flag flags = 0){ AST_NEW(Atom, STR, pos, AST_ATOM | flags); result->intern_val = string; return result; } function Ast_Atom * ast_ident(Token *pos, Intern_String string, Ast_Flag flags = 0){ AST_NEW(Atom, IDENT, pos, AST_ATOM | flags); result->intern_val = string; return result; } function Ast_Atom * ast_int(Token *pos, S64 integer, Ast_Flag flags = 0){ AST_NEW(Atom, INT, pos, AST_ATOM | flags); result->int_val = integer; return result; } function Ast_Expr * ast_expr_binary(Ast_Expr *left, Ast_Expr *right, Token *op){ AST_NEW(Binary, BINARY, op, AST_EXPR); result->op = op->kind; result->left = left; result->right = right; result->left->parent = result; result->right->parent = result; return result; } function Ast_Call * ast_call(Token *pos, Ast_Expr *name, Array exprs){ AST_NEW(Call, CALL, pos, AST_EXPR); result->name = name; result->exprs = exprs.tight_copy(pctx->perm); if(result->name) result->name->parent = result; For(result->exprs) it[0]->parent = result; return result; } function Ast_Call_Item * ast_call_item(Token *pos, Ast_Expr *index, Ast_Atom *name, Ast_Expr *item){ AST_NEW(Call_Item, CALL_ITEM, pos, AST_EXPR); result->name = name; result->index = index; result->item = item; if(result->name) result->name->parent = result; if(result->index) result->index->parent = result; item->parent = result; return result; } function Ast_Expr * ast_expr_cast(Token *pos, Ast_Expr *expr, Ast_Expr *typespec){ AST_NEW(Cast, CAST, pos, AST_EXPR); result->flags = AST_EXPR; result->expr = expr; result->typespec = typespec; expr->parent = result; typespec->parent = result; return result; } function Ast_Expr * ast_expr_unary(Token *pos, Token_Kind op, Ast_Expr *expr){ AST_NEW(Unary, UNARY, pos, AST_EXPR); result->flags = AST_EXPR; result->expr = expr; result->op = op; expr->parent = result; return result; } function Ast_Expr * ast_expr_index(Token *pos, Ast_Expr *expr, Ast_Expr *index){ AST_NEW(Index, INDEX, pos, AST_EXPR); result->flags = AST_EXPR; result->expr = expr; result->index = index; expr->parent = result; index->parent = result; return result; } function Ast_Lambda * ast_lambda(Token *pos, Array params, Ast_Expr *ret, Ast_Block *block){ AST_NEW(Lambda, LAMBDA, pos, AST_EXPR); result->flags = AST_EXPR; result->args = params.tight_copy(pctx->perm); result->block = block; result->ret = ret; if(!ret) result->ret = ast_ident(result->pos, intern_void); if(result->block) result->block->parent = result; result->ret->parent = result; For(result->args) it[0]->parent = result; return result; } function Ast_Lambda_Arg * ast_expr_lambda_arg(Token *pos, Intern_String name, Ast_Expr *typespec, Ast_Expr *default_value){ AST_NEW(Lambda_Arg, LAMBDA_ARG, pos, AST_EXPR); result->flags = AST_EXPR; result->name = name; result->typespec = typespec; result->default_value = default_value; result->typespec->parent = result; if(result->default_value) result->default_value->parent = result; return result; } function Ast_Block * ast_block(Token *pos, Array stmts){ AST_NEW(Block, BLOCK, pos, AST_STMT); result->stmts = stmts.tight_copy(pctx->perm); For(result->stmts) it[0]->parent = result; return result; } function Ast_If * ast_if(Token *pos, Array ifs){ AST_NEW(If, IF, pos, AST_STMT); result->ifs = ifs.tight_copy(pctx->perm); For(result->ifs) it[0]->parent = result; return result; } function Ast_Return * ast_return(Token *pos, Ast_Expr *expr){ AST_NEW(Return, RETURN, pos, AST_STMT); if(expr){ assert(is_flag_set(expr->flags, AST_EXPR)); result->expr = expr; result->expr->parent = result; } return result; } function Ast_If_Node * ast_if_node(Token *pos, Ast_Init *init, Ast_Expr *expr, Ast_Block *block){ AST_NEW(If_Node, IF_NODE, pos, AST_STMT); result->block = block; result->expr = expr; result->init = init; if(result->block) result->block->parent = result; if(result->expr) result->expr->parent = result; if(result->init) result->init->parent = result; return result; } function Ast_Init * ast_init(Token *pos, Token_Kind op, Ast_Atom *ident, Ast_Expr *expr){ AST_NEW(Init, INIT, pos, AST_STMT); result->op = op; result->ident = ident; result->expr = expr; result->ident->parent = result; result->expr->parent = result; return result; } function Ast_Array * ast_array(Token *pos, Ast_Expr *expr){ AST_NEW(Array, ARRAY, pos, AST_EXPR); result->flags = AST_EXPR; result->expr = expr; result->expr->parent = result; return result; } function Ast_Struct * ast_struct(Token *pos, Array members){ AST_NEW(Struct, STRUCT, pos, AST_AGGREGATE); result->members = members.tight_copy(pctx->perm); For(result->members) { assert(is_flag_set(it[0]->flags, AST_BINDING)); assert(it[0]->kind == AST_VAR || it[0]->kind == AST_CONST); it[0]->parent = result; } return result; } //----------------------------------------------------------------------------- // Declarations //----------------------------------------------------------------------------- function Ast_Var * ast_var(Token *pos, Ast_Expr *typespec, Intern_String name, Ast_Expr *expr){ AST_NEW(Var, VAR, pos, AST_BINDING); result->expr = expr; result->typespec = typespec; result->name = name; if(result->expr) result->expr->parent = result; if(result->typespec) result->typespec->parent = result; return result; } function Ast_Const * ast_const(Token *pos, Intern_String name, Ast_Expr *value){ AST_NEW(Const, CONST, pos, AST_BINDING); assert(value->kind == AST_STRUCT || is_flag_set(value->flags, AST_EXPR)); result->value = value; result->name = name; result->value->parent = result; return result; } function Ast_Package * ast_package(Token *pos, String name, Array decls){ AST_NEW(Package, PACKAGE, pos, 0); result->decls = decls.tight_copy(pctx->perm); result->ordered = array_make(pctx->perm, decls.len); result->name = intern_string(&pctx->interns, name); For(result->decls) it[0]->parent = result; return result; } //----------------------------------------------------------------------------- // Utillities //----------------------------------------------------------------------------- function Ast_Struct * const_try_getting_struct(Ast *ast){ assert(ast->kind == AST_CONST); Ast_Const *constant = (Ast_Const *)ast; if(constant->value->kind == AST_STRUCT){ return (Ast_Struct *)constant->value; } return 0; } function Ast_Struct * const_get_struct(Ast *ast){ auto result = const_try_getting_struct(ast); assert(result); return result; } function Ast_Lambda * const_try_getting_lambda(Ast *ast){ assert(ast->kind == AST_CONST); Ast_Const *constant = (Ast_Const *)ast; if(constant->value->kind == AST_LAMBDA){ return (Ast_Lambda *)constant->value; } return 0; } function Ast_Lambda * const_get_lambda(Ast *ast){ auto result = const_try_getting_lambda(ast); assert(result); return result; } function Intern_String ast_get_name(Ast *ast){ assert(is_flag_set(ast->flags, AST_BINDING)); auto constant = (Ast_Named *)ast; return constant->name; } function B32 ast_is_struct(Ast *ast){ if(ast->kind == AST_CONST){ auto a = (Ast_Const *)ast; B32 result = a->agg->kind == AST_STRUCT; return result; } return false; }