//----------------------------------------------------------------------------- // AST //----------------------------------------------------------------------------- enum Ast_Kind: U32{ AST_NONE, AST_NAMESPACE, AST_MODULE, AST_FILE, AST_SCOPE, AST_VALUE, AST_CAST, AST_IDENT, AST_INDEX, AST_UNARY, AST_BINARY, AST_CALL_ITEM, AST_CALL, AST_CONSTANT_ASSERT, AST_RUNTIME_ASSERT, AST_SIZE_OF, AST_LENGTH_OF, AST_ALIGN_OF, AST_TYPE_OF, AST_SWITCH, AST_SWITCH_CASE, AST_VAR_UNPACK, AST_BREAK, AST_COMPOUND, AST_TYPE, AST_VAR, AST_CONST, AST_POINTER, AST_ARRAY, AST_FOR, AST_IF, AST_IF_NODE, AST_RETURN, AST_BLOCK, AST_PASS, AST_LAMBDA, AST_LAMBDA_EXPR, AST_LAMBDA_ARG, AST_ENUM, AST_ENUM_MEMBER, AST_STRUCT, }; typedef U32 Ast_Flag; enum{ AST_EXPR = bit_flag(1), AST_STMT = bit_flag(2), AST_STRICT = bit_flag(3), AST_AGGREGATE = bit_flag(4), AST_AGGREGATE_CHILD = bit_flag(5), AST_ATOM = bit_flag(7), AST_FOREIGN = bit_flag(8), AST_DECL = bit_flag(9), AST_GLOBAL = bit_flag(10), AST_FLAG = bit_flag(11), AST_VAR_IS_CONST = bit_flag(12), AST_OPERATOR_OVERLOAD = bit_flag(13), AST_IS_LVALUE = bit_flag(14), }; struct Ast{ U64 di; // Debug id, shouldn't ever be used in the program Token *pos; Ast_Kind kind; Ast_Scope *parent_scope; Ast_Flag flags; }; struct Ast_Type; struct Ast_Expr:Ast{ Ast_Type *resolved_type; Ast_Decl *resolved_operator_overload; union{ Ast_Type *index_original_type; Ast_Type *cast_after_type; Ast_Type *dot_access_step_resolution; }; }; struct Ast_Atom: Ast_Expr{ // We have a field type here // it has a different purpose from the // resolved_type of Ast_Expr, it describes // the inherent type of a value // // resolved_type is a solid type that // can be use during code generation // it cannot be untyped. (or at least thats the hope :) /*#import meta meta.inline_value_fields() */ union { Value value; struct { Ast_Type *type; Ast_Decl *resolved_decl; union { bool bool_val; F64 f64_val; Intern_String intern_val; BigInt big_int_val; Ast_Type *type_val; }; }; }; /*END*/ }; typedef U32 Ast_Call_Item_Flag; enum{ CALL_INDEX = bit_flag(1), CALL_NAME = bit_flag(2), CALL_INCLUDED= bit_flag(4), }; struct Ast_Call_Item: Ast_Expr{ Ast_Call_Item_Flag call_flags; S32 resolved_index; Ast_Expr *item; union { Ast_Atom *name; Ast_Expr *index; }; Intern_String resolved_name; }; struct Ast_Lambda; struct Ast_Call: Ast_Expr{ union{ Ast_Expr *name; Ast_Expr *typespec; }; Array exprs; Ast_Decl *resolved_decl; }; struct Ast_Var_Unpack: Ast_Expr{ Array vars; Ast_Expr *expr; }; struct Ast_Unary: Ast_Expr{ Token_Kind op; Ast_Expr *expr; U64 padding[2]; // For folding constants into atoms }; struct Ast_Index: Ast_Expr{ Ast_Expr *expr; Ast_Expr *index; }; struct Ast_Binary: Ast_Expr{ Token_Kind op; Ast_Expr *left; Ast_Expr *right; Ast_Type *before_type; }; struct Ast_Builtin: Ast_Expr{ Ast_Expr *expr; Intern_String assert_message; U64 padding[1]; // For folding constants into atoms }; // Problem: We are parsing out of order, in the middle of parsing a function // we can jump down a different function, we cant therfore use global map. // Each scope needs to have it's checked locals list. To lookup syms we need to // look into global scope and to the locals list. // struct Ast_Return: Ast{ Ast_Type *resolved_type; Array expr; }; struct Ast_If_Node: Ast{ Ast_Expr *expr ; Ast_Scope *scope; Ast_Binary*init; }; struct Ast_If: Ast{ Array ifs; }; struct Ast_Pass: Ast{}; struct Ast_Break: Ast{}; struct Ast_For: Ast{ Ast_Expr *init; Ast_Expr *cond; Ast_Expr *iter; Ast_Scope *scope; Ast_Decl *array_traversal_var; bool is_array_traversal; bool is_also_slice_traversal; }; struct Ast_Lambda : Ast_Expr { Array args; Array ret; Ast_Scope *scope; }; struct Ast_Array: Ast_Expr{ Ast_Expr *base; Ast_Expr *expr; U64 padding[2]; }; struct Ast_Switch_Case: Ast{ Array labels; Ast_Scope *scope; B32 fallthrough; }; struct Ast_Switch: Ast{ Ast_Expr *value; Array cases; Ast_Scope *default_scope; }; /* How does current declaration order resolver works: * First we put all the global declarations into the global scope (when parsing) all unresolved * All the types are declared INCOMPLETE and RESOLVED * We descent the tree by resolving each of the named declarations, we resolve by their name When we start resolving we set RESOLVING flag and when we complete RESOLVED flag and put into ordered list * When we meet a symbol (named declaration) while descending the tree, we resolve that symbol instead before resolving current declaration. * When we meet a declaration that requires size of a type - field access, var assignment, we need to call "complete_type", it sets COMPLETING flag. This call resolves all the dependencies of that type, sets size of type and marks it as COMPLETE and puts into ordered list. If it detects COMPLETING while resolving, we got a circular dependency. That might happen when we have that struct without pointer inside itself. */ struct Ast_Scope: Ast{ String debug_name; // Dont use List implicit_imports; List decls; Array stmts; U32 visit_id; U32 scope_id; Ast_Scope *file; // Self referential for file and module Ast_Module *module; }; enum Ast_Module_State{ MODULE_REGISTERED, MODULE_PARSED, MODULE_RESOLVED, }; struct Ast_Module: Ast_Scope{ Ast_Module_State state; String absolute_base_folder; String absolute_file_path; List all_loaded_files; }; struct Ast_File: Ast_Scope{ String absolute_base_folder; String absolute_file_path; String filecontent; }; enum Ast_Decl_State{ DECL_NOT_RESOLVED, DECL_RESOLVED, DECL_RESOLVED_TYPE, DECL_RESOLVING, }; struct Ast_Decl: Ast{ Ast_Decl_State state; Intern_String name; Intern_String unique_name; // For code generation, currently only present on lambdas U64 operator_overload_arguments_hash; Operator_Info *overload_op_info; Ast_Scope *scope; Ast_Expr *typespec; union{ Ast_Expr *expr; Ast_Lambda *lambda; }; /*#import meta meta.inline_value_fields() */ union { Value value; struct { Ast_Type *type; Ast_Decl *resolved_decl; union { bool bool_val; F64 f64_val; Intern_String intern_val; BigInt big_int_val; Ast_Type *type_val; }; }; }; /*END*/ }; //----------------------------------------------------------------------------- // AST Constructors beginning with expressions //----------------------------------------------------------------------------- #define AST_NEW(T,ikind,ipos,iflags) \ Ast_##T *result = arena_push_type(pctx->perm, Ast_##T, AF_ZeroMemory);\ result->flags = iflags; \ result->kind = AST_##ikind; \ result->parent_scope = pctx->currently_parsed_scope; \ result->pos = ipos; \ result->di = ++pctx->unique_ids #define ast_new(T,kind,pos,flags) (T *)_ast_new(sizeof(T), kind, pos, flags) CORE_Static Ast * _ast_new(size_t size, Ast_Kind kind, Token *pos, Ast_Flag flags = 0){ Ast *result = (Ast *)arena_push_size(pctx->perm, size, AF_ZeroMemory); result->flags = flags; result->kind = kind; result->parent_scope = pctx->currently_parsed_scope; result->pos = pos; result->di = ++pctx->unique_ids; return result; } CORE_Static Ast_Atom * ast_str(Token *pos, Intern_String string){ AST_NEW(Atom, VALUE, pos, AST_EXPR | AST_ATOM); result->type = untyped_string; result->intern_val = string; return result; } CORE_Static Ast_Atom * ast_ident(Token *pos, Intern_String string){ AST_NEW(Atom, IDENT, pos, AST_EXPR | AST_ATOM); result->intern_val = string; return result; } CORE_Static Ast_Atom * ast_bool(Token *pos, B32 bool_val){ AST_NEW(Atom, VALUE, pos, AST_EXPR | AST_ATOM); result->bool_val = bool_val; result->type = untyped_bool; return result; } CORE_Static Ast_Atom * ast_float(Token *pos, F64 value){ AST_NEW(Atom, VALUE, pos, AST_EXPR | AST_ATOM); result->type = untyped_float; result->f64_val = value; return result; } CORE_Static Ast_Atom * ast_int(Token *pos, BigInt val){ AST_NEW(Atom, VALUE, pos, AST_EXPR | AST_ATOM); result->type = untyped_int; result->big_int_val = bigint_copy(pctx->perm, &val); return result; } CORE_Static Ast_Atom * ast_int(Token *pos, U64 value){ return ast_int(pos, bigint_u64(value)); } CORE_Static Ast_Expr * ast_expr_binary(Ast_Expr *left, Ast_Expr *right, Token *op){ AST_NEW(Binary, BINARY, op, AST_EXPR); result->op = op->kind; result->left = left; result->right = right; return result; } CORE_Static Ast_Call * ast_call(Token *pos, Ast_Expr *name, Array exprs){ // name here specifies also typespec for compound expressions ! AST_NEW(Call, CALL, pos, AST_EXPR); result->name = name; result->exprs = exprs.tight_copy(pctx->perm); return result; } CORE_Static Ast_Call_Item * ast_call_item(Token *pos, Ast_Atom *name, Ast_Expr *index, Ast_Expr *item){ AST_NEW(Call_Item, CALL_ITEM, pos, AST_EXPR); result->name = name; result->item = item; result->index = index; return result; } CORE_Static Ast_Expr * ast_expr_unary(Token *pos, Token_Kind op, Ast_Expr *expr){ AST_NEW(Unary, UNARY, pos, AST_EXPR); result->flags = AST_EXPR; result->expr = expr; result->op = op; return result; } CORE_Static Ast_Expr * ast_expr_index(Token *pos, Ast_Expr *expr, Ast_Expr *index){ AST_NEW(Index, INDEX, pos, AST_EXPR); result->flags = AST_EXPR; result->expr = expr; result->index = index; return result; } CORE_Static Ast_Lambda * ast_lambda(Token *pos, Array params, Array ret, Ast_Scope *scope){ AST_NEW(Lambda, LAMBDA_EXPR, pos, AST_EXPR); result->flags = AST_EXPR; result->args = params.tight_copy(pctx->perm); result->ret = ret.tight_copy(pctx->perm); result->scope = scope; return result; } CORE_Static Ast_If * ast_if(Token *pos, Array ifs){ AST_NEW(If, IF, pos, AST_STMT); result->ifs = ifs.tight_copy(pctx->perm); return result; } CORE_Static Ast_For * ast_for(Token *pos, Ast_Expr *init, Ast_Expr *cond, Ast_Expr *iter, Ast_Scope *scope){ AST_NEW(For, FOR, pos, AST_STMT); result->init = init; result->cond = cond; result->iter = iter; result->scope = scope; return result; } CORE_Static Ast_Pass * ast_pass(Token *pos){ AST_NEW(Pass, PASS, pos, AST_STMT); return result; } CORE_Static Ast_Break * ast_break(Token *pos){ AST_NEW(Break, BREAK, pos, AST_STMT); return result; } CORE_Static Ast_Return * ast_return(Token *pos, Array expr){ AST_NEW(Return, RETURN, pos, AST_STMT); if(expr.len){ For(expr) assert(is_flag_set(it->flags, AST_EXPR)); result->expr = expr.tight_copy(pctx->perm); } return result; } CORE_Static Ast_If_Node * ast_if_node(Token *pos, Ast_Expr *init, Ast_Expr *expr, Ast_Scope *scope){ AST_NEW(If_Node, IF_NODE, pos, AST_STMT); result->scope = scope; result->expr = expr; result->init = (Ast_Binary *)init; if(result->init) { assert(init->kind == AST_VAR); } return result; } CORE_Static Ast_Array * ast_array(Token *pos, Ast_Expr *expr){ AST_NEW(Array, ARRAY, pos, AST_EXPR); result->expr = expr; return result; } CORE_Static Ast_Scope * begin_decl_scope(Arena *scratch, Token *pos){ AST_NEW(Scope, SCOPE, pos, AST_DECL); result->file = pctx->currently_parsed_file; result->module = pctx->currently_parsed_file->module; result->scope_id = pctx->scope_ids++; result->debug_name = pos->string; assert(result->file); pctx->currently_parsed_scope = result; return result; } CORE_Static void finalize_decl_scope(Ast_Scope *scope){ pctx->currently_parsed_scope = scope->parent_scope; } CORE_Static Ast_Scope * begin_stmt_scope(Arena *scratch, Token *pos){ AST_NEW(Scope, SCOPE, pos, AST_STMT); result->stmts = {scratch}; result->file = pctx->currently_parsed_file; result->module = pctx->currently_parsed_file->module; result->scope_id = pctx->scope_ids++; result->debug_name = pos->string; assert(result->file); pctx->currently_parsed_scope = result; return result; } CORE_Static void finalize_stmt_scope(Ast_Scope *scope){ scope->stmts = scope->stmts.tight_copy(pctx->perm); pctx->currently_parsed_scope = scope->parent_scope; } CORE_Static Ast_Decl * ast_struct(Token *pos, Ast_Scope *scope){ AST_NEW(Decl, STRUCT, pos, AST_DECL | AST_AGGREGATE); result->scope = scope; return result; } CORE_Static Ast_Decl * ast_enum(Token *pos, Ast_Expr *typespec, Ast_Scope *scope){ AST_NEW(Decl, ENUM, pos, AST_DECL | AST_AGGREGATE); result->scope = scope; result->typespec = typespec; return result; } CORE_Static Ast_Decl * ast_var(Token *pos, Ast_Expr *typespec, Intern_String name, Ast_Expr *expr){ AST_NEW(Decl, VAR, pos, AST_DECL); result->name = name; result->typespec = typespec; result->expr = expr; return result; } CORE_Static Ast_Decl * ast_const(Token *pos, Intern_String name, Value value){ AST_NEW(Decl, CONST, pos, AST_DECL); result->value = value; result->name = name; return result; } CORE_Static Ast_Decl * ast_const(Token *pos, Intern_String name, Ast_Expr *expr){ AST_NEW(Decl, CONST, pos, AST_DECL); result->expr = expr; result->name = name; return result; } CORE_Static Ast_Decl * ast_type(Token *pos, Intern_String name, Ast_Type *type){ AST_NEW(Decl, TYPE, pos, AST_DECL); result->type = type_type; result->type_val = type; result->name = name; return result; } CORE_Static Ast_Scope * ast_decl_scope(Token *pos, Arena *allocator, Ast_File *file){ AST_NEW(Scope, SCOPE, pos, AST_DECL); result->file = file; result->scope_id = pctx->scope_ids++; assert(result->file); return result; } CORE_Static Ast_Decl * ast_namespace(Token *pos, Ast_Scope *module, Intern_String name){ AST_NEW(Decl, NAMESPACE, pos, AST_DECL); result->scope = module; result->name = name; return result; } CORE_Static Ast_Builtin * ast_runtime_assert(Token *pos, Ast_Expr *expr, Intern_String message){ AST_NEW(Builtin, RUNTIME_ASSERT, pos, AST_EXPR); result->expr = expr; result->assert_message = message; return result; } CORE_Static Ast_Builtin * ast_constant_assert(Token *pos, Ast_Expr *expr, Intern_String message){ AST_NEW(Builtin, CONSTANT_ASSERT, pos, AST_EXPR); result->expr = expr; result->assert_message = message; return result; } CORE_Static Ast_Builtin * ast_sizeof(Token *pos, Ast_Expr *expr){ AST_NEW(Builtin, SIZE_OF, pos, AST_EXPR); result->expr = expr; return result; } CORE_Static Ast_Builtin * ast_len(Token *pos, Ast_Expr *expr){ AST_NEW(Builtin, LENGTH_OF, pos, AST_EXPR); result->expr = expr; return result; } CORE_Static Ast_Builtin * ast_alignof(Token *pos, Ast_Expr *expr){ AST_NEW(Builtin, ALIGN_OF, pos, AST_EXPR); result->expr = expr; return result; } CORE_Static Ast_Var_Unpack * ast_var_unpack(Token *pos, Array vars, Ast_Expr *expr){ AST_NEW(Var_Unpack, VAR_UNPACK, pos, AST_STMT); result->vars = vars.tight_copy(pctx->perm); result->expr = expr; return result; } //----------------------------------------------------------------------------- // Value //----------------------------------------------------------------------------- CORE_Static Value value_bool(B32 v){ Value value; value.bool_val = v; value.type = untyped_bool; return value; } CORE_Static Value value_int(BigInt b){ Value value; value.big_int_val = b; value.type = untyped_int; return value; } CORE_Static Value value_int(S64 s64){ Value value; value.type = untyped_int; bigint_init_signed(&value.big_int_val, s64); return value; } CORE_Static Value value_float(F64 b){ Value value; value.f64_val = b; value.type = untyped_float; return value; } CORE_Static Value value_float(BigInt a){ Value value; value.f64_val = bigint_as_float(&a); value.type = untyped_float; return value; } CORE_Static B32 is_ident(Ast *ast){ B32 result = ast->kind == AST_IDENT; return result; } CORE_Static B32 is_binary(Ast *ast){ B32 result = ast->kind == AST_BINARY; return result; } CORE_Static B32 is_atom(Ast *ast){ B32 result = is_flag_set(ast->flags, AST_ATOM); return result; }