diff options
author | dec05eba <dec05eba@protonmail.com> | 2019-03-03 13:18:08 +0100 |
---|---|---|
committer | dec05eba <dec05eba@protonmail.com> | 2020-07-25 14:36:46 +0200 |
commit | b3b0c807a75c4f854495b547d8e00a598979cbf6 (patch) | |
tree | e42017c2f5b87a939d103f48d5f90dd93193ebcc /src | |
parent | 4c5ffb35d50d514e3df4788e7cf38245c0127883 (diff) |
Add arithmetic (binop) parsing
Diffstat (limited to 'src')
-rw-r--r-- | src/ast.c | 7 | ||||
-rw-r--r-- | src/parser.c | 115 | ||||
-rw-r--r-- | src/tokenizer.c | 42 |
3 files changed, 155 insertions, 9 deletions
@@ -24,6 +24,7 @@ int funccall_init(FunctionCall *self, BufferView name, ScopedAllocator *allocato void lhsexpr_init(LhsExpr *self, int isConst, BufferView var_name) { self->isConst = isConst; + self->type_name = create_buffer_view_null(); self->var_name = var_name; self->rhs_expr = ast_none(); } @@ -41,4 +42,10 @@ int string_init(String *self, BufferView str) { void number_init(Number *self, i64 value, bool is_integer) { self->value.integer = value; self->is_integer = is_integer; +} + +void binop_init(Binop *self) { + self->lhs = ast_none(); + self->rhs = ast_none(); + self->type = BINOP_ADD; }
\ No newline at end of file diff --git a/src/parser.c b/src/parser.c index 6ea8d1d..52c5bfe 100644 --- a/src/parser.c +++ b/src/parser.c @@ -70,7 +70,7 @@ static CHECK_RESULT int parser_parse_body_loop(Parser *self, Buffer *body_list, } /* -LHS = 'const'|'var' IDENTIFIER +LHS = 'const'|'var' TOK_IDENTIFIER */ static CHECK_RESULT int parser_parse_lhs(Parser *self, LhsExpr **result, bool *assignment) { bool isConst; @@ -92,6 +92,12 @@ static CHECK_RESULT int parser_parse_lhs(Parser *self, LhsExpr **result, bool *a return_if_error(scoped_allocator_alloc(self->allocator, sizeof(LhsExpr), (void**)result)); lhsexpr_init(*result, isConst, var_name); + return_if_error(tokenizer_consume_if(&self->tokenizer, TOK_COLON, &match)); + if(match) { + return_if_error(tokenizer_accept(&self->tokenizer, TOK_IDENTIFIER)); + (*result)->type_name = self->tokenizer.value.identifier; + } + return_if_error(tokenizer_consume_if(&self->tokenizer, TOK_EQUALS, &match)); if(match) { *assignment = bool_true; @@ -165,7 +171,7 @@ static CHECK_RESULT int parser_parse_function_args(Parser *self, FunctionCall *f } /* -VARIABLE = IDENTIFIER +VARIABLE = TOK_IDENTIFIER FUNC_CALL_OR_VARIABLE = VARIABLE '(' FUNC_ARGS ')' */ static CHECK_RESULT int parser_parse_function_call_or_variable(Parser *self, Ast *expr) { @@ -227,10 +233,11 @@ static CHECK_RESULT int parser_parse_number(Parser *self, Ast *rhs_expr) { } /* -RHS = STRING | NUMBER | FUNC_CALL_OR_VARIABLE +RHS_S = STRING | NUMBER | FUNC_CALL_OR_VARIABLE */ -static CHECK_RESULT int parser_parse_rhs(Parser *self, Ast *rhs_expr) { +static CHECK_RESULT int parser_parse_rhs_single_expr(Parser *self, Ast *rhs_expr) { bool match; + *rhs_expr = ast_none(); return_if_error(tokenizer_consume_if(&self->tokenizer, TOK_STRING, &match)); if(match) { @@ -254,6 +261,95 @@ static CHECK_RESULT int parser_parse_rhs(Parser *self, Ast *rhs_expr) { return PARSER_UNEXPECTED_TOKEN; } +static CHECK_RESULT int parser_parse_rhs_binop(Parser *self, Ast *expr); + +/* +RHS_BINOP_PAREN = '(' RHS_BINOP ')' (TOK_BINOP RHS_BINOP) +*/ +static CHECK_RESULT int parser_parse_rhs_binop_paren(Parser *self, bool *match, Ast *expr) { + bool binop_match; + Ast lhs; + Ast rhs; + BinopType binop_type; + + return_if_error(tokenizer_consume_if(&self->tokenizer, TOK_OPEN_PAREN, match)); + if(!*match) + return PARSER_OK; + + return_if_error(parser_parse_rhs_binop(self, &lhs)); + return_if_error(tokenizer_accept(&self->tokenizer, TOK_CLOSING_PAREN)); + + return_if_error(tokenizer_consume_if(&self->tokenizer, TOK_BINOP, &binop_match)); + if(!binop_match) { + *expr = lhs; + return PARSER_OK; + } + binop_type = self->tokenizer.value.binop_type; + + return_if_error(parser_parse_rhs_binop(self, &rhs)); + return_if_error(scoped_allocator_alloc(self->allocator, sizeof(Binop), (void**)&expr->value.binop)); + binop_init(expr->value.binop); + expr->value.binop->type = binop_type; + expr->value.binop->lhs = lhs; + expr->value.binop->rhs = rhs; + expr->type = AST_BINOP; + return PARSER_OK; +} + +/* +RHS_BINOP_WO_PAREN = RHS_S | (RHS_S TOK_BINOP RHS_BINOP) +*/ +static CHECK_RESULT int parser_parse_rhs_binop_without_paren(Parser *self, Ast *expr) { + bool match; + Ast lhs; + Ast rhs; + BinopType binop_type; + + return_if_error(parser_parse_rhs_single_expr(self, &lhs)); + return_if_error(tokenizer_consume_if(&self->tokenizer, TOK_BINOP, &match)); + if(!match) { + *expr = lhs; + return PARSER_OK; + } + binop_type = self->tokenizer.value.binop_type; + + return_if_error(parser_parse_rhs_binop(self, &rhs)); + return_if_error(scoped_allocator_alloc(self->allocator, sizeof(Binop), (void**)&expr->value.binop)); + binop_init(expr->value.binop); + expr->value.binop->type = binop_type; + expr->value.binop->lhs = lhs; + expr->value.binop->rhs = rhs; + expr->type = AST_BINOP; + return PARSER_OK; +} + +/* +RHS_BINOP = RHS_BINOP_PAREN | RHS_BINOP_WO_PAREN + +Note: Parantheses count has to match for the beginning paranthesis and the ending parenthesis. +*/ +int parser_parse_rhs_binop(Parser *self, Ast *expr) { + bool match; + return_if_error(parser_parse_rhs_binop_paren(self, &match, expr)); + if(match) + return PARSER_OK; + return parser_parse_rhs_binop_without_paren(self, expr); +} + +/* +RHS = RHS_BINOP ';' + +Note: Parantheses count has to match for the beginning paranthesis and the ending parenthesis. +*/ +static CHECK_RESULT int parser_parse_rhs(Parser *self, Ast *rhs_expr) { + /* TODO: If binop only contains one expression, then use that directly for @rhs_expr */ + return_if_error(parser_parse_rhs_binop(self, rhs_expr)); + + /* TODO: Implement this */ + /*binop_reorder_by_precedence(binop);*/ + return PARSER_OK; +} + /* RHS_START = CLOSURE | IMPORT | RHS */ @@ -312,6 +408,17 @@ int parser_parse_body(Parser *self, Ast *ast) { *ast = rhs_expr; } + if(rhs_expr.type == AST_BINOP) { + bool match; + return_if_error(tokenizer_consume_if(&self->tokenizer, TOK_SEMICOLON, &match)); + if(!match) { + /* TODO: Specify all the binop characters instead of "binop" which doesn't make sense for the user */ + self->error = tokenizer_create_error(&self->tokenizer, "Expected ';' or binop"); + return PARSER_UNEXPECTED_TOKEN; + } + return PARSER_OK; + } + /* TODO: Check for struct and tables */ if(rhs_expr.type != AST_FUNCTION_DECL) return_if_error(tokenizer_accept(&self->tokenizer, TOK_SEMICOLON)); diff --git a/src/tokenizer.c b/src/tokenizer.c index afaeb8e..152aec4 100644 --- a/src/tokenizer.c +++ b/src/tokenizer.c @@ -116,6 +116,8 @@ static CHECK_RESULT int string_to_float_unchecked(BufferView str, f64 *result) { return 0; } +#define SET_BINOP(_binop_type) do { *token = TOK_BINOP; self->value.binop_type = (_binop_type); } while(0) + static CHECK_RESULT int tokenizer_next(Tokenizer *self, Token *token); static CHECK_RESULT int __tokenizer_next(Tokenizer *self, Token *token) { @@ -182,7 +184,6 @@ static CHECK_RESULT int __tokenizer_next(Tokenizer *self, Token *token) { self->value.string.size = string_end - self->index; self->index = string_end + 1; *token = TOK_STRING; - return TOKENIZER_OK; } else if(isDigit(c)) { int number_start; int dot_index; @@ -225,10 +226,21 @@ static CHECK_RESULT int __tokenizer_next(Tokenizer *self, Token *token) { self->number_is_integer = bool_false; } *token = TOK_NUMBER; - return TOKENIZER_OK; } else if(c == '.') { ++self->index; - *token = TOK_DOT; + SET_BINOP(BINOP_DOT); + } else if(c == '+') { + ++self->index; + SET_BINOP(BINOP_ADD); + } else if(c == '-') { + ++self->index; + SET_BINOP(BINOP_SUB); + } else if(c == '*') { + ++self->index; + SET_BINOP(BINOP_MUL); + } else if(c == '/') { + ++self->index; + SET_BINOP(BINOP_DIV); } else if(c == '=') { ++self->index; *token = TOK_EQUALS; @@ -250,6 +262,9 @@ static CHECK_RESULT int __tokenizer_next(Tokenizer *self, Token *token) { } else if(c == ';') { ++self->index; *token = TOK_SEMICOLON; + } else if(c == ':') { + ++self->index; + *token = TOK_COLON; } else if(c == '@') { const char *err_msg; ++self->index; @@ -313,6 +328,19 @@ static usize strlen(const char *str) { return len; } +/* +static const char* binop_to_string(BinopType binop_type) { + switch(binop_type) { + case BINOP_DOT: return "."; + case BINOP_ADD: return "+"; + case BINOP_SUB: return "-"; + case BINOP_MUL: return "*"; + case BINOP_DIV: return "/"; + } + assert(bool_false && "binop_to_string not implemented for binop_type"); +} +*/ + static BufferView tokenizer_expected_token_as_string(Token token) { const char *str; switch(token) { @@ -361,12 +389,16 @@ static BufferView tokenizer_expected_token_as_string(Token token) { case TOK_NUMBER: str = "number"; break; - case TOK_DOT: - str = "."; + case TOK_BINOP: + /* TODO: binop_to_string */ + str = "binop"; break; case TOK_SEMICOLON: str = ";"; break; + case TOK_COLON: + str = ":"; + break; default: str = "Unknown token"; break; |