#include "parser.hpp" #include "ast/errors/error.hpp" #include "ast/expressions/identifier.hpp" #include "ast/expressions/infix.hpp" #include "ast/expressions/integer.hpp" #include "ast/expressions/prefix.hpp" #include "token/token.hpp" #include "token/type.hpp" #include namespace parser { parser::parser(lexer::lexer& lexer) : lexer(lexer), current(token::type::ILLEGAL, ""), next(token::type::ILLEGAL, "") { next_token(); next_token(); register_prefix( token::type::IDENTIFIER, std::bind(&parser::parse_identifier, this) ); register_prefix( token::type::INT, std::bind(&parser::parse_integer, this) ); register_prefix( token::type::BANG, std::bind(&parser::parse_prefix_expr, this) ); register_prefix( token::type::MINUS, std::bind(&parser::parse_prefix_expr, this) ); using namespace std::placeholders; register_infix( token::type::PLUS, std::bind(&parser::parse_infix_expr, this, _1) ); register_infix( token::type::MINUS, std::bind(&parser::parse_infix_expr, this, _1) ); register_infix( token::type::ASTERISK, std::bind(&parser::parse_infix_expr, this, _1) ); register_infix( token::type::SLASH, std::bind(&parser::parse_infix_expr, this, _1) ); register_infix( token::type::EQ, std::bind(&parser::parse_infix_expr, this, _1) ); register_infix( token::type::NEQ, std::bind(&parser::parse_infix_expr, this, _1) ); register_infix( token::type::GT, std::bind(&parser::parse_infix_expr, this, _1) ); register_infix( token::type::LT, std::bind(&parser::parse_infix_expr, this, _1) ); } void parser::next_token() { current = next; next = lexer.next_token(); } void parser::skip_until_semicolon() { for (; current.type != token::type::SEMICOLON && current.type != token::type::END_OF_FILE; next_token()) {}; } std::unique_ptr parser::parse_program() { std::unique_ptr p = std::make_unique(); for (; current.type != token::type::END_OF_FILE; next_token()) { ast::statement* stmt = parse_statement(); if (stmt != nullptr) p->statements.push_back(stmt); } return p; } ast::statement* parser::parse_statement() { switch (current.type) { case token::type::LET: return parse_let(); case token::type::RETURN: return parse_return(); default: return parse_expression_stmt(); } } ast::expression* parser::parse_expression(precedence prec) { auto prefix_it = prefix_parse_fns.find(current.type); if (prefix_it == prefix_parse_fns.end()) { unkown_prefix_error(current); return nullptr; } prefix_parse_fn prefix = prefix_it->second; ast::expression* left = prefix(); while (next.type != token::type::SEMICOLON && prec < precedence_for(next.type)) { auto infix_it = infix_parse_fns.find(next.type); if (infix_it == infix_parse_fns.end()) return left; next_token(); infix_parse_fn infix = infix_it->second; left = infix(left); } return left; }; ast::return_stmt* parser::parse_return() { ast::return_stmt* stmt = new ast::return_stmt(current); next_token(); stmt->value = parse_expression(); if (next.type == token::type::SEMICOLON) next_token(); return stmt; } ast::let_stmt* parser::parse_let() { ast::let_stmt* stmt = new ast::let_stmt(current); if (!expect_next(token::type::IDENTIFIER)) { delete stmt; skip_until_semicolon(); return nullptr; } stmt->name = new ast::identifier{current, current.literal}; if (!expect_next(token::type::ASSIGN)) { delete stmt; skip_until_semicolon(); return nullptr; } next_token(); stmt->value = parse_expression(); if (next.type == token::type::SEMICOLON) next_token(); return stmt; } ast::expression_stmt* parser::parse_expression_stmt() { ast::expression_stmt* stmt = new ast::expression_stmt(current); stmt->expression = parse_expression(); if (next.type == token::type::SEMICOLON) next_token(); return stmt; }; bool parser::expect_next(token::type t) { if (next.type == t) { next_token(); return true; } next_error(t); return false; } void parser::next_error(token::type t) { std::stringstream ss; ss << "Expected next token to be " << t << " but instead got " << next.type; errors.push_back(new ast::error::expected_next(t, ss.str())); } void parser::unkown_prefix_error(token::token tok) { std::stringstream ss; ss << "No prefix parse function for token " << tok; errors.push_back(new ast::error::unkown_prefix(tok, ss.str())); } parser::~parser() { for (const auto& e : errors) delete e; } void parser::register_prefix(token::type type, prefix_parse_fn fn) { prefix_parse_fns[type] = fn; }; void parser::register_infix(token::type type, infix_parse_fn fn) { infix_parse_fns[type] = fn; }; ast::expression* parser::parse_identifier() { return new ast::identifier(current, current.literal); }; ast::expression* parser::parse_integer() { return new ast::integer_literal(current, std::stoi(current.literal)); }; ast::expression* parser::parse_prefix_expr() { ast::prefix_expr* ret = new ast::prefix_expr(current, current.literal); next_token(); ret->right = parse_expression(precedence::PREFIX); return ret; }; ast::expression* parser::parse_infix_expr(ast::expression* left) { ast::infix_expr* ret = new ast::infix_expr(current, current.literal, left); precedence prec = precedence_for(current.type); next_token(); ret->right = parse_expression(prec); return ret; }; } // namespace parser