Files
interpreter-cpp/src/parser/parser.cpp
Karma Riuk 2174781b77 using smart pointers instead of normal ones for
easier setup of tests (to call setup() multiple
times without leaks)
2025-07-11 11:16:16 +02:00

238 lines
6.6 KiB
C++

#include "parser.hpp"
#include "ast/errors/error.hpp"
#include "ast/expressions/identifier.hpp"
#include "ast/expressions/infix.hpp"
#include "ast/expressions/integer.hpp"
#include "ast/expressions/prefix.hpp"
#include "token/token.hpp"
#include "token/type.hpp"
#include <sstream>
namespace parser {
parser::parser(lexer::lexer& lexer)
: lexer(lexer),
current(token::type::ILLEGAL, ""),
next(token::type::ILLEGAL, "") {
next_token();
next_token();
register_prefix(
token::type::IDENTIFIER,
std::bind(&parser::parse_identifier, this)
);
register_prefix(
token::type::INT,
std::bind(&parser::parse_integer, this)
);
register_prefix(
token::type::BANG,
std::bind(&parser::parse_prefix_expr, this)
);
register_prefix(
token::type::MINUS,
std::bind(&parser::parse_prefix_expr, this)
);
using namespace std::placeholders;
register_infix(
token::type::PLUS,
std::bind(&parser::parse_infix_expr, this, _1)
);
register_infix(
token::type::MINUS,
std::bind(&parser::parse_infix_expr, this, _1)
);
register_infix(
token::type::ASTERISK,
std::bind(&parser::parse_infix_expr, this, _1)
);
register_infix(
token::type::SLASH,
std::bind(&parser::parse_infix_expr, this, _1)
);
register_infix(
token::type::EQ,
std::bind(&parser::parse_infix_expr, this, _1)
);
register_infix(
token::type::NEQ,
std::bind(&parser::parse_infix_expr, this, _1)
);
register_infix(
token::type::GT,
std::bind(&parser::parse_infix_expr, this, _1)
);
register_infix(
token::type::LT,
std::bind(&parser::parse_infix_expr, this, _1)
);
}
void parser::next_token() {
current = next;
next = lexer.next_token();
}
void parser::skip_until_semicolon() {
for (; current.type != token::type::SEMICOLON
&& current.type != token::type::END_OF_FILE;
next_token()) {};
}
std::unique_ptr<ast::program> parser::parse_program() {
std::unique_ptr<ast::program> p = std::make_unique<ast::program>();
for (; current.type != token::type::END_OF_FILE; next_token()) {
ast::statement* stmt = parse_statement();
if (stmt != nullptr)
p->statements.push_back(stmt);
}
return p;
}
ast::statement* parser::parse_statement() {
switch (current.type) {
case token::type::LET:
return parse_let();
case token::type::RETURN:
return parse_return();
default:
return parse_expression_stmt();
}
}
ast::expression* parser::parse_expression(precedence prec) {
auto prefix_it = prefix_parse_fns.find(current.type);
if (prefix_it == prefix_parse_fns.end()) {
unkown_prefix_error(current);
return nullptr;
}
prefix_parse_fn prefix = prefix_it->second;
ast::expression* left = prefix();
while (next.type != token::type::SEMICOLON
&& prec < precedence_for(next.type)) {
auto infix_it = infix_parse_fns.find(next.type);
if (infix_it == infix_parse_fns.end())
return left;
next_token();
infix_parse_fn infix = infix_it->second;
left = infix(left);
}
return left;
};
ast::return_stmt* parser::parse_return() {
ast::return_stmt* stmt = new ast::return_stmt(current);
next_token();
stmt->value = parse_expression();
if (next.type == token::type::SEMICOLON)
next_token();
return stmt;
}
ast::let_stmt* parser::parse_let() {
ast::let_stmt* stmt = new ast::let_stmt(current);
if (!expect_next(token::type::IDENTIFIER)) {
delete stmt;
skip_until_semicolon();
return nullptr;
}
stmt->name = new ast::identifier{current, current.literal};
if (!expect_next(token::type::ASSIGN)) {
delete stmt;
skip_until_semicolon();
return nullptr;
}
next_token();
stmt->value = parse_expression();
if (next.type == token::type::SEMICOLON)
next_token();
return stmt;
}
ast::expression_stmt* parser::parse_expression_stmt() {
ast::expression_stmt* stmt = new ast::expression_stmt(current);
stmt->expression = parse_expression();
if (next.type == token::type::SEMICOLON)
next_token();
return stmt;
};
bool parser::expect_next(token::type t) {
if (next.type == t) {
next_token();
return true;
}
next_error(t);
return false;
}
void parser::next_error(token::type t) {
std::stringstream ss;
ss << "Expected next token to be " << t << " but instead got "
<< next.type;
errors.push_back(new ast::error::expected_next(t, ss.str()));
}
void parser::unkown_prefix_error(token::token tok) {
std::stringstream ss;
ss << "No prefix parse function for token " << tok;
errors.push_back(new ast::error::unkown_prefix(tok, ss.str()));
}
parser::~parser() {
for (const auto& e : errors)
delete e;
}
void parser::register_prefix(token::type type, prefix_parse_fn fn) {
prefix_parse_fns[type] = fn;
};
void parser::register_infix(token::type type, infix_parse_fn fn) {
infix_parse_fns[type] = fn;
};
ast::expression* parser::parse_identifier() {
return new ast::identifier(current, current.literal);
};
ast::expression* parser::parse_integer() {
return new ast::integer_literal(current, std::stoi(current.literal));
};
ast::expression* parser::parse_prefix_expr() {
ast::prefix_expr* ret = new ast::prefix_expr(current, current.literal);
next_token();
ret->right = parse_expression(precedence::PREFIX);
return ret;
};
ast::expression* parser::parse_infix_expr(ast::expression* left) {
ast::infix_expr* ret =
new ast::infix_expr(current, current.literal, left);
precedence prec = precedence_for(current.type);
next_token();
ret->right = parse_expression(prec);
return ret;
};
} // namespace parser