elna/source/parser.cpp

535 lines
13 KiB
C++
Raw Normal View History

#include "elna/source/parser.hpp"
2024-03-01 10:13:55 +01:00
#include <stdexcept>
2024-03-07 09:15:11 +01:00
namespace elna::source
2024-03-01 10:13:55 +01:00
{
2024-03-14 08:52:45 +01:00
void empty_visitor::visit(declaration *declaration)
{
}
/**
 * Default handler for a definition: forwards the visitor to the
 * definition's body.
 */
void empty_visitor::visit(definition *definition)
{
    auto& definition_body = definition->body();

    definition_body.accept(this);
}
/**
 * Default handler for a bang statement: forwards the visitor to the
 * statement's body expression.
 */
void empty_visitor::visit(bang_statement *statement)
{
    auto& operand = statement->body();

    operand.accept(this);
}
/**
 * Default handler for a compound statement: visits every nested
 * statement in the order they are stored.
 */
void empty_visitor::visit(compound_statement *statement)
{
    auto& children = statement->statements();

    for (auto& child : children)
    {
        child->accept(this);
    }
}
/**
 * Default handler for an assignment: visits the right-hand side
 * expression only.
 */
void empty_visitor::visit(assign_statement *statement)
{
    auto& assigned_value = statement->rvalue();

    assigned_value.accept(this);
}
/**
 * Default handler for a block: visits the definitions first, then the
 * declarations, and finally the block body.
 */
void empty_visitor::visit(block *block)
{
    for (const auto& current_definition : block->definitions())
    {
        current_definition->accept(this);
    }

    for (const auto& current_declaration : block->declarations())
    {
        current_declaration->accept(this);
    }

    auto& block_body = block->body();
    block_body.accept(this);
}
/**
 * Default handler for a binary expression: visits the left operand and
 * then the right operand.
 */
void empty_visitor::visit(binary_expression *expression)
{
    auto& left_operand = expression->lhs();
    left_operand.accept(this);

    auto& right_operand = expression->rhs();
    right_operand.accept(this);
}
void empty_visitor::visit(variable_expression *variable)
{
}
void empty_visitor::visit(integer_literal *number)
{
}
2024-03-01 10:13:55 +01:00
/**
* AST node.
*/
2024-03-09 08:36:07 +01:00
void node::accept(parser_visitor *)
2024-03-01 10:13:55 +01:00
{
}
2024-03-10 08:50:55 +01:00
declaration::declaration(const std::string& identifier)
: m_identifier(identifier)
{
}
std::string& declaration::identifier() noexcept
{
return m_identifier;
}
/**
 * Creates a definition node.
 *
 * \param identifier Defined name; it is copied into the node.
 * \param body Integer literal bound to the name; ownership is taken over.
 */
definition::definition(const std::string& identifier, std::unique_ptr<integer_literal>&& body)
    // identifier is a const reference, so std::move on it could only ever
    // select the copy constructor; copy explicitly instead of pretending to move.
    : m_identifier(identifier), m_body(std::move(body))
{
}
2024-03-10 08:50:55 +01:00
/**
 * Dispatches to the visitor's overload for declarations.
 *
 * \param visitor Visitor to call; it is dereferenced without a null check.
 */
void declaration::accept(parser_visitor *visitor)
{
    (*visitor).visit(this);
}
2024-03-09 08:36:07 +01:00
/**
 * Dispatches to the visitor's overload for definitions.
 *
 * \param visitor Visitor to call; it is dereferenced without a null check.
 */
void definition::accept(parser_visitor *visitor)
{
    (*visitor).visit(this);
}
std::string& definition::identifier() noexcept
{
return m_identifier;
}
/**
 * \return The integer literal owned by this definition. The owning
 *         pointer is dereferenced without a null check.
 */
integer_literal& definition::body()
{
    return *this->m_body;
}
2024-03-10 08:50:55 +01:00
/**
 * Creates a block node and gives it a freshly allocated symbol table.
 *
 * \param definitions Definitions of the block; moved into the node.
 * \param declarations Declarations of the block; moved into the node.
 * \param body Statement forming the block body; ownership is taken over.
 */
block::block(std::vector<std::unique_ptr<definition>>&& definitions,
        std::vector<std::unique_ptr<declaration>>&& declarations,
        std::unique_ptr<statement>&& body)
    : m_definitions(std::move(definitions)),
      m_declarations(std::move(declarations)),
      m_body(std::move(body)),
      m_table(std::make_shared<symbol_table>())
{
}
2024-03-09 08:36:07 +01:00
/**
 * Dispatches to the visitor's overload for blocks.
 *
 * \param visitor Visitor to call; it is dereferenced without a null check.
 */
void block::accept(parser_visitor *visitor)
{
    (*visitor).visit(this);
}
/**
 * \return The statement owned by this block. The owning pointer is
 *         dereferenced without a null check.
 */
statement& block::body()
{
    return *this->m_body;
}
std::vector<std::unique_ptr<definition>>& block::definitions() noexcept
{
return m_definitions;
}
2024-03-10 08:50:55 +01:00
std::vector<std::unique_ptr<declaration>>& block::declarations() noexcept
{
return m_declarations;
}
2024-03-14 08:52:45 +01:00
std::shared_ptr<symbol_table> block::table()
{
return m_table;
}
/**
 * Creates an integer literal node.
 *
 * \param value Number the literal stands for.
 */
integer_literal::integer_literal(const std::int32_t value)
    : m_number(value)
{
}
2024-03-09 08:36:07 +01:00
/**
 * Dispatches to the visitor's overload for integer literals.
 *
 * \param visitor Visitor to call; it is dereferenced without a null check.
 */
void integer_literal::accept(parser_visitor *visitor)
{
    (*visitor).visit(this);
}
std::int32_t integer_literal::number() const noexcept
{
return m_number;
}
2024-03-07 09:15:11 +01:00
variable_expression::variable_expression(const std::string& name)
: m_name(name)
{
}
2024-03-09 08:36:07 +01:00
/**
 * Dispatches to the visitor's overload for variable expressions.
 *
 * \param visitor Visitor to call; it is dereferenced without a null check.
 */
void variable_expression::accept(parser_visitor *visitor)
{
    (*visitor).visit(this);
}
2024-03-07 09:15:11 +01:00
const std::string& variable_expression::name() const noexcept
2024-03-01 10:13:55 +01:00
{
return m_name;
}
2024-03-01 10:13:55 +01:00
/**
 * Creates a binary expression node.
 *
 * \param lhs Left operand; ownership is taken over.
 * \param rhs Right operand; ownership is taken over.
 * \param operation Operator character: one of '+', '-', '*' or '/'.
 *
 * \throws std::logic_error if \a operation is any other character. Both
 *         operands have already been moved into the node at that point.
 */
binary_expression::binary_expression(std::unique_ptr<expression>&& lhs,
        std::unique_ptr<expression>&& rhs, const unsigned char operation)
    : m_lhs(std::move(lhs)), m_rhs(std::move(rhs))
{
    // Translate the operator character into the corresponding enumerator.
    if (operation == '+')
    {
        m_operator = binary_operator::sum;
    }
    else if (operation == '-')
    {
        m_operator = binary_operator::subtraction;
    }
    else if (operation == '*')
    {
        m_operator = binary_operator::multiplication;
    }
    else if (operation == '/')
    {
        m_operator = binary_operator::division;
    }
    else
    {
        throw std::logic_error("Invalid binary operator");
    }
}
2024-03-09 08:36:07 +01:00
/**
 * Dispatches to the visitor's overload for binary expressions.
 *
 * \param visitor Visitor to call; it is dereferenced without a null check.
 */
void binary_expression::accept(parser_visitor *visitor)
{
    (*visitor).visit(this);
}
/**
 * \return The left operand. The owning pointer is dereferenced without
 *         a null check.
 */
expression& binary_expression::lhs()
{
    return *this->m_lhs;
}
/**
 * \return The right operand. The owning pointer is dereferenced without
 *         a null check.
 */
expression& binary_expression::rhs()
{
    return *this->m_rhs;
}
/**
 * \return The operator selected when the expression was constructed.
 */
binary_operator binary_expression::operation() const noexcept
{
    return this->m_operator;
}
bang_statement::bang_statement(std::unique_ptr<expression>&& body)
: m_body(std::move(body))
{
}
2024-03-09 08:36:07 +01:00
/**
 * Dispatches to the visitor's overload for bang statements.
 *
 * \param visitor Visitor to call; it is dereferenced without a null check.
 */
void bang_statement::accept(parser_visitor *visitor)
{
    (*visitor).visit(this);
}
/**
 * \return The expression owned by this statement. The owning pointer is
 *         dereferenced without a null check.
 */
expression& bang_statement::body()
{
    return *this->m_body;
}
2024-03-10 08:50:55 +01:00
/**
 * Creates a compound statement node.
 *
 * \param statements Nested statements; moved into the node.
 */
compound_statement::compound_statement(
        std::vector<std::unique_ptr<statement>>&& statements)
    : m_statements(std::move(statements))
{
}
/**
 * Dispatches to the visitor's overload for compound statements.
 *
 * \param visitor Visitor to call; it is dereferenced without a null check.
 */
void compound_statement::accept(parser_visitor *visitor)
{
    (*visitor).visit(this);
}
std::vector<std::unique_ptr<statement>>& compound_statement::statements()
{
return m_statements;
}
2024-03-14 08:52:45 +01:00
/**
 * Dispatches to the visitor's overload for assignment statements.
 *
 * \param visitor Visitor to call; it is dereferenced without a null check.
 */
void assign_statement::accept(parser_visitor *visitor)
{
    (*visitor).visit(this);
}
2024-03-14 08:52:45 +01:00
assign_statement::assign_statement(const std::string& lvalue, std::unique_ptr<expression>&& rvalue)
: m_lvalue(lvalue), m_rvalue(std::move(rvalue))
{
}
std::string& assign_statement::lvalue() noexcept
{
return m_lvalue;
}
/**
 * \return The assigned expression. The owning pointer is dereferenced
 *         without a null check.
 */
expression& assign_statement::rvalue()
{
    return *this->m_rvalue;
}
/**
 * Creates a parser that reads from the given lexer.
 *
 * \param tokens Lexer to consume; it is moved into the parser.
 */
parser::parser(lexer&& tokens)
    : iterator(std::move(tokens))
{
}
std::unique_ptr<block> parser::parse()
2024-03-01 10:13:55 +01:00
{
return parse_block();
2024-03-01 10:13:55 +01:00
}
2024-03-14 08:52:45 +01:00
const std::list<std::unique_ptr<error>>& parser::errors() const noexcept
{
return iterator.errors();
}
std::unique_ptr<expression> parser::parse_factor()
2024-03-01 10:13:55 +01:00
{
2024-03-14 08:52:45 +01:00
if (iterator->of() == source::token::type::identifier)
2024-03-01 10:13:55 +01:00
{
2024-03-14 08:52:45 +01:00
auto result = std::make_unique<variable_expression>(iterator->identifier());
++iterator;
return result;
2024-03-01 10:13:55 +01:00
}
2024-03-14 08:52:45 +01:00
else if (iterator->of() == source::token::token::type::number)
2024-03-01 10:13:55 +01:00
{
2024-03-14 08:52:45 +01:00
auto result = std::make_unique<integer_literal>(iterator->number());
++iterator;
return result;
2024-03-01 10:13:55 +01:00
}
2024-03-14 08:52:45 +01:00
else if (iterator->of() == source::token::type::left_paren)
2024-03-01 10:13:55 +01:00
{
2024-03-14 08:52:45 +01:00
++iterator;
2024-03-01 10:13:55 +01:00
auto expression = parse_expression();
2024-03-01 10:13:55 +01:00
2024-03-14 08:52:45 +01:00
++iterator;
2024-03-01 10:13:55 +01:00
return expression;
}
return nullptr;
}
std::unique_ptr<expression> parser::parse_term()
2024-03-01 10:13:55 +01:00
{
auto lhs = parse_factor();
2024-03-14 08:52:45 +01:00
if (lhs == nullptr || iterator.current().of() != source::token::type::factor_operator)
2024-03-03 13:11:39 +01:00
{
return lhs;
}
2024-03-14 08:52:45 +01:00
while (iterator->of() == source::token::type::factor_operator)
2024-03-03 13:11:39 +01:00
{
2024-03-14 08:52:45 +01:00
auto _operator = iterator->identifier()[0];
++iterator;
2024-03-09 08:36:07 +01:00
auto rhs = parse_factor();
lhs = std::make_unique<binary_expression>(std::move(lhs),
std::move(rhs), _operator);
2024-03-03 13:11:39 +01:00
}
2024-03-09 08:36:07 +01:00
return lhs;
2024-03-01 10:13:55 +01:00
}
std::unique_ptr<expression> parser::parse_expression()
2024-03-01 10:13:55 +01:00
{
auto term = parse_term();
2024-03-14 08:52:45 +01:00
if (term == nullptr || iterator.current().of() != source::token::type::term_operator)
2024-03-01 10:13:55 +01:00
{
return term;
}
2024-03-14 08:52:45 +01:00
while (iterator->of() == source::token::type::term_operator)
2024-03-01 10:13:55 +01:00
{
2024-03-14 08:52:45 +01:00
auto _operator = iterator->identifier()[0];
++iterator;
2024-03-09 08:36:07 +01:00
auto rhs = parse_term();
term = std::make_unique<binary_expression>(std::move(term),
std::move(rhs), _operator);
2024-03-01 10:13:55 +01:00
}
2024-03-09 08:36:07 +01:00
return term;
2024-03-01 10:13:55 +01:00
}
std::unique_ptr<definition> parser::parse_definition()
2024-03-01 10:13:55 +01:00
{
2024-03-14 08:52:45 +01:00
auto definition_identifier = iterator.advance(token::type::identifier);
2024-03-01 10:13:55 +01:00
2024-03-10 08:50:55 +01:00
if (!definition_identifier.has_value())
{
return nullptr;
}
2024-03-14 08:52:45 +01:00
if (!iterator.skip(token::type::equals))
2024-03-10 08:50:55 +01:00
{
return nullptr;
}
2024-03-01 10:13:55 +01:00
2024-03-14 08:52:45 +01:00
if (iterator->of() == source::token::type::number)
2024-03-01 10:13:55 +01:00
{
2024-03-10 08:50:55 +01:00
auto result = std::make_unique<definition>(definition_identifier.value().get().identifier(),
2024-03-14 08:52:45 +01:00
std::make_unique<integer_literal>(iterator->number()));
++iterator;
return result;
2024-03-01 10:13:55 +01:00
}
return nullptr;
}
2024-03-10 08:50:55 +01:00
std::unique_ptr<declaration> parser::parse_declaration()
{
2024-03-14 08:52:45 +01:00
auto declaration_identifier = iterator.advance(token::type::identifier);
2024-03-10 08:50:55 +01:00
if (!declaration_identifier.has_value())
{
return nullptr;
}
return std::make_unique<declaration>(declaration_identifier.value().get().identifier());
}
std::unique_ptr<statement> parser::parse_statement()
2024-03-01 10:13:55 +01:00
{
2024-03-14 08:52:45 +01:00
if (iterator.look_ahead(token::type::assignment))
{
return parse_assign_statement();
}
else if (iterator.current(token::type::bang))
2024-03-01 10:13:55 +01:00
{
2024-03-10 08:50:55 +01:00
return parse_bang_statement();
2024-03-01 10:13:55 +01:00
}
2024-03-14 08:52:45 +01:00
else if (iterator.current(token::type::begin))
2024-03-10 08:50:55 +01:00
{
return parse_compound_statement();
}
2024-03-14 08:52:45 +01:00
iterator.add_error(*iterator);
2024-03-01 10:13:55 +01:00
return nullptr;
}
2024-03-10 08:50:55 +01:00
std::unique_ptr<bang_statement> parser::parse_bang_statement()
2024-03-01 10:13:55 +01:00
{
2024-03-14 08:52:45 +01:00
if (!iterator.advance(token::type::bang))
2024-03-10 08:50:55 +01:00
{
return nullptr;
}
auto bang_body = parse_expression();
2024-03-01 10:13:55 +01:00
2024-03-10 08:50:55 +01:00
if (bang_body != nullptr)
{
return std::make_unique<bang_statement>(std::move(bang_body));
}
return nullptr;
}
std::unique_ptr<compound_statement> parser::parse_compound_statement()
{
2024-03-14 08:52:45 +01:00
if (!iterator.advance(token::type::begin))
2024-03-10 08:50:55 +01:00
{
return nullptr;
}
auto result = std::make_unique<compound_statement>();
std::unique_ptr<statement> next_statement;
2024-03-01 10:13:55 +01:00
2024-03-11 10:43:26 +01:00
while ((next_statement = parse_statement()) != nullptr)
2024-03-01 10:13:55 +01:00
{
2024-03-11 10:43:26 +01:00
result->statements().push_back(std::move(next_statement));
2024-03-14 08:52:45 +01:00
if (iterator->of() == token::type::semicolon)
2024-03-01 10:13:55 +01:00
{
2024-03-14 08:52:45 +01:00
++iterator;
2024-03-11 10:43:26 +01:00
}
2024-03-14 08:52:45 +01:00
else if (iterator->of() == token::type::end)
2024-03-11 10:43:26 +01:00
{
2024-03-14 08:52:45 +01:00
++iterator;
2024-03-11 10:43:26 +01:00
break;
}
else
{
2024-03-14 08:52:45 +01:00
iterator.add_error(*iterator);
2024-03-11 10:43:26 +01:00
break;
2024-03-01 10:13:55 +01:00
}
2024-03-10 08:50:55 +01:00
}
return result;
}
2024-03-14 08:52:45 +01:00
/**
 * Parses an assignment: an identifier, the assignment token, and an
 * expression.
 *
 * \return The statement node, or a null pointer if any of the three
 *         parts is missing.
 */
std::unique_ptr<assign_statement> parser::parse_assign_statement()
{
    auto target = iterator.advance(token::type::identifier);
    if (!target.has_value())
    {
        return nullptr;
    }
    if (!iterator.skip(token::type::assignment))
    {
        return nullptr;
    }
    auto assigned = parse_expression();

    if (assigned != nullptr)
    {
        return std::make_unique<assign_statement>(target.value().get().identifier(),
                std::move(assigned));
    }
    return nullptr;
}
2024-03-10 08:50:55 +01:00
std::vector<std::unique_ptr<definition>> parser::parse_definitions()
{
std::vector<std::unique_ptr<definition>> definitions;
2024-03-14 08:52:45 +01:00
if (iterator->of() != token::type::let)
2024-03-10 08:50:55 +01:00
{
return definitions;
}
2024-03-14 08:52:45 +01:00
++iterator; // Skip const.
2024-03-10 08:50:55 +01:00
std::unique_ptr<definition> parsed_definition;
while ((parsed_definition = parse_definition()) != nullptr)
{
definitions.push_back(std::move(parsed_definition));
2024-03-01 10:13:55 +01:00
2024-03-14 08:52:45 +01:00
if (iterator->of() == source::token::type::comma)
2024-03-01 10:13:55 +01:00
{
2024-03-14 08:52:45 +01:00
++iterator;
2024-03-01 10:13:55 +01:00
}
2024-03-14 08:52:45 +01:00
else if (iterator->of() == source::token::type::semicolon)
2024-03-01 10:13:55 +01:00
{
2024-03-14 08:52:45 +01:00
++iterator;
2024-03-10 08:50:55 +01:00
break;
}
else
{
2024-03-14 08:52:45 +01:00
iterator.add_error(*iterator);
2024-03-10 08:50:55 +01:00
break;
2024-03-01 10:13:55 +01:00
}
}
return definitions;
}
2024-03-10 08:50:55 +01:00
std::vector<std::unique_ptr<declaration>> parser::parse_declarations()
2024-03-01 10:13:55 +01:00
{
2024-03-10 08:50:55 +01:00
std::vector<std::unique_ptr<declaration>> declarations;
2024-03-14 08:52:45 +01:00
if (iterator->of() != token::type::var)
2024-03-01 10:13:55 +01:00
{
2024-03-10 08:50:55 +01:00
return declarations;
}
2024-03-14 08:52:45 +01:00
++iterator; // Skip var.
2024-03-10 08:50:55 +01:00
std::unique_ptr<declaration> parsed_declaration;
while ((parsed_declaration = parse_declaration()) != nullptr)
{
declarations.push_back(std::move(parsed_declaration));
2024-03-14 08:52:45 +01:00
if (iterator->of() == token::type::comma)
2024-03-10 08:50:55 +01:00
{
2024-03-14 08:52:45 +01:00
++iterator;
2024-03-10 08:50:55 +01:00
}
2024-03-14 08:52:45 +01:00
else if (iterator->of() == token::type::semicolon)
2024-03-10 08:50:55 +01:00
{
2024-03-14 08:52:45 +01:00
++iterator;
2024-03-10 08:50:55 +01:00
break;
}
else
{
2024-03-14 08:52:45 +01:00
iterator.add_error(*iterator);
2024-03-10 08:50:55 +01:00
break;
}
2024-03-01 10:13:55 +01:00
}
2024-03-10 08:50:55 +01:00
return declarations;
}
std::unique_ptr<block> parser::parse_block()
{
auto definitions = parse_definitions();
auto declarations = parse_declarations();
auto parsed_statement = parse_statement();
if (parsed_statement == nullptr)
2024-03-01 10:13:55 +01:00
{
return nullptr;
}
2024-03-10 08:50:55 +01:00
return std::make_unique<block>(std::move(definitions),
std::move(declarations), std::move(parsed_statement));
}
2024-03-01 10:13:55 +01:00
}