remove flex/bison

This commit is contained in:
Simon 2024-07-19 01:46:06 +02:00
parent f0622cbb3f
commit ff45df6bc1
10 changed files with 13 additions and 399 deletions

View File

@ -3,27 +3,20 @@ cmake_minimum_required(VERSION 3.29)
# Declare the C++-only project "stela".
project(stela VERSION 1.0.0 LANGUAGES CXX)
# Locate the Bison and Flex tools; REQUIRED makes configuration fail if either is missing.
find_package(BISON REQUIRED)
find_package(FLEX REQUIRED)
# Generate parser.cpp in the build directory from the grammar file parser.y.
BISON_TARGET(
Parser
parser.y
${CMAKE_CURRENT_BINARY_DIR}/parser.cpp
)
# Generate lexer.cpp in the build directory from the scanner specification lexer.l.
FLEX_TARGET(
Lexer
lexer.l
${CMAKE_CURRENT_BINARY_DIR}/lexer.cpp
)
# Request C++20 and write compile_commands.json for editor/tooling use.
set (CMAKE_CXX_STANDARD 20)
set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
# NOTE(review): the build type is hard-coded to Debug here — confirm this is intended
# for all builds and not just local development.
set(CMAKE_BUILD_TYPE Debug)
# Strict warnings, with every warning promoted to an error, for both compiler families.
if (MSVC)
add_compile_options(/W4 /WX)
else()
add_compile_options(-Wall -Wextra -pedantic -Werror)
endif()
# The stela executable and its source files.
# NOTE(review): this list names both the generated Bison/Flex outputs and a literal
# parser.cpp — presumably removed and added diff lines shown together; verify against
# the real CMakeLists.txt.
add_executable(
stela
main.cpp
interpreter.cpp
command.cpp
${BISON_Parser_OUTPUTS}
${FLEX_Lexer_OUTPUTS}
parser.cpp
)
# Put both the build directory and the source directory on the include path.
include_directories(${CMAKE_CURRENT_BINARY_DIR} ${CMAKE_CURRENT_SOURCE_DIR})

View File

@ -35,7 +35,7 @@ class DoorControl derives GenericDoorControl {
operation Unlock() { this.locked = false; }
state_machine {
entry {
initial {
transition DoorControl;
}
DoorControl {

View File

@ -1,20 +0,0 @@
#include <iostream>
#include <sstream>
#include "command.hpp"
using namespace stela;
/// Render the command as a single line of the form
/// `name = [<name>], arguments = [a, b, c]`.
///
/// @return The formatted description; the argument list is rendered as `[]`
///         when the command has no arguments.
std::string Command::to_string() const
{
    std::stringstream s;
    s << "name = [" << this->m_name << "], ";
    s << "arguments = [";
    // Write the separator in front of every element except the first. This
    // replaces the old index loop, which compared a signed `int` against the
    // unsigned `size()` (a -Wsign-compare error under -Werror) and relied on
    // `size() - 1` unsigned arithmetic.
    const char* separator = "";
    for (const auto argument : this->arguments) {
        s << separator << argument;
        separator = ", ";
    }
    s << "]";
    return s.str();
}

View File

@ -1,34 +0,0 @@
#pragma once
#include <string>
#include <vector>
#include <cstdint>
#include <memory>
namespace stela {

/// A single parsed command: a name plus a (possibly empty) list of
/// unsigned 64-bit arguments.
class Command {
public:
    /// Create a command with an empty name and no arguments.
    Command() = default;

    /// Create a command called @p name that carries no arguments.
    Command(std::string name)
        : m_name(std::move(name))
    {
    }

    /// Create a command called @p name that carries @p args.
    /// Both values are taken by value and moved into the object.
    Command(std::string name, std::vector<uint64_t> args)
        : m_name(std::move(name))
        , arguments(std::move(args))
    {
    }

    /// Human-readable description of the command (defined out of line).
    std::string to_string() const;

    /// @return A copy of the command's name.
    std::string name() const { return m_name; }

private:
    std::string m_name;
    std::vector<uint64_t> arguments;
};

} // namespace stela

View File

@ -1,15 +0,0 @@
#include "interpreter.hpp"
#include "command.hpp"
#include <sstream>
using namespace stela;
std::string Interpreter::to_string() const
{
std::stringstream s;
s << "Interpreter: " << this->commands.size() << " commands received from command line.\n";
for(size_t i = 0; i < this->commands.size(); i++) {
s << " * " << this->commands[i].to_string() << '\n';
}
return s.str();
}

View File

@ -1,71 +0,0 @@
#pragma once
#include <vector>
#include "lexer.hpp"
#include "parser.hpp"
namespace stela {

class Command;

/// Front-end driver: owns the scanner, the parser and the list of commands
/// parsed so far, and keeps a running count of consumed input characters.
///
/// Parser and Lexer are friends so that they can call the private
/// bookkeeping helpers (add_command, increase_location, location).
class Interpreter {
public:
    /// Wire the lexer and parser to this interpreter and start at location 0.
    ///
    /// The initialiser list is written in the members' declaration order
    /// (lexer, parser, commands, m_location). That is the order C++ actually
    /// initialises them in, and listing them differently triggers -Wreorder,
    /// which is fatal when building with -Wall -Werror.
    Interpreter()
        : lexer(*this)
        , parser(lexer, *this)
        , commands()
        , m_location(0)
    {}

    /// Reset the location counter and run the parser.
    /// @return Whatever Parser::parse() returns.
    int parse()
    {
        this->m_location = 0;
        return this->parser.parse();
    }

    /// Reset the location counter and discard every stored command.
    void clear()
    {
        this->m_location = 0;
        this->commands.clear();
    }

    /// Multi-line description of the stored commands (defined out of line).
    std::string to_string() const;

    /// Switch scanner input stream. Default is standard input (std::cin).
    /// It will also reset AST, i.e. the stored commands are discarded.
    /// @param is New input stream for the lexer; the output stream argument
    ///           of switch_streams is passed as nullptr.
    void switch_input_stream(std::istream* is)
    {
        this->lexer.switch_streams(is, nullptr);
        this->commands.clear();
    }

    friend class Parser;
    friend class Lexer;

private:
    /// Append a copy of @p command to the stored command list.
    void add_command(const Command& command)
    {
        this->commands.push_back(command);
    }

    /// Advance the location counter by @p location and log the new total
    /// to standard output.
    void increase_location(unsigned int location)
    {
        this->m_location += location;
        std::cout << "increase_location(): "
                  << location << ", total = " << this->m_location << '\n';
    }

    /// @return The current value of the location counter.
    unsigned int location() const
    {
        return this->m_location;
    }

private:
    // Declaration order matters: parser is constructed from lexer, so lexer
    // must be declared (and therefore initialised) first.
    Lexer lexer;
    Parser parser;
    std::vector<Command> commands;
    unsigned int m_location;
};

} // namespace stela

View File

@ -1,29 +0,0 @@
#pragma once
#if !defined(yyFlexLexerOnce)
#undef yyFlexLexer
#define yyFlexLexer stela_FlexLexer
#include <FlexLexer.h>
#endif
#undef YY_DECL
#define YY_DECL stela::Parser::symbol_type stela::Lexer::next_token()
#include "parser.hpp"
namespace stela {
class Interpreter;
class Lexer : public yyFlexLexer {
public:
Lexer(Interpreter& interpreter) : interpreter(interpreter) {}
virtual ~Lexer() = default;
virtual stela::Parser::symbol_type next_token();
private:
Interpreter& interpreter;
};
}

75
lexer.l
View File

@ -1,75 +0,0 @@
%{
#include <iostream>
#include <cstdlib>
#include "lexer.hpp"
#include "interpreter.hpp"
#include "parser.hpp"
#include "location.hh"
// The original yyterminate() macro returns int. Since we're using Bison 3 variants
// as tokens, we must redefine it so that it returns `Parser::symbol_type` instead of `int`.
#define yyterminate() stela::Parser::make_END(stela::location());
// This will track current scanner location.
// Action is called when length of the token is known.
#define YY_USER_ACTION this->interpreter.increase_location(yyleng);
// !!!WARNING!!!
// The location API is used, but the location is not initialized, 'cause I'm lazy. When making
// a token with a make_{something} method you can pass a detailed token location. The current
// location is accessible with the interpreter.location() method. All puzzle elements are there -
// just pass the location value in every action code block below. I'm going to waste more time
// writing this excuse than putting this boilerplate below...
//
// The location class can be found in the location.hh and position.hh files. It's just a bit too
// much boilerplate for this small example. Bummer.
%}
%option nodefault noyywrap noyylineno c++ yyclass="Lexer" prefix="stela_"
%%
[a-z]+ {
// Identifier: a run of lowercase ASCII letters. The matched text becomes
// the value of the STRING token.
std::cout << "Scanner: identifier [" << yytext << "]\n";
return stela::Parser::make_STRING(yytext, stela::location());
}
\( {
// Opening parenthesis.
std::cout << "Scanner: '('\n";
return stela::Parser::make_LEFTPAR(stela::location());
}
\) {
// Closing parenthesis.
std::cout << "Scanner: ')'\n";
return stela::Parser::make_RIGHTPAR(stela::location());
}
; {
// Semicolon.
std::cout << "Scanner: ';'\n";
return stela::Parser::make_SEMICOLON(stela::location());
}
, {
// Comma.
std::cout << "Scanner: ','\n";
return stela::Parser::make_COMMA(stela::location());
}
[\n\t ] {
// Newlines, tabs and spaces: no token is returned for them.
//cout << "Scanner: whitechar (ignored)" << endl;
}
[1-9][0-9]* {
// Decimal number whose first digit is 1-9, so a lone "0" is not matched by
// this rule. The text is converted with strtoull in base 10.
// NOTE(review): no overflow/errno check is done on the conversion.
std::cout << "Scanner: decimal number: " << yytext << '\n';
uint64_t number = strtoull(yytext, 0, 10);
return stela::Parser::make_NUMBER(number, stela::location());
}
. {
// Any other single character: it is logged and no token is returned.
std::cout << "Scanner: unknown character [" << yytext << "]\n";
}
<<EOF>> { /* End of input: hand back the value produced by yyterminate(). */ return yyterminate(); }
%%

View File

@ -1,12 +1,3 @@
#include "interpreter.hpp"
#include "lexer.hpp"
#include "parser.hpp"
#include <iostream>
/// Program entry point: run the interpreter's parser once, report the
/// result on standard output and use it as the process exit status.
int main()
{
    stela::Interpreter interpreter;
    const int result = interpreter.parse();
    // Message text fixed: it previously read "Prase completed ...".
    std::cout << "Parse completed with result: " << result << '\n';
    return result;
}
/// Program entry point. It currently does nothing and exits with status 0.
int main()
{
    return 0;
}

126
parser.y
View File

@ -1,126 +0,0 @@
%skeleton "lalr1.cc"
%require "3.8.2"
%defines
%define api.parser.class { Parser }
%define api.token.constructor
%define api.value.type variant
%define parse.assert
%define api.namespace { stela }
%code requires {
#include <iostream>
#include <string>
#include <vector>
#include <cstdint>
#include "command.hpp"
namespace stela {
class Lexer;
class Interpreter;
}
}
%code top {
#include <iostream>
#include <cstdint>
#include "lexer.hpp"
#include "parser.hpp"
#include "interpreter.hpp"
#include "location.hh"
// Glue between the generated parser and the scanner: forwards to
// Lexer::next_token(). The second parameter is part of the signature because
// the interpreter is declared as a %lex-param, but it is not needed here, so
// it is left unnamed to avoid an unused-parameter warning (fatal under
// -Wextra -Werror).
static stela::Parser::symbol_type yylex(stela::Lexer& lexer, stela::Interpreter& /*interpreter*/)
{
    return lexer.next_token();
}
using namespace stela;
}
%lex-param { stela::Lexer& lexer }
%lex-param { stela::Interpreter& interpreter }
%parse-param { stela::Lexer& lexer }
%parse-param { stela::Interpreter& interpreter }
%locations
%define parse.trace
%define parse.error verbose
%define api.token.prefix {TOKEN_}
%token END 0 "end of file"
%token <std::string> STRING "string";
%token <uint64_t> NUMBER "number";
%token LEFTPAR "leftpar";
%token RIGHTPAR "rightpar";
%token SEMICOLON "semicolon";
%token COMMA "comma";
%type <stela::Command> command;
%type <std::vector<uint64_t>> arguments;
%start program
%%
program: {
        // Empty alternative: prints the usage banner and the first prompt,
        // then resets the interpreter state.
        std::cout << "*** RUN ***\n";
        // Help text fixed: it previously read "parmeters".
        std::cout << "Type function with list of parameters. Parameter list can be empty\n"
                  << "or contain positive integers only. Examples: \n"
                  << " * function()\n"
                  << " * function(1,2,3)\n"
                  << "Terminate listing with ; to see parsed AST\n"
                  << "Terminate parser with Ctrl-D\n";
        std::cout << '\n' << "prompt> ";
        interpreter.clear();
    }
    | program command {
        // A complete command was recognised: store it and prompt again.
        const Command &cmd = $2;
        std::cout << "command parsed, updating AST\n";
        interpreter.add_command(cmd);
        std::cout << '\n' << "prompt> ";
    }
    | program SEMICOLON {
        // A semicolon ends the listing: dump everything stored so far.
        std::cout << "*** STOP RUN ***\n";
        std::cout << interpreter.to_string() << '\n';
    }
    ;
command : STRING LEFTPAR RIGHTPAR {
        // Call with an empty argument list, e.g. `name()`.
        const std::string &name = $1;
        std::cout << "ID: " << name << '\n';
        $$ = Command(name);
    }
    | STRING LEFTPAR arguments RIGHTPAR {
        // Call with at least one argument, e.g. `name(1,2,3)`.
        const std::string &name = $1;
        const std::vector<uint64_t> &values = $3;
        std::cout << "function: " << name << ", " << values.size() << '\n';
        $$ = Command(name, values);
    }
    ;
arguments : NUMBER {
        // First argument: start a fresh one-element list.
        const uint64_t number = $1;
        $$ = std::vector<uint64_t>();
        $$.push_back(number);
        std::cout << "first argument: " << number << '\n';
    }
    | arguments COMMA NUMBER {
        // Subsequent argument: take over the storage of the list built so far
        // instead of copying it. With variant semantic values $$ starts out as
        // an empty vector, so swap() leaves the old contents in $$ in O(1);
        // the previous `$$ = args;` copied the whole list on every reduction.
        const uint64_t number = $3;
        $$.swap($1);
        $$.push_back(number);
        std::cout << "next argument: " << number << ", arg list size = " << $$.size() << '\n';
    }
    ;
%%
void stela::Parser::error(const location &loc , const std::string &message) {
// Location should be initialized inside scanner action, but is not in this example.
// Let's grab location directly from driver class.
// std::cout << "Error: " << message << '\n' << "Location: " << loc << '\n';
std::cout << "Error: " << message << '\n' << "Error location: " << interpreter.location() << '\n';
}
// vim: ts=4 sw=4 et