Cleanup, restructuring

This commit is contained in:
Hans 2021-11-11 03:02:32 +01:00
parent fc035bd7a7
commit eddfeb7bfc
7 changed files with 160 additions and 89 deletions

View file

@ -2,6 +2,7 @@ cmake_minimum_required(VERSION 3.10)
project(biscuit_interpreter)
set(CMAKE_CXX_STANDARD 20)
set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
add_executable(biscuit_interpreter src/common.hpp)

View file

@ -12,7 +12,7 @@ enum TokenType
enum ValueType
{
STRING,
DECIMAL,
NUMBER,
ANY
};

45
src/exceptions.hpp Normal file
View file

@ -0,0 +1,45 @@
#ifndef BISCUIT_INTERPRETER_EXCEPTIONS_HPP
#define BISCUIT_INTERPRETER_EXCEPTIONS_HPP
#include <exception>
#include "common.hpp"
struct MalformedTokenExcept : public std::exception
{
std::string malformed_str;
inline MalformedTokenExcept(const std::string& arg_str)
: malformed_str(arg_str) {}
};
struct UnknownKeywordExcept : public std::exception
{
std::string unknown_keyword;
inline UnknownKeywordExcept(const std::string& arg_str)
: unknown_keyword(arg_str) {}
};
struct WrongArgumentCountExcept : public std::exception
{
int expected, got;
std::string keyword_name;
inline WrongArgumentCountExcept(const std::string& _name, int _expected, int _got)
: expected(_expected), got(_got), keyword_name(_name) {}
};
struct WrongTokenExcept : public std::exception
{
enum TokenType expected, got;
std::string keyword_name, token_str;
inline WrongTokenExcept(const std::string& _keyword_name, const std::string& _token_str, const enum TokenType& _expected, const enum TokenType& _got)
: expected(_expected), got(_got), keyword_name(_keyword_name), token_str(_token_str) {}
};
struct TypeErrorExcept : public std::exception
{
enum ValueType expected, got;
std::string keyword_name, token_str;
inline TypeErrorExcept(const std::string& _keyword_name, const std::string& _token_str, const enum ValueType& _expected, const enum ValueType& _got)
: expected(_expected), got(_got), keyword_name(_keyword_name), token_str(_token_str) {}
};
#endif //BISCUIT_INTERPRETER_EXCEPTIONS_HPP

View file

@ -12,8 +12,8 @@ struct Keyword
const std::string name;
const int expected_num_args; // -1 means: 1 to infinity, in which case all args are of same type
const std::vector<TokenType> expected_token_types;
const std::vector<ValueType> expected_value_types;
const std::vector<enum TokenType> expected_token_types;
const std::vector<enum ValueType> expected_value_types;
};
extern const std::vector<Keyword> keywords;

View file

@ -1,10 +1,32 @@
#if defined(WIN32) || defined(WIN32) || defined(__WIN32)
#include <Windows.h>
#endif
#include <iostream>
#include <string>
#include <fstream>
#include <algorithm>
#include <sstream>
#include "common.hpp"
#include "exceptions.hpp"
#include "parse.hpp"
bool request_console();
// Must request console on Windows
#if defined(WIN32) || defined(WIN32) || defined(__WIN32)
bool request_console()
{
return AllocConsole();
}
#else
bool request_console()
{
return true;
}
#endif
std::ifstream get_infile(int argc, char ** argv)
{
if(argc != 2)
@ -24,40 +46,34 @@ std::ifstream get_infile(int argc, char ** argv)
return infile;
}
std::string code = \
R"del(
PRINT 10.0 |hello_world
)del";
int main(int argc, char * argv[])
{
/*
// Get the entire source code from the file
std::ifstream infile = get_infile(argc, argv);
std::string word;
std::vector<Token> tokens;
std::stringstream buffer;
buffer << infile.rdbuf();
*/
while(infile >> word)
{
try
{
Token token(word);
tokens.push_back(token);
}
catch(MalformedIdentifierExcept& exc)
{
std::cout << "Malformed identifier: '" << exc.malformed_str << "'"
<< "\nAborting..." << std::endl;
exit(EXIT_FAILURE);
}
catch(UnknownKeywordExcept& exc)
{
std::cout << "Unknown Keyword: '" << exc.unknown_keyword << "'"
<< "\nAborting..." << std::endl;
exit(EXIT_FAILURE);
}
catch(WrongTokenExcept& exc)
{
std::cout << "Wrong symbol type\n Aborting..." << std::endl;
exit(EXIT_FAILURE);
}
}
// On Windows, we have to explicitly request a console
/*if(!request_console())
{
std::cerr << "Failed to get console!" << std::endl;
exit(EXIT_FAILURE);
}*/
Instruction instr(tokens);
instr.print();
std::cerr << "POOP" << std::endl;
std::vector<Instruction> instructions = parse_instructions(code);
std::cerr << "Number of instructions parsed: " << instructions.size() << std::endl;
for(auto& instr : instructions)
instr.print();
return 0;
}

View file

@ -1,21 +1,72 @@
#include <iostream>
#include <exception>
#include <algorithm>
#include <vector>
#include "exceptions.hpp"
#include "keywords.hpp"
#include "parse.hpp"
#include "common.hpp"
static const std::string blank_space = "\t ";
static const std::string line_end = "\n";
// turn a line (one instruction) into tokens
std::vector<Token> tokenize_line(const std::string& line)
{
std::vector<Token> tokens;
// find all individual tokens
std::size_t end, begin = line.find_first_not_of(blank_space, 0);
while(begin != std::string::npos)
{
end = line.find_first_of(blank_space, begin);
std::string word = line.substr(begin, end - begin);
tokens.emplace_back(word);
begin = line.find_first_not_of(blank_space, end);
}
return std::move(tokens);
}
std::vector<Instruction> parse_instructions(const std::string& code_arg)
{
// Make a copy of the code and append a line_end symbol to make sure the
// parser doesn't break on EOF
std::string code = code_arg;
code.append(line_end);
std::vector<Instruction> instructions;
std::size_t end, begin = code.find_first_not_of(line_end, 0);
while(begin != std::string::npos)
{
end = code.find_first_of(line_end, begin);
std::string line = code.substr(begin, end - begin);
std::vector<Token> tokens = tokenize_line(line);
instructions.emplace_back(tokens);
begin = code.find_first_not_of(line_end, end);
}
return std::move(instructions);
}
bool is_keyword(std::string str)
{
for(char &c : str)
c = std::tolower(c);
c = (char) std::tolower(c);
for(auto &keyword : keywords)
return std::any_of(keywords.begin(), keywords.end(),[&str](auto& keyword){
return keyword.name == str;
});
/* for(auto &keyword : keywords)
if(str == keyword.name)
return true;
return 0;
*/
}
bool is_string_literal(const std::string& str)
@ -70,7 +121,7 @@ bool Token::parse_as_literal(const std::string &str)
else if(is_decimal_literal(str))
{
type = TokenType::LITERAL;
literal_type = ValueType::DECIMAL;
literal_type = ValueType::NUMBER;
val_float = std::stof(str);
val_string = str;
return true;
@ -86,7 +137,9 @@ bool Token::parse_as_identifier(const std::string &str)
if(is_identifier(str))
{
type = TokenType::IDENTIFIER;
literal_type = ValueType::ANY;
val_string = str;
val_float = 0.0f;
return true;
}
return false;
@ -94,13 +147,9 @@ bool Token::parse_as_identifier(const std::string &str)
Token::Token(const std::string &str)
{
if (parse_as_keyword(str));
else if(parse_as_literal(str));
else if(parse_as_identifier(str));
else
{
throw MalformedIdentifierExcept(str);
}
// First try to parse as str, then as literal, then as identifier
if(!(parse_as_keyword(str) && parse_as_literal(str) && parse_as_identifier(str)))
throw MalformedTokenExcept(str); // if all fails -> malformed token
}
void Token::print() const
@ -116,7 +165,7 @@ void Token::print() const
case TokenType::LITERAL:
std::cerr << "Literal of type ";
if(literal_type == ValueType::DECIMAL)
if(literal_type == ValueType::NUMBER)
std::cerr << "decimal: " << val_float;
else if(literal_type == ValueType::STRING)
std::cerr << "string: \"" << val_string << "\"";
@ -128,8 +177,6 @@ void Token::print() const
std::cerr << std::endl;
}
Instruction::Instruction(std::vector<Token>& _token_list)
{
// move over the tokens

View file

@ -1,61 +1,21 @@
#ifndef BISCUIT_PARSE_HPP_INCLUDED
#define BISCUIT_PARSE_HPP_INCLUDED
#include <exception>
#include <string>
#include <vector>
#include "keywords.hpp"
#include "common.hpp"
struct MalformedIdentifierExcept : public std::exception
{
std::string malformed_str;
MalformedIdentifierExcept(const std::string& arg_str)
: malformed_str(arg_str) {}
};
struct UnknownKeywordExcept : public std::exception
{
std::string unknown_keyword;
UnknownKeywordExcept(const std::string& arg_str)
: unknown_keyword(arg_str) {}
};
struct WrongArgumentCountExcept : public std::exception
{
int expected, got;
std::string keyword_name;
WrongArgumentCountExcept(std::string _name, int _expected, int _got)
: expected(_expected), got(_got), keyword_name(_name) {}
};
struct WrongTokenExcept : public std::exception
{
TokenType expected, got;
std::string keyword_name, token_str;
WrongTokenExcept(std::string _keyword_name, std::string _token_str, const TokenType& _expected, const TokenType& _got)
: expected(_expected), got(_got), keyword_name(_keyword_name), token_str(_token_str) {}
};
struct TypeErrorExcept : public std::exception
{
ValueType expected, got;
std::string keyword_name, token_str;
TypeErrorExcept(std::string _keyword_name, std::string _token_str, const ValueType& _expected, const ValueType& _got)
: expected(_expected), got(_got), keyword_name(_keyword_name), token_str(_token_str) {}
};
struct Token
{
private:
bool parse_as_keyword(const std::string &str);
bool parse_as_keyword(const std::string& str);
bool parse_as_literal(const std::string &str);
bool parse_as_literal(const std::string& str);
// if a word is not a keyword or literal, it must be identifier
bool parse_as_identifier(const std::string &str);
bool parse_as_identifier(const std::string& str);
public:
enum TokenType type;
@ -63,7 +23,7 @@ public:
float val_float;
std::string val_string;
Token(const std::string &str);
Token(const std::string& str);
void print() const;
};
@ -79,4 +39,6 @@ public:
void print();
};
std::vector<Instruction> parse_instructions(const std::string& code_arg);
#endif