Add Simple Parsing implementations for basic parsers

This commit is contained in:
Jan 2021-03-09 11:04:04 +01:00
parent 8d9080066f
commit 88ff98f334
14 changed files with 503 additions and 0 deletions

View File

@ -0,0 +1,65 @@
#include "ParserInputStream.h"
#include <sstream>
ParserInputStream::ParserInputStream(std::istream& stream, std::string fileName)
: m_stream(stream),
m_file_name(std::move(fileName)),
m_line_number(1)
{
}
ParserLine ParserInputStream::NextLine()
{
std::ostringstream str;
auto hasLength = false;
auto c = m_stream.get();
while (c != EOF)
{
switch (c)
{
case '\r':
c = m_stream.get();
if (c == '\n')
return ParserLine(m_file_name, m_line_number++, str.str());
str << '\r';
hasLength = true;
continue;
case '\n':
return ParserLine(m_file_name, m_line_number++, str.str());
default:
str << static_cast<char>(c);
hasLength = true;
break;
}
c = m_stream.get();
}
if (hasLength)
return ParserLine(m_file_name, m_line_number, str.str());
return ParserLine();
}
bool ParserInputStream::IncludeFile(const std::string& filename)
{
return false;
}
void ParserInputStream::PopCurrentFile()
{
}
bool ParserInputStream::IsOpen() const
{
return !m_stream.eof();
}
bool ParserInputStream::Eof() const
{
return !m_stream.eof();
}

View File

@ -0,0 +1,21 @@
#pragma once
#include <istream>
#include "Parsing/IParserLineStream.h"
class ParserInputStream final : public IParserLineStream
{
std::istream& m_stream;
std::string m_file_name;
int m_line_number;
public:
ParserInputStream(std::istream& stream, std::string fileName);
ParserLine NextLine() override;
bool IncludeFile(const std::string& filename) override;
void PopCurrentFile() override;
_NODISCARD bool IsOpen() const override;
_NODISCARD bool Eof() const override;
};

View File

@ -0,0 +1,14 @@
#include "SimpleMatcherCharacter.h"
SimpleMatcherCharacter::SimpleMatcherCharacter(const char c)
: m_char(c)
{
}
MatcherResult<SimpleParserValue> SimpleMatcherCharacter::CanMatch(ILexer<SimpleParserValue>* lexer, const unsigned tokenOffset)
{
const auto& token = lexer->GetToken(tokenOffset);
return token.m_type == SimpleParserValueType::CHARACTER && token.CharacterValue() == m_char
? MatcherResult<SimpleParserValue>::Match(1)
: MatcherResult<SimpleParserValue>::NoMatch();
}

View File

@ -0,0 +1,15 @@
#pragma once
#include "Parsing/Simple/SimpleParserValue.h"
#include "Parsing/Matcher/AbstractMatcher.h"
class SimpleMatcherCharacter final : public AbstractMatcher<SimpleParserValue>
{
char m_char;
protected:
MatcherResult<SimpleParserValue> CanMatch(ILexer<SimpleParserValue>* lexer, unsigned tokenOffset) override;
public:
explicit SimpleMatcherCharacter(char c);
};

View File

@ -0,0 +1,40 @@
#include "SimpleMatcherFactory.h"
#include "SimpleMatcherCharacter.h"
#include "SimpleMatcherKeyword.h"
#include "SimpleMatcherValueType.h"
SimpleMatcherFactory::SimpleMatcherFactory(const IMatcherForLabelSupplier<SimpleParserValue>* labelSupplier)
: AbstractMatcherFactory(labelSupplier)
{
}
MatcherFactoryWrapper<SimpleParserValue> SimpleMatcherFactory::Type(SimpleParserValueType type) const
{
return MatcherFactoryWrapper<SimpleParserValue>(std::make_unique<SimpleMatcherValueType>(type));
}
MatcherFactoryWrapper<SimpleParserValue> SimpleMatcherFactory::Keyword(std::string value) const
{
return MatcherFactoryWrapper<SimpleParserValue>(std::make_unique<SimpleMatcherKeyword>(std::move(value)));
}
MatcherFactoryWrapper<SimpleParserValue> SimpleMatcherFactory::Identifier() const
{
return MatcherFactoryWrapper<SimpleParserValue>(std::make_unique<SimpleMatcherValueType>(SimpleParserValueType::IDENTIFIER));
}
MatcherFactoryWrapper<SimpleParserValue> SimpleMatcherFactory::Integer() const
{
return MatcherFactoryWrapper<SimpleParserValue>(std::make_unique<SimpleMatcherValueType>(SimpleParserValueType::INTEGER));
}
MatcherFactoryWrapper<SimpleParserValue> SimpleMatcherFactory::FloatingPoint() const
{
return MatcherFactoryWrapper<SimpleParserValue>(std::make_unique<SimpleMatcherValueType>(SimpleParserValueType::FLOATING_POINT));
}
MatcherFactoryWrapper<SimpleParserValue> SimpleMatcherFactory::Char(char c) const
{
return MatcherFactoryWrapper<SimpleParserValue>(std::make_unique<SimpleMatcherCharacter>(c));
}

View File

@ -0,0 +1,19 @@
#pragma once
#include <string>
#include "Parsing/Simple/SimpleParserValue.h"
#include "Parsing/Matcher/AbstractMatcherFactory.h"
class SimpleMatcherFactory final : public AbstractMatcherFactory<SimpleParserValue>
{
public:
explicit SimpleMatcherFactory(const IMatcherForLabelSupplier<SimpleParserValue>* labelSupplier);
_NODISCARD MatcherFactoryWrapper<SimpleParserValue> Type(SimpleParserValueType type) const;
_NODISCARD MatcherFactoryWrapper<SimpleParserValue> Keyword(std::string value) const;
_NODISCARD MatcherFactoryWrapper<SimpleParserValue> Identifier() const;
_NODISCARD MatcherFactoryWrapper<SimpleParserValue> Integer() const;
_NODISCARD MatcherFactoryWrapper<SimpleParserValue> FloatingPoint() const;
_NODISCARD MatcherFactoryWrapper<SimpleParserValue> Char(char c) const;
};

View File

@ -0,0 +1,16 @@
#include "SimpleMatcherKeyword.h"
SimpleMatcherKeyword::SimpleMatcherKeyword(std::string value)
: m_value(std::move(value))
{
const std::hash<std::string> hash;
m_hash = hash(m_value);
}
MatcherResult<SimpleParserValue> SimpleMatcherKeyword::CanMatch(ILexer<SimpleParserValue>* lexer, const unsigned tokenOffset)
{
const auto& token = lexer->GetToken(tokenOffset);
return token.m_type == SimpleParserValueType::IDENTIFIER && token.IdentifierHash() == m_hash && token.IdentifierValue() == m_value
? MatcherResult<SimpleParserValue>::Match(1)
: MatcherResult<SimpleParserValue>::NoMatch();
}

View File

@ -0,0 +1,18 @@
#pragma once
#include <string>
#include "Parsing/Simple/SimpleParserValue.h"
#include "Parsing/Matcher/AbstractMatcher.h"
class SimpleMatcherKeyword final : public AbstractMatcher<SimpleParserValue>
{
size_t m_hash;
std::string m_value;
protected:
MatcherResult<SimpleParserValue> CanMatch(ILexer<SimpleParserValue>* lexer, unsigned tokenOffset) override;
public:
explicit SimpleMatcherKeyword(std::string value);
};

View File

@ -0,0 +1,13 @@
#include "SimpleMatcherValueType.h"
SimpleMatcherValueType::SimpleMatcherValueType(const SimpleParserValueType type)
: m_type(type)
{
}
MatcherResult<SimpleParserValue> SimpleMatcherValueType::CanMatch(ILexer<SimpleParserValue>* lexer, const unsigned tokenOffset)
{
return lexer->GetToken(tokenOffset).m_type == m_type
? MatcherResult<SimpleParserValue>::Match(1)
: MatcherResult<SimpleParserValue>::NoMatch();
}

View File

@ -0,0 +1,15 @@
#pragma once
#include "Parsing/Simple/SimpleParserValue.h"
#include "Parsing/Matcher/AbstractMatcher.h"
class SimpleMatcherValueType final : public AbstractMatcher<SimpleParserValue>
{
SimpleParserValueType m_type;
protected:
MatcherResult<SimpleParserValue> CanMatch(ILexer<SimpleParserValue>* lexer, unsigned tokenOffset) override;
public:
explicit SimpleMatcherValueType(SimpleParserValueType type);
};

View File

@ -0,0 +1,44 @@
#include "SimpleLexer.h"
SimpleLexer::SimpleLexer(IParserLineStream* stream)
: AbstractLexer(stream)
{
}
SimpleParserValue SimpleLexer::GetNextToken()
{
auto c = NextChar();
while (isspace(c))
c = NextChar();
if(c == EOF)
return SimpleParserValue::EndOfFile(TokenPos());
if (c == '\"')
return SimpleParserValue::String(GetPreviousCharacterPos(), new std::string(ReadString()));
const auto pos = GetPreviousCharacterPos();
if (isdigit(c))
{
bool isFloatingPointValue;
double doubleValue;
int integerValue;
ReadNumber(isFloatingPointValue, doubleValue, integerValue);
if (isFloatingPointValue)
return SimpleParserValue::FloatingPoint(pos, doubleValue);
return SimpleParserValue::Integer(pos, integerValue);
}
if (isalpha(c) || c == '_')
{
auto identifier = ReadIdentifier();
return SimpleParserValue::Identifier(pos, new std::string(std::move(identifier)));
}
return SimpleParserValue::Character(pos, static_cast<char>(c));
}

View File

@ -0,0 +1,13 @@
#pragma once
#include "SimpleParserValue.h"
#include "Parsing/Impl/AbstractLexer.h"
class SimpleLexer final : public AbstractLexer<SimpleParserValue>
{
protected:
SimpleParserValue GetNextToken() override;
public:
explicit SimpleLexer(IParserLineStream* stream);
};

View File

@ -0,0 +1,141 @@
#include "SimpleParserValue.h"
#include <cassert>
SimpleParserValue SimpleParserValue::Invalid(const TokenPos pos)
{
SimpleParserValue pv(pos, SimpleParserValueType::INVALID);
return pv;
}
SimpleParserValue SimpleParserValue::EndOfFile(const TokenPos pos)
{
SimpleParserValue pv(pos, SimpleParserValueType::END_OF_FILE);
return pv;
}
SimpleParserValue SimpleParserValue::Character(const TokenPos pos, const char c)
{
SimpleParserValue pv(pos, SimpleParserValueType::CHARACTER);
pv.m_value.char_value = c;
return pv;
}
SimpleParserValue SimpleParserValue::Integer(const TokenPos pos, const int value)
{
SimpleParserValue pv(pos, SimpleParserValueType::INTEGER);
pv.m_value.int_value = value;
return pv;
}
SimpleParserValue SimpleParserValue::FloatingPoint(const TokenPos pos, const double value)
{
SimpleParserValue pv(pos, SimpleParserValueType::FLOATING_POINT);
pv.m_value.double_value = value;
return pv;
}
SimpleParserValue SimpleParserValue::String(const TokenPos pos, std::string* stringValue)
{
SimpleParserValue pv(pos, SimpleParserValueType::STRING);
pv.m_value.string_value = stringValue;
return pv;
}
SimpleParserValue SimpleParserValue::Identifier(const TokenPos pos, std::string* identifier)
{
SimpleParserValue pv(pos, SimpleParserValueType::IDENTIFIER);
pv.m_value.string_value = identifier;
pv.m_hash = std::hash<std::string>()(*identifier);
return pv;
}
SimpleParserValue::SimpleParserValue(const TokenPos pos, const SimpleParserValueType type)
: m_pos(pos),
m_type(type),
m_hash(0),
m_value{}
{
}
SimpleParserValue::~SimpleParserValue()
{
switch (m_type)
{
case SimpleParserValueType::STRING:
case SimpleParserValueType::IDENTIFIER:
delete m_value.string_value;
break;
default:
break;
}
m_value = ValueType();
}
SimpleParserValue::SimpleParserValue(SimpleParserValue&& other) noexcept
: m_pos(other.m_pos),
m_type(other.m_type),
m_hash(other.m_hash),
m_value(other.m_value)
{
other.m_value = ValueType();
}
SimpleParserValue& SimpleParserValue::operator=(SimpleParserValue&& other) noexcept
{
m_pos = other.m_pos;
m_type = other.m_type;
m_value = other.m_value;
m_hash = other.m_hash;
other.m_value = ValueType();
return *this;
}
bool SimpleParserValue::IsEof() const
{
return m_type == SimpleParserValueType::END_OF_FILE;
}
const TokenPos& SimpleParserValue::GetPos() const
{
return m_pos;
}
char SimpleParserValue::CharacterValue() const
{
assert(m_type == SimpleParserValueType::CHARACTER);
return m_value.char_value;
}
int SimpleParserValue::IntegerValue() const
{
assert(m_type == SimpleParserValueType::INTEGER);
return m_value.int_value;
}
double SimpleParserValue::FloatingPointValue() const
{
assert(m_type == SimpleParserValueType::FLOATING_POINT);
return m_value.double_value;
}
std::string& SimpleParserValue::StringValue() const
{
assert(m_type == SimpleParserValueType::STRING);
return *m_value.string_value;
}
std::string& SimpleParserValue::IdentifierValue() const
{
assert(m_type == SimpleParserValueType::IDENTIFIER);
return *m_value.string_value;
}
size_t SimpleParserValue::IdentifierHash() const
{
assert(m_type == SimpleParserValueType::IDENTIFIER);
return m_hash;
}

View File

@ -0,0 +1,69 @@
#pragma once
#include <string>
#include "Parsing/IParserValue.h"
#include "Utils/ClassUtils.h"
#include "Parsing/TokenPos.h"
enum class SimpleParserValueType
{
// Meta tokens
INVALID,
END_OF_FILE,
// Single character
CHARACTER,
// Generic token types
INTEGER,
FLOATING_POINT,
STRING,
IDENTIFIER,
// End
MAX
};
class SimpleParserValue final : public IParserValue
{
public:
TokenPos m_pos;
SimpleParserValueType m_type;
size_t m_hash;
union ValueType
{
char char_value;
int int_value;
double double_value;
std::string* string_value;
} m_value;
static SimpleParserValue Invalid(TokenPos pos);
static SimpleParserValue EndOfFile(TokenPos pos);
static SimpleParserValue Character(TokenPos pos, char c);
static SimpleParserValue Integer(TokenPos pos, int value);
static SimpleParserValue FloatingPoint(TokenPos pos, double value);
static SimpleParserValue String(TokenPos pos, std::string* stringValue);
static SimpleParserValue Identifier(TokenPos pos, std::string* identifier);
private:
SimpleParserValue(TokenPos pos, SimpleParserValueType type);
public:
~SimpleParserValue() override;
SimpleParserValue(const SimpleParserValue& other) = delete;
SimpleParserValue(SimpleParserValue&& other) noexcept;
SimpleParserValue& operator=(const SimpleParserValue& other) = delete;
SimpleParserValue& operator=(SimpleParserValue&& other) noexcept;
_NODISCARD bool IsEof() const override;
_NODISCARD const TokenPos& GetPos() const override;
_NODISCARD char CharacterValue() const;
_NODISCARD int IntegerValue() const;
_NODISCARD double FloatingPointValue() const;
_NODISCARD std::string& StringValue() const;
_NODISCARD std::string& IdentifierValue() const;
_NODISCARD size_t IdentifierHash() const;
};