dc/d32/_generic_file_format_8cpp_source.html

/*

    This source file is part of Rigs of Rods

    Copyright 2022 Petr Ohlidal


    For more information, see http://www.rigsofrods.org/


    Rigs of Rods is free software: you can redistribute it and/or modify

    it under the terms of the GNU General Public License version 3, as

    published by the Free Software Foundation.


    Rigs of Rods is distributed in the hope that it will be useful,

    but WITHOUT ANY WARRANTY; without even the implied warranty of

    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

    GNU General Public License for more details.


    You should have received a copy of the GNU General Public License

    along with Rigs of Rods. If not, see <http://www.gnu.org/licenses/>.

*/


#include "GenericFileFormat.h"


#include "Application.h"

#include "Console.h"


#include <algorithm>


using namespace RoR;

using namespace Ogre;


// Type of the token currently being assembled by `DocumentParser`.
// `NONE` means no token is in progress and the next character goes to `DocumentParser::BeginToken()`.
enum class PartialToken

{

    NONE,

    COMMENT_SEMICOLON,             // Comment starting with ';'

    COMMENT_SLASH,                 // Comment starting with '//'

    COMMENT_HASH,                  // Comment starting with '#' (only with OPTION_ALLOW_HASH_COMMENTS)

    STRING_QUOTED,                 // String starting/ending with '"'

    STRING_NAKED,                  // String without '"' on either end

    STRING_NAKED_CAPTURING_SPACES, // Only for OPTION_PARENTHESES_CAPTURE_SPACES - A naked string seeking the closing ')'.

    TITLE_STRING,                  // A whole-line string, with spaces

    NUMBER_STUB_MINUS,             // Sole '-' character, may start a number or a naked string.

    NUMBER_INTEGER,                // Just digits and optionally leading '-'

    NUMBER_DECIMAL,                // Like INTEGER but already containing '.'

    NUMBER_SCIENTIFIC_STUB,        // Like DECIMAL, already containing 'e' or 'E' but not the exponent value.

    NUMBER_SCIENTIFIC_STUB_MINUS,  // Like SCIENTIFIC_STUB but with only '-' in exponent.

    NUMBER_SCIENTIFIC,             // Valid decimal number in scientific notation.

    KEYWORD,                       // Unquoted string at the start of line. Accepted characters: alphanumeric and underscore

    KEYWORD_BRACED,                // Like KEYWORD but starting with '[' and ending with ']'

    BOOL_TRUE,                     // Partial 'true'

    BOOL_FALSE,                    // Partial 'false'

    GARBAGE,                       // Text not fitting any above category, will be discarded

};


// Character-driven tokenizer which fills a `GenericDocument` with tokens.
// Usage (see `GenericDocument::loadFromDataStream()`): call `ProcessChar()` for every input
// character in order, then call `ProcessEOF()` once.
struct DocumentParser
{
    DocumentParser(GenericDocument& document, const BitMask_t option_flags, Ogre::DataStreamPtr stream)
        : doc(document), options(option_flags), datastream(stream) {}

    // ---- Config (set once by the constructor) ----

    GenericDocument&    doc;        // Document receiving the tokens and string data.
    const BitMask_t     options;    // Combination of `GenericDocument::OPTION_*` flags.
    Ogre::DataStreamPtr datastream; // The parser itself only queries its name (for console messages).

    // ---- State ----

    std::vector<char>   tok;                 // Text of the token in progress.
    size_t              line_num{ 0 };       // Incremented on every '\n'; starts at 0.
    size_t              line_pos{ 0 };       // Reset to 0 on every '\n'; '\r' is not counted.
    PartialToken        partial_tok_type{ PartialToken::NONE };
    bool                title_found{ false }; // Only for OPTION_FIRST_LINE_IS_TITLE

    // ---- Entry points ----

    void ProcessChar(const char c);
    void ProcessEOF();

    // ---- Per-state character handlers (dispatched from `ProcessChar()`) ----

    void BeginToken(const char c);
    void UpdateComment(const char c);
    void UpdateString(const char c);
    void UpdateNumber(const char c);
    void UpdateBool(const char c);
    void UpdateKeyword(const char c);
    void UpdateTitle(const char c); // Only for OPTION_FIRST_LINE_IS_TITLE
    void UpdateGarbage(const char c);

    // ---- Helpers: re-typing and emitting the token in progress ----

    void ProcessSeparatorWithinBool();
    void DiscontinueBool();
    void DiscontinueNumber();
    void DiscontinueKeyword();
    void FlushStringishToken(RoR::TokenType type);
    void FlushNumericToken();
};


void DocumentParser::BeginToken(const char c)

{

    switch (c)

    {

    case '\r':

        break;


    case ' ':

    case ',':

    case '\t':

        line_pos++;

        break;


    case ':':

        if (options & GenericDocument::OPTION_ALLOW_SEPARATOR_COLON)

        {

            line_pos++;

        }

        else

        {

            if (options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS)

                partial_tok_type = PartialToken::STRING_NAKED;

            else

                partial_tok_type = PartialToken::GARBAGE;

            tok.push_back(c);

            line_pos++;

        }

        break;


    case '=':

        if (options & GenericDocument::OPTION_ALLOW_SEPARATOR_EQUALS)

        {

            line_pos++;

        }

        else

        {

            if (options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS)

                partial_tok_type = PartialToken::STRING_NAKED;

            else

                partial_tok_type = PartialToken::GARBAGE;

            tok.push_back(c);

            line_pos++;

        }

        break;


    case '\n':

        doc.tokens.push_back({ TokenType::LINEBREAK, 0.f });

        line_num++;

        line_pos = 0;

        break;


    case ';':

        partial_tok_type = PartialToken::COMMENT_SEMICOLON;

        line_pos++;

        break;


    case '/':

        if (options & GenericDocument::OPTION_ALLOW_SLASH_COMMENTS)

        {

            partial_tok_type = PartialToken::COMMENT_SLASH;

        }

        else

        {

            if (options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS)

                partial_tok_type = PartialToken::STRING_NAKED;

            else

                partial_tok_type = PartialToken::GARBAGE;

            tok.push_back(c);

        }

        line_pos++;

        break;


    case '#':

        if (options & GenericDocument::OPTION_ALLOW_HASH_COMMENTS)

        {

            partial_tok_type = PartialToken::COMMENT_HASH;

        }

        else

        {

            if (options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS)

                partial_tok_type = PartialToken::STRING_NAKED;

            else

                partial_tok_type = PartialToken::GARBAGE;

            tok.push_back(c);

        }

        line_pos++;

        break;


    case '[':

        if (options & GenericDocument::OPTION_ALLOW_BRACED_KEYWORDS)

        {

            partial_tok_type = PartialToken::KEYWORD_BRACED;

        }

        else

        {

            if (options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS)

                partial_tok_type = PartialToken::STRING_NAKED;

            else

                partial_tok_type = PartialToken::GARBAGE;

        }

        tok.push_back(c);

        line_pos++;

        break;


    case '"':

        partial_tok_type = PartialToken::STRING_QUOTED;

        line_pos++;

        break;


    case '.':

        tok.push_back(c);

        partial_tok_type = PartialToken::NUMBER_DECIMAL;

        line_pos++;

        break;


    case 't':

        tok.push_back(c);

        partial_tok_type = PartialToken::BOOL_TRUE;

        line_pos++;

        break;


    case 'f':

        tok.push_back(c);

        partial_tok_type = PartialToken::BOOL_FALSE;

        line_pos++;

        break;


    case '0':

    case '1':

    case '2':

    case '3':

    case '4':

    case '5':

    case '6':

    case '7':

    case '8':

    case '9':

        partial_tok_type = PartialToken::NUMBER_INTEGER;

        tok.push_back(c);

        line_pos++;

        break;


    case '-':

        partial_tok_type = PartialToken::NUMBER_STUB_MINUS;

        tok.push_back(c);

        line_pos++;

        break;


    default:

        if (isalpha(c) &&

            (doc.tokens.size() == 0 || doc.tokens.back().type == TokenType::LINEBREAK)) // on line start?

        {

            tok.push_back(c);

            partial_tok_type = PartialToken::KEYWORD;

        }

        else if (options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS)

        {

            tok.push_back(c);

            partial_tok_type = PartialToken::STRING_NAKED;

        }

        else

        {

            partial_tok_type = PartialToken::GARBAGE;

            tok.push_back(c);

        }

        line_pos++;

        break;

    }


    if (options & GenericDocument::OPTION_FIRST_LINE_IS_TITLE

        && !title_found

        && (doc.tokens.size() == 0 || doc.tokens.back().type == TokenType::LINEBREAK)

        && partial_tok_type != PartialToken::NONE

        && partial_tok_type != PartialToken::COMMENT_SEMICOLON

        && partial_tok_type != PartialToken::COMMENT_SLASH)

    {

        title_found = true;

        partial_tok_type = PartialToken::TITLE_STRING;

    }


    if (partial_tok_type == PartialToken::GARBAGE)

    {

        App::GetConsole()->putMessage(Console::CONSOLE_MSGTYPE_INFO, Console::CONSOLE_SYSTEM_WARNING,

            fmt::format("{}, line {}, pos {}: stray character '{}'", datastream->getName(), line_num, line_pos, c));

    }

}


// Feeds `c` to a comment in progress (any of the COMMENT_* partial token types).
// The comment runs until '\n'; '\r' is dropped and everything else is stored, except
// the '/' characters which directly follow the opening '/' of a slash-comment.
void DocumentParser::UpdateComment(const char c)
{
    if (c == '\r')
    {
        return;
    }

    if (c == '\n')
    {
        // End of comment, end of line.
        this->FlushStringishToken(TokenType::COMMENT);
        doc.tokens.push_back({ TokenType::LINEBREAK, 0.f });
        line_num++;
        line_pos = 0;
        return;
    }

    // With COMMENT_SLASH, skip any number of leading '/'
    const bool is_leading_slash =
        (c == '/' && partial_tok_type == PartialToken::COMMENT_SLASH && tok.size() == 0);
    if (!is_leading_slash)
    {
        tok.push_back(c);
    }
    line_pos++;
}


void DocumentParser::UpdateString(const char c)

{

    switch (c)

    {

    case '\r':

        break;


    case ' ':

        if (partial_tok_type == PartialToken::STRING_QUOTED

            || partial_tok_type == PartialToken::STRING_NAKED_CAPTURING_SPACES)

        {

            tok.push_back(c);

        }

        else // (partial_tok_type == PartialToken::STRING_NAKED)

        {

            this->FlushStringishToken(TokenType::STRING);

        }

        line_pos++;

        break;


    case ',':

    case '\t':

        if (partial_tok_type == PartialToken::STRING_QUOTED)

        {

            tok.push_back(c);

        }

        else // (partial_tok_type == PartialToken::STRING_NAKED)

        {

            this->FlushStringishToken(TokenType::STRING);

        }

        line_pos++;

        break;


    case '\n':

        if (partial_tok_type == PartialToken::STRING_QUOTED)

        {

            App::GetConsole()->putMessage(Console::CONSOLE_MSGTYPE_INFO, Console::CONSOLE_SYSTEM_WARNING,

                fmt::format("{}, line {}, pos {}: quoted string interrupted by newline", datastream->getName(), line_num, line_pos));

        }

        this->FlushStringishToken(TokenType::STRING);

        // Break line

        doc.tokens.push_back({ TokenType::LINEBREAK, 0.f });

        line_num++;

        line_pos = 0;

        break;


    case ':':

        if (options & GenericDocument::OPTION_ALLOW_SEPARATOR_COLON

            && (partial_tok_type == PartialToken::STRING_NAKED || partial_tok_type == PartialToken::STRING_NAKED_CAPTURING_SPACES))

        {

            this->FlushStringishToken(TokenType::STRING);

        }

        else

        {

            tok.push_back(c);

        }

        line_pos++;

        break;


    case '=':

        if (options & GenericDocument::OPTION_ALLOW_SEPARATOR_EQUALS

            && (partial_tok_type == PartialToken::STRING_NAKED || partial_tok_type == PartialToken::STRING_NAKED_CAPTURING_SPACES))

        {

            this->FlushStringishToken(TokenType::STRING);

        }

        else

        {

            tok.push_back(c);

        }

        line_pos++;

        break;


    case '"':

        if (partial_tok_type == PartialToken::STRING_QUOTED)

        {

            this->FlushStringishToken(TokenType::STRING);

        }

        else // (partial_tok_type == PartialToken::STRING_NAKED)

        {

            partial_tok_type = PartialToken::GARBAGE;

            tok.push_back(c);

        }

        line_pos++;

        break;


    case '(':

        if (partial_tok_type == PartialToken::STRING_NAKED

            && options & GenericDocument::OPTION_PARENTHESES_CAPTURE_SPACES)

        {

            partial_tok_type = PartialToken::STRING_NAKED_CAPTURING_SPACES;

        }

        tok.push_back(c);

        line_pos++;

        break;


    case ')':

        if (partial_tok_type == PartialToken::STRING_NAKED_CAPTURING_SPACES)

        {

            partial_tok_type = PartialToken::STRING_NAKED;

        }

        tok.push_back(c);

        line_pos++;

        break;


    default:

        tok.push_back(c);

        line_pos++;

        break;

    }


    if (partial_tok_type == PartialToken::GARBAGE)

    {

        App::GetConsole()->putMessage(Console::CONSOLE_MSGTYPE_INFO, Console::CONSOLE_SYSTEM_WARNING,

            fmt::format("{}, line {}, pos {}: stray character '{}' in string", datastream->getName(), line_num, line_pos, c));

    }

}


void DocumentParser::UpdateNumber(const char c)

{

    switch (c)

    {

    case '\r':

        break;


    case ' ':

    case ',':

    case '\t':

        if (partial_tok_type == PartialToken::NUMBER_STUB_MINUS

            && options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS)

        {

            this->FlushStringishToken(TokenType::STRING);

        }

        else

        {

            this->FlushNumericToken();

        }

        line_pos++;

        break;


    case '\n':

        if (partial_tok_type == PartialToken::NUMBER_STUB_MINUS

            && options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS)

        {

            this->FlushStringishToken(TokenType::STRING);

        }

        else

        {

            this->FlushNumericToken();

        }

        // Break line

        doc.tokens.push_back({ TokenType::LINEBREAK, 0.f });

        line_num++;

        line_pos = 0;

        break;


    case ':':

        if (options & GenericDocument::OPTION_ALLOW_SEPARATOR_COLON)

        {

            if (partial_tok_type == PartialToken::NUMBER_STUB_MINUS

                && options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS)

            {

                this->FlushStringishToken(TokenType::STRING);

            }

            else

            {

                this->FlushNumericToken();

            }

        }

        else

        {

            this->DiscontinueNumber();

            tok.push_back(c);

        }

        line_pos++;

        break;


    case '=':

        if (options & GenericDocument::OPTION_ALLOW_SEPARATOR_EQUALS)

        {

            if (partial_tok_type == PartialToken::NUMBER_STUB_MINUS

                && options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS)

            {

                this->FlushStringishToken(TokenType::STRING);

            }

            else

            {

                this->FlushNumericToken();

            }

        }

        else

        {

            this->DiscontinueNumber();

            tok.push_back(c);

        }

        line_pos++;

        break;


    case '.':

        if (partial_tok_type == PartialToken::NUMBER_INTEGER

            || partial_tok_type == PartialToken::NUMBER_STUB_MINUS)

        {

            partial_tok_type = PartialToken::NUMBER_DECIMAL;

        }

        else

        {

            this->DiscontinueNumber();

        }

        tok.push_back(c);

        line_pos++;

        break;


    case 'e':

    case 'E':

        if (partial_tok_type == PartialToken::NUMBER_DECIMAL

            || partial_tok_type == PartialToken::NUMBER_INTEGER)

        {

            partial_tok_type = PartialToken::NUMBER_SCIENTIFIC_STUB;

        }

        else

        {

            this->DiscontinueNumber();

        }

        tok.push_back(c);

        line_pos++;

        break;


    case '-':

        if (partial_tok_type == PartialToken::NUMBER_SCIENTIFIC_STUB)

        {

            partial_tok_type = PartialToken::NUMBER_SCIENTIFIC_STUB_MINUS;

        }

        else

        {

            this->DiscontinueNumber();

        }

        tok.push_back(c);

        line_pos++;

        break;


    case '0':

    case '1':

    case '2':

    case '3':

    case '4':

    case '5':

    case '6':

    case '7':

    case '8':

    case '9':

        if (partial_tok_type == PartialToken::NUMBER_SCIENTIFIC_STUB

            || partial_tok_type == PartialToken::NUMBER_SCIENTIFIC_STUB_MINUS)

        {

            partial_tok_type = PartialToken::NUMBER_SCIENTIFIC;

        }

        else if (partial_tok_type == PartialToken::NUMBER_STUB_MINUS)

        {

            partial_tok_type = PartialToken::NUMBER_INTEGER;

        }

        tok.push_back(c);

        line_pos++;

        break;


    default:

        this->DiscontinueNumber();

        tok.push_back(c);

        line_pos++;

        break;


    }


    if (partial_tok_type == PartialToken::GARBAGE)

    {

        App::GetConsole()->putMessage(Console::CONSOLE_MSGTYPE_INFO, Console::CONSOLE_SYSTEM_WARNING,

            fmt::format("{}, line {}, pos {}: stray character '{}' in number", datastream->getName(), line_num, line_pos, c));

    }

}


// Handles a separator arriving while 'true'/'false' is still incomplete.
// The partial text is re-typed via `DiscontinueBool()`; a keyword or naked string is emitted,
// anything else is reported to the console and thrown away.
void DocumentParser::ProcessSeparatorWithinBool()
{
    this->DiscontinueBool();

    if (partial_tok_type == PartialToken::KEYWORD)
    {
        this->FlushStringishToken(TokenType::KEYWORD);
        return;
    }

    if (partial_tok_type == PartialToken::STRING_NAKED)
    {
        this->FlushStringishToken(TokenType::STRING);
        return;
    }

    // Discard token
    tok.push_back('\0'); // Terminate the text so it can be printed.
    App::GetConsole()->putMessage(Console::CONSOLE_MSGTYPE_INFO, Console::CONSOLE_SYSTEM_WARNING,
        fmt::format("{}, line {}, pos {}: discarding incomplete boolean token '{}'", datastream->getName(), line_num, line_pos, tok.data()));
    tok.clear();
    partial_tok_type = PartialToken::NONE;
}


void DocumentParser::UpdateBool(const char c)

{

    switch (c)

    {

    case '\r':

        break;


    case ' ':

    case ',':

    case '\t':

        this->ProcessSeparatorWithinBool();

        line_pos++;

        break;


    case '\n':

        this->ProcessSeparatorWithinBool();

        // Break line

        doc.tokens.push_back({ TokenType::LINEBREAK, 0.f });

        line_num++;

        line_pos = 0;

        break;


    case ':':

        if (options & GenericDocument::OPTION_ALLOW_SEPARATOR_COLON)

        {

            this->ProcessSeparatorWithinBool();

        }

        else

        {

            this->DiscontinueBool();

            tok.push_back(c);

        }

        line_pos++;

        break;


    case '=':

        if (options & GenericDocument::OPTION_ALLOW_SEPARATOR_EQUALS)

        {

            this->ProcessSeparatorWithinBool();

        }

        else

        {

            this->DiscontinueBool();

            tok.push_back(c);

        }

        line_pos++;

        break;


    case 'r':

        if (partial_tok_type != PartialToken::BOOL_TRUE || tok.size() != 1)

        {

            this->DiscontinueBool();

        }

        tok.push_back(c);

        line_pos++;

        break;


    case 'u':

        if (partial_tok_type != PartialToken::BOOL_TRUE || tok.size() != 2)

        {

            this->DiscontinueBool();

        }

        tok.push_back(c);

        line_pos++;

        break;


    case 'a':

        if (partial_tok_type != PartialToken::BOOL_FALSE || tok.size() != 1)

        {

            this->DiscontinueBool();

        }

        tok.push_back(c);

        line_pos++;

        break;


    case 'l':

        if (partial_tok_type != PartialToken::BOOL_FALSE || tok.size() != 2)

        {

            this->DiscontinueBool();

        }

        tok.push_back(c);

        line_pos++;

        break;


    case 's':

        if (partial_tok_type != PartialToken::BOOL_FALSE || tok.size() != 3)

        {

            this->DiscontinueBool();

        }

        tok.push_back(c);

        line_pos++;

        break;


    case 'e':

        if (partial_tok_type == PartialToken::BOOL_TRUE && tok.size() == 3)

        {

            doc.tokens.push_back({ TokenType::BOOL, 1.f });

            tok.clear();

            partial_tok_type = PartialToken::NONE;

        }

        else if (partial_tok_type == PartialToken::BOOL_FALSE && tok.size() == 4)

        {

            doc.tokens.push_back({ TokenType::BOOL, 0.f });

            tok.clear();

            partial_tok_type = PartialToken::NONE;

        }

        else

        {

            this->DiscontinueBool();

            tok.push_back(c);

        }

        line_pos++;

        break;


    default:

        this->DiscontinueBool();

        tok.push_back(c);

        line_pos++;

        break;

    }


    if (partial_tok_type == PartialToken::GARBAGE)

    {

        App::GetConsole()->putMessage(Console::CONSOLE_MSGTYPE_INFO, Console::CONSOLE_SYSTEM_WARNING,

            fmt::format("{}, line {}, pos {}: stray character '{}' in boolean", datastream->getName(), line_num, line_pos, c));

    }

}


// Re-types a partial bool which turned out not to be 'true'/'false':
// KEYWORD at the start of a line, otherwise STRING_NAKED if the options allow it, else GARBAGE.
void DocumentParser::DiscontinueBool()
{
    const bool at_line_start = doc.tokens.empty() || doc.tokens.back().type == TokenType::LINEBREAK;
    if (at_line_start)
    {
        partial_tok_type = PartialToken::KEYWORD;
        return;
    }

    partial_tok_type = (options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS)
        ? PartialToken::STRING_NAKED
        : PartialToken::GARBAGE;
}


// Re-types a partial number which turned out not to be numeric:
// STRING_NAKED if OPTION_ALLOW_NAKED_STRINGS is set, GARBAGE otherwise.
void DocumentParser::DiscontinueNumber()
{
    const bool naked_strings_allowed = (options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS) != 0;
    partial_tok_type = naked_strings_allowed ? PartialToken::STRING_NAKED : PartialToken::GARBAGE;
}


// Re-types a partial keyword which received a character keywords cannot contain:
// STRING_NAKED if OPTION_ALLOW_NAKED_STRINGS is set, GARBAGE otherwise.
void DocumentParser::DiscontinueKeyword()
{
    const bool naked_strings_allowed = (options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS) != 0;
    partial_tok_type = naked_strings_allowed ? PartialToken::STRING_NAKED : PartialToken::GARBAGE;
}


void DocumentParser::UpdateKeyword(const char c)

{

    switch (c)

    {

    case '\r':

        break;


    case ' ':

    case ',':

    case '\t':

        this->FlushStringishToken(TokenType::KEYWORD);

        line_pos++;

        break;


    case '\n':

        this->FlushStringishToken(TokenType::KEYWORD);

        // Break line

        doc.tokens.push_back({ TokenType::LINEBREAK, 0.f });

        line_num++;

        line_pos = 0;

        break;


    case ':':

        if (options & GenericDocument::OPTION_ALLOW_SEPARATOR_COLON)

        {

            this->FlushStringishToken(TokenType::KEYWORD);

        }

        else

        {

            this->DiscontinueKeyword();

            tok.push_back(c);

        }

        line_pos++;

        break;


    case '=':

        if (options & GenericDocument::OPTION_ALLOW_SEPARATOR_EQUALS)

        {

            this->FlushStringishToken(TokenType::KEYWORD);

        }

        else

        {

            this->DiscontinueKeyword();

            tok.push_back(c);

        }

        line_pos++;

        break;


    case '_':

        tok.push_back(c);

        line_pos++;

        break;


    case '(':

        if (options & GenericDocument::OPTION_ALLOW_NAKED_STRINGS)

        {

            if (options & GenericDocument::OPTION_PARENTHESES_CAPTURE_SPACES)

                partial_tok_type = PartialToken::STRING_NAKED_CAPTURING_SPACES;

            else

                partial_tok_type = PartialToken::STRING_NAKED;

        }

        else

        {

            partial_tok_type = PartialToken::GARBAGE;

        }

        tok.push_back(c);

        line_pos++;

        break;


    case ']':

        if (partial_tok_type == PartialToken::KEYWORD_BRACED)

        {

            partial_tok_type = PartialToken::KEYWORD; // Do not allow any more ']'.

        }

        else

        {

            this->DiscontinueKeyword();

        }

        tok.push_back(c);

        line_pos++;

        break;


    default:

        if (!isalnum(c))

        {

            this->DiscontinueKeyword();

        }

        tok.push_back(c);

        line_pos++;

        break;

    }


    if (partial_tok_type == PartialToken::GARBAGE)

    {

        App::GetConsole()->putMessage(Console::CONSOLE_MSGTYPE_INFO, Console::CONSOLE_SYSTEM_WARNING,

            fmt::format("{}, line {}, pos {}: stray character '{}' in keyword", datastream->getName(), line_num, line_pos, c));

    }

}


// Feeds `c` to a title in progress (TITLE_STRING, only for OPTION_FIRST_LINE_IS_TITLE).
// The title takes every character up to the end of line, except '\r', and is emitted as STRING.
void DocumentParser::UpdateTitle(const char c)
{
    if (c == '\r')
    {
        return;
    }

    if (c != '\n')
    {
        tok.push_back(c);
        line_pos++;
        return;
    }

    // End of line = end of title.
    this->FlushStringishToken(TokenType::STRING);
    doc.tokens.push_back({ TokenType::LINEBREAK, 0.f });
    line_num++;
    line_pos = 0;
}


void DocumentParser::UpdateGarbage(const char c)

{

    switch (c)

    {

    case '\r':

        break;


    case ' ':

    case ',':

    case '\t':

    case '\n':

        tok.push_back('\0');

        App::GetConsole()->putMessage(Console::CONSOLE_MSGTYPE_INFO, Console::CONSOLE_SYSTEM_WARNING,

            fmt::format("{}, line {}, pos {}: discarding garbage token '{}'", datastream->getName(), line_num, line_pos, tok.data()));

        tok.clear();

        partial_tok_type = PartialToken::NONE;

        line_pos++;

        break;


    default:

        tok.push_back(c);

        line_pos++;

        break;

    }

}


// Emits the token in progress as a text-carrying token of given `type`.
// The text is appended (NUL-terminated) to the document's string pool; the token's data
// is the offset of the text within the pool. Resets the parser to "no token in progress".
void DocumentParser::FlushStringishToken(RoR::TokenType type)
{
    const float pool_offset = (float)doc.string_pool.size(); // Where the new text will begin.
    doc.tokens.push_back({ type, pool_offset });

    tok.push_back('\0');
    doc.string_pool.insert(doc.string_pool.end(), tok.begin(), tok.end());

    tok.clear();
    partial_tok_type = PartialToken::NONE;
}


// Emits the token in progress as a number: INT if the partial type is NUMBER_INTEGER,
// FLOAT in all other cases. Resets the parser to "no token in progress".
void DocumentParser::FlushNumericToken()
{
    tok.push_back('\0'); // The converters need a terminated string.

    const bool is_integer = (partial_tok_type == PartialToken::NUMBER_INTEGER);
    doc.tokens.push_back({
        is_integer ? TokenType::INT : TokenType::FLOAT,
        is_integer ? (float)Ogre::StringConverter::parseInt(tok.data())
                   : (float)Ogre::StringConverter::parseReal(tok.data()) });

    tok.clear();
    partial_tok_type = PartialToken::NONE;
}


// Main entry point: forwards `c` to the handler matching the type of the token in progress.
void DocumentParser::ProcessChar(const char c)
{
    switch (partial_tok_type)
    {
    case PartialToken::NONE:
        this->BeginToken(c);
        return;

    case PartialToken::COMMENT_SEMICOLON:
    case PartialToken::COMMENT_SLASH:
    case PartialToken::COMMENT_HASH:
        this->UpdateComment(c);
        return;

    case PartialToken::STRING_QUOTED:
    case PartialToken::STRING_NAKED:
    case PartialToken::STRING_NAKED_CAPTURING_SPACES:
        this->UpdateString(c);
        return;

    case PartialToken::NUMBER_STUB_MINUS:
    case PartialToken::NUMBER_INTEGER:
    case PartialToken::NUMBER_DECIMAL:
    case PartialToken::NUMBER_SCIENTIFIC_STUB:
    case PartialToken::NUMBER_SCIENTIFIC_STUB_MINUS:
    case PartialToken::NUMBER_SCIENTIFIC:
        this->UpdateNumber(c);
        return;

    case PartialToken::BOOL_TRUE:
    case PartialToken::BOOL_FALSE:
        this->UpdateBool(c);
        return;

    case PartialToken::KEYWORD:
    case PartialToken::KEYWORD_BRACED:
        this->UpdateKeyword(c);
        return;

    case PartialToken::TITLE_STRING:
        this->UpdateTitle(c);
        return;

    case PartialToken::GARBAGE:
        this->UpdateGarbage(c);
        return;
    }
}


// Finishes the parsing: emits (or discards) the token which is still in progress
// and makes sure the token list ends with a LINEBREAK.
void DocumentParser::ProcessEOF()
{
    // Flush any partial token
    switch (partial_tok_type)
    {
    // These token types accept spaces, so they must be flushed explicitly.
    case PartialToken::STRING_QUOTED:
    case PartialToken::STRING_NAKED_CAPTURING_SPACES:
    case PartialToken::TITLE_STRING:
        this->FlushStringishToken(TokenType::STRING);
        break;

    case PartialToken::KEYWORD_BRACED:
        this->FlushStringishToken(TokenType::KEYWORD);
        break;

    // Comments accept spaces as well - a fake separator would merely be appended to the text
    // and a comment on the last line (with no trailing newline) would never be emitted.
    case PartialToken::COMMENT_SEMICOLON:
    case PartialToken::COMMENT_SLASH:
    case PartialToken::COMMENT_HASH:
        this->FlushStringishToken(TokenType::COMMENT);
        break;

    default:
        this->ProcessChar(' '); // Pretend processing a separator to flush any partial whitespace-incompatible token.
        break;
    }

    // Ensure newline at end of file
    if (doc.tokens.size() == 0 || doc.tokens.back().type != TokenType::LINEBREAK)
    {
        doc.tokens.push_back({ TokenType::LINEBREAK, 0.f });
    }
}


// Replaces the content of this document with tokens parsed from `datastream`.
// The stream is read in chunks until `eof()` and fed to a `DocumentParser` one character at a time.
// `options` is a combination of the OPTION_* flags.
void GenericDocument::loadFromDataStream(Ogre::DataStreamPtr datastream, const BitMask_t options)
{
    // Start with an empty document.
    string_pool.clear();
    tokens.clear();

    DocumentParser parser(*this, options, datastream);

    const size_t CHUNK_SIZE = 10 * 1024; // 10Kb
    char chunk[CHUNK_SIZE];

    while (!datastream->eof())
    {
        const size_t num_read = datastream->read(chunk, CHUNK_SIZE);
        const char* const chunk_end = chunk + num_read;
        for (const char* cursor = chunk; cursor != chunk_end; ++cursor)
        {
            parser.ProcessChar(*cursor);
        }
    }

    parser.ProcessEOF();
}


// Line terminator written by `GenericDocument::saveToDataStream()` for each LINEBREAK token;
// selected at compile time by the target platform.
#if OGRE_PLATFORM == OGRE_PLATFORM_WIN32

    const char* EOL_STR = "\r\n"; // CR+LF

#else

    const char* EOL_STR = "\n"; // "LF"

#endif


// Writes all tokens to `datastream` as text.
//
//  * LINEBREAK writes `EOL_STR`.
//  * COMMENT is written with a leading ';' (whichever comment character it was loaded with).
//  * Values (STRING, FLOAT, INT, BOOL) on one line are separated by ", "; the first value after a KEYWORD
//    is separated by a single space instead.
//  * Token types not listed in the switch write nothing.
void GenericDocument::saveToDataStream(Ogre::DataStreamPtr datastream)
{
    const size_t NUM_TEXT_MAX = 100;
    char num_text[NUM_TEXT_MAX];

    // What to write in front of the next value token; reset at each line break.
    const char* pending_separator = "";

    // Writes a NUL-terminated string to the stream.
    auto emit = [&datastream](const char* text)
    {
        datastream->write(text, strlen(text));
    };

    // Looks up the text of a string-carrying token in the string pool.
    auto pooled_text = [this](const Token& t) -> const char*
    {
        return string_pool.data() + (size_t)t.data;
    };

    for (Token& t : tokens)
    {
        switch (t.type)
        {
        case TokenType::LINEBREAK:
            emit(EOL_STR);
            pending_separator = "";
            break;

        case TokenType::COMMENT:
            emit(";");
            emit(pooled_text(t));
            break;

        case TokenType::KEYWORD:
            emit(pooled_text(t));
            pending_separator = " ";
            break;

        case TokenType::STRING:
            emit(pending_separator);
            emit(pooled_text(t));
            pending_separator = ", ";
            break;

        case TokenType::FLOAT:
            emit(pending_separator);
            snprintf(num_text, NUM_TEXT_MAX, "%g", t.data);
            emit(num_text);
            pending_separator = ", ";
            break;

        case TokenType::INT:
            emit(pending_separator);
            snprintf(num_text, NUM_TEXT_MAX, "%d", (int)t.data);
            emit(num_text);
            pending_separator = ", ";
            break;

        case TokenType::BOOL:
            emit(pending_separator);
            emit(t.data == 1.f ? "true" : "false");
            pending_separator = ", ";
            break;

        default:
            break;
        }
    }
}


bool GenericDocument::loadFromResource(std::string resource_name, std::string resource_group_name, BitMask_t options/* = 0*/)

{

    try

    {

        Ogre::DataStreamPtr datastream = Ogre::ResourceGroupManager::getSingleton().openResource(resource_name, resource_group_name);

        this->loadFromDataStream(datastream, options);

        return true;

    }

    catch (Ogre::Exception& eeh)

    {

        App::GetConsole()->putMessage(Console::CONSOLE_MSGTYPE_INFO, Console::CONSOLE_SYSTEM_ERROR,

            fmt::format("GenericDocument: could not load file '{}' from resource group '{}': {}", resource_name, resource_group_name, eeh.getDescription()));

        return false;

    }

}


bool GenericDocument::saveToResource(std::string resource_name, std::string resource_group_name)

{

    try

    {

        Ogre::DataStreamPtr datastream = Ogre::ResourceGroupManager::getSingleton().createResource(resource_name, resource_group_name);

        this->saveToDataStream(datastream);

        return true;

    }

    catch (Ogre::Exception& eeh)

    {

        App::GetConsole()->putMessage(Console::CONSOLE_MSGTYPE_INFO, Console::CONSOLE_SYSTEM_ERROR,

            fmt::format("GenericDocument: could not write file '{}' to resource group '{}': {}", resource_name, resource_group_name, eeh.getDescription()));

        return false;

    }

}


// Moves past the current line and then past any following comments and empty lines.
// Returns the result of `endOfFile()` at the final position.
// NOTE(review): i.e. presumably `true` means no further line was found - confirm against callers.
bool GenericDocContext::seekNextLine()
{
    // Advance to the line break which ends the current line...
    while (true)
    {
        if (this->endOfFile() || this->tokenType() == TokenType::LINEBREAK)
            break;
        this->moveNext();
    }
    // ...and step over it.
    this->moveNext();

    // Skip comments and empty lines
    while (true)
    {
        if (this->endOfFile())
            break;
        if (!this->isTokComment(0) && !this->isTokLineBreak(0))
            break;
        this->moveNext();
    }

    return this->endOfFile();
}


// Counts the tokens from the current position (inclusive) up to the next LINEBREAK
// or the end of file, whichever comes first. The position is not changed.
int GenericDocContext::countLineArgs()
{
    int num_args = 0;
    for (; !endOfFile(num_args); ++num_args)
    {
        if (this->tokenType(num_args) == TokenType::LINEBREAK)
            break;
    }
    return num_args;
}


// -----------------

// Editing functions


// Appends `count` blank tokens (type NONE, data 0) to the end of the document
// and moves the current position to the first of them. Does nothing if `count` is not positive.
void GenericDocContext::appendTokens(int count)
{
    if (count > 0)
    {
        const size_t old_size = doc->tokens.size();
        token_pos = (int)old_size;
        doc->tokens.resize(old_size + (size_t)count, { TokenType::NONE, 0.f });
    }
}


// Inserts a blank token (type NONE, data 0) in front of the token at `offset` from the current position.
// Returns false (and changes nothing) if `endOfFile(offset)` reports that position as past the end.
bool GenericDocContext::insertToken(int offset)
{
    const bool in_range = !endOfFile(offset);
    if (in_range)
    {
        auto where = doc->tokens.begin() + token_pos + offset;
        doc->tokens.insert(where, { TokenType::NONE, 0.f });
    }
    return in_range;
}


// Removes the token at `offset` from the current position.
// Returns false (and changes nothing) if `endOfFile(offset)` reports that position as past the end.
bool GenericDocContext::eraseToken(int offset)
{
    const bool in_range = !endOfFile(offset);
    if (in_range)
    {
        // Only the token is removed; its text (if any) stays in `string_pool` as garbage.
        // That's acceptable - the strings are usually just 1-6 characters long anyway.
        auto where = doc->tokens.begin() + token_pos + offset;
        doc->tokens.erase(where);
    }
    return in_range;
}


// Overwrites the token at `offset` from the current position with a text-carrying token of given `type`.
// Returns false (and changes nothing) if `endOfFile(offset)` reports that position as past the end.
bool GenericDocContext::setStringData(int offset, TokenType type, const std::string& data)
{
    if (endOfFile(offset))
    {
        return false;
    }

    // The text always goes to the end of the string pool, terminated by NUL.
    // Order within the pool is irrelevant - tokens refer to their text by offset,
    // and keeping the pool sorted would mean updating offsets in all other tokens.
    auto& pool = doc->string_pool;
    const float text_offset = (float)pool.size();
    pool.insert(pool.end(), data.begin(), data.end());
    pool.push_back('\0');

    doc->tokens[token_pos + offset] = { type, text_offset };
    return true;
}


// Overwrites the token at `offset` from the current position with given `type` and numeric `data`.
// Returns false (and changes nothing) if `endOfFile(offset)` reports that position as past the end.
bool GenericDocContext::setFloatData(int offset, TokenType type, float data)
{
    const bool in_range = !endOfFile(offset);
    if (in_range)
    {
        doc->tokens[token_pos + offset] = { type, data };
    }
    return in_range;
}