// schema_editor/comdel/parser/comdellexer.cpp

#include "comdellexer.h"
#include "token.h"
#include "tokens_type.h"

#include <fstream>
#include <cctype>


/*************************************************************************
 *
 * Auxiliary functions - recognizing category of characters
 *
*************************************************************************/

inline bool identifierStart(char ch) {
    return isalpha(ch) || ch == '_';
}

inline bool identifierContinue(char ch) {
    return isalnum(ch) || ch == '_';
}

inline bool numberStart(char ch) {
    return isdigit(ch) || ch == '-';
}

inline bool isWhitespace(char ch) {
    return ch == ' ' || ch == '\t' || ch == '\n' || ch == '\r';
}


/*************************************************************************
 *
 * ComdelLexer class public methods
 *
*************************************************************************/

ComdelLexer::ComdelLexer(std::string fileName, std::string source,
                         ParseContext *parseContext)
        : source(std::move(source)),
          parseContext(parseContext),
        // TODO Update this
          fileId(this->parseContext->addFile(fileName, this->source)),
          position(this->fileId, 1, 1, 0),
          ch(this->source[0]) {}


LexerResult ComdelLexer::tokenize() {
    while (!eof()) {
        tokenBegin = position;

        auto tokenType = nextTokenType();
        if (!tokenType) {
            errors.push_back(tokenType.error());
            continue;
        }
        if (tokenType == TokenType::WHITESPACE || tokenType == TokenType::COMMENT) {
            continue;
        }

        std::string text = source.substr(tokenBegin.offset,
                                         position.offset - tokenBegin.offset);

        tokenType = from_token(text, tokenType.value());

        tokens.emplace_back(*tokenType, Span(tokenBegin, position), text);
    }

    tokens.emplace_back(TokenType::END_OF_FILE, Span(position), "");

    return LexerResult{tokens, errors};
}


/*************************************************************************
 *
 * ComdelLexer class private methods
 *
*************************************************************************/


// Numbers are sequences of digits and underscores
// with AT LEAST ONE digit.

unsigned ComdelLexer::takeNumberInRadix(Radix radix) {
    unsigned digitsTaken = 0;

    while (true) {
        if (digitIsValid(ch, radix)) { // skip and count real digits
            bump();
            digitsTaken++;
        } else if (ch == '_') { // skip underscores
            bump();
        } else { // some other character => end of number
            return digitsTaken;
        }
    }
}


bool ComdelLexer::digitIsValid(char ch, Radix radix) {

    // Check valid digits
    // digit is 0..1
    if (ch == '1' || ch == '0') {
        // OK for all radixes
        return true;
    }
    //digit is 2..9
    if (isdigit(ch)) {
        // OK for decimal and hex radixes
        return (radix != Radix::BIN_NUMBER);
    }
        // digit is a..f A..F
    else if (isxdigit(ch)) {
        // OK only for hex radix
        return (radix == Radix::HEX_NUMBER);
    }
    // NOT 0..9 a..f A..F
    return false;
}


ComdelLexer::Radix ComdelLexer::takeRadix() {
    if (ch == '0') {
        char nextChar = peek();
        if (nextChar == 'x' || nextChar == 'X') {
            bump(2);
            return Radix::HEX_NUMBER;
        } else if (nextChar == 'b' || nextChar == 'B') {
            bump(2);
            return Radix::BIN_NUMBER;
        }
    }
    return Radix::DEC_NUMBER;
}


// color is sequence of hex-digits (preceded with # which is already consumed)
unsigned ComdelLexer::takeHexColor() {
    unsigned digitsTaken = 0;

    while (true) {
        if (digitIsValid(ch, Radix::HEX_NUMBER)) { // skip and count hex digits
            bump();
            digitsTaken++;
        } else { // some other character => end of number
            return digitsTaken;
        }
    }
}


PResult<TokenType> ComdelLexer::takeString() {
    Position lo = position;

    if (ch != '"')
        return PError({Span(lo), "expected string here"});
    bump(); // skip starting "

    // Check escape-sequences  \t  \n  \\  \"  but leave them in string.
    // They will be replaced in the constructor of StringLiteral AST-node.
    while (ch != '"' && ch != '\n' && !eof()) {
        if (ch == '"') {
            // possible start of escape-sequence
            char nextCh = peek();
            if (nextCh == '\\' || nextCh == '\"' || nextCh == 't' || nextCh == 'n')
                bump();   // legal escape-sequence: skip backslash
            else
                return PError({Span(lo, position), "illegal escape-sequence (allowed:  \\n  \\\"  \\\\  \\t"});
        }
        bump(); // skip normal char OR skip second char in escape-sequence
    }

    if (eof() || ch == '\n') {
        return PError({Span(lo, position), "unterminated string"});
    }
    bump(); // skip closing "
    return TokenType::STRING;
}


PResult<TokenType> ComdelLexer::takeRawString() {
    Position lo = position;

    if (ch != '`')
        return PError({Span(lo), "expected string here"});
    bump(); // skip starting '

    // Ignore escape-sequences - take all characters until closing '
    while (ch != '`' && !eof()) {
        bump(); // skip characters
    }

    if (eof() || ch == '\n') {
        return PError({Span(lo, position), "unterminated string"});
    }
    bump(); // skip closing '
    return TokenType::STRING;
}


void ComdelLexer::skipWhitespace() {
    while (!eof()) {
        if (isWhitespace(ch)) {
            bump();
        } else {
            break;
        }
    }
}


void ComdelLexer::skipComment() {
    while (!eof() && ch != '\n') {
        bump();
    }
}


// returns false if the comment is unterminated
bool ComdelLexer::skipMultilineComment() {
    while (!eof()) {
        if (ch == '*') {
            bump();
            if (ch == '/') {
                bump();
                return true;
            }
        }
        bump();
    }
    return false;
}


PResult<TokenType> ComdelLexer::nextTokenType() {
    if (isWhitespace(ch)) {
        skipWhitespace();
        return TokenType::WHITESPACE;
    } else if (identifierStart(ch)) {
        bump();
        while (identifierContinue(ch))
            bump();
        return TokenType::IDENTIFIER;
    } else if (numberStart(ch)) {
        if (ch == '-') {
            bump();
        }
        unsigned takenDigits;
        Radix radix = takeRadix();
        takenDigits = takeNumberInRadix(radix);
        if (takenDigits == 0) {
            return PError({Span(tokenBegin, position),
                           "no digits found for number, or misspelled number"});
        }
        if (isalnum(ch)) {
            return PError({Span(tokenBegin, position),
                           "illegal digit or letter found at the end of number"});
        }
        return TokenType::NUMBER;
    } else if (ch == '!') {
        bump();
        return TokenType::NOT;
    } else if (ch == '<') {
        bump();
        return TokenType::LT;
    } else if (ch == '>') {
        bump();
        return TokenType::GT;
    } else if (ch == '#') {
        bump();

        if (digitIsValid(ch, Radix::HEX_NUMBER)) {
            unsigned takenDigits = takeHexColor();
            if (takenDigits != 6 && takenDigits != 8) {
                return PError({Span(tokenBegin, position),
                               "hex-color must have 6 or 8 hex-digits"});
            }
            if (isalnum(ch)) {
                return PError({Span(tokenBegin, position),
                               "illegal letter found at the end of hex-color"});
            }
            return TokenType::COLOR;
        } else {
            return PError({Span(tokenBegin, position),
                           "unexpected #"});
        }
    } else if (ch == '@') {
        bump();
        while (identifierContinue(ch))
            bump();
        return TokenType::KEYWORD;
    } else if (ch == '"') {
        return takeString();
    } else if (ch == '`') {
        return takeRawString();
    } else if (ch == '(') {
        bump();
        return TokenType::LPAREN;
    } else if (ch == ')') {
        bump();
        return TokenType::RPAREN;
    } else if (ch == '[') {
        bump();
        return TokenType::LBRACKET;
    } else if (ch == ']') {
        bump();
        return TokenType::RBRACKET;
    } else if (ch == '{') {
        bump();
        return TokenType::LBRACE;
    } else if (ch == '}') {
        bump();
        return TokenType::RBRACE;
    } else if (ch == '/') {
        bump();
        if (ch == '/') {
            bump();
            skipComment();
            return TokenType::COMMENT;
        } else if (ch == '*') {
            bump();
            if (!skipMultilineComment()) {
                return PError({Span(tokenBegin, position),
                               "unterminated multiline comment"});
            }
            return TokenType::COMMENT;
        }
        return PError({Span(tokenBegin, position),
                       "unexpected /"});
    } else if (ch == '.') {
        bump();
        return TokenType::DOT;
    } else if (ch == ':') {
        bump();
        return TokenType::COLON;
    } else if (ch == ';') {
        bump();
        return TokenType::SEMICOLON;
    } else if (ch == ',') {
        bump();
        return TokenType::COMMA;
    } else if (ch == '=') {
        bump();
        return TokenType::EQUALS;
    } else {
        std::stringstream message;
        message << "unexpected character `" << ch << "`";
        bump();
        return PError({Span(tokenBegin, position), message.str()});
    }
}


// Move position to the new character in input file.
// Fetch the new character in 'ch'
void ComdelLexer::bump(unsigned count) {
    for (unsigned i = 0; i < count && !eof(); i++) {
        if (ch == '\n') {
            position.line += 1;
            position.col = 1;
            parseContext->getFile(fileId).addLineOffset(position.offset + 1);
        } else {
            position.col += 1;
        }
        position.offset += 1;
        ch = source[position.offset];
    }
}


// Fetch and return next character without moving position.
// Fetch does not cross line boundary.
// Returns \n when next char does not exist (end of line or end of file)
char ComdelLexer::peek() {
    if (position.offset + 1 == source.size()) // eof
        return '\n';

    return source[position.offset + 1];
}


bool ComdelLexer::eof() {
    return position.offset == source.size();
}
Initial instance 2022-03-29 19:31:45 +00:00			`#include "comdellexer.h"`
			`#include "token.h"`
Basic refactor 2022-05-27 06:18:17 +00:00			`#include "tokens_type.h"`
Initial instance 2022-03-29 19:31:45 +00:00
			`#include <fstream>`
			`#include <cctype>`


			`/*************************************************************************`
			`*`
			`* Auxiliary functions - recognizing category of characters`
			`*`
			`*************************************************************************/`

			`inline bool identifierStart(char ch) {`
			`return isalpha(ch) \|\| ch == '_';`
			`}`

			`inline bool identifierContinue(char ch) {`
			`return isalnum(ch) \|\| ch == '_';`
			`}`

			`inline bool numberStart(char ch) {`
Added support for integers and null to connections 2022-04-08 20:46:47 +00:00			`return isdigit(ch) \|\| ch == '-';`
Initial instance 2022-03-29 19:31:45 +00:00			`}`

			`inline bool isWhitespace(char ch) {`
			`return ch == ' ' \|\| ch == '\t' \|\| ch == '\n' \|\| ch == '\r';`
			`}`


			`/*************************************************************************`
			`*`
			`* ComdelLexer class public methods`
			`*`
			`*************************************************************************/`

			`ComdelLexer::ComdelLexer(std::string fileName, std::string source,`
Basic refactor 2022-05-27 06:18:17 +00:00			`ParseContext *parseContext)`
			`: source(std::move(source)),`
			`parseContext(parseContext),`
			`// TODO Update this`
			`fileId(this->parseContext->addFile(fileName, this->source)),`
			`position(this->fileId, 1, 1, 0),`
			`ch(this->source[0]) {}`
Initial instance 2022-03-29 19:31:45 +00:00

			`LexerResult ComdelLexer::tokenize() {`
			`while (!eof()) {`
			`tokenBegin = position;`

			`auto tokenType = nextTokenType();`
Basic refactor 2022-05-27 06:18:17 +00:00			`if (!tokenType) {`
Initial instance 2022-03-29 19:31:45 +00:00			`errors.push_back(tokenType.error());`
			`continue;`
			`}`
Basic refactor 2022-05-27 06:18:17 +00:00			`if (tokenType == TokenType::WHITESPACE \|\| tokenType == TokenType::COMMENT) {`
Initial instance 2022-03-29 19:31:45 +00:00			`continue;`
			`}`

			`std::string text = source.substr(tokenBegin.offset,`
			`position.offset - tokenBegin.offset);`

Token refactor 2022-03-29 21:08:55 +00:00			`tokenType = from_token(text, tokenType.value());`

Added support for integers and null to connections 2022-04-08 20:46:47 +00:00			`tokens.emplace_back(*tokenType, Span(tokenBegin, position), text);`
Initial instance 2022-03-29 19:31:45 +00:00			`}`

Basic refactor 2022-05-27 06:18:17 +00:00			`tokens.emplace_back(TokenType::END_OF_FILE, Span(position), "");`
Initial instance 2022-03-29 19:31:45 +00:00
Basic refactor 2022-05-27 06:18:17 +00:00			`return LexerResult{tokens, errors};`
Initial instance 2022-03-29 19:31:45 +00:00			`}`


			`/*************************************************************************`
			`*`
			`* ComdelLexer class private methods`
			`*`
			`*************************************************************************/`


			`// Numbers are sequences of digits and underscores`
			`// with AT LEAST ONE digit.`

			`unsigned ComdelLexer::takeNumberInRadix(Radix radix) {`
			`unsigned digitsTaken = 0;`

Basic refactor 2022-05-27 06:18:17 +00:00			`while (true) {`
Initial instance 2022-03-29 19:31:45 +00:00			`if (digitIsValid(ch, radix)) { // skip and count real digits`
			`bump();`
			`digitsTaken++;`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else if (ch == '_') { // skip underscores`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
			`} else { // some other character => end of number`
			`return digitsTaken;`
			`}`
			`}`
			`}`


			`bool ComdelLexer::digitIsValid(char ch, Radix radix) {`

Typos 2022-04-08 18:17:58 +00:00			`// Check valid digits`
			`// digit is 0..1`
Basic refactor 2022-05-27 06:18:17 +00:00			`if (ch == '1' \|\| ch == '0') {`
Initial instance 2022-03-29 19:31:45 +00:00			`// OK for all radixes`
			`return true;`
			`}`
			`//digit is 2..9`
Basic refactor 2022-05-27 06:18:17 +00:00			`if (isdigit(ch)) {`
Initial instance 2022-03-29 19:31:45 +00:00			`// OK for decimal and hex radixes`
Basic refactor 2022-05-27 06:18:17 +00:00			`return (radix != Radix::BIN_NUMBER);`
Initial instance 2022-03-29 19:31:45 +00:00			`}`
Basic refactor 2022-05-27 06:18:17 +00:00			`// digit is a..f A..F`
			`else if (isxdigit(ch)) {`
Initial instance 2022-03-29 19:31:45 +00:00			`// OK only for hex radix`
Basic refactor 2022-05-27 06:18:17 +00:00			`return (radix == Radix::HEX_NUMBER);`
Initial instance 2022-03-29 19:31:45 +00:00			`}`
			`// NOT 0..9 a..f A..F`
			`return false;`
			`}`


Basic refactor 2022-05-27 06:18:17 +00:00			`ComdelLexer::Radix ComdelLexer::takeRadix() {`
Initial instance 2022-03-29 19:31:45 +00:00			`if (ch == '0') {`
			`char nextChar = peek();`
			`if (nextChar == 'x' \|\| nextChar == 'X') {`
			`bump(2);`
			`return Radix::HEX_NUMBER;`
			`} else if (nextChar == 'b' \|\| nextChar == 'B') {`
			`bump(2);`
			`return Radix::BIN_NUMBER;`
			`}`
			`}`
			`return Radix::DEC_NUMBER;`
			`}`


Typos 2022-04-08 18:17:58 +00:00			`// color is sequence of hex-digits (preceded with # which is already consumed)`
Initial instance 2022-03-29 19:31:45 +00:00			`unsigned ComdelLexer::takeHexColor() {`
			`unsigned digitsTaken = 0;`

Basic refactor 2022-05-27 06:18:17 +00:00			`while (true) {`
Initial instance 2022-03-29 19:31:45 +00:00			`if (digitIsValid(ch, Radix::HEX_NUMBER)) { // skip and count hex digits`
			`bump();`
			`digitsTaken++;`
			`} else { // some other character => end of number`
			`return digitsTaken;`
			`}`
			`}`
			`}`


			`PResult<TokenType> ComdelLexer::takeString() {`
			`Position lo = position;`

			`if (ch != '"')`
			`return PError({Span(lo), "expected string here"});`
			`bump(); // skip starting "`

Typos 2022-04-08 18:17:58 +00:00			`// Check escape-sequences \t \n \\ \" but leave them in string.`
Initial instance 2022-03-29 19:31:45 +00:00			`// They will be replaced in the constructor of StringLiteral AST-node.`
			`while (ch != '"' && ch != '\n' && !eof()) {`
Basic refactor 2022-05-27 06:18:17 +00:00			`if (ch == '"') {`
Initial instance 2022-03-29 19:31:45 +00:00			`// possible start of escape-sequence`
			`char nextCh = peek();`
Basic refactor 2022-05-27 06:18:17 +00:00			`if (nextCh == '\\' \|\| nextCh == '\"' \|\| nextCh == 't' \|\| nextCh == 'n')`
Initial instance 2022-03-29 19:31:45 +00:00			`bump(); // legal escape-sequence: skip backslash`
			`else`
			`return PError({Span(lo, position), "illegal escape-sequence (allowed: \\n \\\" \\\\ \\t"});`
			`}`
			`bump(); // skip normal char OR skip second char in escape-sequence`
			`}`

			`if (eof() \|\| ch == '\n') {`
			`return PError({Span(lo, position), "unterminated string"});`
			`}`
			`bump(); // skip closing "`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::STRING;`
Initial instance 2022-03-29 19:31:45 +00:00			`}`


Basic refactor 2022-05-27 06:18:17 +00:00			`PResult<TokenType> ComdelLexer::takeRawString() {`
Initial instance 2022-03-29 19:31:45 +00:00			`Position lo = position;`

			if (ch != '`')
			`return PError({Span(lo), "expected string here"});`
			`bump(); // skip starting '`

Typos 2022-04-08 18:17:58 +00:00			`// Ignore escape-sequences - take all characters until closing '`
Initial instance 2022-03-29 19:31:45 +00:00			while (ch != '`' && !eof()) {
			`bump(); // skip characters`
			`}`

			`if (eof() \|\| ch == '\n') {`
			`return PError({Span(lo, position), "unterminated string"});`
			`}`
			`bump(); // skip closing '`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::STRING;`
Initial instance 2022-03-29 19:31:45 +00:00			`}`


			`void ComdelLexer::skipWhitespace() {`
			`while (!eof()) {`
			`if (isWhitespace(ch)) {`
			`bump();`
			`} else {`
			`break;`
			`}`
			`}`
			`}`


			`void ComdelLexer::skipComment() {`
			`while (!eof() && ch != '\n') {`
			`bump();`
			`}`
			`}`


			`// returns false if the comment is unterminated`
			`bool ComdelLexer::skipMultilineComment() {`
			`while (!eof()) {`
			`if (ch == '*') {`
			`bump();`
			`if (ch == '/') {`
			`bump();`
			`return true;`
			`}`
			`}`
			`bump();`
			`}`
			`return false;`
			`}`


			`PResult<TokenType> ComdelLexer::nextTokenType() {`
Basic refactor 2022-05-27 06:18:17 +00:00			`if (isWhitespace(ch)) {`
Initial instance 2022-03-29 19:31:45 +00:00			`skipWhitespace();`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::WHITESPACE;`
			`} else if (identifierStart(ch)) {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
			`while (identifierContinue(ch))`
			`bump();`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::IDENTIFIER;`
			`} else if (numberStart(ch)) {`
			`if (ch == '-') {`
Added support for integers and null to connections 2022-04-08 20:46:47 +00:00			`bump();`
			`}`
Initial instance 2022-03-29 19:31:45 +00:00			`unsigned takenDigits;`
			`Radix radix = takeRadix();`
			`takenDigits = takeNumberInRadix(radix);`
			`if (takenDigits == 0) {`
			`return PError({Span(tokenBegin, position),`
Basic refactor 2022-05-27 06:18:17 +00:00			`"no digits found for number, or misspelled number"});`
Initial instance 2022-03-29 19:31:45 +00:00			`}`
Basic refactor 2022-05-27 06:18:17 +00:00			`if (isalnum(ch)) {`
Initial instance 2022-03-29 19:31:45 +00:00			`return PError({Span(tokenBegin, position),`
Basic refactor 2022-05-27 06:18:17 +00:00			`"illegal digit or letter found at the end of number"});`
Initial instance 2022-03-29 19:31:45 +00:00			`}`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::NUMBER;`
			`} else if (ch == '!') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::NOT;`
			`} else if (ch == '<') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::LT;`
			`} else if (ch == '>') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::GT;`
			`} else if (ch == '#') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`

			`if (digitIsValid(ch, Radix::HEX_NUMBER)) {`
			`unsigned takenDigits = takeHexColor();`
			`if (takenDigits != 6 && takenDigits != 8) {`
			`return PError({Span(tokenBegin, position),`
Basic refactor 2022-05-27 06:18:17 +00:00			`"hex-color must have 6 or 8 hex-digits"});`
Initial instance 2022-03-29 19:31:45 +00:00			`}`
Basic refactor 2022-05-27 06:18:17 +00:00			`if (isalnum(ch)) {`
Initial instance 2022-03-29 19:31:45 +00:00			`return PError({Span(tokenBegin, position),`
Basic refactor 2022-05-27 06:18:17 +00:00			`"illegal letter found at the end of hex-color"});`
Initial instance 2022-03-29 19:31:45 +00:00			`}`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::COLOR;`
Initial instance 2022-03-29 19:31:45 +00:00			`} else {`
			`return PError({Span(tokenBegin, position),`
Typos 2022-04-08 18:17:58 +00:00			`"unexpected #"});`
Initial instance 2022-03-29 19:31:45 +00:00			`}`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else if (ch == '@') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
			`while (identifierContinue(ch))`
			`bump();`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::KEYWORD;`
			`} else if (ch == '"') {`
Initial instance 2022-03-29 19:31:45 +00:00			`return takeString();`
Basic refactor 2022-05-27 06:18:17 +00:00			} else if (ch == '`') {
Initial instance 2022-03-29 19:31:45 +00:00			`return takeRawString();`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else if (ch == '(') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::LPAREN;`
			`} else if (ch == ')') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::RPAREN;`
			`} else if (ch == '[') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
			`return TokenType::LBRACKET;`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else if (ch == ']') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
Basic refactor 2022-05-27 06:18:17 +00:00			`return TokenType::RBRACKET;`
			`} else if (ch == '{') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
			`return TokenType::LBRACE;`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else if (ch == '}') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
			`return TokenType::RBRACE;`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else if (ch == '/') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
Basic refactor 2022-05-27 06:18:17 +00:00			`if (ch == '/') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
			`skipComment();`
			`return TokenType::COMMENT;`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else if (ch == '*') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
Basic refactor 2022-05-27 06:18:17 +00:00			`if (!skipMultilineComment()) {`
Initial instance 2022-03-29 19:31:45 +00:00			`return PError({Span(tokenBegin, position),`
Basic refactor 2022-05-27 06:18:17 +00:00			`"unterminated multiline comment"});`
Initial instance 2022-03-29 19:31:45 +00:00			`}`
			`return TokenType::COMMENT;`
			`}`
			`return PError({Span(tokenBegin, position),`
Typos 2022-04-08 18:17:58 +00:00			`"unexpected /"});`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else if (ch == '.') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
			`return TokenType::DOT;`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else if (ch == ':') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
			`return TokenType::COLON;`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else if (ch == ';') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
			`return TokenType::SEMICOLON;`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else if (ch == ',') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
			`return TokenType::COMMA;`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else if (ch == '=') {`
Initial instance 2022-03-29 19:31:45 +00:00			`bump();`
			`return TokenType::EQUALS;`
Basic refactor 2022-05-27 06:18:17 +00:00			`} else {`
Initial instance 2022-03-29 19:31:45 +00:00			`std::stringstream message;`
			message << "unexpected character `" << ch << "`";
			`bump();`
			`return PError({Span(tokenBegin, position), message.str()});`
			`}`
			`}`


			`// Move position to the new character in input file.`
			`// Fetch the new character in 'ch'`
			`void ComdelLexer::bump(unsigned count) {`
Basic refactor 2022-05-27 06:18:17 +00:00			`for (unsigned i = 0; i < count && !eof(); i++) {`
Initial instance 2022-03-29 19:31:45 +00:00			`if (ch == '\n') {`
			`position.line += 1;`
			`position.col = 1;`
Basic refactor 2022-05-27 06:18:17 +00:00			`parseContext->getFile(fileId).addLineOffset(position.offset + 1);`
Initial instance 2022-03-29 19:31:45 +00:00			`} else {`
			`position.col += 1;`
			`}`
			`position.offset += 1;`
			`ch = source[position.offset];`
			`}`
			`}`


			`// Fetch and return next character without moving position.`
			`// Fetch does not cross line boundary.`
Typos 2022-04-08 18:17:58 +00:00			`// Returns \n when next char does not exist (end of line or end of file)`
Initial instance 2022-03-29 19:31:45 +00:00			`char ComdelLexer::peek() {`
Basic refactor 2022-05-27 06:18:17 +00:00			`if (position.offset + 1 == source.size()) // eof`
Initial instance 2022-03-29 19:31:45 +00:00			`return '\n';`

Basic refactor 2022-05-27 06:18:17 +00:00			`return source[position.offset + 1];`
Initial instance 2022-03-29 19:31:45 +00:00			`}`


			`bool ComdelLexer::eof() {`
			`return position.offset == source.size();`
			`}`