2026-02-05 19:14:31 +11:00
|
|
|
#include "lexer.h"
|
2026-02-12 08:46:12 +11:00
|
|
|
#include "SolsLiteral.h"
|
2026-02-06 15:48:13 +11:00
|
|
|
#include "SolsToken.h"
|
2026-02-05 19:14:31 +11:00
|
|
|
#include "../include/error.h"
|
2026-02-06 15:48:13 +11:00
|
|
|
#include "../include/estr.h"
|
2026-02-05 19:14:31 +11:00
|
|
|
|
2026-02-12 08:46:12 +11:00
|
|
|
|
2026-02-05 19:14:31 +11:00
|
|
|
// Creates a lexer that works on its own heap copy of `input`.
//
// input: NUL-terminated source text; the caller keeps ownership of it.
//
// Returns Success with a lexer whose cursor is at 0 and whose output is a
// fresh token list from createSolsTokens(), or Error with a message when the
// input is NULL, the copy cannot be allocated, or the token list cannot be
// created.
ResultType(SolsLexer, charptr) createLexer(char* input) {
    if (input == NULL) {
        return Error(SolsLexer, charptr, "Input is NULL (in createLexer() function)");
    }

    // Measure once; the same length sizes the copy and is stored in the lexer.
    const size_t length = strlen(input);
    char* inputcopy = malloc(length + 1);
    if (inputcopy == NULL) {
        return Error(SolsLexer, charptr, "Couldn't copy string into lexer (in createLexer() function)");
    }
    memcpy(inputcopy, input, length + 1); // +1 copies the terminator too

    ResultType(SolsTokens, charptr) tokens = createSolsTokens();
    if (tokens.error) {
        // The copy has no owner yet, so release it before bailing out.
        free(inputcopy);
        Estr e = CREATE_ESTR(tokens.as.error);
        APPEND_ESTR(e, " (in createLexer() function)");
        return Error(SolsLexer, charptr, e.str);
    }

    SolsLexer lexer = {
        .input = inputcopy,
        .inputsize = length,
        .output = tokens.as.success,
        .current = 0,
    };
    return Success(SolsLexer, charptr, lexer);
}
|
|
|
|
|
|
2026-02-12 08:46:12 +11:00
|
|
|
// Looks at the character `ahead` positions past the cursor without moving it.
//
// lexer: lexer to inspect (not modified).
// ahead: offset from lexer->current; 0 is the character lexerConsume() would
//        return next.
//
// Returns Success with that character, or Error when the lexer has no input
// or the requested position is at or beyond the end of the input. The NUL
// terminator is never reported as a character, matching lexerConsume().
ResultType(char, Nothing) lexerPeek(SolsLexer* lexer, size_t ahead) {
    if (lexer->input == NULL) {
        return Error(char, Nothing, {});
    }

    // Nothing left to look at once the cursor has reached the end.
    if (lexer->current >= lexer->inputsize) {
        return Error(char, Nothing, {});
    }

    // Compare against the remaining length rather than adding to the cursor,
    // so a very large `ahead` cannot wrap around and pass the check.
    const size_t remaining = lexer->inputsize - lexer->current;
    if (ahead >= remaining) {
        return Error(char, Nothing, {});
    }

    return Success(char, Nothing, lexer->input[lexer->current + ahead]);
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
// Returns the character under the cursor and moves the cursor one step on.
//
// lexer: lexer to read from; lexer->current is incremented on success.
//
// Returns Error when the lexer has no input attached or the cursor has
// already reached the end of the input.
ResultType(char, Nothing) lexerConsume(SolsLexer* lexer) {
    const bool hasNext = lexer->input != NULL
        && lexer->current + 1 <= lexer->inputsize;
    if (!hasNext) {
        return Error(char, Nothing, {});
    }

    const char next = lexer->input[lexer->current];
    lexer->current += 1;
    return Success(char, Nothing, next);
}
|
|
|
|
|
|
|
|
|
|
// Classifies a single raw token string.
//
// token: NUL-terminated token text, e.g. as accumulated by lex().
//
// Returns Success with a SolsToken whose type matches the text:
//   - text starting with `"` must also end with `"` and becomes STT_LITERAL;
//   - keywords, brackets and operators (including their word aliases such as
//     "then", "end", "plus") map to their STT_* type;
//   - anything else is STT_IDENTIFIER.
// Returns Error with a message for a NULL token, an unterminated string, or a
// failure reported by createSolsLiteral().
ResultType(SolsToken, charptr) identifyToken(const char* token) {
    if (token == NULL) {
        return Error(SolsToken, charptr, "Token is NULL (in identifyToken() function)");
    }

    if (token[0] == '"') {
        const size_t length = strlen(token);
        // A lone `"` is both the first and the last character, so demand at
        // least two characters before accepting the closing quote.
        if (length < 2 || token[length - 1] != '"') {
            return Error(SolsToken, charptr, "Unterminated string (in identifyToken() function)");
        }

        ResultType(SolsLiteral, charptr) literal = createSolsLiteral(SLT_STRING, token);
        if (literal.error) {
            Estr str = CREATE_ESTR(literal.as.error);
            APPEND_ESTR(str, " (in identifyToken() function)");
            return Error(SolsToken, charptr, str.str);
        }
        // NOTE(review): the literal created above is only checked for errors;
        // it is not stored in the returned token, so the string's value is
        // lost here. Attaching it needs SolsToken's payload field, which is
        // not visible from this file - confirm against SolsToken.h.
        return Success(SolsToken, charptr, {STT_LITERAL});
    }

    // FIXME do this better sometime
    if (strcmp(token, "puts") == 0) {
        return Success(SolsToken, charptr, {STT_KW_PUTS});
    }
    if (strcmp(token, "if") == 0) {
        return Success(SolsToken, charptr, {STT_KW_IF});
    }
    if (strcmp(token, "while") == 0) {
        return Success(SolsToken, charptr, {STT_KW_WHILE});
    }
    if (strcmp(token, "def") == 0) {
        return Success(SolsToken, charptr, {STT_KW_DEF});
    }
    if (strcmp(token, "struct") == 0) {
        // NOTE(review): "struct" yields the same type as "def"; this looks
        // like a copy-paste slip - confirm whether a dedicated struct keyword
        // type exists in SolsToken.h and use it here.
        return Success(SolsToken, charptr, {STT_KW_DEF});
    }

    // Shh, this is our little secret now
    if (strcmp(token, "{") == 0 || strcmp(token, "then") == 0) {
        return Success(SolsToken, charptr, {STT_OPEN_CURLY});
    }
    if (strcmp(token, "}") == 0 || strcmp(token, "end") == 0) {
        return Success(SolsToken, charptr, {STT_CLOSE_CURLY});
    }
    if (strcmp(token, "(") == 0) {
        return Success(SolsToken, charptr, {STT_OPEN_PAREN});
    }
    if (strcmp(token, ")") == 0) {
        return Success(SolsToken, charptr, {STT_CLOSE_PAREN});
    }
    if (strcmp(token, "+") == 0 || strcmp(token, "plus") == 0) {
        return Success(SolsToken, charptr, {STT_OP_ADD});
    }
    if (strcmp(token, "-") == 0 || strcmp(token, "minus") == 0) {
        return Success(SolsToken, charptr, {STT_OP_SUB});
    }
    if (strcmp(token, "*") == 0 || strcmp(token, "times") == 0) {
        return Success(SolsToken, charptr, {STT_OP_MUL});
    }
    if (strcmp(token, "/") == 0 || strcmp(token, "dividedby") == 0) {
        return Success(SolsToken, charptr, {STT_OP_DIV});
    }
    if (strcmp(token, "=") == 0 || strcmp(token, "is") == 0) {
        return Success(SolsToken, charptr, {STT_OP_SET});
    }

    // Nothing matched: treat the text as a user-defined name.
    return Success(SolsToken, charptr, {STT_IDENTIFIER});
}
|
|
|
|
|
|
2026-02-15 09:42:11 +11:00
|
|
|
char* createParsingError(size_t lineNum, char* line, char* why) {
|
|
|
|
|
Estr error = CREATE_ESTR("\e[0;34mParsing Error \e[0;36mon line ");
|
|
|
|
|
char buf[256];
|
|
|
|
|
snprintf(buf, sizeof(buf), "%zu", lineNum);
|
|
|
|
|
APPEND_ESTR(error, buf);
|
|
|
|
|
APPEND_ESTR(error, ":\n\n ");
|
|
|
|
|
APPEND_ESTR(error, line);
|
|
|
|
|
APPEND_ESTR(error, "\n\n");
|
|
|
|
|
APPEND_ESTR(error, "-> ");
|
|
|
|
|
APPEND_ESTR(error, why);
|
|
|
|
|
APPEND_ESTR(error, "\n");
|
|
|
|
|
return error.str;
|
|
|
|
|
}
|
|
|
|
|
|
2026-02-05 19:14:31 +11:00
|
|
|
ResultType(voidptr, charptr) lex(SolsLexer* lexer) {
|
|
|
|
|
if (lexer->input == NULL) {
|
|
|
|
|
return Error(voidptr, charptr, "Lexer is not initialised");
|
|
|
|
|
}
|
|
|
|
|
|
2026-02-12 08:46:12 +11:00
|
|
|
ResultType(SolsTokens, charptr) tokens = createSolsTokens();
|
|
|
|
|
if (tokens.error) {
|
|
|
|
|
Estr e = CREATE_ESTR(tokens.as.error);
|
|
|
|
|
APPEND_ESTR(e, " (in createSolsTokens() function)");
|
|
|
|
|
return Error(voidptr, charptr, e.str);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
lexer->output = tokens.as.success;
|
2026-02-05 19:14:31 +11:00
|
|
|
lexer->current = 0;
|
|
|
|
|
|
2026-02-12 08:46:12 +11:00
|
|
|
Estr buf = CREATE_ESTR("");
|
|
|
|
|
bool inString = false;
|
|
|
|
|
|
|
|
|
|
size_t lineNum = 1;
|
|
|
|
|
size_t lineStart = 0;
|
|
|
|
|
Estr currentLine = CREATE_ESTR("");
|
|
|
|
|
|
|
|
|
|
for (; lineStart < lexer->inputsize; lineStart++) {
|
|
|
|
|
if (lexer->input[lineStart] == '\n') {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
char buf[] = {lexer->input[lineStart], '\0'};
|
|
|
|
|
APPEND_ESTR(currentLine, buf);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
for (;;) {
|
|
|
|
|
ResultType(char, Nothing) chr = lexerConsume(lexer);
|
|
|
|
|
|
|
|
|
|
if (chr.error) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (chr.as.success == '\n') {
|
|
|
|
|
for (; lineStart < lexer->inputsize; lineStart++) {
|
|
|
|
|
if (lexer->input[lineStart] == '\n') {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
char buf[] = {lexer->input[lineStart], '\0'};
|
|
|
|
|
APPEND_ESTR(currentLine, buf);
|
|
|
|
|
}
|
|
|
|
|
lineNum ++;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (inString) {
|
|
|
|
|
char str[2] = { chr.as.success, '\0' };
|
|
|
|
|
APPEND_ESTR(buf, str);
|
|
|
|
|
if (chr.as.success == '"') {
|
|
|
|
|
inString = false;
|
|
|
|
|
}
|
2026-02-15 09:42:11 +11:00
|
|
|
continue;
|
2026-02-12 08:46:12 +11:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
switch (chr.as.success) {
|
|
|
|
|
case '"': {
|
|
|
|
|
inString = true;
|
|
|
|
|
APPEND_ESTR(buf, "\"");
|
|
|
|
|
break;
|
|
|
|
|
}
|
2026-02-15 09:42:11 +11:00
|
|
|
case '\n':
|
2026-02-12 08:46:12 +11:00
|
|
|
case ' ': {
|
2026-02-15 09:42:11 +11:00
|
|
|
if (strcmp(buf.str, "") != 0) {
|
2026-02-12 08:46:12 +11:00
|
|
|
ResultType(SolsToken, charptr) result = identifyToken(buf.str);
|
|
|
|
|
if (result.error) {
|
2026-02-15 09:42:11 +11:00
|
|
|
return Error(voidptr, charptr, createParsingError(lineNum, currentLine.str, result.as.error));
|
2026-02-12 08:46:12 +11:00
|
|
|
}
|
2026-02-15 09:42:11 +11:00
|
|
|
addTokenToSolsTokens(&lexer->output, result.as.success);
|
|
|
|
|
DESTROY_ESTR(buf);
|
|
|
|
|
buf = CREATE_ESTR("");
|
2026-02-12 08:46:12 +11:00
|
|
|
}
|
2026-02-15 09:42:11 +11:00
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
default: {
|
|
|
|
|
char newchar[] = {chr.as.success, '\0'};
|
|
|
|
|
APPEND_ESTR(buf, newchar);
|
|
|
|
|
break;
|
2026-02-12 08:46:12 +11:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2026-02-15 09:42:11 +11:00
|
|
|
if (strcmp(buf.str, "") != 0) {
|
|
|
|
|
ResultType(SolsToken, charptr) result = identifyToken(buf.str);
|
|
|
|
|
if (result.error) {
|
|
|
|
|
return Error(voidptr, charptr, createParsingError(lineNum, currentLine.str, result.as.error));
|
|
|
|
|
}
|
|
|
|
|
DESTROY_ESTR(buf);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (inString) {
|
|
|
|
|
return Error(voidptr, charptr, createParsingError(lineNum, currentLine.str, "Unterminated string"));
|
|
|
|
|
}
|
|
|
|
|
|
2026-02-05 19:14:31 +11:00
|
|
|
return Success(voidptr, charptr, NULL);
|
|
|
|
|
}
|