forked from ground/cground
Stuff works a bit better now
src/lexer.c (65 changed lines)
@@ -1,14 +1,13 @@
 #include "lexer.h"
 #include <stdlib.h>
 #include <stdio.h>
 #include <stdbool.h>
 #include <string.h>
-#include <stdio.h>
 
 void addTokenToLine(TokenLine* line, Token tok) {
     line->count++;
     Token* newTokens = realloc(line->tokens, line->count * sizeof(Token));
     if (!newTokens) {
-        perror("Failed to allocate token");
+        perror("Failed to allocate memory for token");
         exit(EXIT_FAILURE);
     }
     line->tokens = newTokens;
@@ -19,13 +18,30 @@ void addLineToLexed(LexedFile* lf, TokenLine line) {
     lf->lineCount++;
     TokenLine* newLines = realloc(lf->lines, lf->lineCount * sizeof(TokenLine));
     if (!newLines) {
-        perror("Failed to allocate line");
+        perror("Failed to allocate memory for line");
         exit(EXIT_FAILURE);
     }
     lf->lines = newLines;
     lf->lines[lf->lineCount - 1] = line;
 }
 
+void freeTokenLine(TokenLine* line) {
+    for (size_t i = 0; i < line->count; i++) {
+        free(line->tokens[i].text);
+    }
+    free(line->tokens);
+}
+
+void freeLexedFile(LexedFile* lf) {
+    if (lf == NULL) return;
+    for (size_t i = 0; i < lf->lineCount; i++) {
+        freeTokenLine(&lf->lines[i]);
+    }
+    free(lf->lines);
+    lf->lines = NULL;
+    lf->lineCount = 0;
+}
+
 LexedFile lexFile(const char* fileContents) {
     LexedFile result = {0};
     result.lines = NULL;
@@ -35,7 +51,7 @@ LexedFile lexFile(const char* fileContents) {
     currentLine.tokens = NULL;
     currentLine.count = 0;
 
-    char buf[1024] = {0};
+    char buf[4096] = {0};
     size_t bufLen = 0;
     bool inString = false;
     bool inChar = false;
@@ -44,6 +60,12 @@ LexedFile lexFile(const char* fileContents) {
     for (size_t i = 0; fileContents[i] != '\0'; i++) {
         char c = fileContents[i];
 
+        // Safety check: prevent buffer overflow
+        if (bufLen >= sizeof(buf) - 1) {
+            fprintf(stderr, "Error: Token too long (exceeds %zu characters)\n", sizeof(buf) - 1);
+            exit(EXIT_FAILURE);
+        }
+
         switch (c) {
             case '"':
                 if (!isComment) {
@@ -74,11 +96,15 @@ LexedFile lexFile(const char* fileContents) {
                     buf[bufLen] = '\0';
                     Token tok;
                     tok.text = strdup(buf);
-                    // Add tok to currentLine (need helper function)
+                    if (!tok.text) {
+                        perror("Failed to duplicate token string");
+                        exit(EXIT_FAILURE);
+                    }
                     addTokenToLine(&currentLine, tok);
                     bufLen = 0;
                     memset(buf, 0, sizeof(buf));
                 }
-                // Add line to result (need helper function)
+                // Add line to result
                 addLineToLexed(&result, currentLine);
+                // Reset for next line
                 currentLine.tokens = NULL;
@@ -96,8 +122,13 @@ LexedFile lexFile(const char* fileContents) {
                     buf[bufLen] = '\0';
                     Token tok;
                     tok.text = strdup(buf);
+                    if (!tok.text) {
+                        perror("Failed to duplicate token string");
+                        exit(EXIT_FAILURE);
+                    }
                     addTokenToLine(&currentLine, tok);
                     bufLen = 0;
                     memset(buf, 0, sizeof(buf));
                 }
                 addLineToLexed(&result, currentLine);
                 currentLine.tokens = NULL;
@@ -108,19 +139,29 @@ LexedFile lexFile(const char* fileContents) {
                 break;
 
             case ' ':
+            case '\t': // Also handle tabs as whitespace
                 if (!inString && !inChar) {
                     if (bufLen > 0 && !isComment) {
                         buf[bufLen] = '\0';
                         Token tok;
                         tok.text = strdup(buf);
+                        if (!tok.text) {
+                            perror("Failed to duplicate token string");
+                            exit(EXIT_FAILURE);
+                        }
                         addTokenToLine(&currentLine, tok);
                         bufLen = 0;
                         memset(buf, 0, sizeof(buf));
                     }
                 } else {
                     buf[bufLen++] = c;
                 }
                 break;
 
+            case '\r': // Handle Windows line endings
+                // Just skip carriage returns
+                break;
+
             default:
                 if (!isComment) {
                     buf[bufLen++] = c;
@@ -129,13 +170,19 @@ LexedFile lexFile(const char* fileContents) {
         }
     }
 
-    // Handle any remaining content
-    if (bufLen > 0) {
+    // Handle any remaining content at end of file
+    if (bufLen > 0 && !isComment) {
         buf[bufLen] = '\0';
         Token tok;
         tok.text = strdup(buf);
+        if (!tok.text) {
+            perror("Failed to duplicate token string");
+            exit(EXIT_FAILURE);
+        }
         addTokenToLine(&currentLine, tok);
     }
 
+    // Add final line if it has content
+    if (currentLine.count > 0) {
         addLineToLexed(&result, currentLine);
+    }
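For context, a minimal driver showing how the changed code might be exercised. lexer.h is not part of this diff, so the Token, TokenLine, and LexedFile layouts are only inferred from the field accesses above (tok.text, line->tokens, line->count, lf->lines, lf->lineCount), not confirmed by the source:

// Hypothetical usage sketch -- assumes lexer.h declares lexFile and
// freeLexedFile with the signatures seen in the diff above.
#include <stdio.h>
#include "lexer.h"

int main(void) {
    const char* src = "int x = 42\nreturn x\n";
    LexedFile lf = lexFile(src);        // tokenize the whole buffer
    for (size_t i = 0; i < lf.lineCount; i++) {
        printf("line %zu:", i);
        for (size_t j = 0; j < lf.lines[i].count; j++) {
            printf(" '%s'", lf.lines[i].tokens[j].text);
        }
        printf("\n");
    }
    freeLexedFile(&lf);                 // cleanup helper added in this commit
    return 0;
}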