feat: lex many productions

Araozu 2024-11-18 20:08:42 -05:00
parent 26f5fed321
commit d6a83ff46c
2 changed files with 49 additions and 8 deletions

@@ -5,15 +5,53 @@ const token = @import("./token.zig");
 const TokenType = token.TokenType;
 const Token = token.Token;

-pub fn tokenize(input: []const u8) !void {
+pub fn tokenize(input: []const u8, alloc: std.mem.Allocator) !void {
     const input_len = input.len;
-    const next_token = try number.lex(input, input_len, 0);
-
-    if (next_token) |tuple| {
-        const t = tuple[0];
-        std.debug.print("{s}\n", .{t.value});
-    } else {
-        std.debug.print("no token found :c", .{});
+    var current_pos: usize = 0;
+
+    var tokens = std.ArrayList(Token).init(alloc);
+    defer tokens.deinit();
+
+    while (current_pos < input_len) {
+        const actual_next_pos = ignore_whitespace(input, current_pos);
+        const next_token = try number.lex(input, input_len, actual_next_pos);
+
+        if (next_token) |tuple| {
+            const t = tuple[0];
+            current_pos = tuple[1];
+            try tokens.append(t);
+        } else {
+            // no lexer matched
+            std.debug.print("unmatched args: anytype:c\n", .{});
+            break;
+        }
     }
+
+    std.debug.print("array list len: {d}", .{tokens.items.len});
 }
+
+/// Ignores all whitespace from `start`,
+/// and returns the position where whitespace ends.
+///
+/// Whitespace is: tabs, spaces
+pub fn ignore_whitespace(input: []const u8, start: usize) usize {
+    const cap = input.len;
+    var pos = start;
+    while (pos < cap and (input[pos] == ' ' or input[pos] == '\t')) {
+        pos += 1;
+    }
+    return pos;
+}
+
+test "should insert 1 item" {
+    const input = "322";
+    try tokenize(input, std.testing.allocator);
+}
+
+test "should insert 2 item" {
+    const input = "322 644";
+    try tokenize(input, std.testing.allocator);
+}
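Editor's note: `number.lex` itself is not part of this diff. Judging only from the call sites above (`tuple[0]` for the token, `tuple[1]` for the position after it), it yields an optional (Token, next position) pair, or null when nothing matches. A minimal sketch of that presumed contract follows; the Token/TokenType definitions here are stand-ins, since token.zig is also outside this diff:

const std = @import("std");

// Stand-ins: the real Token/TokenType live in token.zig (not shown in this commit).
const TokenType = enum { Int };
const Token = struct {
    value: []const u8,
    token_type: TokenType,
    start: usize,
};

// Presumed shape of number.lex: scan a run of ASCII digits starting at
// `start`; yield the token plus the position right after it, or null
// when no digit is found (so tokenize falls through to its else branch).
fn lex(input: []const u8, cap: usize, start: usize) !?struct { Token, usize } {
    var pos = start;
    while (pos < cap and input[pos] >= '0' and input[pos] <= '9') {
        pos += 1;
    }
    if (pos == start) return null;
    return .{
        Token{ .value = input[start..pos], .token_type = .Int, .start = start },
        pos,
    };
}

test "lex yields the token and the next position" {
    const result = try lex("322 644", 7, 0);
    const tuple = result.?;
    try std.testing.expectEqualStrings("322", tuple[0].value);
    try std.testing.expectEqual(@as(usize, 3), tuple[1]);
}

Returning the next position alongside the token is what lets the loop advance with `current_pos = tuple[1]` and re-run `ignore_whitespace` before the next match attempt.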

@@ -24,7 +24,10 @@ fn repl() !void {
         defer std.heap.page_allocator.free(bare_line);
         const line = std.mem.trim(u8, bare_line, "\r");

-        try lexic.tokenize(line);
+        var gpa = std.heap.GeneralPurposeAllocator(.{}){};
+        const alloc = gpa.allocator();
+
+        try lexic.tokenize(line, alloc);

         try bw.flush();
     }
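Editor's note on this second hunk: the diff constructs a fresh `GeneralPurposeAllocator` on every pass through the REPL loop and never calls `deinit` on it, so its leak check never runs. A common arrangement is to create the GPA once, outside the loop. The sketch below shows that shape; the line-reading details are assumptions for a self-contained example, not this repo's actual repl code:

const std = @import("std");

pub fn main() !void {
    // One GPA for the whole session; the deferred deinit runs its
    // leak check once, when the program exits (in debug builds).
    var gpa = std.heap.GeneralPurposeAllocator(.{}){};
    defer _ = gpa.deinit();
    const alloc = gpa.allocator();

    const stdin = std.io.getStdIn().reader();
    var buf: [1024]u8 = undefined;

    while (try stdin.readUntilDelimiterOrEof(&buf, '\n')) |bare_line| {
        const line = std.mem.trim(u8, bare_line, "\r");
        // Here the commit would call: try lexic.tokenize(line, alloc);
        // Stand-in allocation so the GPA has something to track:
        const copy = try alloc.dupe(u8, line);
        defer alloc.free(copy);
        std.debug.print("read: {s}\n", .{copy});
    }
}

The tests added in the first file sidestep the question entirely by passing `std.testing.allocator`, which fails the test on any leaked allocation.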