aboutsummaryrefslogtreecommitdiffhomepage
path: root/src/jq/tokenize.zig
blob: 92f96ca888ea5308b3f5a3b9cf78f9c9c9fab261 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
const std = @import("std");

pub const TokenizeError = error{
    UnexpectedEnd,
    InvalidCharacter,
};

pub const TokenKind = enum {
    end,
    dot,
    bracket_left,
    bracket_right,
    number,
};

pub const Token = union(TokenKind) {
    end,
    dot,
    bracket_left,
    bracket_right,
    number: i64,

    pub fn kind(self: @This()) TokenKind {
        return self;
    }
};

pub fn tokenize(allocator: std.mem.Allocator, query: []const u8) ![]Token {
    var tokens = try std.array_list.Aligned(Token, null).initCapacity(allocator, 16);

    const len = query.len;

    if (len == 0) {
        return error.UnexpectedEnd;
    }

    var i: usize = 0;
    while (i < len) {
        const c = query[i];
        switch (c) {
            '.' => try tokens.append(allocator, .dot),
            '[' => try tokens.append(allocator, .bracket_left),
            ']' => try tokens.append(allocator, .bracket_right),
            else => {
                if (std.ascii.isDigit(c)) {
                    try tokens.append(allocator, .{ .number = (c - '0') });
                } else {
                    return error.InvalidCharacter;
                }
            },
        }
        i += 1;
    }

    try tokens.append(allocator, .end);
    return tokens.toOwnedSlice(allocator);
}