summaryrefslogtreecommitdiff
path: root/src/main.zig
blob: 52d823c55ab63dbbd3c298b44a6f88e8d5ab4753 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
const std = @import("std");

// const GraphemeIterator = @import("ziglyph").GraphemeIterator;
// const Data = @import("grapheme").Data;
// const GraphemeIterator = @import("grapheme").Iterator;

// const codePointWidth = @import("ziglyph").display_width.codePointWidth;
// const strWidth = @import("ziglyph").display_width.strWidth;
// const Data = @import("display_width").Data;
// const codePointWidth = @import("display_width").codePointWidth;
// const strWidth = @import("display_width").strWidth;

// const CodePointIterator = @import("ziglyph").CodePointIterator;
const CodePointIterator = @import("code_point").Iterator;

// const ascii = @import("ascii");
// const ascii = std.ascii;

// const Normalize = @import("ziglyph").Normalizer;
// const Normalize = @import("Normalize");

// const CaseFold = @import("CaseFold");

// const GenCatData = @import("GenCatData");

const NumericData = @import("NumericData");

/// Benchmark driver: reads the file named by the first command-line argument,
/// iterates over it with `CodePointIterator`, counts the items for which
/// `num_data.isNumberic` returns true, and prints that count together with the
/// time spent in the counting loop (nanoseconds divided by `ns_per_ms`).
///
/// Returns `error.MissingArg` when no path argument is supplied. Errors from
/// argument setup, reading the file, `NumericData.init`, and starting the
/// timer are propagated to the caller unchanged.
pub fn main() !void {
    // A single arena backs every allocation made below.
    var arena = std.heap.ArenaAllocator.init(std.heap.page_allocator);
    defer arena.deinit();
    const allocator = arena.allocator();

    // `std.process.args()` is a compile error on Windows and WASI; the
    // allocator-taking variant works on every target.
    var args_iter = try std.process.argsWithAllocator(allocator);
    defer args_iter.deinit();
    _ = args_iter.skip(); // skip the program name
    const in_path = args_iter.next() orelse return error.MissingArg;

    const input = try std.fs.cwd().readFileAlloc(
        allocator,
        in_path,
        std.math.maxInt(u32),
    );
    defer allocator.free(input);

    // var norm_data = try Normalize.NormData.init(allocator);
    // defer norm_data.deinit();
    // var norm = Normalize{ .norm_data = &norm_data };
    // var norm = try Normalize.init(allocator);
    // defer norm.deinit();

    // var gencat_data = try GenCatData.init(allocator);
    // defer gencat_data.deinit();

    // var fold_data = try CaseFold.FoldData.init(allocator);
    // defer fold_data.deinit();
    // var caser = CaseFold{ .fold_data = &fold_data };

    var num_data = try NumericData.init(allocator);
    defer num_data.deinit();

    // var iter = GraphemeIterator.init(input, &data);
    // defer iter.deinit();
    var iter = CodePointIterator{ .bytes = input };
    // var iter = std.mem.splitScalar(u8, input, '\n');

    var result: usize = 0;
    // var prev_line: []const u8 = "";
    // var result: isize = 0;

    // Started only after all setup so that the measurement covers just the
    // loop below.
    var timer = try std.time.Timer.start();

    // while (iter.next()) |cp| result += codePointWidth(@intCast(cp.code));
    // while (iter.next()) |_| result += 1;
    // while (iter.next()) |line| result += strWidth(line, &data);
    // while (iter.next()) |line| {
    //     const nfc = try norm.nfc(allocator, line);
    //     result += nfc.slice.len;
    //     // nfc.deinit();
    // }
    // while (iter.next()) |cp| {
    //     if (cp.code == 'É') std.debug.print("`{u}` Gc: {s}\n", .{ cp.code, @tagName(gencat_data.gc(cp.code)) });
    //     result += 1;
    // }
    // while (iter.next()) |line| {
    //     if (try caser.canonCaselessMatch(allocator, &norm, prev_line, line)) {
    //         result += line.len;
    //     }
    //     prev_line = line;
    // }

    // NOTE(review): `isNumberic` looks like a typo for `isNumeric`, and `cp`
    // is the whole iterator item rather than a scalar such as `cp.code` (as
    // used in the commented-out variants above) — confirm against the
    // NumericData API before relying on this variant.
    while (iter.next()) |cp| {
        if (num_data.isNumberic(cp)) result += 1;
    }

    std.debug.print("result: {}, took: {}\n", .{ result, timer.lap() / std.time.ns_per_ms });
}