//! Benchmark driver for Ziglyph's `Normalizer.eqlCaseless`.
//!
//! Reads the file named by the first command-line argument, splits it on
//! '\n', and compares every line against the line before it using
//! `eqlCaseless`. Prints the number of comparisons that returned true and the
//! elapsed time of the comparison loop.
//
// Provenance: bench/src/ziglyph_caseless.zig as introduced by commit
// f1cfab7059e922d45ebbe19c58acef8fa80dc85e (Jose Colon Rodriguez, 2024-03-31),
// "Added benchmarks; Unicode version; Removed Ziglyph dep".

const std = @import("std");

const Normalizer = @import("ziglyph").Normalizer;

/// Entry point.
///
/// Returns `error.MissingArg` when no input path is given on the command
/// line; file, allocation, timer, and normalizer errors are propagated as-is.
pub fn main() !void {
    var args_iter = std.process.args();
    _ = args_iter.skip(); // skip the executable name
    const in_path = args_iter.next() orelse return error.MissingArg;

    // Everything is allocated from one arena that is released on exit.
    var arena = std.heap.ArenaAllocator.init(std.heap.page_allocator);
    defer arena.deinit();
    const allocator = arena.allocator();

    const input = try std.fs.cwd().readFileAlloc(
        allocator,
        in_path,
        std.math.maxInt(u32),
    );
    defer allocator.free(input);

    var normalizer = try Normalizer.init(allocator);

    // Scratch space holding a copy of the previously visited line. A line can
    // never be longer than the whole input, so sizing the buffer to
    // `input.len` guarantees every copy below fits (a fixed 256-byte buffer
    // would be overrun by any longer line). At least one byte is reserved for
    // the initial "z" placeholder that the first line is compared against.
    const buf = try allocator.alloc(u8, @max(input.len, 1));
    defer allocator.free(buf);
    buf[0] = 'z';
    var prev_line: []const u8 = buf[0..1];

    var iter = std.mem.splitScalar(u8, input, '\n');
    var result: usize = 0;

    // The timer starts after all setup so only the comparison loop is timed.
    var timer = try std.time.Timer.start();

    while (iter.next()) |line| {
        if (try normalizer.eqlCaseless(allocator, prev_line, line)) result += 1;
        // Keep the per-iteration copy so the timed loop performs the same
        // work as before; `buf` and `input` are separate allocations, so the
        // source and destination never overlap.
        @memcpy(buf[0..line.len], line);
        prev_line = buf[0..line.len];
    }

    // `timer.lap()` yields nanoseconds; the printed figure is milliseconds.
    std.debug.print("Ziglyph Normalizer.eqlCaseless: result: {}, took: {}\n", .{ result, timer.lap() / std.time.ns_per_ms });
}