//! Benchmark driver for the `Normalize` module.
//!
//! Usage: pass the path of a text file as the first command-line argument.
//! The file is split on '\n' and every line is run through `nfkc`, `nfc`,
//! `nfkd` and `nfd`, followed by an `eql` pass over consecutive lines. Each
//! pass prints an accumulated `result` value and the elapsed time in
//! milliseconds via `std.debug.print`.

// Provenance (recovered from the patch header this file was extracted from):
//   commit  f1cfab7059e922d45ebbe19c58acef8fa80dc85e
//   author  Jose Colon Rodriguez
//   date    Sun, 31 Mar 2024 11:26:14 -0400
//   subject Added benchmarks; Unicode version; Removed Ziglyph dep
//   path    bench/src/zg_normalize.zig (new file in that commit)

const std = @import("std");

const Normalize = @import("Normalize");

/// Entry point: times each `Normalize` operation over the lines of the file
/// named by the first command-line argument.
///
/// Errors:
/// - `error.MissingArg` when no input path is given.
/// - Any error from reading the file, starting the timer, initialising
///   `Normalize.NormData`, or from the `Normalize` calls themselves.
pub fn main() !void {
    var args_iter = std.process.args();
    // Skip argv[0] (the executable name).
    _ = args_iter.skip();
    const in_path = args_iter.next() orelse return error.MissingArg;

    // Everything below allocates from this arena; nothing is released
    // individually, the arena is torn down once at exit.
    var arena = std.heap.ArenaAllocator.init(std.heap.page_allocator);
    defer arena.deinit();
    const allocator = arena.allocator();

    const input = try std.fs.cwd().readFileAlloc(
        allocator,
        in_path,
        std.math.maxInt(u32),
    );
    defer allocator.free(input);

    const norm_data = try Normalize.NormData.init(allocator);
    const normalize = Normalize{ .norm_data = &norm_data };

    var iter = std.mem.splitScalar(u8, input, '\n');
    var result: usize = 0;
    var timer = try std.time.Timer.start();

    // `result` accumulates the output lengths so the work is observable.
    while (iter.next()) |line| {
        const nfkc = try normalize.nfkc(allocator, line);
        result += nfkc.slice.len;
    }
    // `timer.lap()` yields nanoseconds; dividing by `ns_per_ms` prints milliseconds.
    std.debug.print("zg Normalize.nfkc: result: {}, took: {}\n", .{ result, timer.lap() / std.time.ns_per_ms });

    result = 0;
    iter.reset();
    timer.reset();

    while (iter.next()) |line| {
        const nfc = try normalize.nfc(allocator, line);
        result += nfc.slice.len;
    }
    std.debug.print("zg Normalize.nfc: result: {}, took: {}\n", .{ result, timer.lap() / std.time.ns_per_ms });

    result = 0;
    iter.reset();
    timer.reset();

    while (iter.next()) |line| {
        const nfkd = try normalize.nfkd(allocator, line);
        result += nfkd.slice.len;
    }
    std.debug.print("zg Normalize.nfkd: result: {}, took: {}\n", .{ result, timer.lap() / std.time.ns_per_ms });

    result = 0;
    iter.reset();
    timer.reset();

    while (iter.next()) |line| {
        const nfd = try normalize.nfd(allocator, line);
        result += nfd.slice.len;
    }
    std.debug.print("zg Normalize.nfd: result: {}, took: {}\n", .{ result, timer.lap() / std.time.ns_per_ms });

    result = 0;
    iter.reset();
    // Compare every line with the one before it; the very first line is
    // compared against the one-byte string "z".
    //
    // `prev_line` points straight into `input`, which stays alive until
    // `main` returns. The earlier version copied each line into a fixed
    // 256-byte stack buffer, which sliced out of bounds for any line longer
    // than 256 bytes.
    var prev_line: []const u8 = "z";
    timer.reset();

    // Here `result` counts the adjacent pairs that `eql` reports as equal.
    while (iter.next()) |line| {
        if (try normalize.eql(allocator, prev_line, line)) result += 1;
        prev_line = line;
    }
    std.debug.print("Zg Normalize.eql: result: {}, took: {}\n", .{ result, timer.lap() / std.time.ns_per_ms });
}