From f1cfab7059e922d45ebbe19c58acef8fa80dc85e Mon Sep 17 00:00:00 2001 From: Jose Colon Rodriguez Date: Sun, 31 Mar 2024 11:26:14 -0400 Subject: Added benchmarks; Unicode version; Removed Ziglyph dep --- bench/src/ziglyph_normalizer.zig | 75 ++++++++++++++++++++++++++++++++++++++++ 1 file changed, 75 insertions(+) create mode 100644 bench/src/ziglyph_normalizer.zig (limited to 'bench/src/ziglyph_normalizer.zig') diff --git a/bench/src/ziglyph_normalizer.zig b/bench/src/ziglyph_normalizer.zig new file mode 100644 index 0000000..fea162c --- /dev/null +++ b/bench/src/ziglyph_normalizer.zig @@ -0,0 +1,75 @@ +const std = @import("std"); + +const Normalizer = @import("ziglyph").Normalizer; + +pub fn main() !void { + var args_iter = std.process.args(); + _ = args_iter.skip(); + const in_path = args_iter.next() orelse return error.MissingArg; + + var arena = std.heap.ArenaAllocator.init(std.heap.page_allocator); + defer arena.deinit(); + const allocator = arena.allocator(); + + const input = try std.fs.cwd().readFileAlloc( + allocator, + in_path, + std.math.maxInt(u32), + ); + defer allocator.free(input); + + var normalizer = try Normalizer.init(allocator); + + var iter = std.mem.splitScalar(u8, input, '\n'); + var result: usize = 0; + var timer = try std.time.Timer.start(); + + while (iter.next()) |line| { + const nfkc = try normalizer.nfkc(allocator, line); + result += nfkc.slice.len; + } + std.debug.print("Ziglyph Normalizer.nfkc: result: {}, took: {}\n", .{ result, timer.lap() / std.time.ns_per_ms }); + + result = 0; + iter.reset(); + timer.reset(); + + while (iter.next()) |line| { + const nfc = try normalizer.nfc(allocator, line); + result += nfc.slice.len; + } + std.debug.print("Ziglyph Normalizer.nfc: result: {}, took: {}\n", .{ result, timer.lap() / std.time.ns_per_ms }); + + result = 0; + iter.reset(); + timer.reset(); + + while (iter.next()) |line| { + const nfkd = try normalizer.nfkd(allocator, line); + result += nfkd.slice.len; + } + std.debug.print("Ziglyph Normalizer.nfkd: result: {}, took: {}\n", .{ result, timer.lap() / std.time.ns_per_ms }); + + result = 0; + iter.reset(); + timer.reset(); + + while (iter.next()) |line| { + const nfd = try normalizer.nfd(allocator, line); + result += nfd.slice.len; + } + std.debug.print("Ziglyph Normalizer.nfd: result: {}, took: {}\n", .{ result, timer.lap() / std.time.ns_per_ms }); + + result = 0; + iter.reset(); + var buf: [256]u8 = [_]u8{'z'} ** 256; + var prev_line: []const u8 = buf[0..1]; + timer.reset(); + + while (iter.next()) |line| { + if (try normalizer.eql(allocator, prev_line, line)) result += 1; + @memcpy(buf[0..line.len], line); + prev_line = buf[0..line.len]; + } + std.debug.print("Ziglyph Normalizer.eql: result: {}, took: {}\n", .{ result, timer.lap() / std.time.ns_per_ms }); +} -- cgit v1.2.3