diff options
| author | 2025-04-30 12:58:26 -0400 | |
|---|---|---|
| committer | 2025-04-30 13:01:37 -0400 | |
| commit | 3c2c30bfbe861c6c48acd8d7507886787197a788 (patch) | |
| tree | 875ba35c1954b201207452b18a189ebd70c0b596 /src/NormPropsData.zig | |
| parent | grapheme now Graphemes, Data files gone (diff) | |
| download | zg-3c2c30bfbe861c6c48acd8d7507886787197a788.tar.gz zg-3c2c30bfbe861c6c48acd8d7507886787197a788.tar.xz zg-3c2c30bfbe861c6c48acd8d7507886787197a788.zip | |
Merge NormData with Normalize
Diffstat (limited to 'src/NormPropsData.zig')
| -rw-r--r-- | src/NormPropsData.zig | 50 |
1 file changed, 26 insertions, 24 deletions
diff --git a/src/NormPropsData.zig b/src/NormPropsData.zig index e79ae91..ca69569 100644 --- a/src/NormPropsData.zig +++ b/src/NormPropsData.zig | |||
| @@ -1,15 +1,11 @@ | |||
| 1 | const std = @import("std"); | 1 | //! Normalization Properties Data |
| 2 | const builtin = @import("builtin"); | ||
| 3 | const compress = std.compress; | ||
| 4 | const mem = std.mem; | ||
| 5 | const testing = std.testing; | ||
| 6 | 2 | ||
| 7 | s1: []u16 = undefined, | 3 | s1: []u16 = undefined, |
| 8 | s2: []u4 = undefined, | 4 | s2: []u4 = undefined, |
| 9 | 5 | ||
| 10 | const Self = @This(); | 6 | const NormProps = @This(); |
| 11 | 7 | ||
| 12 | pub fn init(allocator: mem.Allocator) !Self { | 8 | pub fn init(allocator: mem.Allocator) !NormProps { |
| 13 | const decompressor = compress.flate.inflate.decompressor; | 9 | const decompressor = compress.flate.inflate.decompressor; |
| 14 | const in_bytes = @embedFile("normp"); | 10 | const in_bytes = @embedFile("normp"); |
| 15 | var in_fbs = std.io.fixedBufferStream(in_bytes); | 11 | var in_fbs = std.io.fixedBufferStream(in_bytes); |
| @@ -17,37 +13,43 @@ pub fn init(allocator: mem.Allocator) !Self { | |||
| 17 | var reader = in_decomp.reader(); | 13 | var reader = in_decomp.reader(); |
| 18 | 14 | ||
| 19 | const endian = builtin.cpu.arch.endian(); | 15 | const endian = builtin.cpu.arch.endian(); |
| 20 | var self = Self{}; | 16 | var norms = NormProps{}; |
| 21 | 17 | ||
| 22 | const stage_1_len: u16 = try reader.readInt(u16, endian); | 18 | const stage_1_len: u16 = try reader.readInt(u16, endian); |
| 23 | self.s1 = try allocator.alloc(u16, stage_1_len); | 19 | norms.s1 = try allocator.alloc(u16, stage_1_len); |
| 24 | errdefer allocator.free(self.s1); | 20 | errdefer allocator.free(norms.s1); |
| 25 | for (0..stage_1_len) |i| self.s1[i] = try reader.readInt(u16, endian); | 21 | for (0..stage_1_len) |i| norms.s1[i] = try reader.readInt(u16, endian); |
| 26 | 22 | ||
| 27 | const stage_2_len: u16 = try reader.readInt(u16, endian); | 23 | const stage_2_len: u16 = try reader.readInt(u16, endian); |
| 28 | self.s2 = try allocator.alloc(u4, stage_2_len); | 24 | norms.s2 = try allocator.alloc(u4, stage_2_len); |
| 29 | errdefer allocator.free(self.s2); | 25 | errdefer allocator.free(norms.s2); |
| 30 | for (0..stage_2_len) |i| self.s2[i] = @intCast(try reader.readInt(u8, endian)); | 26 | for (0..stage_2_len) |i| norms.s2[i] = @intCast(try reader.readInt(u8, endian)); |
| 31 | 27 | ||
| 32 | return self; | 28 | return norms; |
| 33 | } | 29 | } |
| 34 | 30 | ||
| 35 | pub fn deinit(self: *const Self, allocator: mem.Allocator) void { | 31 | pub fn deinit(norms: *const NormProps, allocator: mem.Allocator) void { |
| 36 | allocator.free(self.s1); | 32 | allocator.free(norms.s1); |
| 37 | allocator.free(self.s2); | 33 | allocator.free(norms.s2); |
| 38 | } | 34 | } |
| 39 | 35 | ||
| 40 | /// Returns true if `cp` is already in NFD form. | 36 | /// Returns true if `cp` is already in NFD form. |
| 41 | pub fn isNfd(self: Self, cp: u21) bool { | 37 | pub fn isNfd(norms: *const NormProps, cp: u21) bool { |
| 42 | return self.s2[self.s1[cp >> 8] + (cp & 0xff)] & 1 == 0; | 38 | return norms.s2[norms.s1[cp >> 8] + (cp & 0xff)] & 1 == 0; |
| 43 | } | 39 | } |
| 44 | 40 | ||
| 45 | /// Returns true if `cp` is already in NFKD form. | 41 | /// Returns true if `cp` is already in NFKD form. |
| 46 | pub fn isNfkd(self: Self, cp: u21) bool { | 42 | pub fn isNfkd(norms: *const NormProps, cp: u21) bool { |
| 47 | return self.s2[self.s1[cp >> 8] + (cp & 0xff)] & 2 == 0; | 43 | return norms.s2[norms.s1[cp >> 8] + (cp & 0xff)] & 2 == 0; |
| 48 | } | 44 | } |
| 49 | 45 | ||
| 50 | /// Returns true if `cp` is not allowed in any normalized form. | 46 | /// Returns true if `cp` is not allowed in any normalized form. |
| 51 | pub fn isFcx(self: Self, cp: u21) bool { | 47 | pub fn isFcx(norms: *const NormProps, cp: u21) bool { |
| 52 | return self.s2[self.s1[cp >> 8] + (cp & 0xff)] & 4 == 4; | 48 | return norms.s2[norms.s1[cp >> 8] + (cp & 0xff)] & 4 == 4; |
| 53 | } | 49 | } |
| 50 | |||
| 51 | const std = @import("std"); | ||
| 52 | const builtin = @import("builtin"); | ||
| 53 | const compress = std.compress; | ||
| 54 | const mem = std.mem; | ||
| 55 | const testing = std.testing; | ||