1 files changed, 52 insertions, 0 deletions
diff --git a/data/unicode/NormalizationCorrections.txt b/data/unicode/NormalizationCorrections.txt
new file mode 100644
index 0000000..8cfb588
--- /dev/null
+++ b/data/unicode/NormalizationCorrections.txt
@@ -0,0 +1,52 @@
+# NormalizationCorrections-15.1.0.txt
+# Date: 2023-01-05
+# © 2023 Unicode®, Inc.
+# For terms of use, see https://www.unicode.org/terms_of_use.html
+#
+# Unicode Character Database
+# For documentation, see https://www.unicode.org/reports/tr44/
+#
+# This file is a normative contributory data file in the
+# Unicode Character Database.
+#
+# The normalization stability policy of the Unicode Consortium
+# ordinarily precludes any change to the decomposition
+# for any character, once established in a relevant version
+# of the UnicodeData.txt data file. However, under certain
+# exceptional (and rare) conditions, an error in a decomposition
+# mapping may be discovered that is truly just an unintended
+# typo in the data, and not a matter of dubious interpretation.
+#
+# Whenever such an error may be found, and if it meets the
+# requirements for possible exceptions to normalization
+# stability, the correction is entered in this data file,
+# so that any implementation depending on absolute stability
+# of normalization, *including* any errors in the data, can
+# safely reconstruct the exact state of the data tables at
+# any given version of Unicode.
+#
+# Currently this list has exactly six entries in it, one for the
+# typo found and corrected in Corrigendum #3, and five for
+# the typos and misidentifications found and corrected in
+# Corrigendum #4. All efforts
+# will be made to keep the entries limited to just those fixes.
+#
+# Interpretation of the fields:
+#   Field 0: Unicode code point
+#   Field 1: Original (erroneous) decomposition
+#   Field 2: Corrected decomposition
+#   Field 3: Version of Unicode for which the correction was
+#            entered into UnicodeData.txt, in n.n.n format.
+#   Comment: Indicates the Unicode Corrigendum which documents
+#            the correction
+#
+# For more information, see UAX #15, Unicode Normalization Forms.
+#
+F951;96FB;964B;3.2.0 # Corrigendum 3
+2F868;2136A;36FC;4.0.0 # Corrigendum 4
+2F874;5F33;5F53;4.0.0 # Corrigendum 4
+2F91F;43AB;243AB;4.0.0 # Corrigendum 4
+2F95F;7AAE;7AEE;4.0.0 # Corrigendum 4
+2F9BF;4D57;45D7;4.0.0 # Corrigendum 4
+
+# EOF

diff --git a/data/unicode/NormalizationCorrections.txt b/data/unicode/NormalizationCorrections.txt new file mode 100644 index 0000000..8cfb588 --- /dev/null +++ b/data/unicode/NormalizationCorrections.txt
@@ -0,0 +1,52 @@
	1	# NormalizationCorrections-15.1.0.txt
	2	# Date: 2023-01-05
	3	# © 2023 Unicode®, Inc.
	4	# For terms of use, see https://www.unicode.org/terms_of_use.html
	5	#
	6	# Unicode Character Database
	7	# For documentation, see https://www.unicode.org/reports/tr44/
	8	#
	9	# This file is a normative contributory data file in the
	10	# Unicode Character Database.
	11	#
	12	# The normalization stability policy of the Unicode Consortium
	13	# ordinarily precludes any change to the decomposition
	14	# for any character, once established in a relevant version
	15	# of the UnicodeData.txt data file. However, under certain
	16	# exceptional (and rare) conditions, an error in a decomposition
	17	# mapping may be discovered that is truly just an unintended
	18	# typo in the data, and not a matter of dubious interpretation.
	19	#
	20	# Whenever such an error may be found, and if it meets the
	21	# requirements for possible exceptions to normalization
	22	# stability, the correction is entered in this data file,
	23	# so that any implementation depending on absolute stability
	24	# of normalization, *including* any errors in the data, can
	25	# safely reconstruct the exact state of the data tables at
	26	# any given version of Unicode.
	27	#
	28	# Currently this list has exactly six entries in it, one for the
	29	# typo found and corrected in Corrigendum #3, and five for
	30	# the typos and misidentifications found and corrected in
	31	# Corrigendum #4. All efforts
	32	# will be made to keep the entries limited to just those fixes.
	33	#
	34	# Interpretation of the fields:
	35	#   Field 0: Unicode code point
	36	#   Field 1: Original (erroneous) decomposition
	37	#   Field 2: Corrected decomposition
	38	#   Field 3: Version of Unicode for which the correction was
	39	#            entered into UnicodeData.txt, in n.n.n format.
	40	#   Comment: Indicates the Unicode Corrigendum which documents
	41	#            the correction
	42	#
	43	# For more information, see UAX #15, Unicode Normalization Forms.
	44	#
	45	F951;96FB;964B;3.2.0 # Corrigendum 3
	46	2F868;2136A;36FC;4.0.0 # Corrigendum 4
	47	2F874;5F33;5F53;4.0.0 # Corrigendum 4
	48	2F91F;43AB;243AB;4.0.0 # Corrigendum 4
	49	2F95F;7AAE;7AEE;4.0.0 # Corrigendum 4
	50	2F9BF;4D57;45D7;4.0.0 # Corrigendum 4
	51
	52	# EOF