From 681212c02b0977fd1367185dce24a6250fbe299e Mon Sep 17 00:00:00 2001 From: Robin Leroy Date: Fri, 24 May 2024 20:47:16 +0200 Subject: [PATCH] Make the invariant relating Cased to Case_Ignorable more maintainable (#831) --- .../unicode/text/UCD/UnicodeInvariantTest.txt | 19 ++++--------------- 1 file changed, 4 insertions(+), 15 deletions(-) diff --git a/unicodetools/src/main/resources/org/unicode/text/UCD/UnicodeInvariantTest.txt b/unicodetools/src/main/resources/org/unicode/text/UCD/UnicodeInvariantTest.txt index 82dfcf553..d9cbb53a4 100644 --- a/unicodetools/src/main/resources/org/unicode/text/UCD/UnicodeInvariantTest.txt +++ b/unicodetools/src/main/resources/org/unicode/text/UCD/UnicodeInvariantTest.txt @@ -227,21 +227,10 @@ In \P{U-1:gc=Cn}, R-1:NFKC_Simple_Casefold = NFKC_Simple_Casefold # Case Pair Stability: If two characters form a case pair in a version of Unicode, they will remain a case pair in each subsequent version of Unicode. If two characters do not form a case pair in a version of Unicode, they will never become a case pair in any subsequent version of Unicode. # TODO -# Red Flag: cased and case_ignorable should be disjoint - -Let $caseOverlap = [\u02B0-\u02B8\u02C0\u02C1\u02E0-\u02E4\u0345\u037A\u10FC\u1D2C-\u1D61\u1D78\u1D9B-\u1DBF\u2090-\u2094\u2C7D\uA770[\u1D62-\u1D6A\u2071\u207F\u2095-\u209C\u2C7C\uA7F2-\uA7F4\uA7F8\uA7F9 \uA69C-\uA69D\uAB5C-\uAB5F\uAB69]\U00010780\U00010783-\U00010785\U00010787-\U000107B0\U000107B2-\U000107BA\U0001E030-\U0001E06D] -# 6.1.0, added 22 overlap characters -# 7.0 added \uA69C-\uA69D\uAB5C-\uAB5F -# 14.0 new modifier letters in Latin Extended-F are Lowercase (U+107xx) -# 15.0 new modifier letters in Cyrillic Extended-D are Lowercase (U+1E030..1E06C) -# 15.0 [172-A58] Action Item for Markus Scherer, PAG: -# Give the Other_Lowercase property (and thus also Cased) -# to modifier letter U+1E06D, for Unicode Version 15.0. See L2/22-124 item UCD3. -# 15.0 [172-A59] Action Item for Markus Scherer, PAG: -# Give the Other_Lowercase property (and thus also Cased) -# to the modifier letters U+10FC and U+A7F2..A7F4 and U+AB69, -# for Unicode Version 15.0. See L2/22-124 item UCD4. -\p{cased} ∥ [\p{caseignorable} - $caseOverlap] +# Red Flag: cased and case_ignorable should be disjoint, +# except for modifier letters and ◌ͅ. + +\p{Cased} ∥ [\p{Case_Ignorable} - \p{gc=Lm} - \N{COMBINING GREEK YPOGEGRAMMENI} ] ########################## # Property Stability Policies