X-Git-Url: https://gitweb.factorcode.org/gitweb.cgi?p=factor.git;a=blobdiff_plain;f=basis%2Funicode%2FUCA%2Fdecomps.txt;h=34898a5bebb7fb0c7e20a8dd8cfcc34d07af767b;hp=3a60aa1a9fd97db682cf3c770023311f2ccc1292;hb=e3f197c3bbd776e9bb83d7fa8598687a8842d0b6;hpb=631f909b7c6544e3391bdecb4139e7e2015ae69e diff --git a/basis/unicode/UCA/decomps.txt b/basis/unicode/UCA/decomps.txt index 3a60aa1a9f..34898a5beb 100644 --- a/basis/unicode/UCA/decomps.txt +++ b/basis/unicode/UCA/decomps.txt @@ -1,7 +1,7 @@ -# decomps-14.0.0.txt -# Date: 2021-06-07, 20:52:26 GMT [KW] -# Copyright 2021 Unicode, Inc. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# decomps-15.0.0.txt +# Date: 2022-08-09, 16:06:35 GMT [KW] +# Copyright 2022 Unicode, Inc. +# For terms of use, see https://www.unicode.org/terms_of_use.html # # This file lists decompositions used in generating the Default Unicode Collation Element Table # (DUCET) for the Unicode Collation Algorithm @@ -721,6 +721,7 @@ 0CCB;;0CC6 0CC2 0CD5 # KANNADA VOWEL SIGN OO => KANNADA VOWEL SIGN E + KANNADA VOWEL SIGN UU + KANNADA LENGTH MARK 0CCB;;0CCA 0CD5 # KANNADA VOWEL SIGN OO => KANNADA VOWEL SIGN O + KANNADA LENGTH MARK 0CDD;;0CA8 0CCD # KANNADA LETTER NAKAARA POLLU => KANNADA LETTER NA + KANNADA SIGN VIRAMA +0CF3;;0902 # KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT => DEVANAGARI SIGN ANUSVARA 0D00;;0902 # MALAYALAM SIGN COMBINING ANUSVARA ABOVE => DEVANAGARI SIGN ANUSVARA 0D01;;0901 # MALAYALAM SIGN CANDRABINDU => DEVANAGARI SIGN CANDRABINDU 0D02;;0902 # MALAYALAM SIGN ANUSVARA => DEVANAGARI SIGN ANUSVARA @@ -782,6 +783,8 @@ 0F7E;;0902 # TIBETAN SIGN RJES SU NGA RO => DEVANAGARI SIGN ANUSVARA 0F7F;;0903 # TIBETAN SIGN RNAM BCAD => DEVANAGARI SIGN VISARGA 0F81;;0F71 0F80 # TIBETAN VOWEL SIGN REVERSED II => TIBETAN VOWEL SIGN AA + TIBETAN VOWEL SIGN REVERSED I +0F82;;0901 # TIBETAN SIGN NYI ZLA NAA DA => DEVANAGARI SIGN CANDRABINDU +0F83;;0901 # TIBETAN SIGN SNA LDAN => DEVANAGARI SIGN CANDRABINDU 0F93;;0F92 0FB7 # TIBETAN SUBJOINED LETTER GHA => TIBETAN SUBJOINED LETTER GA + TIBETAN SUBJOINED LETTER HA 0F9D;;0F9C 0FB7 # TIBETAN SUBJOINED LETTER DDHA => TIBETAN SUBJOINED LETTER DDA + TIBETAN SUBJOINED LETTER HA 0FA2;;0FA1 0FB7 # TIBETAN SUBJOINED LETTER DHA => TIBETAN SUBJOINED LETTER DA + TIBETAN SUBJOINED LETTER HA @@ -4778,6 +4781,7 @@ FFEB;;2192 # HALFWIDTH RIGHTWARDS ARROW => RIGHTWARDS ARROW FFEC;;2193 # HALFWIDTH DOWNWARDS ARROW => DOWNWARDS ARROW FFED;;25A0 # HALFWIDTH BLACK SQUARE => BLACK SQUARE FFEE;;25CB # HALFWIDTH WHITE CIRCLE => WHITE CIRCLE +101FD;;F8F6 # PHAISTOS DISC SIGN COMBINING OBLIQUE STROKE => GENERIC MARK BELOW 10376;;10350 # COMBINING OLD PERMIC LETTER AN => OLD PERMIC LETTER AN 10377;;10353 # COMBINING OLD PERMIC LETTER DOI => OLD PERMIC LETTER DOI 10378;;10357 # COMBINING OLD PERMIC LETTER ZATA => OLD PERMIC LETTER ZATA @@ -5090,6 +5094,9 @@ FFEE;;25CB # HALFWIDTH WHITE CIRCLE => WHITE CIRCLE 11D47;;11D26 # MASARAM GONDI RA-KARA => MASARAM GONDI LETTER RA 11D95;;0902 # GUNJALA GONDI SIGN ANUSVARA => DEVANAGARI SIGN ANUSVARA 11D96;;0903 # GUNJALA GONDI SIGN VISARGA => DEVANAGARI SIGN VISARGA +11F00;;0901 # KAWI SIGN CANDRABINDU => DEVANAGARI SIGN CANDRABINDU +11F01;;0902 # KAWI SIGN ANUSVARA => DEVANAGARI SIGN ANUSVARA +11F03;;0903 # KAWI SIGN VISARGA => DEVANAGARI SIGN VISARGA 16E94;;16E81 F8F0 # MEDEFAIDRIN DIGIT ONE ALTERNATE FORM => MEDEFAIDRIN DIGIT ONE + PSEUDO-COMBINING VARIANT MARK 1 16E95;;16E82 F8F0 # MEDEFAIDRIN DIGIT TWO ALTERNATE FORM => MEDEFAIDRIN DIGIT TWO + PSEUDO-COMBINING VARIANT MARK 1 16E96;;16E83 F8F0 # MEDEFAIDRIN DIGIT THREE ALTERNATE FORM => MEDEFAIDRIN DIGIT THREE + PSEUDO-COMBINING VARIANT MARK 1 @@ -6151,6 +6158,69 @@ FFEE;;25CB # HALFWIDTH WHITE CIRCLE => WHITE CIRCLE 1E028;;2C58 # COMBINING GLAGOLITIC LETTER BIG YUS => GLAGOLITIC SMALL LETTER BIG YUS 1E029;;2C59 # COMBINING GLAGOLITIC LETTER IOTATED BIG YUS => GLAGOLITIC SMALL LETTER IOTATED BIG YUS 1E02A;;2C5A # COMBINING GLAGOLITIC LETTER FITA => GLAGOLITIC SMALL LETTER FITA +1E030;;0430 # MODIFIER LETTER CYRILLIC SMALL A => CYRILLIC SMALL LETTER A +1E031;;0431 # MODIFIER LETTER CYRILLIC SMALL BE => CYRILLIC SMALL LETTER BE +1E032;;0432 # MODIFIER LETTER CYRILLIC SMALL VE => CYRILLIC SMALL LETTER VE +1E033;;0433 # MODIFIER LETTER CYRILLIC SMALL GHE => CYRILLIC SMALL LETTER GHE +1E034;;0434 # MODIFIER LETTER CYRILLIC SMALL DE => CYRILLIC SMALL LETTER DE +1E035;;0435 # MODIFIER LETTER CYRILLIC SMALL IE => CYRILLIC SMALL LETTER IE +1E036;;0436 # MODIFIER LETTER CYRILLIC SMALL ZHE => CYRILLIC SMALL LETTER ZHE +1E037;;0437 # MODIFIER LETTER CYRILLIC SMALL ZE => CYRILLIC SMALL LETTER ZE +1E038;;0438 # MODIFIER LETTER CYRILLIC SMALL I => CYRILLIC SMALL LETTER I +1E039;;043A # MODIFIER LETTER CYRILLIC SMALL KA => CYRILLIC SMALL LETTER KA +1E03A;;043B # MODIFIER LETTER CYRILLIC SMALL EL => CYRILLIC SMALL LETTER EL +1E03B;;043C # MODIFIER LETTER CYRILLIC SMALL EM => CYRILLIC SMALL LETTER EM +1E03C;;043E # MODIFIER LETTER CYRILLIC SMALL O => CYRILLIC SMALL LETTER O +1E03D;;043F # MODIFIER LETTER CYRILLIC SMALL PE => CYRILLIC SMALL LETTER PE +1E03E;;0440 # MODIFIER LETTER CYRILLIC SMALL ER => CYRILLIC SMALL LETTER ER +1E03F;;0441 # MODIFIER LETTER CYRILLIC SMALL ES => CYRILLIC SMALL LETTER ES +1E040;;0442 # MODIFIER LETTER CYRILLIC SMALL TE => CYRILLIC SMALL LETTER TE +1E041;;0443 # MODIFIER LETTER CYRILLIC SMALL U => CYRILLIC SMALL LETTER U +1E042;;0444 # MODIFIER LETTER CYRILLIC SMALL EF => CYRILLIC SMALL LETTER EF +1E043;;0445 # MODIFIER LETTER CYRILLIC SMALL HA => CYRILLIC SMALL LETTER HA +1E044;;0446 # MODIFIER LETTER CYRILLIC SMALL TSE => CYRILLIC SMALL LETTER TSE +1E045;;0447 # MODIFIER LETTER CYRILLIC SMALL CHE => CYRILLIC SMALL LETTER CHE +1E046;;0448 # MODIFIER LETTER CYRILLIC SMALL SHA => CYRILLIC SMALL LETTER SHA +1E047;;044B # MODIFIER LETTER CYRILLIC SMALL YERU => CYRILLIC SMALL LETTER YERU +1E048;;044D # MODIFIER LETTER CYRILLIC SMALL E => CYRILLIC SMALL LETTER E +1E049;;044E # MODIFIER LETTER CYRILLIC SMALL YU => CYRILLIC SMALL LETTER YU +1E04A;;A689 # MODIFIER LETTER CYRILLIC SMALL DZZE => CYRILLIC SMALL LETTER DZZE +1E04B;;04D9 # MODIFIER LETTER CYRILLIC SMALL SCHWA => CYRILLIC SMALL LETTER SCHWA +1E04C;;0456 # MODIFIER LETTER CYRILLIC SMALL BYELORUSSIAN-UKRAINIAN I => CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I +1E04D;;0458 # MODIFIER LETTER CYRILLIC SMALL JE => CYRILLIC SMALL LETTER JE +1E04E;;04E9 # MODIFIER LETTER CYRILLIC SMALL BARRED O => CYRILLIC SMALL LETTER BARRED O +1E04F;;04AF # MODIFIER LETTER CYRILLIC SMALL STRAIGHT U => CYRILLIC SMALL LETTER STRAIGHT U +1E050;;04CF # MODIFIER LETTER CYRILLIC SMALL PALOCHKA => CYRILLIC SMALL LETTER PALOCHKA +1E051;;0430 # CYRILLIC SUBSCRIPT SMALL LETTER A => CYRILLIC SMALL LETTER A +1E052;;0431 # CYRILLIC SUBSCRIPT SMALL LETTER BE => CYRILLIC SMALL LETTER BE +1E053;;0432 # CYRILLIC SUBSCRIPT SMALL LETTER VE => CYRILLIC SMALL LETTER VE +1E054;;0433 # CYRILLIC SUBSCRIPT SMALL LETTER GHE => CYRILLIC SMALL LETTER GHE +1E055;;0434 # CYRILLIC SUBSCRIPT SMALL LETTER DE => CYRILLIC SMALL LETTER DE +1E056;;0435 # CYRILLIC SUBSCRIPT SMALL LETTER IE => CYRILLIC SMALL LETTER IE +1E057;;0436 # CYRILLIC SUBSCRIPT SMALL LETTER ZHE => CYRILLIC SMALL LETTER ZHE +1E058;;0437 # CYRILLIC SUBSCRIPT SMALL LETTER ZE => CYRILLIC SMALL LETTER ZE +1E059;;0438 # CYRILLIC SUBSCRIPT SMALL LETTER I => CYRILLIC SMALL LETTER I +1E05A;;043A # CYRILLIC SUBSCRIPT SMALL LETTER KA => CYRILLIC SMALL LETTER KA +1E05B;;043B # CYRILLIC SUBSCRIPT SMALL LETTER EL => CYRILLIC SMALL LETTER EL +1E05C;;043E # CYRILLIC SUBSCRIPT SMALL LETTER O => CYRILLIC SMALL LETTER O +1E05D;;043F # CYRILLIC SUBSCRIPT SMALL LETTER PE => CYRILLIC SMALL LETTER PE +1E05E;;0441 # CYRILLIC SUBSCRIPT SMALL LETTER ES => CYRILLIC SMALL LETTER ES +1E05F;;0443 # CYRILLIC SUBSCRIPT SMALL LETTER U => CYRILLIC SMALL LETTER U +1E060;;0444 # CYRILLIC SUBSCRIPT SMALL LETTER EF => CYRILLIC SMALL LETTER EF +1E061;;0445 # CYRILLIC SUBSCRIPT SMALL LETTER HA => CYRILLIC SMALL LETTER HA +1E062;;0446 # CYRILLIC SUBSCRIPT SMALL LETTER TSE => CYRILLIC SMALL LETTER TSE +1E063;;0447 # CYRILLIC SUBSCRIPT SMALL LETTER CHE => CYRILLIC SMALL LETTER CHE +1E064;;0448 # CYRILLIC SUBSCRIPT SMALL LETTER SHA => CYRILLIC SMALL LETTER SHA +1E065;;044A # CYRILLIC SUBSCRIPT SMALL LETTER HARD SIGN => CYRILLIC SMALL LETTER HARD SIGN +1E066;;044B # CYRILLIC SUBSCRIPT SMALL LETTER YERU => CYRILLIC SMALL LETTER YERU +1E067;;0433 F8F1 # CYRILLIC SUBSCRIPT SMALL LETTER GHE WITH UPTURN => CYRILLIC SMALL LETTER GHE + PSEUDO-COMBINING VARIANT MARK 2 +1E068;;0456 # CYRILLIC SUBSCRIPT SMALL LETTER BYELORUSSIAN-UKRAINIAN I => CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I +1E069;;0455 # CYRILLIC SUBSCRIPT SMALL LETTER DZE => CYRILLIC SMALL LETTER DZE +1E06A;;045F # CYRILLIC SUBSCRIPT SMALL LETTER DZHE => CYRILLIC SMALL LETTER DZHE +1E06B;;04AB # MODIFIER LETTER CYRILLIC SMALL ES WITH DESCENDER => CYRILLIC SMALL LETTER ES WITH DESCENDER +1E06C;;A651 # MODIFIER LETTER CYRILLIC SMALL YERU WITH BACK YER => CYRILLIC SMALL LETTER YERU WITH BACK YER +1E06D;;04B1 # MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE => CYRILLIC SMALL LETTER STRAIGHT U WITH STROKE +1E08F;;0456 # COMBINING CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I => CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I 1E130;;16B34 # NYIAKENG PUACHUE HMONG TONE-B => PAHAWH HMONG MARK CIM SUAM 1E131;;16B30 # NYIAKENG PUACHUE HMONG TONE-M => PAHAWH HMONG MARK CIM TUB 1E132;;16B32 # NYIAKENG PUACHUE HMONG TONE-J => PAHAWH HMONG MARK CIM KES