Skip to content

Commit 0538c9a

Browse files
authored
chore: Jsps to Unicode 15 final (#332)
* chore: Jsps to Unicode 15 final For #271 * fix(build): Jsps: don't test during gcr build The gcr build will need some work for testing. Disable test for now. Revisit in #333 For #271 * fix(build): Fix JSPs to include unicodetools and cldr Fixes #271 * fix dockerfile Fixes: #334 * fix dockerfile again Fixes: #334 * fix(build): fix broken build-jsp.yml - the Dockerfile now requires a .tgz file with the cldr and unicodetools to use. Fixes: #271
1 parent 58e67f1 commit 0538c9a

File tree

80 files changed

+241
-225
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

80 files changed

+241
-225
lines changed

.github/workflows/build-jsp.yml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,9 @@ jobs:
1717
with:
1818
repository: unicode-org/cldr
1919
path: cldr
20+
- name: Backup Unicodetools and CLDR for jsps # this is needed only for the Docker build
21+
run:
22+
mkdir -p UnicodeJsps/target && tar cfpz UnicodeJsps/target/cldr-unicodetools.tgz ./cldr ./unicodetools
2023
- name: Set up JDK 11
2124
uses: actions/setup-java@v1
2225
with:

.github/workflows/push-jsp-on-tag.yml

Lines changed: 10 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,15 @@ jobs:
1212
uses: actions/setup-java@v1
1313
with:
1414
java-version: 11
15+
- uses: actions/checkout@v2
16+
- name: Check out CLDR
17+
uses: actions/checkout@v2
18+
with:
19+
repository: unicode-org/cldr
20+
path: cldr
21+
- name: Backup Unicodetools and CLDR for jsps
22+
run:
23+
mkdir -p UnicodeJsps/target && tar cfpz UnicodeJsps/target/cldr-unicodetools.tgz ./cldr ./unicodetools
1524
- name: Cache local Maven repository
1625
uses: actions/cache@v2
1726
with:
@@ -26,7 +35,7 @@ jobs:
2635
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
2736
- name: Package with Maven
2837
run: >
29-
mvn -s .github/workflows/mvn-settings.xml -B compile test install package -pl UnicodeJsps
38+
mvn -s .github/workflows/mvn-settings.xml -B compile install package -pl UnicodeJsps -DskipTests=true
3039
env:
3140
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
3241
- name: Upload UnicodeJsps.war

UnicodeJsps/Dockerfile

Lines changed: 9 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -7,19 +7,26 @@ RUN apk add --update -q wget make gcc musl-dev
77
RUN wget -np -nv --reject-regex='.*\.(lib|exe)$' --cut-dirs=4 -nH -r ${CPATH}${CVERSION}/
88
RUN cd source && gcc -I ../include/ -static -Os -o3 -o bidiref1 bidiref1.c brutils.c brtest.c brtable.c brrule.c
99
RUN ls -lh /build/source/bidiref1 && (/build/source/bidiref1 || true)
10+
# copy and unpack to /build/data
11+
ADD ./target/cldr-unicodetools.tgz /build/data/
12+
# move this into place (including unicodetools/unicodetools)
13+
RUN rm -rf /build/data/cldr/.git # unneeded
1014
FROM jetty:9-jre11-slim AS run
11-
# FROM tomcat:9-jdk14-openjdk-slim-buster AS run
1215
ADD port-entrypoint.sh /port-entrypoint.sh
1316
ADD ./jetty.d/ROOT /var/lib/jetty/webapps/ROOT/
1417
ENTRYPOINT [ "/port-entrypoint.sh" ]
1518
# copy the .war
16-
ADD target/UnicodeJsps.war /var/lib/jetty/webapps/
19+
ADD ./target/UnicodeJsps.war /var/lib/jetty/webapps/
1720
# copy the UCD for bidiref1
1821
COPY src/main/resources/org/unicode/jsp/bidiref1/ucd/ /usr/local/share/ucd/
1922
# this is the parent to 'ucd'
2023
ENV BIDIREFHOME /usr/local/share
2124
# copy the bidiref1 bin
2225
ENV BIDIREF1 /usr/local/bin/bidiref1
2326
COPY --from=cbuild /build/source/bidiref1 /usr/local/bin/
27+
RUN mkdir -p /var/lib/jetty/data/unicodetools
28+
COPY --from=cbuild /build/data/cldr /var/lib/jetty/data/cldr
29+
COPY --from=cbuild /build/data/unicodetools/ /var/lib/jetty/data/unicodetools/unicodetools/
30+
ENV JAVA_OPTIONS -DCLDR_DIR=/var/lib/jetty/data/cldr -DUNICODETOOLS_REPO_DIR=/var/lib/jetty/data/unicodetools
2431
# This is the default PORT. Override by setting PORT.
2532
EXPOSE 8080

UnicodeJsps/src/main/resources/org/unicode/jsp/IdentifierStatus.txt

Lines changed: 8 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
# IdentifierStatus.txt
2-
# Date: 2022-05-18, 21:51:57 GMT
1+
# IdentifierStatus.txt
2+
# Date: 2022-08-26, 16:49:09 GMT
33
# © 2022 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use, see https://www.unicode.org/terms_of_use.html
@@ -14,16 +14,17 @@
1414
# Field 0: code point
1515
# Field 1: Identifier_Status value (see Table 1 of http://www.unicode.org/reports/tr39)
1616
#
17-
# Any missing code points have the Identifier_Status value Restricted
18-
#
1917
# For the purpose of regular expressions, the property Identifier_Status is defined as
2018
# an enumerated property of code points.
2119
# The short name of Identifier_Status is the same as the long name.
2220
# The possible values are:
2321
# Allowed, Restricted
2422
# The short name of each value is the same as its long name.
25-
# The default property value for all Unicode code points U+0000..U+10FFFF
26-
# not mentioned in this data file is Restricted.
23+
24+
# All code points not explicitly listed for Identifier_Status
25+
# have the value Restricted.
26+
27+
# @missing: 0000..10FFFF; Restricted
2728

2829

2930
# Identifier_Status: Allowed
@@ -531,8 +532,6 @@ A788 ; Allowed # 5.1 MODIFIER LETTER LOW CIRCUMFLEX ACCENT
531532
A78D ; Allowed # 6.0 LATIN CAPITAL LETTER TURNED H
532533
A792..A793 ; Allowed # 6.1 [2] LATIN CAPITAL LETTER C WITH BAR..LATIN SMALL LETTER C WITH BAR
533534
A7AA ; Allowed # 6.1 LATIN CAPITAL LETTER H WITH HOOK
534-
A7AE ; Allowed # 9.0 LATIN CAPITAL LETTER SMALL CAPITAL I
535-
A7B8..A7B9 ; Allowed # 11.0 [2] LATIN CAPITAL LETTER U WITH STROKE..LATIN SMALL LETTER U WITH STROKE
536535
A7C0..A7C1 ; Allowed # 14.0 [2] LATIN CAPITAL LETTER OLD POLISH O..LATIN SMALL LETTER OLD POLISH O
537536
A7C2..A7C6 ; Allowed # 12.0 [5] LATIN CAPITAL LETTER ANGLICANA W..LATIN CAPITAL LETTER Z WITH PALATAL HOOK
538537
A7C7..A7CA ; Allowed # 13.0 [4] LATIN CAPITAL LETTER D WITH SHORT STROKE OVERLAY..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY
@@ -586,4 +585,4 @@ FA27..FA29 ; Allowed # 1.1 [3] CJK COMPATIBILITY IDEOGRAPH-FA27..CJK CO
586585
30000..3134A ; Allowed # 13.0 [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A
587586
31350..323AF ; Allowed # 15.0 [4192] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-323AF
588587

589-
# Total code points: 112159
588+
# Total code points: 112156

UnicodeJsps/src/main/resources/org/unicode/jsp/IdentifierType.txt

Lines changed: 13 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
# IdentifierType.txt
2-
# Date: 2022-05-18, 21:51:56 GMT
1+
# IdentifierType.txt
2+
# Date: 2022-08-26, 16:49:09 GMT
33
# © 2022 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use, see https://www.unicode.org/terms_of_use.html
@@ -14,17 +14,19 @@
1414
# Field 0: code point
1515
# Field 1: set of Identifier_Type values (see Table 1 of http://www.unicode.org/reports/tr39)
1616
#
17-
# Any missing code points have the Identifier_Type value Not_Character
18-
#
1917
# For the purpose of regular expressions, the property Identifier_Type is defined as
2018
# mapping each code point to a set of enumerated values.
2119
# The short name of Identifier_Type is the same as the long name.
2220
# The possible values are:
2321
# Not_Character, Deprecated, Default_Ignorable, Not_NFKC, Not_XID,
2422
# Exclusion, Obsolete, Technical, Uncommon_Use, Limited_Use, Inclusion, Recommended
2523
# The short name of each value is the same as its long name.
26-
# The default property value for all Unicode code points U+0000..U+10FFFF
27-
# not mentioned in this data file is Not_Character.
24+
25+
# All code points not explicitly listed for Identifier_Type
26+
# have the value Not_Character.
27+
28+
# @missing: 0000..10FFFF; Not_Character
29+
2830
# As usual, sets are unordered, with no duplicate values.
2931

3032

@@ -524,8 +526,6 @@ A788 ; Recommended # 5.1 MODIFIER LETTER LOW
524526
A78D ; Recommended # 6.0 LATIN CAPITAL LETTER TURNED H
525527
A792..A793 ; Recommended # 6.1 [2] LATIN CAPITAL LETTER C WITH BAR..LATIN SMALL LETTER C WITH BAR
526528
A7AA ; Recommended # 6.1 LATIN CAPITAL LETTER H WITH HOOK
527-
A7AE ; Recommended # 9.0 LATIN CAPITAL LETTER SMALL CAPITAL I
528-
A7B8..A7B9 ; Recommended # 11.0 [2] LATIN CAPITAL LETTER U WITH STROKE..LATIN SMALL LETTER U WITH STROKE
529529
A7C0..A7C1 ; Recommended # 14.0 [2] LATIN CAPITAL LETTER OLD POLISH O..LATIN SMALL LETTER OLD POLISH O
530530
A7C2..A7C6 ; Recommended # 12.0 [5] LATIN CAPITAL LETTER ANGLICANA W..LATIN CAPITAL LETTER Z WITH PALATAL HOOK
531531
A7C7..A7CA ; Recommended # 13.0 [4] LATIN CAPITAL LETTER D WITH SHORT STROKE OVERLAY..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY
@@ -579,7 +579,7 @@ FA27..FA29 ; Recommended # 1.1 [3] CJK COMPATIBILITY ID
579579
30000..3134A ; Recommended # 13.0 [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A
580580
31350..323AF ; Recommended # 15.0 [4192] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-323AF
581581

582-
# Total code points: 112142
582+
# Total code points: 112139
583583

584584
# Identifier_Type: Inclusion
585585

@@ -858,14 +858,15 @@ A67C..A67D ; Uncommon_Use # 5.1 [2] COMBINING CYRILLIC K
858858
A78B..A78C ; Uncommon_Use # 5.1 [2] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER SALTILLO
859859
A78F ; Uncommon_Use # 8.0 LATIN LETTER SINOLOGICAL DOT
860860
A7B2..A7B7 ; Uncommon_Use # 8.0 [6] LATIN CAPITAL LETTER J WITH CROSSED-TAIL..LATIN SMALL LETTER OMEGA
861+
A7B8..A7B9 ; Uncommon_Use # 11.0 [2] LATIN CAPITAL LETTER U WITH STROKE..LATIN SMALL LETTER U WITH STROKE
861862
AB60..AB63 ; Uncommon_Use # 8.0 [4] LATIN SMALL LETTER SAKHA YAT..LATIN SMALL LETTER UO
862863
10780 ; Uncommon_Use # 14.0 MODIFIER LETTER SMALL CAPITAL AA
863864
10EFD..10EFF ; Uncommon_Use # 15.0 [3] ARABIC SMALL LOW WORD SAKTA..ARABIC SMALL LOW WORD MADDA
864865
1AFF0..1AFF3 ; Uncommon_Use # 14.0 [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5
865866
1AFF5..1AFFB ; Uncommon_Use # 14.0 [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5
866867
1AFFD..1AFFE ; Uncommon_Use # 14.0 [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8
867868

868-
# Total code points: 311
869+
# Total code points: 313
869870

870871
# Identifier_Type: Uncommon_Use Technical
871872

@@ -1008,6 +1009,7 @@ A8FC ; Uncommon_Use Obsolete Not_XID # 8.0 DEVANAGARI SIGN SIDD
10081009
3031..3035 ; Technical # 1.1 [5] VERTICAL KANA REPEAT MARK..VERTICAL KANA REPEAT MARK LOWER HALF
10091010
303B..303C ; Technical # 3.2 [2] VERTICAL IDEOGRAPHIC ITERATION MARK..MASU MARK
10101011
A78E ; Technical # 6.0 LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT
1012+
A7AE ; Technical # 9.0 LATIN CAPITAL LETTER SMALL CAPITAL I
10111013
A7AF ; Technical # 11.0 LATIN LETTER SMALL CAPITAL Q
10121014
A7BA..A7BF ; Technical # 12.0 [6] LATIN CAPITAL LETTER GLOTTAL A..LATIN SMALL LETTER GLOTTAL U
10131015
A7FA ; Technical # 6.0 LATIN LETTER SMALL CAPITAL TURNED M
@@ -1024,7 +1026,7 @@ FE73 ; Technical # 3.2 ARABIC TAIL FRAGMENT
10241026
1D185..1D18B ; Technical # 3.1 [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE
10251027
1D1AA..1D1AD ; Technical # 3.1 [4] MUSICAL SYMBOL COMBINING DOWN BOW..MUSICAL SYMBOL COMBINING SNAP PIZZICATO
10261028

1027-
# Total code points: 500
1029+
# Total code points: 501
10281030

10291031
# Identifier_Type: Technical Exclusion
10301032

UnicodeJsps/src/main/resources/org/unicode/jsp/NamesList.txt

Lines changed: 19 additions & 28 deletions
Original file line numberDiff line numberDiff line change
@@ -1,23 +1,7 @@
11
; charset=UTF-8
22
@@@ The Unicode Standard 15.0.0
3-
@@@+ U15M220504.lst
4-
Unicode 15.0.0 names list, fourth delta.
5-
Repertoire synched with UnicodeData-15.0.0d4.txt.
6-
Rollup of alpha review fixes.
7-
Adjusted alias and added xref for 1F728.
8-
Added annotations for 1F772, 1F773.
9-
Fixed typos in annotations for 1342F and 13430.
10-
Added cross-references to 20E6.
11-
Added cross-references between 1FAAF and 262C.
12-
Updated annotation for 26A5.
13-
Added annotation for 33D7.
14-
Added annotation for 11F52.
15-
Added cross-references between 10EFD and 08DD.
16-
Added cross-references for 11B00 and 11B09.
17-
Added name alias of type correction for 1BBD.
18-
Added annotation and cross-reference for 2E95.
19-
Extended the range for CJK Unified Ideographs Extension C to 2B739.
20-
Added some annotations for Old Hungarian.
3+
@@@+ U15M220815.lst
4+
Unicode 15.0.0 final names list.
215
This file is semi-automatically derived from UnicodeData.txt and
226
a set of manually created annotations using a script to select
237
or suppress information from the data file. The rules used
@@ -3574,7 +3558,7 @@
35743558
@+ These are obsolete letters attested in a 19th century grammar of Komi.
35753559
052A CYRILLIC CAPITAL LETTER DZZHE
35763560
052B CYRILLIC SMALL LETTER DZZHE
3577-
* also used for Ossetian until 1924
3561+
@+ * also used for Ossetian until 1924
35783562
052C CYRILLIC CAPITAL LETTER DCHE
35793563
052D CYRILLIC SMALL LETTER DCHE
35803564
@ Khanty letters
@@ -3901,6 +3885,7 @@
39013885
* should not be confused with the small TAH sign used as a diacritic for some letters such as 0679
39023886
@ Extended Arabic mark
39033887
0616 ARABIC SMALL HIGH LIGATURE ALEF WITH LAM WITH YEH
3888+
% ARABIC SMALL HIGH LIGATURE ALEF WITH YEH BARREE
39043889
* early Persian
39053890
@ Quranic annotation signs
39063891
0617 ARABIC SMALL HIGH ZAIN
@@ -4085,7 +4070,7 @@
40854070
* Kazakh, Jawi
40864071
* forms digraphs
40874072
@ Digraphic letters for Kazakh
4088-
@+ Use of these characters is discouraged. They were encoded for Kazakh digraphs, but their decompositions do not reflect the preferred order of representation. Accordingly, the representation of these Kazakh digraphs should instead use the preferred two-character spellings with the correct order of elements.
4073+
@+ These characters were encoded for Kazakh digraphs, but their compatibility decompositions do not reflect the preferred order of representation. Accordingly, the representation of these Kazakh digraphs should instead use the preferred two-character spellings with the correct order of elements.
40894074
0675 ARABIC LETTER HIGH HAMZA ALEF
40904075
* preferred spelling is 0674 0627
40914076
# 0627 0674
@@ -4215,7 +4200,7 @@
42154200
* Uyghur, Kazakh, Moroccan Arabic, early Jawi, early Persian, ...
42164201
06AE ARABIC LETTER KAF WITH THREE DOTS BELOW
42174202
* Berber, early Persian
4218-
* Pegon alternative for 068A
4203+
* Pegon alternative for 08B4
42194204
06AF ARABIC LETTER GAF
42204205
* Persian, Urdu, ...
42214206
06B0 ARABIC LETTER GAF WITH RING
@@ -10158,18 +10143,22 @@
1015810143
19AA NEW TAI LUE LETTER HIGH SUA
1015910144
19AB NEW TAI LUE LETTER LOW SUA
1016010145
* a labialized consonant cluster
10161-
@ Vowel signs
10146+
@ Vowels
1016210147
19B0 NEW TAI LUE VOWEL SIGN VOWEL SHORTENER
1016310148
19B1 NEW TAI LUE VOWEL SIGN AA
1016410149
19B2 NEW TAI LUE VOWEL SIGN II
1016510150
19B3 NEW TAI LUE VOWEL SIGN U
1016610151
19B4 NEW TAI LUE VOWEL SIGN UU
1016710152
19B5 NEW TAI LUE VOWEL SIGN E
10153+
* precedes consonant in visual order
1016810154
19B6 NEW TAI LUE VOWEL SIGN AE
10155+
* precedes consonant in visual order
1016910156
19B7 NEW TAI LUE VOWEL SIGN O
10157+
* precedes consonant in visual order
1017010158
19B8 NEW TAI LUE VOWEL SIGN OA
1017110159
19B9 NEW TAI LUE VOWEL SIGN UE
1017210160
19BA NEW TAI LUE VOWEL SIGN AY
10161+
* precedes consonant in visual order
1017310162
19BB NEW TAI LUE VOWEL SIGN AAY
1017410163
19BC NEW TAI LUE VOWEL SIGN UY
1017510164
19BD NEW TAI LUE VOWEL SIGN OY
@@ -13035,7 +13024,7 @@
1303513024
x (asterisk - 002A)
1303613025
x (combining asterisk below - 0359)
1303713026
204F REVERSED SEMICOLON
13038-
* also used in Sindhi
13027+
* used occasionally in Sindhi when Sindhi is written in the Arabic script
1303913028
x (semicolon - 003B)
1304013029
x (arabic semicolon - 061B)
1304113030
2050 CLOSE UP
@@ -13423,7 +13412,7 @@
1342313412
= the set of complex numbers
1342413413
# <font> 0043 latin capital letter c
1342513414
2103 DEGREE CELSIUS
13426-
= degrees Centigrade
13415+
= degrees centigrade
1342713416
# 00B0 0043
1342813417
2104 CENTRE LINE SYMBOL
1342913418
= clone
@@ -19328,7 +19317,8 @@
1932819317
x (modifier letter short equals sign - A78A)
1932919318
@ Reversed punctuation
1933019319
2E41 REVERSED COMMA
19331-
* also used in Sindhi
19320+
* Old Hungarian
19321+
* used occasionally in Sindhi when Sindhi is written in the Arabic script
1933219322
x (comma - 002C)
1933319323
x (arabic comma - 060C)
1933419324
2E42 DOUBLE LOW-REVERSED-9 QUOTATION MARK
@@ -19365,7 +19355,7 @@
1936519355
x (paragraphos - 2E0F)
1936619356
x (capitulum - 2E3F)
1936719357
2E4E PUNCTUS ELEVATUS MARK
19368-
@+ This mark indicates a major intermediate pause where the sensus is complete but the sentence is not; this is similar in some regards to the modern use of a semicolon.
19358+
@+ * This mark indicates a major intermediate pause where the sensus is complete but the sentence is not; this is similar in some regards to the modern use of a semicolon.
1936919359
2E4F CORNISH VERSE DIVIDER
1937019360
2E50 CROSS PATTY WITH RIGHT CROSSBAR
1937119361
x (maltese cross - 2720)
@@ -25562,6 +25552,7 @@ AB2E ETHIOPIC SYLLABLE BBO
2556225552
@@ AB30 Latin Extended-E AB6F
2556325553
@ Letters for German dialectology
2556425554
AB30 LATIN SMALL LETTER BARRED ALPHA
25555+
@+ * This letter is a Latin alpha with a horizontal strikethrough bar. In some font designs, the bar might not extend beyond the edge of the letter, and in such cases, the letter should not be confused with a ligature of epsilon and iota.
2556525556
AB31 LATIN SMALL LETTER A REVERSED-SCHWA
2556625557
AB32 LATIN SMALL LETTER BLACKLETTER E
2556725558
AB33 LATIN SMALL LETTER BARRED E
@@ -35030,7 +35021,7 @@ FFFF <not a character>
3503035021
11B07 DEVANAGARI SIGN WESTERN NINE-LIKE BHALE
3503135022
11B08 DEVANAGARI SIGN REVERSED NINE-LIKE BHALE
3503235023
11B09 DEVANAGARI SIGN MINDU
35033-
x (devanagari digit zero - 0966)
35024+
x (devanagari digit zero - 0966)
3503435025
@@ 11C00 Bhaiksuki 11C6F
3503535026
@ Independent vowels
3503635027
11C00 BHAIKSUKI LETTER A
@@ -35473,7 +35464,7 @@ FFFF <not a character>
3547335464
11F3E KAWI VOWEL SIGN E
3547435465
11F3F KAWI VOWEL SIGN AI
3547535466
11F40 KAWI VOWEL SIGN EU
35476-
* represents schwa [ǝ]
35467+
* represents schwa [ə]
3547735468
@ Viramas
3547835469
11F41 KAWI SIGN KILLER
3547935470
* vowel killer, always rendered visibly

UnicodeJsps/src/main/resources/org/unicode/jsp/StandardizedVariants.txt

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# StandardizedVariants-15.0.0.txt
2-
# Date: 2022-01-28, 21:31:00 GMT [KW]
2+
# Date: 2022-08-16, 19:08:00 GMT [KW]
33
# © 2022 Unicode®, Inc.
44
# For terms of use, see https://www.unicode.org/terms_of_use.html
55
#
@@ -364,10 +364,10 @@ A868 FE00; phags-pa letter reversed shaping subjoined ya; # PHAGS-PA SUBJOINED L
364364

365365
# Egyptian hieroglyph expanded variants
366366

367-
13443 FE00; expanded ; # LOST SIGN
368-
13444 FE00; expanded ; # HALF LOST SIGN
369-
13445 FE00; expanded ; # TALL LOST SIGN
370-
13446 FE00; expanded ; # WIDE LOST SIGN
367+
13443 FE00; expanded ; # EGYPTIAN HIEROGLYPH LOST SIGN
368+
13444 FE00; expanded ; # EGYPTIAN HIEROGLYPH HALF LOST SIGN
369+
13445 FE00; expanded ; # EGYPTIAN HIEROGLYPH TALL LOST SIGN
370+
13446 FE00; expanded ; # EGYPTIAN HIEROGLYPH WIDE LOST SIGN
371371

372372
# CJK compatibility ideographs
373373

UnicodeJsps/src/main/resources/org/unicode/jsp/confusables.txt

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
# confusables.txt
2-
# Date: 2022-05-18, 21:51:56 GMT
1+
# confusables.txt
2+
# Date: 2022-08-26, 16:49:08 GMT
33
# © 2022 Unicode®, Inc.
44
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
55
# For terms of use, see https://www.unicode.org/terms_of_use.html
@@ -7535,10 +7535,10 @@ FA7E ; 5944 ; MA # ( 奄 → 奄 ) CJK COMPATIBILITY IDEOGRAPH-FA7E → CJK UNIF
75357535

75367536
F90C ; 5948 ; MA # ( 奈 → 奈 ) CJK COMPATIBILITY IDEOGRAPH-F90C → CJK UNIFIED IDEOGRAPH-5948 #
75377537

7538-
F909 ; 5951 ; MA # ( 契 → 契 ) CJK COMPATIBILITY IDEOGRAPH-F909 → CJK UNIFIED IDEOGRAPH-5951 #
7539-
75407538
FA7F ; 5954 ; MA # ( 奔 → 奔 ) CJK COMPATIBILITY IDEOGRAPH-FA7F → CJK UNIFIED IDEOGRAPH-5954 #
75417539

7540+
F909 ; 5951 ; MA # ( 契 → 契 ) CJK COMPATIBILITY IDEOGRAPH-F909 → CJK UNIFIED IDEOGRAPH-5951 #
7541+
75427542
2F85F ; 5962 ; MA # ( 奢 → 奢 ) CJK COMPATIBILITY IDEOGRAPH-2F85F → CJK UNIFIED IDEOGRAPH-5962 #
75437543

75447544
F981 ; 5973 ; MA # ( 女 → 女 ) CJK COMPATIBILITY IDEOGRAPH-F981 → CJK UNIFIED IDEOGRAPH-5973 #

0 commit comments

Comments
 (0)