From 0f8057ccc882cd87ccfad6463d4ec15fb7b801fa Mon Sep 17 00:00:00 2001 From: Markus Scherer Date: Fri, 18 Jul 2025 15:58:05 -0700 Subject: [PATCH] pub with links, Idna2008 remove Chisoi+3 --- docs/ucdxml.md | 6 +++++- pub/copy-beta-to-draft.sh | 3 +++ unicodetools/data/idna/dev/Idna2008.txt | 16 ++++++---------- 3 files changed, 14 insertions(+), 11 deletions(-) diff --git a/docs/ucdxml.md b/docs/ucdxml.md index d1f68d718..33ebfd477 100644 --- a/docs/ucdxml.md +++ b/docs/ucdxml.md @@ -47,7 +47,11 @@ mvn compile exec:java -Dexec.mainClass="org.unicode.xml.UCDXML" -Dexec.args="--r mvn compile exec:java -Dexec.mainClass="org.unicode.xml.UCDXML" -Dexec.args="--range UNIHAN --output GROUPED" -DCLDR_DIR=$(cd ~/cldr/uni/src; pwd) -DUNICODETOOLS_GEN_DIR=$(cd ../Generated; pwd) -DUNICODETOOLS_REPO_DIR=$(pwd) -am -pl unicodetools mvn compile exec:java -Dexec.mainClass="org.unicode.xml.UCDXML" -Dexec.args="--range NOUNIHAN --output GROUPED" -DCLDR_DIR=$(cd ~/cldr/uni/src; pwd) -DUNICODETOOLS_GEN_DIR=$(cd ../Generated; pwd) -DUNICODETOOLS_REPO_DIR=$(pwd) -am -pl unicodetools -cd ../Generated/ucdxml/17.0.0/ +ls -l ../Generated/ucdxml/17.0.0 +rm ../Generated/ucdxml/17.0.0/*.zip +meld unicodetools/data/ucdxml/dev ../Generated/ucdxml/17.0.0 + +cd ../Generated/ucdxml/17.0.0 zip -9 ucd.all.flat.zip ucd.all.flat.xml zip -9 ucd.all.grouped.zip ucd.all.grouped.xml diff --git a/pub/copy-beta-to-draft.sh b/pub/copy-beta-to-draft.sh index 81182ca13..bbc59e15e 100755 --- a/pub/copy-beta-to-draft.sh +++ b/pub/copy-beta-to-draft.sh @@ -46,6 +46,9 @@ cp $UNITOOLS_DATA/idna/dev/* $DRAFT/idna mkdir -p $DRAFT/security cp $UNITOOLS_DATA/security/dev/* $DRAFT/security +mkdir -p $DRAFT/links +cp $UNITOOLS_DATA/links/dev/* $DRAFT/links + # Fix permissions. Everyone can read, and search directories. chmod a+rX -R $DRAFT diff --git a/unicodetools/data/idna/dev/Idna2008.txt b/unicodetools/data/idna/dev/Idna2008.txt index 264a54efc..e44c7b562 100644 --- a/unicodetools/data/idna/dev/Idna2008.txt +++ b/unicodetools/data/idna/dev/Idna2008.txt @@ -1,5 +1,5 @@ # Idna2008-17.0.0.txt -# Date: 2025-05-02, 07:27:27 GMT [KW] +# Date: 2025-07-18 # Copyright 2025 Unicode, Inc. # For terms of use and license, see https://www.unicode.org/terms_of_use.html # @@ -719,8 +719,8 @@ 09F2..09FB ; DISALLOWED # BENGALI RUPEE MARK..BENGALI GANDA MARK 09FC ; PVALID # BENGALI LETTER VEDIC ANUSVARA 09FD ; DISALLOWED # BENGALI ABBREVIATION SIGN -09FE..09FF ; PVALID # BENGALI SANDHI MARK..BENGALI LETTER SANSKRIT BA -0A00 ; UNASSIGNED # +09FE ; PVALID # BENGALI SANDHI MARK +09FF..0A00 ; UNASSIGNED # .. 0A01..0A03 ; PVALID # GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN VISARGA 0A04 ; UNASSIGNED # 0A05..0A0A ; PVALID # GURMUKHI LETTER A..GURMUKHI LETTER UU @@ -805,8 +805,8 @@ 0B47..0B48 ; PVALID # ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI 0B49..0B4A ; UNASSIGNED # .. 0B4B..0B4D ; PVALID # ORIYA VOWEL SIGN O..ORIYA SIGN VIRAMA -0B4E..0B52 ; UNASSIGNED # .. -0B53..0B57 ; PVALID # ORIYA SIGN DOT ABOVE..ORIYA AU LENGTH MARK +0B4E..0B54 ; UNASSIGNED # .. +0B55..0B57 ; PVALID # ORIYA SIGN OVERLINE..ORIYA AU LENGTH MARK 0B58..0B5B ; UNASSIGNED # .. 0B5C..0B5D ; DISALLOWED # ORIYA LETTER RRA..ORIYA LETTER RHA 0B5E ; UNASSIGNED # @@ -2716,11 +2716,7 @@ FFF9..FFFF ; DISALLOWED # INTERLINEAR ANNOTATION ANCHOR.. 16D40..16D6C; PVALID # KIRAT RAI SIGN ANUSVARA..KIRAT RAI SIGN SAAT 16D6D..16D6F; DISALLOWED # KIRAT RAI SIGN YUPI..KIRAT RAI DOUBLE DANDA 16D70..16D79; PVALID # KIRAT RAI DIGIT ZERO..KIRAT RAI DIGIT NINE -16D7A..16D7F; UNASSIGNED # .. -16D80..16D9D; PVALID # CHISOI LETTER A..CHISOI SIGN SISO -16D9E..16D9F; UNASSIGNED # .. -16DA0..16DA9; PVALID # CHISOI DIGIT ZERO..CHISOI DIGIT NINE -16DAA..16E3F; UNASSIGNED # .. +16D7A..16E3F; UNASSIGNED # .. 16E40..16E5F; DISALLOWED # MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN CAPITAL LETTER Y 16E60..16E7F; PVALID # MEDEFAIDRIN SMALL LETTER M..MEDEFAIDRIN SMALL LETTER Y 16E80..16E9A; DISALLOWED # MEDEFAIDRIN DIGIT ZERO..MEDEFAIDRIN EXCLAMATION OH