summary | refs | log | tree | commit | diff
path: root/unicode_download.sh
diff options
context:
space:
mode:
author: Fabrice Bellard <fabrice@bellard.org> 2025-05-16 17:43:03 +0200
committer: Fabrice Bellard <fabrice@bellard.org> 2025-05-16 17:43:03 +0200
commit: d7cdfdc8d7b8e74a6be74f4f3535ef6eac976dc1 (patch)
tree: 8d42c1f5a55f57a03d187f75bb90f8296d7f12a0 /unicode_download.sh
parent: a8b2d7c2b2751130000b74ac7d831fd75a0abbc3 (diff)
download: quickjs-d7cdfdc8d7b8e74a6be74f4f3535ef6eac976dc1.tar.gz
download: quickjs-d7cdfdc8d7b8e74a6be74f4f3535ef6eac976dc1.zip
regexp: added v flag support - fixed corner cases of case insensitive matching
Diffstat (limited to 'unicode_download.sh')
-rwxr-xr-x unicode_download.sh 12
1 file changed, 8 insertions, 4 deletions
diff --git a/unicode_download.sh b/unicode_download.sh
index e259891..ef8b30d 100755
--- a/unicode_download.sh
+++ b/unicode_download.sh
@@ -1,8 +1,9 @@
#!/bin/sh
set -e
-url="ftp://ftp.unicode.org/Public/16.0.0/ucd"
-emoji_url="${url}/emoji/emoji-data.txt"
+version="16.0.0"
+emoji_version="16.0"
+url="ftp://ftp.unicode.org/Public"
files="CaseFolding.txt DerivedNormalizationProps.txt PropList.txt \
SpecialCasing.txt CompositionExclusions.txt ScriptExtensions.txt \
@@ -12,8 +13,11 @@ PropertyValueAliases.txt"
mkdir -p unicode
for f in $files; do
- g="${url}/${f}"
+ g="${url}/${version}/ucd/${f}"
wget $g -O unicode/$f
done
-wget $emoji_url -O unicode/emoji-data.txt
+wget "${url}/${version}/ucd/emoji/emoji-data.txt" -O unicode/emoji-data.txt
+
+wget "${url}/emoji/${emoji_version}/emoji-sequences.txt" -O unicode/emoji-sequences.txt
+wget "${url}/emoji/${emoji_version}/emoji-zwj-sequences.txt" -O unicode/emoji-zwj-sequences.txt