3fe5799144
The uniset upstream has accepted my patches that eliminate the Unicode plane offsets from the output in '--32' mode. Remove the corresponding filter in update_unicode.sh. This also fixes the issue that the plane offsets were not removed from the second uniset call. Signed-off-by: Beat Bolli <dev+git@drbeat.li> Signed-off-by: Junio C Hamano <gitster@pobox.com>
34 lines
971 B
Bash
Executable File
34 lines
971 B
Bash
Executable File
#!/bin/sh
|
|
#See http://www.unicode.org/reports/tr44/
|
|
#
|
|
#Me Enclosing_Mark an enclosing combining mark
|
|
#Mn Nonspacing_Mark a nonspacing combining mark (zero advance width)
|
|
#Cf Format a format control character
|
|
#
|
|
cd "$(dirname "$0")"
|
|
UNICODEWIDTH_H=$(git rev-parse --show-toplevel)/unicode_width.h
|
|
|
|
wget -N http://www.unicode.org/Public/UCD/latest/ucd/UnicodeData.txt \
|
|
http://www.unicode.org/Public/UCD/latest/ucd/EastAsianWidth.txt &&
|
|
if ! test -d uniset; then
|
|
git clone https://github.com/depp/uniset.git &&
|
|
( cd uniset && git checkout 4b186196dd )
|
|
fi &&
|
|
(
|
|
cd uniset &&
|
|
if ! test -x uniset; then
|
|
autoreconf -i &&
|
|
./configure --enable-warnings=-Werror CFLAGS='-O0 -ggdb'
|
|
fi &&
|
|
make
|
|
) &&
|
|
UNICODE_DIR=. && export UNICODE_DIR &&
|
|
cat >$UNICODEWIDTH_H <<-EOF
|
|
static const struct interval zero_width[] = {
|
|
$(uniset/uniset --32 cat:Me,Mn,Cf + U+1160..U+11FF - U+00AD)
|
|
};
|
|
static const struct interval double_width[] = {
|
|
$(uniset/uniset --32 eaw:F,W)
|
|
};
|
|
EOF
|