diff options
Diffstat (limited to 'update_unicode.sh')
| -rwxr-xr-x | update_unicode.sh | 37 | 
1 files changed, 37 insertions, 0 deletions
diff --git a/update_unicode.sh b/update_unicode.sh new file mode 100755 index 0000000000..000b937e68 --- /dev/null +++ b/update_unicode.sh @@ -0,0 +1,37 @@ +#!/bin/sh +#See http://www.unicode.org/reports/tr44/ +# +#Me Enclosing_Mark  an enclosing combining mark +#Mn Nonspacing_Mark a nonspacing combining mark (zero advance width) +#Cf Format          a format control character +# +UNICODEWIDTH_H=../unicode_width.h +if ! test -d unicode; then +	mkdir unicode +fi && +( cd unicode && +	if ! test -f UnicodeData.txt; then +		wget http://www.unicode.org/Public/UCD/latest/ucd/UnicodeData.txt +	fi && +	if ! test -f EastAsianWidth.txt; then +		wget http://www.unicode.org/Public/UCD/latest/ucd/EastAsianWidth.txt +	fi && +	if ! test -d uniset; then +		git clone https://github.com/depp/uniset.git +	fi && +	( +		cd uniset && +		if ! test -x uniset; then +			autoreconf -i && +			./configure --enable-warnings=-Werror CFLAGS='-O0 -ggdb' +		fi && +		make +	) && +	echo "static const struct interval zero_width[] = {" >$UNICODEWIDTH_H && +	UNICODE_DIR=. ./uniset/uniset --32 cat:Me,Mn,Cf + U+1160..U+11FF - U+00AD | +	grep -v plane >>$UNICODEWIDTH_H && +	echo "};" >>$UNICODEWIDTH_H && +	echo "static const struct interval double_width[] = {" >>$UNICODEWIDTH_H && +	UNICODE_DIR=. ./uniset/uniset --32 eaw:F,W >>$UNICODEWIDTH_H && +	echo "};" >>$UNICODEWIDTH_H +)  | 
