d7343b997d0cd57009733d623f3bd96052b1a7bc
   1#!/bin/sh
   2#See http://www.unicode.org/reports/tr44/
   3#
   4#Me Enclosing_Mark  an enclosing combining mark
   5#Mn Nonspacing_Mark a nonspacing combining mark (zero advance width)
   6#Cf Format          a format control character
   7#
   8UNICODEWIDTH_H=../unicode_width.h
   9if ! test -d unicode; then
  10        mkdir unicode
  11fi &&
  12( cd unicode &&
  13        if ! test -f UnicodeData.txt; then
  14                wget http://www.unicode.org/Public/UCD/latest/ucd/UnicodeData.txt
  15        fi &&
  16        if ! test -f EastAsianWidth.txt; then
  17                wget http://www.unicode.org/Public/UCD/latest/ucd/EastAsianWidth.txt
  18        fi &&
  19        if ! test -d uniset; then
  20                git clone https://github.com/depp/uniset.git
  21        fi &&
  22        (
  23                cd uniset &&
  24                if ! test -x uniset; then
  25                        autoreconf -i &&
  26                        ./configure --enable-warnings=-Werror CFLAGS='-O0 -ggdb'
  27                fi &&
  28                make
  29        ) && {
  30                UNICODE_DIR=. && export UNICODE_DIR &&
  31                cat <<-EOF
  32                static const struct interval zero_width[] = {
  33                        $(uniset/uniset --32 cat:Me,Mn,Cf \
  34                          + U+1160..U+11FF - U+00AD | grep -v plane)
  35                };
  36                static const struct interval double_width[] = {
  37                        $(uniset/uniset --32 eaw:F,W)
  38                };
  39                EOF
  40        } >$UNICODEWIDTH_H
  41)