#! /bin/sh

# Source the t.frame file from $srcdir; srcdir is set to "." when it is unset.
# The path is quoted so a source directory containing whitespace still resolves.
# NOTE(review): t.frame presumably provides TMPDIR, WORDLIST, BOGOUTIL, AWK and
# verbose, which the rest of this script reads — confirm.
. "${srcdir=.}/t.frame"

# create a test wordlist with tokens containing non-ASCII characters,
# replace the non-ASCII characters with question marks,
# check the number of tokens in the wordlist
#
# test below
# remember to use ${srcdir}

# Check for a non-default configuration, keyed on USE_UNICODE:
#   unset or empty -> set UNICODE_NO to "--unicode=no" (handed to $BOGOUTIL
#                     further down in this script)
#   "yes"          -> leave UNICODE_NO untouched
#   anything else  -> leave the script with status 77
# NOTE(review): 77 is presumably the harness's "test skipped" status — confirm.
#
# A case statement is used instead of "[ ... -a ... ]": the -a operator of
# test is obsolescent and its parsing is ambiguous for some operand values.
case "$USE_UNICODE" in
    "")
        UNICODE_NO="--unicode=no"
        ;;
    yes)
        ;;
    *)
        exit 77
        ;;
esac

# Seven input records spelled out as hex byte values.  Read as ASCII, each
# record is a token (a leading 'A' = 41 or 'B' = 42 followed by bytes >= 0x80),
# a space (20), a one-digit count, " 0 ", eight digits (apparently a yyyymmdd
# date) and a newline (0A).
# NOTE(review): ./dehex presumably turns the hex pairs into raw bytes — confirm.
in_a1="41 A4 BA B5 B5 20 31 20 30 20 32 30 30 33 30 33 30 33 0A"
in_a2="41 C1 BA B8 B5 20 32 20 30 20 32 30 30 32 31 32 30 32 0A"
in_a3="41 BA C1 B8 B5 20 33 20 30 20 32 30 30 33 30 33 30 31 0A"
in_b1="42 A4 BA B8 B5 B5 20 31 20 30 20 32 30 30 33 30 33 30 33 0A"
in_b2="42 C1 BA B8 B5 B5 20 32 20 30 20 32 30 30 32 31 32 30 32 0A"
in_b3="42 BA C1 B8 B5 B5 20 33 20 30 20 32 30 30 33 30 33 30 31 0A"
in_b4="42 C1 BA B5 B8 B5 20 34 20 30 20 32 30 30 33 30 33 30 34 0A"

# All records go out on a single line, separated by single spaces.
echo "$in_a1 $in_a2 $in_a3 $in_b1 $in_b2 $in_b3 $in_b4" \
| ./dehex > "$TMPDIR"/input

# Feed the generated input into the wordlist, then dump it to output.1 with
# the .MSG_COUNT and .ENCODING lines filtered out.
# NOTE(review): -l / -d are presumably bogoutil's load / dump modes — confirm.
# "grep -E" is used rather than egrep, which is obsolescent (recent GNU grep
# prints a warning for every egrep invocation).
$BOGOUTIL -C -l "$WORDLIST" < "$TMPDIR"/input
$BOGOUTIL -C -d "$WORDLIST" | grep -E -v "^(\.MSG_COUNT|\.ENCODING)" > "$TMPDIR"/output.1

# Run the -n -m pass over the wordlist and dump it again to output.2.
# $UNICODE_NO is intentionally left unquoted: when it is empty it must expand
# to no argument at all rather than to an empty-string argument.
$BOGOUTIL -C -n -m "$WORDLIST" $UNICODE_NO
$BOGOUTIL -C -d "$WORDLIST" | grep -E -v "^(\.MSG_COUNT|\.ENCODING)" > "$TMPDIR"/output.2

# Line counts of the two dumps; awk keeps only the number from wc's output.
LEN1=$(wc -l "$TMPDIR"/output.1 | $AWK '{print $1}')
LEN2=$(wc -l "$TMPDIR"/output.2 | $AWK '{print $1}')

# Fields 2 and 4 of the first and of the last line of the second dump,
# joined with a ".".
TOKDAT1=$(head -n 1 "$TMPDIR"/output.2 | $AWK '{print $2 "." $4 }')
TOKDAT2=$(tail -n 1 "$TMPDIR"/output.2 | $AWK '{print $2 "." $4 }')

# Summary string: "<lines before>.<lines after> <first line> <last line>".
RESULT=$(printf "%d.%d %s %s" "$LEN1" "$LEN2" "$TOKDAT1" "$TOKDAT2")

WANT="7.2 6.20030303 10.20030304"

# Report on mismatch, or always when verbose is above 0.  verbose defaults to
# 0 here so an unset or empty value does not turn into a "[" syntax error, and
# printf with quoted arguments shows both strings exactly as they are.
if [ "$RESULT" != "$WANT" ] || [ "${verbose:-0}" -gt 0 ] ; then
    printf 'want: "%s", have: "%s"\n' "$WANT" "$RESULT"
fi

# The status of this comparison is the last command status of the script.
test "$RESULT" = "$WANT"