include ../encodings.inc
# ---------------------------------------------------------------------------
# Configuration
# ---------------------------------------------------------------------------

# Shell prefix that forces the Ukrainian locale for a single command.
# SOURCE_ENC is not defined in this file; presumably it comes from
# ../encodings.inc -- TODO confirm.
LC_ALL = LC_ALL=uk_UA.$(SOURCE_ENC)
# The make variable above shares its name with the LC_ALL environment
# variable.  If the caller has LC_ALL set, make would export the value
# "LC_ALL=uk_UA.<enc>" (not a valid locale name) to every recipe command.
# Keep the make variable private; recipes set the locale explicitly instead.
unexport LC_ALL

# Locale-aware sort, and a filter that puts every space-separated word on
# its own line.
sort = $(LC_ALL) sort
spcr = tr ' ' '\n'

# Files removed by "clean" and, additionally, by "distclean".
CLEANFILES = *.lst *.srt *.diff *.dups *.nodups
DISTCLEANFILES = *.old

# Master word list that gets expanded by aspell.
wordlist_src = ../src/Dictionary/uk_words.lst
iconv = iconv

# Read the version once at parse time instead of on every expansion.
VERSION := $(shell cat ../VERSION)

DIST = ../dist
ASPELL_DIST = $(DIST)/aspell-uk-$(VERSION)
# Absolute paths to the built dictionaries ($(CURDIR) is make's own absolute
# working directory, so no extra shell is spawned).
ASPELL_DICT = $(CURDIR)/../dist/aspell-uk-$(VERSION)
# NOTE: this value deliberately ends in a shell pipeline.  When it is used
# as the last argument of the hunspell LIST_CMD below, the grep keeps only
# output lines that contain a lowercase Ukrainian letter.
MYSPELL_DICT = $(CURDIR)/../dist/myspell-uk-$(VERSION)/uk_UA | grep "[а-яіїєґ]"

# Command that reads text on stdin and prints the words the dictionary does
# not recognise.  Swap in the hunspell variant to test the myspell build.
LIST_CMD=LC_ALL=uk_UA.UTF-8 aspell list -l uk --dict-dir=$(ASPELL_DICT)
#LIST_CMD=hunspell -l -d $(MYSPELL_DICT)
# Default goal: run the aspell word-list regression test.
# The previous prerequisite, "regtest-aspell", has no rule in this file, so
# a bare "make" stopped with "No rule to make target"; "regtest" is the
# aspell regression target that actually exists here.
all: regtest
# all_aspell_lst: rebuild the parent project, then expand every entry of the
# master word list with its affixes into all_aspell.lst.
#
# Older variant kept for reference (used the in-tree data directory):
# cat $(wordlist_src) | $(LC_ALL) aspell expand -l uk --local-data-dir=../ > all_aspell.lst
all_aspell_lst:
	# $(MAKE) rather than a literal "make" so that -j/-n/-k and the
	# jobserver are passed on to the sub-make.
	$(MAKE) -C ..
	aspell expand -l uk --local-data-dir=$(ASPELL_DIST) --encoding=$(SOURCE_ENC) < $(wordlist_src) > all_aspell.lst
# regtest: compare the freshly expanded word list with the previous snapshot.
#   all_aspell.srt          one word per line, sorted in the Ukrainian locale
#   all_aspell.srt.nodups   the sorted list with repeated lines collapsed
#   all_aspell.srt.dups     only the repeated lines, each with its count
#   *.diff                  differences against the *.old snapshots
# diff exits non-zero whenever the files differ, hence the "-" prefix.
regtest: all_aspell_lst
	$(spcr) < all_aspell.lst | $(sort) > all_aspell.srt
	uniq < all_aspell.srt > all_aspell.srt.nodups
	uniq -d -c < all_aspell.srt > all_aspell.srt.dups
	-diff all_aspell.srt.nodups.old all_aspell.srt.nodups > all_aspell.srt.nodups.diff
	-diff all_aspell.srt.dups.old all_aspell.srt.dups > all_aspell.srt.dups.diff
# regtestroll: promote the current results to be the new baseline by renaming
# each existing result file to <name>.old.  Files that do not exist are
# skipped silently; a failing mv now aborts the target instead of being
# ignored.
regtestroll:
	for f in all_aspell.srt.nodups all_aspell.srt.dups Malyk.lst ZN.lst KDE.lst ukr_lit.lst; do \
		if [ -f "$$f" ]; then mv -f "$$f" "$$f.old" || exit 1; fi; \
	done
# text: run each sample text through the spell checker ($(LIST_CMD)) and
# store the words it reports, sorted and case-insensitively de-duplicated,
# in <name>.lst.
#
# The input is always piped into $(LIST_CMD) rather than redirected,
# because the hunspell variant of LIST_CMD expands to a pipeline itself.
text:
	cat src_text/Malyk.txt | $(LIST_CMD) \
		| LC_ALL=uk_UA.UTF-8 sort | LC_ALL=uk_UA.UTF-8 uniq -i > Malyk.lst
	cat src_text/ZN.txt | $(LIST_CMD) \
		| LC_ALL=uk_UA.UTF-8 sort | LC_ALL=uk_UA.UTF-8 uniq -i > ZN.lst
	# KDE.po clean-up: drop "&" characters, normalise the typographic
	# apostrophe, and strip backslash escapes such as \n or \t.  The last
	# expression is single-quoted so sed really receives \\[a-z]; inside
	# double quotes the shell reduced it to \[a-z], which only matched the
	# literal text "[a-z]".
	sed -r -e 's/&//g' -e "s/’/'/g" -e 's/\\[a-z]//g' src_text/KDE.po \
		| $(LIST_CMD) \
		| LC_ALL=uk_UA.UTF-8 sort | LC_ALL=uk_UA.UTF-8 uniq -i > KDE.lst
	sed "s/’/'/g" src_text/ukr_lit.txt \
		| $(LIST_CMD) \
		| LC_ALL=uk_UA.UTF-8 sort | LC_ALL=uk_UA.UTF-8 uniq -i > ukr_lit.lst
# text_regtest: regenerate the per-text word lists, then diff each one
# against its *.old baseline into <name>.diff.
# diff exits non-zero when the lists differ, so the status is ignored ("-").
text_regtest: text
	-for name in Malyk ZN KDE ukr_lit; do \
		diff $$name.lst.old $$name.lst > $$name.diff; \
	done
# reverse: produce all_spell.reverse.lst, the word list ordered by word
# endings.  Each line is reversed, the result is sorted, and the lines are
# reversed back.  The work is done in KOI8-U; the input and output are
# converted from/to UTF-8.
# NOTE(review): all_aspell.srt is written by the "regtest" recipe and has no
# rule of its own, so it must already exist.  The conversion assumes the
# file is UTF-8 -- confirm that this matches SOURCE_ENC.
# The sort stage uses LC_ALL like its neighbours; LANG alone is overridden
# by any LC_ALL or LC_COLLATE present in the environment.
reverse: all_aspell.srt
	$(iconv) -f UTF-8 -t KOI8-U $< \
		| LC_ALL=uk_UA.KOI8-U perl -ne 'print scalar reverse $$_;' \
		| LC_ALL=uk_UA.KOI8-U sort \
		| LC_ALL=uk_UA.KOI8-U perl -ne 'print scalar reverse $$_;' \
		| $(iconv) -f KOI8-U -t UTF-8 > all_spell.reverse.lst
# clean: delete the generated result files matched by $(CLEANFILES).
clean:
	rm -f $(CLEANFILES)

# distclean: everything "clean" removes, plus the files matched by
# $(DISTCLEANFILES).
distclean: clean
	rm -f $(DISTCLEANFILES)
# None of these targets names a file that its recipe creates, so declare
# them phony.  (The old list named "clean_all" and "all_spell_lst", which
# have no rules in this file, and left out several targets that do.)
.PHONY: all all_aspell_lst regtest regtestroll text text_regtest reverse \
        clean distclean