Skip to content

Commit

Permalink
skk dictionaries at 2017-06-09
Browse files Browse the repository at this point in the history
  • Loading branch information
tkita committed Jun 9, 2017
1 parent 9de3b31 commit 8835e5b
Show file tree
Hide file tree
Showing 48 changed files with 1,087,053 additions and 0 deletions.
12,377 changes: 12,377 additions & 0 deletions ChangeLog

Large diffs are not rendered by default.

14,733 changes: 14,733 additions & 0 deletions ChangeLog.1

Large diffs are not rendered by default.

37,039 changes: 37,039 additions & 0 deletions ChangeLog.2

Large diffs are not rendered by default.

28,425 changes: 28,425 additions & 0 deletions ChangeLog.3

Large diffs are not rendered by default.

192 changes: 192 additions & 0 deletions Makefile
Original file line number Diff line number Diff line change
@@ -0,0 +1,192 @@
# Makefile: makefile for SKK Dictionaries.
#
# Maintainer: SKK Development Team <[email protected]>
# Version: $Id: Makefile,v 1.47 2015/01/16 07:34:37 skk-cvs Exp $
# Last Modified: $Date: 2015/01/16 07:34:37 $

BZIP2 = bzip2 -9
COUNT = skkdic-count
DATE = date
EXPR = skkdic-expr
EXPR2 = skkdic-expr2
GAWK = LC_ALL=C gawk
GREP = grep
SED = sed
GZIP = gzip -9
MD5 = md5
RM = /bin/rm -f
RUBY = ruby -I $(TOOLS_DIR)/filters
SORT = skkdic-sort
TAR = tar
#TODAY = `$(DATE) '+%Y%m%d'`
ZIP = zip
ZIPDIC_DIR = ./zipcode

DIC2PDB = dic2pdb
DICCOMPACT = diccompact.rb
KANADIC2ROMADIC = kanadic2romadic
NKF = nkf
SKKDIC2KANADIC = skkdic2kanadic
TOOLS_DIR = ../tools

SRCS = SKK-JISYO.L SKK-JISYO.ML SKK-JISYO.M SKK-JISYO.S SKK-JISYO.JIS2 \
SKK-JISYO.JIS3_4 SKK-JISYO.pubdic+ SKK-JISYO.wrong.annotated \
SKK-JISYO.okinawa SKK-JISYO.geo SKK-JISYO.jinmei SKK-JISYO.law \
SKK-JISYO.mazegaki SKK-JISYO.assoc SKK-JISYO.itaiji \
SKK-JISYO.itaiji.JIS3_4 SKK-JISYO.china_taiwan \
SKK-JISYO.propernoun SKK-JISYO.station SKK-JISYO.requested \
SKK-JISYO.fullname SKK-JISYO.JIS2004 SKK-JISYO.lisp
# SKK-JISYO.noregist SKK-JISYO.hukugougo
BIN_SRCS = #PBinlineDB.pdb
ALL_SRCS = $(SRCS) $(BIN_SRCS) SKK-JISYO.wrong SKK-JISYO.L.unannotated
# SKK-JISYO.L+ SKK-JISYO.L.taciturn SKK-JISYO.total

PYTHON = python
SKK2CDB = skk2cdb.py -f
CDB_SOURCE = ./SKK-JISYO.L
CDB_TARGET = ./`basename $(CDB_SOURCE)`.cdb

clean:
$(RM) *.gz* *.bz2* *.zip* *~ `find . -name '*~'` `find . -name '.*~'` `find . -name '.#*'` \
*.unannotated SKK-JISYO.wrong PBinlineDB.pdb *.tmp *.w PBinlineDB.dic *.taciturn SKK-JISYO.L+ SKK-JISYO.total SKK-JISYO.total+zipcode SKK-JISYO.L.header SKK-JISYO.china_taiwan

archive: gzip #zip bzip2

unannotated: SKK-JISYO.L.unannotated SKK-JISYO.wrong SKK-JISYO.china_taiwan.unannotated

SKK-JISYO.L.unannotated: SKK-JISYO.L
$(GAWK) -f $(TOOLS_DIR)/unannotation.awk SKK-JISYO.L > SKK-JISYO.L.unannotated

SKK-JISYO.wrong: SKK-JISYO.wrong.annotated
$(GAWK) -f $(TOOLS_DIR)/unannotation.awk SKK-JISYO.wrong.annotated > SKK-JISYO.wrong

SKK-JISYO.china_taiwan: csv/china_taiwan.csv
$(RUBY) $(TOOLS_DIR)/convert2skk/ctdicconv.rb csv/china_taiwan.csv > SKK-JISYO.tmp
$(EXPR) SKK-JISYO.tmp | $(SORT) - > SKK-JISYO.1.tmp
cat SKK-JISYO.china_taiwan.header SKK-JISYO.1.tmp > SKK-JISYO.china_taiwan
$(RM) SKK-JISYO.tmp SKK-JISYO.1.tmp

SKK-JISYO.china_taiwan.unannotated: SKK-JISYO.china_taiwan csv/china_taiwan.csv
$(GAWK) -f $(TOOLS_DIR)/unannotation.awk SKK-JISYO.china_taiwan > SKK-JISYO.china_taiwan.unannotated

wrong_check: SKK-JISYO.wrong
for file in $(SRCS) ; do \
if [ $$file != "SKK-JISYO.wrong.annotated" ] ; then \
$(EXPR) $$file - SKK-JISYO.wrong > $$file.tmp ;\
$(EXPR) $$file - $$file.tmp > $$file.w ;\
$(RM) $$file.tmp ;\
$(COUNT) $$file.w | $(GREP) -v '0 candidate' | \
sed -e 's/\.w:/:/' -e 's/\([1-9]\)/\1 wrong/' ;\
if [ $$? != 0 ]; then \
$(RM) $$file.w ; \
fi ;\
fi ;\
done

PBinlineDB.dic: clean SKK-JISYO.L.unannotated
$(SKKDIC2KANADIC) SKK-JISYO.L.unannotated | $(KANADIC2ROMADIC) - | $(NKF) -s > PBinlineDB.dic

PBinlineDB_compact.pdb: PBinlineDB.dic
$(DICCOMPACT) PBinlineDB.dic | $(DIC2PDB) - PBinlineDB.pdb

PBinlineDB_full.pdb: PBinlineDB.dic
$(DIC2PDB) PBinlineDB.dic PBinlineDB.pdb

PBinlineDB.pdb: PBinlineDB_full.pdb
$(RM) PBinlineDB.dic

zip: clean $(ALL_SRCS)
for file in $(ALL_SRCS); do \
$(ZIP) $$file.zip $$file ;\
$(MD5) $$file.zip >$$file.zip.md5; \
done
$(ZIP) SKK-JISYO.edict.zip SKK-JISYO.edict edict_doc.txt
$(ZIP) -r zipcode.zip $(ZIPDIC_DIR) -x@./skk.ex
$(MD5) zipcode.zip >zipcode.zip.md5

gzip: clean $(ALL_SRCS)
for file in $(ALL_SRCS); do \
$(GZIP) -fc $$file >$$file.gz ;\
$(MD5) $$file.gz >$$file.gz.md5; \
done
$(TAR) cvpf SKK-JISYO.edict.tar SKK-JISYO.edict edict_doc.txt
$(GZIP) -f SKK-JISYO.edict.tar
$(MD5) SKK-JISYO.edict.tar.gz > SKK-JISYO.edict.tar.gz.md5
$(TAR) cvzpf zipcode.tar.gz --exclude-from=./skk.ex ./zipcode
$(MD5) zipcode.tar.gz >zipcode.tar.gz.md5

SKK-JISYO.L+: SKK-JISYO.L SKK-JISYO.L.header
$(RUBY) $(TOOLS_DIR)/filters/conjugation.rb -Cpox SKK-JISYO.notes > SKK-JISYO.tmp
$(RUBY) $(TOOLS_DIR)/filters/asayaKe.rb -p SKK-JISYO.L >> SKK-JISYO.tmp
$(RUBY) $(TOOLS_DIR)/filters/complete-numerative.rb -pU SKK-JISYO.L >> SKK-JISYO.tmp
$(RUBY) $(TOOLS_DIR)/filters/abbrev-convert.rb -K -s 2 SKK-JISYO.L >> SKK-JISYO.tmp
$(RUBY) $(TOOLS_DIR)/filters/abbrev-convert.rb -w -s 2 SKK-JISYO.L >> SKK-JISYO.tmp
$(EXPR2) SKK-JISYO.L + SKK-JISYO.tmp | cat SKK-JISYO.L.header - > SKK-JISYO.L+
$(RM) SKK-JISYO.tmp SKK-JISYO.addition

SKK-JISYO.total: SKK-JISYO.L SKK-JISYO.geo SKK-JISYO.station SKK-JISYO.jinmei SKK-JISYO.propernoun SKK-JISYO.fullname SKK-JISYO.law SKK-JISYO.okinawa SKK-JISYO.hukugougo SKK-JISYO.assoc SKK-JISYO.notes SKK-JISYO.L.header
$(RUBY) $(TOOLS_DIR)/filters/conjugation.rb -Cpox SKK-JISYO.notes > SKK-JISYO.tmp
$(RUBY) $(TOOLS_DIR)/filters/asayaKe.rb -p SKK-JISYO.L >> SKK-JISYO.tmp
$(RUBY) $(TOOLS_DIR)/filters/complete-numerative.rb -pU SKK-JISYO.L >> SKK-JISYO.tmp
$(RUBY) $(TOOLS_DIR)/filters/abbrev-convert.rb -K -s 2 SKK-JISYO.L >> SKK-JISYO.tmp
$(RUBY) $(TOOLS_DIR)/filters/abbrev-convert.rb -w -s 2 SKK-JISYO.L >> SKK-JISYO.tmp
# order is very important here
$(EXPR2) SKK-JISYO.geo + SKK-JISYO.station + SKK-JISYO.jinmei + SKK-JISYO.propernoun + SKK-JISYO.fullname + SKK-JISYO.tmp + SKK-JISYO.law + SKK-JISYO.okinawa + SKK-JISYO.hukugougo + SKK-JISYO.assoc - SKK-JISYO.L > SKK-JISYO.addition
# why eliminating SKK-JISYO.L once? -- to not add too noisy
# annotations from SKK-JISYO.jinmei and so on.
$(EXPR2) SKK-JISYO.L + SKK-JISYO.addition | cat SKK-JISYO.L.header - > SKK-JISYO.total
$(RM) SKK-JISYO.tmp SKK-JISYO.addition

SKK-JISYO.total+zipcode: SKK-JISYO.total $(ZIPDIC_DIR)/SKK-JISYO.zipcode $(ZIPDIC_DIR)/SKK-JISYO.office.zipcode SKK-JISYO.L.header
$(EXPR2) SKK-JISYO.total + $(ZIPDIC_DIR)/SKK-JISYO.zipcode + $(ZIPDIC_DIR)/SKK-JISYO.office.zipcode | cat SKK-JISYO.L.header - > SKK-JISYO.total+zipcode

SKK-JISYO.L.taciturn: SKK-JISYO.L SKK-JISYO.L.header
$(RUBY) $(TOOLS_DIR)/filters/annotation-filter.rb -d SKK-JISYO.L | $(EXPR2) | cat SKK-JISYO.L.header - > SKK-JISYO.L.taciturn

SKK-JISYO.L+.taciturn: SKK-JISYO.L+ SKK-JISYO.L.header
$(RUBY) $(TOOLS_DIR)/filters/annotation-filter.rb -d SKK-JISYO.L+ | $(EXPR2) | cat SKK-JISYO.L.header - > SKK-JISYO.L+.taciturn

SKK-JISYO.total.taciturn: SKK-JISYO.total SKK-JISYO.L.header
$(RUBY) $(TOOLS_DIR)/filters/annotation-filter.rb -d SKK-JISYO.total | $(EXPR2) | cat SKK-JISYO.L.header - > SKK-JISYO.total.taciturn

SKK-JISYO.total+zipcode.taciturn: SKK-JISYO.total+zipcode SKK-JISYO.L.header
$(RUBY) $(TOOLS_DIR)/filters/annotation-filter.rb -d SKK-JISYO.total+zipcode | $(EXPR2) | cat SKK-JISYO.L.header - > SKK-JISYO.total+zipcode.taciturn

SKK-JISYO.L+.unannotated: SKK-JISYO.L+
$(GAWK) -f $(TOOLS_DIR)/unannotation.awk SKK-JISYO.L+ > SKK-JISYO.L+.unannotated

SKK-JISYO.total.unannotated: SKK-JISYO.total
$(GAWK) -f $(TOOLS_DIR)/unannotation.awk SKK-JISYO.total > SKK-JISYO.total.unannotated

SKK-JISYO.total+zipcode.unannotated: SKK-JISYO.total+zipcode
$(GAWK) -f $(TOOLS_DIR)/unannotation.awk SKK-JISYO.total+zipcode > SKK-JISYO.total+zipcode.unannotated

SKK-JISYO.L.header: SKK-JISYO.L
echo ';; (This dictionary was automatically generated from SKK dictionaries)' > SKK-JISYO.L.header
$(SED) -n '/^;; okuri-ari entries./q;p' SKK-JISYO.L >> SKK-JISYO.L.header

unannotated-all: unannotated SKK-JISYO.L+.unannotated SKK-JISYO.total.unannotated SKK-JISYO.total+zipcode.unannotated

taciturn-all: SKK-JISYO.L.taciturn SKK-JISYO.L+.taciturn SKK-JISYO.total.taciturn SKK-JISYO.total+zipcode.taciturn

annotated-all: SKK-JISYO.L+ SKK-JISYO.total SKK-JISYO.total+zipcode

all: annotated-all unannotated-all taciturn-all

cdb:
$(PYTHON) $(TOOLS_DIR)/$(SKK2CDB) $(CDB_TARGET) $(CDB_SOURCE)

# bzip2: clean $(SRCS)
# for file in $(SRCS); do \
# $(BZIP2) -fc $$file >$$file.bz2 ;\
# $(MD5) $$file.bz2 >$$file.bz2.md5; \
# done
# $(TAR) cvpf SKK-JISYO.edict.tar SKK-JISYO.edict edict_doc.txt
# $(BZIP2) -f SKK-JISYO.edict.tar
# $(MD5) SKK-JISYO.edict.tar.bz2 > SKK-JISYO.edict.tar.bz2.md5
# # $(TAR) cvpf zipcode.tar ./zipcode --exclude-from=./skk.ex
# $(TAR) cvpf zipcode.tar ./zipcode
# $(BZIP2) -f zipcode.tar
# $(MD5) zipcode.tar.bz2 >zipcode.tar.bz2.md5

# end of Makefile.
Loading

0 comments on commit 8835e5b

Please sign in to comment.