mirror of
git://xwords.git.sourceforge.net/gitroot/xwords/xwords
synced 2025-01-23 07:27:22 +01:00
fb2fcf15cc
Find-prefix feature in current code crashes on Hungarian because it allows duplicates (words that occur spelled with the same letters but different tile combinations.) Modify Makefile to exclude those (as it does for all other multi-letter-tile languages). And to pull the git source of the wordlist on demand.
88 lines
2.8 KiB
Makefile
88 lines
2.8 KiB
Makefile
# -*-mode: Makefile; -*-
|
|
# Copyright 2002-2020 by Eric House (xwords@eehouse.org). All rights
|
|
# reserved.
|
|
#
|
|
# This program is free software; you can redistribute it and/or
|
|
# modify it under the terms of the GNU General Public License
|
|
# as published by the Free Software Foundation; either version 2
|
|
# of the License, or (at your option) any later version.
|
|
#
|
|
# This program is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
# GNU General Public License for more details.
|
|
#
|
|
# You should have received a copy of the GNU General Public License
|
|
# along with this program; if not, write to the Free Software
|
|
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
|
|
|
|
XWLANG=Hungarian
|
|
LANGCODE=hu_HU
|
|
ENC = UTF-8
|
|
TARGET_TYPE ?= WINCE
|
|
|
|
DICTNOTE = "Derived from szotar/alap/ in https://github.com/laszlonemeth/magyarispell.git"
|
|
|
|
LANG_SPECIAL_INFO = \
|
|
"CS Cs cS cs" /dev/null /dev/null \
|
|
"GY Gy gY gy" /dev/null /dev/null \
|
|
"LY Ly lY ly" /dev/null /dev/null \
|
|
"NY Ny nY ny" /dev/null /dev/null \
|
|
"SZ Sz sZ sz" /dev/null /dev/null \
|
|
"TY Ty tY ty" /dev/null /dev/null \
|
|
"ZS Zs zS zs" /dev/null /dev/null \
|
|
|
|
include ../Makefile.langcommon
|
|
|
|
GIT_DIR = ./magyarispell
|
|
SRC_COMMIT = 39ee7f3f8631b953d44ed6f12cfe8ae7193fbf13
|
|
|
|
SRC = \
|
|
${GIT_DIR}/szotar/alap/fonev.1 \
|
|
${GIT_DIR}/szotar/alap/melleknev.1 \
|
|
${GIT_DIR}/szotar/alap/ige_alanyi.1 \
|
|
${GIT_DIR}/szotar/alap/ige_targy.1 \
|
|
${GIT_DIR}/szotar/alap/ragozatlan.2
|
|
|
|
PHONY: GIT_TREE
|
|
|
|
$(SRC) : GIT_TREE
|
|
|
|
GIT_TREE:
|
|
if [ ! -d $(GIT_DIR) ]; then \
|
|
mkdir -p $(GIT_DIR); \
|
|
git clone https://github.com/laszlonemeth/magyarispell.git $(GIT_DIR); \
|
|
fi
|
|
(cd $(GIT_DIR) && git checkout $(SRC_COMMIT))
|
|
|
|
hungarian_wordlist.txt: $(SRC)
|
|
cat $^ | \
|
|
sed -e 's/#.*$$//' -e 's/\[.*$$//' -e 's/ .*$$//' |\
|
|
grep -v '^$$' |\
|
|
sort -u > $@
|
|
|
|
# Filtering wordlist: When a word can be spelled with either a
|
|
# double-letter tile or two single-letter tiles, it's in the list with
|
|
# both spellings. That's what the longer sed expressions are doing
|
|
# (emitting two words)
|
|
$(XWLANG)Main.dict.gz: hungarian_wordlist.txt
|
|
cat $< \
|
|
| tr -d '\r' \
|
|
| tr [aábcdeéfghiíjklmnnyoóöőprtuúüűvzs] [AÁBCDEÉFGHIÍJKLMNNYOÓÖŐPRTUÚÜŰVZS] \
|
|
| grep -v '1\|2\|3\|4\|5\|6\|7' \
|
|
| sed -e 's,CS,1,g' \
|
|
| sed -e 's,GY,2,g' \
|
|
| sed -e 's,LY,3,g' \
|
|
| sed -e 's,NY,4,g' \
|
|
| sed -e 's,SZ,5,g' \
|
|
| sed -e 's,TY,6,g' \
|
|
| sed -e 's,ZS,7,g' \
|
|
| grep '^[1-7AÁBCDEÉFGHIÍJKLMNOÓÖŐPRSTUÚÜŰVZ]*$$' \
|
|
| tr '1234567' '\001\002\003\004\005\006\007' \
|
|
| gzip -c > $@
|
|
|
|
# Everything but creating of the Main.dict file is inherited from the
|
|
# "parent" Makefile.langcommon in the parent directory.
|
|
|
|
clean: clean_common
|
|
rm -f $(XWLANG)Main.dict.gz *.bin $(XWLANG)*.pdb $(XWLANG)*.seb hungarian_wordlist.txt
|