From 5e02ca1c869542f64e32190bb4dfb2f656991d8e Mon Sep 17 00:00:00 2001 From: ehouse Date: Wed, 22 Jun 2005 06:40:53 +0000 Subject: [PATCH] first checked in. Seems to work. --- xwords4/dawg/Dutch/.cvsignore | 3 ++ xwords4/dawg/Dutch/Makefile | 41 +++++++++++++++++++ xwords4/dawg/Dutch/info.txt | 76 +++++++++++++++++++++++++++++++++++ 3 files changed, 120 insertions(+) create mode 100644 xwords4/dawg/Dutch/.cvsignore create mode 100644 xwords4/dawg/Dutch/Makefile create mode 100644 xwords4/dawg/Dutch/info.txt diff --git a/xwords4/dawg/Dutch/.cvsignore b/xwords4/dawg/Dutch/.cvsignore new file mode 100644 index 000000000..086c16f6f --- /dev/null +++ b/xwords4/dawg/Dutch/.cvsignore @@ -0,0 +1,3 @@ +*.bin +*.xwd +*.pdb diff --git a/xwords4/dawg/Dutch/Makefile b/xwords4/dawg/Dutch/Makefile new file mode 100644 index 000000000..c51647009 --- /dev/null +++ b/xwords4/dawg/Dutch/Makefile @@ -0,0 +1,41 @@ +# -*- mode: makefile -*- +# Copyright 2002 by Eric House (fixin@peak.org). All rights reserved. +# +# This program is free software; you can redistribute it and/or +# modify it under the terms of the GNU General Public License +# as published by the Free Software Foundation; either version 2 +# of the License, or (at your option) any later version. +# +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License +# along with this program; if not, write to the Free Software +# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 
+
+LANG=Dutch
+LANGCODE=nl_NL
+
+TARGET_TYPE ?= PALM
+
+include ../Makefile.2to8
+
+include ../Makefile.langcommon
+
+SOURCEDICT ?= $(XWDICTPATH)/$(LANG)/Dutch__unofficial_alphabetical.dict.gz
+# Build the filtered word list; tr sets are quoted so the shell can't glob them.
+$(LANG)Main.dict.gz: $(SOURCEDICT) Makefile
+	zcat $< | tr -d '\r' | tr '[a-zäöü]' '[A-ZÄÖÜ]' | \
+		grep '[AEIOU]' | grep '^[A-Z]\+$$' | sort -u | \
+		gzip -c > $@
+
+# Everything but the creation of Main.dict is inherited from
+# ../Makefile.langcommon.  clean and help are commands, not files.
+.PHONY: clean help
+clean: clean_common
+	rm -f $(LANG)Main.dict.gz *.bin $(LANG)*.pdb $(LANG)*.seb
+
+help:
+	@echo 'make [SOURCEDICT=Dutch__unofficial_alphabetical.dict.gz]'
diff --git a/xwords4/dawg/Dutch/info.txt b/xwords4/dawg/Dutch/info.txt
new file mode 100644
index 000000000..d050553e9
--- /dev/null
+++ b/xwords4/dawg/Dutch/info.txt
@@ -0,0 +1,76 @@
+# Copyright 2002 by Eric House (fixin@peak.org). All rights reserved.
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
+ +LANGCODE:nl_NL + + +# deal with DOS files +LANGFILTER_PRECLIP: tr -d '\r' | + +# uppercase all +LANGFILTER_POSTCLIP: | tr [a-zäöü] [A-ZÄÖÜ] +# no words not containing a vowel +LANGFILTER_POSTCLIP: | grep '[AEIOU]' +# none with illegal chars +LANGFILTER_POSTCLIP: | grep '^[A-Z]\+$' +LANGFILTER_POSTCLIP: | tr -s '\n' '\000' + +# Until I can figure out how to force sort to use a locale's collation +# rules we can't trust sort in the filtering rules above and so must +# leave the sorting work to dict2dawg.pl. + +NEEDSSORT:true + +LANGINFO:

<p>Dutch has the same 26 letters as English, though of +LANGINFO: course the counts and values are different. Filtering rules +LANGINFO: eliminate all words that don't contain at least one vowel +LANGINFO: and any that contain letters not found on tiles.</p>

+ +# High bit means "official". Next 7 bits are an enum where +# Dutch==B. Low byte is padding +XLOC_HEADER:0x8B00 + + + +2 0 {"_"} +6 1 'A' +2 3 'B' +2 5 'C' +5 2 'D' +16 1 'E' +2 4 'F' +2 3 'G' +2 4 'H' +4 1 'I' +2 4 'J' +3 3 'K' +3 3 'L' +3 3 'M' +8 1 'N' +6 1 'O' +3 3 'P' +1 10 'Q' +5 2 'R' +5 2 'S' +5 2 'T' +4 4 'U' +2 4 'V' +2 5 'W' +1 8 'X' +2 4 'Y' +2 4 'Z' + +# should ignore all after the above