xwords/xwords4/dawg/German/info.txt

# -*- mode: conf; coding: utf-8; -*-
# Copyright 2002 - 2010 by Eric House (xwords@eehouse.org).  All
# rights reserved.
#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License
# as published by the Free Software Foundation; either version 2
# of the License, or (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.

LANGCODE:de_DE
CHARSET: utf-8

# The filter lines below form the stages of one shell pipeline (every
# stage after the first begins with '|') that cleans the raw word list.

# deal with DOS files
LANGFILTER: tr -d '\r'
# substitute for scharfes-s
LANGFILTER: | sed -e 's/ß/SS/g'
# uppercase all.  The sets are quoted so the shell cannot expand the
# brackets as a filename pattern.
LANGFILTER: | tr '[a-zäöü]' '[A-ZÄÖÜ]'
# no words not containing a vowel (this filter is currently disabled)
# LANGFILTER: | grep '[AEIOUÄÖÜ]'
# none with illegal chars
LANGFILTER: | grep '^[A-ZÄÖÜ]\+$'

# Until I can figure out how to force sort to use a locale's collation
# rules, we can't trust sort in the filtering rules above, so the
# sorting work is left to dict2dawg.pl.
# NOTE(review): the arguments below are presumably passed through to
# dict2dawg.pl; the meaning of each flag is not visible in this file --
# confirm against that script.
D2DARGS: -r -term 10

# Human-readable description of the language and of the word-list
# filtering applied above.  Keep it in step with the filter rules that
# are actually active: the "at least one vowel" filter is disabled, so
# it is not mentioned here.
LANGINFO: <p>German has the 26 English letters plus the three umlaut
LANGINFO: vowels.  Scharfes-s is not a legal tile, but if present in
LANGINFO: the wordlist submitted it'll be converted to "SS" by our
LANGINFO: filtering rules.  Additional filtering rules eliminate all
LANGINFO: words that contain letters not found on tiles.</p>

# 16-bit header value.  The high bit (0x8000) means "official".  The
# next 7 bits are a language enum where German==3 (0x0300).  The low
# byte is padding (0x00).  Together: 0x8000 | 0x0300 = 0x8300.
XLOC_HEADER:0x8300


# Tile table: one row per tile face, columns separated by tabs.
# NOTE(review): the columns appear to be <number of tiles> <point value>
# <face, as 'UPPER|lower'>, with the first row describing the blank
# tile -- confirm against the script that parses this table.
<BEGIN_TILES>
2			0		{"_"}
5			1		'A|a'
1			6		'Ä|ä'
2			3		'B|b'
2			4		'C|c'
4			1		'D|d'
15			1		'E|e'
2			4		'F|f'
3			2		'G|g'
4			2		'H|h'
6			1		'I|i'
1			6		'J|j'
2			4		'K|k'
3			2		'L|l'
4			3		'M|m'
9			1		'N|n'
3			2		'O|o'
1			8		'Ö|ö'
1			4		'P|p'
1			10		'Q|q'
6			1		'R|r'
7			1		'S|s'
6			1		'T|t'
6			1		'U|u'
1			6		'Ü|ü'
1			6		'V|v'
1			3		'W|w'
1			8		'X|x'
1			10		'Y|y'
1			3		'Z|z'
<END_TILES>
# The parser should ignore everything after the <END_TILES> line above.