xwords/xwords4/dawg/Danish/info.txt
Eric House df14108e4e add lowercase equivalents
where missing and seems possible
2019-07-07 13:00:06 -07:00

74 lines
2 KiB
Text

# Copyright 2005 by Eric House (xwords@eehouse.org). All rights reserved.
#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License
# as published by the Free Software Foundation; either version 2
# of the License, or (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
LANGCODE:da_DK
CHARSET: utf-8
# strip carriage returns from DOS-format (CRLF) files
LANGFILTER: tr -d '\r'
# uppercase all
LANGFILTER: | tr [a-zåæø] [A-ZÅÆØ]
# drop words that contain no vowel
LANGFILTER: | grep '[AEIOUYÅÆØ]'
# none with illegal chars
LANGFILTER: | grep '^[A-PR-VX-ZÅÆØ]\+$'
# remove duplicates
LANGFILTER: | sort -u
# Until I can figure out how to force sort to use a locale's collation
# rules, we can't trust the ordering produced by sort in the filtering
# rules above, and so must leave the sorting work to dict2dawg.pl.
D2DARGS: -r -term 10
LANGINFO: <p>Danish uses all English letters except Q and W. There
LANGINFO: are three non-English letters: 'Å', 'Æ' and 'Ø'. </p>
# High bit means "official". The next 7 bits are an enum where
# Danish==9, so the high byte is 0x80|0x09 = 0x89. The low byte is padding.
XLOC_HEADER:0x8900
<BEGIN_TILES>
2 0 {"_"}
7 1 'A|a'
2 4 'Å|å'
2 4 'Æ|æ'
4 3 'B|b'
2 8 'C|c'
5 2 'D|d'
9 1 'E|e'
3 3 'F|f'
3 3 'G|g'
2 4 'H|h'
4 3 'I|i'
2 4 'J|j'
4 3 'K|k'
5 2 'L|l'
3 3 'M|m'
6 1 'N|n'
5 2 'O|o'
2 4 'Ø|ø'
2 4 'P|p'
6 1 'R|r'
5 2 'S|s'
5 2 'T|t'
3 3 'U|u'
3 3 'V|v'
1 8 'X|x'
2 4 'Y|y'
1 8 'Z|z'
<END_TILES>
# Everything after the <END_TILES> line above should be ignored.