Initial revision

2024-12-27 09:58:45 +01:00 · 2003-09-07 17:16:50 +00:00 · 2003-09-07 17:16:50 +00:00 · ec410e7b21
commit ec410e7b21
parent 88f0865a4e
26 changed files with 4045 additions and 0 deletions
--- a/xwords4/xwords4/dawg/English/Makefile
+++ b/xwords4/xwords4/dawg/English/Makefile
@ -0,0 +1,40 @@
+# -*-mode: Makefile -*-
+# Copyright 2002 by Eric House (fixin@peak.org).  All rights reserved.
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+# Platform to build for (PALM or FRANK); override on the command line.
+TARGET_TYPE ?= FRANK
+
+# Arguments used to delegate to the default dictionary makefile.  The
+# caller's TARGET_TYPE is passed through so that, for example,
+# "make TARGET_TYPE=PALM all" is not silently turned into a FRANK build.
+COMMAND = -f Makefile.BasEnglish TARGET_TYPE=$(TARGET_TYPE)
+
+# None of these names is a file produced by this makefile.
+.PHONY: alleng all clean help
+
+# Build every English dictionary, stopping at the first one that fails.
+alleng:
+	for mfile in Makefile.BasEnglish Makefile.OSW Makefile.TWL98 Makefile.CollegeEng; do \
+		$(MAKE) -f $$mfile TARGET_TYPE=$(TARGET_TYPE) || exit 1; \
+	done
+
+# Any goal not defined here is forwarded to the default dictionary makefile.
+%:
+	$(MAKE) $(COMMAND) $@
+
+all:
+	$(MAKE) $(COMMAND)
+
+clean:
+	$(MAKE) $(COMMAND) clean
+
+help:
+	@echo "try make -f Makefile.[BasEnglish|CollegeEng] \\"
+	@echo "    TARGET_TYPE=[PALM|FRANK]"
+
--- a/xwords4/xwords4/dawg/English/Makefile.BasEnglish
+++ b/xwords4/xwords4/dawg/English/Makefile.BasEnglish
@ -0,0 +1,35 @@
+# -*-mode: Makefile -*-
+# Copyright 2002 by Eric House (fixin@peak.org).  All rights reserved.
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+# Settings read by the included ../Makefile.langcommon.
+LANG=BasEnglish
+LANGCODE=en_US
+#NEWDAWG=1
+
+TARGET_TYPE ?= FRANK
+
+include ../Makefile.2to8
+
+include ../Makefile.langcommon
+
+# -f replaces a stale or dangling link instead of failing with
+# "File exists".
+$(LANG)Main.dict.gz: BasEnglish.dict.gz
+	ln -sf $< $@
+
+# Everything but creating of the Main.dict file is inherited from the
+# "parent" Makefile.langcommon in the parent directory.
+
+.PHONY: clean
+clean: clean_common
+	rm -f $(LANG)Main.dict.gz *.bin $(LANG)*.pdb $(LANG)*.seb
--- a/xwords4/xwords4/dawg/English/Makefile.CollegeEng
+++ b/xwords4/xwords4/dawg/English/Makefile.CollegeEng
@ -0,0 +1,34 @@
+# -*- mode: makefile; -*-
+# Copyright 2002 by Eric House (fixin@peak.org).  All rights reserved.
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+# Settings read by the included ../Makefile.langcommon.
+LANG=CollegeEng
+LANGCODE=en_US
+#NEWDAWG=1
+# Default only (matches Makefile.BasEnglish); a value supplied by the
+# caller is kept.
+TARGET_TYPE ?= FRANK
+
+include ../Makefile.2to8
+
+include ../Makefile.langcommon
+
+# -f replaces a stale or dangling link instead of failing with
+# "File exists".
+$(LANG)Main.dict.gz: CollegeEng.dict.gz
+	ln -sf $< $@
+
+# Everything but creating of the Main.dict file is inherited from the
+# "parent" Makefile.langcommon in the parent directory.
+
+.PHONY: clean
+clean: clean_common
+	rm -f $(LANG)Main.dict.gz *.bin $(LANG)*.pdb $(LANG)*.seb
--- a/xwords4/xwords4/dawg/English/Makefile.OSPD
+++ b/xwords4/xwords4/dawg/English/Makefile.OSPD
@ -0,0 +1,33 @@
+# -*- mode: makefile; compile-command: "make -f Makefile.OSPD TARGET_TYPE=PALM"; -*-
+# Copyright 2002 by Eric House (fixin@peak.org).  All rights reserved.
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+# Settings read by the included ../Makefile.langcommon.  NEWDAWG is
+# defined here, which selects the ifdef NEWDAWG branches in that file.
+LANG=OSPD
+LANGCODE=en_US
+NEWDAWG=1
+
+include ../Makefile.2to8
+
+include ../Makefile.langcommon
+
+# -f replaces a stale or dangling link instead of failing with
+# "File exists".
+$(LANG)Main.dict.gz: OSPD.dict.gz
+	ln -sf $< $@
+
+# Everything but creating of the Main.dict file is inherited from the
+# "parent" Makefile.langcommon in the parent directory.
+
+.PHONY: clean
+clean: clean_common
+	rm -f $(LANG)Main.dict.gz *.bin
--- a/xwords4/xwords4/dawg/English/info.data
+++ b/xwords4/xwords4/dawg/English/info.data
@ -0,0 +1,35 @@
+# I'm a comment.  Any line beginning with this char will be dropped
+
+LANGCODE:en_US
+
+<BEGIN>
+2			0		{"_"}
+9			1		'A'
+2			3		'B'
+2			3		'C'
+4			2		'D'
+12			1		'E'
+2			4		'F'
+3			2		'G'
+2			4		'H'
+9			1		'I'
+1			8		'J'
+1			5		'K'
+4			1		'L'
+2			3		'M'
+6			1		'N'
+8			1		'O'
+2			3		'P'
+1			10		'Q'
+6			1		'R'
+4			1		'S'
+6			1		'T'
+4			1		'U'
+2			4		'V'
+2			4		'W'
+1			8		'X'
+2			4		'Y'
+1			10		'Z'
+
+<END>
+# should ignore all after the <END> above
--- a/xwords4/xwords4/dawg/English/info.txt
+++ b/xwords4/xwords4/dawg/English/info.txt
@ -0,0 +1,71 @@
+# Copyright 2002 by Eric House (fixin@peak.org).  All rights reserved.
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+LANGCODE:en_US
+
+# deal with DOS files
+LANGFILTER_PRECLIP: tr -d '\r' |
+
+LANGFILTER_POSTCLIP: | tr [a-z] [A-Z]
+LANGFILTER_POSTCLIP: | grep '^[A-Z]*$'
+LANGFILTER_POSTCLIP: | tr -s '\n\r' '\000\000'
+LANGFILTER_POSTCLIP: | sort -z
+
+# We can trust sort (above) to do the right thing since there's no
+# high ascii.  dict2dawg.pl is much faster if I can trust that its
+# input is in sorted order.
+NEEDSSORT:false
+
+LANGINFO: <p>English dictionaries can contain words with any of the 26
+LANGINFO: letters you think of as making up the alphabet: A-Z.  At
+LANGINFO: this point any word in your list containing anything else
+LANGINFO: will simply be excluded from the dictionary.</p>
+
+# High bit means "official".  Next 7 bits are an enum where
+# English==1.  Low byte is padding
+XLOC_HEADER:0x8100
+
+<BEGIN_TILES>
+2			0		{"_"}
+9			1		'A'
+2			3		'B'
+2			3		'C'
+4			2		'D'
+12			1		'E'
+2			4		'F'
+3			2		'G'
+2			4		'H'
+9			1		'I'
+1			8		'J'
+1			5		'K'
+4			1		'L'
+2			3		'M'
+6			1		'N'
+8			1		'O'
+2			3		'P'
+1			10		'Q'
+6			1		'R'
+4			1		'S'
+6			1		'T'
+4			1		'U'
+2			4		'V'
+2			4		'W'
+1			8		'X'
+2			4		'Y'
+1			10		'Z'
+<END_TILES>
+
+# should ignore all after the <END_TILES> above
--- a/xwords4/xwords4/dawg/Makefile.2to8
+++ b/xwords4/xwords4/dawg/Makefile.2to8
@ -0,0 +1,7 @@
+# -*-mode: Makefile -*-
+
+# These are the word-length variables that almost all language makefiles will want.
+
+SHORT_WORD = 2
+LONG_WORD = 8
+
--- a/xwords4/xwords4/dawg/Makefile.langcommon
+++ b/xwords4/xwords4/dawg/Makefile.langcommon
@ -0,0 +1,249 @@
+# -*-mode: Makefile -*-
+
+# Copyright 2000-2002 by Eric House (fixin@peak.org)
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+# Extension of the intermediate Franklin dictionary file.
+FRANK_EXT = xwd
+
+# this will make all dicts the new, larger type
+#FORCE_4 = -force4
+
+PALM_DICT_TYPE = DAWG
+PAR = ../par.pl
+#PAR = par				# available from djw.org
+
+# Name of the current directory.  Computed once with make built-ins
+# rather than forking a shell on every expansion.
+LANGUAGE := $(notdir $(CURDIR))
+
+#all: target_all
+
+# let languages set this first, but we always add blank to it.
+BLANK_INFO =  "_" /dev/null /dev/null
+
+# Supply a default so don't have to type so much; feel free to change
+TARGET_TYPE ?= FRANK
+
+# Table-format argument handed to ../dict2dawg.pl.  The assignments are
+# indented with spaces, not a tab: a tab-indented line would be taken as
+# recipe text if a rule happened to precede this file's inclusion.
+ifdef NEWDAWG
+  TABLE_ARG = -mn
+else
+  TABLE_ARG = -m
+endif
+
+##############################################################################
+# PalmOS rules
+##############################################################################
+ifeq ($(TARGET_TYPE),PALM)
+
+# Type argument passed to $(PAR) when the .pdb is created.  Indented
+# with spaces so the assignments can never be parsed as recipe lines.
+ifdef NEWDAWG
+  PDBTYPE = Xwr4
+else
+  PDBTYPE = Xwr3
+endif
+
+# Default PalmOS goal: the database for the 2to8 stem.
+all: $(LANG)2to8.pdb
+
+# The database for the 0to0 stem.
+empty: $(LANG)0to0.pdb
+
+# Those languages that have bitmap files for custom glyphs will need to
+# define BMPBINFILES and perhaps provide a rule for building the files
+binfiles.stamp: $(BMPBINFILES)
+	touch binfiles.stamp
+
+# Runs ../palm_mkspecials.pl (the first prerequisite) with the blank-tile
+# info followed by $(LANG_SPECIAL_INFO); its stdout becomes the target.
+palmspecials.bin: ../palm_mkspecials.pl $(BMPFILES)
+	$< $(BLANK_INFO) $(LANG_SPECIAL_INFO) > $@
+
+# can't just use values.bin because the specials bitmap info is
+# platform-specific
+palmvalues.bin: values.bin palmspecials.bin
+	cat $^ > $@
+
+# values.bin: palmspecials.bin ../xloc binfiles.stamp
+# 	cd ../ && $(MAKE) xloc
+# 	binfileparms=""; \
+# 		if [ "$(BMPBINFILES)" != "" ]; then \
+# 			for f in $(BMPBINFILES)""; \
+# 				do binfileparms="$$binfileparms -i $$f"; \
+# 			done; \
+# 		fi; \
+# 		../xloc -l $(LANGCODE) $$binfileparms -T $@
+# 		cat palmspecials.bin >> $@
+
+# header (first record) is node count (long) and 4 chars: 
+#    unsigned char firstEdgeRecNum;
+#    unsigned char charTableRecNum;
+#    unsigned char valTableRecNum;
+#    unsigned char reserved[3]; // worst case this points to a new resource
+
+# include "flags" as used on the other platforms
+#
+# The target is assembled by appending, in order: the flags file (only
+# when NEWDAWG is defined), the word-count file ($<), and the fixed
+# bytes emitted by the perl one-liners below.
+palmheader%.bin: $(LANG)%_wordcount.bin $(LANG)%_flags.bin
+	rm -f $@
+	touch $@
+ifdef NEWDAWG
+	cat $(LANG)$*_flags.bin >> $@
+endif
+	cat $< >> $@
+	perl -e "print pack(\"C\",3)" >> $@	# first edge
+	perl -e "print pack(\"C\",1)" >> $@	# char table rec number
+	perl -e "print pack(\"C\",2)" >> $@	# valTable rec number
+	perl -e "print pack(\"CCC\",0)" >> $@	# reserved 3 bytes
+	perl -e "print pack(\"CC\",0)" >> $@	# c code added two more...
+
+
+# This works, but leaves out the header info that the current version
+# has.  I'm not sure anybody cares, though...
+#
+# Invokes $(PAR) with the header, table and values files followed by
+# every file matching the shell glob dawg$(LANG)<stem>_*.bin.  Those
+# .bin files are not listed as prerequisites; only the stamp is.
+$(LANG)%.pdb: dawg$(LANG)%.stamp table.bin palmvalues.bin palmheader%.bin 
+	$(PAR) c -a backup $@ \
+		$(basename $(@F)) $(PALM_DICT_TYPE) $(PDBTYPE) \
+		palmheader$*.bin table.bin palmvalues.bin dawg$(LANG)$*_*.bin
+
+#	start=$$(echo $@ | sed -e 's/$(LANG)\([0-9]*\)to[0-9]*.pdb/\1/'); \
+#	end=$$(echo $@ | sed -e 's/$(LANG)[0-9]*to\([0-9]*\).pdb/\1/'); \
+#	zcat $< | grep "^.\{$${start},$${end}\}$$" | \
+#		../dict2pdb -t table.bin -v values.bin -n $(basename $(@F)) \
+#		> $@
+
+# the files to export for byod
+# (this definition is only read when TARGET_TYPE is PALM)
+byodbins: table.bin values.bin palmvalues.bin 
+
+#endif				# TARGET_TYPE==PALM
+
+##############################################################################
+# Franklin ebook rules
+##############################################################################
+else
+ifeq ($(TARGET_TYPE),FRANK)
+
+# Default Franklin goal: the .seb for the 2to8 stem.
+all: $(LANG)2to8.seb
+
+# The .seb for the 0to0 stem.
+empty: $(LANG)0to0.seb
+
+# get defn of ESDK_CREATESEB_EXE
+# NOTE(review): EBOOKMAN_SDK is not assigned anywhere in this file;
+# presumably it must come from the environment or the command line --
+# confirm.
+include ${EBOOKMAN_SDK}/ebsdk.uses
+
+# One-byte binary file holding the tile count of the dictionary: the
+# byte size of table.bin, halved when NEWDAWG is defined.
+charcount.bin: table.bin
+ifdef NEWDAWG
+	nbytes=$$(wc -c < $<); \
+	perl -e "print pack(\"c\",$$nbytes/2)" > $@
+else
+	nbytes=$$(wc -c < $<); \
+	perl -e "print pack(\"c\",$$nbytes)" > $@
+endif
+
+# For each entry in the table whose face < 32, there needs to be a pair of
+# pbitm files and a string giving the printing form
+frankspecials.bin: ../frank_mkspecials.pl  $(BMPFILES)
+	$< $(BLANK_INFO) $(LANG_SPECIAL_INFO) > $@
+
+# Concatenates, in order: flags, tile count, table, values, specials,
+# $(LANG)StartLoc.bin and every dawg$(LANG)<stem>_*.bin file; then
+# leaves a copy of the result in saveme.bin.
+# $(LANG)StartLoc.bin is not a prerequisite of this rule; it is named as
+# the -sn argument in the dawg$(LANG)%.stamp recipe.
+$(LANG)%.$(FRANK_EXT): dawg$(LANG)%.stamp $(LANG)%_flags.bin charcount.bin table.bin values.bin frankspecials.bin
+	cat $(LANG)$*_flags.bin charcount.bin table.bin values.bin \
+		frankspecials.bin $(LANG)StartLoc.bin $$(ls dawg$(LANG)$*_*.bin) > $@
+	cp $@ saveme.bin
+
+# Packages the dictionary with ${ESDK_CREATESEB_EXE} and keeps a copy of
+# the input file under <input>.saved.
+$(LANG)%.seb: $(LANG)%.$(FRANK_EXT) $(LANG)%.atts
+	${ESDK_CREATESEB_EXE} $<
+	cp $< $<.saved
+
+# Attribute file for the .seb.  The first line truncates the file so a
+# leftover copy (make -B, interrupted build) cannot pick up duplicate
+# entries; the remaining lines append.
+# NOTE(review): _NAME is always "$(LANG)2to8", even for other stems such
+# as 0to0 -- confirm whether "$(LANG)$*" was intended.
+$(LANG)%.atts:			#recreate it each time based on params
+	echo '_PUB|global+read-only|"Eric_House"' > $@
+	echo "_NAME|global+read-only|\"$(LANG)2to8\""  >> $@
+	echo "_EXT|global+read-only|\"$(FRANK_EXT)\""  >> $@
+	echo '_LCAT|nosign+global|"CONTENT"'  >> $@
+	echo '_PERM|global+read-only|"r"' >> $@
+
+# values.bin: ../xloc 
+# 	cd ../ && $(MAKE) xloc
+# 	../xloc -l $(LANGCODE) -T $@
+
+# the files to export for byod
+byodbins: table.bin values.bin frankspecials.bin
+
+
+else
+$(error TARGET_TYPE must be PALM or FRANK; got '$(TARGET_TYPE)')
+endif				#ifeq ($(TARGET_TYPE),FRANK)
+endif
+
+# Stop with a readable message, rather than a syntax error, when
+# TARGET_TYPE is empty.
+ifeq ($(strip $(TARGET_TYPE)),)
+$(error TARGET_TYPE is not set; use TARGET_TYPE=PALM or TARGET_TYPE=FRANK)
+endif
+
+##############################################################################
+# shared rules
+##############################################################################
+
+# For some reason I can't fathom dawg$(LANG)% gets nuked every time
+# the top-level rule fires (all: for whatever TARGET_TYPE.)  It
+# happens after the rule finishes....
+
+# 16 bits worth of flags for the start of the eventual file.  At this
+# point, the flags mean this:
+# 1: old-style DAWG.
+# 2: new-style DAWG, three bytes per node.
+# 3: new-style DAWG, four bytes per node
+# Writes the two-byte flags word according to the node size recorded in
+# $(LANG)<stem>_nodesize.bin.  The comparison uses "=", the only string
+# equality operator POSIX guarantees for "[": "==" is rejected by
+# shells such as dash.
+$(LANG)%_flags.bin: dawg$(LANG)%.stamp
+ifdef NEWDAWG
+	if [ 3 = $$(cat $(LANG)$*_nodesize.bin) ] ; \
+		then perl -e "print pack(\"n\",0x0002)" > $@; echo "flags=2"; \
+		else perl -e "print pack(\"n\",0x0003)" > $@; echo "flags=3"; \
+	fi
+else
+	if [ 3 = $$(cat $(LANG)$*_nodesize.bin) ] ; \
+		then perl -e "print pack(\"n\",0x0001)" > $@; echo "flags=1"; \
+		else echo "ERROR: old format can't handle 4-byte"; exit 1; \
+	fi
+endif
+
+# Extracts the two numbers from the stem (e.g. 2to8), keeps only the
+# lines of the gzipped word list whose length lies in that range, sorts
+# them NUL-terminated and pipes them to ../dict2dawg.pl.  The stamp is
+# touched on a separate recipe line afterwards.
+# NOTE(review): only the stamp is a make target; the files named by the
+# -ob, -sn, -wc and -ns arguments are presumably written by dict2dawg.pl
+# as side effects -- confirm against that script.
+dawg$(LANG)%.stamp: $(LANG)Main.dict.gz ../dict2dawg.pl table.bin ../Makefile.langcommon
+	start=$$(echo $@ | sed -e 's/dawg$(LANG)\([0-9]*\)to[0-9]*.stamp/\1/'); \
+	end=$$(echo $@ | sed -e 's/dawg$(LANG)[0-9]*to\([0-9]*\).stamp/\1/'); \
+	echo $${start} and $$end; \
+	zcat $< | grep "^.\{$${start},$${end}\}$$" | tr '\n' '\0'| \
+		sort -z | ../dict2dawg.pl $(TABLE_ARG) table.bin -b 28000 \
+		-ob dawg$(LANG)$* \
+		-sn $(LANG)StartLoc.bin -k -term 0 -wc $(LANG)$*_wordcount.bin \
+		$(FORCE_4) -ns $(LANG)$*_nodesize.bin
+	touch $@
+
+# The recipe here only prints a blank line; the file itself is named as
+# the -wc argument in the stamp recipe above, so this rule just records
+# the dependency on the stamp.
+$(LANG)%_wordcount.bin: dawg$(LANG)%.stamp
+	@echo
+
+# These goals are commands, not files; declaring them phony keeps a
+# stray file of the same name from disabling them.
+.PHONY: allbins clean_common help test
+
+# the files to export for byod
+allbins:
+	$(MAKE) TARGET_TYPE=PALM byodbins
+	$(MAKE) TARGET_TYPE=FRANK byodbins
+
+# Table file: stdout of ../xloc.pl, with -tn when NEWDAWG is defined
+# and -t otherwise.
+table.bin:  ../xloc.pl
+ifdef NEWDAWG
+	perl -I../ ../xloc.pl -tn > $@
+else
+	perl -I../ ../xloc.pl -t > $@
+endif
+
+# Values file: stdout of ../xloc.pl -v.
+values.bin:  ../xloc.pl
+	perl -I../ ../xloc.pl -v > $@
+
+# Uncompressed copy of a gzipped word list.
+%.dict: %.dict.gz
+	zcat $< > $@
+
+# Removes generated files; the language makefiles hang their own
+# "clean" goal on this one.
+clean_common:
+	rm -f $(LANG)Main.dict *.bin *.pdb *.seb dawg*.stamp *.$(FRANK_EXT) \
+		$(LANG)*.pdb $(LANG)*.seb
+
+help:
+	@echo "make TARGET_TYPE=[FRANK|PALM]"
+
+# Prints the value of LANGUAGE.
+test:
+	@echo $(LANGUAGE)
--- a/xwords4/xwords4/dawg/allchars.pl
+++ b/xwords4/xwords4/dawg/allchars.pl
@ -0,0 +1,7 @@
+#!/usr/bin/perl
+
+use strict;
+
+# Print each code from 1 through 254 as decimal, character and hex.
+foreach my $code ( 1 .. 254 ) {
+    printf( "%d: %s (0x%x)\n", $code, chr($code), $code );
+}
--- a/xwords4/xwords4/dawg/dawg.h
+++ b/xwords4/xwords4/dawg/dawg.h
@ -0,0 +1,47 @@
+/* 
+ * Copyright 1998 by Eric House.  All rights reserved.
+ * fixin@peak.org
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation; either version 2
+ * of the License, or (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+*/
+
+/* Fixed-size header describing a DAWG dictionary. */
+typedef struct dawg_header {
+    unsigned long numWords;
+    unsigned char firstEdgeRecNum;
+    unsigned char charTableRecNum;
+    unsigned char valTableRecNum;
+    unsigned char reserved[3]; // worst case this points to a new resource
+} dawg_header;
+
+/* One edge as stored in the output array: two index bytes plus a
+ * combined letter/flag byte (see the *MASK defines in this header). */
+typedef struct array_edge {
+    unsigned char highByte;
+    unsigned char lowByte;
+    unsigned char bits;
+} array_edge;
+
+/*
+ * The bits field has five bits for the character (0-based rather than
+ * 'a'-based, of course); one bit each indicating whether the edge may
+ * be terminal and whether it's the last edge of a sub-array; and a final
+ * bit that's overflow from the highByte field, allowing indices to be in
+ * the range 0 to (2^17)-1.
+ */
+#define LETTERMASK 0x1f
+#define ACCEPTINGMASK 0x20
+#define LASTEDGEMASK 0x40
+#define LASTBITMASK 0x80
+
+//#define ushort_byte_swap(d) ((unsigned short)(d<<8 | d>>8))
+
--- a/xwords4/xwords4/dawg/dict2DAWG.c
+++ b/xwords4/xwords4/dawg/dict2DAWG.c
@ -0,0 +1,685 @@
+// -*-mode: C; fill-column: 80; compile-command: "make dict2pdb"; -*-
+/*
+ * Copyright 1997 by Eric House.  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation; either version 2
+ * of the License, or (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+  Converts a <CR>-separated list of words, in stdin, to a DAWG written
+  to stdout in PalmOS .pdb file format.  
+
+  Called like this: dict2dawg > dict.pdb <<.
+  car
+  cars
+  cat
+  does
+  dog
+  .
+
+  Records in the database are of 48K length by default, except that
+  the last will likely be smaller and that they always end with the end
+  of a sub-array (so that iteration over a subarray doesn't have to
+  worry about boundaries.)
+
+  Records ought to hold two parallel arrays (but don't yet): first the
+  index array, of shorts, and then the bits array of unsigned chars.
+  Remember that one bit of the bits entry is actually the 17th bit of
+  the index value...
+
+  Ultimately we want to associate xloc-like data with each dictionary so
+  that languages whose relevant letters aren't all in an ascii sequence can
+  be accommodated.  In most cases we'll be passed in a file containing a table
+  to be used for the mapping -- just a text file with one character per line
+  where A might be the 0th line, umlaut-A the first, etc.  But we'll also
+  generate such a table ourselves when not given one, and output it when
+  asked.
+
+  Bugs: It's currently necessary that input to this program be sorted
+  or some data may be lost.
+
+  To do:
+  Make it two parallel arrays.
+  Some sort of hashing on pruning.  */
+
+#include <stdio.h>
+#include <assert.h>
+#include <unistd.h>
+#include <stdlib.h>
+#include <string.h>
+#include <getopt.h>
+
+#include "swap.h"
+
+#define PRE_EDGE_RECORDCOUNT 3
+
+/* #include "pdb.h" */
+#include "dawg.h"
+/* #include "swap.c" */
+
+typedef char boolean;
+#define true 1
+#define false 0
+
+typedef unsigned char Tile;
+
+/* A node of the in-memory word tree built by addToTree(). */
+typedef struct tree_edge {
+    unsigned char letter;       /* letter this node stands for */
+    unsigned long index;        /* 0xFFFF until index_children() assigns one */
+    boolean terminal;           /* set by newNode() from its terminal argument */
+    struct tree_edge* prev;     /* previous sibling, or NULL */
+    struct tree_edge* next;     /* next sibling, or NULL */
+    struct tree_edge* children; /* first child, or NULL */
+} tree_edge;
+
+#define MAXLENGTH 15
+
+
+//////////////////////////////////////////////////////////////////////////////
+// prototypes
+//////////////////////////////////////////////////////////////////////////////
+static void addToTree( unsigned char* buf, short buflen, tree_edge* nodege );
+tree_edge* newNode( unsigned char letter, boolean terminal );
+static void remember( unsigned char* c );
+void readInTables( char* orderTableFile );
+void init_prune_data();
+void prune_tree( tree_edge* edge );
+/* unsigned short byte_swap( unsigned short d ); */
+void write_children( array_edge* mainArray, tree_edge* edge );
+int count_nodes( tree_edge* edge );
+unsigned long index_children( tree_edge* edge, unsigned long firstIndex );
+void write_as_pdb( array_edge* edges, unsigned long edgeCount );
+void usage( char* progName );
+void initTables( void );
+Tile CharToTile( unsigned char ch );
+static short fileSize( char* fileName );
+void write_as_files( array_edge* edges, unsigned long edgeCount,
+		     char* fileNameBase );
+
+unsigned long gWordCount = 0;
+
+//////////////////////////////////////////////////////////////////////////////
+// globals
+//////////////////////////////////////////////////////////////////////////////
+boolean verbose = 0;            /* set by the -v option in main() */
+tree_edge* rootEdge;            /* root of the word tree; created in main() */
+int gNodeCount = 0;             /* incremented by every newNode() call */
+long gNodesCreated;             /* also incremented by newNode(); main() zeroes it after creating the root */
+long gPulled;                   /* running total of node counts added by prune_tree() */
+char gDictName[32];             /* main() sets this to the empty string */
+char* gOrderTableFileName = NULL; /* argument of the -t option */
+/* char* gValueTableFileName = NULL; */
+short gNumUniqueTiles;
+typedef struct OrderResEntry {
+/*      unsigned char count; */
+/*      unsigned char value; */
+    unsigned char ch;
+} OrderResEntry;
+static OrderResEntry gOrderTable[32];
+static signed short gLookupTable[256];
+
+dawg_header gDawgHeader;        /* zeroed with memset() at the start of main() */
+
+//////////////////////////////////////////////////////////////////////////////
+// main
+//////////////////////////////////////////////////////////////////////////////
+/* Reads a word list from stdin, builds and prunes the word tree, and
+ * writes the resulting edge array with write_as_files().
+ *
+ * Options:
+ *   -m <len>   skip words longer than <len> instead of aborting on them
+ *   -n <name>  base name handed to write_as_files() (required)
+ *   -t <file>  order table file handed to readInTables()
+ *   -v         verbose output on stderr
+ *   -h         usage
+ *
+ * Returns 0 on success; exits with status 1 on a word longer than
+ * MAXLENGTH (when -m is not in effect) or when there are too many edges.
+ */
+int main( int argc, char** argv ) {
+    char buf[MAXLENGTH+10];
+    unsigned long edgeCount;
+    long maxWordLen = MAXLENGTH;
+    int got;
+    char* baseName = NULL;
+    array_edge* mainArray = NULL;
+
+    initTables();
+    memset( &gDawgHeader, 0, sizeof(gDawgHeader) );
+
+    gDictName[0] = '\0';
+
+    /* "m:" must be listed here; without it getopt() never returns 'm'
+       and the case below is unreachable. */
+    while ( (got = getopt(argc, argv, "m:t:vhn:")) != EOF ) {
+        switch ( got ) {
+        case 'm':
+            sscanf( optarg, "%ld", &maxWordLen );
+            fprintf( stderr, "maxWordLen set to %ld\n", maxWordLen );
+            break;
+        case 'n':
+            baseName = optarg;
+            break;
+        case 'v':
+            verbose = true;
+            fprintf( stderr, "verbose set\n" );
+            break;
+        case 't':
+            gOrderTableFileName = optarg;
+            break;
+        case 'h':
+        default:
+            usage( argv[0] );
+            break;
+        }
+    }
+
+    if ( gOrderTableFileName != NULL ) {
+        readInTables( gOrderTableFileName );
+    }
+
+    assert( baseName );
+
+    rootEdge = newNode( '\0', 0 );
+    gNodesCreated = 0;
+    gPulled = 0;
+
+    while ( fgets( buf, sizeof(buf), stdin ) ) {
+        char* nl = strchr( buf, '\n' );
+        unsigned char* cr;
+        short wordlen;
+
+        if ( nl ) {
+            *nl = '\0';
+        } else {
+            /* The line did not fit in buf (or is the unterminated last
+               line).  Discard the remainder so that it is not read back
+               as a separate, bogus word on the next iteration. */
+            int ch;
+            do {
+                ch = getc( stdin );
+            } while ( ch != EOF && ch != '\n' );
+        }
+
+        wordlen = strlen( buf );
+
+        if ( wordlen == 0 ) {
+            continue;           /* blank line: not a word, don't count it */
+        }
+
+        if ( (maxWordLen != MAXLENGTH) && (wordlen > maxWordLen) ) {
+            continue;
+        } else if ( wordlen > MAXLENGTH ) {
+            fprintf( stderr, "word %s too long\n", buf );
+            exit(1);
+        }
+
+        // remember that *cr may be 0 *after* the call to remember
+        for ( cr = (unsigned char*)buf; *cr; ++cr ) {
+            remember(cr);
+        }
+
+        addToTree( (unsigned char*)buf, wordlen, rootEdge );
+        ++gWordCount;
+    }
+
+    fprintf( stderr, "done with addToTree (%ld nodes; %lu words)\n",
+             gNodesCreated, gWordCount );
+
+    init_prune_data();
+    prune_tree( rootEdge );
+
+    fprintf( stderr, "done with prune_tree: %ld pulled\n", gPulled );
+
+    edgeCount = index_children( rootEdge, 0 );
+
+    if ( edgeCount >= 0x1FFFF ) {
+        fprintf( stderr, "ERROR: too many edges: %lu (max is %ld)\n",
+                 edgeCount, (long)0x1FFFF );
+        exit( 1 );
+    }
+
+    fprintf( stderr, "done with index_children; edgeCount = %lu\n", edgeCount);
+
+    /* malloc(0) may legitimately return NULL; always ask for at least
+       one entry so that empty input does not trip the assert. */
+    mainArray = (array_edge*)malloc( (edgeCount ? edgeCount : 1)
+                                     * sizeof(array_edge) );
+    assert( mainArray );
+
+    write_children( mainArray, rootEdge );
+    fprintf( stderr, "done with write_children\n" );
+
+    // Now we have a huge array in memory and need to write it to pdb
+    // format.
+    write_as_files( mainArray, edgeCount, baseName );
+
+    return 0;
+} // main
+
+/* Given a node on the tree (not yet converted to a directed graph)
+ * walk down it using letters where they exist and adding them where
+ * they don't.
+ *
+ * The structure we're building here looks like this, for input "CAT"
+ * and "CAR":
+ *         /T
+ *    *-C-A
+ *         \R
+ * That is, words beginning with the same letters share the same initial
+ * branches of the tree.  Thus on entering a given level of recursion
+ * there are these possibilities:
+ * a) There's nothing here: create a new node and recurse on it.
+ * b) We find a node that holds the letter we seek: recurse on it.
+ * c) We reach the end of the list of letters without finding what we
+ * seek: create a new node at the end and recurse on it.
+ * d) We reach a node before which ours should have been found: create a
+ * new node in the right place and recurse on it.
+ */
+/* Insert the buflen letters at buf below node, one tree level per
+ * letter, keeping each sibling list sorted by letter.
+ *
+ * buf     remaining letters of the word
+ * buflen  number of letters left; 0 ends the recursion
+ * node    parent under which the first remaining letter is placed
+ */
+static void addToTree( unsigned char* buf, short buflen, tree_edge* node ) {
+    unsigned char target = *buf;
+    boolean terminal = (buflen == 1);
+    tree_edge* child;
+    tree_edge* prev = NULL;
+    tree_edge* new_node;
+
+    if ( buflen == 0 ) return;
+    assert( buflen > 0 );
+
+    if ( node->children == NULL ) {
+        addToTree( buf+1, buflen-1,
+                   node->children = newNode( target, terminal ) );
+        return;
+    }
+
+    for ( child = node->children; child != NULL; child = child->next ) {
+        if ( child->letter == target ) {
+            /* The node already exists.  If the word ends here, record
+               that: otherwise a word that is a prefix of an earlier one
+               (input not sorted) would be silently lost. */
+            if ( terminal ) {
+                child->terminal = terminal;
+            }
+            addToTree( buf+1, buflen-1, child );
+            return;
+        } else if ( child->letter > target ) { // it's not in the tree yet.
+            new_node = newNode( target, terminal );
+            new_node->next = child;
+            new_node->prev = child->prev;
+            if ( child->prev ) {
+                child->prev->next = new_node;
+            } else { // it's the first node!
+                node->children = new_node;
+            }
+            child->prev = new_node;
+
+            addToTree( buf+1, buflen-1, new_node );
+            return;
+        }
+        prev = child;
+    }
+
+    /* Every sibling sorts before target: append at the end of the list. */
+    assert( prev != NULL );
+    new_node = newNode( target, terminal );
+    prev->next = new_node;
+    new_node->prev = prev;
+    addToTree( buf+1, buflen-1, new_node );
+    return;
+}
+
+/* Allocate an unlinked tree node for the given letter.  The index
+ * starts out as 0xFFFF; both node counters are bumped.  Aborts via
+ * assert() if the allocation fails.
+ */
+tree_edge* newNode( unsigned char letter, boolean terminal ) {
+    tree_edge* node = (tree_edge*)malloc( sizeof(*node) );
+    assert( node );
+
+    node->letter = letter;
+    node->terminal = terminal;
+    node->index = 0xFFFF;
+    node->prev = NULL;
+    node->next = NULL;
+    node->children = NULL;
+
+    ++gNodesCreated;
+    ++gNodeCount;
+    return node;
+}
+
+//////////////////////////////////////////////////////////////////////////////
+// prune_tree (and helpers)
+//////////////////////////////////////////////////////////////////////////////
+/* Returns true when node1 and node2 are the same pointer, or when they
+ * agree in letter and terminal flag and their child lists and following
+ * sibling lists compare equal pairwise (recursively); false otherwise.
+ */
+boolean sameStructure( tree_edge* node1, tree_edge* node2 ) {
+    // simple cases first.
+    if ( node1 == node2 ) return true;
+    else if ( node1 == NULL || node2 == NULL ) return false;
+    else if ( node1->letter != node2->letter ) return false;
+    else if ( node1->terminal != node2->terminal ) return false;
+    //else if ( count_nodes( node1 ) != count_nodes( node2 ) ) return false;
+    else {
+	tree_edge* children1;
+	tree_edge* children2;
+	/* Walk both child lists in step.  If only one side is NULL the
+	   recursive call returns false, so the ->next steps below are
+	   only ever taken on non-NULL pointers. */
+	for ( children1 = node1->children, children2 = node2->children;
+	      children1 || children2;
+	      children1 = children1->next, children2 = children2->next ) {
+	    if ( !sameStructure( children1, children2 ) )
+		return false;
+	}
+	/* Same walk over the siblings that follow each node. */
+	for ( children1 = node1->next, children2 = node2->next;
+	      children1 || children2;
+	      children1 = children1->next, children2 = children2->next ) {
+	    if ( !sameStructure( children1, children2 ) )
+		return false;
+	}
+	/* The loop above only finishes once both pointers are NULL. */
+	return (children1 == NULL) && (children2 == NULL);
+    }
+}
+
+/* Entry in one bucket of the table of nodes already seen by visited(). */
+typedef struct visited_edge {
+    tree_edge* theEdge;
+    struct visited_edge* next;
+} visited_edge;
+
+/* Buckets indexed by a node's letter (an unsigned char, hence 256). */
+static visited_edge* visitedEdges[256];
+
+/* Empty every bucket.  All 256 slots are cleared, not just the first
+ * 26, because visited() indexes the table with the raw letter value.
+ */
+void init_prune_data() {
+    int i;
+    int nBuckets = (int)(sizeof(visitedEdges) / sizeof(visitedEdges[0]));
+    for ( i = 0; i < nBuckets; ++i ) {
+        visitedEdges[i] = NULL;
+    }
+}
+
+/* Look node up in the bucket selected by its letter.  If a previously
+ * recorded node has the same structure (per sameStructure()), that
+ * earlier node is returned; otherwise node is recorded in the bucket
+ * and returned itself.  Aborts via assert() if an allocation fails.
+ */
+tree_edge* visited( tree_edge* node ) {
+    short hash = node->letter;// - 'a';
+    //assert( hash >=0 && hash < 26 );
+    if ( visitedEdges[hash] == NULL ) {
+	/* first node seen for this letter: start the bucket with it */
+	visitedEdges[hash] = (visited_edge*)malloc(sizeof(visited_edge));
+	assert( visitedEdges[hash] );
+	visitedEdges[hash]->theEdge = node;
+	visitedEdges[hash]->next = NULL;
+	return node;
+    } else {
+	/* note: this local deliberately or not shadows the function name */
+	visited_edge* visited;
+	for ( visited = visitedEdges[hash]; visited; 
+	      visited = visited->next ) {
+	    if ( verbose ) {
+		fprintf( stderr, "looking at %c and %c\n",
+			 node->letter, visited->theEdge->letter );
+	    }
+	    if ( sameStructure( node, visited->theEdge ) ) {
+		if ( verbose ) {
+		    fprintf( stderr, "pruning tree beginning with %c\n",
+			     node->letter );
+		}
+		return visited->theEdge;
+	    }
+	}
+	// didn't find it.  Insert new entry at head of list.
+	visited = (visited_edge*)malloc(sizeof(visited_edge));
+	assert( visited );
+	visited->theEdge = node;
+	visited->next = visitedEdges[hash];
+	visitedEdges[hash] = visited;
+	return node;
+    }
+} // visited
+
+/* Count the nodes in the sibling list starting at edge, together with
+ * all of their descendants.  Returns 0 for a NULL edge.
+ *
+ * The accumulator is an int to match the return type; the former short
+ * overflowed once a subtree held more than 32767 nodes.
+ */
+int count_nodes( tree_edge* edge ) {
+    int result = 0;
+    while ( edge ) {
+        result += count_nodes( edge->children );
+        ++result;
+        edge = edge->next;
+    }
+    return result;
+}
+
+/* Walk the tree.  Starting at the lowest points, lookup each node to see
+ * if an equivalent one has already been visited.  If so, replace it with
+ * (a ptr to) the first one seen.
+ */
+void prune_tree( tree_edge* edge ) {
+    tree_edge* child = edge->children;
+    tree_edge* tmp;
+
+    /* nothing below this edge, so nothing to share */
+    if ( child == NULL ) {
+        return;
+    }
+
+    /* Prune bottom-up: handle everything below each child first. */
+    for ( ; child != NULL; child = child->next ) {
+        prune_tree( child );
+    }
+
+    /* If an equivalent child list was recorded earlier, point at that one
+       instead.  The replaced list is not freed here. */
+    tmp = visited( edge->children );
+    if ( tmp != edge->children ) {
+        /* int, like count_nodes()'s return type, so large subtrees are
+           not truncated when added to gPulled */
+        int pulled = count_nodes( edge->children );
+        gPulled += pulled;
+        edge->children = tmp;
+    }
+}
+
+//////////////////////////////////////////////////////////////////////////////
+// write_edge (and helpers)
+//////////////////////////////////////////////////////////////////////////////
+
+/* Assign array indices to the edges below edge.
+ *
+ * All direct children that still carry the value 0xFFFF in their index
+ * field (presumably the "not yet assigned" marker set at creation --
+ * confirm against the code that builds tree_edge) get consecutive indices
+ * starting at firstIndex, so each sibling list ends up contiguous.  Only
+ * then does the walk descend into each child.
+ *
+ * Returns the next unused index.
+ */
+unsigned long index_children( tree_edge* edge, unsigned long firstIndex ) {
+    tree_edge* kid;
+
+    /* first pass: number this level */
+    kid = edge->children;
+    while ( kid != NULL ) {
+        if ( kid->index == 0xFFFF ) {
+            kid->index = firstIndex;
+            ++firstIndex;
+        }
+        kid = kid->next;
+    }
+
+    /* second pass: number everything below each child */
+    kid = edge->children;
+    while ( kid != NULL ) {
+        firstIndex = index_children( kid, firstIndex );
+        kid = kid->next;
+    }
+
+    return firstIndex;
+}
+
+/* Encode one tree edge into its slot (mainArray[child->index]).
+ *
+ * The index of the edge's first child (0 when it has none) is split into
+ * lowByte, highByte and, for bit 16, the LASTBITMASK flag.  The bits byte
+ * also carries the tile value of the letter, ACCEPTINGMASK for terminal
+ * edges and LASTEDGEMASK for the last edge of a sibling list.  A NULL
+ * child is ignored.
+ */
+void write_child( array_edge* mainArray, tree_edge* child ) {
+    array_edge* slot;
+    unsigned long firstKid = 0;
+    unsigned char flags;
+
+    if ( child == NULL ) {
+        return;
+    }
+
+    if ( child->children != NULL ) {
+        firstKid = child->children->index;
+    }
+    assert( firstKid <= 0x0001FFFF );
+
+    flags = CharToTile(child->letter) & LETTERMASK;
+    if ( (firstKid & 0x00010000) != 0 ) {
+        flags |= LASTBITMASK;      /* 17th bit of the child index */
+    }
+    if ( child->terminal ) {
+        flags |= ACCEPTINGMASK;
+    }
+    if ( child->next == NULL ) {
+        flags |= LASTEDGEMASK;
+    }
+
+    slot = &mainArray[child->index];
+    slot->lowByte = firstKid & 0x000000FF;
+    slot->highByte = (firstKid>>8) & 0x000000FF;
+    slot->bits = flags;
+}
+
+/* Write every edge below edge into mainArray: each child is encoded with
+ * write_child() and then its own descendants are written recursively.
+ */
+void write_children( array_edge* mainArray, tree_edge* edge ) {
+    tree_edge* kid = edge->children;
+    while ( kid != NULL ) {
+        write_child( mainArray, kid );
+        write_children( mainArray, kid );
+        kid = kid->next;
+    }
+}
+
+//////////////////////////////////////////////////////////////////////////////
+// write_as_pdb and helpers
+//////////////////////////////////////////////////////////////////////////////
+
+/* Write count edges, starting with edges[startCount], to stdout in their
+ * in-memory array_edge layout.
+ */
+void write_pdb_record_data( array_edge* edges, unsigned long startCount,
+                            unsigned long count ) {
+    fwrite( &edges[startCount], sizeof(array_edge), count, stdout );
+}
+
+// I *think* that the upper bound on this is 0xFFFF/edgesize, minus enough
+// room that the edges out to the end of the subarray in which the line
+// falls can be accommodated -- which I guess is about 32-1-1 (minus one
+// because blanks take up one of the 32 slots though they don't appear in
+// DAWGs, and minus another because the boundary must appear after at least
+// the first or we just leave it there.)
+
+/* Number of edges write_as_files() aims to put in each output file before
+ * extending to the end of the current subarray. */
+#define EDGES_PER_RECORD 0x3FFF
+/* Never taken while the unconditional definition above is present. */
+#ifndef EDGES_PER_RECORD
+# define EDGES_PER_RECORD 0x00005528
+#endif
+
+/* Write as binary files segmented appropriately in case the target is PalmOS or
+ * other platform with restricted-length databases.
+ */
+/* Splits the edge array into files named <fileNameBase>_<n>.bin.
+ *
+ * Each file holds about EDGES_PER_RECORD edges, extended forward so that it
+ * ends on an edge with LASTEDGEMASK set; a sibling list is therefore never
+ * split across files.  Progress and a final summary go to stderr.  The
+ * program exits with an error if a file cannot be created or written.
+ *
+ * edges         array of edgeCount encoded edges
+ * edgeCount     number of entries in edges; nothing is written when 0
+ * fileNameBase  prefix for the generated file names
+ */
+void write_as_files( array_edge* edges, unsigned long edgeCount,
+                     char* fileNameBase ) {
+    unsigned long firstUnhousedEdge = 0;
+    boolean exitNext = false;
+    short fileNum;
+
+    if ( edgeCount == 0 ) {
+        /* edgeCount - 1 below would wrap around */
+        fprintf( stderr, "no edges to write\n" );
+        return;
+    }
+
+    for ( fileNum = 0; !exitNext; ++fileNum ) {
+        unsigned long lastEdge;
+        unsigned long numEdgesThisFile;
+        char buf[FILENAME_MAX];
+        FILE* dawgOutF;
+        int len;
+
+        /* from the first edge not yet in a file, go forward
+           EDGES_PER_RECORD edges, and then march forward further until the
+           current subarray is finished. */
+        lastEdge = firstUnhousedEdge + EDGES_PER_RECORD - 1;
+        if ( lastEdge + 1 >= edgeCount ) {
+            lastEdge = edgeCount - 1;
+            assert( (edges[lastEdge].bits & LASTEDGEMASK) );
+        }
+        /* bounded so that a malformed array cannot walk us off the end */
+        while ( lastEdge + 1 < edgeCount
+                && (edges[lastEdge].bits & LASTEDGEMASK) == 0 ) {
+            ++lastEdge;
+        }
+        if ( lastEdge + 1 >= edgeCount ) {
+            /* Everything is housed once this file is written.  Testing
+               after the march avoids a trailing empty file when the march
+               itself reaches the final edge. */
+            exitNext = true;
+        }
+
+        numEdgesThisFile = lastEdge - firstUnhousedEdge + 1;
+
+        len = snprintf( buf, sizeof(buf), "%s_%d.bin", fileNameBase,
+                        fileNum );
+        if ( len < 0 || (size_t)len >= sizeof(buf) ) {
+            fprintf( stderr, "file name too long for base %s\n",
+                     fileNameBase );
+            exit( 1 );
+        }
+
+        dawgOutF = fopen( buf, "wb" );
+        if ( dawgOutF == NULL ) {
+            fprintf( stderr, "unable to open %s for writing\n", buf );
+            exit( 1 );
+        }
+        if ( fwrite( &edges[firstUnhousedEdge], sizeof(array_edge),
+                     numEdgesThisFile, dawgOutF ) != numEdgesThisFile ) {
+            fprintf( stderr, "error writing to %s\n", buf );
+            exit( 1 );
+        }
+        fclose( dawgOutF );
+
+        fprintf( stderr, "wrote edges from %lu to %lu to file %s\n",
+                 firstUnhousedEdge, firstUnhousedEdge+numEdgesThisFile, buf );
+
+        firstUnhousedEdge = lastEdge + 1;
+    }
+
+    fprintf( stderr, "%lu edges yielded %d records of up to %ld edges each\n",
+             edgeCount, fileNum, (long)EDGES_PER_RECORD );
+
+} // write_as_files
+
+/******************************************************************************
+ * Read in a file of letters, one per line, whose position in the file will
+ * determine the translation from char to Tile when the dawg is written out.
+ * If no such file is passed in, we'll create our own based on the ascii order
+ * of those chars we see in processing the dictionary.  If one is passed in,
+ * we'll use it, but we'll fail if we encounter a letter not on the list.
+ *
+ * Also, for faster lookup of Tile values we maintain a second table mapping
+ * chars to tiles.  'A' might map to 1, A-umlaut to 2, etc., if 0 is the blank
+ * char
+ *****************************************************************************/
+/* Put both translation tables into their "nothing known yet" state:
+ * every byte of the 256 gLookupTable entries is set to 0xFF and the first
+ * 32 gOrderTable entries are zeroed.
+ */
+void initTables() {
+    memset( gLookupTable, -1, 256*sizeof(*gLookupTable) );
+    memset( gOrderTable, 0, 32*sizeof(*gOrderTable) );
+} // initTables
+
+/* Fill gOrderTable and gLookupTable from orderTableFile.
+ *
+ * The file is read with the pattern "%c\n": one character per entry, with
+ * following whitespace skipped.  The n-th character read is stored in
+ * gOrderTable[n].ch and gLookupTable[character] is set to n.
+ * gNumUniqueTiles ends up as the number of characters read.
+ *
+ * At most 32 characters are accepted, matching the 32 entries that
+ * initTables() clears.
+ */
+void readInTables( char* orderTableFile ) {
+    unsigned char ch = 0;
+    FILE* f = fopen( orderTableFile, "rb" );
+    if ( f == NULL ) {
+        /* checked explicitly so the test survives builds with NDEBUG */
+        fprintf( stderr, "unable to open %s\n", orderTableFile );
+        exit( 1 );
+    }
+
+    gNumUniqueTiles = 0;
+    while ( fscanf( f, "%c\n", &ch ) != EOF ) {
+        /* strictly less than: index 32 would be past the last entry */
+        assert( gNumUniqueTiles < 32 );
+        assert( ch < 255 );
+        /* the slot must not have been filled already */
+        assert( gOrderTable[gNumUniqueTiles].ch == 0 );
+        gOrderTable[gNumUniqueTiles].ch = ch;
+        gLookupTable[ch] = gNumUniqueTiles;
+        ++gNumUniqueTiles;
+    }
+    fclose( f );
+
+} // readInTables
+
+/******************************************************************************
+ *
+ *****************************************************************************/
+/* Replace the character at *c, in place, with the value gLookupTable holds
+ * for it.  A character whose entry is -1 is reported on stderr and the
+ * program exits with status 1.
+ */
+static void remember( unsigned char* c ) {
+    unsigned char original = *c;
+    signed short tile;
+
+    assert( gOrderTableFileName != NULL );
+
+    tile = gLookupTable[original];
+    if ( tile == -1 ) {
+        fprintf( stderr, "ERROR: unexpected character '%c' (0x%x)\n",
+                 original, (short)original );
+        exit(1);
+    }
+
+    assert( tile < 32 );
+    *c = tile;
+} // remember
+
+/******************************************************************************
+ *
+ *****************************************************************************/
+/* Convert a letter value to a Tile.  Currently the value is returned
+ * unchanged; the table lookup below is disabled. */
+Tile CharToTile( unsigned char ch ) {
+    return ch;
+    /* disabled: translation through gLookupTable */
+/*      assert( gLookupTable[ch] < 32 ); */
+/*      return (Tile)gLookupTable[ch]; */
+} // CharToTile
+
+/* Return the size in bytes of the named file.
+ *
+ * The return type is short, so only sizes up to 0x7FFF can be reported.
+ * Instead of silently returning a truncated value for larger files, the
+ * program prints an error and exits, as it already does when fseek fails.
+ * It also exits if the file cannot be opened or ftell fails.
+ */
+static short fileSize( char* fileName ) {
+    long size;
+    FILE* f = fopen( fileName, "rb" );
+    if ( f == NULL ) {
+        fprintf( stderr, "unable to open %s\n", fileName );
+        exit(1);
+    }
+    if ( fseek( f, 0L, SEEK_END ) != 0 ) {
+        fprintf( stderr, "error from fseek\n" );
+        exit(1);
+    }
+    size = ftell( f );
+    fclose( f );
+    if ( size < 0 ) {
+        fprintf( stderr, "error from ftell\n" );
+        exit(1);
+    }
+    if ( size > 0x7FFF ) {
+        fprintf( stderr, "file %s too large (%ld bytes)\n", fileName, size );
+        exit(1);
+    }
+    return (short)size;
+} // fileSize
+
+//////////////////////////////////////////////////////////////////////////////
+// usage
+//////////////////////////////////////////////////////////////////////////////
+/* Print the command-line summary for progName on stderr and exit with
+ * status 1.  This function does not return.
+ */
+void usage( char* progName ) {
+    static const char* const text =
+        "USAGE: %s\n"
+        "   [-m<maxLength>]\n"
+        "   [-v] (verbose) \n"
+/* 	     "   [-t char-order-table-file] \n" */
+/* 	     "   [-n <pdbName>] \n" */
+        "   <word_list >dawg_file\n";
+
+    fprintf( stderr, text, progName );
+    exit( 1 );
+}
+
--- a/xwords4/xwords4/dawg/dict2dawg.pl
+++ b/xwords4/xwords4/dawg/dict2dawg.pl
@ -0,0 +1,798 @@
+#!/usr/bin/perl
+
+##############################################################################
+# adapted from C++ code Copyright (C) 2000 Falk Hueffner
+# This version Copyright (C) 2002 Eric House (fixin@peak.org)
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful, but
+# WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+# General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
+# USA
+##############################################################################
+
+# inputs: 0. Name of file mapping letters to 0..31 values.  In English
+# case just contains A..Z.  This will be used to translate the tries
+# on output.
+#         1. Max number of bytes per binary output file.
+#
+#         2. Basename of binary files for output.
+
+#         3. Name of file to which to write the number of the
+# startNode, since I'm not rewriting a bunch of code to expect Falk's
+# '*' node at the start.
+#
+
+#         In STDIN, the text file to be compressed.  It absolutely
+# must be sorted.  The sort doesn't have to follow the order in the
+# map file, however.
+
+# This is meant eventually to be runnable as part of a cgi system for
+# letting users generate Crosswords dicts online.
+
+
+
+use strict;
+use POSIX;
+
+# State shared by the subs below; most of it is set from the command line
+# in parseARGV().
+my $gFirstDiff;                 # index of first letter differing from previous word
+my @gCurrentWord;
+my $gCurrentWord;               # save so can check for sortedness
+my $gDone = 0;
+my @gInputStrings;
+my $gNeedsSort = 1;             # read from cmd line eventually
+my @gNodes;                       # final array of nodes
+my $gNBytesPerOutfile = 0xFFFFFFFF;
+my $gTableFile;
+my $gOutFileBase;
+my $gStartNodeOut;
+my $gInFileName;
+my $gKillIfMissing = 1;
+# Word terminator.  Must be exactly one character because it is compared
+# with single characters returned by getc; the two-character string '/n'
+# could never match.
+my $gTermChar = "\n";
+my $gDumpText = 0;              # dump the dict as text after?
+my $gCountFile;
+my $gBytesPerNodeFile;          # where to write whether node size 3 or 4
+my $gWordCount = 0;
+my %gTableHash;
+my @gRevMap;
+my $debug = 0;
+my %gSubsHash;
+my $gForceFour = 0;             # use four bytes regardless of need?
+my $gNBytesPerNode;
+my $gUseUnicode;
+
+main();
+
+exit;
+
+##############################################################################
+
+# Program entry point: parse the command line, read and sort the word
+# list, build the node array and write whichever outputs were requested.
+# Dies with a message naming the file if any file cannot be opened.
+sub main() {
+
+    if ( !parseARGV() ) {
+        usage();
+        exit();
+    }
+
+    makeTableHash();
+
+    my $infile;
+
+    if ( $gInFileName ) {
+        open( $infile, '<', $gInFileName )
+            or die "unable to open input file $gInFileName: $!\n";
+    } else {
+        $infile = \*STDIN;
+    }
+
+    @gInputStrings = parseAndSort( $infile );
+    if ( $gInFileName ) {
+        close $infile;
+    }
+
+    # Do I need this stupid thing?  Better to move the first row to
+    # the front of the array and patch everything else.  Or fix the
+    # non-palm dictionary format to include the offset of the first
+    # node.
+
+    my $dummyNode = 0xFFFFFFFF;
+    @gNodes = ( $dummyNode );
+
+    readNextWord();
+
+    my $firstRootChildOffset = buildNode(0);
+
+    moveTopToFront( \$firstRootChildOffset );
+
+    if ( $gStartNodeOut ) {
+        writeOutStartNode( $gStartNodeOut, $firstRootChildOffset );
+    }
+
+    print STDERR "\n... dumping table ...\n" if $debug;
+    printNodes( \@gNodes, "done with main" ) if $debug;
+
+    # write out the number of words if requested
+    if ( $gCountFile ) {
+        open( my $countFH, '>', $gCountFile )
+            or die "unable to open count file $gCountFile: $!\n";
+        binmode( $countFH );    # the count is packed binary data
+        print $countFH pack( "N", $gWordCount );
+        close( $countFH );
+        print STDERR "wrote out: got $gWordCount words\n";
+    }
+
+    if ( $gOutFileBase ) {
+        emitNodes( $gNBytesPerOutfile, $gOutFileBase );
+    }
+
+    if ( $gDumpText && @gNodes > 0 ) {
+        printOneLevel( $firstRootChildOffset, "" );
+    }
+
+    # $gNBytesPerNode is only set by emitNodes(), i.e. when -ob was given
+    if ( defined $gNBytesPerNode ) {
+        if ( $gBytesPerNodeFile ) {
+            open( my $sizeFH, '>', $gBytesPerNodeFile )
+                or die "unable to open $gBytesPerNodeFile: $!\n";
+            print $sizeFH $gNBytesPerNode;
+            close( $sizeFH );
+        }
+        print STDERR "Used $gNBytesPerNode per node.\n";
+    }
+} # main
+
+# We now have an array of nodes with the last subarray being the
+# logical top of the tree.  Move them to the start, fixing all fco
+# refs, so that legacy code like Palm can assume top==0.
+#
+# Note: It'd probably be a bit faster to integrate this with emitNodes
+# -- unless I need to have an in-memory list that can be used for
+# lookups.  But that's best for debugging, so keep it this way for now.
+#
+# Also Note: the first node is a dummy that can and should be tossed
+# now.
+
+# Takes a reference to the offset of the root subarray.  Everything from
+# that offset to the end of @gNodes is moved to the front, the dummy first
+# node is dropped, every non-zero first-child offset is adjusted to match,
+# and the referenced offset is set to 0.
+sub moveTopToFront($) {
+    my ( $firstRef ) = @_;
+
+    my $rootStart = ${$firstRef};
+    ${$firstRef} = 0;           # the root subarray ends up at the front
+
+    my $haveRoot = $rootStart > 0;
+    my @rootSub;
+    if ( $haveRoot ) {
+        # cut the root subarray off the end
+        @rootSub = splice( @gNodes, $rootStart );
+    } elsif ( $gWordCount != 0 ) {
+        die "there should be no words!!";
+    }
+
+    # drop the dummy node at index 0
+    shift @gNodes;
+
+    # Surviving nodes move down by one (the dummy) and up by the length
+    # of the root subarray.
+    my $diff = 0;
+    if ( $haveRoot ) {
+        $diff = @rootSub - 1;
+        die "something wrong with len\n" if $diff < 0;
+    }
+
+    unshift @gNodes, @rootSub;
+
+    # Only additions are needed: nothing referred to the root subarray.
+    foreach my $node ( @gNodes ) {
+        my $fco = TrieNodeGetFirstChildOffset( $node );
+        next if $fco == 0;      # 0 means NONE, not 0th!!
+        TrieNodeSetFirstChildOffset( \$node, $fco + $diff );
+    }
+} # moveTopToFront
+
+
+# Build the subarray of edges for position $depth of the current word and
+# of all following words that share the same first $depth letters, calling
+# itself for the next position of each.  Words are consumed from the input
+# through readNextWord() as the recursion proceeds.
+#
+# Returns the offset in @gNodes of the resulting subarray (as reported by
+# addNodes()), or 0 when there is nothing below this position.
+sub buildNode {
+    my ( $depth ) = @_;
+
+    if ( @gCurrentWord == $depth ) {
+        # End of word reached. If the next word isn't a continuation
+        # of the current one, then we've reached the bottom of the
+        # recursion tree.
+        readNextWord();
+        if ($gFirstDiff < $depth || $gDone) {
+            return 0;
+        }
+    }
+
+    my @newedges;
+
+    do {
+        my $letter = $gCurrentWord[$depth];
+        my $isTerminal = @gCurrentWord - 1 == $depth ? 1:0;
+
+        # the recursive call may advance to the next word(s)
+        my $nodeOffset = buildNode($depth+1);
+        my $newNode = MakeTrieNode($letter, $isTerminal, $nodeOffset);
+        push( @newedges, $newNode );
+
+    } while ( ($gFirstDiff == $depth) && !$gDone);
+
+    # Mark the end of the sibling list.  The loop above ran at least once,
+    # so there is always a last element.
+    TrieNodeSetIsLastSibling( \$newedges[-1], 1 );
+
+    return addNodes( \@newedges );
+} # buildNode
+
+# Return the offset in @gNodes of a subarray equal to the one referenced
+# by the argument.  An already registered copy is reused; otherwise the
+# new edges are appended to @gNodes and registered for later reuse.
+sub addNodes {
+    my ( $newedgesR ) = @_;
+
+    my $existing = findSubArray( $newedgesR );
+    if ( $existing >= 0 ) {
+        die "0 is an invalid match!!!" if $existing == 0;
+        return $existing;
+    }
+
+    # not seen before: the new subarray starts at the current end
+    my $start = @gNodes;
+
+    if ( $debug ) {
+        print STDERR "adding...\n";
+        printNodes( $newedgesR );
+    }
+
+    push @gNodes, @{$newedgesR};
+    registerSubArray( $newedgesR, $start );
+
+    return $start;
+} # addNodes
+
+# Debugging aid: print the index and the decoded fields of one node to
+# STDERR.
+sub printNode {
+    my ( $index, $node ) = @_;
+
+    my @fields = ( TrieNodeGetLetter($node),
+                   TrieNodeGetIsTerminal($node),
+                   TrieNodeGetIsLastSibling($node),
+                   TrieNodeGetFirstChildOffset($node) );
+
+    print STDERR "[$index] ";
+    printf( STDERR
+            "letter=%d; isTerminal=%d; isLastSib=%d; fco=%d;\n",
+            @fields );
+} # printNode
+
+# Debugging aid: print every node of the referenced array with its index.
+# The second argument is a label for the dump; it is currently not
+# printed.
+sub printNodes {
+    my ( $nodesR, $name ) = @_;
+
+    my $index = 0;
+    foreach my $node ( @{$nodesR} ) {
+        printNode( $index, $node );
+        ++$index;
+    }
+
+}
+
+
+# Hashing.  We'll keep a hash of offsets into the existing nodes
+# array, and as the key use a string that represents the entire sub
+# array.  Since the key is what we're matching for, there should never
+# be more than one value per hash and so we don't need buckets.
+# Return -1 if there's no match.
+
+# Build the hash key for a subarray of nodes.  The node values are joined
+# with a separator: without one, different subarrays could produce the
+# same string (12,3 and 1,23 would both give "123") and be wrongly treated
+# as identical.
+sub _subArrayKey {
+    my ( $edgesR ) = @_;
+    return join( ',', @{$edgesR} );
+}
+
+# Return the offset at which an identical subarray was registered, or -1
+# if there is none.
+sub findSubArray {
+    my ( $newedgesR ) = @_;
+
+    my $key = _subArrayKey( $newedgesR );
+
+    if ( exists( $gSubsHash{$key} ) ) {
+        return $gSubsHash{$key};
+    } else {
+        return -1;
+    }
+} # findSubArray
+
+# Add to the hash: remember that the given subarray lives at $nodeLoc.
+# Dies if an identical subarray is already registered.
+sub registerSubArray {
+    my ( $edgesR, $nodeLoc ) = @_;
+
+    my $key = _subArrayKey( $edgesR );
+
+    if ( exists $gSubsHash{$key} ) {
+        die "entry for key shouldn't exist!!";
+    } else {
+        $gSubsHash{$key} = $nodeLoc;
+    }
+
+} # registerSubArray
+
+# Advance to the next input word.
+#
+# Sets @gCurrentWord to the next word (empty once the input is exhausted),
+# $gDone when there is no more input, and $gFirstDiff to the number of
+# leading letters the new word shares with the previous one.  Dies if the
+# new word does not sort after the previous one.
+sub readNextWord() {
+    my @word;
+
+    if ( !$gDone ) {
+        $gDone = @gInputStrings == 0;
+        if ( !$gDone ) {
+            @word = @{shift @gInputStrings};
+        } else {
+            print STDERR "gDone set to true\n" if $debug;
+        }
+
+        print STDERR "got word: ", join(',',@word), "\n" if $debug;
+    }
+
+    # only positions present in both words can match
+    my $len = scalar(@word);
+    if ( @gCurrentWord < $len ) {
+        $len = scalar(@gCurrentWord);
+    }
+
+    # Check the bound before looking at the elements so that nothing past
+    # the end of either word is ever compared.
+    my $numCommonLetters = 0;
+    while ( $numCommonLetters < $len
+            && $gCurrentWord[$numCommonLetters] eq $word[$numCommonLetters] ) {
+        ++$numCommonLetters;
+    }
+
+    $gFirstDiff = $numCommonLetters;
+    die "words ", join(",",@gCurrentWord), " and ", join(",", @word), " out of order" if #$debug && 
+        @gCurrentWord > 0 && @word > 0
+        && !firstBeforeSecond( \@gCurrentWord, \@word );
+    @gCurrentWord = @word;
+} # readNextWord
+
+# Given references to two lists of numbers, return true if the first sorts
+# strictly before the second: elements are compared numerically position
+# by position, and a list that is a proper prefix of the other sorts
+# first.  Dies if the two lists are identical.
+sub firstBeforeSecond {
+    my ( $firstR, $secondR ) = @_;
+
+    my $lenFirst = @{$firstR};
+    my $lenSecond = @{$secondR};
+
+    my $i = 0;
+    while ( 1 ) {
+        if ( $i == $lenFirst ) {
+            # first list used up: it is a prefix of the second, or equal
+            die "duplicate!!!" if $i == $lenSecond;
+            return 1;
+        }
+        # second list used up first: it is a proper prefix of the first
+        return 0 if $i == $lenSecond;
+
+        my $order = $firstR->[$i] <=> $secondR->[$i];
+        return $order < 0 if $order != 0;
+
+        ++$i;
+    }
+} # firstBeforeSecond
+
+# passed to sort.  Should remain unprototyped for effeciency's sake
+
+# Comparison routine for sort: $a and $b are references to lists of
+# numbers.  Lists are ordered by the first position at which they differ
+# numerically; if one is a prefix of the other, the shorter sorts first.
+sub cmpWords {
+
+    my $lenA = @{$a};
+    my $lenB = @{$b};
+    my $shared = $lenA < $lenB ? $lenA : $lenB;
+
+    foreach my $i ( 0 .. $shared - 1 ) {
+        my $order = $a->[$i] <=> $b->[$i];
+        return $order if $order != 0;
+    }
+
+    # identical over the shared length, so the longer one is greater
+    return $lenA <=> $lenB;
+} # cmpWords
+
+# Read words from the given filehandle, one character at a time.
+#
+# Each character found in %gTableHash is translated to its tile value; the
+# character $gTermChar ends a word.  A character that is in neither dies
+# when $gKillIfMissing is set and otherwise causes the whole word to be
+# dropped.  $gWordCount is incremented for each word kept.
+#
+# Returns a list of array refs, one per word, each holding the tile values
+# of that word; the list is sorted with cmpWords when $gNeedsSort is set.
+#
+# NOTE(review): characters after the last terminator are discarded, so a
+# final word without a terminator is lost -- confirm that is intended.
+#
+# The former empty prototype "()" was dropped: the sub takes one argument.
+sub parseAndSort {
+    my ( $infile ) = @_;
+
+    my @wordlist;
+    my @word;
+
+  WORDLOOP:
+    for ( ; ; ) {
+
+        my $dropWord = 0;
+        @word = ();
+
+        # for each byte
+        for ( ; ; ) {
+            my $byt = getc($infile);
+
+            if ( !defined $byt ) {
+                # end of input
+                last WORDLOOP;
+            } elsif ( $byt eq $gTermChar ) {
+                if ( !$dropWord ) {
+                    push @wordlist, [ @word ];
+                    ++$gWordCount;
+                }
+                next WORDLOOP;
+            } elsif ( exists( $gTableHash{$byt} ) ) {
+                if ( !$dropWord ) {
+                    push @word, $gTableHash{$byt};
+                    die "word too long" if @word > 15;
+                }
+            } elsif ($gKillIfMissing) {
+                # report the character code; "$byt+0" only ever gave 0
+                die "char $byt (", ord($byt), ") not in map file $gTableFile\n";
+            } else {
+                $dropWord = 1;
+                @word = ();     # lose anything we already have
+            }
+        }
+    }
+
+    if ( $gNeedsSort && ($gWordCount > 0)  ) {
+        @wordlist = sort cmpWords @wordlist;
+    }
+
+    print STDERR "length of list is ", @wordlist + 0, ".\n" if $debug;
+
+    return @wordlist;
+} # parseAndSort
+
+# Print binary representation of trie array.  This isn't used yet, but
+# eventually it'll want to dump to multiple files appropriate for Palm
+# that can be catenated together on other platforms.  There'll need to
+# be a file giving the offset of the first node too.  Also, might want
+# to move to 4-byte representation when the input can't otherwise be
+# handled.
+
+# Write every node in @gNodes to STDOUT, each packed with the "I"
+# template (a native unsigned integer).
+sub dumpNodes {
+
+    foreach my $node ( @gNodes ) {
+        print STDOUT pack( "I", $node );
+    }
+}
+
+##############################################################################
+# Little node-field setters and getters to hide what bits represent
+# what.
+##############################################################################
+
+# Set (true) or clear (false) the is-terminal flag, bit 31, of the node
+# referenced by the first argument.
+sub TrieNodeSetIsTerminal {
+    my ( $nodeR, $isTerminal ) = @_;
+
+    my $flag = 1 << 31;
+    ${$nodeR} = $isTerminal ? ( ${$nodeR} | $flag )
+                            : ( ${$nodeR} & ~$flag );
+}
+
+# True if the is-terminal flag, bit 31, is set in the given node value.
+sub TrieNodeGetIsTerminal {
+    my ( $node ) = @_;
+    my $flag = 1 << 31;
+    return ( $node & $flag ) != 0;
+}
+
+# Set (true) or clear (false) the last-sibling flag, bit 30, of the node
+# referenced by the first argument.
+sub TrieNodeSetIsLastSibling {
+    my ( $nodeR, $isLastSibling ) = @_;
+
+    my $flag = 1 << 30;
+    ${$nodeR} = $isLastSibling ? ( ${$nodeR} | $flag )
+                               : ( ${$nodeR} & ~$flag );
+}
+
+# True if the last-sibling flag, bit 30, is set in the given node value.
+sub TrieNodeGetIsLastSibling {
+    my ( $node ) = @_;
+    my $flag = 1 << 30;
+    return ( $node & $flag ) != 0;
+}
+
+# Store $letter in the five-bit letter field (bits 25..29) of the node
+# referenced by the first argument.  Dies if $letter is 32 or more.
+sub TrieNodeSetLetter {
+    my ( $nodeR, $letter ) = @_;
+
+    die "letter ", $letter, " too big" if $letter >= 32;
+
+    my $fieldMask = 0x1F << 25;
+    # wipe the old letter, then drop the new one in
+    ${$nodeR} = ( ${$nodeR} & ~$fieldMask ) | ( $letter << 25 );
+}
+
+# Return the five-bit letter field (bits 25..29) of the given node value.
+sub TrieNodeGetLetter {
+    my ( $node ) = @_;
+    return ( $node >> 25 ) & 0x1F;
+}
+
+# Store $fco in the first-child-offset field (the low 25 bits) of the node
+# referenced by the first argument.  Dies if $fco has any of bits 25..31
+# set.
+sub TrieNodeSetFirstChildOffset {
+    my ( $nodeR, $fco ) = @_;
+
+    die "$fco larger than 25 bits" if ($fco & 0xFE000000) != 0;
+
+    # wipe the old offset, then drop the new one in
+    ${$nodeR} = ( ${$nodeR} & ~0x01FFFFFF ) | $fco;
+}
+
+# Return the first-child-offset field of the given node value, i.e. its
+# low 25 bits.
+sub TrieNodeGetFirstChildOffset {
+    my ( $node ) = @_;
+    return $node & 0x01FFFFFF;
+}
+
+
+# Assemble a node value from its four fields and return it.  The
+# last-sibling flag is the fourth argument; when it is omitted the flag is
+# left clear.
+sub MakeTrieNode {
+    my ( $letter, $isTerminal, $firstChildOffset, $isLastSibling ) = @_;
+
+    my $node = 0;
+    my $nodeR = \$node;
+
+    TrieNodeSetIsTerminal( $nodeR, $isTerminal );
+    TrieNodeSetIsLastSibling( $nodeR, $isLastSibling );
+    TrieNodeSetLetter( $nodeR, $letter );
+    TrieNodeSetFirstChildOffset( $nodeR, $firstChildOffset );
+
+    return $node;
+} # MakeTrieNode
+
+# Caller may need to know the offset of the first top-level node.
+# Write it here.
+# Write $firstRootChildOffset to the file named $startNodeOut as a 32-bit
+# big-endian integer (pack template "N").  Dies if the file cannot be
+# opened.
+sub writeOutStartNode {
+    my ( $startNodeOut, $firstRootChildOffset ) = @_;
+
+    open( my $nodeOutFH, '>', $startNodeOut )
+        or die "unable to open start node file $startNodeOut: $!\n";
+    binmode( $nodeOutFH );      # packed binary data
+    print $nodeOutFH pack( "N", $firstRootChildOffset );
+    close( $nodeOutFH );
+} # writeOutStartNode
+
+# build the hash for translating.  I'm using a hash assuming it'll be
+# fast.  Key is the letter; value is the 0..31 value to be output.
+# Read the map file $gTableFile and build the two translation tables:
+# %gTableHash maps each character to its position in the file (the tile
+# value), and @gRevMap maps positions back to characters.  A character
+# with code 0 (the blank) takes up a position but gets no %gTableHash
+# entry.  With $gUseUnicode set, only the second byte of each pair is
+# used.
+#
+# Dies if the file cannot be opened or has too many entries.
+sub makeTableHash {
+    open( my $tableFH, '<', $gTableFile )
+        or die "unable to open map file $gTableFile: $!\n";
+
+    @gRevMap = ();
+
+    for ( my $i = 0; ; ++$i ) {
+        my $ch = getc( $tableFH );
+        last if !defined $ch;
+
+        if ( $gUseUnicode ) {   # skip the first byte each time: tmp HACK!!!
+            $ch = getc( $tableFH );
+            last if !defined $ch;
+        }
+
+        push @gRevMap, $ch;
+
+        if ( ord($ch) == 0 ) {	# blank
+            next;       # we want to increment i when blank seen since
+                        # it is a tile value
+        }
+
+        die "$gTableFile too large\n" if $i > 32;
+        # Compare the character code: "$ch != 0" compared the character
+        # numerically, which is 0 for every non-digit.
+        die "only blank (0) can be 32nd char\n"
+            if ( $i == 32 && ord($ch) != 0 );
+
+        $gTableHash{$ch} = $i;
+    }
+
+    close( $tableFH );
+} # makeTableHash
+
+# emitNodes. "input" is $gNodes.  From it we write up to
+# $nBytesPerOutfile to files named $outFileBase0..n, mapping the
+# letter field down to 5 bits with a hash built from $tableFile.  If
+# at any point we encounter a letter not in the hash we fail with an
+# error.
+
+# Write @gNodes to the files <outFileBase>_000.bin, _001.bin, ...
+#
+# Each file receives whole subarrays (runs of nodes ending with a
+# last-sibling node) until the next one would push it past
+# $nBytesPerOutfile bytes.  Sets $gNBytesPerNode to 4 when there are more
+# than 0x1FFFF nodes or $gForceFour is set, and to 3 otherwise.
+#
+# Dies if a file cannot be opened, if more than 100 files would be
+# needed, if the node array does not end with a last-sibling node, or if
+# a single subarray is larger than $nBytesPerOutfile.
+sub emitNodes($$) {
+    my ( $nBytesPerOutfile, $outFileBase ) = @_;
+
+    # is 17 bits enough?
+    printf STDOUT ("There are %d (0x%x) nodes in this DAWG.\n",
+                   0 + @gNodes, 0 + @gNodes );
+    $gNBytesPerNode = ( @gNodes > 0x1FFFF || $gForceFour ) ? 4 : 3;
+
+    my $nextIndex = 0;
+
+    for ( my $nextFileNum = 0; $nextIndex < @gNodes; ++$nextFileNum ) {
+
+        die "Too many outfiles; infinite loop?" if $nextFileNum > 99;
+
+        # the base name is passed as data, never used as a format string
+        my $outName = sprintf( "%s_%03d.bin", $outFileBase, $nextFileNum );
+        open( my $outFH, '>', $outName )
+            or die "unable to open $outName for writing: $!\n";
+        binmode( $outFH );
+        my $curSize = 0;
+
+        while ( $nextIndex < @gNodes ) {
+
+            # scan to find the last sibling of the current subarray
+            my $i = $nextIndex;
+            while ( !TrieNodeGetIsLastSibling( $gNodes[$i] ) ) {
+                ++$i;
+                die "bad trie format: last node not last sibling"
+                    if $i >= @gNodes;
+            }
+            ++$i;	# move beyond the last sibling
+
+            my $nextSize = ($i - $nextIndex) * $gNBytesPerNode;
+            if ( $curSize + $nextSize > $nBytesPerOutfile ) {
+                # A subarray that doesn't fit into an empty file will
+                # never fit; fail now rather than creating empty files
+                # until the file-count limit is hit.
+                die "subarray of $nextSize bytes exceeds the limit of "
+                    . "$nBytesPerOutfile bytes per file\n"
+                    if $curSize == 0;
+                last;
+            }
+
+            # emit the subarray
+            while ( $nextIndex < $i ) {
+                outputNode( $gNodes[$nextIndex], $gNBytesPerNode, $outFH );
+                ++$nextIndex;
+            }
+            $curSize += $nextSize;
+        }
+
+        close( $outFH ) or die "error closing $outName: $!\n";
+    }
+
+} # emitNodes
+
+# Print one word, followed by a newline, to STDERR.
+sub printWord {
+    my ( $word ) = @_;
+
+    print STDERR $word, "\n";
+}
+
+# print out the entire dictionary, as text, to STDERR.
+
+# Print, to STDERR, every word reachable from the sibling list starting
+# at $index in @gNodes, each prefixed with $str.  Recurses through the
+# first-child offsets.
+#
+# Letters are translated back through @gRevMap.  A character below 0x20
+# is shown as a backslash followed by the digit for its code (code 1 as
+# "\1", and so on).
+sub printOneLevel {
+
+    my ( $index, $str ) = @_;
+
+    for ( ; ; ) {
+
+        my $newStr = $str;
+        my $node = $gNodes[$index++];
+
+        my $lindx = $gRevMap[TrieNodeGetLetter($node)];
+
+        if ( ord($lindx) >= 0x20 ) {
+            $newStr .= "$lindx";
+        } else {
+            print STDERR "sub space" if $debug;
+            # Work with character codes: '0'+$lindx added two strings
+            # numerically and always produced chr(0).
+            $newStr .= "\\" . chr( ord('0') + ord($lindx) );
+        }
+
+        if ( TrieNodeGetIsTerminal($node) ) {
+            printWord( $newStr );
+        }
+
+        my $fco = TrieNodeGetFirstChildOffset( $node );
+        if ( $fco != 0 ) {
+            printOneLevel( $fco, $newStr );
+        }
+
+        if ( TrieNodeGetIsLastSibling($node) ) {
+            last;
+        }
+    }
+}
+
+# Write one node to $outfile using $nBytes (3 or 4) bytes.
+#
+# Byte order follows the array_edge struct in dawg.h:
+#   1. highByte: bits 8..15 of the first-child offset
+#   2. lowByte:  bits 0..7 of the first-child offset
+#   3. bits:     letter (LETTERMASK 0x1f), ACCEPTINGMASK 0x20 for
+#                terminal nodes, LASTEDGEMASK 0x40 for the last sibling,
+#                LASTBITMASK 0x80 for bit 16 of the first-child offset
+#   4. moreBits: only in four-byte mode: bits 17 and up of the offset
+#
+# Dies if the offset does not fit into the chosen format.
+sub outputNode {
+    my ( $node, $nBytes, $outfile ) = @_;
+
+    my $offset = TrieNodeGetFirstChildOffset($node);
+    my $extraByte;
+
+    if ( $nBytes == 4 ) {
+        $extraByte = $offset >> 17;
+        die "fco too big" if $extraByte > 0xFF;
+        $offset &= 0x1FFFF;
+    }
+
+    # low 16 bits of the offset, high byte first
+    print $outfile pack( "C", ($offset >> 8) & 0xFF );
+    print $outfile pack( "C", $offset & 0xFF );
+
+    # whatever is left must fit into the single LASTBITMASK bit
+    my $topBit = $offset >> 16;
+    die "fco not 1 or 0" if $topBit > 1;
+
+    my $bits = TrieNodeGetLetter($node);
+    $bits |= 0x40 if TrieNodeGetIsLastSibling($node);
+    $bits |= 0x20 if TrieNodeGetIsTerminal($node);
+    $bits |= 0x80 if $topBit != 0;
+    print $outfile pack( "C", $bits );
+
+    # the final byte, if in use
+    print $outfile pack( "C", $extraByte ) if $nBytes == 4;
+} # outputNode
+
+# Print the command-line summary to STDERR.
+sub usage {
+    my @lines = (
+        "usage: $0 \n",
+        "\t[-b    bytesPerFile] (default = 0xFFFFFFFF)\n",
+        "\t-m     mapFile\n",
+        "\t-ob    outFileBase\n",
+        "\t-sn    start node out file\n",
+        "\t[-if   input file name]  -- default = stdin\n",
+        "\t[-term ch] (word terminator -- default = '\\0'\n",
+        "\t[-nosort] (input already sorted in accord with -m; " .
+        " default=sort'\n",
+        "\t[-dump]  (write dictionary as text to STDERR for testing)\n",
+        "\t[-force4](use 4 bytes per node regardless of need)\n",
+        "\t[-r]     (reject words with letters not in mapfile)\n",
+        "\t[-k]     (kill if any letters no in mapfile -- default)\n",
+    );
+
+    print STDERR join( '', @lines );
+
+} # usage
+
+# Consume @ARGV and set the option globals.  Patterns are tried in the
+# order listed and are not anchored, so the order matters (-mn must be
+# tested before -m).  Dies on an argument that matches no pattern.
+#
+# Returns the map file name, which is false when -m/-mn was not given.
+sub parseARGV {
+
+    while ( my $arg = shift(@ARGV) ) {
+
+        if ( $arg =~ /-b/ ) {
+            $gNBytesPerOutfile = shift(@ARGV);
+        } elsif ( $arg =~ /-mn/ ) {
+            $gTableFile = shift(@ARGV);
+            $gUseUnicode = 1;
+        } elsif ( $arg =~ /-m/ ) {
+            $gTableFile = shift(@ARGV);
+        } elsif ( $arg =~ /-ob/ ) {
+            $gOutFileBase = shift(@ARGV);
+        } elsif ( $arg =~ /-sn/ ) {
+            $gStartNodeOut = shift(@ARGV);
+        } elsif ( $arg =~ /-if/ ) {
+            $gInFileName = shift(@ARGV);
+        } elsif ( $arg =~ /-r/ ) {
+            $gKillIfMissing = 0;
+        } elsif ( $arg =~ /-k/ ) {
+            $gKillIfMissing = 1;
+        } elsif ( $arg =~ /-term/ ) {
+            # the terminator is given as a character code
+            $gTermChar = chr(shift(@ARGV));
+        } elsif ( $arg =~ /-dump/ ) {
+            $gDumpText = 1;
+        } elsif ( $arg =~ /-nosort/ ) {
+            $gNeedsSort = 0;
+        } elsif ( $arg =~ /-wc/ ) {
+            $gCountFile = shift(@ARGV);
+        } elsif ( $arg =~ /-ns/ ) {
+            $gBytesPerNodeFile = shift(@ARGV);
+        } elsif ( $arg =~ /-force4/ ) {
+            $gForceFour = 1;
+        } else {
+            die "unexpected arg $arg\n";
+        }
+    }
+
+    if ( $debug ) {
+        print STDERR "gNBytesPerOutfile=$gNBytesPerOutfile\n";
+        print STDERR "gTableFile=$gTableFile\n";
+        print STDERR "gOutFileBase=$gOutFileBase\n";
+        print STDERR "gStartNodeOut=$gStartNodeOut\n";
+        printf STDERR "gTermChar=%s(%d)\n", $gTermChar, ord($gTermChar);
+    }
+
+    return $gTableFile;
+
+} # parseARGV
--- a/xwords4/xwords4/dawg/frank_mkspecials.pl
+++ b/xwords4/xwords4/dawg/frank_mkspecials.pl
@ -0,0 +1,45 @@
+#!/usr/bin/perl
+
+# Copyright 2001 by Eric House (fixin@peak.org)
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+# Given arguments consisting of triples, first a string and then pbitm
+# files representing bitmaps.  For each triple, print out the string and
+# then the converted bitmaps.
+
+use strict;
+
+# The arguments must form complete (string, large bitmap, small bitmap)
+# triples; refuse a partial one rather than emit a truncated record.
+die "wrong number of args" if (@ARGV % 3) != 0;
+
+while ( @ARGV ) {
+  my ( $str, $largebmp, $smallbmp ) = splice( @ARGV, 0, 3 );
+
+  doOne( $str, $largebmp, $smallbmp );
+}
+
+# Write one special-tile record to STDOUT: a length byte, the string itself,
+# then the output of ../pbitm2bin.pl for the large bitmap followed by the
+# small one.
+#
+#   $str       text of the tile
+#   $largebmp  path of the pbitm file for the large bitmap
+#   $smallbmp  path of the pbitm file for the small bitmap
+#
+# Dies if the converter cannot be started or exits with a failure status.
+sub doOne {
+  my ( $str, $largebmp, $smallbmp ) = @_;
+
+  print pack( "C", length($str) );
+  print $str;
+
+  print STDERR "looking at $largebmp", "\n";
+
+  foreach my $bmp ( $largebmp, $smallbmp ) {
+    # List-form pipe open: the file name is handed straight to the converter
+    # (which reads the files named in its arguments) and never passes
+    # through a shell, so spaces or metacharacters in the name are harmless.
+    open( my $conv, "-|", "../pbitm2bin.pl", $bmp )
+      or die "couldn't run ../pbitm2bin.pl on $bmp: $!";
+    binmode( $conv );
+
+    local $/;                   # slurp the converter's whole output
+    my $converted = <$conv>;
+    print $converted if defined $converted;
+
+    # close() on a pipe reports the child's exit status
+    close( $conv ) or die "../pbitm2bin.pl failed on $bmp";
+  }
+}
+
+
--- a/xwords4/xwords4/dawg/gendict.c
+++ b/xwords4/xwords4/dawg/gendict.c
@ -0,0 +1,99 @@
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+
+/* 
+ * Copyright 1998 by Eric House.  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation; either version 2
+ * of the License, or (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+ */
+ 
+/* Home-grown boolean: a char holding either true (1) or false (0). */
+typedef char boolean;
+#define true 1
+#define false 0
+
+/* Capacity, in letters, of the word buffer declared in main() (which adds
+ * one more byte for the terminating NUL). */
+#define MAXWORDLEN 15
+
+/* Prints the current word and advances it to the next combination. */
+boolean writeOneWord( char* word, int len );
+/* Prints the usage message and exits. */
+void usage();
+
+//////////////////////////////////////////////////////////////////////////////
+// main
+// This program generates all possible combinations of letters 'A'-'Z' of
+// lengths between 2 and MAXWORDLEN, writing them to stdout.  It's meant
+// to be used to test the dawg dictionary and a state machine based on
+// it: if the output of this program is used as input to that machine, the
+// list of words accepted by the machine should be identical to the list
+// from which the dawg was created -- provided sufficient length words
+// are created.
+//////////////////////////////////////////////////////////////////////////////
+/* Usage: gendict lowerbound upperbound
+ *
+ * For every length from lowerbound to upperbound inclusive, writes every
+ * combination of the letters 'A'-'Z' of that length to stdout, one per
+ * line.  Both bounds must be at least 2, and upperbound may not exceed
+ * MAXWORDLEN because the words are built in a fixed-size buffer.
+ * Any invalid invocation prints the usage message and exits.
+ */
+int main( int argc, char** argv ) {
+    int len, j;
+    long lowerbound = 0;
+    long upperbound = 0;
+    char buffer[MAXWORDLEN+1];
+
+    /* %ld, not %d: the destinations are longs */
+    if ( argc != 3
+         || sscanf( argv[1], "%ld", &lowerbound ) != 1
+         || sscanf( argv[2], "%ld", &upperbound ) != 1
+         || lowerbound < 2 || upperbound < 2
+         || upperbound > MAXWORDLEN ) {
+        usage();                /* exits; does not return */
+    }
+
+    for ( len = (int)lowerbound; len <= (int)upperbound; ++len ) {
+        /* start each length at "AA...A" */
+        for ( j = 0; j < len; ++j ) {
+            buffer[j] = 'A';
+        }
+        buffer[len] = '\0';
+
+        /* writeOneWord prints the word, then steps to the next one; it
+         * returns true once the all-'Z' word has been printed */
+        while ( !writeOneWord( buffer, len-1 ) ) {
+            /* do nothing */
+        }
+    }
+    return 0;
+}
+
+/* Print word to stdout, then advance it in place to the next combination.
+ *
+ *   word  NUL-terminated string of letters 'A'-'Z', modified in place
+ *   len   index of the last letter (i.e. string length minus one)
+ *
+ * Works like an odometer: increment the last letter if possible; otherwise
+ * reset it to 'A' and carry into the letter before it, and so on.  Returns
+ * true when the carry reaches the first letter, meaning the word just
+ * printed was the last one; the first letter is left untouched in that
+ * case.  Returns false otherwise.
+ */
+boolean writeOneWord( char* word, int len ) {
+    int i;
+
+    fprintf( stdout, "%s\n", word );
+
+    /* Walk from the last letter toward the first.  The loop condition also
+     * keeps the index inside the string for a one-letter word (len == 0),
+     * where a separate "letter above the last" does not exist. */
+    for ( i = len; i >= 0; --i ) {
+        if ( word[i] != 'Z' ) {
+            word[i]++;
+            return false;
+        }
+        if ( i == 0 ) {         /* they're *all* Zs... */
+            break;
+        }
+        word[i] = 'A';          /* reset and carry */
+    }
+    return true;                /* we wrote all the words! */
+}
+
+/* Print the command-line synopsis to stderr and exit with a failure
+ * status.  The argument order matches main(), which reads the lower bound
+ * from argv[1] and the upper bound from argv[2].  Does not return.
+ */
+void usage() {
+    fprintf( stderr,
+             "USAGE: gendict lowerbound upperbound\n"
+             "   (Both must be >= 2.)\n" );
+    exit( 1 );
+}
+
--- a/xwords4/xwords4/dawg/listchars.pl
+++ b/xwords4/xwords4/dawg/listchars.pl
@ -0,0 +1,36 @@
+#!/usr/bin/perl
+
+# Copyright 2001 by Eric House
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+use strict;
+
+# character => number of times it occurs in the input (newlines excluded)
+my %tally;
+
+# Count every character of every input line.
+while ( defined( my $line = <> ) ) {
+    chomp( $line );
+    $tally{$_}++ foreach split( //, $line );
+}
+
+# Report one line per character seen, in sorted key order:
+# character code, the character itself, and its count.
+foreach my $ch ( sort keys %tally ) {
+    my $seen = $tally{$ch};
+    next unless $seen;
+    printf( "%.3d: %s: %.7d\n", ord($ch), $ch, $seen );
+}
--- a/xwords4/xwords4/dawg/palm_mkspecials.pl
+++ b/xwords4/xwords4/dawg/palm_mkspecials.pl
@ -0,0 +1,111 @@
+#!/usr/bin/perl
+
+# Copyright 2002 by Eric House
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+# Given arguments consisting of triples, first a string and then pbitm
+# files representing bitmaps. The format looks like this:
+
+# array [0-n] of { char len; 
+#                  char[3] alt txt;
+#                  int16 offsetOfLarge;
+#                  int16 offsetOfSmall;
+#                }
+# array [0-n] of { 
+#                  bitmapLargeIfPresent;
+#                  bitmapSmallIfPresent;
+#                }
+#
+# In addition, there's padding between bitmaps if needed to get the next
+# one to a 2-byte boundary.  And the input files are not in PalmOS bitmap
+# format, so they have to get converted into a tmp file before the sizes
+# can be known and included in the eventual output.
+
+use strict;
+
+# Bitmaps are collected here while the entry table is written to STDOUT;
+# the file is appended to STDOUT afterwards and then removed.
+my $tmpfile = "/tmp/tmpout$$";
+
+# validate before dividing so $nSpecials is always a whole number
+die "wrong number of args" if (@ARGV % 3) != 0;
+my $nSpecials = @ARGV / 3;
+my $gOffset = $nSpecials * 8;     # sizeof(Xloc_specialEntry)
+
+open( TMPFILE, ">", $tmpfile )
+    or die "couldn't open $tmpfile for writing: $!";
+binmode( TMPFILE );
+binmode( STDOUT );
+
+for ( my $i = 0; $i < $nSpecials; ++$i ) {
+
+    my $str = shift( @ARGV );
+    my $len = length($str);
+    die "string $str too long" if $len > 3;
+
+    # the text, null-padded to four bytes
+    print $str;
+    while ( $len < 4 ) {
+        ++$len;
+        print pack("c", 0 );
+    }
+
+    # large bitmap, then small: each call prints a 2-byte offset to STDOUT
+    # and appends the converted bitmap to TMPFILE
+    doOneFile( shift( @ARGV ), \*TMPFILE, \$gOffset );
+    doOneFile( shift( @ARGV ), \*TMPFILE, \$gOffset );
+}
+
+close( TMPFILE ) or die "couldn't finish writing $tmpfile: $!";
+
+# now append the tempfile
+open( TMPFILE, "<", $tmpfile )
+    or die "couldn't reopen $tmpfile for reading: $!";
+binmode( TMPFILE );
+while ( read( TMPFILE, my $buffer, 128 ) ) {
+    print $buffer;
+}
+close TMPFILE;
+
+unlink $tmpfile;
+
+exit 0;
+
+
+# Convert one bitmap file, append it to the bitmap stream, and print its
+# table entry.
+#
+#   $fil      path of the pbitm file ("/dev/null" means no bitmap)
+#   $fh       filehandle collecting the converted bitmaps
+#   $offsetR  reference to the running offset; advanced by the padded size
+#
+# Prints to STDOUT a big-endian 16-bit value: the offset at which this
+# bitmap starts, or 0 when there is no bitmap.
+#
+# No prototype: the sub takes three arguments, and its callers appear
+# earlier in the file than this definition, so a prototype could not be
+# applied to them in any case.
+sub doOneFile {
+    my ( $fil, $fh, $offsetR ) = @_;
+
+    my $size = convertBmp($fil, $fh );
+    $size = 0 unless defined $size;
+
+    # pad to an even length so the next bitmap starts on a 2-byte boundary
+    if ( ($size % 2) != 0 ) {
+        ++$size;
+        print $fh pack( "c", 0 );
+    }
+
+    print pack( "n", $size > 0? ${$offsetR} : 0 );
+
+    ${$offsetR} += $size;
+} # doOneFile
+
+# Convert a pbitm file by running pilrc on a one-line resource script, and
+# append the resulting binary to $fhandle.
+#
+#   $pbitmfile  path of the pbitm file; "/dev/null" means "no bitmap"
+#   $fhandle    filehandle the converted bitmap is written to
+#
+# Returns the size in bytes of the converted bitmap, or 0 for "/dev/null".
+# Dies if the scratch files cannot be written or read, or if pilrc leaves
+# no output file behind.  Uses the fixed scratch names tmp.rcp and
+# Tbmp03e8.bin in the current directory and removes both when done.
+sub convertBmp($$) {
+    my ( $pbitmfile, $fhandle ) = @_;
+
+    return 0 if $pbitmfile eq "/dev/null";
+
+    my $rcpfile = "tmp.rcp";
+    my $binfile = "Tbmp03e8.bin";   # 0x03e8 == 1000, the ID used below
+
+    open( TMP, ">", $rcpfile )
+        or die "couldn't open $rcpfile for writing: $!";
+    print TMP "BITMAP ID 1000 \"$pbitmfile\" AUTOCOMPRESS";
+    close( TMP ) or die "couldn't finish writing $rcpfile: $!";
+
+    # Backticks on purpose: they capture pilrc's stdout, keeping it out of
+    # this script's own STDOUT, which carries the binary result.
+    `pilrc $rcpfile`;
+
+    my $siz = -s $binfile;
+    if ( !defined($siz) ) {
+        unlink( $rcpfile );
+        die "pilrc produced no $binfile for $pbitmfile";
+    }
+
+    open( my $bin, "<", $binfile )
+        or die "couldn't open $binfile for reading: $!";
+    binmode( $bin );
+    {
+        local $/;               # slurp the whole file
+        my $data = <$bin>;
+        print $fhandle $data if defined $data;
+    }
+    close( $bin );
+
+    unlink( $rcpfile, $binfile );
+
+    return $siz;
+}
--- a/xwords4/xwords4/dawg/par.pl
+++ b/xwords4/xwords4/dawg/par.pl
@ -0,0 +1,234 @@
+#!/usr/bin/perl
+
+# Copyright 2002 by Eric House (fixin@peak.org)   All rights reserved.
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+# Only enough of par's features to support building a crosswords dict
+# pdb
+
+use strict;
+
+# set to 1 for tracing on STDERR
+my $debug = 0;
+
+
+# Database attribute bits, stolen from par source.  Each is a single bit;
+# processAttrString ORs the requested ones into $gAttrs.
+my $PRC_FLAGS_RESOURCE    = 1 << 0;
+my $PRC_FLAGS_READONLY    = 1 << 1;
+my $PRC_FLAGS_DIRTY       = 1 << 2;
+my $PRC_FLAGS_BACKUP      = 1 << 3;
+my $PRC_FLAGS_NEWER       = 1 << 4;
+my $PRC_FLAGS_RESET       = 1 << 5;
+my $PRC_FLAGS_COPYPREVENT = 1 << 6;
+my $PRC_FLAGS_STREAM      = 1 << 7;
+my $PRC_FLAGS_HIDDEN      = 1 << 8;
+my $PRC_FLAGS_LAUNCHABLE  = 1 << 9;
+my $PRC_FLAGS_RECYCLABLE  = 1 << 10;
+my $PRC_FLAGS_BUNDLE      = 1 << 11;
+my $PRC_FLAGS_OPEN        = 1 << 15;
+
+
+# values written to the flags and version fields of the header
+my $gAttrs = 0;
+my $gVersion = 1;               # par defaults this to 1
+
+# Command line:  c|-c [-a attrs] [-v version] dbfile name type cid files...
+my $cmd = shift( @ARGV );
+die "only 'c' supported now"
+    if !defined($cmd) || ($cmd ne "c" && $cmd ne "-c");
+
+readHOptions( \@ARGV );
+
+die "missing arguments: need dbfile, name, type and cid" if @ARGV < 4;
+
+my $dbfile = shift( @ARGV );
+my $name = shift( @ARGV );
+die "name $name too long" if length($name) > 31;
+my $type = shift( @ARGV );
+die "type $type must be of length 4" if length($type) != 4;
+my $cid = shift( @ARGV );
+die "cid $cid must be of length 4" if length($cid) != 4;
+
+# Everything left is a record file.  Names and sizes are kept in parallel
+# arrays; the sizes determine the record offsets written to the header.
+my @fileNames;
+my @fileLengths;
+
+while ( @ARGV > 0 ) {
+    my $filename = shift( @ARGV );
+    my $length = -s $filename;
+    # -s yields undef for a missing file; continuing would put garbage
+    # offsets in the record list
+    die "couldn't find infile $filename\n" unless defined $length;
+    push @fileNames, $filename;
+    push @fileLengths, $length;
+}
+
+my $nFiles = @fileNames;
+
+# from par's prcp.h; thanks djw!
+# typedef struct prc_file_t {
+#     prc_byte_t name[32];
+#     prc_byte_t flags[2];
+#     prc_byte_t version[2];
+#     prc_byte_t ctime[4];
+#     prc_byte_t mtime[4];
+#     prc_byte_t btime[4];
+#     prc_byte_t modnum[4];
+#     prc_byte_t appinfo[4];
+#     prc_byte_t sortinfo[4];
+#     prc_byte_t type[4];
+#     prc_byte_t cid[4];
+#     prc_byte_t unique_id_seed[4];
+#     prc_byte_t next_record_list[4];
+#     prc_byte_t nrecords[2];
+# } prc_file_t;
+
+# Write the database: the 78-byte header laid out as in prc_file_t, one
+# 8-byte entry per record, two bytes of padding, then the record files
+# themselves in order.
+
+# Parenthesized open: in "open FH, EXPR or die" the "or" binds to EXPR,
+# which is always true, so the die could never fire.
+open( OUTFILE, ">", $dbfile )
+    or die "couldn't open outfile $dbfile for writing";
+binmode( OUTFILE );
+
+# 2082844800 is the number of seconds from 1904-01-01 to 1970-01-01
+my $time = time() + 2082844800;
+
+my $header = pack( "a32 n n N N N N N N a4 a4 N N n",
+                   $name,       # name, null-padded to 32 bytes
+                   $gAttrs,     # flags
+                   $gVersion,   # version
+                   $time,       # ctime
+                   $time,       # mtime
+                   0,           # btime
+                   0,           # mod num
+                   0,           # appinfo
+                   0,           # sortinfo
+                   $type,       # type
+                   $cid,        # cid
+                   0,           # unique_id_seed
+                   0,           # next_record_list
+                   $nFiles );   # nrecords
+print OUTFILE $header;
+
+# offset of the first record's data: past the header, the record list and
+# the two padding bytes
+my $offset = length($header);
+$offset += $nFiles * 8;
+$offset += 2;                   # djw adds 2 bytes after size list; see below
+foreach my $len ( @fileLengths ) {
+    print OUTFILE pack( "N", $offset );
+    print OUTFILE pack( "N", 0 );
+    $offset += $len;
+}
+
+print OUTFILE pack( "n", 0 );   # djw does this sans comment: flush.c, line 87
+
+foreach my $file ( @fileNames ) {
+    open( INFILE, "<", $file ) or die "couldn't open infile $file\n";
+    binmode( INFILE );
+    my $buffer;
+    while ( read INFILE, $buffer, 1024 ) {
+        print OUTFILE $buffer;
+    }
+    close INFILE;
+}
+
+
+close( OUTFILE ) or die "couldn't finish writing $dbfile: $!";
+
+exit 0;
+
+##############################################################################
+# Subroutines
+##############################################################################
+
+# Strip the leading "-" options from the front of the argument list.
+#
+#   $argvR  reference to the argument array; options are removed from it
+#
+# "-a <attrs>" is handed to processAttrString and "-v <n>" sets $gVersion.
+# Stops, consuming nothing further, at the first argument that does not
+# begin with "-".  Dies on any other option.
+sub readHOptions {
+
+    my ( $argvR ) = @_;
+
+    while ( 1 ) {
+        my $opt = $argvR->[0];
+
+        # not an option: leave it for the caller
+        last if $opt !~ /^-/;
+
+        shift @$argvR;
+
+        if ( $opt eq "-a" ) {
+            processAttrString( shift @$argvR );
+        } elsif ( $opt eq "-v" ) {
+            $gVersion = shift @$argvR;
+        } else {
+            die "what's with \"$opt\": -a and -v are the only hattrs supported";
+        }
+    }
+
+} # readHOptions
+
+# OR the attribute bits named in $attrs into $gAttrs.
+#
+#   $attrs  attribute names separated by "|"
+#
+# Each name is matched, as a pattern anywhere within the flag text, against
+# the table below; the first entry that matches wins.  Dies on a flag that
+# matches nothing, and on the two attributes marked unsupported.
+sub processAttrString {
+
+    my ( $attrs ) = @_;
+
+    # [ pattern, bit, message to die with when the attribute is unsupported ]
+    # Order is significant: entries are tried top to bottom.
+    my @known = (
+        [ qr/resource/,    $PRC_FLAGS_RESOURCE,   "resource attr not supported" ],
+        [ qr/readonly/,    $PRC_FLAGS_READONLY ],
+        [ qr/dirty/,       $PRC_FLAGS_DIRTY ],
+        [ qr/backup/,      $PRC_FLAGS_BACKUP ],
+        [ qr/newer/,       $PRC_FLAGS_NEWER ],
+        [ qr/reset/,       $PRC_FLAGS_RESET ],
+        [ qr/copyprevent/, $PRC_FLAGS_COPYPREVENT ],
+        [ qr/stream/,      $PRC_FLAGS_STREAM,     "stream attr not supported" ],
+        [ qr/hidden/,      $PRC_FLAGS_HIDDEN ],
+        [ qr/launchable/,  $PRC_FLAGS_LAUNCHABLE ],
+        [ qr/recyclable/,  $PRC_FLAGS_RECYCLABLE ],
+        [ qr/bundle/,      $PRC_FLAGS_BUNDLE ],
+        [ qr/open/,        $PRC_FLAGS_OPEN ],
+    );
+
+  FLAG:
+    foreach my $flag ( split /\|/, $attrs ) {
+
+        print STDERR "looking at flag $flag\n" if $debug;
+
+        foreach my $entry ( @known ) {
+            my ( $pattern, $bit, $fatal ) = @{$entry};
+            next unless $flag =~ $pattern;
+
+            $gAttrs |= $bit;
+            die $fatal if defined $fatal;
+            next FLAG;
+        }
+
+        die "flag $flag not supportd";
+    }
+} # processAttrString
--- a/xwords4/xwords4/dawg/pbitm2bin.pl
+++ b/xwords4/xwords4/dawg/pbitm2bin.pl
@ -0,0 +1,87 @@
+#!/usr/bin/perl
+#
+# Copyright 2001 by Eric House (fixin@peak.org).  All rights reserved.
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+#
+#
+# Given a pbitm on stdin, a text bitmap file where '#' indicates a set
+# bit and '-' indicates a clear bit, convert into binary form (on
+# stdout) where there's one bit per bit plus a byte each for the width
+# and height.  Nothing for bitdepth at this point.  And no padding: if
+# the number of bits in a row isn't a multiple of 8 then one byte will
+# hold the last bits of one row and the first of another.
+
+use strict;
+
+my $nRows = 0;                  # number of rows read
+my $nCols = 0;                  # width of every row, taken from the first
+my $bits = "";                  # all rows concatenated, one char per bit
+
+# first gather information and sanity-check the data
+
+while ( defined( my $row = <> ) ) {
+  chomp( $row );
+  my $width = length( $row );
+
+  if ( $nCols != 0 ) {
+    # every later row must be as wide as the first
+    die "line of inconsistent length" if $width != $nCols;
+  } else {
+    $nCols = $width;
+  }
+
+  # still zero means this row was empty: stop reading
+  last if $nCols == 0;
+
+  $bits .= $row;
+  ++$nRows;
+}
+
+my $len = length($bits);
+
+# width and height are each written as a single unsigned byte
+die "bitmap ${nCols}x${nRows} too large: limit is 255x255"
+  if $nCols > 255 || $nRows > 255;
+
+print pack( "C", $nCols );
+
+# if we've been given an empty file, print out a single null byte and
+# be done.  That'll be the convention for "non-existent bitmap".
+if ( $len == 0 ) {
+  exit 0;
+}
+print pack( "C", $nRows );
+printf STDERR "emitting %dx%d bitmap\n", $nCols, $nRows;
+
+# Only '#' (set) and '-' (clear) are legal.  This has to be a string test:
+# comparing the characters with == is a numeric comparison, under which
+# both sides evaluate to 0 and every non-digit character passes.
+if ( $bits =~ /([^#-])/ ) {
+  die "unknown char $1";
+}
+
+# Turn the picture into a string of '1's and '0's and let pack do the bit
+# twiddling: "B*" fills each byte from its high bit down and zero-pads the
+# final byte, so rows run together with no padding between them.
+( my $bitString = $bits ) =~ tr/#-/10/;
+print pack( "B*", $bitString );
--- a/xwords4/xwords4/dawg/pdb.h
+++ b/xwords4/xwords4/dawg/pdb.h
@ -0,0 +1,49 @@
+
+/* 
+ * Copyright 1997 - 2002 by Eric House (fixin@peak.org).  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation; either version 2
+ * of the License, or (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+ */
+ 
+/* Fixed-width integers for the on-disk structures below: DWORD must be
+ * exactly 4 bytes and WORD exactly 2, since the structs are filled directly
+ * from the file.  "unsigned long" is 8 bytes on LP64 platforms, which would
+ * shift every field after the first, so "unsigned int" is used instead. */
+typedef unsigned int DWORD;
+typedef unsigned short WORD;
+
+/* compile-time checks: a negative array size stops the build if the
+ * assumptions above do not hold on this platform */
+typedef char pdb_dword_must_be_4_bytes[ (sizeof(DWORD) == 4) ? 1 : -1 ];
+typedef char pdb_word_must_be_2_bytes[ (sizeof(WORD) == 2) ? 1 : -1 ];
+
+// all numbers in these structs are big-endian, MAC format
+//
+// DocHeader is the header at the very start of a pdb file.  Code that reads
+// it fills the struct straight from the file using DOCHEADSZ bytes, so the
+// field offsets noted below must match the file layout exactly.
+typedef struct DocHeader {
+    char sName[32];	// 0x00
+    DWORD dwUnknown1;	// 0x20 bytes
+    DWORD dwTime1;	// 0x24 bytes
+    DWORD dwTime2;	// 0x28
+    DWORD dwTime3;	// 0x2C
+    DWORD dwLastSync;	// 0x30
+    DWORD ofsSort;	// 0x34
+    DWORD ofsCatagories;// 0x38
+    DWORD dwType;	// 0x3C  four-character type code
+    DWORD dwCreator;	// 0x40  four-character creator code
+    DWORD dwUnknown2;	// 0x44
+    DWORD dwUnknown3;	// 0x48
+    WORD  wNumRecs;	// 0x4C  number of RecordHeaders that follow
+} DocHeader;
+
+// Size of the header as stored in the file: 0x4C plus the two bytes of
+// wNumRecs.  Use this rather than sizeof(DocHeader), which may include
+// trailing padding.
+#define DOCHEADSZ 78
+
+// One entry of the record list that follows the DocHeader.
+typedef struct RecordHeader {
+    // <eeh> added type in experimentally! on 4/14
+/*     char type[4]; */
+    DWORD offset; // where the record's data starts, counted from the start of the file
+    DWORD bits; // high byte is flags, remaining three are a unique id
+} RecordHeader;
+
+// Size of one RecordHeader as stored in the file (two 4-byte fields).
+#define RECHEADSZ 8
--- a/xwords4/xwords4/dawg/pdb2dict.c
+++ b/xwords4/xwords4/dawg/pdb2dict.c
@ -0,0 +1,272 @@
+// -*-mode: C; fill-column: 80; compile-command: "make pdb2dict"; -*-
+
+/* 
+ * Copyright 1997 - 2002 by Eric House (fixin@peak.org).  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation; either version 2
+ * of the License, or (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+ */
+ 
+#include <stdio.h>
+#include <assert.h>
+#include <string.h>
+#include <stdlib.h>
+
+#include "pdb.h"
+#include "dawg.h"
+
+#include "swap.h"
+
+/////////////////////////////// prototypes //////////////////////////////////
+static void generate_dict( array_edge* memoryFile );
+static void write_words( array_edge* memoryFile, long edgeIndex,
+			 short charIndex, char* wordBuffer );
+static void skipNHeaders( FILE* file, int n, RecordHeader* recHeader );
+static array_edge* loadEdgesArray( FILE* dictFile, unsigned char* charTable );
+static void* readNthRecord( FILE* files, void* where, int whereMaxSize,
+			    int whichRec, int* foundSize );
+static void getNthOffset( FILE* file, int n, long* offset, 
+			  unsigned short* size );
+static void printWord( char* wordBuffer );
+
+///////////////////////////////// globals ///////////////////////////////////
+// Maps the letter code stored in an edge (bits & LETTERMASK) to the byte
+// written for that letter.  main() passes it to loadEdgesArray(), which
+// fills it from the dictionary file; write_words() reads it.
+static unsigned char charTable[32];
+
+/******************************************************************************
+ *
+ *****************************************************************************/
+/* Write the command-line synopsis to stderr and exit with status 1. */
+void usage() {
+    fputs( "Usage: pdb2dict <file.pdb>\n", stderr );
+    exit( 1 );
+}
+
+/******************************************************************************
+ *
+ *****************************************************************************/
+/* Usage: pdb2dict <file.pdb>
+ *
+ * Loads the edge array from the named dictionary file and writes every
+ * word it contains to stdout, one per line.  The file name must end in
+ * ".pdb".  Returns 0 on success; exits with status 1 on a usage error or
+ * if the file cannot be opened.
+ */
+int main( int argc, char** argv ) {
+    char* pdbName;
+    char* extension;
+    array_edge* memoryFile;
+    FILE* dictFile;
+    if ( argc < 2 ) {
+        usage();
+    }
+
+    pdbName = argv[1];
+    /* Look at the *last* dot so that names such as "./dicts/foo.pdb" or
+     * "my.words.pdb" are accepted. */
+    extension = strrchr( pdbName, '.' );
+    if ( (extension == NULL) || (strcmp( extension, ".pdb" ) != 0) ) {
+        usage();
+    }
+
+    /* binary mode: the file is read byte for byte */
+    dictFile = fopen( pdbName, "rb" );
+    if ( dictFile == NULL ) {
+        fprintf( stderr, "%s: No such file %s\n", argv[0], pdbName );
+        exit(1);
+    }
+    memoryFile = loadEdgesArray( dictFile, charTable );
+    fclose( dictFile );
+
+    generate_dict( memoryFile );
+    free( memoryFile );
+    return 0;
+} // main
+
+/******************************************************************************
+ *
+ *****************************************************************************/
+/* Read the whole edge array of a dictionary file into memory.
+ *
+ *   dictFile   the open pdb file, positioned at its start
+ *   charTable  32-byte buffer that receives the character table record
+ *
+ * Record 0 is read as the dawg header; the record it names is read into
+ * charTable; every record from the header's first edge record through the
+ * last record of the file is then concatenated into one malloc'd array.
+ * Returns that array, which the caller must free().  Exits with status 1
+ * if the pdb header cannot be read, memory runs out, or the file holds no
+ * edge data.
+ */
+static array_edge* loadEdgesArray( FILE* dictFile, unsigned char* charTable ) {
+    DocHeader pdbHeader;
+    dawg_header dawgHeader;
+    array_edge* firstEdge = NULL;
+    int curSize = 0;
+    int nRecs, i;
+
+    // read in the main pdb header
+    if ( fread( &pdbHeader, DOCHEADSZ, 1, dictFile ) != 1 ) {
+        fprintf( stderr, "unable to read the pdb header\n" );
+        exit( 1 );
+    }
+    assert( (strncmp( (char*)&pdbHeader.dwCreator, "Xwr3", 4) == 0)
+            && (strncmp( (char*)&pdbHeader.dwType, "DAWG", 4) == 0) );
+
+    (void)readNthRecord( dictFile, &dawgHeader, sizeof(dawgHeader), 0, NULL );
+    assert( dawgHeader.firstEdgeRecNum == 3 );
+
+    (void)readNthRecord( dictFile, charTable, 32, dawgHeader.charTableRecNum,
+                         NULL );
+
+    nRecs = swap_short(pdbHeader.wNumRecs);
+    for ( i = dawgHeader.firstEdgeRecNum; i < nRecs; ++i ) {
+        int newSize;
+        void* rec = readNthRecord( dictFile, NULL, 0, i, &newSize );
+
+        if ( newSize > 0 ) {
+            /* keep the old pointer until realloc is known to have worked */
+            array_edge* grown =
+                (array_edge*)realloc( firstEdge, curSize + newSize );
+            if ( grown == NULL ) {
+                fprintf( stderr, "out of memory loading edges\n" );
+                exit( 1 );
+            }
+            firstEdge = grown;
+            memcpy( ((char*)firstEdge) + curSize, rec, newSize );
+            curSize += newSize;
+        }
+        free( rec );
+    }
+
+    if ( firstEdge == NULL ) {
+        fprintf( stderr, "no edge data found\n" );
+        exit( 1 );
+    }
+    return firstEdge;
+} // loadEdgesArray
+
+/******************************************************************************
+ *
+ *****************************************************************************/
+/* Read one record of the pdb file, leaving the file position unchanged.
+ *
+ *   file          the open pdb file
+ *   where         buffer to read into, or NULL to have one allocated
+ *   whereMaxSize  capacity of where (ignored when where is NULL)
+ *   whichRec      zero-based index of the record
+ *   foundSize     if non-NULL, receives the record's size in bytes
+ *
+ * Returns NULL when where was supplied; otherwise a malloc'd buffer
+ * holding the record, which the caller must free().  Exits with status 1
+ * if memory runs out or the record cannot be read in full.
+ */
+static void* readNthRecord( FILE* file, void* where, int whereMaxSize,
+                            int whichRec, int* foundSize ) {
+    void* result = NULL;
+    void* dest;
+    fpos_t pos;
+    long offset;
+    unsigned short size;
+
+    (void)fgetpos( file, &pos);
+
+    getNthOffset( file, whichRec, &offset, &size );
+    fseek( file, offset, SEEK_SET );
+
+    if ( where == NULL ) {
+        result = malloc( size );
+        /* malloc(0) may legitimately return NULL */
+        if ( result == NULL && size > 0 ) {
+            fprintf( stderr, "out of memory reading record %d\n", whichRec );
+            exit( 1 );
+        }
+        dest = result;
+    } else {
+        assert( size <= whereMaxSize );
+        dest = where;
+    }
+
+    /* fread reports 0 items for a zero-sized item, so skip it then */
+    if ( size > 0 && fread( dest, size, 1, file ) != 1 ) {
+        fprintf( stderr, "unable to read record %d\n", whichRec );
+        exit( 1 );
+    }
+
+    if ( foundSize ) {
+        *foundSize = size;
+    }
+
+    (void)fsetpos( file, &pos);
+    return result;
+} // readNthRecord
+
+/******************************************************************************
+ * Size is my offset subtracted from the one after me, unless I'm the last
+ * entry in which case it's file size minus my offset.
+ *****************************************************************************/
+static void getNthOffset( FILE* file, int n, long* offset, 
+			  unsigned short* size ) {
+    /* Look up record n in the record list.
+     *   file    the open pdb file; its position is restored before returning
+     *   n       zero-based record index; must be below the record count
+     *   offset  receives the record's offset as stored in its header
+     *   size    receives the record's size in bytes
+     * NOTE(review): the size is computed as a long and then stored in an
+     * unsigned short, so a difference above 65535 would be truncated --
+     * confirm that records are never that large. */
+    DocHeader pdbHeader;
+    RecordHeader recHeader;
+    fpos_t pos;
+    long sizeCalc;
+
+    /* remember where the caller was, then start over from the top */
+    (void)fgetpos( file, &pos);
+    rewind( file );
+
+    //fprintf( stderr, "sizeof(pdbHeader)=%d\n", sizeof(pdbHeader) );
+    fread( &pdbHeader, DOCHEADSZ, 1, file );
+    assert( swap_short(pdbHeader.wNumRecs) > n );
+
+    /* reading n+1 headers leaves header n (zero-based) in recHeader */
+    skipNHeaders( file, n+1, &recHeader );
+    *offset = sizeCalc = swap_long( recHeader.offset );
+    if ( n+1 == swap_short(pdbHeader.wNumRecs) ) { // use file size
+	fseek( file, 0, SEEK_END );
+	sizeCalc = ftell( file ) - sizeCalc;
+    } else {
+	/* the next header is read from where the previous read stopped */
+	skipNHeaders( file, 1, &recHeader );	
+	sizeCalc = swap_long( recHeader.offset ) - sizeCalc;
+    }
+    *size = sizeCalc;
+
+    (void)fsetpos( file, &pos);    
+} // getNthOffset
+
+/******************************************************************************
+ * Skip over the given number of headers, returning with the last one read
+ * into the supplied buffer.
+ *****************************************************************************/
+/* Read n consecutive record headers from the current file position.
+ *
+ *   file       the open pdb file, positioned at a record header
+ *   n          how many headers to read
+ *   recHeader  receives each header in turn, so ends up holding the last
+ *
+ * Each header is read as RECHEADSZ bytes, its size in the file, in the
+ * same way the document header is read as DOCHEADSZ bytes; sizeof would
+ * follow the compiler's in-memory layout instead.  Exits with status 1 if
+ * the file ends early.
+ */
+static void skipNHeaders( FILE* file, int n, RecordHeader* recHeader ) {
+    int i;
+    for ( i = 0; i < n; ++i ) {
+        if ( fread( recHeader, RECHEADSZ, 1, file ) != 1 ) {
+            fprintf( stderr, "unexpected end of file in the record list\n" );
+            exit( 1 );
+        }
+    }
+} // skipNHeaders
+
+/******************************************************************************
+ * beginning with an array of NULL chars, on each level of the tree
+ * iterate over each child replacing the appropriate char with the
+ * letter from the edge.  When an edge is terminal, print the word
+ * formed.  And when returning replace the letter with a null char.
+ *****************************************************************************/
+/* Print every word in the edge array, starting from edge 0 with an empty
+ * word. */
+static void generate_dict( array_edge* memoryFile ) {
+    /* zero-initialized, so the word is NUL-terminated at every depth */
+    char wordBuffer[31] = { '\0' };
+
+    write_words( memoryFile, 0, 0, wordBuffer );
+}
+
+/******************************************************************************
+ *
+ *****************************************************************************/
+/* Walk one run of sibling edges, printing every word that passes through it.
+ *
+ *   memoryFile  the whole edge array
+ *   edgeIndex   index of the first edge of the run
+ *   charIndex   position in wordBuffer that this level fills in
+ *   wordBuffer  the word built so far; positions below charIndex are set
+ *
+ * For each edge: store its letter, print the word if the edge is marked
+ * accepting, and recurse into its children when it has a non-zero child
+ * index.  The run ends at the edge carrying LASTEDGEMASK; this level's
+ * letter is cleared before returning.
+ */
+void write_words( array_edge* memoryFile, long edgeIndex, short charIndex,
+                  char* wordBuffer ) {
+    for ( ; ; ) {
+        array_edge* edge = &memoryFile[edgeIndex];
+        unsigned char bits = edge->bits;
+        long childIndex;
+
+        wordBuffer[charIndex] = charTable[(bits & LETTERMASK)];
+        if ( bits & ACCEPTINGMASK ) {
+            printWord( wordBuffer );
+        }
+
+        /* two index bytes, plus a seventeenth bit kept in the flags byte */
+        childIndex = (edge->highByte * 256) + edge->lowByte;
+        if ( bits & LASTBITMASK ) {
+            childIndex += 0x00010000;
+        }
+
+        if ( childIndex > 0 ) {
+            write_words( memoryFile, childIndex, charIndex+1, wordBuffer );
+        }
+
+        if ( bits & LASTEDGEMASK ) {
+            break;
+        }
+        ++edgeIndex;
+    }
+
+    wordBuffer[charIndex] = '\0';
+}
+
+/******************************************************************************
+ *
+ *****************************************************************************/
+/* Write one word to stdout followed by a newline.
+ *
+ *   wordBuffer  NUL-terminated word as built by write_words()
+ *
+ * Bytes of 0x20 and above are written as they are.  Bytes 1, 2 and 3 stand
+ * for the two-letter tiles "CH", "LL" and "RR" and are written expanded.
+ * Any other byte below 0x20 is reported on stderr and trips an assertion;
+ * if assertions are compiled out it is skipped.
+ *
+ * The output goes straight to stdout instead of through a fixed-size
+ * scratch buffer, so an expanded word cannot overrun anything.
+ */
+static void printWord( char* wordBuffer ) {
+    unsigned char ch;
+
+    while ( (ch = (unsigned char)*wordBuffer++) != '\0' ) {
+        if ( ch >= 0x20 ) {
+            fputc( ch, stdout );
+        } else {
+            const char* str = "";
+            switch ( ch ) {
+            case 1:
+                str = "CH";
+                break;
+            case 2:
+                str = "LL";
+                break;
+            case 3:
+                str = "RR";
+                break;
+            default:
+                fprintf( stderr, "Got %d\n", ch );
+                assert( 0 );
+            }
+            fputs( str, stdout );
+        }
+    }
+    fputc( '\n', stdout );
+} // printWord
--- a/xwords4/xwords4/dawg/swap.c
+++ b/xwords4/xwords4/dawg/swap.c
@ -0,0 +1,9 @@
+
+/*  #ifdef BIG_ENDIAN */
+/*  unsigned short swap_short(unsigned short s) { return s; } */
+/*  unsigned long swap_long(unsigned long l ) { return l; } */
+
+/*  #else */
+
+
+/*  #endif */
--- a/xwords4/xwords4/dawg/swap.h
+++ b/xwords4/xwords4/dawg/swap.h
@ -0,0 +1,35 @@
+/* 
+ * Copyright 1997 by Eric House (fixin@peak.org).  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation; either version 2
+ * of the License, or (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+ */
+ 
+#ifndef _SWAP_H_
+#define _SWAP_H_
+
+/* Convert 16- and 32-bit values between the big-endian order used in the
+ * files and host order.
+ * NOTE(review): this header includes nothing that defines BYTE_ORDER or
+ * LITTLE_ENDIAN.  If neither is defined where it is included, both sides of
+ * the test evaluate to 0 and the swapping versions are chosen -- confirm
+ * that includers on big-endian hosts define them first.
+ */
+#if BYTE_ORDER == LITTLE_ENDIAN
+/* Exchange the two low bytes of s. */
+static unsigned short swap_short( unsigned short s ) { 
+    return (unsigned short)( ((s >> 8) & 0x00FF) | ((s & 0x00FF) << 8) );
+}
+
+/* Reverse the four low bytes of l.  Every term is masked so the result
+ * always fits in 32 bits, even where unsigned long is wider than that;
+ * unmasked shifts would let bits spill above bit 31 there. */
+static unsigned long swap_long( unsigned long l ) { 
+    return ((l >> 24) & 0x000000FFUL)
+        | ((l >> 8) & 0x0000FF00UL)
+        | ((l << 8) & 0x00FF0000UL)
+        | ((l << 24) & 0xFF000000UL);
+}
+#else
+# define swap_short(s) (s)
+# define swap_long(l) (l)
+#endif
+
+#endif /* _SWAP_H_ */
--- a/xwords4/xwords4/dawg/xloc.c
+++ b/xwords4/xwords4/dawg/xloc.c
@ -0,0 +1,673 @@
+// -*-mode: C; fill-column: 80; compile-command: "make xloc"; -*-
+/* 
+ * Copyright 1998 - 2002 by Eric House (fixin@peak.org).  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation; either version 2
+ * of the License, or (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+ */
+ 
+/* This is where the language tile tables live.  There's one for each
+ * supported language.  Tile tables give the face of each tile (e.g. "A")
+ * the value (1), and the number in the game (8).
+ *
+ * This program generates two output files, a text file which has each
+ * face on a separate line: "\0\nA\nB\n..." (where the \0 will later
+ * be mapped to BLANK), and a binary file giving the values and counts
+ * of those tiles in table form *and* additional data for any tiles with
+ * non-printing faces mapping them to alternative printing values (e.g. "_"
+ * for BLANK) and (optionally) to custom pilot bitmaps for representation
+ * on-screen.
+ *
+ * This program comes after I've attempted to do something simpler with
+ * shell scripts in makefiles.  There are too many problems with the null
+ * and sub-0x20 bytes for the non-printing characters' faces.  Thus for now
+ * rather than pass in tables I'll just maintain one for each language here.
+ */
+
+/* Here's the old comment:
+ * Build a resource for Crosswords representing the letters in the
+ * game, and the number and value of each letter.  The arrays for
+ * each language for which a version of Crosswords exists are also
+ * stored in this file.
+ *
+ * This resource is meant to replace the gInitialLetterCounts and
+ * gTileValues arrays as well as to provide indirection aiding in
+ * localization
+ *
+ * In order to keep the size of an in-memory game down, letters are
+ * stored in five bits (and in null-terminated strings) so we have a
+ * range of 31 values available.  Each will then be an index into a
+ * table built here.  This extra level of abstraction permits
+ * non-contiguous ranges of characters as, for instance, is required
+ * by the German characters having umlauts.  Note, however, that a
+ * language requiring *more* than 31 characters (including 1 for each
+ * blank) will require some redesign.
+ *
+ * An additional problem is created by the need to convert letters
+ * from lower case to upper on input to the blank-setting dialog as a
+ * courtesy to players (already present in the shipping version,
+ * alas).  For now I'll simply search the array of printing values (col.
+ * 2 below) and if I fail to find it try various transformations the first
+ * of which will be to upper-case a value in the a-z range 
+ *
+ * The arrays below consist of three columns each:
+ *  ASCII value        numTilesThatValue            tileValue
+ * The latter two are compressed into one byte, four bits each, limiting
+ * each to the range 1..16.  (Actually, I ought to confirm that the code
+ * required to deal with shifting and masking isn't bigger than the extra
+ * <= 31 bytes I'm saving.... so skip the compression for now.)
+ *
+ */
+
+#include <assert.h>
+#include <limits.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <unistd.h>
+
+#include "xwcommon3.h"
+//#include "../../../../xwcommon3.h"
+
+/* MASH lays out the two numeric fields of a tile-table row.  The disabled
+ * variant packed both into a single byte (first argument in the high four
+ * bits); the active one emits them as two separate array elements. */
+//#define MASH(a,b) ((a)<<4)|(b)
+#define MASH(a,b) (a),(b)
+
+/* Return in with its two bytes exchanged.  The swap is unconditional: it is
+ * applied whatever the byte order of the host.
+ *
+ * The work is done on an unsigned copy so that a negative argument is never
+ * left-shifted as a signed value, which C leaves undefined. */
+static short endian_short( short in ) {
+    unsigned short bits = (unsigned short)in;
+    unsigned short swapped = (unsigned short)( (bits >> 8) | (bits << 8) );
+    return (short)swapped;
+}
+
+/* Write msg verbatim to stderr and terminate the process with exit status 1.
+ *
+ * msg is emitted with fputs() rather than being used as a printf format
+ * string, so a '%' inside the message can never be interpreted as a
+ * conversion specifier. */
+void errexit( char* msg ) {
+    fputs( msg, stderr );
+    exit(1);
+}
+
+/* Return the length in bytes of the file named fileName, logging progress to
+ * stdout.
+ *
+ * Exits through errexit() when the file cannot be opened or measured, or
+ * when its length does not fit in the short return type (previously such a
+ * length was silently truncated). */
+static short fileSize( char* fileName ) {
+    long length;
+    short result;
+    FILE* f = fopen( fileName, "rb" );
+
+    printf( "opening %s\n", fileName );
+    if ( f == NULL ) {
+        errexit( "fopen failed\n" );
+    }
+    if ( fseek( f, 0L, SEEK_END ) != 0 ) {
+        errexit( "error from fseek" );
+    }
+    length = ftell( f );        /* keep the full long until range-checked */
+    fclose( f );
+
+    if ( length < 0 ) {
+        errexit( "error from ftell\n" );
+    }
+    if ( length > SHRT_MAX ) {
+        errexit( "file too large\n" );
+    }
+
+    result = (short)length;
+    printf( "length of file %s is %d\n", fileName, result );
+    return result;
+}
+
+#if 0
+Graham writes:
+> PORTUGUESE            
+>
+>
+> Letter        Distribution    Face value
+>
+> A     12      1
+> B     2       3
+> C     4       3
+> CH    1       5
+> D     5       2
+> E     12      1
+> F     1       4
+> G     2       2
+> H     2       4
+> I     6       1
+> J     1       8
+> (K)   0       
+> L     4       1
+> LL    1       8
+> M     2       3
+> N     5       1
+> N tilde       1       8
+> O     9       1
+> P     2       3
+> Q     1       5
+> R     5       1
+> RR    1       8
+> S     6       1
+> T     4       1
+> U     5       1
+> V     1       4
+> (W)   0       
+> X     1       8
+> Y     1       4
+> Z     1       10
+> BLANK 2       0
+>
+> Total 100     
+
+> GREEK         
+>
+> Letter        Distribution    Face value
+>
+> alpha 12      1
+> beta  1       8
+> gamma 2       4
+> delta 2       4       
+> epsilon       8       1       
+> zeta  1       10      
+> eta   7       1       
+> theta 1       10      
+> iota  8       1       
+> kappa 4       2       
+> lambda        3       3       
+> mu    3       3       
+> nu    6       1        
+> xi    1       10      
+> omicron       9       1       
+> pi    4       2       
+> rho   5       2       
+> sigma 7       1       
+> tau   8       1       
+> upsilon       4       2
+> phi   1       8
+> chi   1       8
+> psi   1       10
+> omega 3       3
+> blank 2       0
+>
+> Total 104
+
+
+#endif
+ 
+/* Finnish tile data, not yet converted into table rows, so the array has no
+ * elements.  NOTE(review): an empty initializer list is a compiler extension
+ * in older C dialects -- confirm the build compiler accepts it.
+ *
+ * Raw data from yarik@avalon.merikoski.fi (the letter column of the last
+ * rows looks garbled; the trailing remarks say what was meant):
+ *
+ *   amount  points  letter
+ *     10       1      A
+ *      1       8      B
+ *      1      10      C
+ *      1       7      D
+ *      8       1      E
+ *      1       8      F
+ *      1       8      G
+ *      2       4      H
+ *     10       1      I
+ *      2       4      J
+ *      5       2      K
+ *      5       2      L
+ *      3       3      M
+ *      8       1      N
+ *      5       2      O
+ *      2       4      P
+ *      2       4      R
+ *      7       1      S
+ *      9       1      T
+ *      5       3      U
+ *      2       4      V
+ *      2       4      Y
+ *      5       2      D      (an A with two dots above)
+ *      1       7      V      (an O with two dots above)
+ *      2       ?      ?      (the 'wild card')
+ */
+unsigned char finnish_table[] = {
+};
+
+/* Tile set for US English (chosen with "-l en_US").  Each row holds
+ * numTiles, tileValue and the tile's face; the blank is the last row. */
+unsigned char US_english_table[] = {
+    MASH( 9,  1), 'A',
+    MASH( 2,  3), 'B',
+    MASH( 2,  3), 'C',
+    MASH( 4,  2), 'D',
+    MASH(12,  1), 'E',
+    MASH( 2,  4), 'F',
+    MASH( 3,  2), 'G',
+    MASH( 2,  4), 'H',
+    MASH( 9,  1), 'I',
+    MASH( 1,  8), 'J',
+    MASH( 1,  5), 'K',
+    MASH( 4,  1), 'L',
+    MASH( 2,  3), 'M',
+    MASH( 6,  1), 'N',
+    MASH( 8,  1), 'O',
+    MASH( 2,  3), 'P',
+    MASH( 1, 10), 'Q',
+    MASH( 6,  1), 'R',
+    MASH( 4,  1), 'S',
+    MASH( 6,  1), 'T',
+    MASH( 4,  1), 'U',
+    MASH( 2,  4), 'V',
+    MASH( 2,  4), 'W',
+    MASH( 1,  8), 'X',
+    MASH( 2,  4), 'Y',
+    MASH( 1, 10), 'Z',
+
+    MASH( 2,  0), BLANK_FACE,   /* the blank */
+}; // US_english_table
+
+/* Tile set for Norwegian (chosen with "-l no_NO").  Each row holds numTiles,
+ * tileValue and the tile's face; the blank is the first row.
+ *
+ * The three non-ASCII faces are given as numeric Latin-1 codes, the way
+ * german_table does, so each face stays a single byte whatever encoding this
+ * source file is saved in (a multi-byte character literal would not fit in
+ * an unsigned char). */
+unsigned char norwegian_table[] = {
+    MASH( 2,  0), BLANK_FACE,   /* the blank */
+    MASH( 7,  1), 'A',
+    MASH( 3,  4), 'B',
+    MASH( 1, 10), 'C',
+    MASH( 5,  1), 'D',
+    MASH( 9,  1), 'E',
+    MASH( 4,  2), 'F',
+    MASH( 4,  2), 'G',
+    MASH( 3,  3), 'H',
+    MASH( 5,  1), 'I',
+    MASH( 2,  4), 'J',
+    MASH( 4,  2), 'K',
+    MASH( 5,  1), 'L',
+    MASH( 3,  2), 'M',
+    MASH( 6,  1), 'N',
+    MASH( 4,  2), 'O',
+    MASH( 2,  4), 'P',
+    MASH( 6,  1), 'R',
+    MASH( 6,  1), 'S',
+    MASH( 6,  1), 'T',
+    MASH( 3,  4), 'U',
+    MASH( 3,  4), 'V',
+    MASH( 1,  8), 'W',
+    MASH( 1,  6), 'Y',
+    MASH( 1,  6), 198,          /* AE ligature */
+    MASH( 2,  5), 216,          /* O with stroke */
+    MASH( 2,  4), 197,          /* A with ring above */
+};
+
+/* Tile set for Swedish (chosen with "-l sv_SE").  Each row holds numTiles,
+ * tileValue and the tile's face; the blank is the first row.
+ *
+ * The three non-ASCII faces are given as numeric Latin-1 codes, the way
+ * german_table does, so each face stays a single byte whatever encoding this
+ * source file is saved in (a multi-byte character literal would not fit in
+ * an unsigned char). */
+unsigned char swedish_table[] = {
+    MASH( 2,  0), BLANK_FACE,   /* the blank */
+    MASH( 8,  1), 'A',
+    MASH( 2,  4), 197,          /* A with ring above */
+    MASH( 2,  3), 196,          /* A with two dots */
+    MASH( 2,  4), 'B',
+    MASH( 1, 10), 'C',
+    MASH( 5,  1), 'D',
+    MASH( 7,  1), 'E',          /* original note: "15's the max...." */
+    MASH( 2,  3), 'F',
+    MASH( 3,  2), 'G',
+    MASH( 2,  2), 'H',
+    MASH( 5,  1), 'I',
+    MASH( 1,  7), 'J',
+    MASH( 3,  2), 'K',
+    MASH( 5,  1), 'L',
+    MASH( 3,  2), 'M',
+    MASH( 6,  1), 'N',
+    MASH( 5,  2), 'O',
+    MASH( 2,  4), 214,          /* O with two dots */
+    MASH( 2,  4), 'P',
+    MASH( 8,  1), 'R',
+    MASH( 8,  1), 'S',
+    MASH( 8,  1), 'T',
+    MASH( 3,  4), 'U',
+    MASH( 2,  3), 'V',
+    MASH( 1,  8), 'X',
+    MASH( 1,  7), 'Y',
+    MASH( 1,  8), 'Z',
+}; // swedish_table
+
+/* Tile set for Polish (chosen with "-l pl_PL").  Each row holds numTiles,
+ * tileValue and the tile's face.  There is no blank row: the table already
+ * has 32 entries.
+ *
+ * The accented faces are given as numeric byte codes, the way german_table
+ * does, so each face stays a single byte whatever encoding this source file
+ * is saved in.  The letter names in the comments assume the bytes are
+ * ISO-8859-2 -- TODO confirm against the Polish dictionary's encoding. */
+unsigned char polish_table[] = {
+    MASH( 8,  1), 'A',
+    MASH( 1,  5), 161,          /* 0xA1: A with ogonek */
+    MASH( 2,  3), 'B',
+    MASH( 3,  2), 'C',
+    MASH( 1,  6), 198,          /* 0xC6: C with acute */
+    MASH( 3,  2), 'D',
+    MASH( 7,  1), 'E',
+    MASH( 1,  5), 202,          /* 0xCA: E with ogonek */
+    MASH( 2,  4), 'F',
+    MASH( 2,  3), 'G',
+    MASH( 2,  3), 'H',
+    MASH( 8,  1), 'I',
+    MASH( 2,  3), 'J',
+    MASH( 3,  2), 'K',
+    MASH( 3,  2), 'L',
+    MASH( 2,  3), 163,          /* 0xA3: L with stroke */
+    MASH( 3,  2), 'M',
+    MASH( 5,  1), 'N',
+    MASH( 1,  7), 209,          /* 0xD1: N with acute */
+    MASH( 6,  1), 'O',
+    MASH( 1,  5), 211,          /* 0xD3: O with acute */
+    MASH( 3,  2), 'P',
+    MASH( 4,  1), 'R',
+    MASH( 4,  1), 'S',
+    MASH( 1,  5), 166,          /* 0xA6: S with acute */
+    MASH( 3,  2), 'T',
+    MASH( 2,  3), 'U',
+    MASH( 4,  1), 'W',
+    MASH( 4,  2), 'Y',
+    MASH( 5,  1), 'Z',
+    MASH( 1,  7), 172,          /* 0xAC: Z with acute */
+    MASH( 1,  5), 175,          /* 0xAF: Z with dot above */
+}; // polish_table
+
+/* Tile set for French (chosen with "-l fr_FR").  Each row holds numTiles,
+ * tileValue and the tile's face; the blank is the first row. */
+unsigned char french_table[] = {
+    MASH( 2,  0), BLANK_FACE,   /* the blank */
+    MASH( 9,  1), 'A',
+    MASH( 2,  3), 'B',
+    MASH( 2,  3), 'C',
+    MASH( 3,  2), 'D',
+    MASH(15,  1), 'E',
+    MASH( 2,  4), 'F',
+    MASH( 2,  2), 'G',
+    MASH( 2,  4), 'H',
+    MASH( 8,  1), 'I',
+    MASH( 1,  8), 'J',
+    MASH( 1, 10), 'K',
+    MASH( 5,  1), 'L',
+    MASH( 3,  2), 'M',
+    MASH( 6,  1), 'N',
+    MASH( 6,  1), 'O',
+    MASH( 2,  3), 'P',
+    MASH( 1,  8), 'Q',
+    MASH( 6,  1), 'R',
+    MASH( 6,  1), 'S',
+    MASH( 6,  1), 'T',
+    MASH( 6,  1), 'U',
+    MASH( 2,  4), 'V',
+    MASH( 1, 10), 'W',
+    MASH( 1, 10), 'X',
+    MASH( 1, 10), 'Y',
+    MASH( 1, 10), 'Z',
+}; // french_table
+
+/* Tile set for German (chosen with "-l de_DE").  Each row holds numTiles,
+ * tileValue and the tile's face; the blank is the first row.  The umlauted
+ * vowels are written as numeric codes rather than character literals. */
+unsigned char german_table[] = {
+    MASH( 2,  0), BLANK_FACE,   /* the blank */
+    MASH( 5,  1), 'A',
+    MASH( 1,  6), 196,          /* A with umlaut */
+    MASH( 2,  3), 'B',
+    MASH( 2,  4), 'C',
+    MASH( 4,  1), 'D',
+    MASH(15,  1), 'E',
+    MASH( 2,  4), 'F',
+    MASH( 3,  2), 'G',
+    MASH( 4,  2), 'H',
+    MASH( 6,  1), 'I',
+    MASH( 1,  6), 'J',
+    MASH( 2,  4), 'K',
+    MASH( 3,  2), 'L',
+    MASH( 4,  3), 'M',
+    MASH( 9,  1), 'N',
+    MASH( 3,  2), 'O',
+    MASH( 1,  8), 214,          /* O with umlaut */
+    MASH( 1,  4), 'P',
+    MASH( 1, 10), 'Q',
+    MASH( 6,  1), 'R',
+    MASH( 7,  1), 'S',
+    MASH( 6,  1), 'T',
+    MASH( 6,  1), 'U',
+    MASH( 1,  6), 220,          /* U with umlaut */
+    MASH( 1,  6), 'V',
+    MASH( 1,  3), 'W',
+    MASH( 1,  8), 'X',
+    MASH( 1, 10), 'Y',
+    MASH( 1,  3), 'Z',
+}; // german_table
+
+/* Tile set for Dutch (chosen with "-l nl_NL").  Each row holds numTiles,
+ * tileValue and the tile's face; the blank is the first row. */
+unsigned char dutch_table[] = {
+    MASH( 2,  0), BLANK_FACE,   /* the blank */
+    MASH( 6,  1), 'A',
+    MASH( 2,  3), 'B',
+    MASH( 2,  5), 'C',
+    MASH( 5,  2), 'D',
+    MASH(16,  1), 'E',
+    MASH( 2,  4), 'F',
+    MASH( 2,  3), 'G',
+    MASH( 2,  4), 'H',
+    MASH( 4,  1), 'I',
+    MASH( 2,  4), 'J',
+    MASH( 3,  3), 'K',
+    MASH( 3,  3), 'L',
+    MASH( 3,  3), 'M',
+    MASH( 8,  1), 'N',
+    MASH( 6,  1), 'O',
+    MASH( 3,  3), 'P',
+    MASH( 1, 10), 'Q',
+    MASH( 5,  2), 'R',
+    MASH( 5,  2), 'S',
+    MASH( 5,  2), 'T',
+    MASH( 4,  4), 'U',
+    MASH( 4,  2), 'V',
+    MASH( 2,  5), 'W',
+    MASH( 1,  8), 'X',
+    MASH( 2,  4), 'Y',
+    MASH( 2,  4), 'Z',
+}; // dutch_table
+
+/* Tile set for Italian (chosen with "-l it_IT").  Each row holds numTiles,
+ * tileValue and the tile's face; the blank is the first row.  The table has
+ * no rows for J, K, W, X or Y. */
+unsigned char italian_table[] = {
+    MASH( 2,  0), BLANK_FACE,   /* the blank */
+    MASH(13,  1), 'A',
+    MASH( 3,  5), 'B',
+    MASH( 4,  4), 'C',
+    MASH( 3,  5), 'D',
+    MASH(13,  1), 'E',
+    MASH( 2,  8), 'F',
+    MASH( 2,  5), 'G',
+    MASH( 2,  8), 'H',
+    MASH(13,  1), 'I',
+    MASH( 5,  3), 'L',
+    MASH( 5,  3), 'M',
+    MASH( 6,  2), 'N',
+    MASH(13,  1), 'O',
+    MASH( 3,  5), 'P',
+    MASH( 1, 10), 'Q',
+    MASH( 6,  2), 'R',
+    MASH( 6,  2), 'S',
+    MASH( 6,  2), 'T',
+    MASH( 5,  3), 'U',
+    MASH( 4,  4), 'V',
+    MASH( 2,  8), 'Z',
+}; // italian_table
+
+/* Tile set for Spanish (chosen with "-l es_ES").  Each row holds numTiles,
+ * tileValue and the tile's face.  Faces 1, 2 and 3 are not character codes:
+ * they stand for the two-letter tiles CH, LL and RR.  209 is N with tilde.
+ * The blank is the last row. */
+unsigned char spanish_table[] = {
+    MASH(12,  1), 'A',
+    MASH( 2,  3), 'B',
+    MASH( 4,  3), 'C',
+    MASH( 1,  5), 1,            /* 'CH' */
+    MASH( 5,  2), 'D',
+    MASH(12,  1), 'E',
+    MASH( 1,  4), 'F',
+    MASH( 2,  2), 'G',
+    MASH( 2,  4), 'H',
+    MASH( 6,  1), 'I',
+    MASH( 1,  8), 'J',
+    MASH( 4,  1), 'L',
+    MASH( 1,  8), 2,            /* 'LL' */
+    MASH( 2,  3), 'M',
+    MASH( 5,  1), 'N',
+    MASH( 1,  8), 209,          /* 'N~' */
+    MASH( 9,  1), 'O',
+    MASH( 2,  3), 'P',
+    MASH( 1,  5), 'Q',
+    MASH( 5,  1), 'R',
+    MASH( 1,  8), 3,            /* 'RR' */
+    MASH( 6,  1), 'S',
+    MASH( 4,  1), 'T',
+    MASH( 5,  1), 'U',
+    MASH( 1,  4), 'V',
+    MASH( 1,  8), 'X',
+    MASH( 1,  4), 'Y',
+    MASH( 1, 10), 'Z',
+    MASH( 2,  0), BLANK_FACE,   /* the blank */
+}; // spanish_table
+
+/* Test tile set (chosen with "-l hex") holding only the faces A-F.  The blank
+ * is deliberately the last row, which violates the assumption made in some
+ * places that the blank is tile 0.  Each row holds numTiles, tileValue and
+ * the tile's face. */
+unsigned char hex_table[] = {
+    MASH( 9,  1), 'A',
+    MASH( 2,  3), 'B',
+    MASH( 2,  3), 'C',
+    MASH( 4,  2), 'D',
+    MASH(12,  1), 'E',
+    MASH( 2,  4), 'F',
+    MASH( 4,  0), BLANK_FACE,   /* the blank */
+}; // hex_table
+
+/* Minimal three-tile set (chosen with "-l test") with no blank.  Each row
+ * holds numTiles, tileValue and the tile's face. */
+unsigned char test_table[] = {
+    MASH( 1,  1), 'A',
+    MASH( 1,  5), 'B',
+    MASH( 1, 10), 'E',
+}; // test_table
+
+//#define NONFILEARGS 3
+#define MAXSPECIALS 20
+
+/* Entry point.  Usage: xloc -l lang_code [-O facesOutfile] [-T valuesOutfile]
+ *
+ * Looks up the tile table for lang_code and then
+ *   - if -O was given, writes the face byte of every tile to that file;
+ *   - if -T was given, writes an Xloc_header followed by the
+ *     (numTiles, tileValue) byte pair of every tile to that file.
+ *
+ * Returns 0 on success.  Exits with status 1 on a usage error, an unknown
+ * language code, or a failure to open or write an output file. */
+int main( int argc, char** argv ) {
+    /* One row per language code accepted by -l.  "hex" and "test" have no
+     * code of their own, so they are tagged HOMEBREW; previously their
+     * header byte was left uninitialised. */
+    static const struct {
+        const char* code;
+        unsigned char* table;
+        short length;
+        unsigned char langCode;
+    } langs[] = {
+        { "en_US", US_english_table, sizeof(US_english_table), US_ENGLISH },
+        { "sv_SE", swedish_table, sizeof(swedish_table), SWEDISH_SWEDISH },
+        { "no_NO", norwegian_table, sizeof(norwegian_table),
+          NORWEGIAN_NORWEGIAN },
+        { "pl_PL", polish_table, sizeof(polish_table), POLISH_POLISH },
+        { "fr_FR", french_table, sizeof(french_table), FRENCH_FRENCH },
+        { "de_DE", german_table, sizeof(german_table), GERMAN_GERMAN },
+        { "nl_NL", dutch_table, sizeof(dutch_table), DUTCH_DUTCH },
+        { "it_IT", italian_table, sizeof(italian_table), ITALIAN_ITALIAN },
+        { "es_ES", spanish_table, sizeof(spanish_table), SPANISH_SPANISH },
+        { "hex", hex_table, sizeof(hex_table), HOMEBREW },
+        { "test", test_table, sizeof(test_table), HOMEBREW },
+    };
+    static const short nLangs = (short)(sizeof(langs) / sizeof(langs[0]));
+    static char usage[] = "Usage: xloc -l lang_code "
+                          "-O tableOutfile -T valCountOutfile\n";
+
+    char* lang = NULL;
+    char* facesFileName = NULL;
+    char* binaryFileName = NULL;
+
+    FILE* facesFile;
+    FILE* binFile;
+    Xloc_header header;
+    unsigned char* table;
+    short tableLength;
+    short i;
+    int got;
+
+    /* getopt() signals the end of the options with -1 */
+    while ( (got = getopt(argc, argv, "l:O:T:h")) != -1 ) {
+        switch ( got ) {
+        case 'l':
+            lang = optarg;
+            break;
+        case 'O':
+            facesFileName = optarg;
+            break;
+        case 'T':
+            binaryFileName = optarg;
+            break;
+        case 'h':
+        default:
+            errexit( usage );
+        }
+    }
+
+    /* -l is mandatory: without it there is no table to write, and lang
+     * would be passed to strcmp() and "%s" as a NULL pointer. */
+    if ( lang == NULL ) {
+        errexit( usage );
+    }
+
+    fprintf( stderr, "binoutfile = %s\n",
+             binaryFileName?binaryFileName:"null" );
+    fprintf( stderr, "facesFileName = %s\n",
+             facesFileName?facesFileName:"null" );
+    fprintf( stderr, "lang = %s\n", lang );
+
+    for ( i = 0; i < nLangs; ++i ) {
+        if ( strcmp( lang, langs[i].code ) == 0 ) {
+            break;
+        }
+    }
+    if ( i == nLangs ) {
+        fprintf( stderr, "unknown language code %s\n", lang );
+        exit(1);
+    }
+
+    table = langs[i].table;
+    tableLength = langs[i].length;
+
+    header.padding = 0;
+    header.langCodeFlags = langs[i].langCode;
+    /* as before, every table written by this tool gets the high bit set */
+    header.langCodeFlags |= 1<<XLOC_LANG_OFFSET;
+
+    ////////////////////////////////////////////////////
+    // first the char table file
+    ////////////////////////////////////////////////////
+    if ( facesFileName != NULL ) {
+        /* binary mode: faces include '\0' and bytes above 0x7F */
+        facesFile = fopen( facesFileName, "wb" );
+        if ( facesFile == NULL ) {
+            fprintf( stderr, "unable to open %s for writing\n",
+                     facesFileName );
+            exit(1);
+        }
+        assert( tableLength > 0 );
+
+        /* the face is the third byte of every row */
+        for ( i = 0; i < tableLength; i += BYTES_PER_LETTER ) {
+            fputc( table[i+2], facesFile );
+        }
+
+        if ( fclose( facesFile ) != 0 ) {
+            errexit( "error writing faces file\n" );
+        }
+    }
+
+    ////////////////////////////////////////////////////
+    // now the binary file
+    ////////////////////////////////////////////////////
+    if ( binaryFileName != NULL ) {
+        binFile = fopen( binaryFileName, "wb" );
+        if ( binFile == NULL ) {
+            fprintf( stderr, "unable to open %s for writing\n",
+                     binaryFileName );
+            exit(1);
+        }
+
+        fwrite( &header, sizeof(header), 1, binFile );
+
+        /* write the first two bytes (numTiles, tileValue) of every row;
+         * the face byte goes only to the faces file */
+        for ( i = 0; i < tableLength; i += BYTES_PER_LETTER ) {
+            fwrite( &table[i], 1, BYTES_PER_LETTER - 1, binFile );
+        }
+
+        /* Not implemented yet (placeholders kept from the original):
+         * record file sizes, write data with file size included, and
+         * append the files themselves. */
+
+        if ( fclose( binFile ) != 0 ) {
+            errexit( "error writing binary file\n" );
+        }
+    }
+    return 0;
+} // main
--- a/xwords4/xwords4/dawg/xloc.pl
+++ b/xwords4/xwords4/dawg/xloc.pl
@ -0,0 +1,42 @@
+#!/usr/bin/perl
+
+# Copyright 2002 by Eric House (fixin@peak.org).  All rights reserved.
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+# test and wrapper file for xloc.pm
+
+use strict;
+use xloc;
+
+# Command-line wrapper around xloc.pm.
+#
+#   xloc.pl -t  <lang_dir>   write the face map, one byte per tile
+#   xloc.pl -tn <lang_dir>   write the face map, 16 bits per tile
+#   xloc.pl -v  <lang_dir>   write the header and per-tile values file
+#
+# The tile description is read from ./<lang_dir>/info.txt and the result is
+# written to STDOUT.
+
+# Map each accepted mode switch to the routine producing that output.
+my %modes = (
+    "-t"  => sub { xloc::WriteMapFile( $_[0], 0, \*STDOUT ) },
+    "-tn" => sub { xloc::WriteMapFile( $_[0], 1, \*STDOUT ) },
+    "-v"  => sub { xloc::WriteValuesFile( $_[0], \*STDOUT ) },
+);
+
+my $usage = "usage: $0 -t|-tn|-v lang_dir\n";
+
+my $arg = shift(@ARGV);
+my $lang = shift(@ARGV);
+
+# A missing argument or an unknown switch used to produce empty output and a
+# successful exit status; fail loudly instead.
+die $usage if !defined($arg) || !defined($lang) || !exists($modes{$arg});
+
+my $path = "./$lang";
+my $infoFile = "$path/info.txt";
+
+die "info file $infoFile not found\n" if ! -s $infoFile;
+
+# The output is packed binary data, so keep any I/O layer from altering it.
+binmode( STDOUT );
+
+my $xlocToken = xloc::ParseTileInfo($infoFile);
+$modes{$arg}->( $xlocToken );
--- a/xwords4/xwords4/dawg/xloc.pm
+++ b/xwords4/xwords4/dawg/xloc.pm
@ -0,0 +1,180 @@
+#!/usr/bin/perl
+
+# Copyright 2002 by Eric House (fixin@peak.org).  All rights reserved.
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+# The idea here is that all that matters about a language is stored in
+# one file (possibly excepting rules for prepping a dictionary).
+# There's a list of tile faces, counts and values, and also some
+# name-value pairs as needed.  The pairs come first, and then a list
+# of tiles.
+
+package xloc;
+
+use strict;
+use warnings;
+
+# Module bookkeeping: the version number and the Exporter configuration,
+# i.e. the list of subs exported by default.
+BEGIN {
+    use Exporter ();
+    our ( $VERSION, @ISA, @EXPORT, @EXPORT_OK, %EXPORT_TAGS );
+
+    $VERSION = 1.00;
+    @ISA = ( 'Exporter' );
+    @EXPORT = (
+        '&ParseTileInfo', '&GetNTiles', '&TileFace', '&TileValue',
+        '&TileCount', '&GetValue', '&WriteMapFile', '&WriteValuesFile',
+    );
+    %EXPORT_TAGS = ();
+}
+
+# Parse the language description file at $filePath.
+#
+# Returns a reference to a hash that callers are meant to treat as opaque
+# and pass back to the query functions.  It holds the file's name:value
+# pairs plus a "_TILES" entry: a reference to a list with one
+# [ count, value, face ] list per tile line, in file order.
+#
+# File format: '#' starts a comment and blank lines are ignored.  Lines
+# containing "name:" before <BEGIN_TILES> become name:value pairs (a
+# repeated name has its values concatenated).  Lines between <BEGIN_TILES>
+# and <END_TILES> are tiles: two words followed by the face text.
+#
+# Dies if the file cannot be opened or if a tile line is malformed.
+sub ParseTileInfo($) {
+    my ( $filePath ) = @_;
+    my %result;
+    my @tiles;
+    my $inTiles = 0;
+
+    # three-argument open on a lexical handle: the path is never
+    # interpreted as a mode, and no global handle or $_ is clobbered
+    open( my $input, '<', $filePath )
+        or die "couldn't open $filePath: $!";
+
+    while ( my $line = <$input> ) {
+        chomp $line;
+        $line =~ s/\#.*$//;             # strip comments
+        next if $line =~ /^\s*$/;       # skip all-white-space lines
+
+        if ( $inTiles ) {
+            last if $line =~ /<END_TILES>/;
+
+            # a line that doesn't parse used to be stored as a tile of
+            # three undefs; report it instead
+            my ( $count, $val, $face ) =
+                $line =~ m/^\s*(\w+)\s+(\w+)\s+(.*)\s*$/
+                or die "$filePath line $.: malformed tile entry: $line\n";
+            push @tiles, [ $count, $val, $face ];
+        } elsif ( $line =~ /\w:/ ) {
+            my ( $nam, $val ) = split ':', $line, 2;
+            $result{$nam} .= $val;
+        } elsif ( $line =~ /<BEGIN_TILES>/ ) {
+            $inTiles = 1;
+        }
+    }
+
+    close $input;
+
+    $result{"_TILES"} = [ @tiles ];
+
+    return \%result;
+}
+
+# Return the number of entries in the "_TILES" list of the hash referenced
+# by the argument.
+sub GetNTiles($) {
+    my $hashR = shift;
+
+    return scalar @{ $hashR->{"_TILES"} };
+}
+
+# Return the value stored under $name in the hash referenced by $hashR
+# (undef when there is none).
+sub GetValue($$) {
+    my $hashR = shift;
+    my $name = shift;
+
+    return $hashR->{$name};
+}
+
+# Write one packed code per tile to the filehandle $fhr, in tile order.
+#
+#   $hashR    the object returned by ParseTileInfo
+#   $unicode  true: pack each code as a 16-bit big-endian value ("n");
+#             false: pack each code as one unsigned byte ("C")
+#   $fhr      output filehandle
+#
+# The code written depends on the form of the tile's face text:
+#   'x'   (single-quoted character)  the character's ordinal
+#   "xx"  (double-quoted string)     a running index starting at 0, one per
+#                                    such tile
+#   123   (decimal number)           that number
+# Dies on any other face text.
+sub WriteMapFile($$$) {
+    my ( $hashR, $unicode, $fhr ) = @_;
+
+    my $packStr = $unicode ? "n" : "C";
+
+    my $count = GetNTiles($hashR);
+    my $specialCount = 0;
+    for ( my $i = 0; $i < $count; ++$i ) {
+        my $tileR = GetNthTile( $hashR, $i );
+        my $str = ${$tileR}[2];
+
+        if ( $str =~ /\'(.)\'/ ) {
+            print $fhr pack($packStr, ord($1) );
+        } elsif ( $str =~ /\"(.+)\"/ ) {
+            print $fhr pack($packStr, $specialCount++ );
+        } elsif ( $str =~ /(\d+)/ ) {
+            # pack wants the number itself.  The original passed chr($1), a
+            # one-character string, which pack read as a number: 0 for
+            # anything that is not a digit character.
+            print $fhr pack( $packStr, $1 );
+        } else {
+            die "WriteMapFile: unrecognized face format $str";
+        }
+    }
+} # WriteMapFile
+
+# Write the values file to the filehandle $fhr: the XLOC_HEADER value of
+# $hashR (read as hex) packed as a 16-bit big-endian number, then for every
+# tile two signed bytes -- TileValue() of the tile followed by TileCount().
+# The header value is also echoed to STDERR.  Dies if the hash has no true
+# XLOC_HEADER value.
+sub WriteValuesFile($$) {
+    my ( $hashR, $fhr ) = @_;
+
+    my $header = GetValue( $hashR,"XLOC_HEADER" );
+    die "no XLOC_HEADER found" if ! $header;
+
+    print STDERR "header is $header\n";
+
+    print $fhr pack( "n", hex($header) );
+
+    foreach my $i ( 0 .. GetNTiles($hashR) - 1 ) {
+        my $tileR = GetNthTile( $hashR, $i );
+
+        print $fhr pack( "cc", TileValue($tileR), TileCount($tileR) );
+    }
+
+} # WriteValuesFile
+
+# Return element $n (0-based) of the "_TILES" list of the hash referenced by
+# $hashR; each element is a reference to one tile's list.
+sub GetNthTile($$) {
+    my $hashR = shift;
+    my $n = shift;
+
+    return $hashR->{"_TILES"}->[$n];
+}
+
+# Return the face of a tile as a string, decoded from the third element of
+# the tile list: the character inside single quotes, the text inside double
+# quotes, or chr() of a decimal number.  Dies on any other text.
+sub TileFace($) {
+    my ( $tileR ) = @_;
+
+    my $str = $tileR->[2];
+
+    return $1      if $str =~ /\'(.)\'/;
+    return $1      if $str =~ /\"(.+)\"/;
+    return chr($1) if $str =~ /(\d+)/;
+
+    die "TileFace: unrecognized face format: $str";
+}
+
+# Return the first element of the tile list.
+# NOTE(review): ParseTileInfo stores tiles as [ count, val, face ], so this
+# returns what the parser calls the count -- the name looks swapped with
+# TileCount.  WriteValuesFile depends on the current order; confirm before
+# changing.
+sub TileValue($) {
+    my $tileR = shift;
+
+    return $tileR->[0];
+}
+
+# Return the second element of the tile list.
+# NOTE(review): ParseTileInfo stores tiles as [ count, val, face ], so this
+# returns what the parser calls the value -- the name looks swapped with
+# TileValue.  WriteValuesFile depends on the current order; confirm before
+# changing.
+sub TileCount($) {
+    my $tileR = shift;
+
+    return $tileR->[1];
+}
+
+1;
--- a/xwords4/xwords4/dawg/xwcommon3.h
+++ b/xwords4/xwords4/dawg/xwcommon3.h
@ -0,0 +1,132 @@
+// -*-mode: C; fill-column: 80; -*-
+
+/* 
+ * Copyright 1997 by Eric House (fixin@peak.org).  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation; either version 2
+ * of the License, or (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+ */
+ 
+#ifndef __XWCOMMON__
+#define __XWCOMMON__
+
+//#include <Hardware/Hardware.h>
+// so sue me :-)
+//#include "/home/pilot/usr/local/gnu/m68k-palmos-coff/include/PalmOS2/Hardware/Hardware.h"
+
+/* BLANK is 0 and EMPTY is 32; the four bonus codes follow EMPTY
+ * consecutively (33 through 36). */
+enum {
+    BLANK = 0,
+    EMPTY = 32,
+    DOUBLE_LETTER = 33,
+    DOUBLE_WORD = 34,
+    TRIPLE_LETTER = 35,
+    TRIPLE_WORD = 36
+};
+
+/* Initializers for the four bonus patterns, four 16-bit words each.
+ * NOTE(review): the descriptions below assume each word holds two 8-pixel
+ * rows, high byte first -- confirm against the drawing code.  The original
+ * comments on PAT_DOUBLE_WORD and PAT_TRIPLE_LETTER appear to have been
+ * swapped relative to the bit patterns. */
+
+/* single-width diagonal stripe */
+#define PAT_DOUBLE_LETTER { 0x8844, 0x2211, 0x8844, 0x2211 }
+/* grey pattern (single-pixel checkerboard) */
+#define PAT_DOUBLE_WORD { 0xaa55, 0xaa55, 0xaa55, 0xaa55 }
+/* double-width diagonal stripe */
+#define PAT_TRIPLE_LETTER { 0xCC66, 0x3399, 0xCC66, 0x3399 }
+/* 2-pixel checkerboard */
+#define PAT_TRIPLE_WORD { 0xCCCC, 0x3333, 0xCCCC, 0x3333 }
+
+
+/* Four-character resource type codes. */
+#define BOARD_RES_TYPE              'Xbrd'
+#define TILES_RES_TYPE              'Xloc'
+#define STRL_RES_TYPE               'StrL'
+
+/* Resource IDs. */
+#define XW_STRL_RESOURCE_ID         1000
+// both the above resources use this ID
+#define XW_CONFIGABLE_RESOURCE_ID   1001
+
+/* Size of one row of a tile table: two numeric bytes plus the face. */
+#define BYTES_PER_LETTER            3
+
+/* Face byte used for the blank tile. */
+#define BLANK_FACE                  '\0'
+
+/* A_TILE was once 1; it is now 0. */
+#define A_TILE                      0
+
+/* Limits. */
+#define MAX_NUM_TILES               110
+#define MAX_UNIQUE_TILES            (32-A_TILE)
+#define MAX_NUM_BLANKS              4
+
+/* language header:
+ * specialCharStart simply gives the number of bytes needed to skip beyond the
+ * standard tiles table to the first of the "special" entries.
+ *
+ * langCodeFlags is more ambitious.  Each language I release will have an
+ * assigned code.  The code has at least two purposes: to prevent viewing a game
+ * with the wrong language; and to tie a language to the dictionary that can be
+ * used by the computer player.
+ *
+ * For a dictionary and language (set of tile rules) to work together, the
+ * mapping of index to character must be in sync.  In the German case, 0 must be
+ * A, 1 umlaut-A, etc.  But the number of characters and values assigned each
+ * tile do not matter.  Thus XWConfig can allow those aspects of a language to
+ * be edited.  but if a user wants to add or delete a character in an "official"
+ * language XWConfig must disallow this, forcing him instead to "clone" the
+ * language to something whose official flag will be cleared.
+ */
+
+/* Header written at the start of the binary values file: two single-byte
+ * fields. */
+typedef struct Xloc_header {
+    /* Language code and flag bits.  Kept as a plain byte because bitfields
+     * can't be used: gcc for pilot and x86 seem to generate different
+     * code.  (A specialCharStart byte that once preceded this field is
+     * disabled.) */
+    unsigned char langCodeFlags;
+
+    /* Without this byte, pointers to the shorts in Xloc_specialEntry would
+     * be odd. */
+    unsigned char padding;
+} Xloc_header;
+
+/* Layout of Xloc_header.langCodeFlags: the high bit is the "official" flag
+ * and the low seven bits hold one of the language codes below.
+ * NOTE(review): the two mask names look swapped relative to their values --
+ * XLOC_LANG_MASK selects the "official" bit and XLOC_OFFICIAL_MASK selects
+ * the language code.  Check the users of these macros before renaming. */
+#define XLOC_LANG_MASK     0x80 /* high bit is "official" */
+#define XLOC_LANG_OFFSET   7
+#define XLOC_OFFICIAL_MASK 0x7F /* rest are for the enums below */
+
+/* Language codes stored in Xloc_header.langCodeFlags. */
+enum {
+    HOMEBREW            = 0,
+    US_ENGLISH          = 1,
+    FRENCH_FRENCH       = 2,
+    GERMAN_GERMAN       = 3,
+    DUTCH_DUTCH         = 4,
+    ITALIAN_ITALIAN     = 5,
+    SPANISH_SPANISH     = 6,
+    SWEDISH_SWEDISH     = 7,
+    POLISH_POLISH       = 8,
+    NORWEGIAN_NORWEGIAN = 9
+};
+
+/* "Special chars", added to support Spanish "LL" and "RR", replace
+ * the ascii character code in the Xloc charinfo array with an integer
+ * between 1 and 0x1F which is an index into a larger array appended
+ * to the charinfo array.  Fields in the structs located in that array
+ * include the string to be used to represent the Tile when drawing in
+ * text (e.g.  formatting for the Tile values dialog) and the IDs of
+ * resources holding bitmaps to be used when drawing tiles large
+ * (tray) and small (board).
+ */
+/* One entry per "special" tile. */
+typedef struct Xloc_specialEntry {
+    /* text form of the tile; the string can be up to 3 chars long */
+    unsigned char textVersion[4];
+    short hasLarge;
+    short hasSmall;
+} Xloc_specialEntry;
+
+
+
+
+/* #define LARGE_CH_BMP_ID 2000 */
+/* #define SMALL_CH_BMP_ID 2001 */
+/* #define LARGE_LL_BMP_ID 2002 */
+/* #define SMALL_LL_BMP_ID 2003 */
+/* #define LARGE_RR_BMP_ID 2004 */
+/* #define SMALL_RR_BMP_ID 2005 */
+
+#endif