Sort with -u in the filter pipeline to get rid of duplicates, so that the sort inside dict2dawg is no longer needed

This commit is contained in:
ehouse 2006-04-30 02:35:26 +00:00
parent 8ba01c1979
commit 10792a168d

View file

@@ -21,18 +21,19 @@ LANGCODE:nl_NL
LANGFILTER_PRECLIP: tr -d '\r' |
# uppercase all
LANGFILTER_POSTCLIP: | tr [a-zäöü] [A-ZÄÖÜ]
LANGFILTER_POSTCLIP: | tr [a-z] [A-Z]
# keep only words containing at least one of A, E, I, O, U
LANGFILTER_POSTCLIP: | grep '[AEIOU]'
# keep only words made up entirely of the letters A-Z
LANGFILTER_POSTCLIP: | grep '^[A-Z]\+$'
LANGFILTER_POSTCLIP: | sort -u
LANGFILTER_POSTCLIP: | tr -s '\n' '\000'
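# Until I can figure out how to force sort to use a locale's collation
# rules we can't trust sort in the filtering rules above and so must
# leave the sorting work to dict2dawg.pl.
# NOTE(review): this looks stale now that the filter above runs
# `sort -u` and NEEDSSORT is set to false -- confirm that sort's
# ordering matches what dict2dawg.pl expects, then update this comment.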
NEEDSSORT:true
NEEDSSORT:false
LANGINFO: <p>Dutch has the same 26 letters as English, though of
LANGINFO: course the counts and values are different. Filtering rules