2011-11-14 02:06:57 +01:00
|
|
|
/* -*- compile-command: "make MEMDEBUG=TRUE -j3"; -*- */
|
2003-11-01 06:35:29 +01:00
|
|
|
/*
|
2013-06-30 17:34:09 +02:00
|
|
|
* Copyright 1997 - 2013 by Eric House (xwords@eehouse.org). All rights
|
2009-04-05 21:22:55 +02:00
|
|
|
* reserved.
|
2003-11-01 06:35:29 +01:00
|
|
|
*
|
|
|
|
* This program is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU General Public License
|
|
|
|
* as published by the Free Software Foundation; either version 2
|
|
|
|
* of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* along with this program; if not, write to the Free Software
|
|
|
|
* Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef CLIENT_ONLY /* there's an else in the middle!!! */
|
|
|
|
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <stdlib.h>
|
2011-07-16 03:24:08 +02:00
|
|
|
#include <sys/mman.h>
|
|
|
|
#include <sys/types.h>
|
|
|
|
#include <sys/stat.h>
|
|
|
|
#include <unistd.h>
|
2003-11-01 06:35:29 +01:00
|
|
|
/* #include <prc.h> */
|
|
|
|
|
|
|
|
#include "comtypes.h"
|
|
|
|
#include "dictnryp.h"
|
|
|
|
#include "linuxmain.h"
|
2006-04-30 15:58:24 +02:00
|
|
|
#include "strutils.h"
|
2013-06-29 05:33:12 +02:00
|
|
|
#include "linuxutl.h"
|
2014-03-10 03:12:21 +01:00
|
|
|
#include "dictmgr.h"
|
2003-11-01 06:35:29 +01:00
|
|
|
|
|
|
|
typedef struct DictStart {
|
|
|
|
XP_U32 numNodes;
|
|
|
|
/* XP_U32 indexStart; */
|
|
|
|
array_edge* array;
|
|
|
|
} DictStart;
|
|
|
|
|
|
|
|
typedef struct LinuxDictionaryCtxt {
|
|
|
|
DictionaryCtxt super;
|
2011-07-19 03:07:15 +02:00
|
|
|
XP_U8* dictBase;
|
|
|
|
size_t dictLength;
|
|
|
|
XP_Bool useMMap;
|
2003-11-01 06:35:29 +01:00
|
|
|
} LinuxDictionaryCtxt;
|
|
|
|
|
|
|
|
|
|
|
|
/************************ Prototypes ***********************/
|
2005-10-30 06:05:45 +01:00
|
|
|
static XP_Bool initFromDictFile( LinuxDictionaryCtxt* dctx,
|
2012-09-04 06:33:46 +02:00
|
|
|
const LaunchParams* params,
|
2005-10-30 06:05:45 +01:00
|
|
|
const char* fileName );
|
2003-11-01 06:35:29 +01:00
|
|
|
static void linux_dictionary_destroy( DictionaryCtxt* dict );
|
2006-09-24 17:35:33 +02:00
|
|
|
static const XP_UCHAR* linux_dict_getShortName( const DictionaryCtxt* dict );
|
2003-11-01 06:35:29 +01:00
|
|
|
|
|
|
|
/*****************************************************************************
|
|
|
|
*
|
|
|
|
****************************************************************************/
|
|
|
|
DictionaryCtxt*
|
2012-09-04 06:33:46 +02:00
|
|
|
linux_dictionary_make( MPFORMAL const LaunchParams* params,
|
|
|
|
const char* dictFileName, XP_Bool useMMap )
|
2003-11-01 06:35:29 +01:00
|
|
|
{
|
2014-03-11 02:58:16 +01:00
|
|
|
LinuxDictionaryCtxt* result = NULL;
|
|
|
|
if ( !!dictFileName ) {
|
2014-03-11 05:01:24 +01:00
|
|
|
/* dmgr_get increments ref count before returning! */
|
2014-03-11 02:58:16 +01:00
|
|
|
result = (LinuxDictionaryCtxt*)dmgr_get( params->dictMgr, dictFileName );
|
|
|
|
}
|
2014-03-10 03:12:21 +01:00
|
|
|
if ( !result ) {
|
|
|
|
result = (LinuxDictionaryCtxt*)XP_CALLOC(mpool, sizeof(*result));
|
|
|
|
|
|
|
|
dict_super_init( &result->super );
|
|
|
|
MPASSIGN( result->super.mpool, mpool );
|
|
|
|
|
|
|
|
result->useMMap = useMMap;
|
|
|
|
|
|
|
|
if ( !!dictFileName ) {
|
|
|
|
XP_Bool success = initFromDictFile( result, params, dictFileName );
|
|
|
|
if ( success ) {
|
|
|
|
result->super.destructor = linux_dictionary_destroy;
|
|
|
|
result->super.func_dict_getShortName = linux_dict_getShortName;
|
|
|
|
setBlankTile( &result->super );
|
|
|
|
} else {
|
|
|
|
XP_ASSERT( 0 ); /* gonna crash anyway */
|
|
|
|
XP_FREE( mpool, result );
|
|
|
|
result = NULL;
|
|
|
|
}
|
2014-03-11 02:58:16 +01:00
|
|
|
|
|
|
|
dmgr_put( params->dictMgr, dictFileName, &result->super );
|
2003-11-01 06:35:29 +01:00
|
|
|
}
|
2014-03-11 05:01:24 +01:00
|
|
|
(void)dict_ref( &result->super );
|
2003-11-01 06:35:29 +01:00
|
|
|
}
|
|
|
|
|
2014-03-11 05:01:24 +01:00
|
|
|
return &result->super;
|
2003-11-01 06:35:29 +01:00
|
|
|
} /* gtk_dictionary_make */
|
|
|
|
|
2012-09-08 16:45:18 +02:00
|
|
|
static XP_UCHAR*
|
2012-09-09 18:22:00 +02:00
|
|
|
getNullTermParam( LinuxDictionaryCtxt* XP_UNUSED_DBG(dctx), const XP_U8** ptr,
|
2012-09-08 16:45:18 +02:00
|
|
|
XP_U16* headerLen )
|
|
|
|
{
|
|
|
|
XP_U16 len = 1 + XP_STRLEN( (XP_UCHAR*)*ptr );
|
|
|
|
XP_UCHAR* result = XP_MALLOC( dctx->super.mpool, len );
|
|
|
|
XP_MEMCPY( result, *ptr, len );
|
|
|
|
*ptr += len;
|
|
|
|
*headerLen -= len;
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2003-11-01 06:35:29 +01:00
|
|
|
static XP_U16
|
|
|
|
countSpecials( LinuxDictionaryCtxt* ctxt )
|
|
|
|
{
|
|
|
|
XP_U16 result = 0;
|
2009-04-05 21:22:55 +02:00
|
|
|
XP_U16 ii;
|
2003-11-01 06:35:29 +01:00
|
|
|
|
2009-04-05 21:22:55 +02:00
|
|
|
for ( ii = 0; ii < ctxt->super.nFaces; ++ii ) {
|
2009-09-13 07:28:12 +02:00
|
|
|
if ( IS_SPECIAL(ctxt->super.facePtrs[ii][0]) ) {
|
2003-11-01 06:35:29 +01:00
|
|
|
++result;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return result;
|
|
|
|
} /* countSpecials */
|
|
|
|
|
|
|
|
static XP_Bitmap
|
2011-07-19 03:07:15 +02:00
|
|
|
skipBitmap( LinuxDictionaryCtxt* XP_UNUSED_DBG(ctxt), const XP_U8** ptrp )
|
2003-11-01 06:35:29 +01:00
|
|
|
{
|
|
|
|
XP_U8 nCols, nRows, nBytes;
|
|
|
|
LinuxBMStruct* lbs = NULL;
|
2011-07-19 03:07:15 +02:00
|
|
|
const XP_U8* ptr = *ptrp;
|
2003-11-01 06:35:29 +01:00
|
|
|
|
2011-07-19 03:07:15 +02:00
|
|
|
nCols = *ptr++;
|
|
|
|
if ( nCols > 0 ) {
|
2012-09-08 05:34:06 +02:00
|
|
|
nRows = *ptr++;
|
2003-11-01 06:35:29 +01:00
|
|
|
|
|
|
|
nBytes = ((nRows * nCols) + 7) / 8;
|
|
|
|
|
|
|
|
lbs = XP_MALLOC( ctxt->super.mpool, sizeof(*lbs) + nBytes );
|
|
|
|
lbs->nRows = nRows;
|
|
|
|
lbs->nCols = nCols;
|
|
|
|
lbs->nBytes = nBytes;
|
2011-07-19 03:07:15 +02:00
|
|
|
|
2012-09-08 05:34:06 +02:00
|
|
|
memcpy( lbs + 1, ptr, nBytes );
|
|
|
|
ptr += nBytes;
|
2003-11-01 06:35:29 +01:00
|
|
|
}
|
|
|
|
|
2011-07-19 03:07:15 +02:00
|
|
|
*ptrp = ptr;
|
2003-11-01 06:35:29 +01:00
|
|
|
return lbs;
|
|
|
|
} /* skipBitmap */
|
|
|
|
|
|
|
|
static void
|
2011-07-19 03:07:15 +02:00
|
|
|
skipBitmaps( LinuxDictionaryCtxt* ctxt, const XP_U8** ptrp )
|
2003-11-01 06:35:29 +01:00
|
|
|
{
|
|
|
|
XP_U16 nSpecials;
|
|
|
|
XP_UCHAR* text;
|
|
|
|
XP_UCHAR** texts;
|
2013-04-09 16:43:04 +02:00
|
|
|
XP_UCHAR** textEnds;
|
2003-11-01 06:35:29 +01:00
|
|
|
SpecialBitmaps* bitmaps;
|
|
|
|
Tile tile;
|
2011-07-19 03:07:15 +02:00
|
|
|
const XP_U8* ptr = *ptrp;
|
2003-11-01 06:35:29 +01:00
|
|
|
|
|
|
|
nSpecials = countSpecials( ctxt );
|
|
|
|
|
|
|
|
texts = (XP_UCHAR**)XP_MALLOC( ctxt->super.mpool,
|
|
|
|
nSpecials * sizeof(*texts) );
|
2013-04-09 16:43:04 +02:00
|
|
|
textEnds = (XP_UCHAR**)XP_MALLOC( ctxt->super.mpool,
|
|
|
|
nSpecials * sizeof(*textEnds) );
|
2003-11-01 06:35:29 +01:00
|
|
|
bitmaps = (SpecialBitmaps*)XP_MALLOC( ctxt->super.mpool,
|
|
|
|
nSpecials * sizeof(*bitmaps) );
|
2009-09-04 14:30:10 +02:00
|
|
|
XP_MEMSET( bitmaps, 0, nSpecials * sizeof(*bitmaps) );
|
2003-11-01 06:35:29 +01:00
|
|
|
|
|
|
|
for ( tile = 0; tile < ctxt->super.nFaces; ++tile ) {
|
|
|
|
|
2010-02-24 05:28:22 +01:00
|
|
|
const XP_UCHAR* facep = ctxt->super.facePtrs[(short)tile];
|
2009-04-05 21:22:55 +02:00
|
|
|
if ( IS_SPECIAL(*facep) ) {
|
|
|
|
XP_U16 asIndex = (XP_U16)*facep;
|
2003-11-01 06:35:29 +01:00
|
|
|
XP_U8 txtlen;
|
2009-09-04 14:30:10 +02:00
|
|
|
XP_ASSERT( *facep < nSpecials );
|
2003-11-01 06:35:29 +01:00
|
|
|
|
|
|
|
/* get the string */
|
2013-04-09 16:43:04 +02:00
|
|
|
txtlen = *ptr++;
|
|
|
|
text = (XP_UCHAR*)XP_MALLOC(ctxt->super.mpool, txtlen+1);
|
|
|
|
memcpy( text, ptr, txtlen );
|
|
|
|
ptr += txtlen;
|
|
|
|
|
|
|
|
text[txtlen] = '\0';
|
|
|
|
texts[(XP_U16)*facep] = text;
|
|
|
|
textEnds[(XP_U16)*facep] = text + txtlen + 1;
|
|
|
|
|
|
|
|
/* Now replace the delimiter char with \0. It must be one byte in
|
|
|
|
length and of course equal to the delimiter */
|
2013-04-18 16:15:14 +02:00
|
|
|
XP_ASSERT( 0 == (SYNONYM_DELIM & 0x80) );
|
2013-04-09 16:43:04 +02:00
|
|
|
while ( '\0' != *text ) {
|
|
|
|
XP_UCHAR* cp = g_utf8_offset_to_pointer( text, 1 );
|
|
|
|
if ( 1 == (cp - text) && *text == SYNONYM_DELIM ) {
|
|
|
|
*text = '\0';
|
|
|
|
}
|
|
|
|
text = cp;
|
|
|
|
}
|
2003-11-01 06:35:29 +01:00
|
|
|
|
2013-04-09 16:43:04 +02:00
|
|
|
XP_DEBUGF( "skipping bitmaps for " XP_S, texts[asIndex] );
|
2011-07-19 03:07:15 +02:00
|
|
|
|
2013-04-09 16:43:04 +02:00
|
|
|
bitmaps[asIndex].largeBM = skipBitmap( ctxt, &ptr );
|
|
|
|
bitmaps[asIndex].smallBM = skipBitmap( ctxt, &ptr );
|
2003-11-01 06:35:29 +01:00
|
|
|
}
|
|
|
|
}
|
2011-07-19 03:07:15 +02:00
|
|
|
*ptrp = ptr;
|
2003-11-01 06:35:29 +01:00
|
|
|
|
|
|
|
ctxt->super.chars = texts;
|
2013-04-09 16:43:04 +02:00
|
|
|
ctxt->super.charEnds = textEnds;
|
2003-11-01 06:35:29 +01:00
|
|
|
ctxt->super.bitmaps = bitmaps;
|
|
|
|
} /* skipBitmaps */
|
|
|
|
|
2009-04-05 21:22:55 +02:00
|
|
|
void
|
|
|
|
dict_splitFaces( DictionaryCtxt* dict, const XP_U8* utf8,
|
|
|
|
XP_U16 nBytes, XP_U16 nFaces )
|
|
|
|
{
|
2009-09-04 14:30:10 +02:00
|
|
|
XP_UCHAR* faces = XP_MALLOC( dict->mpool, nBytes + nFaces );
|
2010-02-24 05:28:22 +01:00
|
|
|
const XP_UCHAR** ptrs = XP_MALLOC( dict->mpool, nFaces * sizeof(ptrs[0]));
|
2009-04-05 21:22:55 +02:00
|
|
|
XP_U16 ii;
|
|
|
|
XP_Bool isUTF8 = dict->isUTF8;
|
|
|
|
XP_UCHAR* next = faces;
|
|
|
|
const gchar* bytes = (const gchar*)utf8;
|
|
|
|
|
|
|
|
for ( ii = 0; ii < nFaces; ++ii ) {
|
2009-09-13 07:28:12 +02:00
|
|
|
ptrs[ii] = next;
|
2009-04-05 21:22:55 +02:00
|
|
|
if ( isUTF8 ) {
|
2013-04-06 20:43:57 +02:00
|
|
|
for ( ; ; ) {
|
|
|
|
gchar* cp = g_utf8_offset_to_pointer( bytes, 1 );
|
2014-01-07 15:58:20 +01:00
|
|
|
size_t len = cp - bytes;
|
2013-04-06 20:43:57 +02:00
|
|
|
XP_MEMCPY( next, bytes, len );
|
|
|
|
next += len;
|
|
|
|
bytes += len;
|
2013-04-09 16:43:04 +02:00
|
|
|
if ( SYNONYM_DELIM != bytes[0] ) {
|
2013-04-06 20:43:57 +02:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
++bytes; /* skip delimiter */
|
|
|
|
*next++ = '\0';
|
|
|
|
}
|
2009-04-05 21:22:55 +02:00
|
|
|
} else {
|
2009-09-04 14:30:10 +02:00
|
|
|
XP_ASSERT( 0 == *bytes );
|
|
|
|
++bytes; /* skip empty */
|
2009-04-05 21:22:55 +02:00
|
|
|
*next++ = *bytes++;
|
|
|
|
}
|
2009-09-04 14:30:10 +02:00
|
|
|
XP_ASSERT( next < faces + nFaces + nBytes );
|
2009-04-05 21:22:55 +02:00
|
|
|
*next++ = '\0';
|
|
|
|
}
|
|
|
|
XP_ASSERT( !dict->faces );
|
|
|
|
dict->faces = faces;
|
2013-04-06 20:43:57 +02:00
|
|
|
dict->facesEnd = faces + nFaces + nBytes;
|
2009-09-13 07:28:12 +02:00
|
|
|
XP_ASSERT( !dict->facePtrs );
|
|
|
|
dict->facePtrs = ptrs;
|
2009-04-05 21:22:55 +02:00
|
|
|
} /* dict_splitFaces */
|
|
|
|
|
2003-11-01 06:35:29 +01:00
|
|
|
static XP_Bool
|
2012-09-04 06:33:46 +02:00
|
|
|
initFromDictFile( LinuxDictionaryCtxt* dctx, const LaunchParams* params,
|
|
|
|
const char* fileName )
|
2003-11-01 06:35:29 +01:00
|
|
|
{
|
2009-04-05 21:22:55 +02:00
|
|
|
XP_Bool formatOk = XP_TRUE;
|
2014-01-07 15:58:20 +01:00
|
|
|
size_t dictLength;
|
2003-11-01 06:35:29 +01:00
|
|
|
XP_U32 topOffset;
|
|
|
|
unsigned short xloc;
|
|
|
|
XP_U16 flags;
|
2009-09-04 14:30:10 +02:00
|
|
|
XP_U16 facesSize;
|
2003-12-14 18:55:45 +01:00
|
|
|
XP_U16 charSize;
|
2009-04-05 21:22:55 +02:00
|
|
|
XP_Bool isUTF8 = XP_FALSE;
|
2010-12-06 04:33:10 +01:00
|
|
|
XP_Bool hasHeader = XP_FALSE;
|
2011-07-19 03:07:15 +02:00
|
|
|
const XP_U8* ptr;
|
2012-09-04 06:33:46 +02:00
|
|
|
char path[256];
|
2003-11-01 06:35:29 +01:00
|
|
|
|
2012-09-04 06:33:46 +02:00
|
|
|
if ( !getDictPath( params, fileName, path, VSIZE(path) ) ) {
|
|
|
|
XP_LOGF( "%s: path=%s", __func__, path );
|
|
|
|
goto closeAndExit;
|
|
|
|
}
|
2011-07-16 03:24:08 +02:00
|
|
|
struct stat statbuf;
|
2012-09-04 06:33:46 +02:00
|
|
|
if ( 0 != stat( path, &statbuf ) || 0 == statbuf.st_size ) {
|
2011-07-16 03:24:08 +02:00
|
|
|
goto closeAndExit;
|
|
|
|
}
|
2011-07-19 03:07:15 +02:00
|
|
|
dctx->dictLength = statbuf.st_size;
|
|
|
|
|
|
|
|
{
|
2012-09-04 06:33:46 +02:00
|
|
|
FILE* dictF = fopen( path, "r" );
|
2011-11-09 15:51:12 +01:00
|
|
|
XP_ASSERT( !!dictF );
|
|
|
|
if ( dctx->useMMap ) {
|
|
|
|
dctx->dictBase = mmap( NULL, dctx->dictLength, PROT_READ,
|
|
|
|
MAP_PRIVATE, fileno(dictF), 0 );
|
|
|
|
} else {
|
|
|
|
dctx->dictBase = XP_MALLOC( dctx->super.mpool, dctx->dictLength );
|
|
|
|
if ( dctx->dictLength != fread( dctx->dictBase, 1,
|
|
|
|
dctx->dictLength, dictF ) ) {
|
|
|
|
XP_ASSERT( 0 );
|
|
|
|
}
|
|
|
|
}
|
|
|
|
fclose( dictF );
|
2011-07-19 03:07:15 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
ptr = dctx->dictBase;
|
|
|
|
|
|
|
|
memcpy( &flags, ptr, sizeof(flags) );
|
|
|
|
ptr += sizeof( flags );
|
|
|
|
flags = ntohs(flags);
|
|
|
|
|
|
|
|
XP_DEBUGF( "flags=0X%X", flags );
|
|
|
|
hasHeader = 0 != (DICT_HEADER_MASK & flags);
|
|
|
|
if ( hasHeader ) {
|
2011-11-09 15:51:12 +01:00
|
|
|
flags &= ~DICT_HEADER_MASK;
|
|
|
|
XP_DEBUGF( "has header!" );
|
2011-07-19 03:07:15 +02:00
|
|
|
}
|
2013-04-21 04:46:35 +02:00
|
|
|
|
|
|
|
flags &= ~DICT_SYNONYMS_MASK;
|
|
|
|
|
2011-07-19 03:07:15 +02:00
|
|
|
if ( flags == 0x0001 ) {
|
2011-11-09 15:51:12 +01:00
|
|
|
dctx->super.nodeSize = 3;
|
|
|
|
charSize = 1;
|
|
|
|
dctx->super.is_4_byte = XP_FALSE;
|
2011-07-19 03:07:15 +02:00
|
|
|
} else if ( flags == 0x0002 ) {
|
2011-11-09 15:51:12 +01:00
|
|
|
dctx->super.nodeSize = 3;
|
|
|
|
charSize = 2;
|
|
|
|
dctx->super.is_4_byte = XP_FALSE;
|
2011-07-19 03:07:15 +02:00
|
|
|
} else if ( flags == 0x0003 ) {
|
2011-11-09 15:51:12 +01:00
|
|
|
dctx->super.nodeSize = 4;
|
|
|
|
charSize = 2;
|
|
|
|
dctx->super.is_4_byte = XP_TRUE;
|
2011-07-19 03:07:15 +02:00
|
|
|
} else if ( flags == 0x0004 ) {
|
2011-11-09 15:51:12 +01:00
|
|
|
dctx->super.nodeSize = 3;
|
|
|
|
dctx->super.isUTF8 = XP_TRUE;
|
|
|
|
isUTF8 = XP_TRUE;
|
|
|
|
dctx->super.is_4_byte = XP_FALSE;
|
2011-07-19 03:07:15 +02:00
|
|
|
} else if ( flags == 0x0005 ) {
|
2011-11-09 15:51:12 +01:00
|
|
|
dctx->super.nodeSize = 4;
|
|
|
|
dctx->super.isUTF8 = XP_TRUE;
|
|
|
|
isUTF8 = XP_TRUE;
|
|
|
|
dctx->super.is_4_byte = XP_TRUE;
|
2003-11-01 06:35:29 +01:00
|
|
|
} else {
|
2011-11-09 15:51:12 +01:00
|
|
|
/* case I don't know how to deal with */
|
|
|
|
formatOk = XP_FALSE;
|
|
|
|
XP_ASSERT(0);
|
2003-11-01 06:35:29 +01:00
|
|
|
}
|
2011-07-19 03:07:15 +02:00
|
|
|
|
2003-11-01 06:35:29 +01:00
|
|
|
if ( formatOk ) {
|
2011-11-09 15:51:12 +01:00
|
|
|
XP_U8 numFaceBytes, numFaces;
|
2010-12-06 04:33:10 +01:00
|
|
|
|
|
|
|
if ( hasHeader ) {
|
|
|
|
XP_U16 headerLen;
|
|
|
|
XP_U32 wordCount;
|
2011-07-19 03:07:15 +02:00
|
|
|
|
2011-11-09 15:51:12 +01:00
|
|
|
memcpy( &headerLen, ptr, sizeof(headerLen) );
|
|
|
|
ptr += sizeof(headerLen);
|
2011-07-19 03:07:15 +02:00
|
|
|
headerLen = ntohs( headerLen );
|
2012-08-25 19:20:52 +02:00
|
|
|
|
2011-11-09 15:51:12 +01:00
|
|
|
memcpy( &wordCount, ptr, sizeof(wordCount) );
|
|
|
|
ptr += sizeof(wordCount);
|
2012-08-25 19:20:52 +02:00
|
|
|
headerLen -= sizeof(wordCount);
|
2010-12-06 04:33:10 +01:00
|
|
|
dctx->super.nWords = ntohl( wordCount );
|
2014-01-07 15:58:20 +01:00
|
|
|
XP_DEBUGF( "dict contains %d words", dctx->super.nWords );
|
2012-08-25 19:20:52 +02:00
|
|
|
|
|
|
|
if ( 0 < headerLen ) {
|
2012-09-08 16:45:18 +02:00
|
|
|
dctx->super.desc = getNullTermParam( dctx, &ptr, &headerLen );
|
2012-08-25 19:20:52 +02:00
|
|
|
} else {
|
|
|
|
XP_LOGF( "%s: no note", __func__ );
|
|
|
|
}
|
2012-09-08 05:34:06 +02:00
|
|
|
if ( 0 < headerLen ) {
|
2012-09-08 16:45:18 +02:00
|
|
|
dctx->super.md5Sum = getNullTermParam( dctx, &ptr, &headerLen );
|
2012-09-08 05:34:06 +02:00
|
|
|
} else {
|
|
|
|
XP_LOGF( "%s: no md5Sum", __func__ );
|
|
|
|
}
|
2012-08-25 19:20:52 +02:00
|
|
|
ptr += headerLen;
|
2010-12-06 04:33:10 +01:00
|
|
|
}
|
|
|
|
|
2009-04-05 21:22:55 +02:00
|
|
|
if ( isUTF8 ) {
|
2011-11-09 15:51:12 +01:00
|
|
|
numFaceBytes = *ptr++;
|
2009-01-03 19:12:34 +01:00
|
|
|
}
|
2011-11-09 15:51:12 +01:00
|
|
|
numFaces = *ptr++;
|
2009-04-05 21:22:55 +02:00
|
|
|
if ( !isUTF8 ) {
|
|
|
|
numFaceBytes = numFaces * charSize;
|
|
|
|
}
|
2003-11-01 06:35:29 +01:00
|
|
|
|
2012-09-08 05:34:06 +02:00
|
|
|
if ( NULL == dctx->super.md5Sum
|
|
|
|
#ifdef DEBUG
|
|
|
|
|| XP_TRUE
|
|
|
|
#endif
|
|
|
|
) {
|
2014-01-07 15:58:20 +01:00
|
|
|
size_t curPos = ptr - dctx->dictBase;
|
2012-09-08 05:34:06 +02:00
|
|
|
gssize dictLength = dctx->dictLength - curPos;
|
2013-06-29 05:33:12 +02:00
|
|
|
|
2013-06-30 17:34:09 +02:00
|
|
|
gchar* checksum = g_compute_checksum_for_data( G_CHECKSUM_MD5, ptr, dictLength );
|
2012-09-08 05:34:06 +02:00
|
|
|
if ( NULL == dctx->super.md5Sum ) {
|
2013-06-30 16:36:56 +02:00
|
|
|
dctx->super.md5Sum = copyString( dctx->super.mpool, checksum );
|
2012-09-08 05:34:06 +02:00
|
|
|
} else {
|
2013-06-30 16:36:56 +02:00
|
|
|
XP_ASSERT( 0 == XP_STRCMP( dctx->super.md5Sum, checksum ) );
|
2012-09-08 05:34:06 +02:00
|
|
|
}
|
2013-06-30 17:34:09 +02:00
|
|
|
g_free( checksum );
|
2012-09-08 05:34:06 +02:00
|
|
|
}
|
|
|
|
|
2003-11-01 06:35:29 +01:00
|
|
|
dctx->super.nFaces = numFaces;
|
|
|
|
|
|
|
|
dctx->super.countsAndValues = XP_MALLOC( dctx->super.mpool,
|
|
|
|
numFaces*2 );
|
2009-09-04 14:30:10 +02:00
|
|
|
facesSize = numFaceBytes;
|
|
|
|
if ( !isUTF8 ) {
|
|
|
|
facesSize /= 2;
|
|
|
|
}
|
2003-11-01 06:35:29 +01:00
|
|
|
|
2009-04-05 21:22:55 +02:00
|
|
|
XP_U8 tmp[numFaceBytes];
|
2011-11-09 15:51:12 +01:00
|
|
|
memcpy( tmp, ptr, numFaceBytes );
|
|
|
|
ptr += numFaceBytes;
|
2009-01-03 19:12:34 +01:00
|
|
|
|
2009-04-05 21:22:55 +02:00
|
|
|
dict_splitFaces( &dctx->super, tmp, numFaceBytes, numFaces );
|
2003-11-01 06:35:29 +01:00
|
|
|
|
2011-11-09 15:51:12 +01:00
|
|
|
memcpy( &xloc, ptr, sizeof(xloc) );
|
|
|
|
ptr += sizeof(xloc);
|
|
|
|
memcpy( dctx->super.countsAndValues, ptr, numFaces*2 );
|
|
|
|
ptr += numFaces*2;
|
2009-01-03 19:12:34 +01:00
|
|
|
}
|
2010-09-10 10:57:22 +02:00
|
|
|
|
|
|
|
dctx->super.langCode = xloc & 0x7F;
|
2003-11-01 06:35:29 +01:00
|
|
|
|
2009-01-03 19:12:34 +01:00
|
|
|
if ( formatOk ) {
|
2011-11-09 15:51:12 +01:00
|
|
|
XP_U32 numEdges;
|
2011-07-19 03:07:15 +02:00
|
|
|
skipBitmaps( dctx, &ptr );
|
2003-11-01 06:35:29 +01:00
|
|
|
|
2014-01-07 15:58:20 +01:00
|
|
|
size_t curPos = ptr - dctx->dictBase;
|
2011-07-19 03:07:15 +02:00
|
|
|
dictLength = dctx->dictLength - curPos;
|
2003-11-01 06:35:29 +01:00
|
|
|
|
|
|
|
if ( dictLength > 0 ) {
|
2011-11-09 15:51:12 +01:00
|
|
|
memcpy( &topOffset, ptr, sizeof(topOffset) );
|
2003-11-01 06:35:29 +01:00
|
|
|
/* it's in big-endian order */
|
|
|
|
topOffset = ntohl(topOffset);
|
|
|
|
dictLength -= sizeof(topOffset); /* first four bytes are offset */
|
2011-11-09 15:51:12 +01:00
|
|
|
ptr += sizeof(topOffset);
|
2003-11-01 06:35:29 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
if ( dictLength > 0 ) {
|
2011-11-09 15:51:12 +01:00
|
|
|
numEdges = dictLength / dctx->super.nodeSize;
|
2003-11-01 06:35:29 +01:00
|
|
|
#ifdef DEBUG
|
|
|
|
XP_ASSERT( (dictLength % dctx->super.nodeSize) == 0 );
|
2011-11-09 15:51:12 +01:00
|
|
|
dctx->super.numEdges = numEdges;
|
2003-11-01 06:35:29 +01:00
|
|
|
#endif
|
2011-07-19 03:07:15 +02:00
|
|
|
dctx->super.base = (array_edge*)ptr;
|
2003-11-01 06:35:29 +01:00
|
|
|
|
|
|
|
dctx->super.topEdge = dctx->super.base + topOffset;
|
|
|
|
} else {
|
|
|
|
dctx->super.base = NULL;
|
|
|
|
dctx->super.topEdge = NULL;
|
2011-11-22 03:07:08 +01:00
|
|
|
numEdges = 0;
|
2003-11-01 06:35:29 +01:00
|
|
|
}
|
2006-04-30 15:58:24 +02:00
|
|
|
|
2009-01-03 19:12:34 +01:00
|
|
|
dctx->super.name = copyString( dctx->super.mpool, fileName );
|
2011-11-09 15:51:12 +01:00
|
|
|
|
|
|
|
if ( ! checkSanity( &dctx->super, numEdges ) ) {
|
|
|
|
goto closeAndExit;
|
|
|
|
}
|
2003-11-01 06:35:29 +01:00
|
|
|
}
|
2009-01-03 19:12:34 +01:00
|
|
|
goto ok;
|
2003-11-01 06:35:29 +01:00
|
|
|
|
2009-01-03 19:12:34 +01:00
|
|
|
closeAndExit:
|
|
|
|
formatOk = XP_FALSE;
|
|
|
|
ok:
|
2011-07-19 03:07:15 +02:00
|
|
|
|
2003-11-01 06:35:29 +01:00
|
|
|
return formatOk;
|
|
|
|
} /* initFromDictFile */
|
|
|
|
|
|
|
|
static void
|
|
|
|
freeSpecials( LinuxDictionaryCtxt* ctxt )
|
|
|
|
{
|
|
|
|
XP_U16 nSpecials = 0;
|
2009-04-05 21:22:55 +02:00
|
|
|
XP_U16 ii;
|
2003-11-01 06:35:29 +01:00
|
|
|
|
2009-04-05 21:22:55 +02:00
|
|
|
for ( ii = 0; ii < ctxt->super.nFaces; ++ii ) {
|
2009-09-13 07:28:12 +02:00
|
|
|
if ( IS_SPECIAL(ctxt->super.facePtrs[ii][0] ) ) {
|
2003-11-01 06:35:29 +01:00
|
|
|
if ( !!ctxt->super.bitmaps ) {
|
|
|
|
XP_Bitmap* bmp = ctxt->super.bitmaps[nSpecials].largeBM;
|
|
|
|
if ( !!bmp ) {
|
|
|
|
XP_FREE( ctxt->super.mpool, bmp );
|
|
|
|
}
|
|
|
|
bmp = ctxt->super.bitmaps[nSpecials].smallBM;
|
|
|
|
if ( !!bmp ) {
|
|
|
|
XP_FREE( ctxt->super.mpool, bmp );
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if ( !!ctxt->super.chars && !!ctxt->super.chars[nSpecials]) {
|
|
|
|
XP_FREE( ctxt->super.mpool, ctxt->super.chars[nSpecials] );
|
|
|
|
}
|
|
|
|
++nSpecials;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if ( !!ctxt->super.bitmaps ) {
|
|
|
|
XP_FREE( ctxt->super.mpool, ctxt->super.bitmaps );
|
|
|
|
}
|
2013-04-14 01:49:20 +02:00
|
|
|
XP_FREEP( ctxt->super.mpool, &ctxt->super.chars );
|
|
|
|
XP_FREEP( ctxt->super.mpool, &ctxt->super.charEnds );
|
2003-11-01 06:35:29 +01:00
|
|
|
} /* freeSpecials */
|
|
|
|
|
|
|
|
static void
|
|
|
|
linux_dictionary_destroy( DictionaryCtxt* dict )
|
|
|
|
{
|
|
|
|
LinuxDictionaryCtxt* ctxt = (LinuxDictionaryCtxt*)dict;
|
|
|
|
|
|
|
|
freeSpecials( ctxt );
|
|
|
|
|
2011-07-19 03:07:15 +02:00
|
|
|
if ( !!ctxt->dictBase ) {
|
2012-09-08 05:34:06 +02:00
|
|
|
if ( ctxt->useMMap ) {
|
|
|
|
(void)munmap( ctxt->dictBase, ctxt->dictLength );
|
|
|
|
} else {
|
|
|
|
XP_FREE( dict->mpool, ctxt->dictBase );
|
|
|
|
}
|
2003-11-01 06:35:29 +01:00
|
|
|
}
|
|
|
|
|
2012-08-27 05:58:28 +02:00
|
|
|
XP_FREEP( dict->mpool, &ctxt->super.desc );
|
2012-09-08 05:34:06 +02:00
|
|
|
XP_FREEP( dict->mpool, &ctxt->super.md5Sum );
|
2003-11-01 06:35:29 +01:00
|
|
|
XP_FREE( dict->mpool, ctxt->super.countsAndValues );
|
2009-04-05 21:22:55 +02:00
|
|
|
XP_FREE( dict->mpool, ctxt->super.faces );
|
2009-09-13 07:28:12 +02:00
|
|
|
XP_FREE( dict->mpool, ctxt->super.facePtrs );
|
2006-04-30 15:58:24 +02:00
|
|
|
XP_FREE( dict->mpool, ctxt->super.name );
|
2003-11-01 06:35:29 +01:00
|
|
|
XP_FREE( dict->mpool, ctxt );
|
|
|
|
} /* linux_dictionary_destroy */
|
|
|
|
|
2006-09-24 17:35:33 +02:00
|
|
|
static const XP_UCHAR*
|
|
|
|
linux_dict_getShortName( const DictionaryCtxt* dict )
|
|
|
|
{
|
|
|
|
const XP_UCHAR* full = dict_getName( dict );
|
2009-09-04 14:30:10 +02:00
|
|
|
const XP_UCHAR* c = strchr( full, '/' );
|
2006-09-24 17:35:33 +02:00
|
|
|
if ( !!c ) {
|
|
|
|
++c;
|
|
|
|
} else {
|
|
|
|
c = full;
|
|
|
|
}
|
|
|
|
return c;
|
|
|
|
}
|
|
|
|
|
2003-11-01 06:35:29 +01:00
|
|
|
#else /* CLIENT_ONLY *IS* defined */
|
|
|
|
|
|
|
|
/* initFromDictFile:
|
|
|
|
* This guy reads in from a prc file, and probably hasn't worked in a year.
|
|
|
|
*/
|
|
|
|
#define RECS_BEFORE_DAWG 3 /* a hack */
|
|
|
|
static XP_Bool
|
2005-10-30 06:05:45 +01:00
|
|
|
initFromDictFile( LinuxDictionaryCtxt* dctx, const char* fileName )
|
2003-11-01 06:35:29 +01:00
|
|
|
{
|
|
|
|
short i;
|
|
|
|
unsigned short* dataP;
|
|
|
|
unsigned nRecs;
|
|
|
|
prc_record_t* prect;
|
|
|
|
|
|
|
|
prc_t* pt = prcopen( fileName, PRC_OPEN_READ );
|
|
|
|
dctx->pt = pt; /* remember so we can close it later */
|
|
|
|
|
|
|
|
nRecs = prcgetnrecords( pt );
|
|
|
|
|
|
|
|
/* record 0 holds a struct whose 5th byte is the record num of the first
|
|
|
|
dawg record. 1 and 2 hold tile data. Let's assume 3 is the first dawg
|
|
|
|
record for now. */
|
|
|
|
|
|
|
|
prect = prcgetrecord( pt, 1 );
|
|
|
|
dctx->super.numFaces = prect->datalen; /* one char per byte */
|
|
|
|
dctx->super.faces = malloc( prect->datalen );
|
|
|
|
memcpy( dctx->super.faces, prect->data, prect->datalen );
|
|
|
|
|
|
|
|
dctx->super.counts = malloc( dctx->super.numFaces );
|
|
|
|
dctx->super.values = malloc( dctx->super.numFaces );
|
|
|
|
|
|
|
|
prect = prcgetrecord( pt, 2 );
|
|
|
|
dataP = (unsigned short*)prect->data + 1; /* skip the xloc header */
|
|
|
|
|
2014-01-07 15:58:20 +01:00
|
|
|
for ( ii = 0; ii < dctx->super.numFaces; ++ii ) {
|
2003-11-01 06:35:29 +01:00
|
|
|
unsigned short byt = *dataP++;
|
2014-01-07 15:58:20 +01:00
|
|
|
dctx->super.values[ii] = byt >> 8;
|
|
|
|
dctx->super.counts[ii] = byt & 0xFF;
|
|
|
|
if ( dctx->super.values[ii] == 0 ) {
|
|
|
|
dctx->super.counts[ii] = 4; /* 4 blanks :-) */
|
2003-11-01 06:35:29 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
dctx->numStarts = nRecs - RECS_BEFORE_DAWG;
|
|
|
|
dctx->starts = XP_MALLOC( dctx->numStarts * sizeof(*dctx->starts) );
|
|
|
|
|
|
|
|
for ( i = 0/* , offset = 0 */; i < dctx->numStarts; ++i ) {
|
|
|
|
prect = prcgetrecord( pt, i + RECS_BEFORE_DAWG );
|
|
|
|
dctx->starts[i].numNodes = prect->datalen / 3;
|
|
|
|
dctx->starts[i].array = (array_edge*)prect->data;
|
|
|
|
|
|
|
|
XP_ASSERT( (prect->datalen % 3) == 0 );
|
|
|
|
}
|
|
|
|
} /* initFromDictFile */
|
|
|
|
|
|
|
|
void
|
|
|
|
linux_dictionary_destroy( DictionaryCtxt* dict )
|
|
|
|
{
|
|
|
|
LinuxDictionaryCtxt* ctxt = (LinuxDictionaryCtxt*)dict;
|
|
|
|
prcclose( ctxt->pt );
|
|
|
|
}
|
|
|
|
|
|
|
|
#endif /* CLIENT_ONLY */
|
|
|
|
|