mirror of
git://xwords.git.sourceforge.net/gitroot/xwords/xwords
synced 2025-01-01 06:19:57 +01:00
f0d8a71deb
As with java, the platform knows utf-8 better than vanilla C, so use a JS inlined function to split a binary stream into its "face" components.
301 lines
9.2 KiB
C
301 lines
9.2 KiB
C
/* -*- compile-command: "cd ../wasm && make MEMDEBUG=TRUE install -j3"; -*- */
|
|
/*
|
|
* Copyright 2021 by Eric House (xwords@eehouse.org). All rights reserved.
|
|
*
|
|
* This program is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU General Public License
|
|
* as published by the Free Software Foundation; either version 2
|
|
* of the License, or (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
|
|
*/
|
|
|
|
#include <emscripten.h>
|
|
#include <sys/types.h>
|
|
#include <sys/stat.h>
|
|
#include <unistd.h>
|
|
#include <sys/mman.h>
|
|
|
|
#include "wasmdict.h"
|
|
#include "dictnryp.h"
|
|
#include "strutils.h"
|
|
#include "dictmgr.h"
|
|
|
|
typedef struct _WasmDictionaryCtxt {
|
|
DictionaryCtxt super;
|
|
Globals* globals;
|
|
size_t dictLength;
|
|
XP_U8* dictBase;
|
|
XP_Bool useMMap;
|
|
} WasmDictionaryCtxt;
|
|
|
|
static const XP_UCHAR*
|
|
getShortName( const DictionaryCtxt* dict )
|
|
{
|
|
const XP_UCHAR* full = dict_getName( dict );
|
|
const XP_UCHAR* ch = strchr( full, '/' );
|
|
if ( !!ch ) {
|
|
++ch;
|
|
} else {
|
|
ch = full;
|
|
}
|
|
return ch;
|
|
}
|
|
|
|
static XP_Bool
|
|
initFromPtr( WasmDictionaryCtxt* dctx, const char* name,
|
|
uint8_t* dictBase, size_t len )
|
|
{
|
|
XP_Bool formatOk = XP_TRUE;
|
|
size_t dictLength;
|
|
XP_U32 topOffset;
|
|
char path[256];
|
|
|
|
dctx->dictLength = len;
|
|
dctx->dictBase = dictBase;
|
|
|
|
const XP_U8* ptr = dctx->dictBase;
|
|
const XP_U8* end = ptr + dctx->dictLength;
|
|
formatOk = parseCommon( &dctx->super, NULL, &ptr, end );
|
|
/* && loadSpecialData( &dctx->super, &ptr, end ); */
|
|
|
|
if ( formatOk ) {
|
|
size_t curPos = ptr - dctx->dictBase;
|
|
dictLength = dctx->dictLength - curPos;
|
|
|
|
if ( dictLength > 0 ) {
|
|
memcpy( &topOffset, ptr, sizeof(topOffset) );
|
|
/* it's in big-endian order */
|
|
topOffset = ntohl(topOffset);
|
|
dictLength -= sizeof(topOffset); /* first four bytes are offset */
|
|
ptr += sizeof(topOffset);
|
|
}
|
|
|
|
XP_U32 numEdges;
|
|
if ( dictLength > 0 ) {
|
|
numEdges = dictLength / dctx->super.nodeSize;
|
|
#ifdef DEBUG
|
|
XP_ASSERT( (dictLength % dctx->super.nodeSize) == 0 );
|
|
dctx->super.numEdges = numEdges;
|
|
#endif
|
|
dctx->super.base = (array_edge*)ptr;
|
|
|
|
dctx->super.topEdge = dctx->super.base + topOffset;
|
|
} else {
|
|
dctx->super.base = NULL;
|
|
dctx->super.topEdge = NULL;
|
|
numEdges = 0;
|
|
}
|
|
|
|
dctx->super.name = copyString( dctx->super.mpool, name );
|
|
|
|
if ( ! checkSanity( &dctx->super, numEdges ) ) {
|
|
goto closeAndExit;
|
|
}
|
|
}
|
|
goto ok;
|
|
|
|
closeAndExit:
|
|
formatOk = XP_FALSE;
|
|
ok:
|
|
|
|
return formatOk;
|
|
} /* initFromDictFile */
|
|
|
|
static void
|
|
freeSpecials( WasmDictionaryCtxt* ctxt )
|
|
{
|
|
XP_U16 nSpecials = 0;
|
|
|
|
for ( XP_U16 ii = 0; ii < ctxt->super.nFaces; ++ii ) {
|
|
if ( IS_SPECIAL(ctxt->super.facePtrs[ii][0] ) ) {
|
|
if ( !!ctxt->super.bitmaps ) {
|
|
XP_Bitmap* bmp = ctxt->super.bitmaps[nSpecials].largeBM;
|
|
if ( !!bmp ) {
|
|
XP_FREE( ctxt->super.mpool, bmp );
|
|
}
|
|
bmp = ctxt->super.bitmaps[nSpecials].smallBM;
|
|
if ( !!bmp ) {
|
|
XP_FREE( ctxt->super.mpool, bmp );
|
|
}
|
|
}
|
|
if ( !!ctxt->super.chars && !!ctxt->super.chars[nSpecials]) {
|
|
XP_FREE( ctxt->super.mpool, ctxt->super.chars[nSpecials] );
|
|
}
|
|
++nSpecials;
|
|
}
|
|
}
|
|
if ( !!ctxt->super.bitmaps ) {
|
|
XP_FREE( ctxt->super.mpool, ctxt->super.bitmaps );
|
|
}
|
|
XP_FREEP( ctxt->super.mpool, &ctxt->super.chars );
|
|
XP_FREEP( ctxt->super.mpool, &ctxt->super.charEnds );
|
|
} /* freeSpecials */
|
|
|
|
static void
|
|
wasm_dictionary_destroy( DictionaryCtxt* dict, XWEnv xwe )
|
|
{
|
|
WasmDictionaryCtxt* ctxt = (WasmDictionaryCtxt*)dict;
|
|
|
|
freeSpecials( ctxt );
|
|
|
|
if ( !!ctxt->dictBase ) {
|
|
if ( ctxt->useMMap ) {
|
|
(void)munmap( ctxt->dictBase, ctxt->dictLength );
|
|
} else {
|
|
XP_FREE( dict->mpool, ctxt->dictBase );
|
|
}
|
|
}
|
|
|
|
/* super's destructor should do this!!!! */
|
|
XP_FREEP( dict->mpool, &ctxt->super.desc );
|
|
XP_FREEP( dict->mpool, &ctxt->super.md5Sum );
|
|
XP_FREEP( dict->mpool, &ctxt->super.countsAndValues );
|
|
XP_FREEP( dict->mpool, &ctxt->super.faces );
|
|
XP_FREEP( dict->mpool, &ctxt->super.facePtrs );
|
|
XP_FREEP( dict->mpool, &ctxt->super.name );
|
|
XP_FREE( dict->mpool, ctxt );
|
|
}
|
|
|
|
DictionaryCtxt*
|
|
wasm_dictionary_make_empty( Globals* globals )
|
|
{
|
|
WasmDictionaryCtxt* wdict = XP_CALLOC( globals->mpool, sizeof( *wdict ) );
|
|
dict_super_init( MPPARM(globals->mpool) (DictionaryCtxt*)wdict );
|
|
|
|
LOG_RETURNF( "%p", wdict );
|
|
return (DictionaryCtxt*)wdict;
|
|
}
|
|
|
|
DictionaryCtxt*
|
|
wasm_dictionary_make( Globals* globals, XWEnv xwe,
|
|
const char* name, uint8_t* base, size_t len )
|
|
{
|
|
WasmDictionaryCtxt* result = (WasmDictionaryCtxt*)
|
|
XP_CALLOC(globals->mpool, sizeof(*result));
|
|
result->globals = globals;
|
|
|
|
dict_super_init( MPPARM(globals->mpool) &result->super );
|
|
result->super.destructor = wasm_dictionary_destroy;
|
|
|
|
result->useMMap = false;
|
|
|
|
XP_Bool success = initFromPtr( result, name, base, len );
|
|
if ( success ) {
|
|
result->super.func_dict_getShortName = getShortName;
|
|
setBlankTile( &result->super );
|
|
} else {
|
|
XP_ASSERT( 0 ); /* gonna crash anyway */
|
|
XP_FREE( globals->mpool, result );
|
|
result = NULL;
|
|
}
|
|
(void)dict_ref( &result->super, xwe );
|
|
|
|
LOG_RETURNF( "%p", &result->super );
|
|
|
|
/* XP_U16 nf = dict_numTileFaces( &result->super ); */
|
|
/* for ( Tile tile = 0; tile < nf; ++tile ) { */
|
|
/* const XP_UCHAR* face = dict_getTileString( &result->super, tile ); */
|
|
/* XP_LOGFF( "faces[%d]: %s", tile, face ); */
|
|
/* } */
|
|
|
|
return &result->super;
|
|
}
|
|
|
|
/* Walk len bytes of the wasm heap starting at ptr and report them to proc,
 * one string per call, via ccallString(proc, closure, str):
 *  - a byte valued below 32 is reported as its decimal representation
 *    (e.g. "3");
 *  - other bytes are accumulated until they decode as strict utf-8, and the
 *    decoded string is then reported.
 * Bytes still pending when the input ends (an incomplete sequence) are not
 * reported.
 */
EM_JS(void, js_splitFaces, (const uint8_t* ptr, int len,
                            StringProc proc, void* closure), {
    const callWith = function(str) {
        ccallString(proc, closure, str);
    };

    /* One decoder serves the whole scan: decode() without the stream
       option starts from a clean state on every call, including after a
       call that threw. */
    const decoder = new TextDecoder('utf-8', { fatal: true });

    let jsarr = new Uint8Array(Module.HEAPU8.buffer, ptr, len);
    let chrs = [];
    for ( let chr of jsarr ) {
        /* I'm assuming here that there is no legit utf-8 byte valued
           less than 32. Is that true? PENDING */
        if ( chr < 32 ) {
            callWith(chr.toString());
            assert(chrs.length == 0);
        } else {
            chrs.push(chr);
            try {
                let asStr = decoder.decode(new Uint8Array(chrs));
                callWith( asStr );
                chrs = [];
            } catch (ex) {
                /* we get here when chrs holds only the leading bytes of a
                   multi-byte sequence; keep accumulating */
            }
        }
    }
});
|
|
|
|
typedef struct _SplitState {
|
|
DictionaryCtxt* dict;
|
|
bool prevWasDelim;
|
|
XP_UCHAR* data; /* holds everything; lots of NULL chars inside */
|
|
int curOffset; /* where we are in data */
|
|
const XP_UCHAR** facePtrs; /* ptrs into data */
|
|
int curFace; /* how many faces have we seen */
|
|
} SplitState;
|
|
|
|
static void
|
|
gotDictString( void* closure, const char* str )
|
|
{
|
|
SplitState* ss = (SplitState*)closure;
|
|
if ( 0 == strcmp(str, " ") ) { /* delimter */
|
|
XP_ASSERT(!ss->prevWasDelim);
|
|
ss->prevWasDelim = true;
|
|
} else {
|
|
if ( !ss->prevWasDelim ) {
|
|
ss->facePtrs[ss->curFace++] = ss->data + ss->curOffset;
|
|
}
|
|
if ( '0' <= str[0] && str[0] <= '9') {
|
|
XP_ASSERT( !ss->prevWasDelim );
|
|
ss->data[ss->curOffset++] = atoi(str);
|
|
ss->data[ss->curOffset++] = '\0';
|
|
} else {
|
|
ss->curOffset += 1 + sprintf( ss->data + ss->curOffset, "%s", str );
|
|
}
|
|
ss->prevWasDelim = false;
|
|
}
|
|
}
|
|
|
|
void
|
|
dict_splitFaces( DictionaryCtxt* dict, XWEnv xwe, const XP_U8* utf8,
|
|
XP_U16 nBytes, XP_U16 nFaces )
|
|
{
|
|
XP_ASSERT( dict->isUTF8 ); /* assumed by code here */
|
|
|
|
SplitState ss = {
|
|
.dict = dict,
|
|
.data = XP_MALLOC( dict->mpool, nBytes + nFaces ),
|
|
.facePtrs = XP_CALLOC(dict->mpool, nFaces * sizeof(ss.facePtrs[0])),
|
|
};
|
|
js_splitFaces( utf8, nBytes, gotDictString, &ss );
|
|
XP_ASSERT( ss.curFace == nFaces ); /* got 'em all? */
|
|
|
|
XP_ASSERT( !dict->faces );
|
|
dict->faces = ss.data;
|
|
dict->facesEnd = dict->faces + nFaces + nBytes;
|
|
XP_ASSERT( !dict->facePtrs );
|
|
dict->facePtrs = ss.facePtrs;
|
|
|
|
LOG_RETURN_VOID();
|
|
} /* dict_splitFaces */
|
|
|
|
void
|
|
computeChecksum( DictionaryCtxt* dctx, XWEnv xwe, const XP_U8* ptr,
|
|
XP_U32 len, XP_UCHAR* out )
|
|
{
|
|
*out = '\0';
|
|
}
|