mirror of
git://git.savannah.nongnu.org/eliot.git
synced 2024-12-31 10:26:28 +01:00
414baa8d7a
- New parameter to most search functions, allowing to limit the number of results. No interface uses it yet.
169 lines
4.8 KiB
C++
169 lines
4.8 KiB
C++
/*****************************************************************************
|
|
* Eliot
|
|
* Copyright (C) 2005-2007 Antoine Fraboulet
|
|
* Authors: Antoine Fraboulet <antoine.fraboulet @@ free.fr>
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*****************************************************************************/
|
|
|
|
/**
|
|
* \file regexpmain.c
|
|
* \brief Program used to test regexp
|
|
* \author Antoine Fraboulet
|
|
* \date 2005
|
|
*/
|
|
|
|
#include "config.h"
|
|
|
|
#include <exception>
|
|
#include <iostream>
|
|
#include <cstdlib>
|
|
#include <cstring>
|
|
|
|
#if ENABLE_NLS
|
|
# include <libintl.h>
|
|
# define _(String) gettext(String)
|
|
#else
|
|
# define _(String) String
|
|
#endif
|
|
|
|
#include "dic.h"
|
|
#include "regexp.h"
|
|
#include "encoding.h"
|
|
|
|
|
|
#define __UNUSED__ __attribute__((unused))
|
|
|
|
/********************************************************/
|
|
/********************************************************/
|
|
/********************************************************/
|
|
|
|
const unsigned int all_letter[DIC_LETTERS] =
|
|
{
|
|
/* 1 1 1 1 1 1 1 1 1 1 2 2 2 2 2 2 2 */
|
|
/* 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 */
|
|
/* x A B C D E F G H I J K L M N O P Q R S T U V W X Y Z */
|
|
0,1,1,1,1, 1,1,1,1,1,1, 1,1,1,1,1,1,1,1,1,1,1,1, 1, 1, 1, 1
|
|
};
|
|
|
|
const unsigned int vowels[DIC_LETTERS] =
|
|
{
|
|
/* x A B C D E F G H I J K L M N O P Q R S T U V W X Y Z */
|
|
0,1,0,0,0, 1,0,0,0,1,0, 0,0,0,0,1,0,0,0,0,0,1,0, 0, 0, 1, 0
|
|
};
|
|
|
|
const unsigned int consonants[DIC_LETTERS] =
|
|
{
|
|
/* x A B C D E F G H I J K L M N O P Q R S T U V W X Y Z */
|
|
0,0,1,1,1, 0,1,1,1,0,1, 1,1,1,1,0,1,1,1,1,1,0,1, 1, 1, 1, 1
|
|
};
|
|
|
|
void init_letter_lists(struct search_RegE_list_t *iList)
|
|
{
|
|
memset (iList, 0, sizeof(*iList));
|
|
iList->minlength = 1;
|
|
iList->maxlength = 15;
|
|
iList->valid[0] = 1; // all letters
|
|
iList->symbl[0] = RE_ALL_MATCH;
|
|
iList->valid[1] = 1; // vowels
|
|
iList->symbl[1] = RE_VOWL_MATCH;
|
|
iList->valid[2] = 1; // consonants
|
|
iList->symbl[2] = RE_CONS_MATCH;
|
|
for (int i = 0; i < DIC_LETTERS; i++)
|
|
{
|
|
iList->letters[0][i] = all_letter[i];
|
|
iList->letters[1][i] = vowels[i];
|
|
iList->letters[2][i] = consonants[i];
|
|
}
|
|
iList->valid[3] = 0; // user defined list 1
|
|
iList->symbl[3] = RE_USR1_MATCH;
|
|
iList->valid[4] = 0; // user defined list 2
|
|
iList->symbl[4] = RE_USR2_MATCH;
|
|
}
|
|
|
|
/********************************************************/
|
|
/********************************************************/
|
|
/********************************************************/
|
|
void usage(const char *iBinaryName)
|
|
{
|
|
cerr << _("usage: %s dictionary") << iBinaryName << endl;
|
|
cerr << _(" dictionary: path to eliot dawg dictionary") << endl;
|
|
}
|
|
|
|
|
|
int main(int argc, char* argv[])
|
|
{
|
|
#if HAVE_SETLOCALE
|
|
// Set locale via LC_ALL
|
|
setlocale(LC_ALL, "");
|
|
#endif
|
|
|
|
#if ENABLE_NLS
|
|
// Set the message domain
|
|
bindtextdomain(PACKAGE, LOCALEDIR);
|
|
textdomain(PACKAGE);
|
|
#endif
|
|
|
|
if (argc != 2)
|
|
{
|
|
usage(argv[0]);
|
|
return 0;
|
|
}
|
|
|
|
try
|
|
{
|
|
Dictionary dic(argv[1]);
|
|
|
|
char er[200];
|
|
strcpy(er, ".");
|
|
|
|
struct search_RegE_list_t regList;
|
|
while (strcmp(er, ""))
|
|
{
|
|
cout << "**************************************************************" << endl;
|
|
cout << "**************************************************************" << endl;
|
|
cout << _("enter a regular expression:") << endl;
|
|
fgets(er, sizeof(er), stdin);
|
|
/* strip \n */
|
|
er[strlen(er) - 1] = '\0';
|
|
if (strcmp(er, "") == 0)
|
|
break;
|
|
|
|
/* automaton */
|
|
init_letter_lists(®List);
|
|
vector<wstring> wordList;
|
|
dic.searchRegExp(convertToWc(er), wordList, ®List);
|
|
|
|
cout << _("result:") << endl;
|
|
vector<wstring>::const_iterator it;
|
|
for (it = wordList.begin(); it != wordList.end(); it++)
|
|
{
|
|
cerr << convertToMb(*it) << endl;
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
catch (std::exception &e)
|
|
{
|
|
std::cerr << e.what() << endl;
|
|
return 1;
|
|
}
|
|
catch (...)
|
|
{
|
|
std::cerr << "Unkown exception taken" << endl;
|
|
return 1;
|
|
}
|
|
}
|