mirror of
https://github.com/xiaoyifang/goldendict-ng.git
synced 2024-11-27 19:24:08 +00:00
0e238c26fb
mdx dictionaries take the most part of all dictionaries. when loop through the filepath ,remove mdx file to reduce further check .
427 lines
13 KiB
C++
427 lines
13 KiB
C++
/* This file is (c) 2008-2012 Konstantin Isakov <ikm@goldendict.org>
|
|
* Part of GoldenDict. Licensed under GPLv3 or later, see the LICENSE file */
|
|
|
|
#include "loaddictionaries.hh"
|
|
#include "initializing.hh"
|
|
#include "bgl.hh"
|
|
#include "stardict.hh"
|
|
#include "lsa.hh"
|
|
#include "dsl.hh"
|
|
#include "mediawiki.hh"
|
|
#include "sounddir.hh"
|
|
#include "hunspell.hh"
|
|
#include "dictdfiles.hh"
|
|
#include "romaji.hh"
|
|
#include "russiantranslit.hh"
|
|
#include "german.hh"
|
|
#include "greektranslit.hh"
|
|
#include "belarusiantranslit.hh"
|
|
#include "website.hh"
|
|
#include "forvo.hh"
|
|
#include "programs.hh"
|
|
#include "voiceengines.hh"
|
|
#include "gddebug.hh"
|
|
#include "fsencoding.hh"
|
|
#include "xdxf.hh"
|
|
#include "sdict.hh"
|
|
#include "aard.hh"
|
|
#include "zipsounds.hh"
|
|
#include "mdx.hh"
|
|
#include "zim.hh"
|
|
#include "dictserver.hh"
|
|
#include "slob.hh"
|
|
#include "gls.hh"
|
|
|
|
#ifndef NO_EPWING_SUPPORT
|
|
#include "epwing.hh"
|
|
#endif
|
|
|
|
#ifdef MAKE_CHINESE_CONVERSION_SUPPORT
|
|
#include "chinese.hh"
|
|
#endif
|
|
|
|
#include <QMessageBox>
|
|
#include <QDir>
|
|
|
|
#include <set>
|
|
|
|
using std::set;
|
|
|
|
using std::string;
|
|
using std::vector;
|
|
|
|
LoadDictionaries::LoadDictionaries( Config::Class const & cfg ):
|
|
paths( cfg.paths ), soundDirs( cfg.soundDirs ), hunspell( cfg.hunspell ),
|
|
transliteration( cfg.transliteration ),
|
|
exceptionText( "Load did not finish" ), // Will be cleared upon success
|
|
maxPictureWidth( cfg.maxPictureWidth ),
|
|
maxHeadwordSize( cfg.maxHeadwordSize ),
|
|
maxHeadwordToExpand( cfg.maxHeadwordsToExpand )
|
|
{
|
|
// Populate name filters
|
|
|
|
nameFilters << "*.bgl" << "*.ifo" << "*.lsa" << "*.dat"
|
|
<< "*.dsl" << "*.dsl.dz" << "*.index" << "*.xdxf"
|
|
<< "*.xdxf.dz" << "*.dct" << "*.aar" << "*.zips"
|
|
<< "*.mdx" << "*.gls" << "*.gls.dz"
|
|
#ifdef MAKE_ZIM_SUPPORT
|
|
<< "*.zim" << "*.zimaa" << "*.slob"
|
|
#endif
|
|
#ifndef NO_EPWING_SUPPORT
|
|
<< "*catalogs"
|
|
#endif
|
|
;
|
|
}
|
|
|
|
void LoadDictionaries::run()
|
|
{
|
|
try
|
|
{
|
|
for( Config::Paths::const_iterator i = paths.begin(); i != paths.end(); ++i )
|
|
handlePath( *i );
|
|
|
|
// Make soundDirs
|
|
{
|
|
vector< sptr< Dictionary::Class > > soundDirDictionaries =
|
|
SoundDir::makeDictionaries( soundDirs, FsEncoding::encode( Config::getIndexDir() ), *this );
|
|
|
|
dictionaries.insert( dictionaries.end(), soundDirDictionaries.begin(),
|
|
soundDirDictionaries.end() );
|
|
}
|
|
|
|
// Make hunspells
|
|
{
|
|
vector< sptr< Dictionary::Class > > hunspellDictionaries =
|
|
HunspellMorpho::makeDictionaries( hunspell );
|
|
|
|
dictionaries.insert( dictionaries.end(), hunspellDictionaries.begin(),
|
|
hunspellDictionaries.end() );
|
|
}
|
|
|
|
exceptionText.clear();
|
|
}
|
|
catch( std::exception & e )
|
|
{
|
|
exceptionText = e.what();
|
|
}
|
|
}
|
|
|
|
void LoadDictionaries::handlePath( Config::Path const & path )
|
|
{
|
|
vector< string > allFiles;
|
|
|
|
QDir dir( path.path );
|
|
|
|
QFileInfoList entries = dir.entryInfoList( nameFilters, QDir::AllDirs | QDir::Files | QDir::NoDotAndDotDot );
|
|
|
|
for( QFileInfoList::const_iterator i = entries.constBegin();
|
|
i != entries.constEnd(); ++i )
|
|
{
|
|
QString fullName = i->absoluteFilePath();
|
|
|
|
if ( path.recursive && i->isDir() )
|
|
{
|
|
// Make sure the path doesn't look like with dsl resources
|
|
if ( !fullName.endsWith( ".dsl.files", Qt::CaseInsensitive ) &&
|
|
!fullName.endsWith( ".dsl.dz.files", Qt::CaseInsensitive ) )
|
|
handlePath( Config::Path( fullName, true ) );
|
|
}
|
|
|
|
if ( !i->isDir() )
|
|
allFiles.push_back( FsEncoding::encode( QDir::toNativeSeparators( fullName ) ) );
|
|
}
|
|
|
|
{
|
|
vector< sptr< Dictionary::Class > > mdxDictionaries =
|
|
Mdx::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this );
|
|
|
|
dictionaries.insert( dictionaries.end(), mdxDictionaries.begin(),
|
|
mdxDictionaries.end() );
|
|
}
|
|
|
|
{
|
|
vector< sptr< Dictionary::Class > > bglDictionaries =
|
|
Bgl::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this );
|
|
|
|
dictionaries.insert( dictionaries.end(), bglDictionaries.begin(),
|
|
bglDictionaries.end() );
|
|
}
|
|
|
|
{
|
|
vector< sptr< Dictionary::Class > > stardictDictionaries =
|
|
Stardict::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this, maxHeadwordToExpand );
|
|
|
|
dictionaries.insert( dictionaries.end(), stardictDictionaries.begin(),
|
|
stardictDictionaries.end() );
|
|
}
|
|
|
|
{
|
|
vector< sptr< Dictionary::Class > > lsaDictionaries =
|
|
Lsa::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this );
|
|
|
|
dictionaries.insert( dictionaries.end(), lsaDictionaries.begin(),
|
|
lsaDictionaries.end() );
|
|
}
|
|
|
|
{
|
|
vector< sptr< Dictionary::Class > > dslDictionaries =
|
|
Dsl::makeDictionaries(
|
|
allFiles, FsEncoding::encode( Config::getIndexDir() ), *this, maxPictureWidth, maxHeadwordSize );
|
|
|
|
dictionaries.insert( dictionaries.end(), dslDictionaries.begin(),
|
|
dslDictionaries.end() );
|
|
}
|
|
|
|
{
|
|
vector< sptr< Dictionary::Class > > dictdDictionaries =
|
|
DictdFiles::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this );
|
|
|
|
dictionaries.insert( dictionaries.end(), dictdDictionaries.begin(),
|
|
dictdDictionaries.end() );
|
|
}
|
|
{
|
|
vector< sptr< Dictionary::Class > > xdxfDictionaries =
|
|
Xdxf::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this );
|
|
|
|
dictionaries.insert( dictionaries.end(), xdxfDictionaries.begin(),
|
|
xdxfDictionaries.end() );
|
|
}
|
|
{
|
|
vector< sptr< Dictionary::Class > > sdictDictionaries =
|
|
Sdict::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this );
|
|
|
|
dictionaries.insert( dictionaries.end(), sdictDictionaries.begin(),
|
|
sdictDictionaries.end() );
|
|
}
|
|
{
|
|
vector< sptr< Dictionary::Class > > aardDictionaries =
|
|
Aard::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this, maxHeadwordToExpand );
|
|
|
|
dictionaries.insert( dictionaries.end(), aardDictionaries.begin(),
|
|
aardDictionaries.end() );
|
|
}
|
|
{
|
|
vector< sptr< Dictionary::Class > > zipSoundsDictionaries =
|
|
ZipSounds::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this );
|
|
|
|
dictionaries.insert( dictionaries.end(), zipSoundsDictionaries.begin(),
|
|
zipSoundsDictionaries.end() );
|
|
}
|
|
{
|
|
vector< sptr< Dictionary::Class > > glsDictionaries =
|
|
Gls::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this );
|
|
|
|
dictionaries.insert( dictionaries.end(), glsDictionaries.begin(),
|
|
glsDictionaries.end() );
|
|
}
|
|
#ifdef MAKE_ZIM_SUPPORT
|
|
{
|
|
vector< sptr< Dictionary::Class > > zimDictionaries =
|
|
Zim::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this, maxHeadwordToExpand );
|
|
|
|
dictionaries.insert( dictionaries.end(), zimDictionaries.begin(),
|
|
zimDictionaries.end() );
|
|
}
|
|
{
|
|
vector< sptr< Dictionary::Class > > slobDictionaries =
|
|
Slob::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this, maxHeadwordToExpand );
|
|
|
|
dictionaries.insert( dictionaries.end(), slobDictionaries.begin(),
|
|
slobDictionaries.end() );
|
|
}
|
|
#endif
|
|
#ifndef NO_EPWING_SUPPORT
|
|
{
|
|
vector< sptr< Dictionary::Class > > epwingDictionaries =
|
|
Epwing::makeDictionaries( allFiles, FsEncoding::encode( Config::getIndexDir() ), *this );
|
|
|
|
dictionaries.insert( dictionaries.end(), epwingDictionaries.begin(),
|
|
epwingDictionaries.end() );
|
|
}
|
|
#endif
|
|
}
|
|
|
|
void LoadDictionaries::indexingDictionary( string const & dictionaryName ) throw()
|
|
{
|
|
emit indexingDictionarySignal( QString::fromUtf8( dictionaryName.c_str() ) );
|
|
}
|
|
|
|
|
|
void loadDictionaries( QWidget * parent, bool showInitially,
|
|
Config::Class const & cfg,
|
|
std::vector< sptr< Dictionary::Class > > & dictionaries,
|
|
QNetworkAccessManager & dictNetMgr,
|
|
bool doDeferredInit_ )
|
|
{
|
|
dictionaries.clear();
|
|
|
|
::Initializing init( parent, showInitially );
|
|
|
|
// Start a thread to load all the dictionaries
|
|
|
|
LoadDictionaries loadDicts( cfg );
|
|
|
|
QObject::connect( &loadDicts, SIGNAL( indexingDictionarySignal( QString const & ) ),
|
|
&init, SLOT( indexing( QString const & ) ) );
|
|
|
|
QEventLoop localLoop;
|
|
|
|
QObject::connect( &loadDicts, SIGNAL( finished() ),
|
|
&localLoop, SLOT( quit() ) );
|
|
|
|
loadDicts.start();
|
|
|
|
localLoop.exec();
|
|
|
|
loadDicts.wait();
|
|
|
|
if ( loadDicts.getExceptionText().size() )
|
|
{
|
|
QMessageBox::critical( parent, QCoreApplication::translate( "LoadDictionaries", "Error loading dictionaries" ),
|
|
QString::fromUtf8( loadDicts.getExceptionText().c_str() ) );
|
|
|
|
return;
|
|
}
|
|
|
|
dictionaries = loadDicts.getDictionaries();
|
|
|
|
///// We create transliterations synchronously since they are very simple
|
|
|
|
#ifdef MAKE_CHINESE_CONVERSION_SUPPORT
|
|
// Make Chinese conversion
|
|
{
|
|
vector< sptr< Dictionary::Class > > chineseDictionaries =
|
|
Chinese::makeDictionaries( cfg.transliteration.chinese );
|
|
|
|
dictionaries.insert( dictionaries.end(), chineseDictionaries.begin(),
|
|
chineseDictionaries.end() );
|
|
}
|
|
#endif
|
|
|
|
// Make Romaji
|
|
{
|
|
vector< sptr< Dictionary::Class > > romajiDictionaries =
|
|
Romaji::makeDictionaries( cfg.transliteration.romaji );
|
|
|
|
dictionaries.insert( dictionaries.end(), romajiDictionaries.begin(),
|
|
romajiDictionaries.end() );
|
|
}
|
|
|
|
// Make Russian transliteration
|
|
if ( cfg.transliteration.enableRussianTransliteration )
|
|
dictionaries.push_back( RussianTranslit::makeDictionary() );
|
|
|
|
// Make German transliteration
|
|
if ( cfg.transliteration.enableGermanTransliteration )
|
|
dictionaries.push_back( GermanTranslit::makeDictionary() );
|
|
|
|
// Make Greek transliteration
|
|
if ( cfg.transliteration.enableGreekTransliteration )
|
|
dictionaries.push_back( GreekTranslit::makeDictionary() );
|
|
|
|
// Make Belarusian transliteration
|
|
if ( cfg.transliteration.enableBelarusianTransliteration )
|
|
{
|
|
vector< sptr< Dictionary::Class > > dicts = BelarusianTranslit::makeDictionaries();
|
|
dictionaries.insert( dictionaries.end(), dicts.begin(), dicts.end() );
|
|
}
|
|
|
|
///// We create MediaWiki dicts synchronously, since they use netmgr
|
|
|
|
{
|
|
vector< sptr< Dictionary::Class > > dicts =
|
|
MediaWiki::makeDictionaries( loadDicts, cfg.mediawikis, dictNetMgr );
|
|
|
|
dictionaries.insert( dictionaries.end(), dicts.begin(), dicts.end() );
|
|
}
|
|
|
|
///// WebSites are very simple, no need to create them asynchronously
|
|
{
|
|
vector< sptr< Dictionary::Class > > dicts =
|
|
WebSite::makeDictionaries( cfg.webSites, dictNetMgr );
|
|
|
|
dictionaries.insert( dictionaries.end(), dicts.begin(), dicts.end() );
|
|
}
|
|
|
|
//// Forvo dictionaries
|
|
|
|
{
|
|
vector< sptr< Dictionary::Class > > dicts =
|
|
Forvo::makeDictionaries( loadDicts, cfg.forvo, dictNetMgr );
|
|
|
|
dictionaries.insert( dictionaries.end(), dicts.begin(), dicts.end() );
|
|
}
|
|
|
|
//// Programs
|
|
{
|
|
vector< sptr< Dictionary::Class > > dicts =
|
|
Programs::makeDictionaries( cfg.programs );
|
|
|
|
dictionaries.insert( dictionaries.end(), dicts.begin(), dicts.end() );
|
|
}
|
|
|
|
//// Text to Speech
|
|
{
|
|
vector< sptr< Dictionary::Class > > dicts =
|
|
VoiceEngines::makeDictionaries( cfg.voiceEngines );
|
|
|
|
dictionaries.insert( dictionaries.end(), dicts.begin(), dicts.end() );
|
|
}
|
|
|
|
{
|
|
vector< sptr< Dictionary::Class > > dicts =
|
|
DictServer::makeDictionaries( cfg.dictServers );
|
|
|
|
dictionaries.insert( dictionaries.end(), dicts.begin(), dicts.end() );
|
|
}
|
|
|
|
GD_DPRINTF( "Load done\n" );
|
|
|
|
// Remove any stale index files
|
|
|
|
set< string > ids;
|
|
std::pair< std::set< string >::iterator, bool > ret;
|
|
|
|
for( unsigned x = dictionaries.size(); x--; )
|
|
{
|
|
ret = ids.insert( dictionaries[ x ]->getId() );
|
|
if( !ret.second )
|
|
{
|
|
gdWarning( "Duplicate dictionary ID found: ID=%s, name=\"%s\", path=\"%s\"",
|
|
dictionaries[ x ]->getId().c_str(),
|
|
dictionaries[ x ]->getName().c_str(),
|
|
dictionaries[ x ]->getDictionaryFilenames().empty() ?
|
|
"" : dictionaries[ x ]->getDictionaryFilenames()[ 0 ].c_str()
|
|
);
|
|
}
|
|
}
|
|
|
|
QDir indexDir( Config::getIndexDir() );
|
|
|
|
QStringList allIdxFiles = indexDir.entryList( QDir::Files );
|
|
|
|
for( QStringList::const_iterator i = allIdxFiles.constBegin();
|
|
i != allIdxFiles.constEnd(); ++i )
|
|
{
|
|
if ( ids.find( FsEncoding::encode( *i ) ) == ids.end()
|
|
&& i->size() == 32 )
|
|
indexDir.remove( *i );
|
|
else
|
|
if ( i->endsWith( "_FTS" )
|
|
&& i->size() == 36
|
|
&& ids.find( FsEncoding::encode( i->left( 32 ) ) ) == ids.end() )
|
|
indexDir.remove( *i );
|
|
}
|
|
|
|
// Run deferred inits
|
|
|
|
if ( doDeferredInit_ )
|
|
doDeferredInit( dictionaries );
|
|
}
|
|
|
|
void doDeferredInit( std::vector< sptr< Dictionary::Class > > & dictionaries )
|
|
{
|
|
for( unsigned x = 0; x < dictionaries.size(); ++x )
|
|
dictionaries[ x ]->deferredInit();
|
|
}
|