goldendict-ng/src/dict/dictionary.cc
xiaoyifang 5de4690b2d
fix: audio device change handled (#1242)
* fix: audio device change handled

* [autofix.ci] apply automated fixes

---------

Co-authored-by: autofix-ci[bot] <114827586+autofix-ci[bot]@users.noreply.github.com>
2023-10-15 23:15:45 +08:00

609 lines
15 KiB
C++

/* This file is (c) 2008-2012 Konstantin Isakov <ikm@goldendict.org>
* Part of GoldenDict. Licensed under GPLv3 or later, see the LICENSE file */
#include <vector>
#include <algorithm>
#include <cstdio>
#include "dictionary.hh"
#include <QCryptographicHash>
// For needToRebuildIndex(), read below
#include <QFileInfo>
#include <QDateTime>
#include "config.hh"
#include <QDir>
#include <QFileInfo>
#include <QCryptographicHash>
#include <QDateTime>
#include <QImage>
#include <QPainter>
#include <QRegularExpression>
#include "utils.hh"
#include "zipfile.hh"
namespace Dictionary {
bool Request::isFinished()
{
return Utils::AtomicInt::loadAcquire( isFinishedFlag );
}
void Request::update()
{
if ( !Utils::AtomicInt::loadAcquire( isFinishedFlag ) ) {
emit updated();
}
}
void Request::finish()
{
if ( !Utils::AtomicInt::loadAcquire( isFinishedFlag ) ) {
{
QMutexLocker _( &dataMutex );
isFinishedFlag.ref();
cond.wakeAll();
}
emit finished();
}
}
void Request::setErrorString( QString const & str )
{
QMutexLocker _( &errorStringMutex );
errorString = str;
}
QString Request::getErrorString()
{
QMutexLocker _( &errorStringMutex );
return errorString;
}
///////// WordSearchRequest
size_t WordSearchRequest::matchesCount()
{
QMutexLocker _( &dataMutex );
return matches.size();
}
WordMatch WordSearchRequest::operator[]( size_t index )
{
QMutexLocker _( &dataMutex );
if ( index >= matches.size() )
throw exIndexOutOfRange();
return matches[ index ];
}
vector< WordMatch > & WordSearchRequest::getAllMatches()
{
if ( !isFinished() )
throw exRequestUnfinished();
return matches;
}
void WordSearchRequest::addMatch( WordMatch const & match )
{
unsigned n;
for ( n = 0; n < matches.size(); n++ )
if ( matches[ n ].word.compare( match.word ) == 0 )
break;
if ( n >= matches.size() )
matches.push_back( match );
}
////////////// DataRequest
long DataRequest::dataSize()
{
QMutexLocker _( &dataMutex );
long size = hasAnyData ? (long)data.size() : -1;
if ( size == 0 && !isFinished() ) {
cond.wait( &dataMutex );
size = hasAnyData ? (long)data.size() : -1;
}
return size;
}
void DataRequest::appendDataSlice( const void * buffer, size_t size )
{
QMutexLocker _( &dataMutex );
size_t offset = data.size();
data.resize( data.size() + size );
memcpy( &data.front() + offset, buffer, size );
cond.wakeAll();
}
void DataRequest::appendString( std::string_view str )
{
QMutexLocker _( &dataMutex );
data.reserve( data.size() + str.size() );
data.insert( data.end(), str.begin(), str.end() );
cond.wakeAll();
}
void DataRequest::getDataSlice( size_t offset, size_t size, void * buffer )
{
if ( size == 0 ) {
return;
}
QMutexLocker _( &dataMutex );
if ( !hasAnyData )
throw exSliceOutOfRange();
memcpy( buffer, &data[ offset ], size );
}
vector< char > & DataRequest::getFullData()
{
if ( !isFinished() )
throw exRequestUnfinished();
return data;
}
Class::Class( string const & id_, vector< string > const & dictionaryFiles_ ):
id( id_ ),
dictionaryFiles( dictionaryFiles_ ),
indexedFtsDoc( 0 ),
dictionaryIconLoaded( false ),
can_FTS( false ),
FTS_index_completed( false )
{
}
void Class::deferredInit()
{
//base method.
}
sptr< WordSearchRequest > Class::stemmedMatch( wstring const & /*str*/,
unsigned /*minLength*/,
unsigned /*maxSuffixVariation*/,
unsigned long /*maxResults*/ )
{
return std::make_shared< WordSearchRequestInstant >();
}
sptr< WordSearchRequest > Class::findHeadwordsForSynonym( wstring const & )
{
return std::make_shared< WordSearchRequestInstant >();
}
vector< wstring > Class::getAlternateWritings( wstring const & ) noexcept
{
return {};
}
QString Class::getContainingFolder() const
{
if ( !dictionaryFiles.empty() ) {
auto fileInfo = QFileInfo( QString::fromStdString( dictionaryFiles[ 0 ] ) );
if ( fileInfo.isDir() )
return fileInfo.absoluteFilePath();
return fileInfo.absolutePath();
}
return {};
}
sptr< DataRequest > Class::getResource( string const & /*name*/ )
{
return std::make_shared< DataRequestInstant >( false );
}
sptr< DataRequest > Class::getSearchResults( const QString &, int, bool, bool )
{
return std::make_shared< DataRequestInstant >( false );
}
QString const & Class::getDescription()
{
return dictionaryDescription;
}
QString Class::getMainFilename()
{
return {};
}
QIcon const & Class::getIcon() noexcept
{
if ( !dictionaryIconLoaded )
loadIcon();
return dictionaryIcon;
}
void Class::loadIcon() noexcept
{
dictionaryIconLoaded = true;
}
bool Class::loadIconFromFile( QString const & _filename, bool isFullName )
{
QFileInfo info;
QString fileName( _filename );
if ( isFullName )
info = QFileInfo( fileName );
else {
fileName += "bmp";
info = QFileInfo( fileName );
if ( !info.isFile() ) {
fileName.chop( 3 );
fileName += "png";
info = QFileInfo( fileName );
}
if ( !info.isFile() ) {
fileName.chop( 3 );
fileName += "jpg";
info = QFileInfo( fileName );
}
if ( !info.isFile() ) {
fileName.chop( 3 );
fileName += "ico";
info = QFileInfo( fileName );
}
}
if ( info.isFile() ) {
QImage img( fileName );
if ( !img.isNull() ) {
// Load successful
//some icon is very large ,will crash the application.
img = img.scaledToWidth( 64 );
// Apply the color key
#if ( QT_VERSION >= QT_VERSION_CHECK( 6, 0, 0 ) )
img.setAlphaChannel( img.createMaskFromColor( QColor( 192, 192, 192 ).rgb(), Qt::MaskOutColor ) );
#endif
// Transform it to be square
int max = img.width() > img.height() ? img.width() : img.height();
QImage result( max, max, QImage::Format_ARGB32 );
result.fill( 0 ); // Black transparent
QPainter painter( &result );
painter.setRenderHint( QPainter::RenderHint::Antialiasing );
painter.drawImage( QPoint( img.width() == max ? 0 : ( max - img.width() ) / 2,
img.height() == max ? 0 : ( max - img.height() ) / 2 ),
img );
painter.end();
dictionaryIcon = QIcon( QPixmap::fromImage( result ) );
return !dictionaryIcon.isNull();
}
}
return false;
}
bool Class::loadIconFromText( QString iconUrl, QString const & text )
{
if ( text.isEmpty() )
return false;
QImage img( iconUrl );
if ( !img.isNull() ) {
int iconSize = 64;
//some icon is very large ,will crash the application.
img = img.scaledToWidth( iconSize );
QImage result( iconSize, iconSize, QImage::Format_ARGB32 );
result.fill( 0 ); // Black transparent
int max = img.width() > img.height() ? img.width() : img.height();
QPainter painter( &result );
painter.setRenderHint( QPainter::RenderHint::Antialiasing );
painter.drawImage( QPoint( img.width() == max ? 0 : ( max - img.width() ) / 2,
img.height() == max ? 0 : ( max - img.height() ) / 2 ),
img );
painter.setCompositionMode( QPainter::CompositionMode_SourceAtop );
QFont font = painter.font();
//the text should be a little smaller than the icon
font.setPixelSize( iconSize * 0.6 );
font.setWeight( QFont::Bold );
painter.setFont( font );
const QRect rectangle = QRect( 0, 0, iconSize, iconSize );
//select a single char.
auto abbrName = getAbbrName( text );
painter.setPen( QColor( 4, 57, 108, 200 ) );
painter.drawText( rectangle, Qt::AlignCenter, abbrName );
painter.end();
dictionaryIcon = QIcon( QPixmap::fromImage( result ) );
return !dictionaryIcon.isNull();
}
return false;
}
QString Class::getAbbrName( QString const & text )
{
if ( text.isEmpty() )
return {};
//remove whitespace,number,mark,puncuation,symbol
QString simplified = text;
simplified.remove(
QRegularExpression( R"([\p{Z}\p{N}\p{M}\p{P}\p{S}])", QRegularExpression::UseUnicodePropertiesOption ) );
if ( simplified.isEmpty() )
return {};
int index = qHash( simplified ) % simplified.size();
QString abbrName;
if ( !Utils::isCJKChar( simplified.at( index ).unicode() ) ) {
// take two chars.
abbrName = simplified.mid( index, 2 );
if ( abbrName.size() == 1 ) {
//make up two characters.
abbrName = abbrName + simplified.at( 0 );
}
}
else {
abbrName = simplified.mid( index, 1 );
}
return abbrName;
}
void Class::isolateCSS( QString & css, QString const & wrapperSelector )
{
if ( css.isEmpty() )
return;
QRegularExpression reg1( R"(\/\*(?:.(?!\*\/))*.?\*\/)", QRegularExpression::DotMatchesEverythingOption );
QRegularExpression reg2( R"([ \*\>\+,;:\[\{\]])" );
QRegularExpression reg3( "[,;\\{]" );
int currentPos = 0;
QString newCSS;
QString prefix( "#gdfrom-" );
prefix += QString::fromLatin1( getId().c_str() );
if ( !wrapperSelector.isEmpty() )
prefix += " " + wrapperSelector;
// Strip comments
css.replace( reg1, QString() );
for ( ;; ) {
if ( currentPos >= css.length() )
break;
QChar ch = css[ currentPos ];
if ( ch == '@' ) {
// @ rules
int n = currentPos;
if ( css.mid( currentPos, 7 ).compare( "@import", Qt::CaseInsensitive ) == 0
|| css.mid( currentPos, 10 ).compare( "@font-face", Qt::CaseInsensitive ) == 0
|| css.mid( currentPos, 10 ).compare( "@namespace", Qt::CaseInsensitive ) == 0
|| css.mid( currentPos, 8 ).compare( "@charset", Qt::CaseInsensitive ) == 0 ) {
// Copy rule as is.
n = css.indexOf( ';', currentPos );
int n2 = css.indexOf( '{', currentPos );
if ( n2 > 0 && n > n2 )
n = n2 - 1;
}
else if ( css.mid( currentPos, 6 ).compare( "@media", Qt::CaseInsensitive ) == 0 ) {
// We must to parse it content to isolate it.
// Copy all up to '{' and continue parse inside.
n = css.indexOf( '{', currentPos );
}
else if ( css.mid( currentPos, 5 ).compare( "@page", Qt::CaseInsensitive ) == 0 ) {
// Don't copy rule. GD use own page layout.
n = css.indexOf( '}', currentPos );
if ( n < 0 )
break;
currentPos = n + 1;
continue;
}
else {
// Copy rule as is.
n = css.indexOf( '}', currentPos );
}
newCSS.append( css.mid( currentPos, n < 0 ? n : n - currentPos + 1 ) );
if ( n < 0 )
break;
currentPos = n + 1;
continue;
}
if ( ch == '{' ) {
// Selector declaration block.
// We copy it up to '}' as is.
int n = css.indexOf( '}', currentPos );
newCSS.append( css.mid( currentPos, n == -1 ? n : n - currentPos + 1 ) );
if ( n < 0 )
break;
currentPos = n + 1;
continue;
}
if ( ch.isLetter() || ch == '.' || ch == '#' || ch == '*' || ch == '\\' || ch == ':' ) {
if ( ch.isLetter() || ch == '*' ) {
// Check for namespace prefix
QChar chr;
for ( int i = currentPos; i < css.length(); i++ ) {
chr = css[ i ];
if ( chr.isLetterOrNumber() || chr.isMark() || chr == '_' || chr == '-' || ( chr == '*' && i == currentPos ) )
continue;
if ( chr == '|' ) {
// Namespace prefix found, copy it as is
newCSS.append( css.mid( currentPos, i - currentPos + 1 ) );
currentPos = i + 1;
}
break;
}
if ( chr == '|' )
continue;
}
// This is some selector.
// We must to add the isolate prefix to it.
int n = css.indexOf( reg2, currentPos + 1 );
QString s = css.mid( currentPos, n < 0 ? n : n - currentPos );
if ( n < 0 ) {
newCSS.append( s );
break;
}
QString trimmed = s.trimmed();
if ( trimmed.compare( "body", Qt::CaseInsensitive ) == 0
|| trimmed.compare( "html", Qt::CaseInsensitive ) == 0 ) {
newCSS.append( s + " " + prefix + " " );
currentPos += 4;
}
else {
newCSS.append( prefix + " " );
}
n = css.indexOf( reg3, currentPos );
s = css.mid( currentPos, n < 0 ? n : n - currentPos );
newCSS.append( s );
if ( n < 0 )
break;
currentPos = n;
continue;
}
newCSS.append( ch );
++currentPos;
}
css = newCSS;
}
string makeDictionaryId( vector< string > const & dictionaryFiles ) noexcept
{
std::vector< string > sortedList;
if ( Config::isPortableVersion() ) {
// For portable version, we use relative paths
sortedList.reserve( dictionaryFiles.size() );
const QDir dictionariesDir( Config::getPortableVersionDictionaryDir() );
for ( const auto & full : dictionaryFiles ) {
QFileInfo fileInfo( QString::fromStdString( full ) );
if ( fileInfo.isAbsolute() )
sortedList.push_back( dictionariesDir.relativeFilePath( fileInfo.filePath() ).toStdString() );
else {
// Well, it's relative. We don't technically support those, but
// what the heck
sortedList.push_back( full );
}
}
}
else
sortedList = dictionaryFiles;
std::sort( sortedList.begin(), sortedList.end() );
QCryptographicHash hash( QCryptographicHash::Md5 );
for ( const auto & i : sortedList ) {
hash.addData( i.c_str(), i.size() + 1 );
}
return hash.result().toHex().data();
}
// While this file is not supposed to have any Qt stuff since it's used by
// the dictionary backends, there's no platform-independent way to get hold
// of a timestamp of the file, so we use here Qt anyway. It is supposed to
// be fixed in the future when it's needed.
bool needToRebuildIndex( vector< string > const & dictionaryFiles, string const & indexFile ) noexcept
{
unsigned long lastModified = 0;
for ( const auto & dictionaryFile : dictionaryFiles ) {
QString name = QString::fromUtf8( dictionaryFile.c_str() );
QFileInfo fileInfo( name );
unsigned long ts;
if ( fileInfo.isDir() )
continue;
if ( name.toLower().endsWith( ".zip" ) ) {
ZipFile::SplitZipFile zf( name );
if ( !zf.exists() )
return true;
ts = zf.lastModified().toSecsSinceEpoch();
}
else {
if ( !fileInfo.exists() )
continue;
ts = fileInfo.lastModified().toSecsSinceEpoch();
}
if ( ts > lastModified )
lastModified = ts;
}
QFileInfo fileInfo( indexFile.c_str() );
if ( !fileInfo.exists() )
return true;
return fileInfo.lastModified().toSecsSinceEpoch() < lastModified;
}
string getFtsSuffix()
{
return "_FTS_x";
}
QString generateRandomDictionaryId()
{
return QString(
QCryptographicHash::hash( QDateTime::currentDateTime().toString( "\"Random\"dd.MM.yyyy hh:mm:ss.zzz" ).toUtf8(),
QCryptographicHash::Md5 )
.toHex() );
}
QMap< std::string, sptr< Dictionary::Class > > dictToMap( std::vector< sptr< Dictionary::Class > > const & dicts )
{
QMap< std::string, sptr< Dictionary::Class > > dictMap;
for ( auto & dict : dicts ) {
if ( !dict )
continue;
dictMap.insert( dict.get()->getId(), dict );
}
return dictMap;
}
} // namespace Dictionary