goldendict-ng/epwing_book.hh

252 lines
5.8 KiB
C++
Raw Normal View History

2014-05-20 13:59:56 +00:00
#ifndef __EPWING_BOOK_HH_INCLUDED__
#define __EPWING_BOOK_HH_INCLUDED__
#include <qglobal.h>
#if defined( Q_OS_WIN32 ) || defined( Q_OS_MAC )
#define _FILE_OFFSET_BITS 64
#endif
#include "dictionary.hh"
#include "ex.hh"
#include "mutex.hh"
#include <QString>
2022-02-27 14:42:40 +00:00
#if (QT_VERSION >= QT_VERSION_CHECK(6,0,0))
#include <QtCore5Compat/QTextCodec>
#else
2014-05-20 13:59:56 +00:00
#include <QTextCodec>
2022-02-27 14:42:40 +00:00
#endif
2014-05-20 13:59:56 +00:00
#include <QMap>
#include <QVector>
2014-05-20 13:59:56 +00:00
#include <vector>
#include <string>
#ifdef _MSC_VER
#include <stub_msvc.h>
#endif
2014-05-20 13:59:56 +00:00
#include <eb/eb.h>
namespace Epwing {
// Exception types raised by the Epwing code, both derived from Dictionary::Ex.
// NOTE(review): DEF_EX_STR is presumably provided by "ex.hh" and takes
// (exception name, message prefix, base class) - confirm against that header.
DEF_EX_STR( exEbLibrary, "EB library report error", Dictionary::Ex )
DEF_EX_STR( exEpwing, "Epwing parsing error:", Dictionary::Ex )
// Module-level setup and teardown hooks; only declared here, defined elsewhere.
// NOTE(review): presumably these wrap the EB library's global init/shutdown -
// confirm in the implementation file before relying on call-order guarantees.
void initialize();
void finalize();
namespace Book {
using std::vector;
using std::string;
// Size limits used by the Epwing reader, exposed as unnamed-enum constants so
// they can be used wherever an integral constant expression is required.
// NOTE(review): units are presumably bytes - confirm against the call sites.
enum {
  TextBufferSize   = 4095,    // limit for a single text buffer
  BinaryBufferSize = 50000,   // limit for a single binary buffer
  TextSizeLimit    = 2800000, // overall text size limit
};
// A headword together with a (page, offset) pair.
// NOTE(review): page/offset presumably mirror the fields of the EB library's
// EB_Position for the headword's article - confirm against the callers.
struct EpwingHeadword
{
  QString headword;
  // Zero-initialised so a default-constructed object never carries
  // indeterminate values if it is read before being filled in.
  quint32 page   = 0;
  quint32 offset = 0;
};
class EpwingBook
{
typedef QPair< int, int > EWPos;
2014-05-20 13:59:56 +00:00
void setErrorString( QString const & func, EB_Error_Code code );
EB_Book book;
EB_Appendix appendix;
EB_Hookset hookSet, refHookSet;
2014-05-20 13:59:56 +00:00
EB_Subbook_Code subBookList[ EB_MAX_SUBBOOKS ];
EB_Subbook_Code subAppendixList[ EB_MAX_SUBBOOKS ];
EB_Position currentPosition, indexHeadwordsPosition;
2014-05-20 13:59:56 +00:00
int subBookCount, subAppendixCount;
int currentSubBook;
QString error_string;
QString mainCacheDir, rootDir;
QString cacheImagesDir, cacheSoundsDir, cacheMoviesDir, cacheFontsDir;
QString dictID;
QTextCodec * codec_ISO, * codec_GB, * codec_Euc;
QStack< unsigned int > decorationStack;
int monoWidth, monoHeight;
QStringList imageCacheList, soundsCacheList, moviesCacheList, fontsCacheList;
QMap< QString, QString > baseFontsMap, customFontsMap;
2014-05-20 13:59:56 +00:00
QVector< int > refPages, refOffsets;
2022-10-04 07:07:04 +00:00
QMap< uint64_t,bool > allHeadwordPositions;
QMap< uint64_t, bool > allRefPositions;
QVector< EWPos > LinksQueue;
2014-05-20 13:59:56 +00:00
int refOpenCount, refCloseCount;
static Mutex libMutex;
QString createCacheDir( QString const & dir);
// Close unslosed tags
void finalizeText( QString & text );
// Reset internal variables
void prepareToRead();
// Retrieve references from article
void getReferencesFromText( int page, int offset );
// Move to next article
EB_Error_Code forwardText( EB_Position & startPos );
// Retrieve article text from dictionary
2022-10-04 07:07:04 +00:00
QString getText( int page, int offset, bool text_only);
unsigned int normalizeDecorationCode( unsigned int code );
QByteArray codeToUnicode( QString const & code );
2014-05-20 13:59:56 +00:00
public:
enum DecorationCodes {
UNKNOWN = 0,
ITALIC = 1,
BOLD = 3,
EMPHASIS = 4,
SUBSCRIPT = 5,
SUPERSCRIPT = 6
};
EpwingBook();
~EpwingBook();
Mutex & getLibMutex()
{ return libMutex; }
QString const &errorString() const
{ return error_string; }
QTextCodec * codecISO()
{ return codec_ISO; }
QTextCodec * codecGB()
{ return codec_GB; }
QTextCodec *codecEuc()
{ return codec_Euc; }
int getSubBookCount()
{ return subBookCount; }
void setDictID( const string & id )
{ dictID = QString::fromUtf8( id.c_str() ); }
QString const & getImagesCacheDir()
{ return cacheImagesDir; }
QString const & getSoundsCacheDir()
{ return cacheSoundsDir; }
QString const & getMoviesCacheDir()
{ return cacheMoviesDir; }
void clearBuffers()
{
allHeadwordPositions.clear();
2022-10-04 07:07:04 +00:00
allRefPositions.clear();
LinksQueue.clear();
}
2014-05-20 13:59:56 +00:00
// Make name for resource
QString makeFName( QString const & ext, int page, int offset ) const;
// Store all files in Epwing folder
static void collectFilenames( QString const & directory,
vector< string > & files );
// Initialize dictionary book
int setBook( string const & directory );
// Set subbook inside dictionary
bool setSubBook( int book_nom );
void setCacheDirectory( QString const & cacheDir );
QString getCurrentSubBookDirectory();
QString copyright();
QString title();
// Seek to first article
void getFirstHeadword( EpwingHeadword & head );
// Find next headword and article position
bool getNextHeadword( EpwingHeadword & head );
2022-10-04 07:07:04 +00:00
bool processRef( EpwingHeadword & head );
bool readHeadword( EB_Position const & pos,
QString & headword,
bool text_only );
bool isHeadwordCorrect( QString const & headword );
void fixHeadword( QString & headword );
2014-05-20 13:59:56 +00:00
// Retrieve article from dictionary
void getArticle( QString & headword, QString & articleText,
2022-10-04 07:07:04 +00:00
int page, int offset, bool text_only, QString word=0 );
2014-05-20 13:59:56 +00:00
const char * beginDecoration( unsigned int code );
const char * endDecoration( unsigned int code );
QByteArray handleColorImage( EB_Hook_Code code,
const unsigned int * argv );
QByteArray handleMonoImage( EB_Hook_Code code,
const unsigned int * argv );
QByteArray handleWave( EB_Hook_Code code,
const unsigned int * argv );
QByteArray handleMpeg( EB_Hook_Code code,
const unsigned int * argv );
QByteArray handleNarrowFont( const unsigned int * argv,
bool text_only );
2014-05-20 13:59:56 +00:00
QByteArray handleWideFont( const unsigned int * argv,
bool text_only );
2014-05-20 13:59:56 +00:00
QByteArray handleReference( EB_Hook_Code code,
const unsigned int * argv );
bool getMatches( QString word, QVector< QString > & matches );
bool getArticlePos( QString word, QVector< int > & pages, QVector< int > & offsets );
2014-05-20 13:59:56 +00:00
};
// Pairs an EpwingBook pointer with a text-only flag.
// The struct declares no destructor, so it never releases the book itself.
struct EContainer
{
  EpwingBook * book;
  bool textOnly;

  // Book only: equivalent to passing text_only == false.
  EContainer( EpwingBook * book_ ):
    EContainer( book_, false )
  {
  }

  // Book plus an explicit text-only flag.
  EContainer( EpwingBook * book_, bool text_only ):
    book( book_ ),
    textOnly( text_only )
  {
  }
};
}
}
#endif // __EPWING_BOOK_HH_INCLUDED__