mirror of
https://github.com/xiaoyifang/goldendict-ng.git
synced 2024-11-23 20:14:05 +00:00
6a34804df2
opt: add xapian fullindex support
373 lines
6.8 KiB
C++
373 lines
6.8 KiB
C++
/* This file is (c) 2008-2012 Konstantin Isakov <ikm@goldendict.org>
|
|
* Part of GoldenDict. Licensed under GPLv3 or later, see the LICENSE file */
|
|
|
|
#include "file.hh"
|
|
|
|
#include <cstring>
|
|
#include <cerrno>
|
|
#include <string>
|
|
|
|
#include <sys/types.h>
|
|
#include <sys/stat.h>
|
|
#ifndef _MSC_VER
|
|
#include <unistd.h>
|
|
#endif
|
|
|
|
#ifdef __WIN32
|
|
#include <windows.h>
|
|
#endif
|
|
|
|
#include "ufile.hh"
|
|
#include "fsencoding.hh"
|
|
#include "zipfile.hh"
|
|
|
|
namespace File {
|
|
|
|
enum
|
|
{
|
|
// We employ a writing buffer to considerably speed up file operations when
|
|
// they consists of many small writes. The default size for the buffer is 64k
|
|
WriteBufferSize = 65536
|
|
};
|
|
|
|
bool tryPossibleName( std::string const & name, std::string & copyTo )
|
|
{
|
|
if ( File::exists( name ) )
|
|
{
|
|
copyTo = name;
|
|
return true;
|
|
}
|
|
else
|
|
return false;
|
|
}
|
|
|
|
bool tryPossibleZipName( std::string const & name, std::string & copyTo )
|
|
{
|
|
if ( ZipFile::SplitZipFile( FsEncoding::decode( name.c_str() ) ).exists() )
|
|
{
|
|
copyTo = name;
|
|
return true;
|
|
}
|
|
else
|
|
return false;
|
|
}
|
|
|
|
void loadFromFile( std::string const & n, std::vector< char > & data )
|
|
{
|
|
File::Class f( n, "rb" );
|
|
|
|
f.seekEnd();
|
|
|
|
data.resize( f.tell() );
|
|
|
|
f.rewind();
|
|
|
|
f.read( &data.front(), data.size() );
|
|
}
|
|
|
|
bool exists( char const * filename ) noexcept
|
|
{
|
|
#ifdef __WIN32
|
|
#if defined(__WIN64) || defined(_MSC_VER)
|
|
struct _stat64 buf;
|
|
#else
|
|
struct _stat buf;
|
|
#endif
|
|
wchar_t wname[16384];
|
|
MultiByteToWideChar( CP_UTF8, 0, filename, -1, wname, 16384 );
|
|
#if defined(__WIN64) || defined(_MSC_VER)
|
|
return _wstat64( wname, &buf ) == 0;
|
|
#else
|
|
return _wstat( wname, &buf ) == 0;
|
|
#endif
|
|
#else
|
|
struct stat buf;
|
|
|
|
// EOVERFLOW rationale: if the file is too large, it still does exist
|
|
return stat( filename, &buf ) == 0 || errno == EOVERFLOW;
|
|
#endif
|
|
}
|
|
|
|
void Class::open( char const * filename, char const * mode )
|
|
{
|
|
QFile::OpenMode openMode = QIODevice::Text;
|
|
const char * pch = mode;
|
|
while( *pch )
|
|
{
|
|
switch( *pch )
|
|
{
|
|
case 'r': openMode |= QIODevice::ReadOnly;
|
|
break;
|
|
case 'w': openMode |= QIODevice::WriteOnly;
|
|
break;
|
|
case '+': openMode &= ~( QIODevice::ReadOnly | QIODevice::WriteOnly );
|
|
openMode |= QIODevice::ReadWrite;
|
|
break;
|
|
case 'a': openMode |= QIODevice::Append;
|
|
break;
|
|
case 'b': openMode &= ~QIODevice::Text;
|
|
break;
|
|
default: break;
|
|
}
|
|
++pch;
|
|
}
|
|
|
|
f.setFileName( FsEncoding::decode( filename ) );
|
|
|
|
//maybe directory, the xapian use directory to store the index.
|
|
if ( !f.open( openMode ) )
|
|
throw exCantOpen( std::string( filename ) + ": " + f.errorString().toUtf8().data() );
|
|
}
|
|
|
|
Class::Class( char const * filename, char const * mode ) :
|
|
writeBuffer( 0 )
|
|
{
|
|
open( filename, mode );
|
|
}
|
|
|
|
Class::Class( std::string const & filename, char const * mode )
|
|
: writeBuffer( 0 )
|
|
{
|
|
open( filename.c_str(), mode );
|
|
}
|
|
|
|
void Class::read( void * buf, qint64 size )
|
|
{
|
|
if ( !size )
|
|
return;
|
|
|
|
if ( writeBuffer )
|
|
flushWriteBuffer();
|
|
|
|
qint64 result = f.read( reinterpret_cast<char *>( buf ), size );
|
|
|
|
if ( result != size )
|
|
throw exReadError();
|
|
}
|
|
|
|
size_t Class::readRecords( void * buf, qint64 size, size_t count )
|
|
{
|
|
if ( writeBuffer )
|
|
flushWriteBuffer();
|
|
|
|
qint64 result = f.read( reinterpret_cast<char *>( buf ), size * count );
|
|
return result < 0 ? result : result / size;
|
|
}
|
|
|
|
void Class::write( void const * buf, qint64 size )
|
|
{
|
|
if ( !size )
|
|
return;
|
|
|
|
if ( size >= WriteBufferSize )
|
|
{
|
|
// If the write is large, there's not much point in buffering
|
|
flushWriteBuffer();
|
|
|
|
qint64 result = f.write( reinterpret_cast<char const *>( buf ), size );
|
|
|
|
if ( result != size )
|
|
throw exWriteError();
|
|
|
|
return;
|
|
}
|
|
|
|
if ( !writeBuffer )
|
|
{
|
|
// Allocate the writing buffer since we don't have any yet
|
|
writeBuffer = new char[ WriteBufferSize ];
|
|
if( !writeBuffer )
|
|
throw exAllocation();
|
|
writeBufferLeft = WriteBufferSize;
|
|
}
|
|
|
|
size_t toAdd = size < writeBufferLeft ? size : writeBufferLeft;
|
|
|
|
memcpy( writeBuffer + ( WriteBufferSize - writeBufferLeft ),
|
|
buf, toAdd );
|
|
|
|
size -= toAdd;
|
|
writeBufferLeft -= toAdd;
|
|
|
|
if ( !writeBufferLeft ) // Out of buffer? Flush it.
|
|
{
|
|
flushWriteBuffer();
|
|
|
|
if ( size ) // Something's still left? Add to buffer.
|
|
{
|
|
memcpy( writeBuffer, (char const *)buf + toAdd, size );
|
|
writeBufferLeft -= size;
|
|
}
|
|
}
|
|
}
|
|
|
|
size_t Class::writeRecords( void const * buf, qint64 size, size_t count )
|
|
|
|
{
|
|
flushWriteBuffer();
|
|
|
|
qint64 result = f.write( reinterpret_cast<const char *>( buf ), size * count );
|
|
return result < 0 ? result : result / size;
|
|
}
|
|
|
|
char * Class::gets( char * s, int size, bool stripNl )
|
|
|
|
{
|
|
if ( writeBuffer )
|
|
flushWriteBuffer();
|
|
|
|
qint64 len = f.readLine( s, size );
|
|
char * result = len > 0 ? s : NULL;
|
|
|
|
if ( result && stripNl )
|
|
{
|
|
|
|
char * last = result + len;
|
|
|
|
while( len-- )
|
|
{
|
|
--last;
|
|
|
|
if ( *last == '\n' || *last == '\r' )
|
|
*last = 0;
|
|
else
|
|
break;
|
|
}
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
std::string Class::gets( bool stripNl )
|
|
{
|
|
char buf[ 1024 ];
|
|
|
|
if ( !gets( buf, sizeof( buf ), stripNl ) )
|
|
throw exReadError();
|
|
|
|
return std::string( buf );
|
|
}
|
|
|
|
void Class::seek( qint64 offset )
|
|
{
|
|
if ( writeBuffer )
|
|
flushWriteBuffer();
|
|
|
|
if ( !f.seek( offset ) )
|
|
throw exSeekError();
|
|
}
|
|
|
|
uchar * Class::map( qint64 offset, qint64 size )
|
|
{
|
|
if( writeBuffer )
|
|
flushWriteBuffer();
|
|
|
|
return f.map( offset, size );
|
|
}
|
|
|
|
bool Class::unmap( uchar * address )
|
|
{
|
|
return f.unmap( address );
|
|
}
|
|
|
|
|
|
void Class::seekCur( qint64 offset )
|
|
{
|
|
if ( writeBuffer )
|
|
flushWriteBuffer();
|
|
|
|
if( !f.seek( f.pos() + offset ) )
|
|
throw exSeekError();
|
|
}
|
|
|
|
void Class::seekEnd( qint64 offset )
|
|
{
|
|
if ( writeBuffer )
|
|
flushWriteBuffer();
|
|
|
|
if( !f.seek( f.size() + offset ) )
|
|
throw exSeekError();
|
|
}
|
|
|
|
void Class::rewind()
|
|
{
|
|
seek( 0 );
|
|
}
|
|
|
|
qint64 Class::tell()
|
|
{
|
|
qint64 result = f.pos();
|
|
|
|
if ( result == -1 )
|
|
throw exSeekError();
|
|
|
|
if ( writeBuffer )
|
|
result += ( WriteBufferSize - writeBufferLeft );
|
|
|
|
return result;
|
|
}
|
|
|
|
bool Class::eof()
|
|
{
|
|
if ( writeBuffer )
|
|
flushWriteBuffer();
|
|
|
|
return f.atEnd();
|
|
}
|
|
|
|
QFile & Class::file()
|
|
{
|
|
flushWriteBuffer();
|
|
|
|
return f;
|
|
}
|
|
|
|
void Class::close()
|
|
{
|
|
releaseWriteBuffer();
|
|
f.close();
|
|
}
|
|
|
|
Class::~Class() noexcept
|
|
{
|
|
if ( f.isOpen() )
|
|
{
|
|
try
|
|
{
|
|
releaseWriteBuffer();
|
|
}
|
|
catch( exWriteError & )
|
|
{
|
|
}
|
|
f.close();
|
|
}
|
|
}
|
|
|
|
void Class::flushWriteBuffer()
|
|
{
|
|
if ( writeBuffer && writeBufferLeft != WriteBufferSize )
|
|
{
|
|
qint64 result = f.write( writeBuffer, WriteBufferSize - writeBufferLeft );
|
|
|
|
if ( result != WriteBufferSize - writeBufferLeft )
|
|
throw exWriteError();
|
|
|
|
writeBufferLeft = WriteBufferSize;
|
|
}
|
|
}
|
|
|
|
void Class::releaseWriteBuffer()
|
|
{
|
|
flushWriteBuffer();
|
|
|
|
if ( writeBuffer )
|
|
{
|
|
delete [] writeBuffer;
|
|
|
|
writeBuffer = 0;
|
|
}
|
|
}
|
|
|
|
|
|
}
|