fix: epwing dictionary headword correction

For example, the headword "1gulp n. →" is now corrected to " gulp n ".
This commit is contained in:
Xiao YiFang 2022-10-05 20:00:23 +08:00
parent 32689d71ad
commit 53c1db8eaf
2 changed files with 5 additions and 2 deletions

View file

@ -1032,6 +1032,9 @@ void EpwingBook::fixHeadword( QString & headword )
headword.remove( QChar( 0x30FB ) ); // Used in Japan transcription headword.remove( QChar( 0x30FB ) ); // Used in Japan transcription
//replace any unicode Number ,Symbol ,Punctuation ,Mark character to whitespace
headword.replace( QRegularExpression( "[\\p{N}\\p{S}\\p{P}\\p{M}]" ), " " );
//if( isHeadwordCorrect( headword) ) //if( isHeadwordCorrect( headword) )
// return; // return;
@ -1046,7 +1049,7 @@ void EpwingBook::fixHeadword( QString & headword )
//} //}
gd::wstring folded = Folding::applyPunctOnly( gd::toWString( fixed ) ); gd::wstring folded = Folding::applyPunctOnly( gd::toWString( fixed ) );
fixed = gd::toQString( folded ); //fixed = gd::toQString( folded );
//if( isHeadwordCorrect( fixed ) ) //if( isHeadwordCorrect( fixed ) )
//{ //{

View file

@ -596,7 +596,7 @@ bool isPunct( wchar ch )
case 0xFF64: // HALFWIDTH IDEOGRAPHIC COMMA case 0xFF64: // HALFWIDTH IDEOGRAPHIC COMMA
return true; return true;
default: default:
return QChar::isPunct(ch)||QChar::isSymbol(ch); return false;
} }
} }