Skip to content

Commit

Permalink
fix: cjk expand character can not be searched (#2016)
Browse files Browse the repository at this point in the history
* fix: cjk expand character can not be searched

* Update src/common/folding.cc

* Update src/common/globalregex.hh
  • Loading branch information
xiaoyifang authored Dec 12, 2024
1 parent a45a309 commit a533777
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 5 deletions.
5 changes: 2 additions & 3 deletions src/common/folding.cc
Original file line number Diff line number Diff line change
Expand Up @@ -22,8 +22,8 @@ std::u32string apply( std::u32string const & in, bool preserveWildcards )
{
// remove diacritics (via normalization), white space, and punctuation
auto temp = QString::fromStdU32String( in )
.normalized( QString::NormalizationForm_KD )
.remove( RX::markSpace )
.normalized( QString::NormalizationForm_KD )
.removeIf( [ preserveWildcards ]( const QChar & ch ) -> bool {
return ch.isPunct()
&& !( preserveWildcards && ( ch == '\\' || ch == '?' || ch == '*' || ch == '[' || ch == ']' ) );
Expand Down Expand Up @@ -155,8 +155,7 @@ std::u32string applyWhitespaceAndPunctOnly( std::u32string const & in )

// Reports whether the code point `ch` is treated as whitespace.
//
// NOTE(review): this listing is a diff view with the +/- markers stripped, so two
// return statements appear in the body; as literally written, only the first one is
// reachable. Going by the change summary for this file (2 additions & 3 deletions),
// the "invisible character" comment and the `|| !QChar::isPrint( ch )` return look
// like the removed lines and the plain `QChar::isSpace( ch )` return the added one --
// confirm against the repository before relying on either behavior.
bool isWhitespace( char32_t ch )
{
// Older rule: non-printable (invisible) characters also count as whitespace.
return QChar::isSpace( ch ) || !QChar::isPrint( ch );
return QChar::isSpace( ch );
}

bool isWhitespaceOrPunct( char32_t ch )
Expand Down
4 changes: 2 additions & 2 deletions src/common/globalregex.hh
Original file line number Diff line number Diff line change
Expand Up @@ -71,8 +71,8 @@ const static QRegularExpression accentMark( R"(\p{M})", QRegularExpression::UseU
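// Matches Unicode marks (\p{M}), separators/spaces (\p{Z}), invisible "other"
// characters such as control and format codes (\p{C}), and punctuation (\p{P}).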
const static QRegularExpression markPuncSpace( R"([\p{M}\p{Z}\p{C}\p{P}])",
QRegularExpression::UseUnicodePropertiesOption );
// Matches Unicode marks (\p{M}), separators/spaces (\p{Z}), and invisible "other" characters (\p{C}).
const static QRegularExpression markSpace( R"([\p{M}\p{Z}\p{C}])", QRegularExpression::UseUnicodePropertiesOption );
// Matches Unicode marks (\p{M}) and separators/spaces (\p{Z}) only.
const static QRegularExpression markSpace( R"([\p{M}\p{Z}])", QRegularExpression::UseUnicodePropertiesOption );

const static QRegularExpression whiteSpace( "\\s+" );

Expand Down

0 comments on commit a533777

Please sign in to comment.