diff options
-rw-r--r-- | i18npool/source/characterclassification/cclass_unicode_parser.cxx | 8 |
1 files changed, 6 insertions, 2 deletions
diff --git a/i18npool/source/characterclassification/cclass_unicode_parser.cxx b/i18npool/source/characterclassification/cclass_unicode_parser.cxx index 29d69521954e..d3f18e7bbe27 100644 --- a/i18npool/source/characterclassification/cclass_unicode_parser.cxx +++ b/i18npool/source/characterclassification/cclass_unicode_parser.cxx @@ -654,8 +654,12 @@ ParserFlags cclass_Unicode::getFlagsExtended(sal_uInt32 const c) case U_OTHER_PUNCTUATION: // fdo#61754 Lets see (if we not at the start) if this is midletter // punctuation and allow it in a word if it is similarly to - // U_NON_SPACING_MARK - if (bStart || U_WB_MIDLETTER != u_getIntPropertyValue(c, UCHAR_WORD_BREAK)) + // U_NON_SPACING_MARK, for example U+00B7 MIDDLE DOT. + // tdf#123575 for U+30FB KATAKANA MIDDLE DOT property is not + // U_WB_MIDLETTER but U_WB_KATAKANA instead, explicitly test that + // and U+FF65 HALFWIDTH KATAKANA MIDDLE DOT. + if (bStart || (U_WB_MIDLETTER != u_getIntPropertyValue(c, UCHAR_WORD_BREAK) + && c != 0x30FB && c != 0xFF65)) return ParserFlags::ILLEGAL; else { |