TextSplit: character lost at Korean->ASCII transition
This commit is contained in:
parent
ec7379f837
commit
eb53b598d6
@ -680,8 +680,8 @@ bool TextSplit::text_to_words(const string &in)
|
|||||||
// nothing right after a CJK section). Because
|
// nothing right after a CJK section). Because
|
||||||
// katakana-western transitions sometimes have no whitespace
|
// katakana-western transitions sometimes have no whitespace
|
||||||
// (and maybe hangul too, but probably not).
|
// (and maybe hangul too, but probably not).
|
||||||
if (prev_csc != CSC_CJK && csc != prev_csc &&
|
if (prev_csc != CSC_CJK && prev_csc != CSC_HANGUL &&
|
||||||
(m_wordLen || m_span.length())) {
|
csc != prev_csc && (m_wordLen || m_span.length())) {
|
||||||
LOGDEB2("csc " << valToString(csc_names, csc) << " prev_csc " <<
|
LOGDEB2("csc " << valToString(csc_names, csc) << " prev_csc " <<
|
||||||
valToString(csc_names, prev_csc) << " wl " <<
|
valToString(csc_names, prev_csc) << " wl " <<
|
||||||
m_wordLen << " spl " << m_span.length() << endl);
|
m_wordLen << " spl " << m_span.length() << endl);
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user