Test for empty term before dereferencing utf-8 iterator

This commit is contained in:
Jean-Francois Dockes 2015-09-01 14:45:41 +02:00
parent 468c9fe575
commit cdcbb01eab

View file

@@ -97,6 +97,8 @@ bool createExpansionDbs(Xapian::WritableDatabase& wdb,
// Detect and skip CJK terms. // Detect and skip CJK terms.
Utf8Iter utfit(*it); Utf8Iter utfit(*it);
if (utfit.eof()) // Empty term?? Seems to happen.
continue;
if (TextSplit::isCJK(*utfit)) { if (TextSplit::isCJK(*utfit)) {
// LOGDEB(("stemskipped: Skipping CJK\n")); // LOGDEB(("stemskipped: Skipping CJK\n"));
continue; continue;