|
a/src/rcldb/termproc.h |
|
b/src/rcldb/termproc.h |
|
... |
|
... |
115 |
|
115 |
|
116 |
virtual bool takeword(const string& itrm, int pos, int bs, int be)
|
116 |
virtual bool takeword(const string& itrm, int pos, int bs, int be)
|
117 |
{
|
117 |
{
|
118 |
m_totalterms++;
|
118 |
m_totalterms++;
|
119 |
string otrm;
|
119 |
string otrm;
|
120 |
if (!unacmaybefold(itrm, otrm, "UTF-8", true)) {
|
120 |
if (!unacmaybefold(itrm, otrm, "UTF-8", UNACOP_UNACFOLD)) {
|
121 |
LOGDEB(("splitter::takeword: unac [%s] failed\n", itrm.c_str()));
|
121 |
LOGDEB(("splitter::takeword: unac [%s] failed\n", itrm.c_str()));
|
122 |
m_unacerrors++;
|
122 |
m_unacerrors++;
|
123 |
// We don't generate a fatal error because of a bad term,
|
123 |
// We don't generate a fatal error because of a bad term,
|
124 |
// but one has to put the limit somewhere
|
124 |
// but one has to put the limit somewhere
|
125 |
if (m_unacerrors > 500 &&
|
125 |
if (m_unacerrors > 500 &&
|