void MockLemmatizer::lemmatize(const QString &input, Lvk::Nlp::WordList &words) { words.clear(); m_preSanitizer->sanitize(input); QStringList tokens; tokenize(input, tokens); foreach (const QString &token, tokens) { Lvk::Nlp::Word w(token, m_postSanitizer->sanitize(token), getLemma(token)); words.append(w); }
std::string getLemma ( const std::string & form , const CMorph & morph ) { CMorphTag morphTag = morph.getField(MORPH_POSTAG); return getLemma ( form , morphTag ); }