int LTP::parser(XML4NLP & xml) { if ( xml.QueryNote(NOTE_PARSER) ) return 0; int ret = postag(xml); if (0 != ret) { ERROR_LOG("in LTP::parser, failed to perform postag preprocessing"); return ret; } void * parser = _resource.GetParser(); if (parser == NULL) { ERROR_LOG("in LTP::parser, failed to init a parser"); return kParserError; } int stnsNum = xml.CountSentenceInDocument(); if (stnsNum == 0) { ERROR_LOG("in LTP::parser, number of sentences equals 0"); return kEmptyStringError; } for (int i = 0; i < stnsNum; ++i) { std::vector<std::string> vecWord; std::vector<std::string> vecPOS; std::vector<int> vecHead; std::vector<std::string> vecRel; if (xml.GetWordsFromSentence(vecWord, i) != 0) { ERROR_LOG("in LTP::parser, failed to get words from xml"); return kReadXmlError; } if (xml.GetPOSsFromSentence(vecPOS, i) != 0) { ERROR_LOG("in LTP::parser, failed to get postags from xml"); return kReadXmlError; } if (0 == vecWord.size()) { ERROR_LOG("Input sentence is empty."); return kEmptyStringError; } if (vecWord.size() > MAX_WORDS_NUM) { ERROR_LOG("Input sentence is too long."); return kSentenceTooLongError; } if (-1 == parser_parse(parser, vecWord, vecPOS, vecHead, vecRel)) { ERROR_LOG("in LTP::parser, failed to perform parse on sent. #%d", i+1); return kParserError; } if (0 != xml.SetParsesToSentence(vecHead, vecRel, i)) { ERROR_LOG("in LTP::parser, failed to write parse result to xml"); return kWriteXmlError; } } xml.SetNote(NOTE_PARSER); return 0; }
// perform ner over xml int LTP::ner(XML4NLP & xml) { if ( xml.QueryNote(NOTE_NE) ) { return 0; } // dependency int ret = postag(xml); if (0 != ret) { ERROR_LOG("in LTP::ner, failed to perform postag preprocess"); return ret; } void * ner = _resource.GetNER(); if (NULL == ner) { ERROR_LOG("in LTP::ner, failed to init a ner."); return kNERError; } int stnsNum = xml.CountSentenceInDocument(); if (stnsNum == 0) { ERROR_LOG("in LTP::ner, number of sentence equals 0"); return kEmptyStringError; } for (int i = 0; i < stnsNum; ++ i) { vector<string> vecWord; vector<string> vecPOS; vector<string> vecNETag; if (xml.GetWordsFromSentence(vecWord, i) != 0) { ERROR_LOG("in LTP::ner, failed to get words from xml"); return kReadXmlError; } if (xml.GetPOSsFromSentence(vecPOS, i) != 0) { ERROR_LOG("in LTP::ner, failed to get postags from xml"); return kNERError; } if (0 == vecWord.size()) { ERROR_LOG("Input sentence is empty."); return kEmptyStringError; } if (vecWord.size() > MAX_WORDS_NUM) { ERROR_LOG("Input sentence is too long."); return kSentenceTooLongError; } if (0 == ner_recognize(ner, vecWord, vecPOS, vecNETag)) { ERROR_LOG("in LTP::ner, failed to perform ner on sent. #%d", i+1); return kNERError; } xml.SetNEsToSentence(vecNETag, i); } xml.SetNote(NOTE_NE); return 0; }