5 #include <Poco/UTF8String.h>
29 for ( _it=_mapStemmer.begin(); _it!=_mapStemmer.end(); ++_it )
36 std::map<WORD_CONTENT_OFFSET, SSTRING>::const_iterator it;
37 std::string stemmerString;
39 sb_stemmer* stemmer = NULL;
43 stemmer = getStemmer( iso639_1 );
46 stemmerString = Poco::UTF8::toLower(it->second);
56 std::cout << std::endl <<
"SnowballPlugin normalize" << std::endl << std::endl;
60 std::map<WORD_CONTENT_OFFSET, WORD_LENGTH>::const_iterator it1;
61 std::cout <<
"token \t norm" << std::endl;
62 std::cout <<
"----- \t ----" << std::endl;
65 std::cout << lCData.
_mapTokens[it1->first] <<
'\t'
68 std::cout <<
"Tokens count " << lCData.
_mapOffsets.size() << std::endl << std::endl;
73 sb_stemmer* SnowballPlugin::getStemmer(
const SSTRING& iso639_1 )
75 _it=_mapStemmer.find( iso639_1 );
76 if ( _it==_mapStemmer.end() )
79 _mapStemmer[ iso639_1 ] = _stemmer;
83 _stemmer = _it->second;