/**
 * Runs a Japanese sentence through a tokenizer created by {@code GosenTokenizerFactory}
 * and then through a filter created by {@code GosenPartOfSpeechStopFilterFactory} whose
 * stop-tag resource lists the single tag {@code 動詞-自立}.
 *
 * <p>The expected token list is the input sentence minus {@code 超える}; presumably that
 * is the token carrying the listed part-of-speech tag (depends on the dictionary; not
 * visible from this test alone).
 *
 * @throws IOException declared because the factory {@code inform} calls and the token
 *         stream helpers used here may throw it
 */
@Test
public void testBasics() throws IOException {
  // Contents served for the "tags" resource: one comment line and one stop tag.
  String tags =
      "# verb-main:\n" +
      "動詞-自立\n";

  // Plain mutable map instead of double-brace initialization: avoids creating an
  // anonymous HashMap subclass that captures the enclosing test instance.
  Map<String,String> tokenizerArgs = new HashMap<String,String>();
  tokenizerArgs.put("dictionaryDir", SenTestUtil.IPADIC_DIR);
  GosenTokenizerFactory tokenizerFactory = new GosenTokenizerFactory(tokenizerArgs);
  tokenizerFactory.inform(new StringMockResourceLoader(""));
  Tokenizer tokenizer = tokenizerFactory.create();
  tokenizer.setReader(new StringReader("私は制限スピードを超える。"));

  Map<String,String> args = new HashMap<String,String>();
  args.put("luceneMatchVersion", Version.LATEST.toString());
  args.put("tags", "stoptags.txt");
  GosenPartOfSpeechStopFilterFactory factory = new GosenPartOfSpeechStopFilterFactory(args);
  // The mock loader hands back the tag list defined above as the resource content.
  factory.inform(new StringMockResourceLoader(tags));
  TokenStream ts = factory.create(tokenizer);

  assertTokenStreamContents(ts,
      new String[] { "私", "は", "制限", "スピード", "を", "。" }
  );
}