/**
 * Lemmatizes a sequence of tokens by delegating each token, together with the tag at the
 * same index, to the single-token {@code lemmatize(String, String)} overload.
 *
 * @param tokens the tokens to lemmatize
 * @param postags the tags, paired with {@code tokens} by position
 * @return a new array holding one result per token, in token order
 * @throws ArrayIndexOutOfBoundsException if {@code postags} is shorter than {@code tokens}
 */
public String[] lemmatize(final String[] tokens, final String[] postags) {
  final String[] result = new String[tokens.length];
  for (int idx = 0; idx < result.length; idx++) {
    result[idx] = this.lemmatize(tokens[idx], postags[idx]);
  }
  return result;
}
@Test public void testForNullPointerException() { List<String> sentence = Arrays.asList("The","dogs","were","running","and","barking", "down","the","street"); List<String> sentencePOS = Arrays.asList("DT","NNS","VBD","VBG","CC","VBG","RP","DT","NN"); List<List<String>> expectedLemmas = new ArrayList<>(); expectedLemmas.add(Arrays.asList("the")); expectedLemmas.add(Arrays.asList("dog")); expectedLemmas.add(Arrays.asList("is")); expectedLemmas.add(Arrays.asList("run,run")); expectedLemmas.add(Arrays.asList("and")); expectedLemmas.add(Arrays.asList("bark,bark")); expectedLemmas.add(Arrays.asList("down")); expectedLemmas.add(Arrays.asList("the")); expectedLemmas.add(Arrays.asList("street")); List<List<String>> actualLemmas = dictionaryLemmatizer.lemmatize(sentence, sentencePOS); for (int i = 0; i < sentence.size(); i++) { // don't compare cases where the word is not in the dictionary... if (!actualLemmas.get(0).get(0).equals("O")) Assert.assertEquals(expectedLemmas.get(i), actualLemmas.get(i)); } }
@Test public void testForNullPointerException() { String[] sentence = new String[]{"The","dogs","were","running","and","barking","down","the","street"}; String[] sentencePOS = new String[]{"DT","NNS","VBD","VBG","CC","VBG","RP","DT","NN"}; String[] expectedLemma = new String[]{"the","dog","is","run","and","bark","down","the","street"}; String[] actualLemma = dictionaryLemmatizer.lemmatize(sentence, sentencePOS); for (int i = 0;i < sentence.length;i++) { // don't compare cases where the word is not in the dictionary... if (!actualLemma[i].equals("O")) Assert.assertEquals(expectedLemma[i], actualLemma[i]); } }
/**
 * Produces one lemmatization result per input token.
 *
 * Each token is handed to the single-token {@code lemmatize(String, String)} overload along
 * with the tag found at the same position in {@code postags}.
 *
 * @param tokens the tokens to lemmatize
 * @param postags the tags, matched to {@code tokens} by index
 * @return the results as an array, in the same order as {@code tokens}
 * @throws ArrayIndexOutOfBoundsException if {@code postags} has fewer entries than {@code tokens}
 */
public String[] lemmatize(final String[] tokens, final String[] postags) {
  final List<String> collected = new ArrayList<>(tokens.length);
  int tagIndex = 0;
  for (final String token : tokens) {
    collected.add(this.lemmatize(token, postags[tagIndex]));
    tagIndex++;
  }
  return collected.toArray(new String[0]);
}
/**
 * Applies the single-token {@code lemmatize(String, String)} overload across a whole token
 * sequence, pairing every token with the tag at the same index.
 *
 * @param tokens the tokens to lemmatize
 * @param postags the tags, aligned with {@code tokens} by position
 * @return a freshly allocated array with one entry per token, in input order
 * @throws ArrayIndexOutOfBoundsException if {@code postags} is shorter than {@code tokens}
 */
public String[] lemmatize(final String[] tokens, final String[] postags) {
  final int count = tokens.length;
  final String[] output = new String[count];
  int position = 0;
  while (position < count) {
    output[position] = this.lemmatize(tokens[position], postags[position]);
    position++;
  }
  return output;
}