View tokenView = head.getTextAnnotation().getView(ViewNames.TOKENS); int leftIdx = head.getStartSpan() - 1; while (leftIdx >= tokenView.getStartSpan()){ Constituent cur = tokenView.getConstituentsCoveringToken(leftIdx).get(0); addExtentAttributes(cur, gazetteers, brownClusters, wordnet); if (leftIdx < tokenView.getStartSpan()){ leftIdx = tokenView.getStartSpan();
View tokenView = head.getTextAnnotation().getView(ViewNames.TOKENS); int leftIdx = head.getStartSpan() - 1; while (leftIdx >= tokenView.getStartSpan()){ Constituent cur = tokenView.getConstituentsCoveringToken(leftIdx).get(0); addExtentAttributes(cur, gazetteers, brownClusters, wordnet); if (leftIdx < tokenView.getStartSpan()){ leftIdx = tokenView.getStartSpan();
View tokenView = head.getTextAnnotation().getView(ViewNames.TOKENS); int leftIdx = head.getStartSpan() - 1; while (leftIdx >= tokenView.getStartSpan()){ Constituent cur = tokenView.getConstituentsCoveringToken(leftIdx).get(0); addExtentAttributes(cur, gazetteers, brownClusters, wordnet); if (leftIdx < tokenView.getStartSpan()){ leftIdx = tokenView.getStartSpan();
View bioView = new SpanLabelView("BIO", BIOReader.class.getCanonicalName(), ta, 1.0f); View tokenView = ta.getView(ViewNames.TOKENS); for (int i = tokenView.getStartSpan(); i < tokenView.getEndSpan(); i++){ Constituent currentToken = tokenView.getConstituentsCoveringToken(i).get(0).cloneForNewView("BIO"); currentToken.addAttribute("GAZ", gazetteers.annotateConstituent(currentToken, false)); String preBIOLevel1 = ""; String preBIOLevel2 = ""; for (int i = bioView.getStartSpan(); i < bioView.getEndSpan(); i++){ Constituent currentBIO = bioView.getConstituentsCoveringToken(i).get(0); currentBIO.addAttribute("preBIOLevel1", preBIOLevel1);
View bioView = new SpanLabelView("BIO", BIOReader.class.getCanonicalName(), ta, 1.0f); View tokenView = ta.getView(ViewNames.TOKENS); for (int i = tokenView.getStartSpan(); i < tokenView.getEndSpan(); i++){ Constituent currentToken = tokenView.getConstituentsCoveringToken(i).get(0).cloneForNewView("BIO"); currentToken.addAttribute("GAZ", gazetteers.annotateConstituent(currentToken, false)); String preBIOLevel1 = ""; String preBIOLevel2 = ""; for (int i = bioView.getStartSpan(); i < bioView.getEndSpan(); i++){ Constituent currentBIO = bioView.getConstituentsCoveringToken(i).get(0); currentBIO.addAttribute("preBIOLevel1", preBIOLevel1);
View bioView = new SpanLabelView("BIO", BIOReader.class.getCanonicalName(), ta, 1.0f); View tokenView = ta.getView(ViewNames.TOKENS); for (int i = tokenView.getStartSpan(); i < tokenView.getEndSpan(); i++){ Constituent currentToken = tokenView.getConstituentsCoveringToken(i).get(0).cloneForNewView("BIO"); currentToken.addAttribute("GAZ", gazetteers.annotateConstituent(currentToken, false)); String preBIOLevel1 = ""; String preBIOLevel2 = ""; for (int i = bioView.getStartSpan(); i < bioView.getEndSpan(); i++){ Constituent currentBIO = bioView.getConstituentsCoveringToken(i).get(0); currentBIO.addAttribute("preBIOLevel1", preBIOLevel1);
/**
 * Populates feature attributes on {@code extent} in place.
 *
 * <p>Attributes written:
 * <ul>
 *   <li>{@code GAZ} - result of {@code annotateConstituent(extent, false)} on the gazetteers;</li>
 *   <li>{@code BC} - {@code brownClusters.getPrefixesCombined} of the extent's own string;</li>
 *   <li>{@code BCm1} - the same lookup for the token at {@code extent.getStartSpan() - 1},
 *       or {@code ","} when that index lies before the start of the TOKENS view;</li>
 *   <li>{@code BCp1} - the same lookup for the token at {@code extent.getStartSpan() + 1},
 *       or {@code ","} when that index lies at or past the end of the TOKENS view;</li>
 *   <li>{@code WORDNETTAG} / {@code WORDNETHYM} - values from
 *       {@code BIOFeatureExtractor.getWordNetTags} / {@code getWordNetHyms}.</li>
 * </ul>
 *
 * <p>NOTE(review): the "next token" index is computed from the extent's start span, so for an
 * extent longer than one token it points inside the extent. The visible callers pass single
 * tokens; confirm before using this with multi-token constituents.
 *
 * @param extent        constituent to annotate; its text annotation must contain a TOKENS view
 * @param gazetteers    gazetteer resource; it is cast to {@code FlatGazetteers} unconditionally
 * @param brownClusters source of the {@code BC}, {@code BCm1} and {@code BCp1} values
 * @param wordnet       WordNet handle forwarded to {@code BIOFeatureExtractor}
 * @throws ClassCastException if {@code gazetteers} is not a {@code FlatGazetteers}
 */
public static void addExtentAttributes(Constituent extent, Gazetteers gazetteers, BrownClusters brownClusters, WordNetManager wordnet) {
    View tokenView = extent.getTextAnnotation().getView(ViewNames.TOKENS);
    int start = extent.getStartSpan();

    extent.addAttribute("GAZ", ((FlatGazetteers) gazetteers).annotateConstituent(extent, false));
    extent.addAttribute("BC", brownClusters.getPrefixesCombined(extent.toString()));

    // A previous token exists whenever its index is not before the first token of the view.
    // (The former strict '>' wrongly skipped the case where the previous token is the first one.)
    if (start - 1 >= tokenView.getStartSpan()) {
        String previousToken = tokenView.getConstituentsCoveringToken(start - 1).get(0).toString();
        extent.addAttribute("BCm1", brownClusters.getPrefixesCombined(previousToken));
    } else {
        extent.addAttribute("BCm1", ",");
    }

    if (start + 1 < tokenView.getEndSpan()) {
        String nextToken = tokenView.getConstituentsCoveringToken(start + 1).get(0).toString();
        extent.addAttribute("BCp1", brownClusters.getPrefixesCombined(nextToken));
    } else {
        // Placeholder belongs to BCp1; writing it to BCm1 here would clobber the
        // previous-token feature and leave BCp1 unset.
        extent.addAttribute("BCp1", ",");
    }

    extent.addAttribute("WORDNETTAG", BIOFeatureExtractor.getWordNetTags(wordnet, extent));
    extent.addAttribute("WORDNETHYM", BIOFeatureExtractor.getWordNetHyms(wordnet, extent));
}
/**
 * Populates feature attributes on {@code extent} in place.
 *
 * <p>Attributes written:
 * <ul>
 *   <li>{@code GAZ} - result of {@code annotateConstituent(extent, false)} on the gazetteers;</li>
 *   <li>{@code BC} - {@code brownClusters.getPrefixesCombined} of the extent's own string;</li>
 *   <li>{@code BCm1} - the same lookup for the token at {@code extent.getStartSpan() - 1},
 *       or {@code ","} when that index lies before the start of the TOKENS view;</li>
 *   <li>{@code BCp1} - the same lookup for the token at {@code extent.getStartSpan() + 1},
 *       or {@code ","} when that index lies at or past the end of the TOKENS view;</li>
 *   <li>{@code WORDNETTAG} / {@code WORDNETHYM} - values from
 *       {@code BIOFeatureExtractor.getWordNetTags} / {@code getWordNetHyms}.</li>
 * </ul>
 *
 * <p>NOTE(review): the "next token" index is computed from the extent's start span, so for an
 * extent longer than one token it points inside the extent. The visible callers pass single
 * tokens; confirm before using this with multi-token constituents.
 *
 * @param extent        constituent to annotate; its text annotation must contain a TOKENS view
 * @param gazetteers    gazetteer resource; it is cast to {@code FlatGazetteers} unconditionally
 * @param brownClusters source of the {@code BC}, {@code BCm1} and {@code BCp1} values
 * @param wordnet       WordNet handle forwarded to {@code BIOFeatureExtractor}
 * @throws ClassCastException if {@code gazetteers} is not a {@code FlatGazetteers}
 */
public static void addExtentAttributes(Constituent extent, Gazetteers gazetteers, BrownClusters brownClusters, WordNetManager wordnet) {
    View tokenView = extent.getTextAnnotation().getView(ViewNames.TOKENS);
    int start = extent.getStartSpan();

    extent.addAttribute("GAZ", ((FlatGazetteers) gazetteers).annotateConstituent(extent, false));
    extent.addAttribute("BC", brownClusters.getPrefixesCombined(extent.toString()));

    // A previous token exists whenever its index is not before the first token of the view.
    // (The former strict '>' wrongly skipped the case where the previous token is the first one.)
    if (start - 1 >= tokenView.getStartSpan()) {
        String previousToken = tokenView.getConstituentsCoveringToken(start - 1).get(0).toString();
        extent.addAttribute("BCm1", brownClusters.getPrefixesCombined(previousToken));
    } else {
        extent.addAttribute("BCm1", ",");
    }

    if (start + 1 < tokenView.getEndSpan()) {
        String nextToken = tokenView.getConstituentsCoveringToken(start + 1).get(0).toString();
        extent.addAttribute("BCp1", brownClusters.getPrefixesCombined(nextToken));
    } else {
        // Placeholder belongs to BCp1; writing it to BCm1 here would clobber the
        // previous-token feature and leave BCp1 unset.
        extent.addAttribute("BCp1", ",");
    }

    extent.addAttribute("WORDNETTAG", BIOFeatureExtractor.getWordNetTags(wordnet, extent));
    extent.addAttribute("WORDNETHYM", BIOFeatureExtractor.getWordNetHyms(wordnet, extent));
}
/**
 * Populates feature attributes on {@code extent} in place.
 *
 * <p>Attributes written:
 * <ul>
 *   <li>{@code GAZ} - result of {@code annotateConstituent(extent, false)} on the gazetteers;</li>
 *   <li>{@code BC} - {@code brownClusters.getPrefixesCombined} of the extent's own string;</li>
 *   <li>{@code BCm1} - the same lookup for the token at {@code extent.getStartSpan() - 1},
 *       or {@code ","} when that index lies before the start of the TOKENS view;</li>
 *   <li>{@code BCp1} - the same lookup for the token at {@code extent.getStartSpan() + 1},
 *       or {@code ","} when that index lies at or past the end of the TOKENS view;</li>
 *   <li>{@code WORDNETTAG} / {@code WORDNETHYM} - values from
 *       {@code BIOFeatureExtractor.getWordNetTags} / {@code getWordNetHyms}.</li>
 * </ul>
 *
 * <p>NOTE(review): the "next token" index is computed from the extent's start span, so for an
 * extent longer than one token it points inside the extent. The visible callers pass single
 * tokens; confirm before using this with multi-token constituents.
 *
 * @param extent        constituent to annotate; its text annotation must contain a TOKENS view
 * @param gazetteers    gazetteer resource; it is cast to {@code FlatGazetteers} unconditionally
 * @param brownClusters source of the {@code BC}, {@code BCm1} and {@code BCp1} values
 * @param wordnet       WordNet handle forwarded to {@code BIOFeatureExtractor}
 * @throws ClassCastException if {@code gazetteers} is not a {@code FlatGazetteers}
 */
public static void addExtentAttributes(Constituent extent, Gazetteers gazetteers, BrownClusters brownClusters, WordNetManager wordnet) {
    View tokenView = extent.getTextAnnotation().getView(ViewNames.TOKENS);
    int start = extent.getStartSpan();

    extent.addAttribute("GAZ", ((FlatGazetteers) gazetteers).annotateConstituent(extent, false));
    extent.addAttribute("BC", brownClusters.getPrefixesCombined(extent.toString()));

    // A previous token exists whenever its index is not before the first token of the view.
    // (The former strict '>' wrongly skipped the case where the previous token is the first one.)
    if (start - 1 >= tokenView.getStartSpan()) {
        String previousToken = tokenView.getConstituentsCoveringToken(start - 1).get(0).toString();
        extent.addAttribute("BCm1", brownClusters.getPrefixesCombined(previousToken));
    } else {
        extent.addAttribute("BCm1", ",");
    }

    if (start + 1 < tokenView.getEndSpan()) {
        String nextToken = tokenView.getConstituentsCoveringToken(start + 1).get(0).toString();
        extent.addAttribute("BCp1", brownClusters.getPrefixesCombined(nextToken));
    } else {
        // Placeholder belongs to BCp1; writing it to BCm1 here would clobber the
        // previous-token feature and leave BCp1 unset.
        extent.addAttribute("BCp1", ",");
    }

    extent.addAttribute("WORDNETTAG", BIOFeatureExtractor.getWordNetTags(wordnet, extent));
    extent.addAttribute("WORDNETHYM", BIOFeatureExtractor.getWordNetHyms(wordnet, extent));
}