/**
 * Tells whether the term's morphofeat tag starts with {@code JJ}, {@code RB} or {@code VB}
 * (the adjective, adverb and verb tag families of the Penn Treebank tagset).
 *
 * @param term the term to inspect, not null
 * @return {@code true} if the tag has one of the three prefixes; {@code false} otherwise,
 *         including when the term carries no morphofeat tag at all
 */
private static boolean isAttributeTerm(final Term term) {
    final String pos = term.getMorphofeat();
    // An untagged term cannot be classified; report "no" instead of failing with an NPE.
    if (pos == null) {
        return false;
    }
    return pos.startsWith("JJ") || pos.startsWith("RB") || pos.startsWith("VB");
}
/**
 * Classifies a verb term as active or not.
 *
 * <ul>
 * <li>Terms whose morphofeat tag is missing or does not start with {@code V} yield
 * {@code null} (the question does not apply).</li>
 * <li>Any verb tag other than {@code VBN}, and the word "been" (compared ignoring case),
 * yield {@code Boolean.TRUE}.</li>
 * <li>Every other {@code VBN} term is decided by {@code isActiveFormHelper}.</li>
 * </ul>
 *
 * @param document the document the term belongs to; only handed on to the helper
 * @param term the term to classify, not null
 * @return {@code Boolean.TRUE}, the helper's result, or {@code null} as described above
 */
public static Boolean isActiveForm(final KAFDocument document, final Term term) {
    final String pos = term.getMorphofeat();
    // A missing tag is treated like a non-verb tag rather than causing an NPE.
    if (pos == null || !pos.startsWith("V")) {
        return null;
    }
    // The surface form is only needed for VBN terms, so it is fetched lazily here;
    // equalsIgnoreCase is locale-independent and tolerates a null surface form.
    if (!pos.equals("VBN") || "been".equalsIgnoreCase(term.getStr())) {
        return Boolean.TRUE;
    }
    return isActiveFormHelper(document, term);
}
public static String extendedPos(final KAFDocument document, final Term term) { final String pos = term.getMorphofeat(); final String lemma = term.getLemma().toLowerCase(); if ("some".equals(lemma) || "many".equals(lemma) || "all".equals(lemma) || "few".equals(lemma) || "this".equals(lemma) || "these".equals(lemma) || "that".equals(lemma) || "those".equals(lemma)) { final Dep dep = document.getDepToTerm(term); if (dep == null || !"NMOD".equals(dep.getRfunc())) { return pos + "P"; // determiner (DT) or adj (JJ) used as demonstrative pronoun } } return pos; }
/**
 * Writes one token as a single tab-separated row terminated by a newline.
 *
 * <p>Column layout: index, form, {@code _}, form, {@code _}, morphofeat, ten {@code _}
 * placeholders, and finally {@code last}.
 *
 * @param writer destination of the row
 * @param token the term whose form and morphofeat are written
 * @param i the index written in the first column
 * @param last the content of the final column
 * @throws IOException if the writer fails
 */
public static void printToken(Appendable writer, Term token, int i, String last) throws IOException {
    final String form = token.getForm();

    // Integer.toString always emits ASCII digits; String.format("%d", ...) localizes the
    // digits according to the default locale, which would corrupt the index column.
    writer.append(Integer.toString(i)).append('\t');
    writer.append(form).append('\t');
    writer.append("_\t");
    writer.append(form).append('\t');
    writer.append("_\t");
    writer.append(token.getMorphofeat()).append('\t');

    // Ten unused columns, each filled with the "_" placeholder.
    for (int column = 0; column < 10; column++) {
        writer.append("_\t");
    }

    writer.append(last);
    writer.append('\n');
}
/**
 * Writes one token as a single tab-separated row terminated by a newline.
 *
 * <p>Column layout: index, form, {@code _}, form, {@code _}, morphofeat, ten {@code _}
 * placeholders, and finally {@code last}.
 *
 * @param writer destination of the row
 * @param token the term whose form and morphofeat are written
 * @param i the index written in the first column
 * @param last the content of the final column
 * @throws IOException if the writer fails
 */
public static void printToken(Appendable writer, Term token, int i, String last) throws IOException {
    final String form = token.getForm();

    // Integer.toString always emits ASCII digits; String.format("%d", ...) localizes the
    // digits according to the default locale, which would corrupt the index column.
    writer.append(Integer.toString(i)).append('\t');
    writer.append(form).append('\t');
    writer.append("_\t");
    writer.append(form).append('\t');
    writer.append("_\t");
    writer.append(token.getMorphofeat()).append('\t');

    // Ten unused columns, each filled with the "_" placeholder.
    for (int column = 0; column < 10; column++) {
        writer.append("_\t");
    }

    writer.append(last);
    writer.append('\n');
}
/**
 * Writes one token as a single tab-separated row terminated by a newline.
 *
 * <p>Column layout: index, form, {@code _}, form, {@code _}, morphofeat, ten {@code _}
 * placeholders, and finally {@code last}.
 *
 * @param writer destination of the row
 * @param token the term whose form and morphofeat are written
 * @param i the index written in the first column
 * @param last the content of the final column
 * @throws IOException if the writer fails
 */
public static void printToken(Appendable writer, Term token, int i, String last) throws IOException {
    final String form = token.getForm();

    // Integer.toString always emits ASCII digits; String.format("%d", ...) localizes the
    // digits according to the default locale, which would corrupt the index column.
    writer.append(Integer.toString(i)).append('\t');
    writer.append(form).append('\t');
    writer.append("_\t");
    writer.append(form).append('\t');
    writer.append("_\t");
    writer.append(token.getMorphofeat()).append('\t');

    // Ten unused columns, each filled with the "_" placeholder.
    for (int column = 0; column < 10; column++) {
        writer.append("_\t");
    }

    writer.append(last);
    writer.append('\n');
}
/**
 * Builds a space-separated string from the word forms of the given terms.
 *
 * <p>Terms are processed in the order defined by {@code Term.OFFSET_COMPARATOR}. Word forms
 * of terms whose morphofeat tag starts with {@code NNP} keep their original casing; all
 * other word forms (including those of untagged terms) are lowercased.
 *
 * @param terms the terms to render, not null
 * @return the concatenated text; empty if there are no word forms
 */
public static String getText(final Iterable<Term> terms) {
    final StringBuilder builder = new StringBuilder();
    boolean atBeginning = true;
    for (final Term term : Ordering.from(Term.OFFSET_COMPARATOR).sortedCopy(terms)) {
        final String morphofeat = term.getMorphofeat();
        // A term without a tag is treated as a common word instead of raising an NPE.
        final boolean properNoun = morphofeat != null && morphofeat.startsWith("NNP");
        for (final WF word : term.getWFs()) {
            if (!atBeginning) {
                builder.append(' ');
            }
            // Locale.ROOT makes the lowercasing independent of the JVM default locale
            // (a Turkish default would otherwise turn "I" into a dotless "ı").
            builder.append(properNoun ? word.getForm()
                    : word.getForm().toLowerCase(java.util.Locale.ROOT));
            atBeginning = false;
        }
    }
    return builder.toString();
}
/**
 * Checks a term against the constraints configured on this object. A constraint that is
 * {@code null} is not applied.
 *
 * <ul>
 * <li>{@code pos}: must equal the term's POS ignoring case, or its morphofeat exactly;</li>
 * <li>{@code lemma}: must equal the term's lemma ignoring case;</li>
 * <li>{@code stem}: must equal, ignoring case, the result of
 * {@code Stemming.stem(null, term.getStr())}.</li>
 * </ul>
 *
 * @param term the term to test, possibly null
 * @return {@code true} if the term is non-null and satisfies every configured constraint
 */
public boolean match(@Nullable final Term term) {
    if (term == null) {
        return false;
    }

    // POS constraint: either the coarse POS (case-insensitive) or the exact morphofeat.
    if (this.pos != null
            && !this.pos.equalsIgnoreCase(term.getPos())
            && !this.pos.equals(term.getMorphofeat())) {
        return false;
    }

    // Lemma constraint.
    if (this.lemma != null && !this.lemma.equalsIgnoreCase(term.getLemma())) {
        return false;
    }

    // Stem constraint; the stem is only computed when it is actually required.
    if (this.stem == null) {
        return true;
    }
    final String termStem = Stemming.stem(null, term.getStr());
    return this.stem.equalsIgnoreCase(termStem);
}
/**
 * Removes sense references from every term of the document whose morphofeat tag starts with
 * {@code NNP}. The references removed are those for the resources
 * {@code NAFUtils.RESOURCE_WN_SYNSET}, {@code RESOURCE_WN_SST}, {@code RESOURCE_BBN},
 * {@code RESOURCE_SUMO} and {@code RESOURCE_YAGO}. Terms without a tag are left untouched.
 *
 * @param document the document whose terms are filtered in place
 */
private void applyTermSenseFiltering(final KAFDocument document) {
    for (final Term term : document.getTerms()) {
        final String morphofeat = term.getMorphofeat();
        final boolean isNnp = morphofeat != null && morphofeat.startsWith("NNP");
        if (!isNnp) {
            continue;
        }
        NAFUtils.removeRefs(term, NAFUtils.RESOURCE_WN_SYNSET, null);
        NAFUtils.removeRefs(term, NAFUtils.RESOURCE_WN_SST, null);
        NAFUtils.removeRefs(term, NAFUtils.RESOURCE_BBN, null);
        NAFUtils.removeRefs(term, NAFUtils.RESOURCE_SUMO, null);
        NAFUtils.removeRefs(term, NAFUtils.RESOURCE_YAGO, null);
    }
}
/**
 * Decides whether a term is in active form by climbing the dependency chain above it.
 *
 * <p>Starting from {@code term}, the dependency pointing to the current term is looked up
 * and its source (the parent) is examined. The first rule that applies ends the search:
 * <ol>
 * <li>no dependency points to the current term: {@code FALSE};</li>
 * <li>the parent's morphofeat starts with {@code NN}: {@code FALSE};</li>
 * <li>the parent's word is am/are/is/was/were/be/been/being: {@code FALSE};</li>
 * <li>the parent's word is have/has/had/having: {@code TRUE};</li>
 * <li>the parent's morphofeat is VBZ, VBD, VBP or MD: {@code FALSE};</li>
 * <li>otherwise the search continues from the parent.</li>
 * </ol>
 *
 * <p>NOTE(review): termination relies on the dependency chain being acyclic, and the
 * parent is expected to carry a non-null morphofeat — confirm against callers.
 *
 * @param document the document used to resolve dependencies
 * @param term the term to start from
 * @return {@code Boolean.TRUE} or {@code Boolean.FALSE}, never {@code null}
 */
private static Boolean isActiveFormHelper(final KAFDocument document, final Term term) {
    Term current = term;
    while (true) {
        final Dep dep = document.getDepToTerm(current);
        if (dep == null) {
            return Boolean.FALSE;
        }

        final Term parent = dep.getFrom();
        // Locale.ROOT: under e.g. a Turkish default locale "IS" would lowercase to "ıs"
        // and silently miss the auxiliary checks below.
        final String word = parent.getStr().toLowerCase(java.util.Locale.ROOT);
        final String pos = parent.getMorphofeat();

        if (pos.startsWith("NN")) {
            return Boolean.FALSE;
        }
        if (isOneOf(word, "am", "are", "is", "was", "were", "be", "been", "being")) {
            return Boolean.FALSE;
        }
        if (isOneOf(word, "have", "has", "had", "having")) {
            return Boolean.TRUE;
        }
        if (isOneOf(pos, "VBZ", "VBD", "VBP", "MD")) {
            return Boolean.FALSE;
        }

        // Nothing conclusive at this level: move one step up the chain.
        current = parent;
    }
}

/** Returns whether {@code value} equals at least one of the given candidates. */
private static boolean isOneOf(final String value, final String... candidates) {
    for (final String candidate : candidates) {
        if (candidate.equals(value)) {
            return true;
        }
    }
    return false;
}
final Term t = dep.getTo(); queue.add(t); if ("CC".equals(t.getMorphofeat()) || !Character.isLetter(t.getMorphofeat().charAt(0))) { heads.add(term);
sb.append(thisTerm.getLemma()); sb.append("\t"); sb.append(thisTerm.getMorphofeat()); sb.append("\t"); if (j == 0) { sb.append(thisTerm.getLemma()); sb.append("\t"); sb.append(thisTerm.getMorphofeat()); sb.append("\t"); sb.append(BIO.BEGIN.toString()); sb.append(thisTerm.getLemma()); sb.append("\t"); sb.append(thisTerm.getMorphofeat()); sb.append("\t"); sb.append(BIO.OUT);
if (term.getPos() != null && term.getMorphofeat() != null) { out.append(": pos ").append(term.getPos()).append('/').append(term.getMorphofeat());
final FrameBase.POS pos = FrameBase.POS.forPennTag(head.getMorphofeat());
excludeMask = InstanceMention.ALL; } else { final String pos = head.getMorphofeat(); if (pos.startsWith("NN")) { typeMask = InstanceMention.NOUN;
final String p = head.getMorphofeat().toUpperCase(); if (p.equals("NNS") || p.equals("NNPS")) { emitMeta(mentionID, KS.PLURAL, true);
final boolean named = head.getMorphofeat().startsWith("NNP"); boolean accept = named; if (!accept) { entityToModify.setNamed(head.getMorphofeat().startsWith("NNP")); if (LOGGER.isDebugEnabled()) { LOGGER.debug("Added linked "
.getMorphofeat().startsWith("VB"); final String resource = verb ? "PropBank" : "NomBank"; final ExternalRef ref = NAFUtils.getRef(predicate, resource, null);
termElem.setAttribute("morphofeat", term.getMorphofeat());
termElem.setAttribute("morphofeat", term.getMorphofeat());