edu.stanford.nlp.ie.crf.CRFBiasedClassifier Java code examples

// Excerpt with lines elided (the opening conditions and the closing braces are not shown):
// builds a CRFBiasedClassifier from props, loads a model, sets a bias weight for a class,
// and then processes the test file in one of four output modes.
CRFBiasedClassifier<CoreLabel> crf = new CRFBiasedClassifier<>(props);
String testFile = crf.flags.testFile;
String loadPath = crf.flags.loadClassifier;
 // First branch of the load chain (its condition is not shown): load from loadPath.
 crf.loadClassifierNoExceptions(loadPath, props);
} else if (crf.flags.loadJarClassifier != null) {
 // Second branch: the loadJarClassifier flag is set, so load from that location.
 crf.loadClassifierNoExceptions(crf.flags.loadJarClassifier, props);
} else {
 // Last branch: fall back to the default classifier.
 crf.loadDefaultClassifier();
  // 'bias' is declared in lines not shown; its first token is read as the class name
  // and its second token is parsed as the weight.
  String cname = bias.nextToken();
  double w = Double.parseDouble(bias.nextToken());
  crf.setBiasWeight(cname,w);
  log.info("Setting bias for class "+cname+" to "+w);
 DocumentReaderAndWriter<CoreLabel> readerAndWriter = crf.makeReaderAndWriter();
 // Exactly one output mode runs; the flags are checked in this order:
 // printFirstOrderProbs, printProbs, useKBest, then plain classification.
 if (crf.flags.printFirstOrderProbs) {
  crf.printFirstOrderProbs(testFile, readerAndWriter);
 } else if (crf.flags.printProbs) {
  crf.printProbs(testFile, readerAndWriter);
 } else if (crf.flags.useKBest) {
  // k is taken from the kBest flag.
  int k = crf.flags.kBest;
  crf.classifyAndWriteAnswersKBest(testFile, k, readerAndWriter);
 } else {
  crf.classifyAndWriteAnswers(testFile, readerAndWriter, true);

/**
 * Stores {@code weight} as the bias-feature weight of one class.
 *
 * @param cindex second index into {@code weights}, selecting the class
 * @param weight value written to {@code weights[biasFeatureRow][cindex]}
 */
public void setBiasWeight(int cindex, double weight) {
 // Runs before the lookup below; presumably registers BIAS in featureIndex -- confirm.
 addBiasFeature();
 final int biasFeatureRow = featureIndex.indexOf(BIAS);
 weights[biasFeatureRow][cindex] = weight;
}

/**
 * Classifies the tokens of every sentence with the true-caser and copies each
 * classifier answer onto the corresponding token as its true-case tag, then
 * calls {@code setTrueCaseText} on that token.
 *
 * @param annotation annotation that must contain a SentencesAnnotation entry
 * @throws RuntimeException if the annotation has no SentencesAnnotation key
 */
@Override
public void annotate(Annotation annotation) {
 if (verbose) {
  log.info("Adding true-case annotation...");
 }
 // Guard clause: nothing can be classified without sentences.
 if (!annotation.containsKey(CoreAnnotations.SentencesAnnotation.class)) {
  throw new RuntimeException("unable to find sentences in: " + annotation);
 }
 for (CoreMap sentence : annotation.get(CoreAnnotations.SentencesAnnotation.class)) {
  List<CoreLabel> tokens = sentence.get(CoreAnnotations.TokensAnnotation.class);
  List<CoreLabel> classified = this.trueCaser.classifySentence(tokens);
  final int tokenCount = tokens.size();
  for (int pos = 0; pos < tokenCount; pos++) {
   // The classifier's answer for position pos becomes the token's true-case tag.
   String trueCaseTag = classified.get(pos).get(CoreAnnotations.AnswerAnnotation.class);
   CoreLabel token = tokens.get(pos);
   token.set(CoreAnnotations.TrueCaseAnnotation.class, trueCaseTag);
   setTrueCaseText(token);
  }
 }
}

/**
 * Builds a true-case annotator backed by a {@code CRFBiasedClassifier}.
 *
 * @param modelLoc location of the classifier to load; must not be null
 * @param classBias comma-separated {@code class:weight} pairs (for example
 *     {@code A:0.5,B:1.5}), or null to set no bias weights
 * @param mixedCaseFileName passed to {@code loadMixedCaseMap}; when non-null it is
 *     also stored as the {@code mixedCaseMapFile} property
 * @param overwriteText stored in the {@code overwriteText} field
 * @param verbose when true, every bias weight that is set gets logged
 * @throws RuntimeException if {@code modelLoc} is null
 */
public TrueCaseAnnotator(String modelLoc,
             String classBias,
             String mixedCaseFileName,
             boolean overwriteText,
             boolean verbose) {
 this.overwriteText = overwriteText;
 this.verbose = verbose;
 // Validate before building the properties: java.util.Properties rejects null
 // values, so a null modelLoc would otherwise surface as a bare
 // NullPointerException instead of this descriptive error.
 if (modelLoc == null) {
  throw new RuntimeException("Model location not specified for true-case classifier!");
 }
 // Only non-null settings are stored, for the same reason; this keeps the
 // "classBias == null means no bias" path below reachable.
 Properties props = new Properties();
 props.setProperty("loadClassifier", modelLoc);
 if (mixedCaseFileName != null) {
  props.setProperty("mixedCaseMapFile", mixedCaseFileName);
 }
 if (classBias != null) {
  props.setProperty("classBias", classBias);
 }
 trueCaser = new CRFBiasedClassifier<>(props);
 trueCaser.loadClassifierNoExceptions(modelLoc, props);
 if (classBias != null) {
  // Outer tokenizer splits the pairs on ','; inner tokenizer splits each pair on ':'.
  StringTokenizer biases = new StringTokenizer(classBias, ",");
  while (biases.hasMoreTokens()) {
   StringTokenizer bias = new StringTokenizer(biases.nextToken(), ":");
   String cname = bias.nextToken();
   double w = Double.parseDouble(bias.nextToken());
   trueCaser.setBiasWeight(cname, w);
   if (this.verbose) {
    log.info("Setting bias for class " + cname + " to " + w);
   }
  }
 }
 // Load map containing mixed-case words:
 mixedCaseMap = loadMixedCaseMap(mixedCaseFileName);
}

// Excerpt with lines elided (the 'if' that opens the chain and the closing braces are
// not shown): configures props, creates the true-case classifier, loads its model and
// sets a bias weight for a class.
props.setProperty("mixedCaseMapFile", mixedCaseFileName);
props.setProperty("classBias", classBias);
// NOTE(review): raw CRFBiasedClassifier type here -- consider parameterizing it.
trueCaser = new CRFBiasedClassifier(props);
 // First branch (its condition is not shown): load the model from modelLoc.
 trueCaser.loadClassifierNoExceptions(modelLoc, props);
} else {
 throw new RuntimeException("Model location not specified for true-case classifier!");
  // 'bias' is declared in lines not shown; its first token is read as the class name
  // and its second token is parsed as the weight.
  String cname = bias.nextToken();
  double w = Double.parseDouble(bias.nextToken());
  trueCaser.setBiasWeight(cname,w);
  if(VERBOSE) System.err.println("Setting bias for class "+cname+" to "+w);

// Excerpt with lines elided (the opening conditions and the closing braces are not shown):
// builds a CRFBiasedClassifier from props, loads a model, sets a bias weight for a class,
// and then processes the test file in one of four output modes.
CRFBiasedClassifier<CoreLabel> crf = new CRFBiasedClassifier<>(props);
String testFile = crf.flags.testFile;
String loadPath = crf.flags.loadClassifier;
 // First branch of the load chain (its condition is not shown): load from loadPath.
 crf.loadClassifierNoExceptions(loadPath, props);
} else if (crf.flags.loadJarClassifier != null) {
 // Second branch: the loadJarClassifier flag is set, so load from that location.
 crf.loadClassifierNoExceptions(crf.flags.loadJarClassifier, props);
} else {
 // Last branch: fall back to the default classifier.
 crf.loadDefaultClassifier();
  // 'bias' is declared in lines not shown; its first token is read as the class name
  // and its second token is parsed as the weight.
  String cname = bias.nextToken();
  double w = Double.parseDouble(bias.nextToken());
  crf.setBiasWeight(cname,w);
  log.info("Setting bias for class "+cname+" to "+w);
 DocumentReaderAndWriter<CoreLabel> readerAndWriter = crf.makeReaderAndWriter();
 // Exactly one output mode runs; the flags are checked in this order:
 // printFirstOrderProbs, printProbs, useKBest, then plain classification.
 if (crf.flags.printFirstOrderProbs) {
  crf.printFirstOrderProbs(testFile, readerAndWriter);
 } else if (crf.flags.printProbs) {
  crf.printProbs(testFile, readerAndWriter);
 } else if (crf.flags.useKBest) {
  // k is taken from the kBest flag.
  int k = crf.flags.kBest;
  crf.classifyAndWriteAnswersKBest(testFile, k, readerAndWriter);
 } else {
  crf.classifyAndWriteAnswers(testFile, readerAndWriter, true);

// Excerpt with lines elided (the 'if' that opens the chain and the closing braces are
// not shown): configures props, creates the true-case classifier, loads its model and
// sets a bias weight for a class.
props.setProperty("mixedCaseMapFile", mixedCaseFileName);
props.setProperty("classBias", classBias);
// NOTE(review): raw CRFBiasedClassifier type here -- consider parameterizing it.
trueCaser = new CRFBiasedClassifier(props);
 // First branch (its condition is not shown): load the model from modelLoc.
 trueCaser.loadClassifierNoExceptions(modelLoc, props);
} else {
 throw new RuntimeException("Model location not specified for true-case classifier!");
  // 'bias' is declared in lines not shown; its first token is read as the class name
  // and its second token is parsed as the weight.
  String cname = bias.nextToken();
  double w = Double.parseDouble(bias.nextToken());
  trueCaser.setBiasWeight(cname,w);
  if(VERBOSE) System.err.println("Setting bias for class "+cname+" to "+w);

/**
 * Stores {@code weight} as the bias-feature weight of one class.
 *
 * @param cindex second index into {@code weights}, selecting the class
 * @param weight value written to {@code weights[biasFeatureRow][cindex]}
 */
public void setBiasWeight(int cindex, double weight) {
 // Runs before the lookup below; presumably registers BIAS in featureIndex -- confirm.
 addBiasFeature();
 final int biasFeatureRow = featureIndex.indexOf(BIAS);
 weights[biasFeatureRow][cindex] = weight;
}

/**
 * Classifies the tokens of every sentence with the true-caser and copies each
 * classifier answer onto the corresponding token as its true-case tag, then
 * calls {@code setTrueCaseText} on that token.
 *
 * @param annotation annotation that must contain a SentencesAnnotation entry
 * @throws RuntimeException if the annotation has no SentencesAnnotation key
 */
@SuppressWarnings("unchecked")
public void annotate(Annotation annotation) {
 if (VERBOSE) {
  System.err.print("Adding true-case annotation...");
 }
 // Guard clause: nothing can be classified without sentences.
 if (!annotation.containsKey(CoreAnnotations.SentencesAnnotation.class)) {
  throw new RuntimeException("unable to find sentences in: " + annotation);
 }
 for (CoreMap sentence : annotation.get(CoreAnnotations.SentencesAnnotation.class)) {
  List<CoreLabel> tokens = sentence.get(CoreAnnotations.TokensAnnotation.class);
  List<CoreLabel> classified = this.trueCaser.classifySentence(tokens);
  for (int pos = 0; pos < tokens.size(); pos++) {
   // The classifier's answer for position pos becomes the token's true-case tag.
   String trueCaseTag = classified.get(pos).get(CoreAnnotations.AnswerAnnotation.class);
   CoreLabel token = tokens.get(pos);
   token.set(CoreAnnotations.TrueCaseAnnotation.class, trueCaseTag);
   setTrueCaseText(token);
  }
 }
}

// Excerpt with lines elided (the opening conditions and the closing braces are not shown):
// builds a CRFBiasedClassifier from props, loads a model, sets a bias weight for a class,
// and then processes the test file in one of four output modes.
CRFBiasedClassifier<CoreLabel> crf = new CRFBiasedClassifier<CoreLabel>(props);
String testFile = crf.flags.testFile;
String loadPath = crf.flags.loadClassifier;
 // First branch of the load chain (its condition is not shown): load from loadPath.
 crf.loadClassifierNoExceptions(loadPath, props);
} else if (crf.flags.loadJarClassifier != null) {
 // Second branch: the loadJarClassifier flag is set, so load via loadJarClassifier.
 crf.loadJarClassifier(crf.flags.loadJarClassifier, props);
} else {
 // Last branch: fall back to the default classifier.
 crf.loadDefaultClassifier();
  // 'bias' is declared in lines not shown; its first token is read as the class name
  // and its second token is parsed as the weight.
  String cname = bias.nextToken();
  double w = Double.parseDouble(bias.nextToken());
  crf.setBiasWeight(cname,w);
  System.err.println("Setting bias for class "+cname+" to "+w);
 DocumentReaderAndWriter<CoreLabel> readerAndWriter = crf.makeReaderAndWriter();
 // Exactly one output mode runs; the flags are checked in this order:
 // printFirstOrderProbs, printProbs, useKBest, then plain classification.
 if (crf.flags.printFirstOrderProbs) {
  crf.printFirstOrderProbs(testFile, readerAndWriter);
 } else if (crf.flags.printProbs) {
  crf.printProbs(testFile, readerAndWriter);
 } else if (crf.flags.useKBest) {
  // k is taken from the kBest flag.
  int k = crf.flags.kBest;
  crf.classifyAndWriteAnswersKBest(testFile, k, readerAndWriter);
 } else {
  crf.classifyAndWriteAnswers(testFile, readerAndWriter);

/**
 * Builds a true-case annotator backed by a {@code CRFBiasedClassifier}.
 *
 * @param modelLoc location of the classifier to load; must not be null
 * @param classBias comma-separated {@code class:weight} pairs (for example
 *     {@code A:0.5,B:1.5}), or null to set no bias weights
 * @param mixedCaseFileName passed to {@code loadMixedCaseMap}; when non-null it is
 *     also stored as the {@code mixedCaseMapFile} property
 * @param overwriteText stored in the {@code overwriteText} field
 * @param verbose when true, every bias weight that is set gets logged
 * @throws RuntimeException if {@code modelLoc} is null
 */
public TrueCaseAnnotator(String modelLoc,
             String classBias,
             String mixedCaseFileName,
             boolean overwriteText,
             boolean verbose) {
 this.overwriteText = overwriteText;
 this.verbose = verbose;
 // Validate before building the properties: java.util.Properties rejects null
 // values, so a null modelLoc would otherwise surface as a bare
 // NullPointerException instead of this descriptive error.
 if (modelLoc == null) {
  throw new RuntimeException("Model location not specified for true-case classifier!");
 }
 // Only non-null settings are stored, for the same reason; this keeps the
 // "classBias == null means no bias" path below reachable.
 Properties props = new Properties();
 props.setProperty("loadClassifier", modelLoc);
 if (mixedCaseFileName != null) {
  props.setProperty("mixedCaseMapFile", mixedCaseFileName);
 }
 if (classBias != null) {
  props.setProperty("classBias", classBias);
 }
 trueCaser = new CRFBiasedClassifier<>(props);
 trueCaser.loadClassifierNoExceptions(modelLoc, props);
 if (classBias != null) {
  // Outer tokenizer splits the pairs on ','; inner tokenizer splits each pair on ':'.
  StringTokenizer biases = new StringTokenizer(classBias, ",");
  while (biases.hasMoreTokens()) {
   StringTokenizer bias = new StringTokenizer(biases.nextToken(), ":");
   String cname = bias.nextToken();
   double w = Double.parseDouble(bias.nextToken());
   trueCaser.setBiasWeight(cname, w);
   if (this.verbose) {
    log.info("Setting bias for class " + cname + " to " + w);
   }
  }
 }
 // Load map containing mixed-case words:
 mixedCaseMap = loadMixedCaseMap(mixedCaseFileName);
}

/**
 * Stores {@code weight} as the bias-feature weight of one class.
 *
 * @param cindex second index into {@code weights}, selecting the class
 * @param weight value written to {@code weights[biasFeatureRow][cindex]}
 */
public void setBiasWeight(int cindex, double weight) {
 // Runs before the lookup below; presumably registers BIAS in featureIndex -- confirm.
 addBiasFeature();
 final int biasFeatureRow = featureIndex.indexOf(BIAS);
 weights[biasFeatureRow][cindex] = weight;
}

/**
 * Classifies the tokens of every sentence with the true-caser and copies each
 * classifier answer onto the corresponding token as its true-case tag, then
 * calls {@code setTrueCaseText} on that token.
 *
 * @param annotation annotation that must contain a SentencesAnnotation entry
 * @throws RuntimeException if the annotation has no SentencesAnnotation key
 */
@SuppressWarnings("unchecked")
public void annotate(Annotation annotation) {
 if (VERBOSE) {
  System.err.print("Adding true-case annotation...");
 }
 // Guard clause: nothing can be classified without sentences.
 if (!annotation.containsKey(CoreAnnotations.SentencesAnnotation.class)) {
  throw new RuntimeException("unable to find sentences in: " + annotation);
 }
 for (CoreMap sentence : annotation.get(CoreAnnotations.SentencesAnnotation.class)) {
  List<CoreLabel> tokens = sentence.get(CoreAnnotations.TokensAnnotation.class);
  List<CoreLabel> classified = this.trueCaser.classifySentence(tokens);
  for (int pos = 0; pos < tokens.size(); pos++) {
   // The classifier's answer for position pos becomes the token's true-case tag.
   String trueCaseTag = classified.get(pos).get(AnswerAnnotation.class);
   CoreLabel token = tokens.get(pos);
   token.set(CoreAnnotations.TrueCaseAnnotation.class, trueCaseTag);
   setTrueCaseText(token);
  }
 }
}

// Excerpt with lines elided (the opening conditions and the closing braces are not shown):
// builds a CRFBiasedClassifier from props, loads a model, sets a bias weight for a class,
// and then processes the test file in one of four output modes.
// NOTE(review): CRFBiasedClassifier and DocumentReaderAndWriter are used as raw types here.
CRFBiasedClassifier crf = new CRFBiasedClassifier(props);
String testFile = crf.flags.testFile;
String loadPath = crf.flags.loadClassifier;
 // First branch of the load chain (its condition is not shown): load from loadPath.
 crf.loadClassifierNoExceptions(loadPath, props);
} else if (crf.flags.loadJarClassifier != null) {
 // Second branch: the loadJarClassifier flag is set, so load via loadJarClassifier.
 crf.loadJarClassifier(crf.flags.loadJarClassifier, props);
} else {
 // Last branch: fall back to the default classifier.
 crf.loadDefaultClassifier();
  // 'bias' is declared in lines not shown; its first token is read as the class name
  // and its second token is parsed as the weight.
  String cname = bias.nextToken();
  double w = Double.parseDouble(bias.nextToken());
  crf.setBiasWeight(cname,w);
  System.err.println("Setting bias for class "+cname+" to "+w);
 DocumentReaderAndWriter readerAndWriter = crf.makeReaderAndWriter();
 // Exactly one output mode runs; the flags are checked in this order:
 // printFirstOrderProbs, printProbs, useKBest, then plain classification.
 if (crf.flags.printFirstOrderProbs) {
  crf.printFirstOrderProbs(testFile, readerAndWriter);
 } else if (crf.flags.printProbs) {
  crf.printProbs(testFile, readerAndWriter);
 } else if (crf.flags.useKBest) {
  // k is taken from the kBest flag.
  int k = crf.flags.kBest;
  crf.classifyAndWriteAnswersKBest(testFile, k, readerAndWriter);
 } else {
  crf.classifyAndWriteAnswers(testFile, readerAndWriter);

/**
 * Stores {@code weight} as the bias-feature weight of one class.
 *
 * @param cindex second index into {@code weights}, selecting the class
 * @param weight value written to {@code weights[biasFeatureRow][cindex]}
 */
public void setBiasWeight(int cindex, double weight) {
 // Runs before the lookup below; presumably registers BIAS in featureIndex -- confirm.
 addBiasFeature();
 final int biasFeatureRow = featureIndex.indexOf(BIAS);
 weights[biasFeatureRow][cindex] = weight;
}

/**
 * Classifies the tokens of every sentence with the true-caser and copies each
 * classifier answer onto the corresponding token as its true-case tag, then
 * calls {@code setTrueCaseText} on that token.
 *
 * @param annotation annotation that must contain a SentencesAnnotation entry
 * @throws RuntimeException if the annotation has no SentencesAnnotation key
 */
@Override
public void annotate(Annotation annotation) {
 if (verbose) {
  log.info("Adding true-case annotation...");
 }
 // Guard clause: nothing can be classified without sentences.
 if (!annotation.containsKey(CoreAnnotations.SentencesAnnotation.class)) {
  throw new RuntimeException("unable to find sentences in: " + annotation);
 }
 for (CoreMap sentence : annotation.get(CoreAnnotations.SentencesAnnotation.class)) {
  List<CoreLabel> tokens = sentence.get(CoreAnnotations.TokensAnnotation.class);
  List<CoreLabel> classified = this.trueCaser.classifySentence(tokens);
  final int tokenCount = tokens.size();
  for (int pos = 0; pos < tokenCount; pos++) {
   // The classifier's answer for position pos becomes the token's true-case tag.
   String trueCaseTag = classified.get(pos).get(CoreAnnotations.AnswerAnnotation.class);
   CoreLabel token = tokens.get(pos);
   token.set(CoreAnnotations.TrueCaseAnnotation.class, trueCaseTag);
   setTrueCaseText(token);
  }
 }
}

Javadoc

CRFBiasedClassifier is used to adjust the precision-recall tradeoff of any CRF model implemented using CRFClassifier. This adjustment is performed after CRF training. The method is described in Minkov, Wang, Tomasic, and Cohen (2006): "NER Systems that Suit User's Preferences: Adjusting the Recall-Precision Trade-off for Entity Extraction". CRFBiasedClassifier can import any model serialized with CRFClassifier and supports most command-line parameters available in CRFClassifier. In addition, CRFBiasedClassifier interprets the parameter -classBias, as in:

java -server -mx500m edu.stanford.nlp.ie.crf.CRFBiasedClassifier -loadClassifier model.gz -testFile test.txt -classBias A:0.5,B:1.5

The command above sets a bias of 0.5 towards class A and a bias of 1.5 towards class B. These biases (which internally are treated as feature weights in the log-linear model underpinning the CRF classifier) can take any real value. As the weight of A tends towards plus infinity, the classifier will only predict A labels, and as it tends towards minus infinity, it will never predict A labels.

Most used methods

Popular in Java

Running tasks concurrently on multiple threads
getContentResolver (Context)
getExternalFilesDir (Context)
addToBackStack (FragmentTransaction)
BufferedReader (java.io)
Wraps an existing Reader and buffers the input. Expensive interaction with the underlying reader is
BufferedWriter (java.io)
Wraps an existing Writer and buffers the output. Expensive interaction with the underlying writer is…
KeyStore (java.security)
KeyStore is responsible for maintaining cryptographic keys and their owners. The type of the syste
Calendar (java.util)
Calendar is an abstract base class for converting between a Date object and a set of integer fields
SortedSet (java.util)
SortedSet is a Set which iterates over its elements in a sorted order. The order is determined eithe
JLabel (javax.swing)
Best plugins for Eclipse

How to use CRFBiasedClassifier in edu.stanford.nlp.ie.crf

Best Java code snippets using edu.stanford.nlp.ie.crf.CRFBiasedClassifier (Showing top 16 results out of 315)

How to use
CRFBiasedClassifier
in
edu.stanford.nlp.ie.crf