/**
 * Trains a CRF until convergence, with no cap on the number of iterations.
 *
 * @param training the labeled instances to train on
 * @return true if training converged
 */
public boolean trainIncremental (InstanceList training)
{
	// Delegate to the bounded variant with an effectively unlimited iteration budget.
	return train (training, Integer.MAX_VALUE);
}
assert (trainingSet.size() > 0); getOptimizableCRF(trainingSet); // This will set this.mcrf if necessary getOptimizer(trainingSet); // This will set this.opt if necessary +(System.currentTimeMillis()-startTime)/1000 + " secs."); iterationCount++; runEvaluators(); } catch (OptimizationException e) { ++numResets; opt = null; getOptimizer(trainingSet);
/**
 * Trains the CRF on the sentences of the given text block.
 * <p>
 * Each sentence is piped into an {@code InstanceList}. On the first call the CRF and its
 * trainer are built lazily (fully-connected label states, label-likelihood objective,
 * no optimizer resets); subsequent calls reuse them and continue training.
 *
 * @param textBlock the block whose sentences provide training data
 * @throws Exception if piping or training fails
 */
public void train(TextBlock textBlock) throws Exception {
	InstanceList instances = new InstanceList(getPipes());
	for (TextSentence sentence : textBlock) {
		instances.addThruPipe(new TextInstance(sentence, getTargetAlphabet()));
	}
	if (crf == null) {
		// First call: build the model and its trainer once.
		crf = new CRF(getPipes(), null);
		crf.addFullyConnectedStatesForLabels();
		crf.setWeightsDimensionAsIn(instances, false);
		CRFOptimizableByLabelLikelihood objective =
			new CRFOptimizableByLabelLikelihood(crf, instances);
		Optimizable.ByGradientValue[] objectives =
			new Optimizable.ByGradientValue[] { objective };
		crfTrainer = new CRFTrainerByValueGradients(crf, objectives);
		crfTrainer.setMaxResets(0); // fail fast rather than restarting the optimizer
	}
	crfTrainer.train(instances, Integer.MAX_VALUE);
}
/** * Returns a L-BFGS optimizer, creating if one doesn't exist. * <p> * Also creates an optimizable CRF if required. */ public Optimizer getOptimizer (InstanceList trainingSet) { getOptimizableCRF(trainingSet); // this will set this.mcrf if necessary if (opt == null || ocrf != opt.getOptimizable()) opt = new LimitedMemoryBFGS(ocrf); // Alternative: opt = new ConjugateGradient (0.001); return opt; }
assert (trainingSet.size() > 0); getOptimizableCRF(trainingSet); // This will set this.mcrf if necessary getOptimizer(trainingSet); // This will set this.opt if necessary +(System.currentTimeMillis()-startTime)/1000 + " secs."); iterationCount++; runEvaluators(); } catch (OptimizationException e) { ++numResets; opt = null; getOptimizer(trainingSet);
/** * Returns a L-BFGS optimizer, creating if one doesn't exist. * <p> * Also creates an optimizable CRF if required. */ public Optimizer getOptimizer (InstanceList trainingSet) { getOptimizableCRF(trainingSet); // this will set this.mcrf if necessary if (opt == null || ocrf != opt.getOptimizable()) opt = new LimitedMemoryBFGS(ocrf); // Alternative: opt = new ConjugateGradient (0.001); return opt; }
assert (trainingSet.size() > 0); getOptimizableCRF(trainingSet); // This will set this.mcrf if necessary getOptimizer(trainingSet); // This will set this.opt if necessary +(System.currentTimeMillis()-startTime)/1000 + " secs."); iterationCount++; runEvaluators(); } catch (OptimizationException e) { ++numResets; opt = null; getOptimizer(trainingSet);
/**
 * Trains a CRF until convergence, with no cap on the number of iterations.
 *
 * @param training the labeled instances to train on
 * @return true if training converged
 */
public boolean trainIncremental (InstanceList training)
{
	// Delegate to the bounded variant with an effectively unlimited iteration budget.
	return train (training, Integer.MAX_VALUE);
}
/** * Returns a L-BFGS optimizer, creating if one doesn't exist. * <p> * Also creates an optimizable CRF if required. */ public Optimizer getOptimizer (InstanceList trainingSet) { getOptimizableCRF(trainingSet); // this will set this.mcrf if necessary if (opt == null || ocrf != opt.getOptimizable()) opt = new LimitedMemoryBFGS(ocrf); // Alternative: opt = new ConjugateGradient (0.001); return opt; }
/**
 * Trains a CRF until convergence, with no cap on the number of iterations.
 *
 * @param training the labeled instances to train on
 * @return true if training converged
 */
public boolean trainIncremental (InstanceList training)
{
	// Delegate to the bounded variant with an effectively unlimited iteration budget.
	return train (training, Integer.MAX_VALUE);
}
/**
 * Train a CRF on various-sized subsets of the data. This method is typically used to
 * accelerate training by quickly getting to reasonable parameters on only a subset of
 * the data first, then on progressively more data.
 *
 * @param training The training Instances.
 * @param numIterationsPerProportion Maximum number of Maximizer iterations per training proportion.
 * @param trainingProportions If non-null, train on increasingly
 * larger portions of the data, e.g. new double[] {0.2, 0.5, 1.0}. This can sometimes
 * speedup convergence. Be sure to end in 1.0 if you want to train on all the data in the end.
 * @return True if training has converged.
 */
public boolean train (InstanceList training, int numIterationsPerProportion, double[] trainingProportions)
{
	assert (trainingProportions.length > 0);
	boolean converged = false;
	for (double proportion : trainingProportions) {
		assert (proportion <= 1.0);
		logger.info ("Training on "+proportion+"% of the data this round.");
		if (proportion == 1.0) {
			converged = this.train (training, numIterationsPerProportion);
		} else {
			// Deterministic split (fixed seed) so each round sees a stable subset.
			InstanceList subset = training.split (new Random(1),
				new double[] {proportion, 1 - proportion})[0];
			converged = this.train (subset, numIterationsPerProportion);
		}
	}
	return converged;
}
/**
 * Train a CRF on various-sized subsets of the data. This method is typically used to
 * accelerate training by quickly getting to reasonable parameters on only a subset of
 * the data first, then on progressively more data.
 *
 * @param training The training Instances.
 * @param numIterationsPerProportion Maximum number of Maximizer iterations per training proportion.
 * @param trainingProportions If non-null, train on increasingly
 * larger portions of the data, e.g. new double[] {0.2, 0.5, 1.0}. This can sometimes
 * speedup convergence. Be sure to end in 1.0 if you want to train on all the data in the end.
 * @return True if training has converged.
 */
public boolean train (InstanceList training, int numIterationsPerProportion, double[] trainingProportions)
{
	assert (trainingProportions.length > 0);
	boolean converged = false;
	for (double proportion : trainingProportions) {
		assert (proportion <= 1.0);
		logger.info ("Training on "+proportion+"% of the data this round.");
		if (proportion == 1.0) {
			converged = this.train (training, numIterationsPerProportion);
		} else {
			// Deterministic split (fixed seed) so each round sees a stable subset.
			InstanceList subset = training.split (new Random(1),
				new double[] {proportion, 1 - proportion})[0];
			converged = this.train (subset, numIterationsPerProportion);
		}
	}
	return converged;
}
/**
 * Train a CRF on various-sized subsets of the data. This method is typically used to
 * accelerate training by quickly getting to reasonable parameters on only a subset of
 * the data first, then on progressively more data.
 *
 * @param training The training Instances.
 * @param numIterationsPerProportion Maximum number of Maximizer iterations per training proportion.
 * @param trainingProportions If non-null, train on increasingly
 * larger portions of the data, e.g. new double[] {0.2, 0.5, 1.0}. This can sometimes
 * speedup convergence. Be sure to end in 1.0 if you want to train on all the data in the end.
 * @return True if training has converged.
 */
public boolean train (InstanceList training, int numIterationsPerProportion, double[] trainingProportions)
{
	assert (trainingProportions.length > 0);
	boolean converged = false;
	for (double proportion : trainingProportions) {
		assert (proportion <= 1.0);
		logger.info ("Training on "+proportion+"% of the data this round.");
		if (proportion == 1.0) {
			converged = this.train (training, numIterationsPerProportion);
		} else {
			// Deterministic split (fixed seed) so each round sees a stable subset.
			InstanceList subset = training.split (new Random(1),
				new double[] {proportion, 1 - proportion})[0];
			converged = this.train (subset, numIterationsPerProportion);
		}
	}
	return converged;
}