opennlp.tools.sentdetect.SentenceDetectorME.train java code examples

 /**
  * Trains a sentence model with default training parameters.
  *
  * <p>This is a convenience overload: it forwards every argument unchanged to the
  * five-argument {@code train} overload and supplies
  * {@code ModelUtil.createDefaultTrainingParameters()} as the training parameters.
  *
  * @param languageCode forwarded unchanged to the delegate overload
  * @param samples forwarded unchanged to the delegate overload
  * @param useTokenEnd forwarded unchanged to the delegate overload
  * @param abbreviations forwarded unchanged to the delegate overload
  * @return the model returned by the delegate overload
  * @throws IOException propagated from the delegate overload
  * @deprecated Use
  *             {@link #train(String, ObjectStream, SentenceDetectorFactory, TrainingParameters)}
  *             and pass in a {@link SentenceDetectorFactory}.
  */
 @Deprecated
 public static SentenceModel train(
   String languageCode,
   ObjectStream<SentenceSample> samples,
   boolean useTokenEnd,
   Dictionary abbreviations) throws IOException {
  return train(
    languageCode,
    samples,
    useTokenEnd,
    abbreviations,
    ModelUtil.createDefaultTrainingParameters());
 }
}

/**
 * Trains a sentence model from explicit settings instead of a factory.
 *
 * <p>Wraps {@code languageCode}, {@code useTokenEnd} and {@code abbreviations} in a new
 * {@link SentenceDetectorFactory} (its fourth constructor argument is left {@code null})
 * and delegates to the factory-based {@code train} overload.
 *
 * @param languageCode passed to the factory and to the delegate overload
 * @param samples the training samples, forwarded unchanged
 * @param useTokenEnd passed to the factory
 * @param abbreviations passed to the factory
 * @param mlParams the training parameters, forwarded unchanged
 * @return the model returned by the factory-based overload
 * @throws IOException propagated from the factory-based overload
 * @deprecated Use
 *             {@link #train(String, ObjectStream, SentenceDetectorFactory, TrainingParameters)}
 *             and pass in a {@link SentenceDetectorFactory}.
 */
@Deprecated
public static SentenceModel train(String languageCode,
  ObjectStream<SentenceSample> samples, boolean useTokenEnd,
  Dictionary abbreviations, TrainingParameters mlParams) throws IOException {
 SentenceDetectorFactory sdFactory = new SentenceDetectorFactory(
   languageCode, useTokenEnd, abbreviations, null);
 return train(languageCode, samples, sdFactory, mlParams);
}

/**
 * Test helper: trains a model for language code {@code "eng"} from
 * {@code createSampleStream()} using the given factory and
 * {@code TrainingParameters.defaultParams()}.
 *
 * @param factory the sentence detector factory handed to the trainer
 * @return the model returned by {@code SentenceDetectorME.train}
 * @throws IOException propagated from sample stream creation or training
 */
private static SentenceModel train(final SentenceDetectorFactory factory) throws IOException {
 return SentenceDetectorME.train(
   "eng",
   createSampleStream(),
   factory,
   TrainingParameters.defaultParams());
}

/**
 * Expects training on the {@code SentencesInsufficient.txt} resource to fail with
 * {@link InsufficientTrainingDataException}.
 *
 * <p>Training runs with 100 iterations and a cutoff of 0.
 *
 * @throws IOException propagated from reading the resource or from training
 */
@Test(expected = InsufficientTrainingDataException.class)
public void testInsufficientData() throws IOException {
 // Factory for "eng" with token-end enabled; the remaining two arguments are left null.
 SentenceDetectorFactory sdFactory = new SentenceDetectorFactory("eng", true, null, null);

 TrainingParameters params = new TrainingParameters();
 params.put(TrainingParameters.ITERATIONS_PARAM, 100);
 params.put(TrainingParameters.CUTOFF_PARAM, 0);

 InputStreamFactory insufficientData = new ResourceAsStreamFactory(
   getClass(), "/opennlp/tools/sentdetect/SentencesInsufficient.txt");

 // The call itself is the assertion: it must throw the expected exception.
 SentenceDetectorME.train(
   "eng",
   new SentenceSampleStream(new PlainTextByLineStream(insufficientData, StandardCharsets.UTF_8)),
   sdFactory,
   params);
}

/**
 * Runs the cross validation.
 *
 * <p>The samples are split by a {@link CrossValidationPartitioner}. For each partition a
 * model is trained on the training stream, evaluated against that partition's test
 * stream, and the resulting F-measure is merged into this object's {@code fmeasure}.
 *
 * @param samples
 *          the data to train and test
 * @param nFolds
 *          number of folds
 *
 * @throws IOException
 *           propagated from partitioning, training or evaluation
 */
public void evaluate(ObjectStream<SentenceSample> samples, int nFolds) throws IOException {
 CrossValidationPartitioner<SentenceSample> folds =
   new CrossValidationPartitioner<>(samples, nFolds);

 while (folds.hasNext()) {
  CrossValidationPartitioner.TrainingSampleStream<SentenceSample> trainingFold = folds.next();

  // Train on the training portion of this fold.
  SentenceModel foldModel =
    SentenceDetectorME.train(languageCode, trainingFold, sdFactory, params);

  // Evaluate on the held-out portion and fold the score into the running total.
  SentenceDetectorME detector = new SentenceDetectorME(foldModel);
  SentenceDetectorEvaluator foldEvaluator = new SentenceDetectorEvaluator(detector, listeners);
  foldEvaluator.evaluate(trainingFold.getTestSampleStream());
  fmeasure.mergeInto(foldEvaluator.getFMeasure());
 }
}

/**
 * Trains a sentence model from explicit settings instead of a factory.
 *
 * <p>Wraps {@code languageCode}, {@code useTokenEnd} and {@code abbreviations} in a new
 * {@link SentenceDetectorFactory} (its fourth constructor argument is left {@code null})
 * and delegates to the factory-based {@code train} overload.
 *
 * @param languageCode passed to the factory and to the delegate overload
 * @param samples the training samples, forwarded unchanged
 * @param useTokenEnd passed to the factory
 * @param abbreviations passed to the factory
 * @param mlParams the training parameters, forwarded unchanged
 * @return the model returned by the factory-based overload
 * @throws IOException propagated from the factory-based overload
 * @deprecated Use
 *             {@link #train(String, ObjectStream, SentenceDetectorFactory, TrainingParameters)}
 *             and pass in a {@link SentenceDetectorFactory}.
 */
@Deprecated
public static SentenceModel train(String languageCode,
  ObjectStream<SentenceSample> samples, boolean useTokenEnd,
  Dictionary abbreviations, TrainingParameters mlParams) throws IOException {
 SentenceDetectorFactory sdFactory = new SentenceDetectorFactory(
   languageCode, useTokenEnd, abbreviations, null);
 return train(languageCode, samples, sdFactory, mlParams);
}

 /**
  * Trains a sentence model with default training parameters.
  *
  * <p>This is a convenience overload: it forwards every argument unchanged to the
  * five-argument {@code train} overload and supplies
  * {@code ModelUtil.createDefaultTrainingParameters()} as the training parameters.
  *
  * @param languageCode forwarded unchanged to the delegate overload
  * @param samples forwarded unchanged to the delegate overload
  * @param useTokenEnd forwarded unchanged to the delegate overload
  * @param abbreviations forwarded unchanged to the delegate overload
  * @return the model returned by the delegate overload
  * @throws IOException propagated from the delegate overload
  * @deprecated Use
  *             {@link #train(String, ObjectStream, SentenceDetectorFactory, TrainingParameters)}
  *             and pass in a {@link SentenceDetectorFactory}.
  */
 @Deprecated
 public static SentenceModel train(
   String languageCode,
   ObjectStream<SentenceSample> samples,
   boolean useTokenEnd,
   Dictionary abbreviations) throws IOException {
  return train(
    languageCode,
    samples,
    useTokenEnd,
    abbreviations,
    ModelUtil.createDefaultTrainingParameters());
 }
}

 /**
  * Trains a sentence model with default training parameters.
  *
  * <p>This is a convenience overload: it forwards every argument unchanged to the
  * five-argument {@code train} overload and supplies
  * {@code ModelUtil.createDefaultTrainingParameters()} as the training parameters.
  *
  * @param languageCode forwarded unchanged to the delegate overload
  * @param samples forwarded unchanged to the delegate overload
  * @param useTokenEnd forwarded unchanged to the delegate overload
  * @param abbreviations forwarded unchanged to the delegate overload
  * @return the model returned by the delegate overload
  * @throws IOException propagated from the delegate overload
  * @deprecated Use
  *             {@link #train(String, ObjectStream, SentenceDetectorFactory, TrainingParameters)}
  *             and pass in a {@link SentenceDetectorFactory}.
  */
 @Deprecated
 public static SentenceModel train(
   String languageCode,
   ObjectStream<SentenceSample> samples,
   boolean useTokenEnd,
   Dictionary abbreviations) throws IOException {
  return train(
    languageCode,
    samples,
    useTokenEnd,
    abbreviations,
    ModelUtil.createDefaultTrainingParameters());
 }
}

/**
 * Trains a sentence model from explicit settings instead of a factory.
 *
 * <p>Wraps {@code languageCode}, {@code useTokenEnd} and {@code abbreviations} in a new
 * {@link SentenceDetectorFactory} (its fourth constructor argument is left {@code null})
 * and delegates to the factory-based {@code train} overload.
 *
 * @param languageCode passed to the factory and to the delegate overload
 * @param samples the training samples, forwarded unchanged
 * @param useTokenEnd passed to the factory
 * @param abbreviations passed to the factory
 * @param mlParams the training parameters, forwarded unchanged
 * @return the model returned by the factory-based overload
 * @throws IOException propagated from the factory-based overload
 * @deprecated Use
 *             {@link #train(String, ObjectStream, SentenceDetectorFactory, TrainingParameters)}
 *             and pass in a {@link SentenceDetectorFactory}.
 */
@Deprecated
public static SentenceModel train(String languageCode,
  ObjectStream<SentenceSample> samples, boolean useTokenEnd,
  Dictionary abbreviations, TrainingParameters mlParams) throws IOException {
 SentenceDetectorFactory sdFactory = new SentenceDetectorFactory(
   languageCode, useTokenEnd, abbreviations, null);
 return train(languageCode, samples, sdFactory, mlParams);
}

 SentenceDetectorFactory sdFactory = SentenceDetectorFactory.create(
   params.getFactory(), params.getLang(), true, dict, eos);
 model = SentenceDetectorME.train(params.getLang(), sampleStream,
   sdFactory, mlParams);
} catch (IOException e) {

/**
 * Trains an English ("en") sentence model from a plain-text corpus read as UTF-8.
 *
 * <p>Training starts from {@code TrainingParameters.defaultParams()} and overrides the
 * iteration count and cutoff with the values supplied by the caller. The sample stream
 * is always closed before returning, whether training succeeds or fails.
 *
 * @param corpus the corpus to read, wrapped in a line stream and then a sample stream
 * @param iterations value stored under {@code TrainingParameters.ITERATIONS_PARAM}
 * @param cut value stored under {@code TrainingParameters.CUTOFF_PARAM}
 * @return the model returned by {@code SentenceDetectorME.train}
 * @throws IOException propagated from training or from closing the sample stream
 */
private static SentenceModel train(InputStream corpus, int iterations, int cut) throws IOException
{
  ObjectStream<String> lineStream = new PlainTextByLineStream(corpus, Charset.forName("UTF-8"));
  ObjectStream<SentenceSample> sampleStream = new SentenceSampleStream(lineStream);

  // Honor the caller's settings; previously both arguments were silently ignored.
  // Values are stored as strings, the form accepted by put(String, String).
  TrainingParameters mlParams = TrainingParameters.defaultParams();
  mlParams.put(TrainingParameters.ITERATIONS_PARAM, Integer.toString(iterations));
  mlParams.put(TrainingParameters.CUTOFF_PARAM, Integer.toString(cut));

  try
  {
    // useTokenEnd = true, no abbreviation dictionary (null).
    return SentenceDetectorME.train("en", sampleStream, true, null, mlParams);
  } finally
  {
    sampleStream.close();
  }
}

SentenceModel sentenceModel = SentenceDetectorME.train(language, samples,
   sdFactory, mlParams);

SentenceDetectorFactory factory = new SentenceDetectorFactory(language, true,
    abbreviationDictionary, eosCharacters);
return SentenceDetectorME.train(language, stream, factory, params);

 mod = SentenceDetectorME.train("en", sampleStream, true, dict, mlParams);
} finally {
  sampleStream.close();

 mod = SentenceDetectorME.train("en", sampleStream, sdFactory, mlParams);
} finally {
  sampleStream.close();

/**
 * Runs the cross validation.
 *
 * <p>The samples are split by a {@link CrossValidationPartitioner}. For each partition a
 * model is trained on the training stream, evaluated against that partition's test
 * stream, and the resulting F-measure is merged into this object's {@code fmeasure}.
 *
 * @param samples
 *          the data to train and test
 * @param nFolds
 *          number of folds
 *
 * @throws IOException
 *           propagated from partitioning, training or evaluation
 */
public void evaluate(ObjectStream<SentenceSample> samples, int nFolds) throws IOException {
 CrossValidationPartitioner<SentenceSample> folds =
   new CrossValidationPartitioner<>(samples, nFolds);

 while (folds.hasNext()) {
  CrossValidationPartitioner.TrainingSampleStream<SentenceSample> trainingFold = folds.next();

  // Train on the training portion of this fold.
  SentenceModel foldModel =
    SentenceDetectorME.train(languageCode, trainingFold, sdFactory, params);

  // Evaluate on the held-out portion and fold the score into the running total.
  SentenceDetectorME detector = new SentenceDetectorME(foldModel);
  SentenceDetectorEvaluator foldEvaluator = new SentenceDetectorEvaluator(detector, listeners);
  foldEvaluator.evaluate(trainingFold.getTestSampleStream());
  fmeasure.mergeInto(foldEvaluator.getFMeasure());
 }
}

/**
 * Runs the cross validation.
 *
 * <p>The samples are split by a {@link CrossValidationPartitioner}. For each partition a
 * model is trained on the training stream, evaluated against that partition's test
 * stream, and the resulting F-measure is merged into this object's {@code fmeasure}.
 *
 * @param samples
 *          the data to train and test
 * @param nFolds
 *          number of folds
 *
 * @throws IOException
 *           propagated from partitioning, training or evaluation
 */
public void evaluate(ObjectStream<SentenceSample> samples, int nFolds) throws IOException {
 CrossValidationPartitioner<SentenceSample> folds =
   new CrossValidationPartitioner<>(samples, nFolds);

 while (folds.hasNext()) {
  CrossValidationPartitioner.TrainingSampleStream<SentenceSample> trainingFold = folds.next();

  // Train on the training portion of this fold.
  SentenceModel foldModel =
    SentenceDetectorME.train(languageCode, trainingFold, sdFactory, params);

  // Evaluate on the held-out portion and fold the score into the running total.
  SentenceDetectorME detector = new SentenceDetectorME(foldModel);
  SentenceDetectorEvaluator foldEvaluator = new SentenceDetectorEvaluator(detector, listeners);
  foldEvaluator.evaluate(trainingFold.getTestSampleStream());
  fmeasure.mergeInto(foldEvaluator.getFMeasure());
 }
}

SentenceModel sentdetectModel = SentenceDetectorME.train(
  "eng", new SentenceSampleStream(new PlainTextByLineStream(in,
    StandardCharsets.UTF_8)), factory, mlParams);

 SentenceDetectorFactory sdFactory = SentenceDetectorFactory.create(
   params.getFactory(), params.getLang(), true, dict, eos);
 model = SentenceDetectorME.train(params.getLang(), sampleStream,
   sdFactory, mlParams);
} catch (IOException e) {

 SentenceDetectorFactory sdFactory = SentenceDetectorFactory.create(
   params.getFactory(), params.getLang(), true, dict, eos);
 model = SentenceDetectorME.train(params.getLang(), sampleStream,
   sdFactory, mlParams);
} catch (IOException e) {

Popular methods of SentenceDetectorME

<init>
sentPosDetect
Detect the position of the first words of sentences in a String.
sentDetect
Detect sentences in a String.
getAbbreviations
getFirstNonWS
getFirstWS
getSentenceProbabilities
Returns the probabilities associated with the most recent calls to sentDetect().
isAcceptableBreak
Allows subclasses to check an overzealous (read: poorly trained) model from flagging obvious non-bre

Popular in Java

Reading from database using SQL prepared statement
findViewById (Activity)
startActivity (Activity)
getApplicationContext (Context)
Pointer (com.sun.jna)
An abstraction for a native pointer data type. A Pointer instance represents, on the Java side, a na
BufferedInputStream (java.io)
A BufferedInputStream adds functionality to another input stream-namely, the ability to buffer the i
ServerSocket (java.net)
This class represents a server-side socket that waits for incoming client connections. A ServerSocke
Hashtable (java.util)
A plug-in replacement for JDK1.5 java.util.Hashtable. This version is based on org.cliffc.high_scale
Rectangle (java.awt)
A Rectangle specifies an area in a coordinate space that is enclosed by the Rectangle object's top-
Annotation (javassist.bytecode.annotation)
The annotation structure. An instance of this class is returned by getAnnotations() in AnnotationsAttr
Top plugins for Android Studio

How to use the train method in opennlp.tools.sentdetect.SentenceDetectorME

Best Java code snippets using opennlp.tools.sentdetect.SentenceDetectorME.train (Showing top 20 results out of 315)

How to use
train
method
in
opennlp.tools.sentdetect.SentenceDetectorME