cc.mallet.extract.BIOTokenizationFilter.<init> java code examples

/**
 * Convenience constructor: forwards its six arguments, in order, to the
 * seven-argument constructor and supplies a newly created
 * {@link BIOTokenizationFilter} as the seventh argument.
 *
 * @param name       forwarded unchanged
 * @param dict       forwarded unchanged
 * @param input      forwarded unchanged
 * @param predicted  forwarded unchanged
 * @param target     forwarded unchanged
 * @param background forwarded unchanged
 */
public DocumentExtraction (String name, LabelAlphabet dict, Tokenization input, Sequence predicted,
              Sequence target, String background)
{
 // Default the filter argument to a fresh BIOTokenizationFilter.
 this (name, dict, input, predicted, target, background, new BIOTokenizationFilter ());
}

/**
 * Creates an extractor by storing the three arguments in the fields of the
 * same name and initialising {@code filter} to a new
 * {@link BIOTokenizationFilter}.
 *
 * @param acrf        stored in {@code this.acrf}
 * @param tokPipe     stored in {@code this.tokPipe}
 * @param featurePipe stored in {@code this.featurePipe}
 */
public ACRFExtractor (ACRF acrf, Pipe tokPipe, Pipe featurePipe)
{
 this.acrf = acrf;
 this.tokPipe = tokPipe;
 this.featurePipe = featurePipe;
 // No filter parameter on this constructor; a BIO filter is always used here.
 this.filter = new BIOTokenizationFilter ();
}

/**
 * Builds an extractor from an ACRF and two pipes. Each argument is assigned
 * to the identically named field; the {@code filter} field is set to a
 * freshly constructed {@link BIOTokenizationFilter}.
 *
 * @param acrf        assigned to {@code this.acrf}
 * @param tokPipe     assigned to {@code this.tokPipe}
 * @param featurePipe assigned to {@code this.featurePipe}
 */
public ACRFExtractor (ACRF acrf, Pipe tokPipe, Pipe featurePipe)
{
 this.acrf = acrf;
 this.tokPipe = tokPipe;
 this.featurePipe = featurePipe;
 // The filter is not caller-supplied in this constructor.
 this.filter = new BIOTokenizationFilter ();
}

/**
 * Six-argument overload that delegates to the seven-argument constructor,
 * passing every argument through as-is and adding a new
 * {@link BIOTokenizationFilter} as the last argument.
 *
 * @param name       passed through to the delegate constructor
 * @param dict       passed through to the delegate constructor
 * @param input      passed through to the delegate constructor
 * @param predicted  passed through to the delegate constructor
 * @param target     passed through to the delegate constructor
 * @param background passed through to the delegate constructor
 */
public DocumentExtraction (String name, LabelAlphabet dict, Tokenization input, Sequence predicted,
              Sequence target, String background)
{
 // The only value added here is the default filter instance.
 this (name, dict, input, predicted, target, background, new BIOTokenizationFilter ());
}

/**
 * Five-argument overload without a target sequence. Delegates to the
 * seven-argument constructor, passing {@code null} as the fifth argument and
 * a new {@link BIOTokenizationFilter} as the seventh.
 *
 * @param name       forwarded unchanged
 * @param dict       forwarded unchanged
 * @param input      forwarded unchanged
 * @param predicted  forwarded unchanged
 * @param background forwarded unchanged
 */
public DocumentExtraction (String name, LabelAlphabet dict, Tokenization input, Sequence predicted, String background)
{
 // null fills the slot between predicted and background (the target position
 // in the six-argument overload).
 this (name, dict, input, predicted, null, background, new BIOTokenizationFilter ());
}

/**
 * Initialises the extractor's {@code acrf}, {@code tokPipe} and
 * {@code featurePipe} fields from the arguments, and sets {@code filter} to
 * a new {@link BIOTokenizationFilter}.
 *
 * @param acrf        value for the {@code acrf} field
 * @param tokPipe     value for the {@code tokPipe} field
 * @param featurePipe value for the {@code featurePipe} field
 */
public ACRFExtractor (ACRF acrf, Pipe tokPipe, Pipe featurePipe)
{
 this.acrf = acrf;
 this.tokPipe = tokPipe;
 this.featurePipe = featurePipe;
 // Filter defaults to BIO; this constructor offers no way to override it.
 this.filter = new BIOTokenizationFilter ();
}

/**
 * Delegating constructor. Calls the seven-argument constructor with the six
 * supplied arguments followed by a newly instantiated
 * {@link BIOTokenizationFilter}.
 *
 * @param name       first argument of the delegate call
 * @param dict       second argument of the delegate call
 * @param input      third argument of the delegate call
 * @param predicted  fourth argument of the delegate call
 * @param target     fifth argument of the delegate call
 * @param background sixth argument of the delegate call
 */
public DocumentExtraction (String name, LabelAlphabet dict, Tokenization input, Sequence predicted,
              Sequence target, String background)
{
 // Seventh argument: default filter.
 this (name, dict, input, predicted, target, background, new BIOTokenizationFilter ());
}

/**
 * Two-argument convenience constructor: delegates to the three-argument
 * constructor with a new {@link BIOTokenizationFilter} as the third argument.
 *
 * @param crf     forwarded unchanged
 * @param tokpipe forwarded unchanged
 */
public CRFExtractor (CRF crf, Pipe tokpipe) {
 // Supply the default filter on the caller's behalf.
 this (crf, tokpipe, new BIOTokenizationFilter ());
}

/**
 * Overload that takes no target sequence. Forwards to the seven-argument
 * constructor with {@code null} in the fifth position and a freshly created
 * {@link BIOTokenizationFilter} in the seventh.
 *
 * @param name       passed through to the delegate constructor
 * @param dict       passed through to the delegate constructor
 * @param input      passed through to the delegate constructor
 * @param predicted  passed through to the delegate constructor
 * @param background passed through to the delegate constructor
 */
public DocumentExtraction (String name, LabelAlphabet dict, Tokenization input, Sequence predicted, String background)
{
 // The fifth argument is explicitly null: this overload has nothing to pass there.
 this (name, dict, input, predicted, null, background, new BIOTokenizationFilter ());
}

/**
 * Delegating constructor for callers that supply only a predicted sequence.
 * Invokes the seven-argument constructor with {@code null} as its fifth
 * argument and a new {@link BIOTokenizationFilter} as its last.
 *
 * @param name       first argument of the delegate call
 * @param dict       second argument of the delegate call
 * @param input      third argument of the delegate call
 * @param predicted  fourth argument of the delegate call
 * @param background sixth argument of the delegate call
 */
public DocumentExtraction (String name, LabelAlphabet dict, Tokenization input, Sequence predicted, String background)
{
 // null stands in for the argument this overload does not accept.
 this (name, dict, input, predicted, null, background, new BIOTokenizationFilter ());
}

/**
 * Creates an extractor from a CRF and a tokenization pipe by delegating to
 * the three-argument constructor, adding a new {@link BIOTokenizationFilter}
 * as the final argument.
 *
 * @param crf     passed through to the delegate constructor
 * @param tokpipe passed through to the delegate constructor
 */
public CRFExtractor (CRF crf, Pipe tokpipe) {
 // Third argument defaults to a fresh BIO filter.
 this (crf, tokpipe, new BIOTokenizationFilter ());
}

/**
 * Shorthand constructor. Equivalent to calling the three-argument constructor
 * with {@code crf}, {@code tokpipe} and a newly constructed
 * {@link BIOTokenizationFilter}.
 *
 * @param crf     first argument of the delegate call
 * @param tokpipe second argument of the delegate call
 */
public CRFExtractor (CRF crf, Pipe tokpipe) {
 // A new filter instance is created per extractor.
 this (crf, tokpipe, new BIOTokenizationFilter ());
}

/**
 * Custom deserialization hook. Reads the default serialized fields, then an
 * int version tag, and fills in fields that the stream may not have provided.
 *
 * @param in stream to read this object's state from
 * @throws IOException            if reading from the stream fails
 * @throws ClassNotFoundException if a serialized class cannot be resolved
 */
private void readObject (ObjectInputStream in) throws IOException, ClassNotFoundException
{
 in.defaultReadObject ();
 final int serialVersion = in.readInt ();

 // Fall back to the CRF's own input pipe when the stream is tagged version 0
 // or left featurePipe unset.
 final boolean featurePipeMissing = (featurePipe == null) || (serialVersion == 0);
 if (featurePipeMissing) {
  featurePipe = (Pipe) crf.getInputPipe ();
 }

 // Versions 0 and 1 get a default BIO filter.
 // NOTE(review): presumably those versions did not serialize a filter — confirm against writeObject.
 if (serialVersion <= 1) {
  filter = new BIOTokenizationFilter ();
 }
}

/**
 * Restores this object from a serialization stream: default fields first,
 * then a version int that decides which fields need a fallback value.
 *
 * @param in stream positioned at this object's serialized state
 * @throws IOException            if the stream cannot be read
 * @throws ClassNotFoundException if a class in the stream cannot be found
 */
private void readObject (ObjectInputStream in) throws IOException, ClassNotFoundException
{
 in.defaultReadObject ();
 final int storedVersion = in.readInt ();

 // featurePipe is taken from the CRF when the stream did not supply one or
 // when the stream is tagged version 0.
 final boolean useCrfInputPipe = (featurePipe == null) || (storedVersion == 0);
 if (useCrfInputPipe) {
  featurePipe = (Pipe) crf.getInputPipe ();
 }

 // Any version below 2 has its filter replaced with a new BIO filter.
 // NOTE(review): looks like the filter field was introduced at version 2 — verify.
 final boolean useDefaultFilter = storedVersion <= 1;
 if (useDefaultFilter) {
  filter = new BIOTokenizationFilter ();
 }
}

/**
 * Deserialization callback. After the default field read, consumes one int
 * (the version tag) and applies version-dependent defaults to
 * {@code featurePipe} and {@code filter}.
 *
 * @param in source stream
 * @throws IOException            on a read failure
 * @throws ClassNotFoundException if a serialized class is unavailable
 */
private void readObject (ObjectInputStream in) throws IOException, ClassNotFoundException
{
 in.defaultReadObject ();
 final int formatVersion = in.readInt ();

 // Version 0, or a null featurePipe at any version: use the CRF's input pipe.
 if ((featurePipe == null) || (formatVersion == 0)) {
  featurePipe = (Pipe) crf.getInputPipe ();
 }

 // Versions before 2: install a fresh BIO filter.
 // NOTE(review): assumes the serialized filter is only trustworthy from version 2 on — confirm.
 if (formatVersion <= 1) {
  filter = new BIOTokenizationFilter ();
 }
}

 /**
  * Builds a nine-token document tagged with B-/I-/bare labels, wraps it in a
  * DocumentExtraction that uses a BIOTokenizationFilter, and checks the XML
  * string it produces against a fixed expected value.
  */
 public void testToXmlBIO () {
  final LabelAlphabet alphabet = new LabelAlphabet ();
  final String text = "the quick brown fox leapt over the lazy dog";
  final StringTokenization tokens = new StringTokenization (text, new CharSequenceLexer ());

  // Labels are looked up in a fixed order; keep it, since lookup populates the alphabet.
  final Label outside = alphabet.lookupLabel ("O");
  final Label animalBegin = alphabet.lookupLabel ("B-ANIMAL");
  final Label animalBare = alphabet.lookupLabel ("ANIMAL");
  final Label verbBegin = alphabet.lookupLabel ("B-VERB");
  final Label verbInside = alphabet.lookupLabel ("I-VERB");

  // One label per token of the document, in token order.
  final Label[] perToken = new Label[] {
    outside, animalBegin, animalBare, animalBegin, verbBegin, verbInside, outside, animalBare, animalBare
  };
  final LabelSequence tagSequence = new LabelSequence (perToken);

  final String expectedXml = "<?xml version=\"1.0\" encoding=\"UTF-8\"?>\r\n" +
      "<doc>the <ANIMAL>quick brown </ANIMAL><ANIMAL>fox </ANIMAL><VERB>leapt over </VERB>the <ANIMAL>lazy dog</ANIMAL></doc>\r\n";

  // No target sequence (null); "O" is passed as the background argument.
  final DocumentExtraction extraction =
      new DocumentExtraction ("Test", alphabet, tokens, tagSequence, null, "O", new BIOTokenizationFilter());
  assertEquals (expectedXml, extraction.toXmlString());
 }

 /**
  * Checks the XML rendering of a DocumentExtraction built with a
  * BIOTokenizationFilter: a fixed sentence and a fixed label sequence must
  * serialize to the exact expected XML string.
  */
 public void testToXmlBIO () {
  final LabelAlphabet labels = new LabelAlphabet ();
  final String sentence = "the quick brown fox leapt over the lazy dog";
  final StringTokenization tokenization = new StringTokenization (sentence, new CharSequenceLexer ());

  // Lookup order is preserved because each lookup may add an entry to the alphabet.
  final Label other = labels.lookupLabel ("O");
  final Label beginAnimal = labels.lookupLabel ("B-ANIMAL");
  final Label plainAnimal = labels.lookupLabel ("ANIMAL");
  final Label beginVerb = labels.lookupLabel ("B-VERB");
  final Label insideVerb = labels.lookupLabel ("I-VERB");

  // Tags for: the, quick, brown, fox, leapt, over, the, lazy, dog.
  final LabelSequence predicted = new LabelSequence (new Label[] {
    other,
    beginAnimal, plainAnimal,
    beginAnimal,
    beginVerb, insideVerb,
    other,
    plainAnimal, plainAnimal
  });

  final DocumentExtraction doc =
      new DocumentExtraction ("Test", labels, tokenization, predicted, null, "O", new BIOTokenizationFilter());
  final String producedXml = doc.toXmlString();

  final String wantedXml = "<?xml version=\"1.0\" encoding=\"UTF-8\"?>\r\n" +
      "<doc>the <ANIMAL>quick brown </ANIMAL><ANIMAL>fox </ANIMAL><VERB>leapt over </VERB>the <ANIMAL>lazy dog</ANIMAL></doc>\r\n";
  assertEquals (wantedXml, producedXml);
 }

Popular methods of BIOTokenizationFilter

Popular in Java

Start an intent from android
scheduleAtFixedRate (ScheduledExecutorService)
getApplicationContext (Context)
getSystemService (Context)
MessageFormat (java.text)
Produces concatenated messages in a language-neutral way. New code should probably use java.util.Forma
Collection (java.util)
Collection is the root of the collection hierarchy. It defines operations on data collections and t
Handler (java.util.logging)
A Handler object accepts a logging request and exports the desired messages to a target, for example
SAXParseException (org.xml.sax)
Encapsulate an XML parse error or warning. This module, both source code and documentation, is in t
Font (java.awt)
The Font class represents fonts, which are used to render text in a visible way. A font provides the
Window (java.awt)
A Window object is a top-level window with no borders and no menubar. The default layout for a windo
GitHub Copilot alternatives

How to use cc.mallet.extract.BIOTokenizationFilter constructor

Best Java code snippets using cc.mallet.extract.BIOTokenizationFilter.<init> (Showing top 17 results out of 315)

How to use
cc.mallet.extract.BIOTokenizationFilter
constructor