Tabnine Logo
DocumentMetaData
Code Index | Add Tabnine to your IDE (free)

How to use
DocumentMetaData
in
de.tudarmstadt.ukp.teaching.uima.lesson1.type

Best Java code snippets using de.tudarmstadt.ukp.teaching.uima.lesson1.type.DocumentMetaData (Showing top 8 results out of 315)

origin: de.tudarmstadt.ukp.teaching.uima/de.tudarmstadt.ukp.teaching.uima.lesson1

/**
 * Creates a DocumentMetaData in the given JCas, sets its begin and end
 * offsets, and then runs {@code readObject()}.
 *
 * @param jcas  the JCas handed on to the superclass constructor
 * @param begin value passed to {@code setBegin}
 * @param end   value passed to {@code setEnd}
 * @generated
 */
public DocumentMetaData(JCas jcas, int begin, int end) {
 super(jcas);
 setBegin(begin);
 setEnd(end);
 // Runs last, after both offsets have been set.
 readObject();
}
origin: de.tudarmstadt.ukp.teaching.uima/de.tudarmstadt.ukp.teaching.uima.lesson1

/**
 * Loads the next file from the {@code files} queue into the given CAS.
 *
 * <p>The file content becomes the document text, the configured
 * {@code language} becomes the document language, and a
 * {@link DocumentMetaData} annotation carrying the base URI (from
 * {@code path}) and the document URI (from the file) is added to the
 * indexes.
 *
 * @param aJCas the CAS to populate
 * @throws IOException declared for failures while reading the file
 * @throws CollectionException declared by the overridden method
 */
@Override
public void getNext(JCas aJCas) throws IOException, CollectionException {
  final File nextFile = files.poll();

  // Document text and language go directly onto the CAS.
  final String content = readFileToString(nextFile);
  aJCas.setDocumentText(content);
  aJCas.setDocumentLanguage(language);

  // Record where the document came from.
  final DocumentMetaData metaData = new DocumentMetaData(aJCas);
  final String baseUri = path.toURI().toString();
  metaData.setDocumentBaseUri(baseUri);
  final String documentUri = nextFile.toURI().toString();
  metaData.setDocumentUri(documentUri);
  metaData.addToIndexes();
}
origin: de.tudarmstadt.ukp.teaching.uima/de.tudarmstadt.ukp.teaching.uima.lesson2

/**
 * Turns the CAS into a Lucene {@code Document} and adds it to the index
 * through {@code writer}.
 *
 * <p>The document carries the metadata fields {@code documentUri},
 * {@code documentBaseUri} and {@code language}, a {@code token} field built
 * from all {@code Token} annotations, and, when {@code storeText} is set,
 * the stored but unindexed document text.
 *
 * @param aJCas the CAS to index
 * @throws AnalysisEngineProcessException wrapping any {@link IOException}
 *         raised while adding the document
 */
@Override
public void process(JCas aJCas) throws AnalysisEngineProcessException
{
  final DocumentMetaData metaData =
      iterate(aJCas, DocumentMetaData.class).iterator().next();

  final Document luceneDoc = new Document();

  // Metadata: indexed (searchable) but not tokenized into words.
  luceneDoc.add(storedKeyword("documentUri", metaData.getDocumentUri()));
  luceneDoc.add(storedKeyword("documentBaseUri", metaData.getDocumentBaseUri()));
  luceneDoc.add(storedKeyword("language", aJCas.getDocumentLanguage()));

  // All tokens go into the index without any further processing.
  final Field tokenField = new Field(
      "token",
      AnnotationStream.create(iterate(aJCas, Token.class)),
      TermVector.YES);
  luceneDoc.add(tokenField);

  // Optional: keep the raw text retrievable, but not searchable.
  if (storeText) {
    final Field textField =
        new Field("text", aJCas.getDocumentText(), Store.YES, Index.NO);
    luceneDoc.add(textField);
  }

  try {
    writer.addDocument(luceneDoc);
  }
  catch (IOException cause) {
    throw new AnalysisEngineProcessException(cause);
  }
}

/** Builds a stored field that is indexed as-is ({@code Index.NOT_ANALYZED}). */
private static Field storedKeyword(String fieldName, String fieldValue)
{
  return new Field(fieldName, fieldValue, Store.YES, Index.NOT_ANALYZED);
}
origin: de.tudarmstadt.ukp.teaching.uima/de.tudarmstadt.ukp.teaching.uima.lesson1

  /**
   * Prints the CAS to standard output in three sections: metadata
   * (document URI and language), the document text, and one line per
   * {@code Annotation} in the form {@code typeName(begin,end) [coveredText]}.
   *
   * @param aJCas the CAS to print
   * @throws AnalysisEngineProcessException declared by the overridden method
   */
  @Override
  public void process(JCas aJCas) throws AnalysisEngineProcessException {
    final DocumentMetaData metaData =
        iterate(aJCas, DocumentMetaData.class).iterator().next();

    // Section 1: metadata
    System.out.println("=== METADATA ========================================");
    System.out.println("URI     : " + metaData.getDocumentUri());
    System.out.println("Language: " + aJCas.getDocumentLanguage());

    // Section 2: raw document text
    System.out.println("=== TEXT ============================================");
    System.out.println(aJCas.getDocumentText());

    // Section 3: every annotation with its offsets and covered text
    System.out.println("=== ANNOTATIONS =====================================");
    for (Annotation annotation : iterate(aJCas, Annotation.class)) {
      final StringBuilder line = new StringBuilder();
      line.append(annotation.getType().getName());
      line.append("(").append(annotation.getBegin());
      line.append(",").append(annotation.getEnd());
      line.append(") [").append(annotation.getCoveredText()).append("]");
      System.out.println(line.toString());
    }
  }
}
origin: de.tudarmstadt.ukp.teaching.uima/de.tudarmstadt.ukp.teaching.uima.lesson1

/**
 * Creates a DocumentMetaData in the given JCas and then runs
 * {@code readObject()}.
 *
 * @param jcas the JCas handed on to the superclass constructor
 * @generated
 */
public DocumentMetaData(JCas jcas) {
 super(jcas);
 readObject();
}
origin: de.tudarmstadt.ukp.teaching.uima/de.tudarmstadt.ukp.teaching.uima.lesson1

 /**
  * Produces the {@code DocumentMetaData} object for the feature structure at
  * {@code addr}.
  *
  * <p>When {@code useExistingInstance} is set, the instance already
  * registered in the JCas for that address is returned; if there is none, a
  * new one is created and registered first. Otherwise a fresh instance is
  * created on every call.
  *
  * @param addr address of the feature structure
  * @param cas  not used by this implementation
  * @return the existing or newly created feature structure object
  */
 public FeatureStructure createFS(int addr, CASImpl cas) {
   // No instance reuse requested: always hand out a new object.
   if (!DocumentMetaData_Type.this.useExistingInstance) {
     return new DocumentMetaData(addr, DocumentMetaData_Type.this);
   }

   // Reuse the object already registered for this address, if any.
   FeatureStructure existing = DocumentMetaData_Type.this.jcas.getJfsFromCaddr(addr);
   if (existing != null) {
     return existing;
   }

   final FeatureStructure created = new DocumentMetaData(addr, DocumentMetaData_Type.this);
   DocumentMetaData_Type.this.jcas.putJfsFromCaddr(addr, created);
   return created;
 }
};
origin: de.tudarmstadt.ukp.teaching.uima/de.tudarmstadt.ukp.teaching.uima.lesson1

  /**
   * Reads every document produced by a {@code TextFileReader} over
   * {@code src/test/resources/textfiles} and checks that each document whose
   * URI ends with a key of {@code testFileContent} carries the expected text.
   * Finally asserts that the number of matches equals the number of expected
   * files.
   */
  @Test
  public void test() throws Exception
  {
    final CollectionReader reader = CollectionReaderFactory.createCollectionReader(
        TextFileReader.class,
        createTypeSystemDescription(),
        TextFileReader.PARAM_PATH, "src/test/resources/textfiles",
        TextFileReader.PARAM_LANGUAGE, "Latin");
    final CAS cas = CasCreationUtils.createCas(reader.getProcessingResourceMetaData());

    int matched = 0;
    while (reader.hasNext()) {
      reader.getNext(cas);
      final DocumentMetaData metaData =
          iterate(cas.getJCas(), DocumentMetaData.class).iterator().next();

      for (Entry<String, String> expected : testFileContent.entrySet()) {
        // Skip expectations that belong to a different file.
        if (!metaData.getDocumentUri().endsWith(expected.getKey())) {
          continue;
        }
        assertEquals(expected.getValue(), cas.getDocumentText());
        matched++;
      }

      // The same CAS is reused for the next document.
      cas.reset();
    }

    assertEquals(testFileContent.size(), matched);
  }
}
origin: de.tudarmstadt.ukp.teaching.uima/de.tudarmstadt.ukp.teaching.uima.lesson1

/**
 * Internal - constructor used by generator.
 * Passes the address and type on to the superclass constructor and then
 * runs {@code readObject()}.
 *
 * @param addr address handed on to the superclass constructor
 * @param type type object handed on to the superclass constructor
 * @generated
 */
public DocumentMetaData(int addr, TOP_Type type) {
 super(addr, type);
 readObject();
}

de.tudarmstadt.ukp.teaching.uima.lesson1.type.DocumentMetaData

Javadoc

Updated by JCasGen Mon Oct 18 10:52:32 CEST 2010 XML source: /Users/bluefire/UKP/Workspaces/dkpro-primary/uimapraktikum/lesson1/src/main/resources/desc/type/DocumentMetaData.xml

Most used methods

  • getDocumentUri
    getter for documentUri - gets
  • <init>
  • addToIndexes
  • getDocumentBaseUri
    getter for documentBaseUri - gets
  • readObject
    Write your own initialization here
  • setBegin
  • setDocumentBaseUri
    setter for documentBaseUri - sets
  • setDocumentUri
    setter for documentUri - sets
  • setEnd

Popular in Java

  • Finding current android device location
  • runOnUiThread (Activity)
  • getSystemService (Context)
  • getApplicationContext (Context)
  • GridLayout (java.awt)
    The GridLayout class is a layout manager that lays out a container's components in a rectangular gri
  • EOFException (java.io)
    Thrown when a program encounters the end of a file or stream during an input operation.
  • JComboBox (javax.swing)
  • Options (org.apache.commons.cli)
    Main entry-point into the library. Options represents a collection of Option objects, which describ
  • LogFactory (org.apache.commons.logging)
    Factory for creating Log instances, with discovery and configuration features similar to that employ
  • Reflections (org.reflections)
    Reflections one-stop-shop object. Reflections scans your classpath, indexes the metadata, allows you t
  • Best plugins for Eclipse
Tabnine Logo
  • Products

    Search for Java code | Search for JavaScript code
  • IDE Plugins

    IntelliJ IDEA | WebStorm | Visual Studio | Android Studio | Eclipse | Visual Studio Code | PyCharm | Sublime Text | PhpStorm | Vim | GoLand | RubyMine | Emacs | Jupyter Notebook | Jupyter Lab | Rider | DataGrip | AppCode
  • Company

    About Us | Contact Us | Careers
  • Resources

    FAQ | Blog | Tabnine Academy | Terms of use | Privacy policy | Java Code Index | Javascript Code Index
Get Tabnine for your IDE now