/**
 * Creates an {@link XMIReader} collection reader over the given files.
 *
 * <p>Each file is handed to the reader as its path string via
 * {@code XMIReader.PARAM_FILES}. The type system description is obtained from
 * {@code TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath()} called without
 * explicit descriptor paths.
 *
 * @param items the files the reader should process
 * @return the configured collection reader
 * @throws ResourceInitializationException if the reader cannot be created
 */
public static CollectionReader getCollectionReader(List<File> items)
        throws ResourceInitializationException {
    final String[] filePaths = new String[items.size()];
    int next = 0;
    for (File item : items) {
        filePaths[next++] = item.getPath();
    }
    return CollectionReaderFactory.createReader(
            XMIReader.class,
            TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath(),
            XMIReader.PARAM_FILES,
            filePaths);
}
/**
 * Builds a collection reader of type {@link XMIReader} for the supplied files.
 *
 * <p>The files are converted to an array of path strings and passed as
 * {@code XMIReader.PARAM_FILES}; the type system description comes from
 * {@code TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath()} invoked with no
 * arguments.
 *
 * @param items the files to read
 * @return a collection reader configured with the paths of {@code items}
 * @throws ResourceInitializationException if the reader cannot be created
 */
public static CollectionReader getCollectionReader(List<File> items)
        throws ResourceInitializationException {
    final String[] locations = new String[items.size()];
    int slot = 0;
    for (File source : items) {
        locations[slot] = source.getPath();
        slot++;
    }
    return CollectionReaderFactory.createReader(
            XMIReader.class,
            TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath(),
            XMIReader.PARAM_FILES,
            locations);
}
/**
 * Creates an {@link XMIReader} collection reader over the given files.
 *
 * <p>Each file is handed to the reader as its path string via
 * {@code XMIReader.PARAM_FILES}. The type system description is obtained from
 * {@code TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath()} called without
 * explicit descriptor paths.
 *
 * @param items the files the reader should process
 * @return the configured collection reader
 * @throws ResourceInitializationException if the reader cannot be created
 */
@Override
public CollectionReader getCollectionReader(List<File> items)
        throws ResourceInitializationException {
    final String[] filePaths = new String[items.size()];
    int next = 0;
    for (File item : items) {
        filePaths[next++] = item.getPath();
    }
    return CollectionReaderFactory.createReader(
            XMIReader.class,
            TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath(),
            XMIReader.PARAM_FILES,
            filePaths);
}
/**
 * Creates a new JCas whose type system is loaded from descriptor files. Type priorities and
 * indexes are not auto-detected.
 *
 * @param typeSystemDescriptorPaths
 *          paths to the type system descriptor files
 * @return the newly created JCas
 * @throws UIMAException
 *           if the JCas could not be initialized
 */
public static JCas createJCasFromPath(String... typeSystemDescriptorPaths)
        throws UIMAException {
    final JCas created =
            createJCas(createTypeSystemDescriptionFromPath(typeSystemDescriptorPaths));
    return created;
}
/**
 * Builds a collection reader of type {@link XMIReader} for the supplied files.
 *
 * <p>The files are converted to an array of path strings and passed as
 * {@code XMIReader.PARAM_FILES}; the type system description comes from
 * {@code TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath()} invoked with no
 * arguments.
 *
 * @param items the files to read
 * @return a collection reader configured with the paths of {@code items}
 * @throws ResourceInitializationException if the reader cannot be created
 */
@Override
public CollectionReader getCollectionReader(List<File> items)
        throws ResourceInitializationException {
    final String[] locations = new String[items.size()];
    int slot = 0;
    for (File source : items) {
        locations[slot] = source.getPath();
        slot++;
    }
    return CollectionReaderFactory.createReader(
            XMIReader.class,
            TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath(),
            XMIReader.PARAM_FILES,
            locations);
}
/**
 * Command-line entry point: collects the {@code .xmi} files of every configured data directory
 * and runs them through the pipeline returned by {@code getPipeline}.
 *
 * <p>{@code options.dataDirectories} is split on {@code ":"}; each entry is trimmed and treated
 * as a directory whose direct children ending in {@code ".xmi"} are read by an
 * {@link XMIReader}.
 *
 * @param args command-line arguments, parsed into {@code Options}
 * @throws CmdLineException if the arguments cannot be parsed
 * @throws UIMAException if the reader or pipeline cannot be created or run
 * @throws IOException if a data directory cannot be listed (it does not exist, is not a
 *         directory, or an I/O error occurs), or if the pipeline fails with an I/O error
 */
public static void main(String[] args) throws CmdLineException, UIMAException, IOException {
    Options options = new Options();
    CmdLineParser parser = new CmdLineParser(options);
    parser.parseArgument(args);

    List<File> paths = new ArrayList<>();
    for (String dataDirname : options.dataDirectories.split(":")) {
        File dataDir = new File(dataDirname.trim());
        File[] domainFiles = dataDir.listFiles(new java.io.FileFilter() {
            @Override
            public boolean accept(File pathname) {
                return pathname.getName().endsWith(".xmi");
            }
        });
        // listFiles signals "not a directory" or an I/O error with null rather than an empty
        // array; fail with a message naming the directory instead of a bare NPE.
        if (domainFiles == null) {
            throw new IOException(
                    "Cannot list data directory: " + dataDir.getAbsolutePath());
        }
        paths.addAll(Arrays.asList(domainFiles));
    }

    CollectionReaderDescription reader = CollectionReaderFactory.createReaderDescription(
            XMIReader.class,
            TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath(),
            XMIReader.PARAM_FILES,
            paths);

    AnalysisEngineDescription aed = getPipeline(options, options.dataDirectories);

    SimplePipeline.runPipeline(reader, aed);
}
/**
 * Initializes {@code typeSystemDescription} from the given descriptor names or paths and
 * resets {@code customTypes} to an empty set.
 *
 * <p>If at least one entry ends with {@code ".xml"}, all entries are passed to
 * {@code createTypeSystemDescriptionFromPath}, with the {@code ".xml"} entries first converted
 * to absolute paths. Otherwise the entries are passed to {@code createTypeSystemDescription}
 * as descriptor names. The caller's array is not modified.
 *
 * <p>Any exception is printed to standard error and terminates the JVM with exit status 1.
 *
 * @param descriptorNames type system descriptor names, or paths to descriptor XML files
 */
public void initTypeSystem(String... descriptorNames) {
    try {
        compiler.addClassPath();

        // Work on a copy so that a caller passing an explicit array does not see its
        // entries rewritten to absolute paths.
        String[] resolvedNames = descriptorNames.clone();
        boolean nameIsPath = false;
        for (int i = 0; i < resolvedNames.length; i++) {
            if (resolvedNames[i].endsWith(".xml")) {
                nameIsPath = true;
                resolvedNames[i] = new File(resolvedNames[i]).getAbsolutePath();
            }
        }

        if (nameIsPath) {
            typeSystemDescription =
                    TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath(resolvedNames);
        } else {
            typeSystemDescription =
                    TypeSystemDescriptionFactory.createTypeSystemDescription(resolvedNames);
        }

        // The created JCas is not used afterwards; the call is kept because it may throw.
        // NOTE(review): presumably this validates the type system up front - confirm.
        CasCreationUtils.createCas(typeSystemDescription, null, null).getJCas();

        customTypes = new HashSet<>();
    } catch (Exception e) {
        e.printStackTrace();
        System.exit(1);
    }
}
TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath(), XMIReader.PARAM_FILES, paths);
private TypeSystem createTypeSystem() throws IOException, UIMAException { TypeSystemDescription tsDesc = null; if (typeSystemDescPaths != null && typeSystemDescPaths.length > 0) { tsDesc = createTypeSystemDescriptionFromPath(typeSystemDescPaths); } if (typeSystemDescNames != null && typeSystemDescNames.length > 0) { TypeSystemDescription tsDescFromNames = createTypeSystemDescription( typeSystemDescNames); if (tsDesc != null) { tsDesc = mergeTypeSystems(asList(tsDesc, tsDescFromNames)); } else { tsDesc = tsDescFromNames; } } if (tsDesc == null) { throw new IllegalStateException( "Type system description paths or names were not specified!"); } CAS dumbCas = CasCreationUtils.createCas(tsDesc, null, null); TypeSystem typeSystem = dumbCas.getTypeSystem(); // printAllTypes(); return typeSystem; }
TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath(), XMIReader.PARAM_FILES, paths);
// Hand the command-line arguments to the parser, then load the type system description from
// the TypeSystem.xml descriptor.
// NOTE(review): the descriptor path is relative - presumably resolved against the process
// working directory; confirm before running from another location.
parser.parseArgument(args); TypeSystemDescription typeSystem = TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath("../../../ctakes-type-system/src/main/resources/org/apache/ctakes/typesystem/types/TypeSystem.xml");
// Hand the command-line arguments to the parser, then load the type system description from
// the TypeSystem.xml descriptor.
// NOTE(review): the descriptor path is relative - presumably resolved against the process
// working directory; confirm before running from another location.
parser.parseArgument(args); TypeSystemDescription typeSystem = TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath("../../../ctakes-type-system/src/main/resources/org/apache/ctakes/typesystem/types/TypeSystem.xml");
private void run() throws Exception { CpeBuilder cpeBuilder = new CpeBuilder(); cpeBuilder.setMaxProcessingUnitThreatCount(2); // make TypeSystemDesc TypeSystemDescription tsd = TypeSystemDescriptionFactory .createTypeSystemDescriptionFromPath(tsFile.toURI().toString()); // configure CollectionReader CollectionReaderDescription colReaderDesc = CollectionReaderFactory.createReaderDescription( BratCollectionReader.class, tsd, BratCollectionReader.PARAM_BRAT_COLLECTION_DIR, bratCorpusDir.getPath(), BratCollectionReader.PARAM_MAPPING_FACTORY_CLASS, AutoBratUimaMappingFactory.class.getName()); cpeBuilder.setReader(colReaderDesc); // configure AE AnalysisEngineDescription aeDesc = createEngineDescription(XmiWriter.class, XmiWriter.PARAM_OUTPUTDIR, outputDir.getPath()); cpeBuilder.addAnalysisEngine(aeDesc); CollectionProcessingEngine cpe = cpeBuilder.createCpe(); cpe.addStatusCallbackListener(new ReportingStatusCallbackListener(cpe)); cpe.process(); } }
/**
 * Creates a JCas for tests whose type system merges the description returned by
 * {@code createTypeSystemDescription()} with the types declared in
 * {@code webannoTestTypes.xml}, and whose document id is {@code "doc"}.
 *
 * @return the new JCas with document metadata attached
 * @throws UIMAException if the type systems cannot be merged or the JCas cannot be created
 */
private static JCas makeJCas() throws UIMAException {
    final TypeSystemDescription combined = CasCreationUtils.mergeTypeSystems(asList(
            TypeSystemDescriptionFactory.createTypeSystemDescription(),
            TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath(
                    "src/test/resources/desc/type/webannoTestTypes.xml")));

    final JCas result = JCasFactory.createJCas(combined);
    DocumentMetaData.create(result).setDocumentId("doc");
    return result;
}
TypeSystemDescription local; if (new File(referenceFolder, "typesystem.xml").exists()) { local = TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath( new File(referenceFolder, "typesystem.xml").toString()); local = TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath( "src/test/resources/desc/type/webannoTestTypes.xml");
// Obtain the type system description from the factory; no explicit descriptor paths are passed.
TypeSystemDescription typeSystemDescription = TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath();
// Obtain the type system description from the factory; no explicit descriptor paths are passed.
TypeSystemDescription typeSystemDescription = TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath();
/**
 * Creates a test JCas with document id {@code "doc"} and lets a {@link TokenBuilder} build
 * tokens and sentences from the text {@code "This is a test ."}.
 *
 * <p>The type system merges the description returned by {@code createTypeSystemDescription()}
 * with the types declared in {@code webannoTestTypes.xml}.
 *
 * @return the populated JCas
 * @throws UIMAException if the type systems cannot be merged or the JCas cannot be created
 */
private JCas makeJCasOneSentence() throws UIMAException {
    final TypeSystemDescription combined = CasCreationUtils.mergeTypeSystems(asList(
            TypeSystemDescriptionFactory.createTypeSystemDescription(),
            TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath(
                    "src/test/resources/desc/types/webannoTestTypes.xml")));

    final JCas result = JCasFactory.createJCas(combined);
    DocumentMetaData.create(result).setDocumentId("doc");

    final TokenBuilder<Token, Sentence> tokenBuilder =
            new TokenBuilder<>(Token.class, Sentence.class);
    tokenBuilder.buildTokens(result, "This is a test .");

    return result;
}
}
private JCas makeJCasOneSentence(String aText) throws UIMAException { TypeSystemDescription global = TypeSystemDescriptionFactory.createTypeSystemDescription(); TypeSystemDescription local = TypeSystemDescriptionFactory .createTypeSystemDescriptionFromPath( "src/test/resources/desc/type/webannoTestTypes.xml"); TypeSystemDescription merged = CasCreationUtils.mergeTypeSystems(asList(global, local)); JCas jcas = JCasFactory.createJCas(merged); DocumentMetaData.create(jcas).setDocumentId("doc"); TokenBuilder<Token, Sentence> tb = new TokenBuilder<>(Token.class, Sentence.class); tb.buildTokens(jcas, aText); // Remove the sentences generated by the token builder which treats the line break as a // sentence break for (Sentence s : select(jcas, Sentence.class)) { s.removeFromIndexes(); } // Add a new sentence covering the whole text new Sentence(jcas, 0, jcas.getDocumentText().length()).addToIndexes(); return jcas; } }
/**
 * Checks {@code writeAndAssertEquals} on a document consisting of two sentences, each made of
 * a single token, with no whitespace between them ({@code "one"} directly followed by
 * {@code "two"}).
 *
 * @throws Exception if the JCas cannot be set up or the check fails with an exception
 */
@Test
public void testTwoSentencesWithNoSpaceInBetween() throws Exception {
    final TypeSystemDescription combined = CasCreationUtils.mergeTypeSystems(asList(
            TypeSystemDescriptionFactory.createTypeSystemDescription(),
            TypeSystemDescriptionFactory.createTypeSystemDescriptionFromPath(
                    "src/test/resources/desc/type/webannoTestTypes.xml")));

    final JCas document = JCasFactory.createJCas(combined);
    DocumentMetaData.create(document).setDocumentId("doc");
    document.setDocumentText("onetwo");

    // First token/sentence covers "one".
    final Token firstToken = new Token(document, 0, 3);
    firstToken.addToIndexes();
    final Sentence firstSentence = new Sentence(document, 0, 3);
    firstSentence.addToIndexes();

    // Second token/sentence covers "two" and starts where the first one ends.
    final Token secondToken = new Token(document, 3, 6);
    secondToken.addToIndexes();
    final Sentence secondSentence = new Sentence(document, 3, 6);
    secondSentence.addToIndexes();

    writeAndAssertEquals(document);
}