public void printRank (PrintWriter pw) throws FileNotFoundException { // xxx Fix this. /*System.out.print (classifier.getClass().getName() + "(."); System.out.print (") = ["); for (int i = 0; i < labeling.numLocations(); i++) System.out.print (labeling.labelAtLocation(i).toString()+"="+labeling.valueAtLocation(i)+" "); System.out.println ("]");*/ pw.print(classifier.getClass().getName()); pw.print(" "); pw.print(instance.getSource() + " "); LabelVector lv = labeling.toLabelVector(); lv.printByRank(pw); pw.println (); }
public void printRank (PrintWriter pw) throws FileNotFoundException { // xxx Fix this. /*System.out.print (classifier.getClass().getName() + "(."); System.out.print (") = ["); for (int i = 0; i < labeling.numLocations(); i++) System.out.print (labeling.labelAtLocation(i).toString()+"="+labeling.valueAtLocation(i)+" "); System.out.println ("]");*/ pw.print(classifier.getClass().getName()); pw.print(" "); pw.print(instance.getSource() + " "); LabelVector lv = labeling.toLabelVector(); lv.printByRank(pw); pw.println (); }
public Instance pipe(Instance carrier) { StringBuffer sb = new StringBuffer(); String source = (String) carrier.getSource(); Sequence as = (Sequence) carrier.getTarget(); // int startLabelIndex = as.getAlphabet().lookupIndex("start"); for (int i = 0; i < source.length(); i++) { System.out.println("target[" + i + "]=" + as.get(i).toString()); if (as.get(i).toString().equals("start") && i != 0) sb.append(' '); sb.append(source.charAt(i)); } carrier.setSource(sb.toString()); System.out.println("carrier.getSource() = " + carrier.getSource()); return carrier; }
public void printRank (PrintWriter pw) throws FileNotFoundException { // xxx Fix this. /*System.out.print (classifier.getClass().getName() + "(."); System.out.print (") = ["); for (int i = 0; i < labeling.numLocations(); i++) System.out.print (labeling.labelAtLocation(i).toString()+"="+labeling.valueAtLocation(i)+" "); System.out.println ("]");*/ pw.print(classifier.getClass().getName()); pw.print(" "); pw.print(instance.getSource() + " "); LabelVector lv = labeling.toLabelVector(); lv.printByRank(pw); pw.println (); }
public Instance pipe(Instance carrier) { StringBuffer sb = new StringBuffer(); String source = (String) carrier.getSource(); Sequence as = (Sequence) carrier.getTarget(); // int startLabelIndex = as.getAlphabet().lookupIndex("start"); for (int i = 0; i < source.length(); i++) { System.out.println("target[" + i + "]=" + as.get(i).toString()); if (as.get(i).toString().equals("start") && i != 0) sb.append(' '); sb.append(source.charAt(i)); } carrier.setSource(sb.toString()); System.out.println("carrier.getSource() = " + carrier.getSource()); return carrier; }
public Instance pipe(Instance carrier) { StringBuffer sb = new StringBuffer(); String source = (String) carrier.getSource(); Sequence as = (Sequence) carrier.getTarget(); //int startLabelIndex = as.getAlphabet().lookupIndex("start"); for (int i = 0; i < source.length(); i++) { System.out.println("target[" + i + "]=" + as.get(i).toString()); if (as.get(i).toString().equals("start") && i != 0) sb.append(' '); sb.append(source.charAt(i)); } carrier.setSource(sb.toString()); System.out.println("carrier.getSource() = " + carrier.getSource()); return carrier; }
public Instance pipe(Instance carrier) { StringBuffer sb = new StringBuffer(); String source = (String) carrier.getSource(); Sequence as = (Sequence) carrier.getTarget(); //int startLabelIndex = as.getAlphabet().lookupIndex("start"); for (int i = 0; i < source.length(); i++) { System.out.println("target[" + i + "]=" + as.get(i).toString()); if (as.get(i).toString().equals("start") && i != 0) sb.append(' '); sb.append(source.charAt(i)); } carrier.setSource(sb.toString()); System.out.println("carrier.getSource() = " + carrier.getSource()); return carrier; }
public void print (PrintWriter pw) throws FileNotFoundException { // xxx Fix this. /*System.out.print (classifier.getClass().getName() + "(."); System.out.print (") = ["); for (int i = 0; i < labeling.numLocations(); i++) System.out.print (labeling.labelAtLocation(i).toString()+"="+labeling.valueAtLocation(i)+" "); System.out.println ("]");*/ pw.print(classifier.getClass().getName()); pw.print(" "); pw.print(instance.getSource() + " "); for (int i = 0; i < labeling.numLocations(); i++) pw.print (labeling.labelAtLocation(i).toString()+"="+labeling.valueAtLocation(i)+" "); pw.println (); }
public void print (PrintWriter pw) throws FileNotFoundException { // xxx Fix this. /*System.out.print (classifier.getClass().getName() + "(."); System.out.print (") = ["); for (int i = 0; i < labeling.numLocations(); i++) System.out.print (labeling.labelAtLocation(i).toString()+"="+labeling.valueAtLocation(i)+" "); System.out.println ("]");*/ pw.print(classifier.getClass().getName()); pw.print(" "); pw.print(instance.getSource() + " "); for (int i = 0; i < labeling.numLocations(); i++) pw.print (labeling.labelAtLocation(i).toString()+"="+labeling.valueAtLocation(i)+" "); pw.println (); }
public void print (PrintWriter pw) throws FileNotFoundException { // xxx Fix this. /*System.out.print (classifier.getClass().getName() + "(."); System.out.print (") = ["); for (int i = 0; i < labeling.numLocations(); i++) System.out.print (labeling.labelAtLocation(i).toString()+"="+labeling.valueAtLocation(i)+" "); System.out.println ("]");*/ pw.print(classifier.getClass().getName()); pw.print(" "); pw.print(instance.getSource() + " "); for (int i = 0; i < labeling.numLocations(); i++) pw.print (labeling.labelAtLocation(i).toString()+"="+labeling.valueAtLocation(i)+" "); pw.println (); }
/**
 * Returns the next per-element instance, pairing one element of the current
 * super-instance's data sequence with the matching element of its target
 * sequence.
 *
 * When the current data sub-iterator is exhausted, the next super-instance is
 * pulled from {@code superIterator}; its data is cast to
 * {@code FeatureVectorSequence} and its target to {@code LabelSequence}, and
 * fresh sub-iterators are taken from both.
 *
 * The returned instance is named with the super-instance's source followed by
 * {@code " tokensequence:"} and a running counter (incremented on each call),
 * and carries a {@code null} source.
 *
 * The preconditions are checked with {@code assert} only, so they are not
 * enforced when assertions are disabled.
 *
 * @return a new instance built from the next data/target pair
 */
public Instance next ()
{
    if (!dataSubiterator.hasNext()) {
        assert (superIterator.hasNext());
        superInstance = superIterator.next();
        dataSubiterator = ((FeatureVectorSequence)superInstance.getData()).iterator();
        targetSubiterator = ((LabelSequence)superInstance.getTarget()).iterator();
    }
    // We are assuming sequences don't have zero length
    assert (dataSubiterator.hasNext());
    assert (targetSubiterator.hasNext());
    return new Instance (dataSubiterator.next(), targetSubiterator.next(),
                         superInstance.getSource()+" tokensequence:"+count++, null);
}

public boolean hasNext () {
/**
 * Returns the next per-element instance, pairing one element of the current
 * super-instance's data sequence with the matching element of its target
 * sequence.
 *
 * When the current data sub-iterator is exhausted, the next super-instance is
 * pulled from {@code superIterator}; its data is cast to
 * {@code FeatureVectorSequence} and its target to {@code LabelSequence}, and
 * fresh sub-iterators are taken from both.
 *
 * The returned instance is named with the super-instance's source followed by
 * {@code " tokensequence:"} and a running counter (incremented on each call),
 * and carries a {@code null} source.
 *
 * The preconditions are checked with {@code assert} only, so they are not
 * enforced when assertions are disabled.
 *
 * @return a new instance built from the next data/target pair
 */
public Instance next ()
{
    if (!dataSubiterator.hasNext()) {
        assert (superIterator.hasNext());
        superInstance = superIterator.next();
        dataSubiterator = ((FeatureVectorSequence)superInstance.getData()).iterator();
        targetSubiterator = ((LabelSequence)superInstance.getTarget()).iterator();
    }
    // We are assuming sequences don't have zero length
    assert (dataSubiterator.hasNext());
    assert (targetSubiterator.hasNext());
    return new Instance (dataSubiterator.next(), targetSubiterator.next(),
                         superInstance.getSource()+" tokensequence:"+count++, null);
}

public boolean hasNext () {
/**
 * Returns the next per-element instance, pairing one element of the current
 * super-instance's data sequence with the matching element of its target
 * sequence.
 *
 * When the current data sub-iterator is exhausted, the next super-instance is
 * pulled from {@code superIterator}; its data is cast to
 * {@code FeatureVectorSequence} and its target to {@code LabelSequence}, and
 * fresh sub-iterators are taken from both.
 *
 * The returned instance is named with the super-instance's source followed by
 * {@code " tokensequence:"} and a running counter (incremented on each call),
 * and carries a {@code null} source.
 *
 * The preconditions are checked with {@code assert} only, so they are not
 * enforced when assertions are disabled.
 *
 * @return a new instance built from the next data/target pair
 */
public Instance next ()
{
    if (!dataSubiterator.hasNext()) {
        assert (superIterator.hasNext());
        superInstance = superIterator.next();
        dataSubiterator = ((FeatureVectorSequence)superInstance.getData()).iterator();
        targetSubiterator = ((LabelSequence)superInstance.getTarget()).iterator();
    }
    // We are assuming sequences don't have zero length
    assert (dataSubiterator.hasNext());
    assert (targetSubiterator.hasNext());
    return new Instance (dataSubiterator.next(), targetSubiterator.next(),
                         superInstance.getSource()+" tokensequence:"+count++, null);
}

public boolean hasNext () {
/**
 * Pulls the next instance from the wrapped iterator, runs it through
 * {@code pipe}, and returns a fresh {@code Instance} carrying the piped
 * instance's data, target, name and source.
 *
 * @return a new instance copied field-by-field from the piped result
 */
public Instance next ()
{
    final Instance piped = pipe.pipe (subIt.next ());
    // Hand back a copy rather than the object the pipe returned.
    return new Instance (piped.getData (),
                         piped.getTarget (),
                         piped.getName (),
                         piped.getSource ());
}
/**
 * Pulls the next instance from the wrapped iterator, runs it through
 * {@code pipe}, and returns a fresh {@code Instance} carrying the piped
 * instance's data, target, name and source.
 *
 * @return a new instance copied field-by-field from the piped result
 */
public Instance next ()
{
    final Instance piped = pipe.pipe (subIt.next ());
    // Hand back a copy rather than the object the pipe returned.
    return new Instance (piped.getData (),
                         piped.getTarget (),
                         piped.getName (),
                         piped.getSource ());
}
/**
 * Pulls the next instance from the wrapped iterator, runs it through
 * {@code pipe}, and returns a fresh {@code Instance} carrying the piped
 * instance's data, target, name and source.
 *
 * @return a new instance copied field-by-field from the piped result
 */
public Instance next ()
{
    final Instance piped = pipe.pipe (subIt.next ());
    // Hand back a copy rather than the object the pipe returned.
    return new Instance (piped.getData (),
                         piped.getTarget (),
                         piped.getName (),
                         piped.getSource ());
}
/**
 * Packages this object's labeling as a feature vector inside a new instance.
 *
 * Every location of the labeling contributes one (index, value) entry; the
 * vector is built over the labeling's own alphabet. The resulting instance
 * has that vector as its data, {@code null} target and name, and the source
 * of the wrapped {@code instance}.
 *
 * @return a new instance whose data is the labeling expressed as a FeatureVector
 */
public Instance toInstance()
{
    final int numLocations = labeling.numLocations();
    final double[] weights = new double[numLocations];
    final int[] featureIndices = new int[numLocations];

    int loc = 0;
    while (loc < numLocations) {
        featureIndices[loc] = labeling.indexAtLocation(loc);
        weights[loc] = labeling.valueAtLocation(loc);
        loc++;
    }

    final FeatureVector vector =
        new FeatureVector(labeling.getAlphabet(), featureIndices, weights);
    return new Instance(vector, null, null, instance.getSource());
}
}
/**
 * Packages this object's labeling as a feature vector inside a new instance.
 *
 * Every location of the labeling contributes one (index, value) entry; the
 * vector is built over the labeling's own alphabet. The resulting instance
 * has that vector as its data, {@code null} target and name, and the source
 * of the wrapped {@code instance}.
 *
 * @return a new instance whose data is the labeling expressed as a FeatureVector
 */
public Instance toInstance()
{
    final int numLocations = labeling.numLocations();
    final double[] weights = new double[numLocations];
    final int[] featureIndices = new int[numLocations];

    int loc = 0;
    while (loc < numLocations) {
        featureIndices[loc] = labeling.indexAtLocation(loc);
        weights[loc] = labeling.valueAtLocation(loc);
        loc++;
    }

    final FeatureVector vector =
        new FeatureVector(labeling.getAlphabet(), featureIndices, weights);
    return new Instance(vector, null, null, instance.getSource());
}
}
/**
 * Packages this object's labeling as a feature vector inside a new instance.
 *
 * Every location of the labeling contributes one (index, value) entry; the
 * vector is built over the labeling's own alphabet. The resulting instance
 * has that vector as its data, {@code null} target and name, and the source
 * of the wrapped {@code instance}.
 *
 * @return a new instance whose data is the labeling expressed as a FeatureVector
 */
public Instance toInstance()
{
    final int numLocations = labeling.numLocations();
    final double[] weights = new double[numLocations];
    final int[] featureIndices = new int[numLocations];

    int loc = 0;
    while (loc < numLocations) {
        featureIndices[loc] = labeling.indexAtLocation(loc);
        weights[loc] = labeling.valueAtLocation(loc);
        loc++;
    }

    final FeatureVector vector =
        new FeatureVector(labeling.getAlphabet(), featureIndices, weights);
    return new Instance(vector, null, null, instance.getSource());
}
}
/**
 * Transduces every instance in {@code ilist} with the CRF and collects one
 * {@code DocumentExtraction} per instance into a single {@code Extraction}.
 *
 * Assumes Instance.source contains the Tokenization object. Each instance's
 * data and target are cast to {@code Sequence}, and its name is rendered
 * with {@code toString()}.
 *
 * @param ilist instances to run extraction over
 * @return an Extraction holding one document extraction per instance, in list order
 */
public Extraction extract (InstanceList ilist)
{
    final Extraction result = new Extraction (this, getTargetAlphabet ());

    for (int idx = 0; idx < ilist.size(); idx++) {
        final Instance current = ilist.get(idx);

        final Tokenization tokens = (Tokenization) current.getSource();
        final String docName = current.getName().toString();
        final Sequence features = (Sequence) current.getData ();
        final Sequence goldLabels = (Sequence) current.getTarget ();

        // Predicted label sequence for this document.
        final Sequence predicted = crf.transduce(features);

        result.addDocumentExtraction (
            new DocumentExtraction (docName, getTargetAlphabet(), tokens,
                                    predicted, goldLabels, backgroundTag, filter));
    }

    return result;
}