// Build the TextBlock for the text accumulated in textBuffer; trim() strips leading and
// trailing whitespace before the text is handed over. The remaining arguments pass along
// currentContainedTextElements, the word/line counters and offsetBlocks unchanged.
// NOTE(review): what each counter means is defined by the TextBlock constructor, which is
// not visible here - confirm the argument order against its declaration.
TextBlock tb = new TextBlock(textBuffer.toString().trim(), currentContainedTextElements, numWords, numLinkedWords, numWordsInWrappedLines, numWrappedLines, offsetBlocks);
// Build the TextBlock for the text accumulated in textBuffer; trim() strips leading and
// trailing whitespace before the text is handed over. The remaining arguments pass along
// currentContainedTextElements, the word/line counters and offsetBlocks unchanged.
// NOTE(review): what each counter means is defined by the TextBlock constructor, which is
// not visible here - confirm the argument order against its declaration.
TextBlock tb = new TextBlock(textBuffer.toString().trim(), currentContainedTextElements, numWords, numLinkedWords, numWordsInWrappedLines, numWrappedLines, offsetBlocks);
/**
 * Splits every text block whose text spans several lines into one block per line.
 *
 * <p>Each block's text is cut at every run of {@code \n} / {@code \r} characters. A block
 * that yields fewer than two pieces is kept as it is. Otherwise it is replaced by one new
 * {@code TextBlock} per non-empty piece; every new block receives the original block's
 * content flag and labels. Empty pieces (produced when the text starts with a line break)
 * are skipped so that no empty block is emitted.
 *
 * <p>If at least one block was split, the list returned by {@code doc.getTextBlocks()} is
 * cleared and refilled with the resulting blocks, preserving their order.
 *
 * @param doc the document whose text blocks are examined
 * @return {@code true} if at least one block was split, {@code false} if nothing changed
 * @throws BoilerpipeProcessingException declared by the signature; this implementation
 *         does not throw it itself
 */
public boolean process(TextDocument doc) throws BoilerpipeProcessingException {
    final List<TextBlock> blocks = doc.getTextBlocks();
    final List<TextBlock> blocksNew = new ArrayList<TextBlock>(blocks.size());
    // Compile the separator once per call; String.split would recompile it for every block.
    final java.util.regex.Pattern lineBreaks = java.util.regex.Pattern.compile("[\n\r]+");
    boolean changes = false;

    for (TextBlock tb : blocks) {
        final String[] paragraphs = lineBreaks.split(tb.getText());
        if (paragraphs.length < 2) {
            // Nothing to split: keep the original block (and all of its state).
            blocksNew.add(tb);
            continue;
        }

        final boolean isContent = tb.isContent();
        final Set<String> labels = tb.getLabels();
        for (String p : paragraphs) {
            // A text that begins with a line break yields an empty first piece;
            // trailing empty pieces are already dropped by split().
            if (p.length() == 0) {
                continue;
            }
            final TextBlock tbP = new TextBlock(p);
            tbP.setIsContent(isContent);
            tbP.addLabels(labels);
            blocksNew.add(tbP);
        }
        // With two or more pieces the last one is always non-empty, so the block was replaced.
        changes = true;
    }

    if (changes) {
        blocks.clear();
        blocks.addAll(blocksNew);
    }
    return changes;
}
// Build the TextBlock for the text accumulated in textBuffer; trim() strips leading and
// trailing whitespace before the text is handed over. The remaining arguments pass along
// currentContainedTextElements, the word/line counters and offsetBlocks unchanged.
// NOTE(review): what each counter means is defined by the TextBlock constructor, which is
// not visible here - confirm the argument order against its declaration.
TextBlock tb = new TextBlock(textBuffer.toString().trim(), currentContainedTextElements, numWords, numLinkedWords, numWordsInWrappedLines, numWrappedLines, offsetBlocks);
// Build the TextBlock for the text accumulated in textBuffer; trim() strips leading and
// trailing whitespace before the text is handed over. The remaining arguments pass along
// currentContainedTextElements, the word/line counters and offsetBlocks unchanged.
// NOTE(review): what each counter means is defined by the TextBlock constructor, which is
// not visible here - confirm the argument order against its declaration.
TextBlock tb = new TextBlock(textBuffer.toString().trim(), currentContainedTextElements, numWords, numLinkedWords, numWordsInWrappedLines, numWrappedLines, offsetBlocks);
/**
 * Splits every text block whose text spans several lines into one block per line.
 *
 * <p>Each block's text is cut at every run of {@code \n} / {@code \r} characters. A block
 * that yields fewer than two pieces is kept as it is. Otherwise it is replaced by one new
 * {@code TextBlock} per non-empty piece; every new block receives the original block's
 * content flag and labels. Empty pieces (produced when the text starts with a line break)
 * are skipped so that no empty block is emitted.
 *
 * <p>If at least one block was split, the list returned by {@code doc.getTextBlocks()} is
 * cleared and refilled with the resulting blocks, preserving their order.
 *
 * @param doc the document whose text blocks are examined
 * @return {@code true} if at least one block was split, {@code false} if nothing changed
 * @throws BoilerpipeProcessingException declared by the signature; this implementation
 *         does not throw it itself
 */
public boolean process(TextDocument doc) throws BoilerpipeProcessingException {
    final List<TextBlock> blocks = doc.getTextBlocks();
    final List<TextBlock> blocksNew = new ArrayList<TextBlock>(blocks.size());
    // Compile the separator once per call; String.split would recompile it for every block.
    final java.util.regex.Pattern lineBreaks = java.util.regex.Pattern.compile("[\n\r]+");
    boolean changes = false;

    for (TextBlock tb : blocks) {
        final String[] paragraphs = lineBreaks.split(tb.getText());
        if (paragraphs.length < 2) {
            // Nothing to split: keep the original block (and all of its state).
            blocksNew.add(tb);
            continue;
        }

        final boolean isContent = tb.isContent();
        final Set<String> labels = tb.getLabels();
        for (String p : paragraphs) {
            // A text that begins with a line break yields an empty first piece;
            // trailing empty pieces are already dropped by split().
            if (p.length() == 0) {
                continue;
            }
            final TextBlock tbP = new TextBlock(p);
            tbP.setIsContent(isContent);
            tbP.addLabels(labels);
            blocksNew.add(tbP);
        }
        // With two or more pieces the last one is always non-empty, so the block was replaced.
        changes = true;
    }

    if (changes) {
        blocks.clear();
        blocks.addAll(blocksNew);
    }
    return changes;
}
/**
 * Splits every text block whose text spans several lines into one block per line.
 *
 * <p>Each block's text is cut at every run of {@code \n} / {@code \r} characters. A block
 * that yields fewer than two pieces is kept as it is. Otherwise it is replaced by one new
 * {@code TextBlock} per non-empty piece; every new block receives the original block's
 * content flag and labels. Empty pieces (produced when the text starts with a line break)
 * are skipped so that no empty block is emitted.
 *
 * <p>If at least one block was split, the list returned by {@code doc.getTextBlocks()} is
 * cleared and refilled with the resulting blocks, preserving their order.
 *
 * @param doc the document whose text blocks are examined
 * @return {@code true} if at least one block was split, {@code false} if nothing changed
 * @throws BoilerpipeProcessingException declared by the signature; this implementation
 *         does not throw it itself
 */
public boolean process(TextDocument doc) throws BoilerpipeProcessingException {
    final List<TextBlock> blocks = doc.getTextBlocks();
    final List<TextBlock> blocksNew = new ArrayList<TextBlock>(blocks.size());
    // Compile the separator once per call; String.split would recompile it for every block.
    final java.util.regex.Pattern lineBreaks = java.util.regex.Pattern.compile("[\n\r]+");
    boolean changes = false;

    for (TextBlock tb : blocks) {
        final String[] paragraphs = lineBreaks.split(tb.getText());
        if (paragraphs.length < 2) {
            // Nothing to split: keep the original block (and all of its state).
            blocksNew.add(tb);
            continue;
        }

        final boolean isContent = tb.isContent();
        final Set<String> labels = tb.getLabels();
        for (String p : paragraphs) {
            // A text that begins with a line break yields an empty first piece;
            // trailing empty pieces are already dropped by split().
            if (p.length() == 0) {
                continue;
            }
            final TextBlock tbP = new TextBlock(p);
            tbP.setIsContent(isContent);
            tbP.addLabels(labels);
            blocksNew.add(tbP);
        }
        // With two or more pieces the last one is always non-empty, so the block was replaced.
        changes = true;
    }

    if (changes) {
        blocks.clear();
        blocks.addAll(blocksNew);
    }
    return changes;
}
/**
 * Splits every text block whose text spans several lines into one block per line.
 *
 * <p>Each block's text is cut at every run of {@code \n} / {@code \r} characters. A block
 * that yields fewer than two pieces is kept as it is. Otherwise it is replaced by one new
 * {@code TextBlock} per non-empty piece; every new block receives the original block's
 * content flag and labels. Empty pieces (produced when the text starts with a line break)
 * are skipped so that no empty block is emitted.
 *
 * <p>If at least one block was split, the list returned by {@code doc.getTextBlocks()} is
 * cleared and refilled with the resulting blocks, preserving their order.
 *
 * @param doc the document whose text blocks are examined
 * @return {@code true} if at least one block was split, {@code false} if nothing changed
 * @throws BoilerpipeProcessingException declared by the signature; this implementation
 *         does not throw it itself
 */
public boolean process(TextDocument doc) throws BoilerpipeProcessingException {
    final List<TextBlock> blocks = doc.getTextBlocks();
    final List<TextBlock> blocksNew = new ArrayList<TextBlock>(blocks.size());
    // Compile the separator once per call; String.split would recompile it for every block.
    final java.util.regex.Pattern lineBreaks = java.util.regex.Pattern.compile("[\n\r]+");
    boolean changes = false;

    for (TextBlock tb : blocks) {
        final String[] paragraphs = lineBreaks.split(tb.getText());
        if (paragraphs.length < 2) {
            // Nothing to split: keep the original block (and all of its state).
            blocksNew.add(tb);
            continue;
        }

        final boolean isContent = tb.isContent();
        final Set<String> labels = tb.getLabels();
        for (String p : paragraphs) {
            // A text that begins with a line break yields an empty first piece;
            // trailing empty pieces are already dropped by split().
            if (p.length() == 0) {
                continue;
            }
            final TextBlock tbP = new TextBlock(p);
            tbP.setIsContent(isContent);
            tbP.addLabels(labels);
            blocksNew.add(tbP);
        }
        // With two or more pieces the last one is always non-empty, so the block was replaced.
        changes = true;
    }

    if (changes) {
        blocks.clear();
        blocks.addAll(blocksNew);
    }
    return changes;
}