public class HtmlTextExtractor extends DefaultTextExtractor
Constructor and Description |
---|
HtmlTextExtractor(OutputProcessorMetaData metaData,
XmlWriter xmlWriter,
HtmlContentGenerator contentGenerator,
HtmlTagHelper tagHelper) |
Modifier and Type | Method and Description |
---|---|
protected void |
addEmptyBreak() |
protected void |
addLinebreak() |
protected void |
addSoftBreak() |
protected void |
drawComplexText(RenderableComplexText renderableComplexText) |
protected void |
drawText(RenderableText renderableText,
long contentX2)
Renders the glyphs stored in the text node.
|
protected void |
finishBlockBox(BlockRenderBox box) |
protected void |
finishCanvasBox(CanvasRenderBox box) |
protected void |
finishInlineBox(InlineRenderBox box) |
protected void |
finishRowBox(RenderBox box) |
boolean |
performOutput(RenderBox content,
StyleBuilder.StyleCarrier[] cellStyle) |
protected void |
processInitialBox(ParagraphRenderBox box)
Prints a paragraph cell.
|
protected void |
processOtherNode(RenderNode node) |
protected void |
processRenderableContent(RenderableReplacedContentBox node) |
protected boolean |
startBlockBox(BlockRenderBox box) |
protected boolean |
startCanvasBox(CanvasRenderBox box)
Prints the contents of a canvas box.
|
protected boolean |
startInlineBox(InlineRenderBox box) |
protected boolean |
startRowBox(RenderBox box)
Like a canvas box, a row-box should be split into several cells already.
|
clearText, compute, getCodePointBuffer, getFormattedtext, getParagraphBounds, getRawResult, getRawSource, getText, getTextLength, isContentField, isOverflowX, isOverflowY, isTextLineOverflow, processParagraphChilds, processTextLine, setRawResult, startAutoBox, startOtherBox, startTableBox, startTableCellBox, startTableColumnGroupBox, startTableRowBox, startTableSectionBox
finishAutoBox, finishOtherBox, finishTableBox, finishTableCellBox, finishTableColumnGroupBox, finishTableRowBox, finishTableSectionBox, processBoxChilds, processTableColumn, startProcessing
public HtmlTextExtractor(OutputProcessorMetaData metaData, XmlWriter xmlWriter, HtmlContentGenerator contentGenerator, HtmlTagHelper tagHelper)
public boolean performOutput(RenderBox content, StyleBuilder.StyleCarrier[] cellStyle) throws IOException
IOException
protected boolean startCanvasBox(CanvasRenderBox box)
startCanvasBox
in class DefaultTextExtractor
box
- the canvas box
protected void finishCanvasBox(CanvasRenderBox box)
finishCanvasBox
in class IterateStructuralProcessStep
protected void processInitialBox(ParagraphRenderBox box) throws IOException
box
- the paragraph box
IOException
- if an IO error occurred.
protected void addEmptyBreak()
addEmptyBreak
in class DefaultTextExtractor
protected void addSoftBreak()
addSoftBreak
in class DefaultTextExtractor
protected void addLinebreak()
addLinebreak
in class DefaultTextExtractor
protected boolean startBlockBox(BlockRenderBox box)
startBlockBox
in class DefaultTextExtractor
protected void finishBlockBox(BlockRenderBox box)
finishBlockBox
in class IterateStructuralProcessStep
protected boolean startRowBox(RenderBox box)
startRowBox
in class DefaultTextExtractor
protected void finishRowBox(RenderBox box)
finishRowBox
in class IterateStructuralProcessStep
protected boolean startInlineBox(InlineRenderBox box)
startInlineBox
in class DefaultTextExtractor
protected void finishInlineBox(InlineRenderBox box)
finishInlineBox
in class IterateStructuralProcessStep
protected void processOtherNode(RenderNode node)
processOtherNode
in class DefaultTextExtractor
protected void processRenderableContent(RenderableReplacedContentBox node)
processRenderableContent
in class DefaultTextExtractor
protected void drawText(RenderableText renderableText, long contentX2)
Description copied from class: DefaultTextExtractor
drawText
in class DefaultTextExtractor
renderableText
- the text node that should be rendered.
protected void drawComplexText(RenderableComplexText renderableComplexText)
drawComplexText
in class DefaultTextExtractor
Copyright © 2017 Hitachi Vantara. All rights reserved.