Package de.xima.fc.form.common.pdf
Class PDF2HTMLImportStripper
- java.lang.Object
-
- org.apache.pdfbox.contentstream.PDFStreamEngine
-
- org.apache.pdfbox.text.PDFTextStripper
-
- de.xima.fc.form.common.pdf.PDF2HTMLImportStripper
-
public class PDF2HTMLImportStripper extends org.apache.pdfbox.text.PDFTextStripper
-
-
Constructor Summary
Constructors
Constructor | Description
PDF2HTMLImportStripper(org.apache.pdfbox.pdmodel.PDDocument document)
-
Method Summary
All Methods | Instance Methods | Concrete Methods
Modifier and Type | Method | Description
protected float | computeFontHeight(org.apache.pdfbox.pdmodel.font.PDFont arg0)
void | drawHTMLFields()
String | getHTML()
com.hp.gagawa.java.Node | getHTMLBase()
com.alibaba.fastjson.JSONArray | getOnValues(org.apache.pdfbox.pdmodel.interactive.form.PDButton pdField)
ArrayList<String> | getPageImages()
protected void | processOperator(org.apache.pdfbox.contentstream.operator.Operator operator, List<org.apache.pdfbox.cos.COSBase> operands)
protected void | processTextPosition(org.apache.pdfbox.text.TextPosition text)
protected void | showGlyph(org.apache.pdfbox.util.Matrix arg0, org.apache.pdfbox.pdmodel.font.PDFont arg1, int arg2, String arg3, org.apache.pdfbox.util.Vector arg4)
void | stripPage(int page, String img)
-
Methods inherited from class org.apache.pdfbox.text.PDFTextStripper
endArticle, endDocument, endPage, getAddMoreFormatting, getArticleEnd, getArticleStart, getAverageCharTolerance, getCharactersByArticle, getCurrentPageNo, getDropThreshold, getEndBookmark, getEndPage, getIndentThreshold, getLineSeparator, getListItemPatterns, getOutput, getPageEnd, getPageStart, getParagraphEnd, getParagraphStart, getSeparateByBeads, getSortByPosition, getSpacingTolerance, getStartBookmark, getStartPage, getSuppressDuplicateOverlappingText, getText, getWordSeparator, matchPattern, processPage, processPages, setAddMoreFormatting, setArticleEnd, setArticleStart, setAverageCharTolerance, setDropThreshold, setEndBookmark, setEndPage, setIndentThreshold, setLineSeparator, setListItemPatterns, setPageEnd, setPageStart, setParagraphEnd, setParagraphStart, setShouldSeparateByBeads, setSortByPosition, setSpacingTolerance, setStartBookmark, setStartPage, setSuppressDuplicateOverlappingText, setWordSeparator, startArticle, startArticle, startDocument, startPage, writeCharacters, writeLineSeparator, writePage, writePageEnd, writePageStart, writeParagraphEnd, writeParagraphSeparator, writeParagraphStart, writeString, writeString, writeText, writeWordSeparator
-
Methods inherited from class org.apache.pdfbox.contentstream.PDFStreamEngine
addOperator, applyTextAdjustment, beginMarkedContentSequence, beginText, decreaseLevel, endMarkedContentSequence, endText, getAppearance, getCurrentPage, getGraphicsStackSize, getGraphicsState, getInitialMatrix, getLevel, getResources, getTextLineMatrix, getTextMatrix, increaseLevel, operatorException, processAnnotation, processChildStream, processOperator, processSoftMask, processTilingPattern, processTilingPattern, processTransparencyGroup, processType3Stream, registerOperatorProcessor, restoreGraphicsStack, restoreGraphicsState, saveGraphicsStack, saveGraphicsState, setLineDashPattern, setTextLineMatrix, setTextMatrix, showAnnotation, showFontGlyph, showFontGlyph, showForm, showGlyph, showText, showTextString, showTextStrings, showTransparencyGroup, showType3Glyph, showType3Glyph, transformedPoint, transformWidth, unsupportedOperator
-
-
-
-
Constructor Detail
-
PDF2HTMLImportStripper
public PDF2HTMLImportStripper(org.apache.pdfbox.pdmodel.PDDocument document) throws IOException
- Throws:
IOException
-
-
Method Detail
-
getHTML
public String getHTML()
-
getHTMLBase
public com.hp.gagawa.java.Node getHTMLBase()
-
processOperator
protected void processOperator(org.apache.pdfbox.contentstream.operator.Operator operator, List<org.apache.pdfbox.cos.COSBase> operands) throws IOException
- Overrides:
processOperator in class org.apache.pdfbox.contentstream.PDFStreamEngine
- Throws:
IOException
-
stripPage
public void stripPage(int page, String img) throws IOException
- Throws:
IOException
-
getOnValues
public com.alibaba.fastjson.JSONArray getOnValues(org.apache.pdfbox.pdmodel.interactive.form.PDButton pdField)
-
drawHTMLFields
public void drawHTMLFields()
-
processTextPosition
protected void processTextPosition(org.apache.pdfbox.text.TextPosition text)
- Overrides:
processTextPosition in class org.apache.pdfbox.text.PDFTextStripper
-
showGlyph
protected void showGlyph(org.apache.pdfbox.util.Matrix arg0, org.apache.pdfbox.pdmodel.font.PDFont arg1, int arg2, String arg3, org.apache.pdfbox.util.Vector arg4) throws IOException
- Overrides:
showGlyph in class org.apache.pdfbox.contentstream.PDFStreamEngine
- Throws:
IOException
-
computeFontHeight
protected float computeFontHeight(org.apache.pdfbox.pdmodel.font.PDFont arg0) throws IOException
- Throws:
IOException
-
-