public static class PDF2TextConverter.PatchedPDFTextStripper extends org.apache.pdfbox.util.PDFTextStripper
Constructor and Description |
---|
PatchedPDFTextStripper() |
Modifier and Type | Method and Description |
---|---|
protected Map<String,org.apache.pdfbox.util.operator.OperatorProcessor> | operators() |
protected void | processOperator(org.apache.pdfbox.util.PDFOperator operator, List<org.apache.pdfbox.cos.COSBase> arguments) |
protected Object | unrestrictedAccess(String name) |
protected Set<String> | unsupportedOperators() |
Methods inherited from class org.apache.pdfbox.util.PDFTextStripper: endArticle, endDocument, endPage, getAddMoreFormatting, getArticleEnd, getArticleStart, getAverageCharTolerance, getCharactersByArticle, getCurrentPageNo, getDropThreshold, getEndBookmark, getEndPage, getIndentThreshold, getLineSeparator, getListItemPatterns, getOutput, getPageEnd, getPageSeparator, getPageStart, getParagraphEnd, getParagraphStart, getSeparateByBeads, getSortByPosition, getSpacingTolerance, getStartBookmark, getStartPage, getSuppressDuplicateOverlappingText, getText, getText, getWordSeparator, handleLineSeparation, inspectFontEncoding, isParagraphSeparation, matchListItemPattern, matchPattern, processPage, processPages, processTextPosition, resetEngine, setAddMoreFormatting, setArticleEnd, setArticleStart, setAverageCharTolerance, setDropThreshold, setEndBookmark, setEndPage, setIndentThreshold, setLineSeparator, setListItemPatterns, setPageEnd, setPageSeparator, setPageStart, setParagraphEnd, setParagraphStart, setShouldSeparateByBeads, setSortByPosition, setSpacingTolerance, setStartBookmark, setStartPage, setSuppressDuplicateOverlappingText, setWordSeparator, startArticle, startArticle, startDocument, startPage, writeCharacters, writeLineSeparator, writePage, writePageEnd, writePageSeperator, writePageStart, writeParagraphEnd, writeParagraphSeparator, writeParagraphStart, writeString, writeString, writeText, writeText, writeWordSeparator
Methods inherited from class org.apache.pdfbox.util.PDFStreamEngine: getColorSpaces, getCurrentPage, getFonts, getGraphicsStack, getGraphicsState, getGraphicsStates, getResources, getTextLineMatrix, getTextMatrix, getTotalCharCnt, getValidCharCnt, getXObjects, isForceParsing, processEncodedText, processOperator, processStream, processSubStream, registerOperatorProcessor, setColorSpaces, setFonts, setForceParsing, setGraphicsStack, setGraphicsState, setGraphicsStates, setTextLineMatrix, setTextMatrix
public PatchedPDFTextStripper() throws IOException
Throws: IOException
protected Object unrestrictedAccess(String name)
protected Set<String> unsupportedOperators()
protected void processOperator(org.apache.pdfbox.util.PDFOperator operator, List<org.apache.pdfbox.cos.COSBase> arguments) throws IOException
Overrides: processOperator in class org.apache.pdfbox.util.PDFStreamEngine
Throws: IOException
Copyright © 2015 Nuxeo SA. All rights reserved.