Package org.apache.tika.parser.pdf.image
Class ImageGraphicsEngine
java.lang.Object
org.apache.pdfbox.contentstream.PDFStreamEngine
org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
org.apache.tika.parser.pdf.image.ImageGraphicsEngine
public class ImageGraphicsEngine
extends org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
Copied nearly verbatim from PDFBox
-
Field Summary
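Modifier and Type | Field | Description
protected final EmbeddedDocumentExtractor embeddedDocumentExtractor
protected final boolean extractInlineImageMetadataOnly
protected final AtomicInteger imageCounter
protected static final long MAX_IMAGE_LENGTH_BYTES
protected final int pageNumber
protected final Metadata parentMetadata
protected final ParseContext parseContext
protected final PDFParserConfig pdfParserConfig
protected boolean useDirectJPEG
protected final XHTMLContentHandler xhtml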
-
Constructor Summary
Modifier | Constructor | Description
protected ImageGraphicsEngine(org.apache.pdfbox.pdmodel.PDPage page, int pageNumber, EmbeddedDocumentExtractor embeddedDocumentExtractor, PDFParserConfig pdfParserConfig, Map<org.apache.pdfbox.cos.COSStream, Integer> processedInlineImages, AtomicInteger imageCounter, XHTMLContentHandler xhtml, Metadata parentMetadata, ParseContext parseContext)
-
Method Summary
Modifier and Type | Method | Description
void appendRectangle(Point2D p0, Point2D p1, Point2D p2, Point2D p3)
void clip(int windingRule)
void closePath()
protected static void copyUpToMaxLength(InputStream is, OutputStream os)
void curveTo(float x1, float y1, float x2, float y2, float x3, float y3)
void drawImage(org.apache.pdfbox.pdmodel.graphics.image.PDImage pdImage)
void endPath()
protected void extractInlineImageMetadataOnly(org.apache.pdfbox.pdmodel.graphics.image.PDImage pdImage, Metadata metadata)
void fillAndStrokePath(int windingRule)
void fillPath(int windingRule)
protected String getSuffix(org.apache.pdfbox.pdmodel.graphics.image.PDImage pdImage, Metadata metadata)
protected void handleCatchableIOE (parameter list not recoverable from this extract)
protected static boolean hasMasks(org.apache.pdfbox.pdmodel.graphics.image.PDImage pdImage)
void lineTo(float x, float y)
void moveTo(float x, float y)
protected void processImage(org.apache.pdfbox.pdmodel.graphics.image.PDImage pdImage, int imageNumber)
void run()
void shadingFill(org.apache.pdfbox.cos.COSName shadingName)
protected void showGlyph(org.apache.pdfbox.util.Matrix textRenderingMatrix, org.apache.pdfbox.pdmodel.font.PDFont font, int code, org.apache.pdfbox.util.Vector displacement)
void strokePath()
protected BufferedImage writeToBuffer(org.apache.pdfbox.pdmodel.graphics.image.PDImage pdImage, String suffix, boolean directJPEG, OutputStream out)
Methods inherited from class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
getPage
Methods inherited from class org.apache.pdfbox.contentstream.PDFStreamEngine
addOperator, applyTextAdjustment, beginMarkedContentSequence, beginText, decreaseLevel, endMarkedContentSequence, endText, getAppearance, getCurrentPage, getGraphicsStackSize, getGraphicsState, getInitialMatrix, getLevel, getResources, getTextLineMatrix, getTextMatrix, increaseLevel, operatorException, processAnnotation, processChildStream, processOperator, processOperator, processPage, processSoftMask, processTilingPattern, processTilingPattern, processTransparencyGroup, processType3Stream, restoreGraphicsStack, restoreGraphicsState, saveGraphicsStack, saveGraphicsState, setLineDashPattern, setTextLineMatrix, setTextMatrix, showAnnotation, showFontGlyph, showForm, showText, showTextString, showTextStrings, showTransparencyGroup, showType3Glyph, transformedPoint, transformWidth, unsupportedOperator
-
Field Details
-
MAX_IMAGE_LENGTH_BYTES
protected static final long MAX_IMAGE_LENGTH_BYTES
- See Also:
-
JPEG
-
JP2
-
JB2
-
pageNumber
protected final int pageNumber -
embeddedDocumentExtractor
-
pdfParserConfig
-
processedInlineImages
-
imageCounter
-
parentMetadata
-
xhtml
-
parseContext
-
extractInlineImageMetadataOnly
protected final boolean extractInlineImageMetadataOnly -
useDirectJPEG
protected boolean useDirectJPEG
-
-
Constructor Details
-
ImageGraphicsEngine
protected ImageGraphicsEngine(org.apache.pdfbox.pdmodel.PDPage page, int pageNumber, EmbeddedDocumentExtractor embeddedDocumentExtractor, PDFParserConfig pdfParserConfig, Map<org.apache.pdfbox.cos.COSStream, Integer> processedInlineImages, AtomicInteger imageCounter, XHTMLContentHandler xhtml, Metadata parentMetadata, ParseContext parseContext)
-
-
Method Details
-
writeToBuffer
protected BufferedImage writeToBuffer(org.apache.pdfbox.pdmodel.graphics.image.PDImage pdImage, String suffix, boolean directJPEG, OutputStream out) throws IOException, TikaException - Throws:
IOException
TikaException
-
copyUpToMaxLength
protected static void copyUpToMaxLength(InputStream is, OutputStream os) throws IOException, TikaException - Throws:
IOException
TikaException
-
hasMasks
protected static boolean hasMasks(org.apache.pdfbox.pdmodel.graphics.image.PDImage pdImage) throws IOException - Throws:
IOException
-
run
- Throws:
IOException
-
drawImage
- Specified by:
drawImage
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
appendRectangle
- Specified by:
appendRectangle
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
clip
- Specified by:
clip
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
moveTo
- Specified by:
moveTo
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
lineTo
- Specified by:
lineTo
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
curveTo
- Specified by:
curveTo
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
getCurrentPoint
- Specified by:
getCurrentPoint
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
closePath
- Specified by:
closePath
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
endPath
- Specified by:
endPath
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
showGlyph
protected void showGlyph(org.apache.pdfbox.util.Matrix textRenderingMatrix, org.apache.pdfbox.pdmodel.font.PDFont font, int code, org.apache.pdfbox.util.Vector displacement) throws IOException - Overrides:
showGlyph
in class org.apache.pdfbox.contentstream.PDFStreamEngine
- Throws:
IOException
-
strokePath
- Specified by:
strokePath
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
fillPath
- Specified by:
fillPath
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
fillAndStrokePath
- Specified by:
fillAndStrokePath
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
shadingFill
- Specified by:
shadingFill
in class org.apache.pdfbox.contentstream.PDFGraphicsStreamEngine
- Throws:
IOException
-
processImage
protected void processImage(org.apache.pdfbox.pdmodel.graphics.image.PDImage pdImage, int imageNumber) throws IOException, TikaException, SAXException - Throws:
IOException
TikaException
SAXException
-
extractInlineImageMetadataOnly
protected void extractInlineImageMetadataOnly(org.apache.pdfbox.pdmodel.graphics.image.PDImage pdImage, Metadata metadata) throws IOException, SAXException - Throws:
IOException
SAXException
-
getSuffix
protected String getSuffix(org.apache.pdfbox.pdmodel.graphics.image.PDImage pdImage, Metadata metadata) throws IOException - Throws:
IOException
-
handleCatchableIOE
- Throws:
IOException
-
getExceptions
-