Package org.apache.tika.parser.microsoft
Class HSLFExtractor
java.lang.Object
org.apache.tika.parser.microsoft.HSLFExtractor
-
Field Summary
Modifier and TypeFieldDescriptionprotected final ParseContext
protected final OfficeParserConfig
protected final Metadata
-
Constructor Summary
-
Method Summary
Modifier and TypeMethodDescriptionprotected Detector
protected String
Returns the password to be used for this file, or null if no / default password should be usedprotected TikaConfig
protected void
handleEmbeddedOfficeDoc
(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) Handle an office document that's embedded at the POIFS levelprotected void
handleEmbeddedOfficeDoc
(org.apache.poi.poifs.filesystem.DirectoryEntry dir, XHTMLContentHandler xhtml, boolean outputHtml) Handle an office document that's embedded at the POIFS levelprotected void
handleEmbeddedResource
(TikaInputStream resource, String filename, String relationshipID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) protected void
handleEmbeddedResource
(TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) protected void
handleEmbeddedResource
(TikaInputStream resource, Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) protected void
parse
(org.apache.poi.poifs.filesystem.DirectoryNode root, XHTMLContentHandler xhtml) protected void
parse
(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem, XHTMLContentHandler xhtml) static String
tryToGetMsgTitle
(org.apache.poi.poifs.filesystem.DirectoryEntry node, String defaultVal)
-
Field Details
-
parentMetadata
-
officeParserConfig
-
context
-
-
Constructor Details
-
HSLFExtractor
-
-
Method Details
-
parse
protected void parse(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem, XHTMLContentHandler xhtml) throws IOException, SAXException, TikaException - Throws:
IOException
SAXException
TikaException
-
parse
protected void parse(org.apache.poi.poifs.filesystem.DirectoryNode root, XHTMLContentHandler xhtml) throws IOException, SAXException, TikaException - Throws:
IOException
SAXException
TikaException
-
getTikaConfig
-
getDetector
-
getPassword
Returns the password to be used for this file, or null if no / default password should be used -
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException - Throws:
IOException
SAXException
TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException - Throws:
IOException
SAXException
TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException - Throws:
IOException
SAXException
TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException Handle an office document that's embedded at the POIFS level- Throws:
IOException
SAXException
TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException Handle an office document that's embedded at the POIFS level- Throws:
IOException
SAXException
TikaException
-
tryToGetMsgTitle
-