Package org.apache.tika.parser.microsoft
Class HSLFExtractor
java.lang.Object
org.apache.tika.parser.microsoft.HSLFExtractor
- 
Field Summary
Fields
Modifier and Type | Field | Description
protected final ParseContext | context |
protected final OfficeParserConfig | officeParserConfig |
protected final Metadata | parentMetadata |
- 
Constructor Summary
Constructors
- 
Method Summary
Modifier and Type | Method | Description
protected Detector | getDetector |
protected String | getPassword | Returns the password to be used for this file, or null if no password or the default password should be used
protected TikaConfig | getTikaConfig |
protected void | handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) | Handle an office document that's embedded at the POIFS level
protected void | handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, XHTMLContentHandler xhtml, boolean outputHtml) | Handle an office document that's embedded at the POIFS level
protected void | handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) |
protected void | handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) |
protected void | handleEmbeddedResource(TikaInputStream resource, Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) |
protected void | parse(org.apache.poi.poifs.filesystem.DirectoryNode root, XHTMLContentHandler xhtml) |
protected void | parse(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem, XHTMLContentHandler xhtml) |
static String | tryToGetMsgTitle(org.apache.poi.poifs.filesystem.DirectoryEntry node, String defaultVal) |
- 
Field Details- 
parentMetadata
- 
officeParserConfig
- 
context
 
- 
- 
Constructor Details- 
HSLFExtractor
 
- 
- 
Method Details- 
parse
protected void parse(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem, XHTMLContentHandler xhtml) throws IOException, SAXException, TikaException
Throws:
- IOException
- SAXException
- TikaException
 
- 
parse
protected void parse(org.apache.poi.poifs.filesystem.DirectoryNode root, XHTMLContentHandler xhtml) throws IOException, SAXException, TikaException
Throws:
- IOException
- SAXException
- TikaException
 
- 
getTikaConfig
- 
getDetector
- 
getPassword
Returns the password to be used for this file, or null if no password or the default password should be used
- 
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Throws:
- IOException
- SAXException
- TikaException
 
- 
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Throws:
- IOException
- SAXException
- TikaException
 
- 
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Throws:
- IOException
- SAXException
- TikaException
 
- 
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Handle an office document that's embedded at the POIFS level
Throws:
- IOException
- SAXException
- TikaException
 
- 
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Handle an office document that's embedded at the POIFS level
Throws:
- IOException
- SAXException
- TikaException
 
- 
tryToGetMsgTitle
 
-