public class HSLFExtractor extends Object
Modifier and Type | Field and Description |
---|---|
protected ParseContext | context |
protected OfficeParserConfig | officeParserConfig |
protected Metadata | parentMetadata |
Constructor and Description |
---|
HSLFExtractor(ParseContext context, Metadata metadata) |
Modifier and Type | Method and Description |
---|---|
protected Detector | getDetector() |
protected MimeTypes | getMimeTypes()<br>Deprecated. Use embeddedDocumentUtil instead. |
protected String | getPassword()<br>Returns the password to be used for this file, or null if no password or the default password should be used. |
protected TikaConfig | getTikaConfig() |
protected void | handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml)<br>Handle an office document that's embedded at the POIFS level |
protected void | handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, XHTMLContentHandler xhtml, boolean outputHtml)<br>Handle an office document that's embedded at the POIFS level |
protected void | handleEmbeddedResource(TikaInputStream resource, Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) |
protected void | handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) |
protected void | handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) |
protected void | parse(org.apache.poi.poifs.filesystem.DirectoryNode root, XHTMLContentHandler xhtml) |
protected void | parse(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem, XHTMLContentHandler xhtml) |
protected final Metadata parentMetadata
protected final OfficeParserConfig officeParserConfig
protected final ParseContext context
public HSLFExtractor(ParseContext context, Metadata metadata)
protected void parse(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem, XHTMLContentHandler xhtml) throws IOException, SAXException, TikaException
Throws: IOException, SAXException, TikaException
protected void parse(org.apache.poi.poifs.filesystem.DirectoryNode root, XHTMLContentHandler xhtml) throws IOException, SAXException, TikaException
Throws: IOException, SAXException, TikaException
protected TikaConfig getTikaConfig()
protected Detector getDetector()
protected MimeTypes getMimeTypes()
Deprecated. Use embeddedDocumentUtil instead.
protected String getPassword()
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Throws: IOException, SAXException, TikaException
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Throws: IOException, SAXException, TikaException
protected void handleEmbeddedResource(TikaInputStream resource, Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Throws: IOException, SAXException, TikaException
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Throws: IOException, SAXException, TikaException
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Throws: IOException, SAXException, TikaException
Copyright © 2007–2023 The Apache Software Foundation. All rights reserved.