Package org.apache.tika.parser.microsoft
Class OutlookExtractor
- java.lang.Object
-
- org.apache.tika.parser.microsoft.OutlookExtractor
-
public class OutlookExtractor extends Object
Outlook Message Parser.
-
-
Nested Class Summary
Nested Classes
Modifier and Type | Class | Description
static class
OutlookExtractor.RECIPIENT_TYPE
-
Field Summary
Fields
Modifier and Type | Field | Description
protected ParseContext
context
protected OfficeParserConfig
officeParserConfig
protected Metadata
parentMetadata
-
Constructor Summary
Constructors
Constructor | Description
OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, Metadata metadata, ParseContext context)
OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, ParseContext context)
Deprecated. Use OutlookExtractor(DirectoryNode, Metadata, ParseContext).
Will be removed after 2.4.0.
OutlookExtractor(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem, ParseContext context)
Deprecated. Use OutlookExtractor(DirectoryNode, Metadata, ParseContext).
Will be removed after 2.4.0.
-
Method Summary
All Methods | Static Methods | Instance Methods | Concrete Methods | Deprecated Methods
Modifier and Type | Method | Description
static void
addEvenIfNull(Property property, String value, Metadata metadata)
protected Detector
getDetector()
static String
getMessageClass(String messageClass)
protected MimeTypes
getMimeTypes()
Deprecated.
protected String
getPassword()
Returns the password to be used for this file, or null if no / default password should be used.
protected TikaConfig
getTikaConfig()
protected void
handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml)
Handle an office document that's embedded at the POIFS level.
protected void
handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, XHTMLContentHandler xhtml, boolean outputHtml)
Handle an office document that's embedded at the POIFS level.
protected void
handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml)
protected void
handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml)
protected void
handleEmbeddedResource(TikaInputStream resource, Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml)
void
parse(XHTMLContentHandler xhtml)
void
parse(XHTMLContentHandler xhtml, Metadata metadata)
Deprecated. Use parse(XHTMLContentHandler) instead; will be removed after 2.4.0.
-
-
-
Field Detail
-
parentMetadata
protected final Metadata parentMetadata
-
officeParserConfig
protected final OfficeParserConfig officeParserConfig
-
context
protected final ParseContext context
-
-
Constructor Detail
-
OutlookExtractor
@Deprecated public OutlookExtractor(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem, ParseContext context) throws TikaException
Deprecated. Use OutlookExtractor(DirectoryNode, Metadata, ParseContext).
Will be removed after 2.4.0.
- Parameters:
filesystem -
context -
- Throws:
TikaException
-
OutlookExtractor
@Deprecated public OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, ParseContext context) throws TikaException
Deprecated. Use OutlookExtractor(DirectoryNode, Metadata, ParseContext).
Will be removed after 2.4.0.
- Parameters:
root -
context -
- Throws:
TikaException
-
OutlookExtractor
public OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, Metadata metadata, ParseContext context) throws TikaException
- Throws:
TikaException
-
-
Method Detail
-
parse
public void parse(XHTMLContentHandler xhtml) throws TikaException, SAXException, IOException
- Throws:
TikaException
SAXException
IOException
-
parse
@Deprecated public void parse(XHTMLContentHandler xhtml, Metadata metadata) throws TikaException, SAXException, IOException
Deprecated. Use parse(XHTMLContentHandler) instead; will be removed after 2.4.0.
- Parameters:
xhtml -
metadata -
- Throws:
TikaException
SAXException
IOException
-
getTikaConfig
protected TikaConfig getTikaConfig()
-
getDetector
protected Detector getDetector()
-
getMimeTypes
protected MimeTypes getMimeTypes()
Deprecated.
- Returns:
- mimetypes
-
getPassword
protected String getPassword()
Returns the password to be used for this file, or null if no / default password should be used
-
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
- Throws:
IOException
SAXException
TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
- Throws:
IOException
SAXException
TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
- Throws:
IOException
SAXException
TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Handle an office document that's embedded at the POIFS level.
- Throws:
IOException
SAXException
TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Handle an office document that's embedded at the POIFS level.
- Throws:
IOException
SAXException
TikaException
-
-