Package org.apache.tika.parser.microsoft
Class OutlookExtractor
- java.lang.Object
-
- org.apache.tika.parser.microsoft.OutlookExtractor
-
public class OutlookExtractor extends Object
Outlook Message Parser.
-
-
Nested Class Summary
Nested Classes Modifier and Type Class Description
static class OutlookExtractor.BODY_TYPES_PROCESSED
static class OutlookExtractor.RECIPIENT_TYPE
-
Field Summary
Fields Modifier and Type Field Description
protected ParseContext context
protected OfficeParserConfig officeParserConfig
protected Metadata parentMetadata
-
Constructor Summary
Constructors Constructor Description OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, Metadata metadata, ParseContext context)
-
Method Summary
All Methods Static Methods Instance Methods Concrete Methods Modifier and Type Method Description
static void addEvenIfNull(Property property, String value, Metadata metadata)
protected Detector getDetector()
static String getNormalizedMessageClass(String messageClass)
protected String getPassword() Returns the password to be used for this file, or null if no / default password should be used
protected TikaConfig getTikaConfig()
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) Handle an office document that's embedded at the POIFS level
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, Metadata metadata, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) Handle an office document that's embedded at the POIFS level
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, XHTMLContentHandler xhtml, boolean outputHtml) Handle an office document that's embedded at the POIFS level
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml)
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml)
protected void handleEmbeddedResource(TikaInputStream resource, Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml)
void parse(XHTMLContentHandler xhtml)
static String tryToGetMsgTitle(org.apache.poi.poifs.filesystem.DirectoryEntry node, String defaultVal)
-
-
-
Field Detail
-
parentMetadata
protected final Metadata parentMetadata
-
officeParserConfig
protected final OfficeParserConfig officeParserConfig
-
context
protected final ParseContext context
-
-
Constructor Detail
-
OutlookExtractor
public OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, Metadata metadata, ParseContext context) throws TikaException
- Throws:
TikaException
-
-
Method Detail
-
parse
public void parse(XHTMLContentHandler xhtml) throws TikaException, SAXException, IOException
- Throws:
TikaException, SAXException, IOException
-
getTikaConfig
protected TikaConfig getTikaConfig()
-
getDetector
protected Detector getDetector()
-
getPassword
protected String getPassword()
Returns the password to be used for this file, or null if no / default password should be used
-
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
- Throws:
IOException, SAXException, TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
- Throws:
IOException, SAXException, TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
- Throws:
IOException, SAXException, TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Handle an office document that's embedded at the POIFS level
- Throws:
IOException, SAXException, TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Handle an office document that's embedded at the POIFS level
- Throws:
IOException, SAXException, TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, Metadata metadata, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException
Handle an office document that's embedded at the POIFS level
- Throws:
IOException, SAXException, TikaException
-
-