Package org.apache.tika.parser.microsoft
Class OutlookExtractor
java.lang.Object
org.apache.tika.parser.microsoft.OutlookExtractor
Outlook Message Parser.
-
Nested Class Summary
Nested Classes (Modifier and Type | Class | Description): static enum; static enum -
Field Summary
Fields (Modifier and Type | Field | Description): protected final ParseContext context; protected final OfficeParserConfig officeParserConfig; protected final Metadata parentMetadata -
Constructor Summary
Constructors (Constructor | Description): OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, Metadata metadata, ParseContext context) -
Method Summary
Modifier and Type | Method | Description
static void | addEvenIfNull(Property property, String value, Metadata metadata)
protected Detector | getDetector()
static String | getNormalizedMessageClass(String messageClass)
protected String | getPassword() | Returns the password to be used for this file, or null if no / default password should be used
protected TikaConfig | getTikaConfig()
protected void | handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) | Handle an office document that's embedded at the POIFS level
protected void | handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, Metadata metadata, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) | Handle an office document that's embedded at the POIFS level
protected void | handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, XHTMLContentHandler xhtml, boolean outputHtml) | Handle an office document that's embedded at the POIFS level
protected void | handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml)
protected void | handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml)
protected void | handleEmbeddedResource(TikaInputStream resource, Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml)
void | parse(XHTMLContentHandler xhtml)
static String | tryToGetMsgTitle(org.apache.poi.poifs.filesystem.DirectoryEntry node, String defaultVal)
-
Field Details
-
parentMetadata
-
officeParserConfig
-
context
-
-
Constructor Details
-
OutlookExtractor
public OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, Metadata metadata, ParseContext context) throws TikaException - Throws:
TikaException
-
-
Method Details
-
addEvenIfNull
-
getNormalizedMessageClass
-
parse
- Throws:
TikaException, SAXException, IOException
-
getTikaConfig
-
getDetector
-
getPassword
Returns the password to be used for this file, or null if no / default password should be used -
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException - Throws:
IOException, SAXException, TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException - Throws:
IOException, SAXException, TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(TikaInputStream resource, Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException - Throws:
IOException, SAXException, TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException. Handle an office document that's embedded at the POIFS level. - Throws:
IOException, SAXException, TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException. Handle an office document that's embedded at the POIFS level. - Throws:
IOException, SAXException, TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, Metadata metadata, String resourceName, XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, TikaException. Handle an office document that's embedded at the POIFS level. - Throws:
IOException, SAXException, TikaException
-
tryToGetMsgTitle
-