public abstract class AbstractOfficeParser extends AbstractParser
Intermediate layer to set OfficeParserConfig uniformly.

Constructor and Description |
---|
AbstractOfficeParser() |
Modifier and Type | Method and Description |
---|---|
void |
configure(ParseContext parseContext)
Checks to see if the user has specified an OfficeParserConfig. |
int |
getByteArrayMaxOverride() |
String |
getDateFormatOverride() |
boolean |
isConcatenatePhoneticRuns() |
boolean |
isExtractAllAlternativesFromMSG() |
boolean |
isExtractMacros() |
boolean |
isIncludeDeletedContent() |
boolean |
isIncludeHeadersAndFooters() |
boolean |
isIncludeMoveFromContent() |
boolean |
isIncludeShapeBasedContent() |
boolean |
isUseSAXDocxExtractor() |
boolean |
isUseSAXPptxExtractor() |
void |
setByteArrayMaxOverride(int maxOverride)
WARNING: this sets a static variable in POI.
|
void |
setConcatenatePhoneticRuns(boolean concatenatePhoneticRuns) |
void |
setDateFormatOverride(String format) |
void |
setExtractAllAlternativesFromMSG(boolean extractAllAlternativesFromMSG)
Some .msg files can contain body content in html, rtf and/or text.
|
void |
setExtractMacros(boolean extractMacros) |
void |
setIncludeDeletedContent(boolean includeDeletedConent) |
void |
setIncludeHeadersAndFooters(boolean includeHeadersAndFooters) |
void |
setIncludeMoveFromContent(boolean includeMoveFromContent) |
void |
setIncludeShapeBasedContent(boolean includeShapeBasedContent) |
void |
setUseSAXDocxExtractor(boolean useSAXDocxExtractor) |
void |
setUseSAXPptxExtractor(boolean useSAXPptxExtractor) |
Methods inherited from class AbstractParser: parse
Methods inherited from class java.lang.Object: clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
Methods inherited from interface Parser: getSupportedTypes, parse
public void configure(ParseContext parseContext)
Checks to see if the user has specified an OfficeParserConfig.
If so, no changes are made; if not, one is added to the context.
Parameters: parseContext -
public boolean isIncludeDeletedContent()
OfficeParserConfig.isIncludeDeletedContent()
@Field public void setIncludeDeletedContent(boolean includeDeletedConent)
public boolean isIncludeMoveFromContent()
OfficeParserConfig.isIncludeMoveFromContent()
@Field public void setIncludeMoveFromContent(boolean includeMoveFromContent)
public boolean isUseSAXDocxExtractor()
OfficeParserConfig.isUseSAXDocxExtractor()
@Field public void setUseSAXDocxExtractor(boolean useSAXDocxExtractor)
public boolean isExtractMacros()
OfficeParserConfig.isExtractMacros()
@Field public void setExtractMacros(boolean extractMacros)
@Field public void setIncludeShapeBasedContent(boolean includeShapeBasedContent)
public boolean isIncludeShapeBasedContent()
@Field public void setUseSAXPptxExtractor(boolean useSAXPptxExtractor)
public boolean isUseSAXPptxExtractor()
@Field public void setConcatenatePhoneticRuns(boolean concatenatePhoneticRuns)
public boolean isConcatenatePhoneticRuns()
public boolean isExtractAllAlternativesFromMSG()
@Field public void setExtractAllAlternativesFromMSG(boolean extractAllAlternativesFromMSG)
Parameters: extractAllAlternativesFromMSG - whether or not to extract all alternative parts from msg files
@Field public void setByteArrayMaxOverride(int maxOverride)
Parameters: maxOverride -
public int getByteArrayMaxOverride()
public String getDateFormatOverride()
@Field public void setIncludeHeadersAndFooters(boolean includeHeadersAndFooters)
public boolean isIncludeHeadersAndFooters()
Copyright © 2007–2022 The Apache Software Foundation. All rights reserved.