|
||||||||||
PREV NEXT | FRAMES NO FRAMES |
Uses of Metadata in org.apache.tika |
---|
Methods in org.apache.tika with parameters of type Metadata | |
---|---|
java.lang.String |
Tika.detect(java.io.InputStream stream,
Metadata metadata)
Detects the media type of the given document. |
java.io.Reader |
Tika.parse(java.io.InputStream stream,
Metadata metadata)
Parses the given document and returns the extracted text content. |
java.lang.String |
Tika.parseToString(java.io.InputStream stream,
Metadata metadata)
Parses the given document and returns the extracted text content. |
Uses of Metadata in org.apache.tika.detect |
---|
Methods in org.apache.tika.detect with parameters of type Metadata | |
---|---|
MediaType |
ZipContainerDetector.detect(java.io.InputStream input,
Metadata metadata)
|
MediaType |
POIFSContainerDetector.detect(java.io.InputStream input,
Metadata metadata)
|
MediaType |
ContainerDetector.detect(java.io.InputStream input,
Metadata metadata)
Detect on the generic input stream, if possible. |
MediaType |
ContainerAwareDetector.detect(java.io.InputStream input,
Metadata metadata)
|
MediaType |
TypeDetector.detect(java.io.InputStream input,
Metadata metadata)
Detects the content type of an input document based on a type hint given in the input metadata. |
MediaType |
TextDetector.detect(java.io.InputStream input,
Metadata metadata)
Looks at the beginning of the document input stream to determine whether the document is text or not. |
MediaType |
NameDetector.detect(java.io.InputStream input,
Metadata metadata)
Detects the content type of an input document based on the document name given in the input metadata. |
MediaType |
MagicDetector.detect(java.io.InputStream input,
Metadata metadata)
|
MediaType |
Detector.detect(java.io.InputStream input,
Metadata metadata)
Detects the content type of the given input document. |
MediaType |
CompositeDetector.detect(java.io.InputStream input,
Metadata metadata)
|
MediaType |
ZipContainerDetector.detect(TikaInputStream input,
Metadata metadata)
|
MediaType |
POIFSContainerDetector.detect(TikaInputStream stream,
Metadata metadata)
|
MediaType |
ContainerDetector.detect(TikaInputStream input,
Metadata metadata)
Does full, container aware detection for the file of the appropriate container type. |
MediaType |
ContainerAwareDetector.detect(TikaInputStream input,
Metadata metadata)
|
Uses of Metadata in org.apache.tika.extractor |
---|
Methods in org.apache.tika.extractor with parameters of type Metadata | |
---|---|
void |
EmbeddedDocumentExtractor.parseEmbedded(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
boolean outputHtml)
Processes the supplied embedded resource, calling the delegating parser with the appropriate details. |
boolean |
DocumentSelector.select(Metadata metadata)
Checks if a document with the given metadata matches the specified selection criteria. |
boolean |
EmbeddedDocumentExtractor.shouldParseEmbedded(Metadata metadata)
|
Uses of Metadata in org.apache.tika.fork |
---|
Methods in org.apache.tika.fork with parameters of type Metadata | |
---|---|
void |
ForkParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.gui |
---|
Methods in org.apache.tika.gui with parameters of type Metadata | |
---|---|
void |
TikaGUI.importStream(java.io.InputStream input,
Metadata md)
|
Uses of Metadata in org.apache.tika.io |
---|
Methods in org.apache.tika.io with parameters of type Metadata | |
---|---|
static TikaInputStream |
TikaInputStream.get(java.sql.Blob blob,
Metadata metadata)
Creates a TikaInputStream from the given database BLOB. |
static TikaInputStream |
TikaInputStream.get(byte[] data,
Metadata metadata)
Creates a TikaInputStream from the given array of bytes. |
static TikaInputStream |
TikaInputStream.get(java.io.File file,
Metadata metadata)
Creates a TikaInputStream from the given file. |
static TikaInputStream |
TikaInputStream.get(java.net.URI uri,
Metadata metadata)
Creates a TikaInputStream from the resource at the given URI. |
static TikaInputStream |
TikaInputStream.get(java.net.URL url,
Metadata metadata)
Creates a TikaInputStream from the resource at the given URL. |
Uses of Metadata in org.apache.tika.metadata |
---|
Methods in org.apache.tika.metadata with parameters of type Metadata | |
---|---|
static java.io.InputStream |
MetadataHelper.getInputStream(java.net.URL url,
Metadata metadata)
Deprecated. Returns the content at the given URL, and sets any related metadata entries. |
Uses of Metadata in org.apache.tika.mime |
---|
Methods in org.apache.tika.mime with parameters of type Metadata | |
---|---|
MediaType |
MimeTypes.detect(java.io.InputStream input,
Metadata metadata)
Automatically detects the MIME type of a document based on magic markers in the stream prefix and any given metadata hints. |
Uses of Metadata in org.apache.tika.parser |
---|
Methods in org.apache.tika.parser with parameters of type Metadata | |
---|---|
protected Parser |
CompositeParser.getParser(Metadata metadata)
Returns the parser that best matches the given metadata. |
protected Parser |
CompositeParser.getParser(Metadata metadata,
ParseContext context)
|
void |
ParserDecorator.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
Parser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
ExternalParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
ErrorParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
EmptyParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
DelegatingParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
CompositeParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
AutoDetectParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
|
void |
ParserPostProcessor.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
Forwards the call to the delegated parser and post-processes the results as described above. |
void |
ParserDecorator.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
Delegates the method call to the decorated parser. |
void |
Parser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
Parses a document stream into a sequence of XHTML SAX events. |
void |
ExternalParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
Executes the configured external command and passes the given document stream as a simple XHTML document to the given SAX content handler. |
void |
ErrorParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
void |
EmptyParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
void |
DelegatingParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
Looks up the delegate parser from the parsing context and delegates the parse operation to it. |
void |
CompositeParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
Delegates the call to the matching component parser. |
void |
AutoDetectParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Constructors in org.apache.tika.parser with parameters of type Metadata | |
---|---|
ParsingReader(Parser parser,
java.io.InputStream stream,
Metadata metadata)
Deprecated. This constructor will be removed in Apache Tika 1.0. |
|
ParsingReader(Parser parser,
java.io.InputStream stream,
Metadata metadata,
java.util.concurrent.Executor executor)
Deprecated. This constructor will be removed in Apache Tika 1.0. |
|
ParsingReader(Parser parser,
java.io.InputStream stream,
Metadata metadata,
ParseContext context)
Creates a reader for the text content of the given binary stream with the given document metadata. |
|
ParsingReader(Parser parser,
java.io.InputStream stream,
Metadata metadata,
ParseContext context,
java.util.concurrent.Executor executor)
Creates a reader for the text content of the given binary stream with the given document metadata. |
Uses of Metadata in org.apache.tika.parser.asm |
---|
Methods in org.apache.tika.parser.asm with parameters of type Metadata | |
---|---|
void |
ClassParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
ClassParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.audio |
---|
Methods in org.apache.tika.parser.audio with parameters of type Metadata | |
---|---|
void |
MidiParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
AudioParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
MidiParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
void |
AudioParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.dwg |
---|
Methods in org.apache.tika.parser.dwg with parameters of type Metadata | |
---|---|
void |
DWGParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
|
void |
DWGParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.epub |
---|
Methods in org.apache.tika.parser.epub with parameters of type Metadata | |
---|---|
void |
EpubParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
EpubContentParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
EpubParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
void |
EpubContentParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.feed |
---|
Methods in org.apache.tika.parser.feed with parameters of type Metadata | |
---|---|
void |
FeedParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
|
void |
FeedParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.font |
---|
Methods in org.apache.tika.parser.font with parameters of type Metadata | |
---|---|
void |
TrueTypeParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
TrueTypeParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.hdf |
---|
Methods in org.apache.tika.parser.hdf with parameters of type Metadata | |
---|---|
void |
HDFParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
|
void |
HDFParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
protected void |
HDFParser.unravelStringMet(ucar.nc2.NetcdfFile ncFile,
ucar.nc2.Group group,
Metadata met)
|
Uses of Metadata in org.apache.tika.parser.html |
---|
Methods in org.apache.tika.parser.html with parameters of type Metadata | |
---|---|
void |
HtmlParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
HtmlParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.image |
---|
Methods in org.apache.tika.parser.image with parameters of type Metadata | |
---|---|
static void |
ImageMetadataExtractor.handleCommonImageTags(Metadata metadata,
com.drew.metadata.Tag tag,
com.drew.metadata.Directory directory)
Maps common TIFF and EXIF tags onto the Tika TIFF image metadata namespace. |
static void |
ImageMetadataExtractor.handleGeoImageTags(Metadata metadata)
Maps EXIF Geo Tags onto the Tika Geo metadata namespace. |
void |
TiffParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
ImageParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
TiffParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
void |
ImageParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Constructors in org.apache.tika.parser.image with parameters of type Metadata | |
---|---|
ImageMetadataExtractor(Metadata metadata)
|
Uses of Metadata in org.apache.tika.parser.iwork |
---|
Methods in org.apache.tika.parser.iwork with parameters of type Metadata | |
---|---|
void |
IWorkParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
IWorkPackageParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
IWorkParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
void |
IWorkPackageParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.jpeg |
---|
Methods in org.apache.tika.parser.jpeg with parameters of type Metadata | |
---|---|
void |
JpegParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
JpegParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.mbox |
---|
Methods in org.apache.tika.parser.mbox with parameters of type Metadata | |
---|---|
void |
MboxParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
|
void |
MboxParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.microsoft |
---|
Methods in org.apache.tika.parser.microsoft with parameters of type Metadata | |
---|---|
void |
OfficeParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
OfficeParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
Extracts properties and text from an MS Document input stream. |
void |
OutlookExtractor.parse(XHTMLContentHandler xhtml,
Metadata metadata)
|
Uses of Metadata in org.apache.tika.parser.microsoft.ooxml |
---|
Methods in org.apache.tika.parser.microsoft.ooxml with parameters of type Metadata | |
---|---|
void |
MetadataExtractor.extract(Metadata metadata)
|
void |
OOXMLExtractor.getXHTML(org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
Parses the document into a sequence of XHTML SAX events sent to the given content handler. |
void |
AbstractOOXMLExtractor.getXHTML(org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
void |
OOXMLParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
OOXMLParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
static void |
OOXMLExtractorFactory.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.mp3 |
---|
Methods in org.apache.tika.parser.mp3 with parameters of type Metadata | |
---|---|
void |
Mp3Parser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
Mp3Parser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.netcdf |
---|
Methods in org.apache.tika.parser.netcdf with parameters of type Metadata | |
---|---|
void |
NetCDFParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
|
void |
NetCDFParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.odf |
---|
Methods in org.apache.tika.parser.odf with parameters of type Metadata | |
---|---|
protected org.xml.sax.ContentHandler |
OpenDocumentMetaParser.getContentHandler(org.xml.sax.ContentHandler ch,
Metadata md)
|
void |
OpenDocumentParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
OpenDocumentContentParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
OpenDocumentParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
void |
OpenDocumentContentParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.pdf |
---|
Methods in org.apache.tika.parser.pdf with parameters of type Metadata | |
---|---|
void |
PDFParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
PDFParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.pkg |
---|
Methods in org.apache.tika.parser.pkg with parameters of type Metadata | |
---|---|
void |
PackageParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
PackageParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.rtf |
---|
Methods in org.apache.tika.parser.rtf with parameters of type Metadata | |
---|---|
void |
RTFParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
RTFParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.txt |
---|
Methods in org.apache.tika.parser.txt with parameters of type Metadata | |
---|---|
void |
TXTParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
TXTParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.video |
---|
Methods in org.apache.tika.parser.video with parameters of type Metadata | |
---|---|
void |
FLVParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
|
void |
FLVParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Uses of Metadata in org.apache.tika.parser.xml |
---|
Methods in org.apache.tika.parser.xml with parameters of type Metadata | |
---|---|
protected org.xml.sax.ContentHandler |
XMLParser.getContentHandler(org.xml.sax.ContentHandler handler,
Metadata metadata)
|
protected org.xml.sax.ContentHandler |
DcXMLParser.getContentHandler(org.xml.sax.ContentHandler ch,
Metadata md)
|
void |
XMLParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata)
Deprecated. This method will be removed in Apache Tika 1.0. |
void |
XMLParser.parse(java.io.InputStream stream,
org.xml.sax.ContentHandler handler,
Metadata metadata,
ParseContext context)
|
Constructors in org.apache.tika.parser.xml with parameters of type Metadata | |
---|---|
AttributeDependantMetadataHandler(Metadata metadata,
java.lang.String nameHoldingAttribute,
java.lang.String namePrefix)
|
|
MetadataHandler(Metadata metadata,
java.lang.String name)
|
Uses of Metadata in org.apache.tika.sax |
---|
Constructors in org.apache.tika.sax with parameters of type Metadata | |
---|---|
XHTMLContentHandler(org.xml.sax.ContentHandler handler,
Metadata metadata)
|
|
||||||||||
PREV NEXT | FRAMES NO FRAMES |