Package org.apache.tika.eval.core.util
Class ContentTagParser
- java.lang.Object
-
- org.apache.tika.eval.core.util.ContentTagParser
-
public class ContentTagParser extends Object
-
-
Constructor Summary
Constructors
Constructor | Description
ContentTagParser() | (no description)
-
Method Summary
All Methods | Static Methods | Concrete Methods
Modifier and Type | Method | Description
static ContentTags | parseHTML(String html, Set<String> uppercaseTagsOfInterest) | (no description)
static ContentTags | parseXML(String html, Set<String> uppercaseTagsOfInterest) | (no description)
-
-
-
Method Detail
-
parseXML
public static ContentTags parseXML(String html, Set<String> uppercaseTagsOfInterest) throws TikaException, IOException, SAXException
- Throws:
TikaException
IOException
SAXException
-
parseHTML
public static ContentTags parseHTML(String html, Set<String> uppercaseTagsOfInterest) throws SAXException, IOException
- Throws:
SAXException
IOException
-
-