Package org.apache.tika.parser.microsoft
Class OutlookExtractor
- java.lang.Object
-
- org.apache.tika.parser.microsoft.OutlookExtractor
-
public class OutlookExtractor extends Object
Outlook Message Parser.
-
-
Nested Class Summary
Nested Classes
Modifier and Type / Class / Description
static class OutlookExtractor.RECIPIENT_TYPE
-
Field Summary
Fields
Modifier and Type / Field / Description
protected org.apache.tika.parser.ParseContext context
protected OfficeParserConfig officeParserConfig
protected org.apache.tika.metadata.Metadata parentMetadata
-
Constructor Summary
Constructors Constructor Description OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, org.apache.tika.metadata.Metadata metadata, org.apache.tika.parser.ParseContext context)
-
Method Summary
All Methods / Static Methods / Instance Methods / Concrete Methods
Modifier and Type / Method / Description
static void addEvenIfNull(org.apache.tika.metadata.Property property, String value, org.apache.tika.metadata.Metadata metadata)
protected org.apache.tika.detect.Detector getDetector()
static String getMessageClass(String messageClass)
protected String getPassword() — Returns the password to be used for this file, or null if no / default password should be used
protected org.apache.tika.config.TikaConfig getTikaConfig()
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) — Handle an office document that's embedded at the POIFS level
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) — Handle an office document that's embedded at the POIFS level
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, String filename, String relationshipID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml)
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml)
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, org.apache.tika.metadata.Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml)
void parse(org.apache.tika.sax.XHTMLContentHandler xhtml)
static String tryToGetMsgTitle(org.apache.poi.poifs.filesystem.DirectoryEntry node, String defaultVal)
-
-
-
Field Detail
-
parentMetadata
protected final org.apache.tika.metadata.Metadata parentMetadata
-
officeParserConfig
protected final OfficeParserConfig officeParserConfig
-
context
protected final org.apache.tika.parser.ParseContext context
-
-
Method Detail
-
addEvenIfNull
public static void addEvenIfNull(org.apache.tika.metadata.Property property, String value, org.apache.tika.metadata.Metadata metadata)
-
parse
public void parse(org.apache.tika.sax.XHTMLContentHandler xhtml) throws org.apache.tika.exception.TikaException, SAXException, IOException
Throws:
org.apache.tika.exception.TikaException
SAXException
IOException
-
getTikaConfig
protected org.apache.tika.config.TikaConfig getTikaConfig()
-
getDetector
protected org.apache.tika.detect.Detector getDetector()
-
getPassword
protected String getPassword()
Returns the password to be used for this file, or null if no / default password should be used
-
handleEmbeddedResource
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, String filename, String relationshipID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException
Throws:
IOException
SAXException
org.apache.tika.exception.TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException
Throws:
IOException
SAXException
org.apache.tika.exception.TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, org.apache.tika.metadata.Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException
Throws:
IOException
SAXException
org.apache.tika.exception.TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException
Handle an office document that's embedded at the POIFS level
Throws:
IOException
SAXException
org.apache.tika.exception.TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException
Handle an office document that's embedded at the POIFS level
Throws:
IOException
SAXException
org.apache.tika.exception.TikaException
-
-