Package org.apache.tika.parser.microsoft
Class OutlookExtractor
- java.lang.Object
-
- org.apache.tika.parser.microsoft.OutlookExtractor
-
public class OutlookExtractor extends Object
Outlook Message Parser.
-
-
Nested Class Summary
Nested Classes Modifier and Type Class Description
static class OutlookExtractor.RECIPIENT_TYPE
-
Field Summary
Fields Modifier and Type Field Description
protected org.apache.tika.parser.ParseContext context
protected OfficeParserConfig officeParserConfig
protected org.apache.tika.metadata.Metadata parentMetadata
-
Constructor Summary
Constructors Constructor Description
OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, org.apache.tika.metadata.Metadata metadata, org.apache.tika.parser.ParseContext context)
OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, org.apache.tika.parser.ParseContext context) Deprecated. Use OutlookExtractor(DirectoryNode, Metadata, ParseContext). Will be removed after 2.4.0.
OutlookExtractor(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem, org.apache.tika.parser.ParseContext context) Deprecated. Use OutlookExtractor(DirectoryNode, Metadata, ParseContext). Will be removed after 2.4.0.
-
Method Summary
All Methods Static Methods Instance Methods Concrete Methods Deprecated Methods
Modifier and Type Method Description
static void addEvenIfNull(org.apache.tika.metadata.Property property, String value, org.apache.tika.metadata.Metadata metadata)
protected org.apache.tika.detect.Detector getDetector()
static String getMessageClass(String messageClass)
protected org.apache.tika.mime.MimeTypes getMimeTypes() Deprecated.
protected String getPassword() Returns the password to be used for this file, or null if no / default password should be used
protected org.apache.tika.config.TikaConfig getTikaConfig()
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) Handle an office document that's embedded at the POIFS level
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) Handle an office document that's embedded at the POIFS level
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, String filename, String relationshipID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml)
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml)
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, org.apache.tika.metadata.Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml)
void parse(org.apache.tika.sax.XHTMLContentHandler xhtml)
void parse(org.apache.tika.sax.XHTMLContentHandler xhtml, org.apache.tika.metadata.Metadata metadata) Deprecated. Use parse(XHTMLContentHandler) instead; will be removed after 2.4.0.
-
-
-
Field Detail
-
parentMetadata
protected final org.apache.tika.metadata.Metadata parentMetadata
-
officeParserConfig
protected final OfficeParserConfig officeParserConfig
-
context
protected final org.apache.tika.parser.ParseContext context
-
-
Constructor Detail
-
OutlookExtractor
@Deprecated public OutlookExtractor(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem, org.apache.tika.parser.ParseContext context) throws org.apache.tika.exception.TikaException
Deprecated. Use OutlookExtractor(DirectoryNode, Metadata, ParseContext). Will be removed after 2.4.0.
- Parameters:
filesystem -
context -
- Throws:
org.apache.tika.exception.TikaException
-
OutlookExtractor
@Deprecated public OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, org.apache.tika.parser.ParseContext context) throws org.apache.tika.exception.TikaException
Deprecated. Use OutlookExtractor(DirectoryNode, Metadata, ParseContext). Will be removed after 2.4.0.
- Parameters:
root -
context -
- Throws:
org.apache.tika.exception.TikaException
-
OutlookExtractor
public OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, org.apache.tika.metadata.Metadata metadata, org.apache.tika.parser.ParseContext context) throws org.apache.tika.exception.TikaException
- Throws:
org.apache.tika.exception.TikaException
-
-
Method Detail
-
addEvenIfNull
public static void addEvenIfNull(org.apache.tika.metadata.Property property, String value, org.apache.tika.metadata.Metadata metadata)
-
parse
public void parse(org.apache.tika.sax.XHTMLContentHandler xhtml) throws org.apache.tika.exception.TikaException, SAXException, IOException
- Throws:
org.apache.tika.exception.TikaException
SAXException
IOException
-
parse
@Deprecated public void parse(org.apache.tika.sax.XHTMLContentHandler xhtml, org.apache.tika.metadata.Metadata metadata) throws org.apache.tika.exception.TikaException, SAXException, IOException
Deprecated. Use parse(XHTMLContentHandler) instead; will be removed after 2.4.0.
- Parameters:
xhtml -
metadata -
- Throws:
org.apache.tika.exception.TikaException
SAXException
IOException
-
getTikaConfig
protected org.apache.tika.config.TikaConfig getTikaConfig()
-
getDetector
protected org.apache.tika.detect.Detector getDetector()
-
getMimeTypes
protected org.apache.tika.mime.MimeTypes getMimeTypes()
Deprecated.
- Returns:
mimetypes
-
getPassword
protected String getPassword()
Returns the password to be used for this file, or null if no / default password should be used
-
handleEmbeddedResource
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, String filename, String relationshipID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException
- Throws:
IOException
SAXException
org.apache.tika.exception.TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException
- Throws:
IOException
SAXException
org.apache.tika.exception.TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, org.apache.tika.metadata.Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException
- Throws:
IOException
SAXException
org.apache.tika.exception.TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException
Handle an office document that's embedded at the POIFS level
- Throws:
IOException
SAXException
org.apache.tika.exception.TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException
Handle an office document that's embedded at the POIFS level
- Throws:
IOException
SAXException
org.apache.tika.exception.TikaException
-
-