Package org.apache.tika.parser.microsoft
Class OutlookExtractor
java.lang.Object
org.apache.tika.parser.microsoft.OutlookExtractor
Outlook Message Parser.
-
Nested Class Summary
Nested Classes -
Field Summary
Fields (Modifier and Type | Field | Description):
protected final org.apache.tika.parser.ParseContext | context
protected final OfficeParserConfig | officeParserConfig
protected final org.apache.tika.metadata.Metadata | parentMetadata
-
Constructor Summary
Constructors (Constructor | Description):
OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, org.apache.tika.metadata.Metadata metadata, org.apache.tika.parser.ParseContext context)
OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, org.apache.tika.parser.ParseContext context) | Deprecated.
OutlookExtractor(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem, org.apache.tika.parser.ParseContext context) | Deprecated. Use OutlookExtractor(DirectoryNode, Metadata, ParseContext). Will be removed after 2.4.0.
-
Method Summary
Modifier and Type | Method | Description
static void | addEvenIfNull(org.apache.tika.metadata.Property property, String value, org.apache.tika.metadata.Metadata metadata)
protected org.apache.tika.detect.Detector | getDetector()
static String | getMessageClass(String messageClass)
protected org.apache.tika.mime.MimeTypes | getMimeTypes() | Deprecated.
protected String | getPassword() | Returns the password to be used for this file, or null if no / default password should be used
protected org.apache.tika.config.TikaConfig | getTikaConfig()
protected void | handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) | Handle an office document that's embedded at the POIFS level
protected void | handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) | Handle an office document that's embedded at the POIFS level
protected void | handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, String filename, String relationshipID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml)
protected void | handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml)
protected void | handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, org.apache.tika.metadata.Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml)
void | parse(org.apache.tika.sax.XHTMLContentHandler xhtml)
void | parse(org.apache.tika.sax.XHTMLContentHandler xhtml, org.apache.tika.metadata.Metadata metadata) | Deprecated. Use parse(XHTMLContentHandler); will be removed after 2.4.0.
-
Field Details
-
parentMetadata
protected final org.apache.tika.metadata.Metadata parentMetadata -
officeParserConfig
-
context
protected final org.apache.tika.parser.ParseContext context
-
-
Constructor Details
-
OutlookExtractor
@Deprecated public OutlookExtractor(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem, org.apache.tika.parser.ParseContext context) throws org.apache.tika.exception.TikaException Deprecated. Use OutlookExtractor(DirectoryNode, Metadata, ParseContext). Will be removed after 2.4.0. - Parameters:
filesystem - , context - - Throws:
org.apache.tika.exception.TikaException
-
OutlookExtractor
@Deprecated public OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, org.apache.tika.parser.ParseContext context) throws org.apache.tika.exception.TikaException Deprecated. Use OutlookExtractor(DirectoryNode, Metadata, ParseContext). Will be removed after 2.4.0. - Parameters:
root - , context - - Throws:
org.apache.tika.exception.TikaException
-
OutlookExtractor
public OutlookExtractor(org.apache.poi.poifs.filesystem.DirectoryNode root, org.apache.tika.metadata.Metadata metadata, org.apache.tika.parser.ParseContext context) throws org.apache.tika.exception.TikaException - Throws:
org.apache.tika.exception.TikaException
-
-
Method Details
-
addEvenIfNull
public static void addEvenIfNull(org.apache.tika.metadata.Property property, String value, org.apache.tika.metadata.Metadata metadata) -
getMessageClass
-
parse
public void parse(org.apache.tika.sax.XHTMLContentHandler xhtml) throws org.apache.tika.exception.TikaException, SAXException, IOException - Throws:
org.apache.tika.exception.TikaException, SAXException, IOException
-
parse
@Deprecated public void parse(org.apache.tika.sax.XHTMLContentHandler xhtml, org.apache.tika.metadata.Metadata metadata) throws org.apache.tika.exception.TikaException, SAXException, IOException Deprecated. Use parse(XHTMLContentHandler); will be removed after 2.4.0. - Parameters:
xhtml - , metadata - - Throws:
org.apache.tika.exception.TikaException, SAXException, IOException
-
getTikaConfig
protected org.apache.tika.config.TikaConfig getTikaConfig() -
getDetector
protected org.apache.tika.detect.Detector getDetector() -
getMimeTypes
protected org.apache.tika.mime.MimeTypes getMimeTypes() Deprecated. - Returns:
- mimetypes
-
getPassword
Returns the password to be used for this file, or null if no / default password should be used -
handleEmbeddedResource
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, String filename, String relationshipID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException - Throws:
IOException, SAXException, org.apache.tika.exception.TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException - Throws:
IOException, SAXException, org.apache.tika.exception.TikaException
-
handleEmbeddedResource
protected void handleEmbeddedResource(org.apache.tika.io.TikaInputStream resource, org.apache.tika.metadata.Metadata embeddedMetadata, String filename, String relationshipID, org.apache.poi.hpsf.ClassID storageClassID, String mediaType, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException - Throws:
IOException, SAXException, org.apache.tika.exception.TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException Handle an office document that's embedded at the POIFS level. - Throws:
IOException, SAXException, org.apache.tika.exception.TikaException
-
handleEmbeddedOfficeDoc
protected void handleEmbeddedOfficeDoc(org.apache.poi.poifs.filesystem.DirectoryEntry dir, String resourceName, org.apache.tika.sax.XHTMLContentHandler xhtml, boolean outputHtml) throws IOException, SAXException, org.apache.tika.exception.TikaException Handle an office document that's embedded at the POIFS level. - Throws:
IOException, SAXException, org.apache.tika.exception.TikaException
-
Use OutlookExtractor(DirectoryNode, Metadata, ParseContext). Will be removed after 2.4.0.