Class OutlookExtractor


  • public class OutlookExtractor
    extends Object
    Outlook Message Parser.
    • Field Detail

      • parentMetadata

        protected final org.apache.tika.metadata.Metadata parentMetadata
      • context

        protected final org.apache.tika.parser.ParseContext context
    • Constructor Detail

      • OutlookExtractor

        @Deprecated
        public OutlookExtractor​(org.apache.poi.poifs.filesystem.POIFSFileSystem filesystem,
                                org.apache.tika.parser.ParseContext context)
                         throws org.apache.tika.exception.TikaException
        Deprecated.
        Parameters:
        filesystem -
        context -
        Throws:
        org.apache.tika.exception.TikaException
      • OutlookExtractor

        @Deprecated
        public OutlookExtractor​(org.apache.poi.poifs.filesystem.DirectoryNode root,
                                org.apache.tika.parser.ParseContext context)
                         throws org.apache.tika.exception.TikaException
        Deprecated.
        Parameters:
        root -
        context -
        Throws:
        org.apache.tika.exception.TikaException
      • OutlookExtractor

        public OutlookExtractor​(org.apache.poi.poifs.filesystem.DirectoryNode root,
                                org.apache.tika.metadata.Metadata metadata,
                                org.apache.tika.parser.ParseContext context)
                         throws org.apache.tika.exception.TikaException
        Throws:
        org.apache.tika.exception.TikaException
    • Method Detail

      • addEvenIfNull

        public static void addEvenIfNull​(org.apache.tika.metadata.Property property,
                                         String value,
                                         org.apache.tika.metadata.Metadata metadata)
      • getMessageClass

        public static String getMessageClass​(String messageClass)
      • parse

        @Deprecated
        public void parse​(org.apache.tika.sax.XHTMLContentHandler xhtml,
                          org.apache.tika.metadata.Metadata metadata)
                   throws org.apache.tika.exception.TikaException,
                          SAXException,
                          IOException
        Deprecated.
        Use {@link #parse(XHTMLContentHandler)} instead; this method will be removed after 2.4.0.
        Parameters:
        xhtml -
        metadata -
        Throws:
        org.apache.tika.exception.TikaException
        SAXException
        IOException
      • getTikaConfig

        protected org.apache.tika.config.TikaConfig getTikaConfig()
      • getDetector

        protected org.apache.tika.detect.Detector getDetector()
      • getMimeTypes

        protected org.apache.tika.mime.MimeTypes getMimeTypes()
        Deprecated.
        Returns:
        mimetypes
      • getPassword

        protected String getPassword()
        Returns the password to be used for this file, or null if no password or the default password should be used.
      • handleEmbeddedResource

        protected void handleEmbeddedResource​(org.apache.tika.io.TikaInputStream resource,
                                              String filename,
                                              String relationshipID,
                                              String mediaType,
                                              org.apache.tika.sax.XHTMLContentHandler xhtml,
                                              boolean outputHtml)
                                       throws IOException,
                                              SAXException,
                                              org.apache.tika.exception.TikaException
        Throws:
        IOException
        SAXException
        org.apache.tika.exception.TikaException
      • handleEmbeddedResource

        protected void handleEmbeddedResource​(org.apache.tika.io.TikaInputStream resource,
                                              String filename,
                                              String relationshipID,
                                              org.apache.poi.hpsf.ClassID storageClassID,
                                              String mediaType,
                                              org.apache.tika.sax.XHTMLContentHandler xhtml,
                                              boolean outputHtml)
                                       throws IOException,
                                              SAXException,
                                              org.apache.tika.exception.TikaException
        Throws:
        IOException
        SAXException
        org.apache.tika.exception.TikaException
      • handleEmbeddedResource

        protected void handleEmbeddedResource​(org.apache.tika.io.TikaInputStream resource,
                                              org.apache.tika.metadata.Metadata embeddedMetadata,
                                              String filename,
                                              String relationshipID,
                                              org.apache.poi.hpsf.ClassID storageClassID,
                                              String mediaType,
                                              org.apache.tika.sax.XHTMLContentHandler xhtml,
                                              boolean outputHtml)
                                       throws IOException,
                                              SAXException,
                                              org.apache.tika.exception.TikaException
        Throws:
        IOException
        SAXException
        org.apache.tika.exception.TikaException
      • handleEmbeddedOfficeDoc

        protected void handleEmbeddedOfficeDoc​(org.apache.poi.poifs.filesystem.DirectoryEntry dir,
                                               org.apache.tika.sax.XHTMLContentHandler xhtml,
                                               boolean outputHtml)
                                        throws IOException,
                                               SAXException,
                                               org.apache.tika.exception.TikaException
        Handle an office document that's embedded at the POIFS level
        Throws:
        IOException
        SAXException
        org.apache.tika.exception.TikaException
      • handleEmbeddedOfficeDoc

        protected void handleEmbeddedOfficeDoc​(org.apache.poi.poifs.filesystem.DirectoryEntry dir,
                                               String resourceName,
                                               org.apache.tika.sax.XHTMLContentHandler xhtml,
                                               boolean outputHtml)
                                        throws IOException,
                                               SAXException,
                                               org.apache.tika.exception.TikaException
        Handle an office document that's embedded at the POIFS level
        Throws:
        IOException
        SAXException
        org.apache.tika.exception.TikaException