Class Page

All Implemented Interfaces:
Shape, Serializable, Cloneable

public class Page extends Rectangle
See Also:
  • Serialized Form
  • Constructor Details

    • Page

      @Deprecated public Page(float top, float left, float width, float height, int rotation, int number, org.apache.pdfbox.pdmodel.PDPage pdPage, org.apache.pdfbox.pdmodel.PDDocument doc)
      Deprecated.
      Use Page.Builder instead.
    • Page

      public Page(float top, float left, float width, float height, int rotation, int number, org.apache.pdfbox.pdmodel.PDPage pdPage, org.apache.pdfbox.pdmodel.PDDocument doc, List<TextElement> characters, List<Ruling> rulings)
      Deprecated.
      Use Page.Builder instead.
    • Page

      public Page(float top, float left, float width, float height, int rotation, int number, org.apache.pdfbox.pdmodel.PDPage pdPage, org.apache.pdfbox.pdmodel.PDDocument doc, technology.tabula.ObjectExtractorStreamEngine streamEngine, TextStripper textStripper)
      Deprecated.
      Use Page.Builder instead.
    • Page

      public Page(float top, float left, float width, float height, int rotation, int number, org.apache.pdfbox.pdmodel.PDPage pdPage, org.apache.pdfbox.pdmodel.PDDocument doc, List<TextElement> characters, List<Ruling> rulings, float minCharWidth, float minCharHeight, RectangleSpatialIndex<TextElement> index)
      Deprecated.
      Use Page.Builder instead.
  • Method Details

    • getArea

      public Page getArea(Rectangle area)
    • getArea

      public Page getArea(float top, float left, float bottom, float right)
    • getRotation

      public Integer getRotation()
    • getPageNumber

      public int getPageNumber()
    • getMinCharWidth

      @Deprecated public float getMinCharWidth()
      Deprecated.
      There is no replacement.
    • getMinCharHeight

      @Deprecated public float getMinCharHeight()
      Deprecated.
      There is no replacement.
    • getText

      public List<TextElement> getText()
    • getText

      public List<TextElement> getText(Rectangle area)
    • getText

      @Deprecated public List<TextElement> getText(float top, float left, float bottom, float right)
      Deprecated.
      Use getText(Rectangle) instead.
    • getTexts

      @Deprecated public List<TextElement> getTexts()
      Deprecated.
      Use getText() instead.
    • getTextBounds

      public Rectangle getTextBounds()
      Returns the minimum bounding box that contains all the TextElements on this Page.
    • hasText

      @Deprecated public boolean hasText()
      Deprecated.
      There is no replacement.
    • getRulings

      public List<Ruling> getRulings()
    • getVerticalRulings

      public List<Ruling> getVerticalRulings()
    • getHorizontalRulings

      public List<Ruling> getHorizontalRulings()
    • addRuling

      public void addRuling(Ruling ruling)
    • getUnprocessedRulings

      public List<Ruling> getUnprocessedRulings()
    • getPDPage

      public org.apache.pdfbox.pdmodel.PDPage getPDPage()
    • getPDDoc

      public org.apache.pdfbox.pdmodel.PDDocument getPDDoc()
    • getSpatialIndex

      @Deprecated public RectangleSpatialIndex<TextElement> getSpatialIndex()
      Deprecated.
      There is no replacement.