boolean needToCheck
boolean allowAccessibility
PDFParserConfig defaultConfig
Set<String> userConfigured
boolean enableAutoSpace
boolean suppressDuplicateOverlappingText
boolean extractAnnotationText
boolean sortByPosition
boolean extractAcroFormContent
boolean extractBookmarksText
boolean extractInlineImages
boolean extractInlineImageMetadataOnly
boolean extractUniqueInlineImagesOnly
boolean extractMarkedContent
Float averageCharTolerance
Float spacingTolerance
float dropThreshold
boolean ifXFAExtractOnlyXFA
PDFParserConfig.OCR_STRATEGY ocrStrategy
PDFParserConfig.OCRStrategyAuto ocrStrategyAuto
PDFParserConfig.OCR_RENDERING_STRATEGY ocrRenderingStrategy
int ocrDPI
org.apache.pdfbox.rendering.ImageType ocrImageType
String ocrImageFormatName
float ocrImageQuality
AccessChecker accessChecker
boolean catchIntermediateIOExceptions
boolean extractActions
boolean extractFontNames
long maxMainMemoryBytes
boolean setKCMS
boolean detectAngles
float unmappedUnicodeCharsPerPage
int totalCharsPerPage
Copyright © 2007–2021 The Apache Software Foundation. All rights reserved.