public class ConvertTextExtractor extends DocumentProcessor implements com.exalead.util.Checkable, java.io.Serializable
DocumentProcessor.FromDataModel, DocumentProcessor.Transformer<T>
acceptCondition, dataModelClass, dataModelProperty, dataModelState, DEFAULT_DISABLED, disabled, fromDataModel, name
Constructor and Description |
---|
ConvertTextExtractor() |
ConvertTextExtractor(ConvertTextExtractor o)
Copy constructor
|
Modifier and Type | Method and Description |
---|---|
<T> T |
accept(DocumentProcessor.Transformer<T> transformer,
T[] t) |
void |
check(boolean deep,
java.lang.String errorContext)
Checks this ConvertTextExtractor.
|
static ConvertTextExtractor |
fromString(java.lang.String s)
Creates a ConvertTextExtractor from its String representation.
|
java.lang.String |
getAttachments()
Includes embedded attachments
("true", "false", "optional") |
java.lang.String |
getEmbedded()
Includes embedded images
("true", "false", "optional") |
java.lang.String |
getFilter()
Native filter identifier list to be used specifically.
|
java.lang.String |
getHttpProxyUrl()
Optional HTTP proxy URL.
The URL can embed credentials if required. |
java.util.List<KeyValue> |
getKeyValue() |
long |
getMaxInputSizeKB()
Maximum document size accepted, in kilobytes.
|
long |
getMaxOutputSizeKB()
Maximum output size on the remote side, in kilobytes.
If the generated output exceeds this value, the document may be truncated or invalid. |
long |
getMaxPages()
Maximum number of pages to process for xml conversion (may be ignored).
|
int |
getMaxRecursionDepth()
Maximum recursion depth.
|
int |
getMaxRecursionDocuments()
Maximum number of documents that can be converted in one directory level.
|
int |
getMaxRecursionDocumentsTotal()
Maximum number of documents that can be converted over all levels.
|
long |
getMinInputSizeKB()
Minimum document size accepted, in kilobytes.
|
java.lang.String |
getOcr()
Converts using OCR
("true", "false", "optional") |
java.lang.String |
getOcrDetect()
Detects documents requiring OCR (and rejects them)
("true", "false") |
java.lang.String |
getOcrFallback()
Fallback to OCR if heuristics deem it necessary
("true", "false", "optional") |
java.lang.String |
getOcrLang()
OCR language(s) ("en" for English, "en;fr" for French and English, etc.)
|
int |
getOcrMaxPages()
Maximum number of pages to process for OCR.
|
java.lang.String |
getOcrPriority()
Worker thread(s) priority to be used for the OCR processing
("normal", "lowest", "very low", "low", "normal", "high", "very high") |
java.lang.String |
getOcrQuality()
OCR quality ("fast", "normal", "best")
|
long |
getOcrTimeoutMs()
OCR conversion timeout value, in milliseconds.
If the OCR process takes longer, the remote side attempts to abort the conversion process. This value overrides the timeout value if the processing involves an OCR operation. |
java.lang.String |
getOutsideIn()
This feature is no longer supported.
("true", "false", "optional") |
java.lang.String |
getOutsideInFallback()
This feature is no longer supported.
("true", "false", "optional") |
java.lang.String |
getOutsideInForPreview()
This feature is no longer supported.
("true", "false", "optional") |
java.lang.String |
getOutsideInOnly()
This feature is no longer supported.
("true", "false", "optional") |
java.lang.String |
getOutsideInSimpleXHTMLFallback()
This feature is no longer supported.
("true", "false", "optional") |
java.lang.String |
getOverrideAddresses() |
java.lang.String |
getPriority()
Worker thread(s) priority to be used for the processing
("normal", "lowest", "very low", "low", "normal", "high", "very high") |
java.lang.String |
getRetryIO()
Uses regular I/O when mmap fails.
("true", "false") |
long |
getStartPage()
Starts conversion from this page number (page number starts at 1).
This parameter is only taken into account for image processing and may be ignored. |
java.lang.String |
getStyles()
Attempts to extract more text styles for HTML conversion
("true", "false", "optional") |
long |
getTimeoutMs()
Conversion timeout value, in milliseconds.
|
boolean |
isAllowDocumentChars()
Allows the use of Unicode private range characters (E0XX) for separators
(keyword, sentence, paragraph separators, ...) |
boolean |
isAllowUnicode32()
Allows the use of 32-bit unicode points.
|
boolean |
isDisablePlugins()
Disables external plugins.
|
boolean |
isForceContent()
Forces to accept the content, even if the MIME type does not seem to be a known or supported MIME type.
|
boolean |
isForceConversion()
Attempts to generate an empty document upon conversion error (may be ignored)
|
boolean |
isLooseTextDetection()
Loosens text detection to detect more text files, including suspicious ones (not *.txt or *.html)
("true", "false") |
boolean |
isStrictSizeCheck()
Strict size validation mode (even for partial reads).
|
ConvertTextExtractor |
makeCopy()
Creates and returns a deep copy of this ConvertTextExtractor.
|
static ConvertTextExtractor |
readFrom(java.io.InputStream is)
Reads a ConvertTextExtractor from an XML fragment.
|
void |
setAllowDocumentChars(boolean allowDocumentChars)
Allows the use of Unicode private range characters (E0XX) for separators
(keyword, sentence, paragraph separators, ...) |
void |
setAllowUnicode32(boolean allowUnicode32)
Allows the use of 32-bit unicode points.
|
void |
setAttachments(java.lang.String attachments)
Includes embedded attachments
("true", "false", "optional") |
void |
setDisablePlugins(boolean disablePlugins)
Disables external plugins.
|
void |
setEmbedded(java.lang.String embedded)
Includes embedded images
("true", "false", "optional") |
void |
setFilter(java.lang.String filter)
Native filter identifier list to be used specifically.
|
void |
setForceContent(boolean forceContent)
Forces to accept the content, even if the MIME type does not seem to be a known or supported MIME type.
|
void |
setForceConversion(boolean forceConversion)
Attempts to generate an empty document upon conversion error (may be ignored)
|
void |
setHttpProxyUrl(java.lang.String httpProxyUrl)
Optional HTTP proxy URL.
The URL can embed credentials if required. |
void |
setLooseTextDetection(boolean looseTextDetection)
Loosens text detection to detect more text files, including suspicious ones (not *.txt or *.html)
("true", "false") |
void |
setMaxInputSizeKB(long maxInputSizeKB)
Maximum document size accepted, in kilobytes.
|
void |
setMaxOutputSizeKB(long maxOutputSizeKB)
Maximum output size on the remote side, in kilobytes.
If the generated output exceeds this value, the document may be truncated or invalid. |
void |
setMaxPages(long maxPages)
Maximum number of pages to process for xml conversion (may be ignored).
|
void |
setMaxRecursionDepth(int maxRecursionDepth)
Maximum recursion depth.
|
void |
setMaxRecursionDocuments(int maxRecursionDocuments)
Maximum number of documents that can be converted in one directory level.
|
void |
setMaxRecursionDocumentsTotal(int maxRecursionDocumentsTotal)
Maximum number of documents that can be converted over all levels.
|
void |
setMinInputSizeKB(long minInputSizeKB)
Minimum document size accepted, in kilobytes.
|
void |
setOcr(java.lang.String ocr)
Converts using OCR
("true", "false", "optional") |
void |
setOcrDetect(java.lang.String ocrDetect)
Detects documents requiring OCR (and rejects them)
("true", "false") |
void |
setOcrFallback(java.lang.String ocrFallback)
Fallback to OCR if heuristics deem it necessary
("true", "false", "optional") |
void |
setOcrLang(java.lang.String ocrLang)
OCR language(s) ("en" for English, "en;fr" for French and English, etc.)
|
void |
setOcrMaxPages(int ocrMaxPages)
Maximum number of pages to process for OCR.
|
void |
setOcrPriority(java.lang.String ocrPriority)
Worker thread(s) priority to be used for the OCR processing
("normal", "lowest", "very low", "low", "normal", "high", "very high") |
void |
setOcrQuality(java.lang.String ocrQuality)
OCR quality ("fast", "normal", "best")
|
void |
setOcrTimeoutMs(long ocrTimeoutMs)
OCR conversion timeout value, in milliseconds.
If the OCR process takes longer, the remote side attempts to abort the conversion process. This value overrides the timeout value if the processing involves an OCR operation. |
void |
setOutsideIn(java.lang.String outsideIn)
This feature is no longer supported.
("true", "false", "optional") |
void |
setOutsideInFallback(java.lang.String outsideInFallback)
This feature is no longer supported.
("true", "false", "optional") |
void |
setOutsideInForPreview(java.lang.String outsideInForPreview)
This feature is no longer supported.
("true", "false", "optional") |
void |
setOutsideInOnly(java.lang.String outsideInOnly)
This feature is no longer supported.
("true", "false", "optional") |
void |
setOutsideInSimpleXHTMLFallback(java.lang.String outsideInSimpleXHTMLFallback)
This feature is no longer supported.
("true", "false", "optional") |
void |
setOverrideAddresses(java.lang.String overrideAddresses) |
void |
setPriority(java.lang.String priority)
Worker thread(s) priority to be used for the processing
("normal", "lowest", "very low", "low", "normal", "high", "very high") |
void |
setRetryIO(java.lang.String retryIO)
Uses regular I/O when mmap fails.
("true", "false") |
void |
setStartPage(long startPage)
Starts conversion from this page number (page number starts at 1).
This parameter is only taken into account for image processing and may be ignored. |
void |
setStrictSizeCheck(boolean strictSizeCheck)
Strict size validation mode (even for partial reads).
|
void |
setStyles(java.lang.String styles)
Attempts to extract more text styles for HTML conversion
("true", "false", "optional") |
void |
setTimeoutMs(long timeoutMs)
Conversion timeout value, in milliseconds.
|
java.lang.String |
toString()
String representation of this ConvertTextExtractor.
|
ConvertTextExtractor |
withAcceptCondition(AcceptCondition acceptCondition) |
ConvertTextExtractor |
withAllowDocumentChars(boolean allowDocumentChars) |
ConvertTextExtractor |
withAllowDocumentChars(java.lang.Boolean allowDocumentChars) |
ConvertTextExtractor |
withAllowUnicode32(boolean allowUnicode32) |
ConvertTextExtractor |
withAllowUnicode32(java.lang.Boolean allowUnicode32) |
ConvertTextExtractor |
withAttachments(java.lang.String attachments) |
ConvertTextExtractor |
withDataModelClass(java.lang.String dataModelClass) |
ConvertTextExtractor |
withDataModelProperty(java.lang.String dataModelProperty) |
ConvertTextExtractor |
withDataModelState(java.lang.String dataModelState) |
ConvertTextExtractor |
withDisabled(boolean disabled) |
ConvertTextExtractor |
withDisabled(java.lang.Boolean disabled) |
ConvertTextExtractor |
withDisablePlugins(boolean disablePlugins) |
ConvertTextExtractor |
withDisablePlugins(java.lang.Boolean disablePlugins) |
ConvertTextExtractor |
withEmbedded(java.lang.String embedded) |
ConvertTextExtractor |
withFilter(java.lang.String filter) |
ConvertTextExtractor |
withForceContent(boolean forceContent) |
ConvertTextExtractor |
withForceContent(java.lang.Boolean forceContent) |
ConvertTextExtractor |
withForceConversion(boolean forceConversion) |
ConvertTextExtractor |
withForceConversion(java.lang.Boolean forceConversion) |
ConvertTextExtractor |
withFromDataModel(DocumentProcessor fromDataModel) |
ConvertTextExtractor |
withHttpProxyUrl(java.lang.String httpProxyUrl) |
ConvertTextExtractor |
withKeyValue(java.util.Collection<KeyValue> __values) |
ConvertTextExtractor |
withKeyValue(KeyValue... __values) |
ConvertTextExtractor |
withLooseTextDetection(boolean looseTextDetection) |
ConvertTextExtractor |
withLooseTextDetection(java.lang.Boolean looseTextDetection) |
ConvertTextExtractor |
withMaxInputSizeKB(long maxInputSizeKB) |
ConvertTextExtractor |
withMaxInputSizeKB(java.lang.Long maxInputSizeKB) |
ConvertTextExtractor |
withMaxOutputSizeKB(long maxOutputSizeKB) |
ConvertTextExtractor |
withMaxOutputSizeKB(java.lang.Long maxOutputSizeKB) |
ConvertTextExtractor |
withMaxPages(long maxPages) |
ConvertTextExtractor |
withMaxPages(java.lang.Long maxPages) |
ConvertTextExtractor |
withMaxRecursionDepth(int maxRecursionDepth) |
ConvertTextExtractor |
withMaxRecursionDepth(java.lang.Integer maxRecursionDepth) |
ConvertTextExtractor |
withMaxRecursionDocuments(int maxRecursionDocuments) |
ConvertTextExtractor |
withMaxRecursionDocuments(java.lang.Integer maxRecursionDocuments) |
ConvertTextExtractor |
withMaxRecursionDocumentsTotal(int maxRecursionDocumentsTotal) |
ConvertTextExtractor |
withMaxRecursionDocumentsTotal(java.lang.Integer maxRecursionDocumentsTotal) |
ConvertTextExtractor |
withMinInputSizeKB(long minInputSizeKB) |
ConvertTextExtractor |
withMinInputSizeKB(java.lang.Long minInputSizeKB) |
ConvertTextExtractor |
withName(java.lang.String name) |
ConvertTextExtractor |
withOcr(java.lang.String ocr) |
ConvertTextExtractor |
withOcrDetect(java.lang.String ocrDetect) |
ConvertTextExtractor |
withOcrFallback(java.lang.String ocrFallback) |
ConvertTextExtractor |
withOcrLang(java.lang.String ocrLang) |
ConvertTextExtractor |
withOcrMaxPages(int ocrMaxPages) |
ConvertTextExtractor |
withOcrMaxPages(java.lang.Integer ocrMaxPages) |
ConvertTextExtractor |
withOcrPriority(java.lang.String ocrPriority) |
ConvertTextExtractor |
withOcrQuality(java.lang.String ocrQuality) |
ConvertTextExtractor |
withOcrTimeoutMs(long ocrTimeoutMs) |
ConvertTextExtractor |
withOcrTimeoutMs(java.lang.Long ocrTimeoutMs) |
ConvertTextExtractor |
withOutsideIn(java.lang.String outsideIn) |
ConvertTextExtractor |
withOutsideInFallback(java.lang.String outsideInFallback) |
ConvertTextExtractor |
withOutsideInForPreview(java.lang.String outsideInForPreview) |
ConvertTextExtractor |
withOutsideInOnly(java.lang.String outsideInOnly) |
ConvertTextExtractor |
withOutsideInSimpleXHTMLFallback(java.lang.String outsideInSimpleXHTMLFallback) |
ConvertTextExtractor |
withOverrideAddresses(java.lang.String overrideAddresses) |
ConvertTextExtractor |
withPriority(java.lang.String priority) |
ConvertTextExtractor |
withRetryIO(java.lang.String retryIO) |
ConvertTextExtractor |
withStartPage(long startPage) |
ConvertTextExtractor |
withStartPage(java.lang.Long startPage) |
ConvertTextExtractor |
withStrictSizeCheck(boolean strictSizeCheck) |
ConvertTextExtractor |
withStrictSizeCheck(java.lang.Boolean strictSizeCheck) |
ConvertTextExtractor |
withStyles(java.lang.String styles) |
ConvertTextExtractor |
withTimeoutMs(long timeoutMs) |
ConvertTextExtractor |
withTimeoutMs(java.lang.Long timeoutMs) |
void |
writeTo(java.io.OutputStream os)
Write this ConvertTextExtractor as an XML fragment
|
getAcceptCondition, getDataModelClass, getDataModelProperty, getDataModelState, getFromDataModel, getName, isDisabled, setAcceptCondition, setDataModelClass, setDataModelProperty, setDataModelState, setDisabled, setFromDataModel, setName
public java.util.List<KeyValue> keyValue
public boolean looseTextDetection
public static final boolean DEFAULT_LOOSE_TEXT_DETECTION
public boolean forceContent
public static final boolean DEFAULT_FORCE_CONTENT
public long minInputSizeKB
public static final long DEFAULT_MIN_INPUT_SIZE_K_B
public long maxInputSizeKB
public static final long DEFAULT_MAX_INPUT_SIZE_K_B
public int maxRecursionDepth
public static final int DEFAULT_MAX_RECURSION_DEPTH
public int maxRecursionDocuments
public static final int DEFAULT_MAX_RECURSION_DOCUMENTS
public int maxRecursionDocumentsTotal
public static final int DEFAULT_MAX_RECURSION_DOCUMENTS_TOTAL
public boolean strictSizeCheck
public static final boolean DEFAULT_STRICT_SIZE_CHECK
public java.lang.String retryIO
public java.lang.String filter
public long timeoutMs
public static final long DEFAULT_TIMEOUT_MS
public java.lang.String priority
public java.lang.String embedded
public java.lang.String attachments
public java.lang.String styles
public boolean forceConversion
public static final boolean DEFAULT_FORCE_CONVERSION
public long startPage
public static final long DEFAULT_START_PAGE
public long maxPages
public static final long DEFAULT_MAX_PAGES
public long maxOutputSizeKB
public static final long DEFAULT_MAX_OUTPUT_SIZE_K_B
public boolean allowUnicode32
public static final boolean DEFAULT_ALLOW_UNICODE32
public boolean allowDocumentChars
public static final boolean DEFAULT_ALLOW_DOCUMENT_CHARS
public java.lang.String outsideIn
public java.lang.String outsideInFallback
public java.lang.String outsideInOnly
public java.lang.String outsideInForPreview
public java.lang.String outsideInSimpleXHTMLFallback
public java.lang.String ocr
public java.lang.String ocrFallback
public java.lang.String ocrDetect
public java.lang.String ocrQuality
public java.lang.String ocrLang
public long ocrTimeoutMs
public static final long DEFAULT_OCR_TIMEOUT_MS
public int ocrMaxPages
public static final int DEFAULT_OCR_MAX_PAGES
public java.lang.String ocrPriority
public java.lang.String httpProxyUrl
public boolean disablePlugins
public static final boolean DEFAULT_DISABLE_PLUGINS
public java.lang.String overrideAddresses
public ConvertTextExtractor()
public ConvertTextExtractor(ConvertTextExtractor o)
public ConvertTextExtractor withAcceptCondition(AcceptCondition acceptCondition)
withAcceptCondition
in class DocumentProcessor
public ConvertTextExtractor withName(java.lang.String name)
withName
in class DocumentProcessor
public ConvertTextExtractor withDataModelState(java.lang.String dataModelState)
withDataModelState
in class DocumentProcessor
public ConvertTextExtractor withFromDataModel(DocumentProcessor fromDataModel)
public ConvertTextExtractor withDataModelClass(java.lang.String dataModelClass)
withDataModelClass
in class DocumentProcessor
public ConvertTextExtractor withDataModelProperty(java.lang.String dataModelProperty)
withDataModelProperty
in class DocumentProcessor
public ConvertTextExtractor withDisabled(boolean disabled)
withDisabled
in class DocumentProcessor
public ConvertTextExtractor withDisabled(java.lang.Boolean disabled)
withDisabled
in class DocumentProcessor
public java.util.List<KeyValue> getKeyValue()
public ConvertTextExtractor withKeyValue(KeyValue... __values)
public ConvertTextExtractor withKeyValue(java.util.Collection<KeyValue> __values)
public void setLooseTextDetection(boolean looseTextDetection)
public boolean isLooseTextDetection()
public ConvertTextExtractor withLooseTextDetection(boolean looseTextDetection)
public ConvertTextExtractor withLooseTextDetection(java.lang.Boolean looseTextDetection)
public void setForceContent(boolean forceContent)
public boolean isForceContent()
public ConvertTextExtractor withForceContent(boolean forceContent)
public ConvertTextExtractor withForceContent(java.lang.Boolean forceContent)
public void setMinInputSizeKB(long minInputSizeKB)
public long getMinInputSizeKB()
public ConvertTextExtractor withMinInputSizeKB(long minInputSizeKB)
public ConvertTextExtractor withMinInputSizeKB(java.lang.Long minInputSizeKB)
public void setMaxInputSizeKB(long maxInputSizeKB)
public long getMaxInputSizeKB()
public ConvertTextExtractor withMaxInputSizeKB(long maxInputSizeKB)
public ConvertTextExtractor withMaxInputSizeKB(java.lang.Long maxInputSizeKB)
public void setMaxRecursionDepth(int maxRecursionDepth)
public int getMaxRecursionDepth()
public ConvertTextExtractor withMaxRecursionDepth(int maxRecursionDepth)
public ConvertTextExtractor withMaxRecursionDepth(java.lang.Integer maxRecursionDepth)
public void setMaxRecursionDocuments(int maxRecursionDocuments)
public int getMaxRecursionDocuments()
public ConvertTextExtractor withMaxRecursionDocuments(int maxRecursionDocuments)
public ConvertTextExtractor withMaxRecursionDocuments(java.lang.Integer maxRecursionDocuments)
public void setMaxRecursionDocumentsTotal(int maxRecursionDocumentsTotal)
public int getMaxRecursionDocumentsTotal()
public ConvertTextExtractor withMaxRecursionDocumentsTotal(int maxRecursionDocumentsTotal)
public ConvertTextExtractor withMaxRecursionDocumentsTotal(java.lang.Integer maxRecursionDocumentsTotal)
public void setStrictSizeCheck(boolean strictSizeCheck)
public boolean isStrictSizeCheck()
public ConvertTextExtractor withStrictSizeCheck(boolean strictSizeCheck)
public ConvertTextExtractor withStrictSizeCheck(java.lang.Boolean strictSizeCheck)
public void setRetryIO(java.lang.String retryIO)
public java.lang.String getRetryIO()
public ConvertTextExtractor withRetryIO(java.lang.String retryIO)
public void setFilter(java.lang.String filter)
public java.lang.String getFilter()
public ConvertTextExtractor withFilter(java.lang.String filter)
public void setTimeoutMs(long timeoutMs)
public long getTimeoutMs()
public ConvertTextExtractor withTimeoutMs(long timeoutMs)
public ConvertTextExtractor withTimeoutMs(java.lang.Long timeoutMs)
public void setPriority(java.lang.String priority)
public java.lang.String getPriority()
public ConvertTextExtractor withPriority(java.lang.String priority)
public void setEmbedded(java.lang.String embedded)
public java.lang.String getEmbedded()
public ConvertTextExtractor withEmbedded(java.lang.String embedded)
public void setAttachments(java.lang.String attachments)
public java.lang.String getAttachments()
public ConvertTextExtractor withAttachments(java.lang.String attachments)
public void setStyles(java.lang.String styles)
public java.lang.String getStyles()
public ConvertTextExtractor withStyles(java.lang.String styles)
public void setForceConversion(boolean forceConversion)
public boolean isForceConversion()
public ConvertTextExtractor withForceConversion(boolean forceConversion)
public ConvertTextExtractor withForceConversion(java.lang.Boolean forceConversion)
public void setStartPage(long startPage)
public long getStartPage()
public ConvertTextExtractor withStartPage(long startPage)
public ConvertTextExtractor withStartPage(java.lang.Long startPage)
public void setMaxPages(long maxPages)
public long getMaxPages()
public ConvertTextExtractor withMaxPages(long maxPages)
public ConvertTextExtractor withMaxPages(java.lang.Long maxPages)
public void setMaxOutputSizeKB(long maxOutputSizeKB)
public long getMaxOutputSizeKB()
public ConvertTextExtractor withMaxOutputSizeKB(long maxOutputSizeKB)
public ConvertTextExtractor withMaxOutputSizeKB(java.lang.Long maxOutputSizeKB)
public void setAllowUnicode32(boolean allowUnicode32)
public boolean isAllowUnicode32()
public ConvertTextExtractor withAllowUnicode32(boolean allowUnicode32)
public ConvertTextExtractor withAllowUnicode32(java.lang.Boolean allowUnicode32)
public void setAllowDocumentChars(boolean allowDocumentChars)
public boolean isAllowDocumentChars()
public ConvertTextExtractor withAllowDocumentChars(boolean allowDocumentChars)
public ConvertTextExtractor withAllowDocumentChars(java.lang.Boolean allowDocumentChars)
public void setOutsideIn(java.lang.String outsideIn)
public java.lang.String getOutsideIn()
public ConvertTextExtractor withOutsideIn(java.lang.String outsideIn)
public void setOutsideInFallback(java.lang.String outsideInFallback)
public java.lang.String getOutsideInFallback()
public ConvertTextExtractor withOutsideInFallback(java.lang.String outsideInFallback)
public void setOutsideInOnly(java.lang.String outsideInOnly)
public java.lang.String getOutsideInOnly()
public ConvertTextExtractor withOutsideInOnly(java.lang.String outsideInOnly)
public void setOutsideInForPreview(java.lang.String outsideInForPreview)
public java.lang.String getOutsideInForPreview()
public ConvertTextExtractor withOutsideInForPreview(java.lang.String outsideInForPreview)
public void setOutsideInSimpleXHTMLFallback(java.lang.String outsideInSimpleXHTMLFallback)
public java.lang.String getOutsideInSimpleXHTMLFallback()
public ConvertTextExtractor withOutsideInSimpleXHTMLFallback(java.lang.String outsideInSimpleXHTMLFallback)
public void setOcr(java.lang.String ocr)
public java.lang.String getOcr()
public ConvertTextExtractor withOcr(java.lang.String ocr)
public void setOcrFallback(java.lang.String ocrFallback)
public java.lang.String getOcrFallback()
public ConvertTextExtractor withOcrFallback(java.lang.String ocrFallback)
public void setOcrDetect(java.lang.String ocrDetect)
public java.lang.String getOcrDetect()
public ConvertTextExtractor withOcrDetect(java.lang.String ocrDetect)
public void setOcrQuality(java.lang.String ocrQuality)
public java.lang.String getOcrQuality()
public ConvertTextExtractor withOcrQuality(java.lang.String ocrQuality)
public void setOcrLang(java.lang.String ocrLang)
public java.lang.String getOcrLang()
public ConvertTextExtractor withOcrLang(java.lang.String ocrLang)
public void setOcrTimeoutMs(long ocrTimeoutMs)
public long getOcrTimeoutMs()
public ConvertTextExtractor withOcrTimeoutMs(long ocrTimeoutMs)
public ConvertTextExtractor withOcrTimeoutMs(java.lang.Long ocrTimeoutMs)
public void setOcrMaxPages(int ocrMaxPages)
public int getOcrMaxPages()
public ConvertTextExtractor withOcrMaxPages(int ocrMaxPages)
public ConvertTextExtractor withOcrMaxPages(java.lang.Integer ocrMaxPages)
public void setOcrPriority(java.lang.String ocrPriority)
public java.lang.String getOcrPriority()
public ConvertTextExtractor withOcrPriority(java.lang.String ocrPriority)
public void setHttpProxyUrl(java.lang.String httpProxyUrl)
public java.lang.String getHttpProxyUrl()
public ConvertTextExtractor withHttpProxyUrl(java.lang.String httpProxyUrl)
public void setDisablePlugins(boolean disablePlugins)
public boolean isDisablePlugins()
public ConvertTextExtractor withDisablePlugins(boolean disablePlugins)
public ConvertTextExtractor withDisablePlugins(java.lang.Boolean disablePlugins)
public void setOverrideAddresses(java.lang.String overrideAddresses)
public java.lang.String getOverrideAddresses()
public ConvertTextExtractor withOverrideAddresses(java.lang.String overrideAddresses)
public ConvertTextExtractor makeCopy()
makeCopy
in class DocumentProcessor
public static ConvertTextExtractor readFrom(java.io.InputStream is) throws javax.xml.bind.JAXBException
javax.xml.bind.JAXBException
public void writeTo(java.io.OutputStream os) throws javax.xml.bind.JAXBException, java.io.IOException
writeTo
in class DocumentProcessor
javax.xml.bind.JAXBException
java.io.IOException
public static ConvertTextExtractor fromString(java.lang.String s) throws javax.xml.bind.JAXBException, java.io.UnsupportedEncodingException
javax.xml.bind.JAXBException
java.io.UnsupportedEncodingException
public java.lang.String toString()
toString
in class DocumentProcessor
public void check(boolean deep, java.lang.String errorContext) throws com.exalead.util.TypedException
check
in interface com.exalead.util.Checkable
check
in class DocumentProcessor
com.exalead.util.TypedException
public <T> T accept(DocumentProcessor.Transformer<T> transformer, T[] t) throws com.exalead.util.TypedException
accept
in class DocumentProcessor
com.exalead.util.TypedException
Copyright © 2021 Dassault Systèmes, All Rights Reserved.