public class AnalysisPipeline
extends java.lang.Object
implements com.exalead.util.Checkable, java.io.Serializable
Constructor and Description |
---|
AnalysisPipeline() |
AnalysisPipeline(AnalysisPipeline o)
Copy constructor
|
Modifier and Type | Method and Description |
---|---|
void |
check(boolean deep,
java.lang.String errorContext)
Checks this AnalysisPipeline.
|
static AnalysisPipeline |
fromString(java.lang.String s)
Builds an AnalysisPipeline from its string representation.
|
AcceptCondition |
getAcceptCondition() |
java.util.List<DocumentProcessor> |
getDocumentProcessor() |
java.util.Map<java.lang.String,DocumentProcessor> |
getDocumentProcessorAsMap()
Get the map of DocumentProcessor, indexed by name
|
DocumentProcessor |
getDocumentProcessorByName(java.lang.String _lookup)
Get the DocumentProcessor for which the name matches _lookup
|
java.lang.String |
getErrorAction()
Specifies the action to launch if there is a document error during processing:
"discard": Discards the document from the job.
|
FilteringConfiguration |
getFilteringConfiguration() |
java.util.List<LanguageConfiguration> |
getLanguageConfiguration() |
java.util.Map<java.lang.String,LanguageConfiguration> |
getLanguageConfigurationAsMap()
Get the map of LanguageConfiguration, indexed by language
|
LanguageConfiguration |
getLanguageConfigurationByLanguage(java.lang.String _lookup)
Get the LanguageConfiguration for which the language matches _lookup
|
MappingConfiguration |
getMappingConfiguration() |
java.lang.String |
getName() |
int |
getSemanticPipeTimeout()
CPU-time limit for the processing of a text chunk by the semantic pipe, in seconds.
|
java.util.List<SemanticProcessor> |
getSemanticProcessor() |
java.util.Map<java.lang.String,SemanticProcessor> |
getSemanticProcessorAsMap()
Get the map of SemanticProcessor, indexed by name
|
SemanticProcessor |
getSemanticProcessorByName(java.lang.String _lookup)
Get the SemanticProcessor for which the name matches _lookup
|
long |
getSlowDocumentWarningTimeUS()
If the processing of a document is longer than this time, a message will be printed in the analyzer log.
A value of 0 disables the warning feature. |
java.lang.String |
getTokenizationConfig()
Reference to the TokenizationConfig object to use for tokenization during Semantic Processing Stage.
|
boolean |
isAutoBlacklistDocuments()
Automatically tries to add documents that trigger serious failures to a block list.
This option helps prevent loop failures, that is to say, cases where documents always trigger the same analysis process failures. |
boolean |
isAutoconfigureFromDataModel() |
boolean |
isDocumentProcessorsProfiling()
Logs the CPU time spent for each document processor and for the main indexing phase.
The total time spent for each processor is dumped in the analyzer log at the end of the job. |
boolean |
isGlobalLogDocumentErrors()
Logs errors and exceptions reported by the processors in the global log (without stack trace).
|
boolean |
isReportDocumentErrors()
Reports the document errors in the global reporting store, for further analysis.
|
boolean |
isSemanticProcessorsProfiling()
Logs the CPU time spent for each semantic processor.
The total time spent for each processor is dumped in the analyzer log at the end of the job. Warning: This feature strongly impacts performance; enable it only if required. |
AnalysisPipeline |
makeCopy()
Creates and returns a deep copy of this AnalysisPipeline.
|
static AnalysisPipeline |
readFrom(java.io.InputStream is)
Reads an AnalysisPipeline from an XML fragment.
|
boolean |
removeDocumentProcessorByName(java.lang.String _lookup)
Removes the DocumentProcessor for which the name matches _lookup
|
boolean |
removeLanguageConfigurationByLanguage(java.lang.String _lookup)
Removes the LanguageConfiguration for which the language matches _lookup
|
boolean |
removeSemanticProcessorByName(java.lang.String _lookup)
Removes the SemanticProcessor for which the name matches _lookup
|
void |
setAcceptCondition(AcceptCondition acceptCondition) |
void |
setAutoBlacklistDocuments(boolean autoBlacklistDocuments)
Automatically tries to add documents that trigger serious failures to a block list.
This option helps prevent loop failures, that is to say, cases where documents always trigger the same analysis process failures. |
void |
setAutoconfigureFromDataModel(boolean autoconfigureFromDataModel) |
void |
setDocumentProcessorsProfiling(boolean documentProcessorsProfiling)
Logs the CPU time spent for each document processor and for the main indexing phase.
The total time spent for each processor is dumped in the analyzer log at the end of the job. |
void |
setErrorAction(java.lang.String errorAction)
Specifies the action to launch if there is a document error during processing:
"discard": Discards the document from the job.
|
void |
setFilteringConfiguration(FilteringConfiguration filteringConfiguration) |
void |
setGlobalLogDocumentErrors(boolean globalLogDocumentErrors)
Logs errors and exceptions reported by the processors in the global log (without stack trace).
|
void |
setMappingConfiguration(MappingConfiguration mappingConfiguration) |
void |
setName(java.lang.String name) |
void |
setReportDocumentErrors(boolean reportDocumentErrors)
Reports the document errors in the global reporting store, for further analysis.
|
void |
setSemanticPipeTimeout(int semanticPipeTimeout)
CPU-time limit for the processing of a text chunk by the semantic pipe, in seconds.
|
void |
setSemanticProcessorsProfiling(boolean semanticProcessorsProfiling)
Logs the CPU time spent for each semantic processor.
The total time spent for each processor is dumped in the analyzer log at the end of the job. Warning: This feature strongly impacts performance; enable it only if required. |
void |
setSlowDocumentWarningTimeUS(long slowDocumentWarningTimeUS)
If the processing of a document is longer than this time, a message will be printed in the analyzer log.
A value of 0 disables the warning feature. |
void |
setTokenizationConfig(java.lang.String tokenizationConfig)
Reference to the TokenizationConfig object to use for tokenization during Semantic Processing Stage.
|
java.lang.String |
toString()
String representation of this AnalysisPipeline.
|
AnalysisPipeline |
withAcceptCondition(AcceptCondition acceptCondition) |
AnalysisPipeline |
withAutoBlacklistDocuments(boolean autoBlacklistDocuments) |
AnalysisPipeline |
withAutoBlacklistDocuments(java.lang.Boolean autoBlacklistDocuments) |
AnalysisPipeline |
withAutoconfigureFromDataModel(boolean autoconfigureFromDataModel) |
AnalysisPipeline |
withAutoconfigureFromDataModel(java.lang.Boolean autoconfigureFromDataModel) |
AnalysisPipeline |
withDocumentProcessor(java.util.Collection<DocumentProcessor> __values) |
AnalysisPipeline |
withDocumentProcessor(DocumentProcessor... __values) |
AnalysisPipeline |
withDocumentProcessorsProfiling(boolean documentProcessorsProfiling) |
AnalysisPipeline |
withDocumentProcessorsProfiling(java.lang.Boolean documentProcessorsProfiling) |
AnalysisPipeline |
withErrorAction(java.lang.String errorAction) |
AnalysisPipeline |
withFilteringConfiguration(FilteringConfiguration filteringConfiguration) |
AnalysisPipeline |
withGlobalLogDocumentErrors(boolean globalLogDocumentErrors) |
AnalysisPipeline |
withGlobalLogDocumentErrors(java.lang.Boolean globalLogDocumentErrors) |
AnalysisPipeline |
withLanguageConfiguration(java.util.Collection<LanguageConfiguration> __values) |
AnalysisPipeline |
withLanguageConfiguration(LanguageConfiguration... __values) |
AnalysisPipeline |
withMappingConfiguration(MappingConfiguration mappingConfiguration) |
AnalysisPipeline |
withName(java.lang.String name) |
AnalysisPipeline |
withReportDocumentErrors(boolean reportDocumentErrors) |
AnalysisPipeline |
withReportDocumentErrors(java.lang.Boolean reportDocumentErrors) |
AnalysisPipeline |
withSemanticPipeTimeout(int semanticPipeTimeout) |
AnalysisPipeline |
withSemanticPipeTimeout(java.lang.Integer semanticPipeTimeout) |
AnalysisPipeline |
withSemanticProcessor(java.util.Collection<SemanticProcessor> __values) |
AnalysisPipeline |
withSemanticProcessor(SemanticProcessor... __values) |
AnalysisPipeline |
withSemanticProcessorsProfiling(boolean semanticProcessorsProfiling) |
AnalysisPipeline |
withSemanticProcessorsProfiling(java.lang.Boolean semanticProcessorsProfiling) |
AnalysisPipeline |
withSlowDocumentWarningTimeUS(long slowDocumentWarningTimeUS) |
AnalysisPipeline |
withSlowDocumentWarningTimeUS(java.lang.Long slowDocumentWarningTimeUS) |
AnalysisPipeline |
withTokenizationConfig(java.lang.String tokenizationConfig) |
void |
writeTo(java.io.OutputStream os)
Writes this AnalysisPipeline as an XML fragment.
|
public java.util.List<DocumentProcessor> documentProcessor
public java.util.List<SemanticProcessor> semanticProcessor
public AcceptCondition acceptCondition
public MappingConfiguration mappingConfiguration
public FilteringConfiguration filteringConfiguration
public java.util.List<LanguageConfiguration> languageConfiguration
public java.lang.String name
public java.lang.String errorAction
public static final java.lang.String DEFAULT_ERROR_ACTION
public boolean reportDocumentErrors
public static final boolean DEFAULT_REPORT_DOCUMENT_ERRORS
public boolean globalLogDocumentErrors
public static final boolean DEFAULT_GLOBAL_LOG_DOCUMENT_ERRORS
public boolean autoBlacklistDocuments
public static final boolean DEFAULT_AUTO_BLACKLIST_DOCUMENTS
public java.lang.String tokenizationConfig
public boolean autoconfigureFromDataModel
public static final boolean DEFAULT_AUTOCONFIGURE_FROM_DATA_MODEL
public boolean documentProcessorsProfiling
public static final boolean DEFAULT_DOCUMENT_PROCESSORS_PROFILING
public int semanticPipeTimeout
public static final int DEFAULT_SEMANTIC_PIPE_TIMEOUT
public long slowDocumentWarningTimeUS
public static final long DEFAULT_SLOW_DOCUMENT_WARNING_TIME_U_S
public boolean semanticProcessorsProfiling
public static final boolean DEFAULT_SEMANTIC_PROCESSORS_PROFILING
public AnalysisPipeline()
public AnalysisPipeline(AnalysisPipeline o)
public java.util.List<DocumentProcessor> getDocumentProcessor()
public DocumentProcessor getDocumentProcessorByName(java.lang.String _lookup)
public java.util.Map<java.lang.String,DocumentProcessor> getDocumentProcessorAsMap()
public boolean removeDocumentProcessorByName(java.lang.String _lookup)
public AnalysisPipeline withDocumentProcessor(DocumentProcessor... __values)
public AnalysisPipeline withDocumentProcessor(java.util.Collection<DocumentProcessor> __values)
public java.util.List<SemanticProcessor> getSemanticProcessor()
public SemanticProcessor getSemanticProcessorByName(java.lang.String _lookup)
public java.util.Map<java.lang.String,SemanticProcessor> getSemanticProcessorAsMap()
public boolean removeSemanticProcessorByName(java.lang.String _lookup)
public AnalysisPipeline withSemanticProcessor(SemanticProcessor... __values)
public AnalysisPipeline withSemanticProcessor(java.util.Collection<SemanticProcessor> __values)
public void setAcceptCondition(AcceptCondition acceptCondition)
public AcceptCondition getAcceptCondition()
public AnalysisPipeline withAcceptCondition(AcceptCondition acceptCondition)
public void setMappingConfiguration(MappingConfiguration mappingConfiguration)
public MappingConfiguration getMappingConfiguration()
public AnalysisPipeline withMappingConfiguration(MappingConfiguration mappingConfiguration)
public void setFilteringConfiguration(FilteringConfiguration filteringConfiguration)
public FilteringConfiguration getFilteringConfiguration()
public AnalysisPipeline withFilteringConfiguration(FilteringConfiguration filteringConfiguration)
public java.util.List<LanguageConfiguration> getLanguageConfiguration()
public LanguageConfiguration getLanguageConfigurationByLanguage(java.lang.String _lookup)
public java.util.Map<java.lang.String,LanguageConfiguration> getLanguageConfigurationAsMap()
public boolean removeLanguageConfigurationByLanguage(java.lang.String _lookup)
public AnalysisPipeline withLanguageConfiguration(LanguageConfiguration... __values)
public AnalysisPipeline withLanguageConfiguration(java.util.Collection<LanguageConfiguration> __values)
public void setName(java.lang.String name)
public java.lang.String getName()
public AnalysisPipeline withName(java.lang.String name)
public void setErrorAction(java.lang.String errorAction)
public java.lang.String getErrorAction()
public AnalysisPipeline withErrorAction(java.lang.String errorAction)
public void setReportDocumentErrors(boolean reportDocumentErrors)
public boolean isReportDocumentErrors()
public AnalysisPipeline withReportDocumentErrors(boolean reportDocumentErrors)
public AnalysisPipeline withReportDocumentErrors(java.lang.Boolean reportDocumentErrors)
public void setGlobalLogDocumentErrors(boolean globalLogDocumentErrors)
public boolean isGlobalLogDocumentErrors()
public AnalysisPipeline withGlobalLogDocumentErrors(boolean globalLogDocumentErrors)
public AnalysisPipeline withGlobalLogDocumentErrors(java.lang.Boolean globalLogDocumentErrors)
public void setAutoBlacklistDocuments(boolean autoBlacklistDocuments)
public boolean isAutoBlacklistDocuments()
public AnalysisPipeline withAutoBlacklistDocuments(boolean autoBlacklistDocuments)
public AnalysisPipeline withAutoBlacklistDocuments(java.lang.Boolean autoBlacklistDocuments)
public void setTokenizationConfig(java.lang.String tokenizationConfig)
public java.lang.String getTokenizationConfig()
public AnalysisPipeline withTokenizationConfig(java.lang.String tokenizationConfig)
public void setAutoconfigureFromDataModel(boolean autoconfigureFromDataModel)
public boolean isAutoconfigureFromDataModel()
public AnalysisPipeline withAutoconfigureFromDataModel(boolean autoconfigureFromDataModel)
public AnalysisPipeline withAutoconfigureFromDataModel(java.lang.Boolean autoconfigureFromDataModel)
public void setDocumentProcessorsProfiling(boolean documentProcessorsProfiling)
public boolean isDocumentProcessorsProfiling()
public AnalysisPipeline withDocumentProcessorsProfiling(boolean documentProcessorsProfiling)
public AnalysisPipeline withDocumentProcessorsProfiling(java.lang.Boolean documentProcessorsProfiling)
public void setSemanticPipeTimeout(int semanticPipeTimeout)
public int getSemanticPipeTimeout()
public AnalysisPipeline withSemanticPipeTimeout(int semanticPipeTimeout)
public AnalysisPipeline withSemanticPipeTimeout(java.lang.Integer semanticPipeTimeout)
public void setSlowDocumentWarningTimeUS(long slowDocumentWarningTimeUS)
public long getSlowDocumentWarningTimeUS()
public AnalysisPipeline withSlowDocumentWarningTimeUS(long slowDocumentWarningTimeUS)
public AnalysisPipeline withSlowDocumentWarningTimeUS(java.lang.Long slowDocumentWarningTimeUS)
public void setSemanticProcessorsProfiling(boolean semanticProcessorsProfiling)
public boolean isSemanticProcessorsProfiling()
public AnalysisPipeline withSemanticProcessorsProfiling(boolean semanticProcessorsProfiling)
public AnalysisPipeline withSemanticProcessorsProfiling(java.lang.Boolean semanticProcessorsProfiling)
public AnalysisPipeline makeCopy()
public static AnalysisPipeline readFrom(java.io.InputStream is) throws javax.xml.bind.JAXBException
javax.xml.bind.JAXBException
public void writeTo(java.io.OutputStream os) throws javax.xml.bind.JAXBException, java.io.IOException
javax.xml.bind.JAXBException
java.io.IOException
public static AnalysisPipeline fromString(java.lang.String s) throws javax.xml.bind.JAXBException, java.io.UnsupportedEncodingException
javax.xml.bind.JAXBException
java.io.UnsupportedEncodingException
public java.lang.String toString()
toString
in class java.lang.Object
public void check(boolean deep, java.lang.String errorContext) throws com.exalead.util.TypedException
check
in interface com.exalead.util.Checkable
com.exalead.util.TypedException
Copyright © 2021 Dassault Systèmes, All Rights Reserved.