public class ClusteringConfig extends UnSupervisedLearningConfig implements com.exalead.util.Checkable, java.io.Serializable
UnSupervisedLearningConfig.Conditions, UnSupervisedLearningConfig.Descriptors, UnSupervisedLearningConfig.SkippedAnnotations
Modifier and Type | Field and Description |
---|---|
java.lang.String |
classField |
static int |
DEFAULT_MAX_BEST_DESCRIPTORS |
static int |
DEFAULT_MAX_DESCRIPTORS_USED |
java.lang.String |
descriptorsField |
java.lang.String |
headField |
int |
maxBestDescriptors |
int |
maxDescriptorsUsed |
int |
maxFreq |
int |
minFreq |
double |
minScore |
int |
minWordMatched |
java.lang.String |
nbDocsField |
double |
similarityThreshold |
conditions, DEFAULT_MAX_DOCUMENT_THRESHOLD, DEFAULT_MIN_DOCUMENT_REQUIRED, descriptors, instance, managedResourceGroup, maxDocumentThreshold, minDocumentRequired, skippedAnnotations
Constructor and Description |
---|
ClusteringConfig() |
ClusteringConfig(ClusteringConfig o)
Copy constructor
|
Modifier and Type | Method and Description |
---|---|
void |
check(boolean deep,
java.lang.String errorContext)
Checks this ClusteringConfig.
|
static ClusteringConfig |
fromString(java.lang.String s)
Parses a ClusteringConfig from its string representation.
|
java.lang.String |
getClassField()
The index unsigned field name where the classID is going to be imported.
|
java.lang.String |
getDescriptorsField()
The optional index text field name storing the best n descriptors for each cluster (tabulation separated), usable as human-readable cluster title.
|
java.lang.String |
getHeadField()
The index unsigned field name specifying whether the document is the head of a cluster.
|
int |
getMaxBestDescriptors()
Maximum number of descriptors in the descriptors field.
|
int |
getMaxDescriptorsUsed()
The maximum number of descriptors used (optional).
|
int |
getMaxFreq()
The maximum frequency a descriptor must have to be relevant.
|
int |
getMinFreq()
The minimum frequency a descriptor must have to be relevant.
|
double |
getMinScore()
The minimum score a descriptor must have to be relevant.
|
int |
getMinWordMatched()
The minimum number of matched words required to build a cluster.
|
java.lang.String |
getNbDocsField()
The index text field name specifying the number of documents in the cluster (only set on heads).
|
double |
getSimilarityThreshold()
The clustering similarity threshold.
|
ClusteringConfig |
makeCopy()
Creates and returns a deep copy of this ClusteringConfig.
|
static ClusteringConfig |
readFrom(java.io.InputStream is)
Reads a ClusteringConfig from an XML fragment.
|
void |
setClassField(java.lang.String classField)
The index unsigned field name where the classID is going to be imported.
|
void |
setDescriptorsField(java.lang.String descriptorsField)
The optional index text field name storing the best n descriptors for each cluster (tabulation separated), usable as human-readable cluster title.
|
void |
setHeadField(java.lang.String headField)
The index unsigned field name specifying whether the document is the head of a cluster.
|
void |
setMaxBestDescriptors(int maxBestDescriptors)
Maximum number of descriptors in the descriptors field.
|
void |
setMaxDescriptorsUsed(int maxDescriptorsUsed)
The maximum number of descriptors used (optional).
|
void |
setMaxFreq(int maxFreq)
The maximum frequency a descriptor must have to be relevant.
|
void |
setMinFreq(int minFreq)
The minimum frequency a descriptor must have to be relevant.
|
void |
setMinScore(double minScore)
The minimum score a descriptor must have to be relevant.
|
void |
setMinWordMatched(int minWordMatched)
The minimum number of matched words required to build a cluster.
|
void |
setNbDocsField(java.lang.String nbDocsField)
The index text field name specifying the number of documents in the cluster (only set on heads).
|
void |
setSimilarityThreshold(double similarityThreshold)
The clustering similarity threshold.
|
java.lang.String |
toString()
String representation of this ClusteringConfig.
|
ClusteringConfig |
withClassField(java.lang.String classField) |
ClusteringConfig |
withConditions(java.util.Collection<LearningTriggerCondition> __values) |
ClusteringConfig |
withConditions(LearningTriggerCondition... __values)
The list of triggering conditions.
This learning job is triggered as soon as any of these conditions is fulfilled. |
ClusteringConfig |
withDescriptors(java.util.Collection<Descriptor> __values) |
ClusteringConfig |
withDescriptors(Descriptor... __values)
The list of MOT annotations used to extract descriptors (if empty, words are used).
|
ClusteringConfig |
withDescriptorsField(java.lang.String descriptorsField) |
ClusteringConfig |
withHeadField(java.lang.String headField) |
ClusteringConfig |
withInstance(java.lang.String instance) |
ClusteringConfig |
withManagedResourceGroup(java.lang.String managedResourceGroup) |
ClusteringConfig |
withMaxBestDescriptors(int maxBestDescriptors) |
ClusteringConfig |
withMaxBestDescriptors(java.lang.Integer maxBestDescriptors) |
ClusteringConfig |
withMaxDescriptorsUsed(int maxDescriptorsUsed) |
ClusteringConfig |
withMaxDescriptorsUsed(java.lang.Integer maxDescriptorsUsed) |
ClusteringConfig |
withMaxDocumentThreshold(int maxDocumentThreshold) |
ClusteringConfig |
withMaxDocumentThreshold(java.lang.Integer maxDocumentThreshold) |
ClusteringConfig |
withMaxFreq(int maxFreq) |
ClusteringConfig |
withMaxFreq(java.lang.Integer maxFreq) |
ClusteringConfig |
withMinDocumentRequired(int minDocumentRequired) |
ClusteringConfig |
withMinDocumentRequired(java.lang.Integer minDocumentRequired) |
ClusteringConfig |
withMinFreq(int minFreq) |
ClusteringConfig |
withMinFreq(java.lang.Integer minFreq) |
ClusteringConfig |
withMinScore(double minScore) |
ClusteringConfig |
withMinWordMatched(int minWordMatched) |
ClusteringConfig |
withMinWordMatched(java.lang.Integer minWordMatched) |
ClusteringConfig |
withNbDocsField(java.lang.String nbDocsField) |
ClusteringConfig |
withSimilarityThreshold(double similarityThreshold) |
ClusteringConfig |
withSkippedAnnotations(java.util.Collection<StringValue> __values) |
ClusteringConfig |
withSkippedAnnotations(StringValue... __values)
The list of MOT annotations used to ignore tokens.
|
void |
writeTo(java.io.OutputStream os)
Writes this ClusteringConfig as an XML fragment.
|
getConditions, getDescriptors, getInstance, getManagedResourceGroup, getMaxDocumentThreshold, getMinDocumentRequired, getSkippedAnnotations, setConditions, setDescriptors, setInstance, setManagedResourceGroup, setMaxDocumentThreshold, setMinDocumentRequired, setSkippedAnnotations, withConditions, withDescriptors, withSkippedAnnotations
public double similarityThreshold
public double minScore
public int minWordMatched
public int minFreq
public int maxFreq
public java.lang.String classField
public java.lang.String headField
public java.lang.String nbDocsField
public int maxDescriptorsUsed
public static final int DEFAULT_MAX_DESCRIPTORS_USED
public java.lang.String descriptorsField
public int maxBestDescriptors
public static final int DEFAULT_MAX_BEST_DESCRIPTORS
public ClusteringConfig()
public ClusteringConfig(ClusteringConfig o)
public ClusteringConfig withInstance(java.lang.String instance)
withInstance
in class UnSupervisedLearningConfig
public ClusteringConfig withMinDocumentRequired(int minDocumentRequired)
withMinDocumentRequired
in class UnSupervisedLearningConfig
public ClusteringConfig withMinDocumentRequired(java.lang.Integer minDocumentRequired)
withMinDocumentRequired
in class UnSupervisedLearningConfig
public ClusteringConfig withMaxDocumentThreshold(int maxDocumentThreshold)
withMaxDocumentThreshold
in class UnSupervisedLearningConfig
public ClusteringConfig withMaxDocumentThreshold(java.lang.Integer maxDocumentThreshold)
withMaxDocumentThreshold
in class UnSupervisedLearningConfig
public ClusteringConfig withDescriptors(Descriptor... __values)
withDescriptors
in class UnSupervisedLearningConfig
public ClusteringConfig withDescriptors(java.util.Collection<Descriptor> __values)
withDescriptors
in class UnSupervisedLearningConfig
public ClusteringConfig withSkippedAnnotations(StringValue... __values)
withSkippedAnnotations
in class UnSupervisedLearningConfig
public ClusteringConfig withSkippedAnnotations(java.util.Collection<StringValue> __values)
withSkippedAnnotations
in class UnSupervisedLearningConfig
public ClusteringConfig withConditions(LearningTriggerCondition... __values)
withConditions
in class UnSupervisedLearningConfig
public ClusteringConfig withConditions(java.util.Collection<LearningTriggerCondition> __values)
withConditions
in class UnSupervisedLearningConfig
public ClusteringConfig withManagedResourceGroup(java.lang.String managedResourceGroup)
withManagedResourceGroup
in class UnSupervisedLearningConfig
public void setSimilarityThreshold(double similarityThreshold)
public double getSimilarityThreshold()
public ClusteringConfig withSimilarityThreshold(double similarityThreshold)
public void setMinScore(double minScore)
public double getMinScore()
public ClusteringConfig withMinScore(double minScore)
public void setMinWordMatched(int minWordMatched)
public int getMinWordMatched()
public ClusteringConfig withMinWordMatched(int minWordMatched)
public ClusteringConfig withMinWordMatched(java.lang.Integer minWordMatched)
public void setMinFreq(int minFreq)
public int getMinFreq()
public ClusteringConfig withMinFreq(int minFreq)
public ClusteringConfig withMinFreq(java.lang.Integer minFreq)
public void setMaxFreq(int maxFreq)
public int getMaxFreq()
public ClusteringConfig withMaxFreq(int maxFreq)
public ClusteringConfig withMaxFreq(java.lang.Integer maxFreq)
public void setClassField(java.lang.String classField)
public java.lang.String getClassField()
public ClusteringConfig withClassField(java.lang.String classField)
public void setHeadField(java.lang.String headField)
public java.lang.String getHeadField()
public ClusteringConfig withHeadField(java.lang.String headField)
public void setNbDocsField(java.lang.String nbDocsField)
public java.lang.String getNbDocsField()
public ClusteringConfig withNbDocsField(java.lang.String nbDocsField)
public void setMaxDescriptorsUsed(int maxDescriptorsUsed)
public int getMaxDescriptorsUsed()
public ClusteringConfig withMaxDescriptorsUsed(int maxDescriptorsUsed)
public ClusteringConfig withMaxDescriptorsUsed(java.lang.Integer maxDescriptorsUsed)
public void setDescriptorsField(java.lang.String descriptorsField)
public java.lang.String getDescriptorsField()
public ClusteringConfig withDescriptorsField(java.lang.String descriptorsField)
public void setMaxBestDescriptors(int maxBestDescriptors)
public int getMaxBestDescriptors()
public ClusteringConfig withMaxBestDescriptors(int maxBestDescriptors)
public ClusteringConfig withMaxBestDescriptors(java.lang.Integer maxBestDescriptors)
public ClusteringConfig makeCopy()
makeCopy
in class UnSupervisedLearningConfig
public static ClusteringConfig readFrom(java.io.InputStream is) throws javax.xml.bind.JAXBException
javax.xml.bind.JAXBException
public void writeTo(java.io.OutputStream os) throws javax.xml.bind.JAXBException, java.io.IOException
writeTo
in class UnSupervisedLearningConfig
javax.xml.bind.JAXBException
java.io.IOException
public static ClusteringConfig fromString(java.lang.String s) throws javax.xml.bind.JAXBException, java.io.UnsupportedEncodingException
javax.xml.bind.JAXBException
java.io.UnsupportedEncodingException
public java.lang.String toString()
toString
in class UnSupervisedLearningConfig
public void check(boolean deep, java.lang.String errorContext) throws com.exalead.util.TypedException
check
in interface com.exalead.util.Checkable
check
in class UnSupervisedLearningConfig
com.exalead.util.TypedException
Copyright © 2021 Dassault Systèmes, All Rights Reserved.