public class Crawler extends ICrawler implements java.io.Serializable, java.lang.Cloneable
Modifier and Type | Class and Description |
---|---|
static class | Crawler.Roots — Java class for anonymous complex type. |
static class | Crawler.Rootsets — Java class for anonymous complex type. |
Nested classes/interfaces inherited from class ICrawler:
ICrawler.MimeTypes, ICrawler.SessionIdBlacklist
Modifier and Type | Field and Description |
---|---|
protected Crawler.Roots | roots |
protected Crawler.Rootsets | rootsets |
Fields inherited from class ICrawler:
aggressive, buildGroup, crawlerServer, crawlSchedulerConfig, crawlSitemaps, customCrawlConfig, defaultAccept, defaultFollow, defaultFollowRoots, defaultIndex, disableConditionalGet, enableConvertProcessor, enableSimpleSiteCollapsing, fetcher, ignoreRobotsTxt, indexRedirectSources, mimeTypes, mimeTypesMode, name, nearDuplicateDetector, nthreads, patternsDetector, rules, sessionIdBlacklist, simpleSiteCollapsingDepth, smartRefresh, smartRefreshMaxAgeS, smartRefreshMinAgeS, storeTextOnly, throttleTimeMS
Constructor and Description |
---|
Crawler() — Creates a new Crawler instance. |
Crawler(Crawler o) — Creates a new Crawler instance by deeply copying a given Crawler instance. |
Methods inherited from class ICrawler:
getBuildGroup, getCrawlerServer, getCrawlSchedulerConfig, getCustomCrawlConfig, getFetcher, getMimeTypes, getMimeTypesMode, getName, getNthreads, getRules, getSessionIdBlacklist, getSimpleSiteCollapsingDepth, getSmartRefreshMaxAgeS, getSmartRefreshMinAgeS, getThrottleTimeMS, isAggressive, isCrawlSitemaps, isDefaultAccept, isDefaultFollow, isDefaultFollowRoots, isDefaultIndex, isDisableConditionalGet, isEnableConvertProcessor, isEnableSimpleSiteCollapsing, isIgnoreRobotsTxt, isIndexRedirectSources, isNearDuplicateDetector, isPatternsDetector, isSmartRefresh, isStoreTextOnly, setAggressive, setBuildGroup, setCrawlerServer, setCrawlSchedulerConfig, setCrawlSitemaps, setCustomCrawlConfig, setDefaultAccept, setDefaultFollow, setDefaultFollowRoots, setDefaultIndex, setDisableConditionalGet, setEnableConvertProcessor, setEnableSimpleSiteCollapsing, setFetcher, setIgnoreRobotsTxt, setIndexRedirectSources, setMimeTypes, setMimeTypesMode, setName, setNearDuplicateDetector, setNthreads, setPatternsDetector, setSessionIdBlacklist, setSimpleSiteCollapsingDepth, setSmartRefresh, setSmartRefreshMaxAgeS, setSmartRefreshMinAgeS, setStoreTextOnly, setThrottleTimeMS
protected Crawler.Roots roots
protected Crawler.Rootsets rootsets
public Crawler()
Creates a new Crawler instance.
public Crawler(Crawler o)
Creates a new Crawler instance by deeply copying a given Crawler instance.
Parameters: o - The instance to copy.
Throws: java.lang.NullPointerException - if o is null.
public Crawler.Roots getRoots()
Returns: Crawler.Roots
public void setRoots(Crawler.Roots value)
Parameters: value - allowed object is Crawler.Roots
public Crawler.Rootsets getRootsets()
Returns: Crawler.Rootsets
public void setRootsets(Crawler.Rootsets value)
Parameters: value - allowed object is Crawler.Rootsets
public Crawler withRoots(Crawler.Roots value)
public Crawler withRootsets(Crawler.Rootsets value)
public Crawler withCrawlSchedulerConfig(CrawlSchedulerConfig value)
Overrides: withCrawlSchedulerConfig in class ICrawler
public Crawler withCustomCrawlConfig(CustomCrawlConfig value)
Overrides: withCustomCrawlConfig in class ICrawler
public Crawler withMimeTypes(ICrawler.MimeTypes value)
Overrides: withMimeTypes in class ICrawler
public Crawler withSessionIdBlacklist(ICrawler.SessionIdBlacklist value)
Overrides: withSessionIdBlacklist in class ICrawler
public Crawler withFetcher(java.lang.String value)
Overrides: withFetcher in class ICrawler
public Crawler withCrawlerServer(java.lang.String value)
Overrides: withCrawlerServer in class ICrawler
public Crawler withBuildGroup(java.lang.String value)
Overrides: withBuildGroup in class ICrawler
public Crawler withStoreTextOnly(java.lang.Boolean value)
Overrides: withStoreTextOnly in class ICrawler
public Crawler withNthreads(java.lang.Integer value)
Overrides: withNthreads in class ICrawler
public Crawler withAggressive(java.lang.Boolean value)
Overrides: withAggressive in class ICrawler
public Crawler withThrottleTimeMS(java.lang.Integer value)
Overrides: withThrottleTimeMS in class ICrawler
public Crawler withIgnoreRobotsTxt(java.lang.Boolean value)
Overrides: withIgnoreRobotsTxt in class ICrawler
public Crawler withEnableConvertProcessor(java.lang.Boolean value)
Overrides: withEnableConvertProcessor in class ICrawler
public Crawler withNearDuplicateDetector(java.lang.Boolean value)
Overrides: withNearDuplicateDetector in class ICrawler
public Crawler withPatternsDetector(java.lang.Boolean value)
Overrides: withPatternsDetector in class ICrawler
public Crawler withCrawlSitemaps(java.lang.Boolean value)
Overrides: withCrawlSitemaps in class ICrawler
public Crawler withDisableConditionalGet(java.lang.Boolean value)
Overrides: withDisableConditionalGet in class ICrawler
public Crawler withDefaultAccept(java.lang.Boolean value)
Overrides: withDefaultAccept in class ICrawler
public Crawler withDefaultIndex(java.lang.Boolean value)
Overrides: withDefaultIndex in class ICrawler
public Crawler withDefaultFollow(java.lang.Boolean value)
Overrides: withDefaultFollow in class ICrawler
public Crawler withDefaultFollowRoots(java.lang.Boolean value)
Overrides: withDefaultFollowRoots in class ICrawler
public Crawler withEnableSimpleSiteCollapsing(java.lang.Boolean value)
Overrides: withEnableSimpleSiteCollapsing in class ICrawler
public Crawler withSimpleSiteCollapsingDepth(java.lang.Long value)
Overrides: withSimpleSiteCollapsingDepth in class ICrawler
public Crawler withMimeTypesMode(java.lang.String value)
Overrides: withMimeTypesMode in class ICrawler
public Crawler withIndexRedirectSources(java.lang.Boolean value)
Overrides: withIndexRedirectSources in class ICrawler
public Crawler withSmartRefresh(java.lang.Boolean value)
Overrides: withSmartRefresh in class ICrawler
public Crawler withSmartRefreshMinAgeS(java.lang.Integer value)
Overrides: withSmartRefreshMinAgeS in class ICrawler
public Crawler withSmartRefreshMaxAgeS(java.lang.Integer value)
Overrides: withSmartRefreshMaxAgeS in class ICrawler
Copyright © 2021 Dassault Systèmes, All Rights Reserved.