//Example Configuration File

[License]
//Host name and ACI port used to reach the license server.
LicenseServerHost=licenses
LicenseServerACIPort=20000

[service]
//Service port, plus the clients allowed to send status and control requests.
//NOTE(review): * presumably allows any client -- confirm, and restrict before production use.
ServicePort=17050
ServiceStatusClients=*
ServiceControlClients=*

[server]
//Main server port, plus the clients allowed to send query and admin requests.
//NOTE(review): * presumably allows any client -- confirm, and restrict before production use.
Port=7050
QueryClients=*
AdminClients=*

[Logging]
//Logging settings shared by the log streams listed below.
LogLevel=FULL
LogHistorySize=0
LogTime=true
//NOTE(review): presumably the size in kilobytes at which OldLogFileAction is applied -- confirm.
MaxLogSizeKbs=4096
OldLogFileAction=compress
//Numbered entries: each value names a log stream section defined later in this file.
0=ApplicationLogStream
1=ActionLogStream
2=SynchronizeLogStream

[ApplicationLogStream]
//Log stream listed as entry 0 of [Logging].
//NOTE(review): presumably messages of the types in LogTypeCSVs are written to LogFile -- confirm.
LogFile=application.log
LogTypeCSVs=application

[ActionLogStream]
//Log stream listed as entry 1 of [Logging].
//NOTE(review): presumably messages of the types in LogTypeCSVs are written to LogFile -- confirm.
LogFile=action.log
LogTypeCSVs=action

[SynchronizeLogStream]
//Log stream listed as entry 2 of [Logging].
//NOTE(review): presumably messages of the types in LogTypeCSVs are written to LogFile -- confirm.
LogFile=synchronize.log
LogTypeCSVs=synchronize

[Connector]
//Temporary directory and task scheduling settings.
TempDirectory=temp
//Boolean written in lowercase to match the other true/false values in this file.
EnableScheduledTasks=true
//86400 seconds = 24 hours (unit taken from the "Secs" suffix of the key name).
ScheduleRepeatSecs=86400
//NOTE(review): -1 presumably means repeat indefinitely -- confirm against the connector documentation.
ScheduleCycles=-1

[Ingestion]
//Ingestion target: ingester type, its host and port, and the index database name.
//NOTE(review): IngestHost/IngestPort presumably address the CFS named by IngesterType -- confirm.
IngesterType=CFS
IngestHost=localhost
IngestPort=7000
IndexDatabase=WebConnector

[FetchTasks]
//NOTE(review): SSLMethod presumably selects the SSL/TLS protocol for outgoing connections -- confirm.
SSLMethod=SSLV23
//One numbered entry follows (0); its value names the task section [MyTask0].
//NOTE(review): Number presumably must equal the count of numbered entries -- confirm.
Number=1
0=MyTask0

[MyTask0]
//Fetch task listed as entry 0 of [FetchTasks]: crawl settings for one starting URL.

//The URL from which to start the crawl
Url=http://www.mywebsite.com

//Regexes to restrict the pages that are crawled for links
SpiderUrlMustHaveRegex=
SpiderUrlCantHaveRegex=

//Regexes to restrict the pages that are indexed
UrlMustHaveRegex=
UrlCantHaveRegex=
PageMustHaveRegex=
PageCantHaveRegex=

//The delay between processing pages, per sync thread
PageDelay=5s

//Stay on the same site as the starting URL
StayOnSite=true

//Maximum amount of time to spend crawling, 0 indicating unlimited
SiteDuration=0s

//Maximum number of pages to ingest per synchronize run, 0 indicating unlimited
MaxPages=0

//Minimum size that a page must be for it to be ingested
//NOTE(review): units are not stated here (presumably bytes) -- confirm.
MinPageSize=0

//Maximum size that a page can be for it to be ingested, 0 indicating unlimited
//NOTE(review): units are not stated here (presumably bytes) -- confirm.
MaxPageSize=0

//Maximum number of links a page can have before it is not ingested, 0 indicating unlimited
MaxLinksPerPage=0

//Follow robots.txt and ROBOTS meta tag commands
FollowRobotProtocol=true

//The User-Agent sent in the request headers
SpiderAs=Autn-WKOOP

//Maximum depth to spider to, -1 indicating unlimited
Depth=-1

//Follow links found in Flash content
FollowFlash=false

//Proxy details
//NOTE(review): avoid committing a real proxy password in plain text.
ProxyHost=
ProxyPort=
ProxyUser=
ProxyPassword=

//Authentication details sent if 401 is returned by the server.
//Supports Basic, NTLM V2 and Digest-MD5.
//NOTE(review): avoid committing real credentials in plain text.
AuthUser=
AuthPassword=

_HP_HTML5_bannerTitle.htm