Sample XML file for configuring Portal Search
You can adapt this sample XML file for your own purposes.
<?xml version="1.0" encoding="UTF-8"?>
<!--
  Sample Portal Search configuration: one search service that holds one
  collection, which in turn defines one crawler with a schedule and a filter.

  Text content of leaf elements is kept exactly as in the original sample
  (including the leading space before the resource bundle keys), because
  whitespace inside text content is delivered to the consuming application.
-->
<searchServices>
  <searchService id="com.ibm.lotus.search.plugins.pse.PlacesSearchFactoryImp">
    <searchServiceInfo extensionId="com.ibm.lotus.search.plugins.pse.PlacesSearchFactoryImp">
      <serviceName resourceBundle="com.ibm.wps.services.search.messages.SearchConfigMessages"> default.pse.service.name</serviceName>
      <property name="propertyName1" value="propertyValue1"/>
    </searchServiceInfo>
    <collections>
      <!-- The collection id is the same path as its <location> element. -->
      <collection id="c:/ibm/wp_profiles/PortalServer/collections/stam">
        <collectionInfo removeCommonWords="true">
          <location>c:/ibm/wp_profiles/PortalServer/collections/stam</location>
          <collectionName resourceBundle="com.ibm.wps.services.search.messages.SearchConfigMessages"> stam.collection.name</collectionName>
          <description resourceBundle="com.ibm.wps.services.search.messages.SearchConfigMessages"> stam.collection.description</description>
          <defaultLanguage>fr</defaultLanguage>
          <categorizer>UserDefined</categorizer>
          <summarizer>Automatic</summarizer>
        </collectionInfo>
        <crawlers>
          <crawler id="crawler1">
            <!-- NOTE(review): "host:port" looks like a placeholder to be replaced with a real host and port; confirm. -->
            <crawlerInfo url="http://host:port/seedlist/myserver?Source=Portal">
              <crawlerName resourceBundle="com.ibm.wps.services.search.messages.SearchConfigMessages"> crawler.name</crawlerName>
              <contentSourceType>Seedlist</contentSourceType>
              <level>1</level>
              <numDocsCollect>-1</numDocsCollect>
              <completeCrawl>true</completeCrawl>
              <collectTimeLimit>60</collectTimeLimit>
              <fetchDocTimeLimit>5</fetchDocTimeLimit>
              <linksExpirationPeriod>-1</linksExpirationPeriod>
              <brokenLinksTimeToLive>10</brokenLinksTimeToLive>
              <numProcesses>5</numProcesses>
              <encoding alwaysUse="false">Windows-1252</encoding>
              <addDocsAutomatically>true</addDocsAutomatically>
              <obeyRobotsTxt>true</obeyRobotsTxt>
              <proxy server="" port="8080"/>
              <socks server="" port="1080"/>
              <!-- NOTE(review): the realm carries a user name and password in clear text; replace the sample values before use. -->
              <securityRealms>
                <realm username="wpsadmin" password="wpsadmin" host="host">realmName</realm>
              </securityRealms>
            </crawlerInfo>
            <schedulers>
              <scheduler>
                <!-- NOTE(review): hour is given as "24"; confirm which hour range the consumer accepts. -->
                <startTime day="02" month="09" year="2008" hour="24" min="0"/>
                <period num="1" unit="week"/>
              </scheduler>
            </schedulers>
            <filters>
              <filter name="rule-1" indexing="true" include="true">
                <basis type="url">http://host:port/seedlist</basis>
              </filter>
            </filters>
          </crawler>
        </crawlers>
      </collection>
    </collections>
  </searchService>
</searchServices>