heritrix运行报错
下载了 Heritrix 3.1.0 版本，crawler-beans.cxml 的配置如下：
<!-- Overrides supplied as a Java property list. Each key has the form
     beanId.propertyName, so the entries below replace the matching
     property values of the bean whose id is "metadata". -->
<bean id="simpleOverrides" class="org.springframework.beans.factory.config.PropertyOverrideConfigurer">
  <property name="properties">
    <value>
# This Properties map is specified in the Java 'property list' text format
# http://java.sun.com/javase/6/docs/api/java/util/Properties.html#load%28java.io.Reader%29
metadata.operatorContactUrl=http://127.0.0.1
metadata.jobName=test
metadata.description=Basic crawl starting with useful defaults
##..more?..##
    </value>
  </property>
</bean>
<!-- Overrides declared as individual <prop> elements: convenient for
     multiline values (such as the seed list below) or declared beans. -->
<bean id="longerOverrides" class="org.springframework.beans.factory.config.PropertyOverrideConfigurer">
  <property name="properties">
    <props>
      <!-- The text lines are kept at column 0 so the value itself is unchanged. -->
      <prop key="seeds.textSource.value">
# URLS HERE
http://news.baidu.com/
      </prop>
    </props>
  </property>
</bean>
<!-- CRAWL METADATA: identifies the crawler and its operator -->
<bean id="metadata"
      class="org.archive.modules.CrawlMetadata"
      autowire="byName">
  <property name="operatorContactUrl" value="http://127.0.0.1"/>
  <property name="jobName" value="test"/>
  <property name="description" value="nimei de"/>
  <!-- Optional properties, currently disabled: -->
  <!-- <property name="robotsPolicyName" value="obey"/> -->
  <!-- <property name="operator" value=""/> -->
  <!-- <property name="operatorFrom" value=""/> -->
  <!-- <property name="organization" value=""/> -->
  <!-- <property name="audience" value=""/> -->
  <!-- NOTE(review): @OPERATOR_CONTACT_URL@ is presumably replaced with
       operatorContactUrl at runtime; confirm against the Heritrix docs. -->
  <property name="userAgentTemplate" value="Mozilla/5.0 (compatible; heritrix/3.1.0 +@OPERATOR_CONTACT_URL@)"/>
</bean>
启动（launch）这个 job 时，后台报错如下：
An error occured
You may be able to recover and try something else by going back.
Cause: java.lang.IllegalStateException: BdbModule not started
java.lang.IllegalStateException: BdbModule not started
at org.archive.bdb.BdbModule.openDatabase(BdbModule.java:328)
at org.archive.bdb.BdbModule.getStoredMap(BdbModule.java:652)
at org.archive.crawler.reporting.StatisticsTracker.calcSeedRecordsSortedByStatusCode(StatisticsTracker.java:829)
at org.archive.crawler.reporting.SeedsReport.write(SeedsReport.java:44)
at org.archive.crawler.reporting.StatisticsTracker.writeReportFile(StatisticsTracker.java:909)
at org.archive.crawler.reporting.StatisticsTracker.writeReportFile(StatisticsTracker.java:888)
at org.archive.crawler.restlet.ReportGenResource.represent(ReportGenResource.java:50)
at org.restlet.resource.Resource.getRepresentation(Resource.java:302)
at org.restlet.resource.Resource.handleGet(Resource.java:464)
at org.restlet.Finder.handle(Finder.java:353)
at org.restlet.Filter.doHandle(Filter.java:150)
at org.restlet.Filter.handle(Filter.java:195)
at org.restlet.Router.handle(Router.java:504)
at org.restlet.Filter.doHandle(Filter.java:150)
at org.restlet.Filter.handle(Filter.java:195)
才玩这个,求解答
补充:Java , Java SE