java.lang.Object org.supermind.crawl.Fetcher
public class Fetcher
Fetcher.
Field Summary | |
---|---|
protected org.springframework.beans.factory.BeanFactory |
beanFactory
|
protected long |
bytes
|
protected CrawlSeedSource |
crawlSeedSource
|
protected int |
errors
|
protected java.lang.ThreadGroup |
group
|
protected static java.util.logging.Logger |
LOG
Logger. |
protected int |
maxPagesPerConnection
The maximum number of pipelined HTTP GETs to perform per HTTP connection. |
protected int |
pages
|
protected boolean |
parsing
|
protected PostFetchProcessor |
postFetchProcessor
|
protected long |
start
|
protected static java.lang.String |
THREAD_GROUP_NAME
|
protected int |
threadCount
|
Constructor Summary | |
---|---|
Fetcher()
|
Method Summary | |
---|---|
protected FetcherThread |
assignThread(java.net.URL url)
Assign a FetcherThread to handle this URL. |
protected void |
close()
|
org.apache.nutch.fetcher.Fetcher.FetcherStatus |
getStatus()
|
void |
run()
|
void |
setBeanFactory(org.springframework.beans.factory.BeanFactory beanFactory)
|
void |
setMaxPagesPerConnection(int maxPagesPerConnection)
|
void |
setParsing(boolean parsing)
|
void |
setPostFetchProcessor(PostFetchProcessor postFetchProcessor)
|
void |
setSeedSource(CrawlSeedSource crawlSource)
|
void |
setThreadCount(int threadCount)
|
void |
status()
Display the status of the fetcher run. |
Methods inherited from class java.lang.Object |
---|
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
Field Detail |
---|
protected org.springframework.beans.factory.BeanFactory beanFactory
protected long bytes
protected CrawlSeedSource crawlSeedSource
protected int errors
protected final java.lang.ThreadGroup group
protected static java.util.logging.Logger LOG
protected int maxPagesPerConnection
protected int pages
protected boolean parsing
protected PostFetchProcessor postFetchProcessor
protected long start
protected static final java.lang.String THREAD_GROUP_NAME
protected int threadCount
Constructor Detail |
---|
public Fetcher() throws java.lang.Exception
java.lang.Exception
Method Detail |
---|
protected FetcherThread assignThread(java.net.URL url)
url - the URL to be handled by the assigned FetcherThread
protected void close() throws java.io.IOException
java.io.IOException
public org.apache.nutch.fetcher.Fetcher.FetcherStatus getStatus()
public void run() throws java.io.IOException, java.lang.InterruptedException
java.io.IOException
java.lang.InterruptedException
public void setBeanFactory(org.springframework.beans.factory.BeanFactory beanFactory)
Specified by: setBeanFactory
in interface org.springframework.beans.factory.BeanFactoryAware
public void setMaxPagesPerConnection(int maxPagesPerConnection)
public void setParsing(boolean parsing)
public void setPostFetchProcessor(PostFetchProcessor postFetchProcessor)
public void setSeedSource(CrawlSeedSource crawlSource) throws java.io.IOException
java.io.IOException
public void setThreadCount(int threadCount)
public void status()