public class LuceneCrawler extends java.lang.Object implements CrawlerAccess
Modifier and Type | Field and Description |
---|---|
(package private) CrawlerAccess |
crawler |
private java.util.HashMap |
properties |
(package private) org.apache.lucene.index.IndexWriter |
writer |
Constructor and Description |
---|
LuceneCrawler(CrawlerAccess crawler,
org.apache.lucene.index.IndexWriter writer)
Creates a new LuceneCrawler.
|
Modifier and Type | Method and Description |
---|---|
void |
add(java.lang.Object crawlerObject,
int depth)
Adds a URL to the queue of the crawler.
|
void |
addObject(java.lang.Object data)
Gives any object constructed from the crawled page to the callback object.
|
static org.apache.lucene.document.Field |
content(java.lang.String data) |
void |
forceExit() |
java.lang.Object |
getProperty(java.lang.String key) |
static org.apache.lucene.document.Field |
keywords(java.lang.String data) |
static org.apache.lucene.document.Field |
location(java.lang.String data) |
void |
setProperty(java.lang.String key,
java.lang.Object value) |
static org.apache.lucene.document.Field |
subject(java.lang.String data) |
static org.apache.lucene.document.Field |
title(java.lang.String data) |
private java.util.HashMap properties
CrawlerAccess crawler
org.apache.lucene.index.IndexWriter writer
public LuceneCrawler(CrawlerAccess crawler, org.apache.lucene.index.IndexWriter writer)
public void add(java.lang.Object crawlerObject, int depth)
Description copied from interface: CrawlerAccess
Adds a URL to the queue of the crawler.
Specified by:
add
in interface CrawlerAccess
public void addObject(java.lang.Object data)
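Description copied from interface: CrawlerAccess
Gives any object constructed from the crawled page to the callback object. It is up to the CrawlerAccess
implementation to decide what to do with it.
Specified by:
addObject
in interface CrawlerAccess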
public static org.apache.lucene.document.Field keywords(java.lang.String data)
public static org.apache.lucene.document.Field title(java.lang.String data)
public static org.apache.lucene.document.Field subject(java.lang.String data)
public static org.apache.lucene.document.Field content(java.lang.String data)
public static org.apache.lucene.document.Field location(java.lang.String data)
public void forceExit()
forceExit
in interface CrawlerAccess
public void setProperty(java.lang.String key, java.lang.Object value)
setProperty
in interface CrawlerAccess
public java.lang.Object getProperty(java.lang.String key)
Copyright 2004-2015 Wandora Team