public class LuceneCrawler extends java.lang.Object implements CrawlerAccess
| Modifier and Type | Field and Description |
|---|---|
(package private) CrawlerAccess |
crawler |
private java.util.HashMap |
properties |
(package private) org.apache.lucene.index.IndexWriter |
writer |
| Constructor and Description |
|---|
LuceneCrawler(CrawlerAccess crawler,
org.apache.lucene.index.IndexWriter writer)
Creates new LuceneCrawler
|
| Modifier and Type | Method and Description |
|---|---|
void |
add(java.lang.Object crawlerObject,
int depth)
Adds a URL to the queue of the crawler.
|
void |
addObject(java.lang.Object data)
Gives any object constructed from the crawled page to the callback object.
|
static org.apache.lucene.document.Field |
content(java.lang.String data) |
void |
forceExit() |
java.lang.Object |
getProperty(java.lang.String key) |
static org.apache.lucene.document.Field |
keywords(java.lang.String data) |
static org.apache.lucene.document.Field |
location(java.lang.String data) |
void |
setProperty(java.lang.String key,
java.lang.Object value) |
static org.apache.lucene.document.Field |
subject(java.lang.String data) |
static org.apache.lucene.document.Field |
title(java.lang.String data) |
private java.util.HashMap properties
CrawlerAccess crawler
org.apache.lucene.index.IndexWriter writer
public LuceneCrawler(CrawlerAccess crawler, org.apache.lucene.index.IndexWriter writer)
public void add(java.lang.Object crawlerObject,
int depth)
Description copied from interface: CrawlerAccess
Adds a URL to the queue of the crawler.
Specified by: add in interface CrawlerAccess
public void addObject(java.lang.Object data)
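Description copied from interface: CrawlerAccess
Gives any object constructed from the crawled page to the callback object. It is up to the CrawlerAccess implementation to decide what to do with it.
Specified by: addObject in interface CrawlerAccess
public static org.apache.lucene.document.Field keywords(java.lang.String data)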
public static org.apache.lucene.document.Field title(java.lang.String data)
public static org.apache.lucene.document.Field subject(java.lang.String data)
public static org.apache.lucene.document.Field content(java.lang.String data)
public static org.apache.lucene.document.Field location(java.lang.String data)
public void forceExit()
Specified by: forceExit in interface CrawlerAccess
public void setProperty(java.lang.String key,
java.lang.Object value)
Specified by: setProperty in interface CrawlerAccess
public java.lang.Object getProperty(java.lang.String key)
Copyright 2004-2015 Wandora Team