public class BookmarkExtractor extends AbstractExtractor
| Modifier and Type | Field and Description |
|---|---|
private java.lang.String |
ADD_SI |
static java.lang.String[] |
contentTypes |
private java.text.SimpleDateFormat |
df |
private java.lang.String |
HREF_SI |
private java.lang.String |
ICON_SI |
private java.lang.String[][] |
itemProps |
private java.lang.String[][] |
itemTimeProps |
private java.lang.String |
LANG |
private Topic |
langTopic |
private java.lang.String |
MOD_SI |
private java.lang.String |
ROOT_SI |
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
| Constructor and Description |
|---|
BookmarkExtractor() |
| Modifier and Type | Method and Description |
|---|---|
boolean |
_extractTopicsFrom(java.io.File f,
TopicMap t) |
boolean |
_extractTopicsFrom(java.lang.String str,
TopicMap t) |
boolean |
_extractTopicsFrom(java.net.URL u,
TopicMap t) |
java.lang.String[] |
getContentTypes()
Returns an array of String containing the content-types this
ContentHandler can process. |
java.lang.String |
getDescription()
AdminToolManager views tool descriptions while the user browses available
tools and builds user-customizable GUI elements such as the Tools menu.
|
int |
getExtractorType() |
javax.swing.Icon |
getIcon()
All tools may have an identifying graphic icon used within tool GUI elements.
|
java.lang.String |
getName()
The tool's name represents the tool in the UI unless the tool has
explicitly been given another GUI name.
|
private Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si) |
private Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si,
java.lang.String bn) |
private Topic |
getWandoraClass(TopicMap tm) |
private void |
makeSubclassOf(TopicMap tm,
Topic t,
Topic superclass) |
private void |
parse(org.jsoup.nodes.Document d,
TopicMap t) |
private void |
parseCategory(org.jsoup.nodes.Element c,
TopicMap t) |
private void |
parseCategory(org.jsoup.nodes.Element c,
Topic parent,
TopicMap t) |
private void |
parseItem(org.jsoup.nodes.Element i,
Topic parent,
TopicMap t) |
acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap, useURLCrawler
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, getContext, getToolMenuItem, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
private java.lang.String ROOT_SI
private java.lang.String HREF_SI
private java.lang.String ADD_SI
private java.lang.String MOD_SI
private java.lang.String ICON_SI
private java.lang.String LANG
private Topic langTopic
private java.text.SimpleDateFormat df
private java.lang.String[][] itemProps
private java.lang.String[][] itemTimeProps
public static final java.lang.String[] contentTypes
public java.lang.String getName()
AbstractWandoraTool
getName in interface WandoraTool
getName in class AbstractExtractor
public java.lang.String getDescription()
AbstractWandoraTool
getDescription in interface WandoraTool
getDescription in class AbstractExtractor
public int getExtractorType()
getExtractorType in class AbstractExtractor
public java.lang.String[] getContentTypes()
Handler
Returns an array of String containing the content-types this ContentHandler can process.
getContentTypes in interface Handler
getContentTypes in class AbstractExtractor
public javax.swing.Icon getIcon()
AbstractWandoraTool
getIcon should return the Icon object of the tool.
getIcon in interface WandoraTool
getIcon in class AbstractExtractor
public boolean _extractTopicsFrom(java.io.File f,
TopicMap t)
throws java.lang.Exception
_extractTopicsFrom in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.net.URL u,
TopicMap t)
throws java.lang.Exception
_extractTopicsFrom in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.lang.String str,
TopicMap t)
throws java.lang.Exception
_extractTopicsFrom in class AbstractExtractor
java.lang.Exception
private void parse(org.jsoup.nodes.Document d,
TopicMap t)
throws java.io.FileNotFoundException,
java.io.IOException,
TopicMapException,
java.text.ParseException
java.io.FileNotFoundException
java.io.IOException
TopicMapException
java.text.ParseException
private void parseCategory(org.jsoup.nodes.Element c,
TopicMap t)
throws TopicMapException,
java.text.ParseException
TopicMapException
java.text.ParseException
private void parseCategory(org.jsoup.nodes.Element c,
Topic parent,
TopicMap t)
throws TopicMapException,
java.text.ParseException
TopicMapException
java.text.ParseException
private void parseItem(org.jsoup.nodes.Element i,
Topic parent,
TopicMap t)
throws TopicMapException,
java.text.ParseException
TopicMapException
java.text.ParseException
private Topic getWandoraClass(TopicMap tm) throws TopicMapException
TopicMapException
private Topic getOrCreateTopic(TopicMap tm, java.lang.String si) throws TopicMapException
TopicMapException
private Topic getOrCreateTopic(TopicMap tm, java.lang.String si, java.lang.String bn) throws TopicMapException
TopicMapException
private void makeSubclassOf(TopicMap tm, Topic t, Topic superclass) throws TopicMapException
TopicMapException
Copyright 2004-2015 Wandora Team