public abstract class AbstractYahooTermExtractor extends AbstractExtractor
| Modifier and Type | Field and Description |
|---|---|
| private static java.lang.String | appid |
| private java.lang.String[] | contentTypes |
| protected java.lang.String | defaultEncoding |
| static java.lang.String | DOCUMENT_SI |
| static java.lang.String | LANG |
| static java.lang.String | SOURCE_SI |
| static java.lang.String | TOPIC_SI |
| static java.lang.String | WEB_SERVICE_URL |
| static java.lang.String | YAHOO_TERM_SI |
| static java.lang.String | YAHOO_TERM_TYPE_SI |

CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR

CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT

RETURN_ERROR, RETURN_INFO

| Constructor and Description |
|---|
| AbstractYahooTermExtractor() |

| Modifier and Type | Method and Description |
|---|---|
| abstract boolean | _extractTopicsFrom(java.io.InputStream in, TopicMap topicMap) |
| void | configure(Wandora admin, Options options, java.lang.String prefix)<br>If the tool is configurable, shows a user interface to configure the tool. |
| void | fillDocumentTopic(Topic textTopic, TopicMap topicMap, java.lang.String content) |
| void | forgetAuthorization() |
| java.lang.String[] | getContentTypes()<br>Returns an array of String containing the content-types this ContentHandler can process. |
| Topic | getDocumentType(TopicMap tm) |
| protected java.lang.String | getFileContents(java.io.File file) |
| javax.swing.Icon | getIcon()<br>All tools may have identifying graphic icon used within tool GUI elements. |
| protected Topic | getOrCreateTopic(TopicMap tm, java.lang.String si) |
| protected Topic | getOrCreateTopic(TopicMap tm, java.lang.String si, java.lang.String bn) |
| Topic | getSourceType(TopicMap tm) |
| protected java.lang.String | getStringFromDocument(org.w3c.dom.Document doc) |
| Topic | getTermTopic(java.lang.String term, TopicMap tm) |
| Topic | getTermType(TopicMap tm) |
| Topic | getTopicType(TopicMap tm) |
| WandoraToolType | getType()<br>Tool type is used to categorize tools. |
| Topic | getWandoraClass(TopicMap tm) |
| boolean | isConfigurable()<br>Whether this tool is configurable. |
| protected void | makeSubclassOf(TopicMap tm, Topic t, Topic superclass) |
| java.lang.String | solveAppId() |
| java.lang.String | solveAppId(Wandora wandora) |
| java.lang.String | solveTitle(java.lang.String content) |
| boolean | useURLCrawler() |
| void | writeOptions(Wandora admin, Options options, java.lang.String prefix)<br>If the tool is configurable, saves all current tool options. |

_extractTopicsFrom, _extractTopicsFrom, _extractTopicsFrom, acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getDescription, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getName, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap

addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap

clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait

execute, execute, getContext, getToolMenuItem, hlog, initialize, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger

forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState

protected java.lang.String defaultEncoding
public static java.lang.String LANG
public static final java.lang.String WEB_SERVICE_URL
public static final java.lang.String SOURCE_SI
public static final java.lang.String DOCUMENT_SI
public static final java.lang.String TOPIC_SI
public static final java.lang.String YAHOO_TERM_SI
public static final java.lang.String YAHOO_TERM_TYPE_SI
private final java.lang.String[] contentTypes
private static java.lang.String appid
public javax.swing.Icon getIcon()
Description copied from class: AbstractWandoraTool
All tools may have identifying graphic icon used within tool GUI elements. getIcon should return Icon object of the tool.
Specified by: getIcon in interface WandoraTool
Overrides: getIcon in class AbstractExtractor
public WandoraToolType getType()
Description copied from class: AbstractWandoraTool
Tool type is used to categorize tools. Tool type has no real effect today, it is merely an informative property of a tool.
Specified by: getType in interface WandoraTool
Overrides: getType in class AbstractExtractor
public java.lang.String[] getContentTypes()
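Description copied from interface: Handler
Returns an array of String containing the content-types this ContentHandler can process.
Specified by: getContentTypes in interface Handler
Overrides: getContentTypes in class AbstractExtractor
public boolean useURLCrawler()
Overrides: useURLCrawler in class AbstractExtractor
public boolean isConfigurable()
Description copied from class: AbstractWandoraTool
Whether this tool is configurable.
Specified by: isConfigurable in interface WandoraTool
Overrides: isConfigurable in class AbstractWandoraTool
public void configure(Wandora admin, Options options, java.lang.String prefix) throws TopicMapException
Description copied from class: AbstractWandoraTool
If the tool is configurable, shows a user interface to configure the tool.
Specified by: configure in interface WandoraTool
Overrides: configure in class AbstractWandoraTool
Throws: TopicMapException
public void writeOptions(Wandora admin, Options options, java.lang.String prefix)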
Description copied from class: AbstractWandoraTool
If the tool is configurable, saves all current tool options.
Specified by: writeOptions in interface WandoraTool
Overrides: writeOptions in class AbstractWandoraTool
public abstract boolean _extractTopicsFrom(java.io.InputStream in,
TopicMap topicMap)
throws java.lang.Exception
Throws: java.lang.Exception
public java.lang.String solveTitle(java.lang.String content)
public void fillDocumentTopic(Topic textTopic, TopicMap topicMap, java.lang.String content)
public Topic getTermType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getTermTopic(java.lang.String term, TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getWandoraClass(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getTopicType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getSourceType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getDocumentType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
protected Topic getOrCreateTopic(TopicMap tm, java.lang.String si) throws TopicMapException
Throws: TopicMapException
protected Topic getOrCreateTopic(TopicMap tm, java.lang.String si, java.lang.String bn) throws TopicMapException
Throws: TopicMapException
protected void makeSubclassOf(TopicMap tm, Topic t, Topic superclass) throws TopicMapException
Throws: TopicMapException
public java.lang.String solveAppId(Wandora wandora)
public java.lang.String solveAppId()
public void forgetAuthorization()
protected java.lang.String getStringFromDocument(org.w3c.dom.Document doc)
protected java.lang.String getFileContents(java.io.File file)
throws java.io.IOException,
java.io.FileNotFoundException
Throws: java.io.IOException, java.io.FileNotFoundException

Copyright 2004-2015 Wandora Team