public class TermsExtractor extends AbstractElavaArkistoExtractor
| Modifier and Type | Field and Description |
|---|---|
| static java.lang.String | ELAVA_ARKISTO_ALSOKNOWNAS_TYPE_SI |
| static java.lang.String | ELAVA_ARKISTO_FIRSTNAME_TYPE_SI |
| static java.lang.String | ELAVA_ARKISTO_KEYWORD_TYPE_SI |
| static java.lang.String | ELAVA_ARKISTO_LASTNAME_TYPE_SI |
| static java.lang.String | ELAVA_ARKISTO_TERM_ALSOKNOWNAS_SI |
| static java.lang.String | ELAVA_ARKISTO_TERM_EXACT_MATCH_DISAMBIGUATION_SI |
| static java.lang.String | ELAVA_ARKISTO_TERM_EXACT_MATCH_SI |
| static java.lang.String | ELAVA_ARKISTO_TERM_FIRSTNAME_SI |
| static java.lang.String | ELAVA_ARKISTO_TERM_KEYWORD_SI |
| static java.lang.String | ELAVA_ARKISTO_TERM_LASTNAME_SI |
| static java.lang.String | ELAVA_ARKISTO_TERM_SI |
| static java.lang.String | ELAVA_ARKISTO_TERM_TYPE_SI |
| static boolean | EXTRACT_ALSO_KNOWN_AS |
| static boolean | EXTRACT_DISAMBIGUATION_HINT |
| static boolean | EXTRACT_EXACT_MATCH |
| static boolean | EXTRACT_FIRST_AND_LASTNAME |
| static boolean | EXTRACT_KEYWORD |
| static boolean | EXTRACT_TITLE |
| static boolean | EXTRACT_TYPE |
ELAVA_ARKISTO_ARTICLE_ID_TYPE_SI, ELAVA_ARKISTO_ARTICLE_PUBLISHED_TYPE_SI, ELAVA_ARKISTO_ARTICLE_TYPE_SI, ELAVA_ARKISTO_DATE_TYPE_SI, ELAVA_ARKISTO_MEDIA_TYPE_SI, ELAVA_ARKISTO_SERVICE_TYPE_SI, ELAVA_ARKISTO_SI, ELAVA_ARKISTO_TAG_ARTICLE_RELATION_TYPE_SI, ELAVA_ARKISTO_TAG_TYPE_SI, ELAVA_ARKISTO_TIME_TYPE_SI
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
| Constructor and Description |
|---|
| TermsExtractor() |
_extractTopicsFrom, _extractTopicsFrom, getElavaArkistoArticleIdType, getElavaArkistoArticleTopic, getElavaArkistoArticleType, getElavaArkistoDateTopic, getElavaArkistoDateType, getElavaArkistoMediaTopic, getElavaArkistoMediaType, getElavaArkistoServiceTopic, getElavaArkistoServiceType, getElavaArkistoTagArticleRelationTopic, getElavaArkistoTagArticleRelationType, getElavaArkistoTagTopic, getElavaArkistoTagType, getElavaArkistoTimeTopic, getElavaArkistoTimeType, getElavaArkistoType, getIcon, getWandoraType, isValidData, stringify
acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getContentTypes, getCrawlerMode, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap, useURLCrawler
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, getContext, getToolMenuItem, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
public static boolean EXTRACT_TITLE
public static boolean EXTRACT_TYPE
public static boolean EXTRACT_KEYWORD
public static boolean EXTRACT_FIRST_AND_LASTNAME
public static boolean EXTRACT_EXACT_MATCH
public static boolean EXTRACT_ALSO_KNOWN_AS
public static boolean EXTRACT_DISAMBIGUATION_HINT
public static final java.lang.String ELAVA_ARKISTO_TERM_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_TYPE_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_KEYWORD_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_LASTNAME_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_FIRSTNAME_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_ALSOKNOWNAS_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_EXACT_MATCH_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_EXACT_MATCH_DISAMBIGUATION_SI
public static final java.lang.String ELAVA_ARKISTO_LASTNAME_TYPE_SI
public static final java.lang.String ELAVA_ARKISTO_FIRSTNAME_TYPE_SI
public static final java.lang.String ELAVA_ARKISTO_ALSOKNOWNAS_TYPE_SI
public static final java.lang.String ELAVA_ARKISTO_KEYWORD_TYPE_SI
public java.lang.String getName()
AbstractWandoraTool
getName in interface WandoraTool
getName in class AbstractElavaArkistoExtractor
public java.lang.String getDescription()
AbstractWandoraTool
getDescription in interface WandoraTool
getDescription in class AbstractElavaArkistoExtractor
public boolean _extractTopicsFrom(java.lang.String str,
TopicMap tm)
throws java.lang.Exception
_extractTopicsFrom in class AbstractExtractor
Throws: java.lang.Exception
public boolean _extractTopicsFrom(org.json.JSONArray json,
TopicMap tm)
throws java.lang.Exception
Throws: java.lang.Exception
public boolean _extractTopicsFrom(org.json.JSONObject json,
TopicMap tm)
throws java.lang.Exception
Throws: java.lang.Exception
public Topic getElavaArkistoKeywordType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoAlsoKnownAsType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoLastnameType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoFirstnameType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoExactMatchDisambiguationType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoExactMatchType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoExactMatchTopic(java.lang.String id, TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoTermType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoTermTopic(java.lang.String id, TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoTermTypeType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoTermTypeTopic(java.lang.String type, TopicMap tm) throws TopicMapException
Throws: TopicMapException
Copyright 2004-2015 Wandora Team