public class ZemantaExtractor extends AbstractZemantaExtractor implements BrowserPluginExtractor
| Modifier and Type | Class and Description |
|---|---|
class |
ZemantaExtractor.ZemantaParser |
defaultEncoding, DOCUMENT_SI, EXTRACT_RELEVANCE, LANG, SOURCE_SI, TOPIC_SI, ZEMANTA_ARTICLE_SI, ZEMANTA_ARTICLE_TITLE_SI, ZEMANTA_CATEGORIZATION_SI, ZEMANTA_CATEGORY_SI, ZEMANTA_CONFIDENCE_SI, ZEMANTA_DATE_SI, ZEMANTA_IMAGE_ATTRIBUTION_SI, ZEMANTA_IMAGE_DESCRIPTION_SI, ZEMANTA_IMAGE_LICENSE_SI, ZEMANTA_IMAGE_SI, ZEMANTA_KEYWORD_SI, ZEMANTA_LARGE_IMAGE_SI, ZEMANTA_LINK_ANCHOR_SI, ZEMANTA_LINK_SI, ZEMANTA_LINK_TITLE_SI, ZEMANTA_LINK_TYPE_SI, ZEMANTA_LINK_URL_SI, ZEMANTA_MEDIUM_IMAGE_SI, ZEMANTA_PUBLISHED_DATE_SI, ZEMANTA_RELEVANCE_SI, ZEMANTA_SCHEMA_SI, ZEMANTA_SI, ZEMANTA_SMALL_IMAGE_SI, ZEMANTA_URL, ZEMANTA_ZEMIFIED_SI
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
RETURN_ERROR, RETURN_INFO
| Constructor and Description |
|---|
ZemantaExtractor() |
| Modifier and Type | Method and Description |
|---|---|
boolean |
_extractTopicsFrom(java.io.File file,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.io.InputStream in,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.lang.String data,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.net.URL url,
TopicMap topicMap) |
java.lang.String |
getDescription()
AdminToolManager shows tool descriptions while the user browses available
tools and builds user-customizable GUI elements such as the Tools menu.
|
java.lang.String |
getName()
The tool's name represents the tool in the UI unless the tool has been
explicitly given another GUI name.
|
configure, doBrowserExtract, fillDocumentTopic, forgetAuthorization, getArticleTitleTopic, getArticleTitleType, getArticleTopic, getArticleType, getCategorizationTopic, getCategorizationType, getCategoryTopic, getCategoryType, getConfidenceTopic, getConfidenceType, getContentTypes, getDateTopic, getDateType, getDefaultLangType, getDocumentType, getFileContents, getIcon, getImageAttributionType, getImageDescriptionType, getImageLicenseType, getImageTopic, getImageType, getKeywordTopic, getKeywordType, getLargeImageType, getLinkAnchorTopic, getLinkAnchorType, getLinkTitleTopic, getLinkTitleType, getLinkType, getLinkTypeTopic, getLinkTypeType, getLinkUrlTopic, getLinkUrlType, getMediumImageType, getOrCreateTopic, getOrCreateTopic, getOrCreateTopic, getPublishedDateType, getRelevanceTopic, getRelevanceType, getSchemaTopic, getSchemaType, getSmallImageType, getSourceType, getStringFromDocument, getTopicType, getType, getWandoraClass, getZemantaType, getZemifiedTopic, getZemifiedType, isConfigurable, makeSubclassOf, sendRequest, solveAPIKey, solveAPIKey, solveTitle, useURLCrawler, writeOptions
acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
acceptBrowserExtractRequest, doBrowserExtract, getBrowserExtractorName
execute, execute, getContext, getToolMenuItem, hlog, initialize, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
public java.lang.String getName()
AbstractWandoraTool
getName in interface WandoraTool
getName in class AbstractExtractor
public java.lang.String getDescription()
AbstractWandoraTool
getDescription in interface WandoraTool
getDescription in class AbstractExtractor
public boolean _extractTopicsFrom(java.net.URL url,
TopicMap topicMap)
throws java.lang.Exception
_extractTopicsFrom in class AbstractExtractor
Throws: java.lang.Exception
public boolean _extractTopicsFrom(java.io.File file,
TopicMap topicMap)
throws java.lang.Exception
_extractTopicsFrom in class AbstractExtractor
Throws: java.lang.Exception
public boolean _extractTopicsFrom(java.io.InputStream in,
TopicMap topicMap)
throws java.lang.Exception
_extractTopicsFrom in class AbstractZemantaExtractor
Throws: java.lang.Exception
public boolean _extractTopicsFrom(java.lang.String data,
TopicMap topicMap)
throws java.lang.Exception
_extractTopicsFrom in class AbstractExtractor
Throws: java.lang.Exception
Copyright 2004-2015 Wandora Team