public class XMLSubj3ctRecordExtractor extends AbstractExtractor
Modifier and Type | Class and Description |
---|---|
private class |
XMLSubj3ctRecordExtractor.Subj3ctResultParser |
Modifier and Type | Field and Description |
---|---|
private java.lang.String[] |
contentTypes |
private java.lang.String |
defaultEncoding |
static boolean |
DESCRIPTION_AS_OCCURRENCE |
static boolean |
DESCRIPTION_AS_PLAYER |
protected java.lang.String |
DESCRIPTION_SI |
protected java.lang.String |
EQUIVALENCE_SI |
protected java.lang.String |
EQUIVALENT_TOPIC_SI |
static boolean |
OVERRIDE_BASENAME |
protected java.lang.String |
PROVENANCE_SI |
protected java.lang.String |
RECORDLINK_SI |
protected java.lang.String |
REPRESENTATION_SI |
protected java.lang.String |
REPRESENTATION_TOPIC_SI |
protected java.lang.String |
SI_BASE |
protected java.lang.String |
SUBJ3CT |
protected java.lang.String |
SUBJ3CT_TYPE_SI |
protected java.lang.String |
TOPIC_SI |
protected java.lang.String |
TRUST_SI |
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
Constructor and Description |
---|
XMLSubj3ctRecordExtractor()
Creates a new instance of XMLSubj3ctRecordExtractor
|
Modifier and Type | Method and Description |
---|---|
boolean |
_extractTopicsFrom(java.io.File file,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.io.InputStream in,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.lang.String in,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.net.URL url,
TopicMap topicMap) |
java.lang.String[] |
getContentTypes()
Returns an array of String containing the content-types this
ContentHandler can process. |
java.lang.String |
getDescription()
AdminToolManager displays tool descriptions while the user browses available
tools and builds user-customizable GUI elements such as the Tools menu.
|
Topic |
getDescriptionTopic(java.lang.String description,
TopicMap tm) |
Topic |
getDescriptionType(TopicMap tm) |
Topic |
getEquivalenceType(TopicMap tm) |
Topic |
getEquivalentTopicType(TopicMap tm) |
javax.swing.Icon |
getIcon()
All tools may have an identifying graphic icon used within tool GUI elements.
|
java.lang.String |
getName()
A tool's name represents the tool in the UI unless the tool has explicitly been
given another GUI name.
|
protected Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si) |
protected Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si,
java.lang.String bn) |
Topic |
getProvenanceTopic(java.lang.String provinance,
TopicMap tm) |
Topic |
getProvenanceType(TopicMap tm) |
Topic |
getRecordlinkTopic(java.lang.String recordlink,
TopicMap tm) |
Topic |
getRecordlinkType(TopicMap tm) |
Topic |
getRepresentationTopicType(TopicMap tm) |
Topic |
getRepresentationType(TopicMap tm) |
Topic |
getSubj3ctClass(TopicMap tm) |
Topic |
getSubj3ctType(TopicMap tm) |
Topic |
getTopicType(TopicMap tm) |
Topic |
getTrustTopic(java.lang.String trust,
TopicMap tm) |
Topic |
getTrustType(TopicMap tm) |
Topic |
getWandoraClass(TopicMap tm) |
protected void |
makeSubclassOf(TopicMap tm,
Topic t,
Topic superclass) |
boolean |
useURLCrawler() |
acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, getContext, getToolMenuItem, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
public static final boolean OVERRIDE_BASENAME
public static final boolean DESCRIPTION_AS_OCCURRENCE
public static final boolean DESCRIPTION_AS_PLAYER
protected java.lang.String SUBJ3CT
protected java.lang.String SI_BASE
protected java.lang.String PROVENANCE_SI
protected java.lang.String DESCRIPTION_SI
protected java.lang.String RECORDLINK_SI
protected java.lang.String TRUST_SI
protected java.lang.String EQUIVALENCE_SI
protected java.lang.String EQUIVALENT_TOPIC_SI
protected java.lang.String REPRESENTATION_SI
protected java.lang.String REPRESENTATION_TOPIC_SI
protected java.lang.String TOPIC_SI
protected java.lang.String SUBJ3CT_TYPE_SI
private java.lang.String defaultEncoding
private final java.lang.String[] contentTypes
public XMLSubj3ctRecordExtractor()
public java.lang.String getName()
AbstractWandoraTool
getName
in interface WandoraTool
getName
in class AbstractExtractor
public java.lang.String getDescription()
AbstractWandoraTool
getDescription
in interface WandoraTool
getDescription
in class AbstractExtractor
public javax.swing.Icon getIcon()
AbstractWandoraTool
getIcon should return the Icon object of the tool.
getIcon
in interface WandoraTool
getIcon
in class AbstractExtractor
public java.lang.String[] getContentTypes()
Handler
Returns an array of String containing the content-types this
ContentHandler can process.
getContentTypes
in interface Handler
getContentTypes
in class AbstractExtractor
public boolean useURLCrawler()
useURLCrawler
in class AbstractExtractor
public boolean _extractTopicsFrom(java.net.URL url, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.File file, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.InputStream in, TopicMap topicMap) throws java.lang.Exception
java.lang.Exception
public boolean _extractTopicsFrom(java.lang.String in, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public Topic getProvenanceTopic(java.lang.String provinance, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getProvenanceType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getTrustTopic(java.lang.String trust, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getTrustType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDescriptionTopic(java.lang.String description, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDescriptionType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getRecordlinkTopic(java.lang.String recordlink, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getRecordlinkType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getTopicType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getSubj3ctType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEquivalenceType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEquivalentTopicType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getRepresentationType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getRepresentationTopicType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getSubj3ctClass(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getWandoraClass(TopicMap tm) throws TopicMapException
TopicMapException
protected Topic getOrCreateTopic(TopicMap tm, java.lang.String si) throws TopicMapException
TopicMapException
protected Topic getOrCreateTopic(TopicMap tm, java.lang.String si, java.lang.String bn) throws TopicMapException
TopicMapException
protected void makeSubclassOf(TopicMap tm, Topic t, Topic superclass) throws TopicMapException
TopicMapException
Copyright 2004-2015 Wandora Team