public class DublinCoreXMLExtractor extends AbstractExtractor
Modifier and Type | Class and Description |
---|---|
private class |
DublinCoreXMLExtractor.DublinCoreXMLParser |
Modifier and Type | Field and Description |
---|---|
protected java.lang.String |
ABSTRACT_SI |
protected java.lang.String |
ALTERNATIVE_SI |
static boolean |
APPEND_OCCURRENCE_ABSTRACT |
static boolean |
APPEND_OCCURRENCE_ALTERNATIVE |
static boolean |
APPEND_OCCURRENCE_DESCRIPTION |
static boolean |
APPEND_OCCURRENCE_TABLEOFCONTENTS |
protected java.lang.String |
AUDIENCE_SI |
protected java.lang.String |
AVAILABLE_SI |
private java.lang.String[] |
contentTypes |
protected java.lang.String |
CONTRIBUTOR_SI |
protected java.lang.String |
COVERAGE_SI |
protected java.lang.String |
CREATED_SI |
protected java.lang.String |
CREATOR_SI |
protected java.lang.String |
DATE_SI |
private java.lang.String |
defaultEncoding |
static boolean |
DESCRIPTION_AS_OCCURRENCE |
static boolean |
DESCRIPTION_AS_PLAYER |
protected java.lang.String |
DESCRIPTION_SI |
protected java.lang.String |
EXTENT_SI |
protected java.lang.String |
FORMAT_SI |
static boolean |
IDENTIFIER_AS_SI |
protected java.lang.String |
IDENTIFIER_SI |
protected java.lang.String |
ISSUED_SI |
protected java.lang.String |
LANGUAGE_SI |
protected java.lang.String |
MEDIUM_SI |
protected java.lang.String |
MODIFIED_SI |
protected java.lang.String |
PUBLISHER_SI |
protected java.lang.String |
RECORD_SI |
protected java.lang.String |
RELATION_SI |
protected java.lang.String |
RIGHTS_SI |
protected java.lang.String |
SI_BASE |
protected java.lang.String |
SOURCE_SI |
protected java.lang.String |
SUBJECT_SI |
protected java.lang.String |
TABLEOFCONTENTS_SI |
protected java.lang.String |
TYPE_SI |
protected java.lang.String |
VALID_SI |
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
Constructor and Description |
---|
DublinCoreXMLExtractor()
Creates a new instance of DublinCoreXMLExtractor
|
Modifier and Type | Method and Description |
---|---|
boolean |
_extractTopicsFrom(java.io.File file,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.io.InputStream in,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.lang.String in,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.net.URL url,
TopicMap topicMap) |
private boolean |
equalTags(java.lang.String t1,
java.lang.String t2) |
Topic |
getAbstractTopic(java.lang.String abst,
TopicMap tm) |
Topic |
getAbstractType(TopicMap tm) |
Topic |
getAlternativeTopic(java.lang.String alt,
TopicMap tm) |
Topic |
getAlternativeType(TopicMap tm) |
Topic |
getAudienceTopic(java.lang.String audience,
TopicMap tm) |
Topic |
getAudienceType(TopicMap tm) |
Topic |
getAvailableTopic(java.lang.String available,
TopicMap tm) |
Topic |
getAvailableType(TopicMap tm) |
java.lang.String[] |
getContentTypes()
Returns an array of String containing the content-types this
ContentHandler can process. |
Topic |
getContributorTopic(java.lang.String contributor,
TopicMap tm) |
Topic |
getContributorType(TopicMap tm) |
Topic |
getCoverageTopic(java.lang.String coverage,
TopicMap tm) |
Topic |
getCoverageType(TopicMap tm) |
Topic |
getCreatedTopic(java.lang.String created,
TopicMap tm) |
Topic |
getCreatedType(TopicMap tm) |
Topic |
getCreatorTopic(java.lang.String creator,
TopicMap tm) |
Topic |
getCreatorType(TopicMap tm) |
Topic |
getDateTopic(java.lang.String date,
TopicMap tm) |
Topic |
getDateType(TopicMap tm) |
Topic |
getDCClass(TopicMap tm) |
java.lang.String |
getDescription()
AdminToolManager views tool descriptions while the user browses available
tools and builds user-customizable GUI elements such as the Tools menu.
|
Topic |
getDescriptionTopic(java.lang.String description,
TopicMap tm) |
Topic |
getDescriptionType(TopicMap tm) |
Topic |
getExtentTopic(java.lang.String extent,
TopicMap tm) |
Topic |
getExtentType(TopicMap tm) |
Topic |
getFormatTopic(java.lang.String format,
TopicMap tm) |
Topic |
getFormatType(TopicMap tm) |
javax.swing.Icon |
getIcon()
All tools may have an identifying graphic icon used within tool GUI elements.
|
Topic |
getIdentifierTopic(java.lang.String identifier,
TopicMap tm) |
Topic |
getIdentifierType(TopicMap tm) |
Topic |
getIssuedTopic(java.lang.String issued,
TopicMap tm) |
Topic |
getIssuedType(TopicMap tm) |
Topic |
getLanguageTopic(java.lang.String language,
TopicMap tm) |
Topic |
getLanguageType(TopicMap tm) |
Topic |
getMediumTopic(java.lang.String medium,
TopicMap tm) |
Topic |
getMediumType(TopicMap tm) |
Topic |
getModifiedTopic(java.lang.String modified,
TopicMap tm) |
Topic |
getModifiedType(TopicMap tm) |
java.lang.String |
getName()
The tool's name represents the tool in the UI unless the tool has been
explicitly given another GUI name.
|
protected Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si) |
protected Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si,
java.lang.String bn) |
protected Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si,
java.lang.String bn,
Topic type) |
Topic |
getPublisherTopic(java.lang.String publisher,
TopicMap tm) |
Topic |
getPublisherType(TopicMap tm) |
Topic |
getRecordType(TopicMap tm) |
Topic |
getRelationTopic(java.lang.String relation,
TopicMap tm) |
Topic |
getRelationType(TopicMap tm) |
Topic |
getRightsTopic(java.lang.String rights,
TopicMap tm) |
Topic |
getRightsType(TopicMap tm) |
Topic |
getSourceTopic(java.lang.String source,
TopicMap tm) |
Topic |
getSourceType(TopicMap tm) |
Topic |
getSubjectTopic(java.lang.String subject,
TopicMap tm) |
Topic |
getSubjectType(TopicMap tm) |
Topic |
getTableOfContentsTopic(java.lang.String toc,
TopicMap tm) |
Topic |
getTableOfContentsType(TopicMap tm) |
Topic |
getTopic(TopicMap tm,
java.lang.String str,
java.lang.String SIBase,
Topic type) |
Topic |
getTypeTopic(java.lang.String type,
TopicMap tm) |
Topic |
getTypeType(TopicMap tm) |
Topic |
getValidTopic(java.lang.String valid,
TopicMap tm) |
Topic |
getValidType(TopicMap tm) |
Topic |
getWandoraClass(TopicMap tm) |
protected java.lang.String |
makeSI(java.lang.String base,
java.lang.String endPoint) |
protected void |
makeSubclassOf(TopicMap tm,
Topic t,
Topic superclass) |
boolean |
useURLCrawler() |
acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, getContext, getToolMenuItem, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
public static boolean IDENTIFIER_AS_SI
public static boolean DESCRIPTION_AS_PLAYER
public static boolean DESCRIPTION_AS_OCCURRENCE
public static boolean APPEND_OCCURRENCE_DESCRIPTION
public static boolean APPEND_OCCURRENCE_ALTERNATIVE
public static boolean APPEND_OCCURRENCE_TABLEOFCONTENTS
public static boolean APPEND_OCCURRENCE_ABSTRACT
protected java.lang.String SI_BASE
protected java.lang.String RECORD_SI
protected java.lang.String CREATOR_SI
protected java.lang.String TYPE_SI
protected java.lang.String PUBLISHER_SI
protected java.lang.String CONTRIBUTOR_SI
protected java.lang.String DATE_SI
protected java.lang.String DESCRIPTION_SI
protected java.lang.String LANGUAGE_SI
protected java.lang.String SUBJECT_SI
protected java.lang.String IDENTIFIER_SI
protected java.lang.String FORMAT_SI
protected java.lang.String SOURCE_SI
protected java.lang.String RELATION_SI
protected java.lang.String COVERAGE_SI
protected java.lang.String RIGHTS_SI
protected java.lang.String AUDIENCE_SI
protected java.lang.String ALTERNATIVE_SI
protected java.lang.String TABLEOFCONTENTS_SI
protected java.lang.String ABSTRACT_SI
protected java.lang.String CREATED_SI
protected java.lang.String VALID_SI
protected java.lang.String AVAILABLE_SI
protected java.lang.String ISSUED_SI
protected java.lang.String MODIFIED_SI
protected java.lang.String EXTENT_SI
protected java.lang.String MEDIUM_SI
private java.lang.String defaultEncoding
private final java.lang.String[] contentTypes
public DublinCoreXMLExtractor()
public java.lang.String getName()
AbstractWandoraTool
getName
in interface WandoraTool
getName
in class AbstractExtractor
public java.lang.String getDescription()
AbstractWandoraTool
getDescription
in interface WandoraTool
getDescription
in class AbstractExtractor
public javax.swing.Icon getIcon()
AbstractWandoraTool
getIcon should return the Icon object of the tool.
getIcon
in interface WandoraTool
getIcon
in class AbstractExtractor
public java.lang.String[] getContentTypes()
Handler
Returns an array of String containing the content-types this ContentHandler can process.
getContentTypes
in interface Handler
getContentTypes
in class AbstractExtractor
public boolean useURLCrawler()
useURLCrawler
in class AbstractExtractor
public boolean _extractTopicsFrom(java.net.URL url, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.File file, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.InputStream in, TopicMap topicMap) throws java.lang.Exception
java.lang.Exception
public boolean _extractTopicsFrom(java.lang.String in, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public Topic getDescriptionTopic(java.lang.String description, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDescriptionType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getIdentifierTopic(java.lang.String identifier, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getIdentifierType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getSubjectTopic(java.lang.String subject, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getSubjectType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getTypeTopic(java.lang.String type, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getTypeType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getFormatTopic(java.lang.String format, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getFormatType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDateTopic(java.lang.String date, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDateType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getPublisherTopic(java.lang.String publisher, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getPublisherType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getContributorTopic(java.lang.String contributor, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getContributorType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getLanguageTopic(java.lang.String language, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getLanguageType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getCreatorTopic(java.lang.String creator, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getCreatorType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getSourceTopic(java.lang.String source, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getSourceType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getRelationTopic(java.lang.String relation, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getRelationType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getCoverageTopic(java.lang.String coverage, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getCoverageType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getRightsTopic(java.lang.String rights, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getRightsType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getAudienceTopic(java.lang.String audience, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getAudienceType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getAlternativeTopic(java.lang.String alt, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getAlternativeType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getTableOfContentsTopic(java.lang.String toc, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getTableOfContentsType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getAbstractTopic(java.lang.String abst, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getAbstractType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getCreatedTopic(java.lang.String created, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getCreatedType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getValidTopic(java.lang.String valid, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getValidType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getAvailableTopic(java.lang.String available, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getAvailableType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getIssuedTopic(java.lang.String issued, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getIssuedType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getModifiedTopic(java.lang.String modified, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getModifiedType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getExtentTopic(java.lang.String extent, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getExtentType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getMediumTopic(java.lang.String medium, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getMediumType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getRecordType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDCClass(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getWandoraClass(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getTopic(TopicMap tm, java.lang.String str, java.lang.String SIBase, Topic type) throws TopicMapException
TopicMapException
protected Topic getOrCreateTopic(TopicMap tm, java.lang.String si) throws TopicMapException
TopicMapException
protected Topic getOrCreateTopic(TopicMap tm, java.lang.String si, java.lang.String bn) throws TopicMapException
TopicMapException
protected Topic getOrCreateTopic(TopicMap tm, java.lang.String si, java.lang.String bn, Topic type) throws TopicMapException
TopicMapException
protected void makeSubclassOf(TopicMap tm, Topic t, Topic superclass) throws TopicMapException
TopicMapException
protected java.lang.String makeSI(java.lang.String base, java.lang.String endPoint)
private boolean equalTags(java.lang.String t1, java.lang.String t2)
Copyright 2004-2015 Wandora Team