public abstract class AbstractUmbelExtractor extends AbstractExtractor
Modifier and Type | Field and Description |
---|---|
static boolean |
ADD_DISTANCE_AS_PLAYER |
private java.lang.String[] |
contentTypes |
protected static java.lang.String |
csvEncoding |
protected static char |
csvLineSeparator |
protected static char |
csvStringCharacter |
protected static char |
csvValueSeparator |
static int |
FILE_CONTAINS_PLAIN_UMBEL_CONCEPT |
static int |
FILE_CONTAINS_UMBEL_CONCEPT_URLS |
static int |
FILE_IS_CSV_OF_UMBEL_CONCEPTS |
static int |
fileProcessor |
static int |
filterDistancesBelow |
static boolean |
getOnlyImmediateNeighbours |
static java.lang.String |
LANG |
static java.lang.String |
UMBEL_ALT_LABEL_URI |
static java.lang.String |
UMBEL_BROADER_NARROWER_TYPE_NAME |
static java.lang.String |
UMBEL_BROADER_NARROWER_TYPE_SI |
static java.lang.String |
UMBEL_BROADER_TYPE_NAME |
static java.lang.String |
UMBEL_BROADER_TYPE_SI |
static java.lang.String[] |
UMBEL_BROADER_URI |
static java.lang.String |
UMBEL_CONCEPT_STRING_SPLITTER |
static java.lang.String |
UMBEL_CONCEPT_TYPE_NAME |
static java.lang.String |
UMBEL_CONCEPT_TYPE_SI |
static java.lang.String |
UMBEL_CONCEPT_URI_BASE |
static java.lang.String |
UMBEL_DEFINITION_URI |
static java.lang.String |
UMBEL_DISJOINT_TYPE_NAME |
static java.lang.String |
UMBEL_DISJOINT_TYPE_SI |
static java.lang.String[] |
UMBEL_DISJOINT_URI |
static java.lang.String |
UMBEL_DISTANCE_TYPE_NAME |
static java.lang.String |
UMBEL_DISTANCE_TYPE_SI |
static java.lang.String |
UMBEL_NARROWER_TYPE_NAME |
static java.lang.String |
UMBEL_NARROWER_TYPE_SI |
static java.lang.String[] |
UMBEL_NARROWER_URI |
static java.lang.String |
UMBEL_PREF_LABEL_URI |
static java.lang.String |
UMBEL_SUBCLASS_TYPE_NAME |
static java.lang.String |
UMBEL_SUBCLASS_TYPE_SI |
static java.lang.String[] |
UMBEL_SUBCLASS_URI |
static java.lang.String |
UMBEL_SUPER_TYPE_URI_BASE |
static java.lang.String |
UMBEL_SUPERCLASS_SUBCLASS_TYPE_NAME |
static java.lang.String |
UMBEL_SUPERCLASS_SUBCLASS_TYPE_SI |
static java.lang.String |
UMBEL_SUPERCLASS_TYPE_NAME |
static java.lang.String |
UMBEL_SUPERCLASS_TYPE_SI |
static java.lang.String[] |
UMBEL_SUPERCLASS_URI |
static java.lang.String |
UMBEL_TYPE_NAME |
static java.lang.String |
UMBEL_TYPE_SI |
static java.lang.String |
UMBEL_TYPE_TYPE_NAME |
static java.lang.String |
UMBEL_TYPE_TYPE_SI |
static java.lang.String[] |
UMBEL_TYPE_URI |
static boolean |
useXTMSuperclassSubclassTopics |
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
Constructor and Description |
---|
AbstractUmbelExtractor() |
Modifier and Type | Method and Description |
---|---|
boolean |
_extractTopicsFrom(java.io.File file,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.net.URL url,
TopicMap topicMap) |
protected boolean |
equalsAny(java.lang.String a,
java.lang.String[] b) |
abstract java.lang.String |
getApiRequestUrlFor(java.lang.String str) |
protected Tuples.T3<Topic,Topic,Topic> |
getAssociationTopicsForUmbelPredicate(java.lang.String predicate,
TopicMap tm) |
protected Topic |
getBroaderNarrowerTypeTopic(TopicMap topicMap) |
protected Topic |
getBroaderTypeTopic(TopicMap topicMap) |
protected Topic |
getConceptTopic(java.lang.String si,
java.lang.String label,
TopicMap topicMap) |
protected Topic |
getConceptTopic(java.lang.String si,
TopicMap topicMap) |
protected Topic |
getConceptTypeTopic(TopicMap topicMap) |
java.lang.String[] |
getContentTypes()
Returns an array of String containing the content-types this
ContentHandler can process. |
java.lang.String |
getDescription()
AdminToolManager shows tool descriptions while the user browses available
tools and builds user-customizable GUI elements such as the Tools menu.
|
protected Topic |
getDisjointTypeTopic(TopicMap topicMap) |
protected Topic |
getDistanceTopic(int distance,
TopicMap topicMap) |
protected Topic |
getDistanceTypeTopic(TopicMap topicMap) |
int |
getExtractorType() |
javax.swing.Icon |
getIcon()
All tools may have an identifying graphic icon used within tool GUI elements.
|
java.lang.String |
getName()
The tool's name represents the tool in the UI unless the tool has explicitly
been given another GUI name.
|
protected Topic |
getNarrowerTypeTopic(TopicMap topicMap) |
protected Topic |
getSubclassTypeTopic(TopicMap topicMap) |
protected Topic |
getSuperclassSubclassTypeTopic(TopicMap topicMap) |
protected Topic |
getSuperclassTypeTopic(TopicMap topicMap) |
protected Topic |
getTopic(java.lang.String si,
java.lang.String name,
TopicMap topicMap) |
protected Topic |
getTopic(java.lang.String si,
TopicMap topicMap) |
protected Topic |
getTypeTypeTopic(TopicMap topicMap) |
java.lang.String |
getUmbelConceptURI(java.lang.String label) |
protected Topic |
getUmbelTypeTopic(TopicMap topicMap) |
protected boolean |
isURL(java.lang.String u) |
protected org.json.JSONObject |
performRequest(java.lang.String urlStr,
java.lang.String concept) |
protected java.lang.String |
robustGet(org.json.JSONObject json,
java.lang.String key) |
protected int |
robustGetInt(org.json.JSONObject json,
java.lang.String key) |
boolean |
useURLCrawler() |
_extractTopicsFrom, acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, getContext, getToolMenuItem, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
public static final java.lang.String UMBEL_CONCEPT_STRING_SPLITTER
public static final int FILE_CONTAINS_UMBEL_CONCEPT_URLS
public static final int FILE_CONTAINS_PLAIN_UMBEL_CONCEPT
public static final int FILE_IS_CSV_OF_UMBEL_CONCEPTS
public static int fileProcessor
public static boolean ADD_DISTANCE_AS_PLAYER
public static int filterDistancesBelow
public static boolean getOnlyImmediateNeighbours
public static boolean useXTMSuperclassSubclassTopics
protected static char csvStringCharacter
protected static char csvLineSeparator
protected static char csvValueSeparator
protected static java.lang.String csvEncoding
public static java.lang.String LANG
public static final java.lang.String UMBEL_CONCEPT_URI_BASE
public static final java.lang.String UMBEL_SUPER_TYPE_URI_BASE
public static final java.lang.String UMBEL_TYPE_SI
public static final java.lang.String UMBEL_TYPE_NAME
public static final java.lang.String UMBEL_CONCEPT_TYPE_SI
public static final java.lang.String UMBEL_CONCEPT_TYPE_NAME
public static final java.lang.String UMBEL_BROADER_NARROWER_TYPE_SI
public static final java.lang.String UMBEL_BROADER_NARROWER_TYPE_NAME
public static final java.lang.String UMBEL_NARROWER_TYPE_SI
public static final java.lang.String UMBEL_NARROWER_TYPE_NAME
public static final java.lang.String UMBEL_BROADER_TYPE_SI
public static final java.lang.String UMBEL_BROADER_TYPE_NAME
public static final java.lang.String UMBEL_SUPERCLASS_SUBCLASS_TYPE_SI
public static final java.lang.String UMBEL_SUPERCLASS_SUBCLASS_TYPE_NAME
public static final java.lang.String UMBEL_SUBCLASS_TYPE_SI
public static final java.lang.String UMBEL_SUBCLASS_TYPE_NAME
public static final java.lang.String UMBEL_SUPERCLASS_TYPE_SI
public static final java.lang.String UMBEL_SUPERCLASS_TYPE_NAME
public static final java.lang.String UMBEL_TYPE_TYPE_SI
public static final java.lang.String UMBEL_TYPE_TYPE_NAME
public static final java.lang.String UMBEL_DISTANCE_TYPE_SI
public static final java.lang.String UMBEL_DISTANCE_TYPE_NAME
public static final java.lang.String UMBEL_DISJOINT_TYPE_SI
public static final java.lang.String UMBEL_DISJOINT_TYPE_NAME
public static final java.lang.String UMBEL_PREF_LABEL_URI
public static final java.lang.String UMBEL_ALT_LABEL_URI
public static final java.lang.String UMBEL_DEFINITION_URI
public static final java.lang.String[] UMBEL_SUBCLASS_URI
public static final java.lang.String[] UMBEL_SUPERCLASS_URI
public static final java.lang.String[] UMBEL_NARROWER_URI
public static final java.lang.String[] UMBEL_BROADER_URI
public static final java.lang.String[] UMBEL_TYPE_URI
public static final java.lang.String[] UMBEL_DISJOINT_URI
private final java.lang.String[] contentTypes
public java.lang.String getName()
AbstractWandoraTool
getName
in interface WandoraTool
getName
in class AbstractExtractor
public java.lang.String getDescription()
AbstractWandoraTool
getDescription
in interface WandoraTool
getDescription
in class AbstractExtractor
public javax.swing.Icon getIcon()
AbstractWandoraTool
getIcon should return the Icon object of the tool.
getIcon
in interface WandoraTool
getIcon
in class AbstractExtractor
public java.lang.String[] getContentTypes()
Handler
Returns an array of String containing the content-types this ContentHandler
can process.
getContentTypes
in interface Handler
getContentTypes
in class AbstractExtractor
public boolean useURLCrawler()
useURLCrawler
in class AbstractExtractor
public int getExtractorType()
getExtractorType
in class AbstractExtractor
public abstract java.lang.String getApiRequestUrlFor(java.lang.String str)
public boolean _extractTopicsFrom(java.net.URL url, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.File file, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public java.lang.String getUmbelConceptURI(java.lang.String label)
protected org.json.JSONObject performRequest(java.lang.String urlStr, java.lang.String concept)
protected java.lang.String robustGet(org.json.JSONObject json, java.lang.String key)
protected int robustGetInt(org.json.JSONObject json, java.lang.String key)
protected Topic getConceptTopic(java.lang.String si, java.lang.String label, TopicMap topicMap)
protected boolean isURL(java.lang.String u)
protected Topic getUmbelTypeTopic(TopicMap topicMap) throws TopicMapException
TopicMapException
protected Topic getBroaderNarrowerTypeTopic(TopicMap topicMap) throws TopicMapException
TopicMapException
protected Topic getNarrowerTypeTopic(TopicMap topicMap) throws TopicMapException
TopicMapException
protected Topic getBroaderTypeTopic(TopicMap topicMap) throws TopicMapException
TopicMapException
protected Topic getDisjointTypeTopic(TopicMap topicMap) throws TopicMapException
TopicMapException
protected Topic getTypeTypeTopic(TopicMap topicMap) throws TopicMapException
TopicMapException
protected Topic getSuperclassSubclassTypeTopic(TopicMap topicMap) throws TopicMapException
TopicMapException
protected Topic getSubclassTypeTopic(TopicMap topicMap) throws TopicMapException
TopicMapException
protected Topic getSuperclassTypeTopic(TopicMap topicMap) throws TopicMapException
TopicMapException
protected Topic getConceptTypeTopic(TopicMap topicMap) throws TopicMapException
TopicMapException
protected Topic getDistanceTopic(int distance, TopicMap topicMap) throws TopicMapException
TopicMapException
protected Topic getDistanceTypeTopic(TopicMap topicMap) throws TopicMapException
TopicMapException
protected Tuples.T3<Topic,Topic,Topic> getAssociationTopicsForUmbelPredicate(java.lang.String predicate, TopicMap tm)
protected boolean equalsAny(java.lang.String a, java.lang.String[] b)
Copyright 2004-2015 Wandora Team