public class GellishExtractor extends AbstractExtractor implements WandoraTool
Modifier and Type | Field and Description |
---|---|
static boolean |
CONNECT_TO_WANDORA_CLASS |
static java.lang.String |
DEFAULT_LANG |
static boolean |
EXTRACT_EXTRAS |
java.lang.String |
locatorPrefix |
static boolean |
REMOVE_SPACES_IN_IDS |
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
Constructor and Description |
---|
GellishExtractor()
Creates a new instance of GellishExtractor
|
Modifier and Type | Method and Description |
---|---|
boolean |
_extractTopicsFrom(java.io.BufferedReader breader,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.io.File thesaurusFile,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.lang.String str,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.net.URL url,
TopicMap topicMap) |
protected boolean |
associationExists(Topic t1,
Topic t2,
Topic at) |
java.lang.String |
getDescription()
AdminToolManager shows tool descriptions while the user browses the available
tools and builds user-customizable GUI elements such as the Tools menu.
|
protected Topic |
getGellishClassTopic(TopicMap tm) |
java.lang.String |
getGUIText(int textType) |
java.lang.String |
getName()
The tool's name represents the tool in the UI unless the tool has explicitly
been given another GUI name.
|
protected Topic |
getOrCreateConceptTopic(TopicMap tm,
java.lang.String id,
java.lang.String name) |
protected Topic |
getOrCreateTopic(TopicMap topicmap,
Locator si,
java.lang.String baseName,
java.lang.String displayName) |
protected Topic |
getOrCreateTopic(TopicMap topicmap,
Locator si,
java.lang.String baseName,
java.lang.String displayName,
Topic typeTopic) |
protected Topic |
getOrCreateTopic(TopicMap topicmap,
java.lang.String si,
java.lang.String baseName,
java.lang.String displayName) |
protected java.lang.String |
getToken(int i,
java.lang.String[] arr) |
protected boolean |
isValid(java.lang.String str) |
protected Locator |
makeSI(java.lang.String str) |
protected Locator |
makeSI(java.lang.String prefix,
java.lang.String str) |
protected Locator |
makeSI(java.lang.String prefix,
java.lang.String str,
java.lang.String postfix) |
protected void |
makeSubclassOf(TopicMap tm,
Topic t,
Topic superclass) |
protected void |
makeSubclassOfGellish(TopicMap tm,
Topic subclass) |
protected java.lang.String |
removeSpacesIn(java.lang.String str) |
boolean |
useTempTopicMap() |
acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getContentTypes, getCrawlerMode, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getIcon, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useURLCrawler
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, execute, getContext, getIcon, getToolMenuItem, getType, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
public java.lang.String locatorPrefix
public static java.lang.String DEFAULT_LANG
public static boolean EXTRACT_EXTRAS
public static boolean REMOVE_SPACES_IN_IDS
public static boolean CONNECT_TO_WANDORA_CLASS
public GellishExtractor()
public java.lang.String getName()
Description copied from class: AbstractWandoraTool
Specified by: getName
in interface WandoraTool
Overrides: getName
in class AbstractExtractor
public java.lang.String getDescription()
Description copied from class: AbstractWandoraTool
Specified by: getDescription
in interface WandoraTool
Overrides: getDescription
in class AbstractExtractor
public java.lang.String getGUIText(int textType)
getGUIText
in class AbstractExtractor
public boolean _extractTopicsFrom(java.lang.String str, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.net.URL url, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.File thesaurusFile, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.BufferedReader breader, TopicMap topicMap) throws java.lang.Exception
java.lang.Exception
protected java.lang.String getToken(int i, java.lang.String[] arr)
protected boolean isValid(java.lang.String str)
protected java.lang.String removeSpacesIn(java.lang.String str)
protected Topic getOrCreateConceptTopic(TopicMap tm, java.lang.String id, java.lang.String name)
protected Topic getOrCreateTopic(TopicMap topicmap, java.lang.String si, java.lang.String baseName, java.lang.String displayName)
protected Topic getOrCreateTopic(TopicMap topicmap, Locator si, java.lang.String baseName, java.lang.String displayName)
protected Topic getOrCreateTopic(TopicMap topicmap, Locator si, java.lang.String baseName, java.lang.String displayName, Topic typeTopic)
protected Locator makeSI(java.lang.String str)
protected Locator makeSI(java.lang.String prefix, java.lang.String str)
protected Locator makeSI(java.lang.String prefix, java.lang.String str, java.lang.String postfix)
protected void makeSubclassOfGellish(TopicMap tm, Topic subclass) throws TopicMapException
TopicMapException
protected void makeSubclassOf(TopicMap tm, Topic t, Topic superclass) throws TopicMapException
TopicMapException
protected Topic getGellishClassTopic(TopicMap tm) throws TopicMapException
TopicMapException
public boolean useTempTopicMap()
useTempTopicMap
in class AbstractExtractor
Copyright 2004-2015 Wandora Team