public class Sentences2Associations extends AbstractExtractor implements WandoraTool
Modifier and Type | Field and Description |
---|---|
static boolean |
ADD_SOURCE_AS_PLAYER |
private java.net.URL |
basePath |
static java.lang.String[] |
contentTypes |
static java.lang.String |
ORDER_SI_BASE |
static java.lang.String |
ROLE_SI_BASE |
static java.lang.String |
SENTENCE_SI_BASE |
static java.lang.String |
SENTENCES_TO_ASSOCIATIONS |
static java.lang.String |
SOURCE_SI |
static java.lang.String |
WORD_SI_BASE |
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
Constructor and Description |
---|
Sentences2Associations()
Creates a new instance of Sentences2Associations
|
Modifier and Type | Method and Description |
---|---|
boolean |
_extractTopicsFrom(java.io.File file,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.lang.String str,
TopicMap tm) |
boolean |
_extractTopicsFrom(java.net.URL url,
TopicMap topicMap) |
void |
_extractTopicsFromStream(java.lang.String locator,
java.io.InputStream inputStream,
TopicMap tm) |
boolean |
browserExtractorConsumesPlainText() |
java.lang.String |
doBrowserExtract(BrowserExtractRequest request,
Wandora wandora) |
java.lang.String[] |
getContentTypes()
Returns an array of String containing the content-types this
ContentHandler can process. |
java.lang.String |
getDescription()
AdminToolManager views tool descriptions while the user browses available
tools and builds user-customizable GUI elements such as the Tools menu.
|
java.lang.String |
getGUIText(int textType) |
java.lang.String |
getName()
The tool's name represents the tool in the UI unless the tool has been
explicitly given another GUI name.
|
protected Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si,
java.lang.String bn) |
Topic |
getSentenceTopic(TopicMap tm) |
Topic |
getSentenceTypeTopic(TopicMap tm) |
Topic |
getWordTopic(TopicMap tm,
java.lang.String word) |
boolean |
isSentenceDelimiter(int c) |
boolean |
isWordDelimiter(int c) |
boolean |
useTempTopicMap() |
acceptBrowserExtractRequest, addCrawlerUrl, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getIcon, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useURLCrawler
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, execute, getContext, getIcon, getToolMenuItem, getType, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
public static boolean ADD_SOURCE_AS_PLAYER
public static java.lang.String SOURCE_SI
public static java.lang.String WORD_SI_BASE
public static java.lang.String ROLE_SI_BASE
public static java.lang.String SENTENCE_SI_BASE
public static java.lang.String ORDER_SI_BASE
public static java.lang.String SENTENCES_TO_ASSOCIATIONS
private java.net.URL basePath
public static final java.lang.String[] contentTypes
public Sentences2Associations()
public java.lang.String getName()
AbstractWandoraTool
getName
in interface WandoraTool
getName
in class AbstractExtractor
public java.lang.String getDescription()
AbstractWandoraTool
getDescription
in interface WandoraTool
getDescription
in class AbstractExtractor
public boolean useTempTopicMap()
useTempTopicMap
in class AbstractExtractor
public java.lang.String getGUIText(int textType)
getGUIText
in class AbstractExtractor
public boolean browserExtractorConsumesPlainText()
browserExtractorConsumesPlainText
in class AbstractExtractor
public java.lang.String doBrowserExtract(BrowserExtractRequest request, Wandora wandora) throws TopicMapException
doBrowserExtract
in interface BrowserPluginExtractor
doBrowserExtract
in class AbstractExtractor
TopicMapException
public boolean _extractTopicsFrom(java.net.URL url, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.File file, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.lang.String str, TopicMap tm) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public void _extractTopicsFromStream(java.lang.String locator, java.io.InputStream inputStream, TopicMap tm)
public boolean isWordDelimiter(int c)
public boolean isSentenceDelimiter(int c)
public Topic getSentenceTopic(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getWordTopic(TopicMap tm, java.lang.String word) throws TopicMapException
TopicMapException
public Topic getSentenceTypeTopic(TopicMap tm) throws TopicMapException
TopicMapException
protected Topic getOrCreateTopic(TopicMap tm, java.lang.String si, java.lang.String bn) throws TopicMapException
TopicMapException
public java.lang.String[] getContentTypes()
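Description copied from interface: Handler
Returns an array of String containing the content-types this ContentHandler can process.
Specified by: getContentTypes in interface Handler
Overrides: getContentTypes in class AbstractExtractor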
Copyright 2004-2015 Wandora Team