public class RISExtractor extends AbstractExtractor
Modifier and Type | Field and Description |
---|---|
private java.lang.String |
mEncoding |
java.lang.String[] |
risContentTypes |
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
Constructor and Description |
---|
RISExtractor() |
Modifier and Type | Method and Description |
---|---|
boolean |
_extractTopicsFrom(java.io.File f,
TopicMap map) |
boolean |
_extractTopicsFrom(java.lang.String str,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.net.URL u,
TopicMap t) |
void |
configure(Wandora admin,
Options options,
java.lang.String prefix)
If the tool is configurable, shows a user interface to configure the tool.
|
Topic |
createTopic(TopicMap topicMap,
java.lang.String baseString) |
Topic |
createTopic(TopicMap topicMap,
java.lang.String siString,
java.lang.String baseString) |
Topic |
createTopic(TopicMap topicMap,
java.lang.String siString,
java.lang.String baseNameString,
java.lang.String baseString) |
Topic |
createTopic(TopicMap topicMap,
java.lang.String siString,
java.lang.String baseNameString,
java.lang.String baseString,
Topic type) |
Topic |
createTopic(TopicMap topicMap,
java.lang.String siString,
java.lang.String baseNameString,
java.lang.String baseString,
Topic[] types) |
Topic |
createTopic(TopicMap topicMap,
java.lang.String siString,
java.lang.String baseString,
Topic type) |
Topic |
createTopic(TopicMap topicMap,
java.lang.String baseString,
Topic type) |
private boolean |
extract(java.nio.CharBuffer cb,
TopicMap map) |
java.lang.String[] |
getContentTypes()
Returns an array of String containing the content-types this
ContentHandler can process. |
protected java.lang.String |
getDateString(RISReference.Date date)
ISO 8601
|
java.lang.String |
getDescription()
AdminToolManager views tool descriptions while the user browses available
tools and builds user-customizable GUI elements such as the Tools menu.
|
java.lang.String |
getName()
The tool's name represents the tool in the UI unless the tool has
explicitly been given another GUI name.
|
private java.lang.String |
implode(java.lang.String[] vals,
java.lang.String sep) |
boolean |
isConfigurable()
Whether this tool is configurable.
|
static void |
main(java.lang.String[] args) |
private void |
makeSubClass(TopicMap map,
Topic subClass,
Topic superClass) |
private java.lang.String |
url(java.lang.String str) |
boolean |
useTempTopicMap() |
acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getIcon, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useURLCrawler
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
execute, execute, getContext, getToolMenuItem, hlog, initialize, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
private java.lang.String mEncoding
public final java.lang.String[] risContentTypes
public java.lang.String getName()
AbstractWandoraTool
getName
in interface WandoraTool
getName
in class AbstractExtractor
public java.lang.String getDescription()
AbstractWandoraTool
getDescription
in interface WandoraTool
getDescription
in class AbstractExtractor
public Topic createTopic(TopicMap topicMap, java.lang.String baseString) throws TopicMapException
createTopic
in class AbstractExtractor
TopicMapException
public Topic createTopic(TopicMap topicMap, java.lang.String siString, java.lang.String baseString) throws TopicMapException
createTopic
in class AbstractExtractor
TopicMapException
public Topic createTopic(TopicMap topicMap, java.lang.String siString, java.lang.String baseString, Topic type) throws TopicMapException
createTopic
in class AbstractExtractor
TopicMapException
public Topic createTopic(TopicMap topicMap, java.lang.String baseString, Topic type) throws TopicMapException
createTopic
in class AbstractExtractor
TopicMapException
public Topic createTopic(TopicMap topicMap, java.lang.String siString, java.lang.String baseNameString, java.lang.String baseString) throws TopicMapException
createTopic
in class AbstractExtractor
TopicMapException
public Topic createTopic(TopicMap topicMap, java.lang.String siString, java.lang.String baseNameString, java.lang.String baseString, Topic type) throws TopicMapException
createTopic
in class AbstractExtractor
TopicMapException
public Topic createTopic(TopicMap topicMap, java.lang.String siString, java.lang.String baseNameString, java.lang.String baseString, Topic[] types) throws TopicMapException
createTopic
in class AbstractExtractor
TopicMapException
public boolean useTempTopicMap()
useTempTopicMap
in class AbstractExtractor
public boolean isConfigurable()
AbstractWandoraTool
isConfigurable
in interface WandoraTool
isConfigurable
in class AbstractWandoraTool
public void configure(Wandora admin, Options options, java.lang.String prefix) throws TopicMapException
AbstractWandoraTool
configure
in interface WandoraTool
configure
in class AbstractWandoraTool
TopicMapException
private java.lang.String url(java.lang.String str)
private boolean extract(java.nio.CharBuffer cb, TopicMap map)
public boolean _extractTopicsFrom(java.io.File f, TopicMap map) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public java.lang.String[] getContentTypes()
Handler
Returns an array of String containing the content-types this ContentHandler can process.
getContentTypes
in interface Handler
getContentTypes
in class AbstractExtractor
private java.lang.String implode(java.lang.String[] vals, java.lang.String sep)
public boolean _extractTopicsFrom(java.net.URL u, TopicMap t) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.lang.String str, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public static void main(java.lang.String[] args) throws java.lang.Exception
java.lang.Exception
protected java.lang.String getDateString(RISReference.Date date)
date
- Copyright 2004-2015 Wandora Team