public abstract class AbstractGuardianExtractor extends AbstractExtractor
Modifier and Type | Field and Description |
---|---|
static java.lang.String |
API_URL_SI |
static java.lang.String |
CONTENT_SI |
private java.lang.String[] |
contentTypes |
static java.lang.String |
DATE_SI |
static java.lang.String |
FIELD_BASE_SI |
private static java.util.HashMap<java.lang.String,java.lang.String> |
fieldNames |
static java.lang.String |
GUARDIAN_BASE_SI |
static java.lang.String |
ID_SI |
static java.lang.String |
LANG_SI |
static java.lang.String |
PUBLICATION_TIME_SI |
static java.lang.String |
SECTION_ID_SI |
static java.lang.String |
SECTION_NAME_SI |
static java.lang.String |
TAG_BASE_SI |
static java.lang.String |
TITLE_SI |
static java.lang.String |
WEB_URL_SI |
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
Constructor and Description |
---|
AbstractGuardianExtractor() |
Modifier and Type | Method and Description |
---|---|
static Topic |
getContentType(TopicMap tm) |
java.lang.String[] |
getContentTypes()
Returns an array of String containing the content-types this
ContentHandler can process. |
static Topic |
getDateTopic(TopicMap tm,
java.lang.String date) |
static Topic |
getDateType(TopicMap tm) |
java.lang.String |
getDescription()
AdminToolManager displays tool descriptions while the user browses available
tools and builds user-customizable GUI elements such as the Tools menu.
|
static Topic |
getFieldTopic(TopicMap tm,
java.lang.String siExt,
java.lang.String id) |
static Topic |
getFieldTopicType(TopicMap tm) |
static Topic |
getFieldType(TopicMap tm,
java.lang.String siExt) |
static Topic |
getGuardianType(TopicMap tm) |
javax.swing.Icon |
getIcon()
All tools may have an identifying graphic icon used within tool GUI elements.
|
static Topic |
getIDType(TopicMap tm) |
protected static Topic |
getLangTopic(TopicMap tm) |
java.lang.String |
getName()
The tool's name represents the tool in the UI unless the tool has
explicitly been given another GUI name.
|
protected static Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si) |
protected static Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si,
java.lang.String bn) |
static Topic |
getPubTimeType(TopicMap tm) |
static Topic |
getTagTopic(TopicMap tm,
java.lang.String siExt,
java.lang.String id) |
static Topic |
getTagTopicType(TopicMap tm) |
static Topic |
getTagType(TopicMap tm,
java.lang.String siExt) |
static Topic |
getTitleType(TopicMap tm) |
protected static Topic |
getWandoraClassTopic(TopicMap tm) |
protected static void |
makeSubclassOf(TopicMap tm,
Topic t,
Topic superclass) |
boolean |
runInOwnThread()
Whether or not this tool should fork its own thread.
|
boolean |
useURLCrawler() |
_extractTopicsFrom, _extractTopicsFrom, _extractTopicsFrom, acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, getContext, getToolMenuItem, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
private final java.lang.String[] contentTypes
public static final java.lang.String GUARDIAN_BASE_SI
public static final java.lang.String FIELD_BASE_SI
public static final java.lang.String TAG_BASE_SI
public static final java.lang.String CONTENT_SI
public static final java.lang.String DATE_SI
public static final java.lang.String ID_SI
public static final java.lang.String TITLE_SI
public static final java.lang.String PUBLICATION_TIME_SI
public static final java.lang.String SECTION_ID_SI
public static final java.lang.String SECTION_NAME_SI
public static final java.lang.String WEB_URL_SI
public static final java.lang.String API_URL_SI
public static final java.lang.String LANG_SI
private static java.util.HashMap<java.lang.String,java.lang.String> fieldNames
public java.lang.String getName()
AbstractWandoraTool
getName
in interface WandoraTool
getName
in class AbstractExtractor
public java.lang.String getDescription()
AbstractWandoraTool
getDescription
in interface WandoraTool
getDescription
in class AbstractExtractor
public javax.swing.Icon getIcon()
AbstractWandoraTool
getIcon should return the Icon object of the tool.
getIcon
in interface WandoraTool
getIcon
in class AbstractExtractor
public java.lang.String[] getContentTypes()
Handler
Returns an array of String containing the content-types this ContentHandler can process.
getContentTypes
in interface Handler
getContentTypes
in class AbstractExtractor
public boolean useURLCrawler()
useURLCrawler
in class AbstractExtractor
public boolean runInOwnThread()
AbstractWandoraTool
runInOwnThread
in class AbstractExtractor
public static Topic getIDType(TopicMap tm) throws TopicMapException
TopicMapException
public static Topic getTitleType(TopicMap tm) throws TopicMapException
TopicMapException
public static Topic getDateType(TopicMap tm) throws TopicMapException
TopicMapException
public static Topic getDateTopic(TopicMap tm, java.lang.String date) throws TopicMapException
TopicMapException
public static Topic getPubTimeType(TopicMap tm) throws TopicMapException
TopicMapException
public static Topic getContentType(TopicMap tm) throws TopicMapException
TopicMapException
public static Topic getFieldTopic(TopicMap tm, java.lang.String siExt, java.lang.String id)
public static Topic getTagTopic(TopicMap tm, java.lang.String siExt, java.lang.String id)
public static Topic getGuardianType(TopicMap tm) throws TopicMapException
TopicMapException
public static Topic getFieldTopicType(TopicMap tm) throws TopicMapException
TopicMapException
public static Topic getTagTopicType(TopicMap tm) throws TopicMapException
TopicMapException
protected static Topic getWandoraClassTopic(TopicMap tm) throws TopicMapException
TopicMapException
protected static Topic getLangTopic(TopicMap tm) throws TopicMapException
TopicMapException
protected static Topic getOrCreateTopic(TopicMap tm, java.lang.String si) throws TopicMapException
TopicMapException
protected static Topic getOrCreateTopic(TopicMap tm, java.lang.String si, java.lang.String bn) throws TopicMapException
TopicMapException
protected static void makeSubclassOf(TopicMap tm, Topic t, Topic superclass) throws TopicMapException
TopicMapException
Copyright 2004-2015 Wandora Team