public abstract class AbstractBingExtractor extends AbstractExtractor
Modifier and Type | Field and Description |
---|---|
private static java.util.HashMap<java.lang.String,java.lang.String> |
auth |
static java.lang.String |
BING_CONTENTTYPE_SI |
static java.lang.String |
BING_DATETIME_SI |
static java.lang.String |
BING_DESCRIPTION_SI |
static java.lang.String |
BING_FILESIZE_SI |
static java.lang.String |
BING_HEIGHT_SI |
static java.lang.String |
BING_IMAGERESULT_SI |
static java.lang.String |
BING_ROOT |
static java.lang.String |
BING_TITLE_SI |
static java.lang.String |
BING_URL |
static java.lang.String |
BING_WEBRESULT_SI |
static java.lang.String |
BING_WIDTH_SI |
private java.lang.String[] |
contentTypes |
protected java.lang.String |
defaultEncoding |
private static java.lang.String |
dialogName |
protected boolean |
EXTRACT_RELEVANCE |
static java.lang.String |
LANG |
static java.lang.String |
QUERY_SI |
static java.lang.String |
SOURCE_SI |
static java.lang.String |
TOPIC_SI |
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
Constructor and Description |
---|
AbstractBingExtractor() |
Modifier and Type | Method and Description |
---|---|
abstract boolean |
_extractTopicsFrom(java.io.InputStream in,
TopicMap topicMap) |
void |
configure(Wandora wandora,
Options options,
java.lang.String prefix)
If the tool is configurable, shows a user interface to configure the tool.
|
void |
fillQueryTopic(Topic queryTopic,
TopicMap topicMap,
java.lang.String query) |
static void |
forgetAuth() |
Topic |
getBingClass(TopicMap tm) |
java.lang.String[] |
getContentTypes()
Returns an array of String containing the content-types this
ContentHandler can process. |
Topic |
getContentTypeType(TopicMap tm) |
Topic |
getDateTimeTopic(java.lang.String datetime,
TopicMap tm) |
Topic |
getDateTimeType(TopicMap tm) |
Topic |
getDescriptionTopic(java.lang.String description,
TopicMap tm) |
Topic |
getDescriptionType(TopicMap tm) |
protected java.lang.String |
getFileContents(java.io.File file) |
Topic |
getFileSizeType(TopicMap tm) |
Topic |
getHeightType(TopicMap tm) |
javax.swing.Icon |
getIcon()
All tools may have an identifying graphic icon used within tool GUI elements.
|
Topic |
getImageSearchResultTopic(TopicMap tm,
java.lang.String title,
java.lang.String url,
java.lang.String width,
java.lang.String height,
java.lang.String contentType,
java.lang.String fileSize) |
Topic |
getImageSearchResultType(TopicMap tm) |
protected Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si) |
protected Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si,
java.lang.String bn) |
Topic |
getQueryType(TopicMap tm) |
Topic |
getSourceType(TopicMap tm) |
protected java.lang.String |
getStringFromDocument(org.w3c.dom.Document doc) |
Topic |
getTitleTopic(java.lang.String title,
TopicMap tm) |
Topic |
getTitleType(TopicMap tm) |
Topic |
getTopicType(TopicMap tm) |
WandoraToolType |
getType()
Tool type is used to categorize tools.
|
Topic |
getWandoraClass(TopicMap tm) |
Topic |
getWebSearchResultTopic(TopicMap tm,
java.lang.String title,
java.lang.String description,
java.lang.String url,
java.lang.String datetime) |
Topic |
getWebSearchResultType(TopicMap tm) |
Topic |
getWidthType(TopicMap tm) |
boolean |
isConfigurable()
Whether this tool is configurable.
|
protected void |
makeSubclassOf(TopicMap tm,
Topic t,
Topic superclass) |
java.util.HashMap<java.lang.String,java.lang.String> |
solveAuth(Wandora wandora) |
boolean |
useURLCrawler() |
void |
writeOptions(Wandora wandora,
Options options,
java.lang.String prefix)
If the tool is configurable, saves all current tool options.
|
_extractTopicsFrom, _extractTopicsFrom, _extractTopicsFrom, acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getDescription, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getName, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
execute, execute, getContext, getToolMenuItem, hlog, initialize, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
protected boolean EXTRACT_RELEVANCE
protected java.lang.String defaultEncoding
public static java.lang.String LANG
public static final java.lang.String BING_ROOT
public static final java.lang.String BING_URL
public static final java.lang.String SOURCE_SI
public static final java.lang.String QUERY_SI
public static final java.lang.String TOPIC_SI
public static final java.lang.String BING_TITLE_SI
public static final java.lang.String BING_DESCRIPTION_SI
public static final java.lang.String BING_DATETIME_SI
public static final java.lang.String BING_WIDTH_SI
public static final java.lang.String BING_HEIGHT_SI
public static final java.lang.String BING_CONTENTTYPE_SI
public static final java.lang.String BING_FILESIZE_SI
public static final java.lang.String BING_WEBRESULT_SI
public static final java.lang.String BING_IMAGERESULT_SI
private final java.lang.String[] contentTypes
private static java.util.HashMap<java.lang.String,java.lang.String> auth
private static final java.lang.String dialogName
public javax.swing.Icon getIcon()
AbstractWandoraTool
getIcon should return Icon object of the tool.
getIcon
in interface WandoraTool
getIcon
in class AbstractExtractor
public WandoraToolType getType()
AbstractWandoraTool
Tool type is used to categorize tools. Tool type has no real effect today; it is merely an informative property of a tool.
getType
in interface WandoraTool
getType
in class AbstractExtractor
public java.lang.String[] getContentTypes()
Handler
Returns an array of String containing the content-types this ContentHandler can process.
getContentTypes
in interface Handler
getContentTypes
in class AbstractExtractor
public boolean useURLCrawler()
useURLCrawler
in class AbstractExtractor
public boolean isConfigurable()
AbstractWandoraTool
isConfigurable
in interface WandoraTool
isConfigurable
in class AbstractWandoraTool
public void configure(Wandora wandora, Options options, java.lang.String prefix) throws TopicMapException
AbstractWandoraTool
configure
in interface WandoraTool
configure
in class AbstractWandoraTool
TopicMapException
public void writeOptions(Wandora wandora, Options options, java.lang.String prefix)
AbstractWandoraTool
writeOptions
in interface WandoraTool
writeOptions
in class AbstractWandoraTool
public abstract boolean _extractTopicsFrom(java.io.InputStream in, TopicMap topicMap) throws java.lang.Exception
java.lang.Exception
public void fillQueryTopic(Topic queryTopic, TopicMap topicMap, java.lang.String query)
public Topic getWebSearchResultTopic(TopicMap tm, java.lang.String title, java.lang.String description, java.lang.String url, java.lang.String datetime) throws TopicMapException
TopicMapException
public Topic getImageSearchResultTopic(TopicMap tm, java.lang.String title, java.lang.String url, java.lang.String width, java.lang.String height, java.lang.String contentType, java.lang.String fileSize) throws TopicMapException
TopicMapException
public Topic getTitleTopic(java.lang.String title, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDescriptionTopic(java.lang.String description, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDateTimeTopic(java.lang.String datetime, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getTitleType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDescriptionType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDateTimeType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getWidthType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getHeightType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getContentTypeType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getFileSizeType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getBingClass(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getWandoraClass(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getTopicType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getSourceType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getQueryType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getWebSearchResultType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getImageSearchResultType(TopicMap tm) throws TopicMapException
TopicMapException
protected Topic getOrCreateTopic(TopicMap tm, java.lang.String si) throws TopicMapException
TopicMapException
protected Topic getOrCreateTopic(TopicMap tm, java.lang.String si, java.lang.String bn) throws TopicMapException
TopicMapException
protected void makeSubclassOf(TopicMap tm, Topic t, Topic superclass) throws TopicMapException
TopicMapException
public java.util.HashMap<java.lang.String,java.lang.String> solveAuth(Wandora wandora)
public static void forgetAuth()
protected java.lang.String getStringFromDocument(org.w3c.dom.Document doc)
protected java.lang.String getFileContents(java.io.File file) throws java.io.IOException, java.io.FileNotFoundException
java.io.IOException
java.io.FileNotFoundException
Copyright 2004-2015 Wandora Team