public class BookmarkExtractor extends AbstractExtractor
Modifier and Type | Field and Description |
---|---|
private java.lang.String |
ADD_SI |
static java.lang.String[] |
contentTypes |
private java.text.SimpleDateFormat |
df |
private java.lang.String |
HREF_SI |
private java.lang.String |
ICON_SI |
private java.lang.String[][] |
itemProps |
private java.lang.String[][] |
itemTimeProps |
private java.lang.String |
LANG |
private Topic |
langTopic |
private java.lang.String |
MOD_SI |
private java.lang.String |
ROOT_SI |
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
Constructor and Description |
---|
BookmarkExtractor() |
Modifier and Type | Method and Description |
---|---|
boolean |
_extractTopicsFrom(java.io.File f,
TopicMap t) |
boolean |
_extractTopicsFrom(java.lang.String str,
TopicMap t) |
boolean |
_extractTopicsFrom(java.net.URL u,
TopicMap t) |
java.lang.String[] |
getContentTypes()
Returns an array of String containing the content-types this
ContentHandler can process. |
java.lang.String |
getDescription()
AdminToolManager views tool descriptions while the user browses available
tools, and builds user-customizable GUI elements such as the Tools menu.
|
int |
getExtractorType() |
javax.swing.Icon |
getIcon()
All tools may have an identifying graphic icon used within tool GUI elements.
|
java.lang.String |
getName()
The tool's name represents the tool in the UI unless the tool has
explicitly been given another GUI name.
|
private Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si) |
private Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String si,
java.lang.String bn) |
private Topic |
getWandoraClass(TopicMap tm) |
private void |
makeSubclassOf(TopicMap tm,
Topic t,
Topic superclass) |
private void |
parse(org.jsoup.nodes.Document d,
TopicMap t) |
private void |
parseCategory(org.jsoup.nodes.Element c,
TopicMap t) |
private void |
parseCategory(org.jsoup.nodes.Element c,
Topic parent,
TopicMap t) |
private void |
parseItem(org.jsoup.nodes.Element i,
Topic parent,
TopicMap t) |
acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap, useURLCrawler
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, getContext, getToolMenuItem, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
private java.lang.String ROOT_SI
private java.lang.String HREF_SI
private java.lang.String ADD_SI
private java.lang.String MOD_SI
private java.lang.String ICON_SI
private java.lang.String LANG
private Topic langTopic
private java.text.SimpleDateFormat df
private java.lang.String[][] itemProps
private java.lang.String[][] itemTimeProps
public static final java.lang.String[] contentTypes
public java.lang.String getName()
AbstractWandoraTool
getName
in interface WandoraTool
getName
in class AbstractExtractor
public java.lang.String getDescription()
AbstractWandoraTool
getDescription
in interface WandoraTool
getDescription
in class AbstractExtractor
public int getExtractorType()
getExtractorType
in class AbstractExtractor
public java.lang.String[] getContentTypes()
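Description copied from interface: Handler
Returns an array of String containing the content-types this ContentHandler can process.
Specified by: getContentTypes in interface Handler
Overrides: getContentTypes in class AbstractExtractor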
public javax.swing.Icon getIcon()
Description copied from class: AbstractWandoraTool
getIcon should return the Icon object of the tool.
Specified by: getIcon in interface WandoraTool
Overrides: getIcon in class AbstractExtractor
public boolean _extractTopicsFrom(java.io.File f, TopicMap t) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.net.URL u, TopicMap t) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.lang.String str, TopicMap t) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
private void parse(org.jsoup.nodes.Document d, TopicMap t) throws java.io.FileNotFoundException, java.io.IOException, TopicMapException, java.text.ParseException
java.io.FileNotFoundException
java.io.IOException
TopicMapException
java.text.ParseException
private void parseCategory(org.jsoup.nodes.Element c, TopicMap t) throws TopicMapException, java.text.ParseException
TopicMapException
java.text.ParseException
private void parseCategory(org.jsoup.nodes.Element c, Topic parent, TopicMap t) throws TopicMapException, java.text.ParseException
TopicMapException
java.text.ParseException
private void parseItem(org.jsoup.nodes.Element i, Topic parent, TopicMap t) throws TopicMapException, java.text.ParseException
TopicMapException
java.text.ParseException
private Topic getWandoraClass(TopicMap tm) throws TopicMapException
TopicMapException
private Topic getOrCreateTopic(TopicMap tm, java.lang.String si) throws TopicMapException
TopicMapException
private Topic getOrCreateTopic(TopicMap tm, java.lang.String si, java.lang.String bn) throws TopicMapException
TopicMapException
private void makeSubclassOf(TopicMap tm, Topic t, Topic superclass) throws TopicMapException
TopicMapException
Copyright 2004-2015 Wandora Team