public class JavabibExtractor extends AbstractExtractor implements WandoraTool
Modifier and Type | Field and Description |
---|---|
static java.util.HashSet<java.lang.String> |
associationFields |
private java.lang.String |
baseLocator |
private static java.util.Map<java.lang.String,java.lang.String> |
charMap |
private static java.util.Map<java.lang.String,java.lang.String> |
charMap2 |
private static java.util.regex.Pattern |
charMapPattern |
private java.lang.String[] |
contentTypes |
private java.lang.String |
defaultEncoding |
private boolean |
encounteredExceptions |
static java.util.HashSet<java.lang.String> |
occurrenceFields |
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
Constructor and Description |
---|
JavabibExtractor()
Creates a new instance of JavabibExtractor
|
Modifier and Type | Method and Description |
---|---|
boolean |
_extractTopicsFrom(java.io.File file,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.io.Reader reader,
TopicMap tm) |
boolean |
_extractTopicsFrom(java.lang.String str,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.net.URL file,
TopicMap topicMap) |
private void |
addAssociation(TopicMap tm,
Topic entryTopic,
bibtex.dom.BibtexEntry entry,
java.lang.String key) |
private void |
addOccurrence(TopicMap tm,
Topic entryTopic,
bibtex.dom.BibtexEntry entry,
java.lang.String key) |
boolean |
browserExtractorConsumesPlainText() |
Locator |
buildSI(java.lang.String siend) |
private Topic |
createPersonTopic(TopicMap tm,
bibtex.dom.BibtexPerson p) |
void |
execute(Wandora admin,
Context context)
Runs the tool.
|
private java.lang.String |
expandCharacters(java.lang.String s) |
java.lang.String[] |
getContentTypes()
Returns an array of String containing the content-types this
ContentHandler can process. |
java.lang.String |
getDescription()
AdminToolManager views tool descriptions while the user browses available
tools and builds user-customizable GUI elements such as the Tools menu.
|
java.lang.String |
getGUIText(int textType) |
java.lang.String |
getName()
The tool's name represents the tool in the UI unless the tool has been
explicitly given another GUI name.
|
private Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String topic) |
private Topic |
getOrCreateTopic(TopicMap tm,
java.lang.String topic,
boolean addToBibtexClass) |
private boolean |
handleExceptions(java.lang.Exception[] exceptions) |
boolean |
useTempTopicMap() |
private java.lang.String |
valueToString(bibtex.dom.BibtexNode v) |
acceptBrowserExtractRequest, addCrawlerUrl, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getIcon, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useURLCrawler
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, getContext, getIcon, getToolMenuItem, getType, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
private java.lang.String baseLocator
private java.lang.String defaultEncoding
private boolean encounteredExceptions
private static final java.util.regex.Pattern charMapPattern
private static final java.util.Map<java.lang.String,java.lang.String> charMap
private static final java.util.Map<java.lang.String,java.lang.String> charMap2
public static final java.util.HashSet<java.lang.String> associationFields
public static final java.util.HashSet<java.lang.String> occurrenceFields
private final java.lang.String[] contentTypes
public JavabibExtractor()
public java.lang.String getName()
AbstractWandoraTool
getName
in interface WandoraTool
getName
in class AbstractExtractor
public java.lang.String getDescription()
AbstractWandoraTool
getDescription
in interface WandoraTool
getDescription
in class AbstractExtractor
public java.lang.String getGUIText(int textType)
getGUIText
in class AbstractExtractor
public boolean browserExtractorConsumesPlainText()
browserExtractorConsumesPlainText
in class AbstractExtractor
private Topic getOrCreateTopic(TopicMap tm, java.lang.String topic) throws TopicMapException
TopicMapException
private Topic getOrCreateTopic(TopicMap tm, java.lang.String topic, boolean addToBibtexClass) throws TopicMapException
TopicMapException
private java.lang.String expandCharacters(java.lang.String s)
private java.lang.String valueToString(bibtex.dom.BibtexNode v)
private void addOccurrence(TopicMap tm, Topic entryTopic, bibtex.dom.BibtexEntry entry, java.lang.String key) throws TopicMapException
TopicMapException
private void addAssociation(TopicMap tm, Topic entryTopic, bibtex.dom.BibtexEntry entry, java.lang.String key) throws TopicMapException
TopicMapException
private Topic createPersonTopic(TopicMap tm, bibtex.dom.BibtexPerson p) throws TopicMapException
TopicMapException
public boolean useTempTopicMap()
useTempTopicMap
in class AbstractExtractor
public void execute(Wandora admin, Context context)
WandoraTool
execute
in interface WandoraTool
execute
in class AbstractExtractor
private boolean handleExceptions(java.lang.Exception[] exceptions)
public boolean _extractTopicsFrom(java.io.Reader reader, TopicMap tm) throws java.lang.Exception
java.lang.Exception
public boolean _extractTopicsFrom(java.net.URL file, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.File file, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.lang.String str, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public Locator buildSI(java.lang.String siend)
buildSI
in class AbstractExtractor
public java.lang.String[] getContentTypes()
Handler
Returns an array of String containing the content-types this ContentHandler can process.
getContentTypes
in interface Handler
getContentTypes
in class AbstractExtractor
Copyright 2004-2015 Wandora Team