public abstract class AbstractRDFExtractor extends AbstractExtractor
Modifier and Type | Field and Description |
---|---|
java.lang.String |
baseUrl |
private java.lang.String[] |
contentTypes |
private java.lang.String |
defaultEncoding |
static java.lang.String |
defaultLanguage |
static java.lang.String |
defaultOccurrenceScopeSI |
static java.lang.String |
RDF_LIST_ORDER |
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
Constructor and Description |
---|
AbstractRDFExtractor() |
Modifier and Type | Method and Description |
---|---|
boolean |
_extractTopicsFrom(java.io.File file,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.io.InputStream in,
TopicMap topicMap) |
boolean |
_extractTopicsFrom(java.lang.String in,
TopicMap tm) |
boolean |
_extractTopicsFrom(java.net.URL url,
TopicMap topicMap) |
void |
execute(Wandora wandora,
Context context)
Runs the tool.
|
java.lang.String |
getBaseUrl() |
java.lang.String[] |
getContentTypes()
Returns an array of String containing the content-types this
ContentHandler can process. |
java.lang.String |
getDescription()
AdminToolManager displays tool descriptions while the user browses available
tools and builds user-customizable GUI elements such as the Tools menu.
|
javax.swing.Icon |
getIcon()
All tools may have an identifying graphic icon used within tool GUI elements.
|
abstract RDF2TopicMapsMapping[] |
getMappings() |
java.lang.String |
getName()
The tool's name represents the tool in the UI unless the tool has explicitly
been given another GUI name.
|
Topic |
getOrCreateTopic(TopicMap map,
java.lang.String si) |
Topic |
getOrCreateTopic(TopicMap map,
java.lang.String si,
java.lang.String basename) |
java.lang.String |
getRDFContainerFormat()
Override this if the RDF is in some other container format than XML/RDF.
|
void |
handleStatement(com.hp.hpl.jena.rdf.model.Statement stmt,
TopicMap map) |
void |
importRDF(java.io.InputStream in,
TopicMap map) |
void |
RDF2TopicMap(com.hp.hpl.jena.rdf.model.Model model,
TopicMap map) |
void |
setBaseUrl(java.lang.String url) |
java.lang.String |
solveBasenameFor(java.lang.String si) |
Topic |
solveObjectRoleFor(com.hp.hpl.jena.rdf.model.Property predicate,
com.hp.hpl.jena.rdf.model.RDFNode object,
TopicMap map) |
Topic |
solveSubjectRoleFor(com.hp.hpl.jena.rdf.model.Property predicate,
com.hp.hpl.jena.rdf.model.Resource subject,
TopicMap map) |
boolean |
useURLCrawler() |
acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, getContext, getToolMenuItem, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
private java.lang.String defaultEncoding
public static java.lang.String defaultLanguage
public static final java.lang.String defaultOccurrenceScopeSI
private final java.lang.String[] contentTypes
public java.lang.String baseUrl
public static final java.lang.String RDF_LIST_ORDER
public java.lang.String getName()
AbstractWandoraTool
getName
in interface WandoraTool
getName
in class AbstractExtractor
public java.lang.String getDescription()
AbstractWandoraTool
getDescription
in interface WandoraTool
getDescription
in class AbstractExtractor
public javax.swing.Icon getIcon()
AbstractWandoraTool
getIcon
should return Icon
object of
the tool.
getIcon
in interface WandoraTool
getIcon
in class AbstractExtractor
public java.lang.String[] getContentTypes()
Handler
Returns an array of String containing the content-types this
ContentHandler can process.
getContentTypes
in interface Handler
getContentTypes
in class AbstractExtractor
public boolean useURLCrawler()
useURLCrawler
in class AbstractExtractor
public void execute(Wandora wandora, Context context)
WandoraTool
execute
in interface WandoraTool
execute
in class AbstractExtractor
public java.lang.String getBaseUrl()
public void setBaseUrl(java.lang.String url)
public boolean _extractTopicsFrom(java.net.URL url, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.File file, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.InputStream in, TopicMap topicMap) throws java.lang.Exception
java.lang.Exception
public boolean _extractTopicsFrom(java.lang.String in, TopicMap tm) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public java.lang.String getRDFContainerFormat()
public void importRDF(java.io.InputStream in, TopicMap map)
public void RDF2TopicMap(com.hp.hpl.jena.rdf.model.Model model, TopicMap map)
public void handleStatement(com.hp.hpl.jena.rdf.model.Statement stmt, TopicMap map) throws TopicMapException
TopicMapException
public abstract RDF2TopicMapsMapping[] getMappings()
public Topic solveSubjectRoleFor(com.hp.hpl.jena.rdf.model.Property predicate, com.hp.hpl.jena.rdf.model.Resource subject, TopicMap map)
public Topic solveObjectRoleFor(com.hp.hpl.jena.rdf.model.Property predicate, com.hp.hpl.jena.rdf.model.RDFNode object, TopicMap map)
public java.lang.String solveBasenameFor(java.lang.String si)
Copyright 2004-2015 Wandora Team