public abstract class OmaKaupunkiAbstractExtractor extends AbstractExtractor
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
| Constructor and Description |
|---|
| OmaKaupunkiAbstractExtractor() |
acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getCrawlerMode, getDescription, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, getContext, getToolMenuItem, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
public static boolean USE_EXISTING_TOPICS
public static final java.lang.String OMA_KAUPUNKI_SI
public static final java.lang.String OMA_KAUPUNKI_EVENT_SI
public static final java.lang.String OMA_KAUPUNKI_EVENT_START_TIME_SI
public static final java.lang.String OMA_KAUPUNKI_EVENT_END_TIME_SI
public static final java.lang.String OMA_KAUPUNKI_EVENT_CREATED_SI
public static final java.lang.String OMA_KAUPUNKI_EVENT_TITLE_SI
public static final java.lang.String OMA_KAUPUNKI_EVENT_BODY_SI
public static final java.lang.String OMA_KAUPUNKI_EVENT_CATEGORY_PARENT_SI
public static final java.lang.String OMA_KAUPUNKI_EVENT_CATEGORY_PLURAL_SI
public static final java.lang.String OMA_KAUPUNKI_EVENT_CATEGORY_IDENTIFIER_SI
public static final java.lang.String OMA_KAUPUNKI_EVENT_CATEGORY_SI
public static final java.lang.String OMA_KAUPUNKI_EVENT_VENUE_SI
public static final java.lang.String OMA_KAUPUNKI_EVENT_IDENTIFIER_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_IDENTIFIER_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_CREATED_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_DESCRIPTION_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_CATEGORY_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_CATEGORY_PARENT_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_CATEGORY_PLURAL_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_CATEGORY_IDENTIFIER_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_PHONE_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_TITLE_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_TAG_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_ADDRESS_SI
public static final java.lang.String OMA_KAUPUNKI_SERVICE_HOMEPAGE_SI
public static final java.lang.String GEO_COORDINATE_TYPE_SI
public static final java.lang.String OMA_KAUPUNKI_DATE_SI
public static final java.lang.String LANG
private final java.lang.String[] contentTypes
private java.net.URL extractURL
private boolean shouldHandlePagination
private java.lang.String defaultPagingOption
public javax.swing.Icon getIcon()
Description copied from class: AbstractWandoraTool
getIcon should return the Icon object of the tool.
Specified by: getIcon in interface WandoraTool
Overrides: getIcon in class AbstractExtractor
public java.lang.String getName()
Description copied from class: AbstractWandoraTool
Specified by: getName in interface WandoraTool
Overrides: getName in class AbstractExtractor
public java.lang.String[] getContentTypes()
Description copied from interface: Handler
Returns the content types that this ContentHandler can process.
Specified by: getContentTypes in interface Handler
Overrides: getContentTypes in class AbstractExtractor
public boolean useURLCrawler()
useURLCrawler
in class AbstractExtractor
public boolean _extractTopicsFrom(java.net.URL url, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.File file, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.lang.String str, TopicMap topicMap) throws java.lang.Exception
_extractTopicsFrom
in class AbstractExtractor
java.lang.Exception
public boolean _extractTopicsFrom(java.io.InputStream inputStream, TopicMap topicMap) throws java.lang.Exception
java.lang.Exception
public abstract boolean parseOmaKaupunki(org.json.JSONObject json, TopicMap topicMap)
protected void handleError(org.json.JSONObject error)
protected void handlePagination(org.json.JSONObject pagination, TopicMap tm)
private void nap()
public java.lang.String robustGetString(org.json.JSONObject json, java.lang.String key)
public long robustGetLong(org.json.JSONObject json, java.lang.String key)
public double robustGetDouble(org.json.JSONObject json, java.lang.String key)
protected static Topic getOrCreateTopic(TopicMap tm, java.lang.String si) throws TopicMapException
TopicMapException
protected static Topic getOrCreateTopic(TopicMap tm, java.lang.String si, java.lang.String bn) throws TopicMapException
TopicMapException
protected static Topic getOrCreateTopic(TopicMap tm, java.lang.String si, java.lang.String bn, Topic type) throws TopicMapException
TopicMapException
protected static void makeSubclassOf(TopicMap tm, Topic t, Topic superclass) throws TopicMapException
TopicMapException
protected Topic getATopic(java.lang.String str, java.lang.String si, Topic type, TopicMap tm) throws TopicMapException
TopicMapException
protected Topic getUTopic(java.lang.String si, Topic type, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getGeoCoordinateType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventIdentifierType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventVenueType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventVenueTopic(long venueID, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDateType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDateTopic(java.lang.String date, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventStartTimeType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventEndTimeType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventCreatedType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventTitleType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventBodyType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventCategoryPluralType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventCategoryIdentifierType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventCategoryType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventCategoryParentType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventCategoryTopic(long categoryID, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getEventType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceCategoryPluralType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceCategoryIdentifierType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceCreatedType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServicePhoneType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceTitleType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceDescriptionType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceCategoryType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceCategoryParentType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceCategoryTopic(long categoryID, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceTagTopic(java.lang.String tag, TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceTagType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceHomepageType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceAddressType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceIdentifierType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getServiceType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getOmaKaupunkiType(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getWandoraClass(TopicMap tm) throws TopicMapException
TopicMapException
public Topic getDefaultLangTopic(TopicMap tm) throws TopicMapException
TopicMapException
Copyright 2004-2015 Wandora Team