public class TermsExtractor extends AbstractElavaArkistoExtractor
Modifier and Type | Field and Description |
---|---|
static java.lang.String | ELAVA_ARKISTO_ALSOKNOWNAS_TYPE_SI |
static java.lang.String | ELAVA_ARKISTO_FIRSTNAME_TYPE_SI |
static java.lang.String | ELAVA_ARKISTO_KEYWORD_TYPE_SI |
static java.lang.String | ELAVA_ARKISTO_LASTNAME_TYPE_SI |
static java.lang.String | ELAVA_ARKISTO_TERM_ALSOKNOWNAS_SI |
static java.lang.String | ELAVA_ARKISTO_TERM_EXACT_MATCH_DISAMBIGUATION_SI |
static java.lang.String | ELAVA_ARKISTO_TERM_EXACT_MATCH_SI |
static java.lang.String | ELAVA_ARKISTO_TERM_FIRSTNAME_SI |
static java.lang.String | ELAVA_ARKISTO_TERM_KEYWORD_SI |
static java.lang.String | ELAVA_ARKISTO_TERM_LASTNAME_SI |
static java.lang.String | ELAVA_ARKISTO_TERM_SI |
static java.lang.String | ELAVA_ARKISTO_TERM_TYPE_SI |
static boolean | EXTRACT_ALSO_KNOWN_AS |
static boolean | EXTRACT_DISAMBIGUATION_HINT |
static boolean | EXTRACT_EXACT_MATCH |
static boolean | EXTRACT_FIRST_AND_LASTNAME |
static boolean | EXTRACT_KEYWORD |
static boolean | EXTRACT_TITLE |
static boolean | EXTRACT_TYPE |
ELAVA_ARKISTO_ARTICLE_ID_TYPE_SI, ELAVA_ARKISTO_ARTICLE_PUBLISHED_TYPE_SI, ELAVA_ARKISTO_ARTICLE_TYPE_SI, ELAVA_ARKISTO_DATE_TYPE_SI, ELAVA_ARKISTO_MEDIA_TYPE_SI, ELAVA_ARKISTO_SERVICE_TYPE_SI, ELAVA_ARKISTO_SI, ELAVA_ARKISTO_TAG_ARTICLE_RELATION_TYPE_SI, ELAVA_ARKISTO_TAG_TYPE_SI, ELAVA_ARKISTO_TIME_TYPE_SI
CUSTOM_EXTRACTOR, DONE_FAILED, DONE_MANY, DONE_ONE, EXACTLY_GIVEN_URLS, FILE_EXTRACTOR, FILE_PATTERN, GIVEN_URLS_AND_ALL_CRAWLED_DOCUMENTS, GIVEN_URLS_AND_CRAWLED_DOCUMENTS_IN_URL_DOMAIN, GIVEN_URLS_AND_LINKED_DOCUMENTS, GIVEN_URLS_AND_URL_BELOW, INFO_WAIT_WHILE_WORKING, LOG_TITLE, POINT_START_URL_TEXT, RAW_EXTRACTOR, SELECT_DIALOG_TITLE, STRING_EXTRACTOR_NOT_SUPPORTED_MESSAGE, URL_EXTRACTOR
CLOSE, EXECUTE, INVISIBLE, VISIBLE, WAIT
RETURN_ERROR, RETURN_INFO
Constructor and Description |
---|
TermsExtractor() |
_extractTopicsFrom, _extractTopicsFrom, getElavaArkistoArticleIdType, getElavaArkistoArticleTopic, getElavaArkistoArticleType, getElavaArkistoDateTopic, getElavaArkistoDateType, getElavaArkistoMediaTopic, getElavaArkistoMediaType, getElavaArkistoServiceTopic, getElavaArkistoServiceType, getElavaArkistoTagArticleRelationTopic, getElavaArkistoTagArticleRelationType, getElavaArkistoTagTopic, getElavaArkistoTagType, getElavaArkistoTimeTopic, getElavaArkistoTimeType, getElavaArkistoType, getIcon, getWandoraType, isValidData, stringify
acceptBrowserExtractRequest, addCrawlerUrl, browserExtractorConsumesPlainText, buildSI, buildSL, clearMasterSubject, createAssociation, createAssociation, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, createTopic, croppedFilename, croppedFilename, croppedUrlString, croppedUrlString, doBrowserExtract, dropExtract, dropExtract, dropExtract, execute, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFrom, extractTopicsFromText, getBrowserExtractorName, getContentTypes, getCrawlerMode, getExtractorType, getForceContent, getForceFiles, getForceUrls, getGUIText, getGUIText, getInterruptsHandled, getMasterSubject, getType, getWandora, handle, handleContent, handleCustomType, handleFiles, handleForcedContent, handleInterrupt, handleStringContent, handleUrls, initializeCustomType, instantDropHandle, makeSubclassOfWandoraClass, runInOwnThread, setData, setDisplayName, setForceContent, setForceFiles, setForceUrls, setMasterSubject, setMasterSubject, setTopicMap, setupCrawler, setWandora, takeNap, urlEncode, useTempTopicMap, useURLCrawler
addUndoMarker, addUndoMarker, allowMultipleInvocations, clearAllThreads, clearThreads, clearThreads, clearToolLock, clearToolLock, clearToolLocks, configure, execute, execute, forceStop, forceStop, getContext, getCurrentLogger, getDefaultLogger, getHistory, getLastLogger, getState, getThreads, getThreads, getToolMenuItem, getToolMenuItem, getTopicName, hlog, initialize, interruptAllThreads, interruptThreads, interruptThreads, isConfigurable, isRunning, isRunning, lockLog, log, log, log, log, requiresRefresh, run, setContext, setDefaultLogger, setLogTitle, setProgress, setProgressMax, setState, setToolLogger, singleLog, singleLog, singleLog, solveContextTopicMap, solveNameForTopicMap, writeOptions
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
configure, execute, execute, getContext, getToolMenuItem, hlog, initialize, isConfigurable, isRunning, log, log, log, log, requiresRefresh, setContext, setToolLogger, writeOptions
forceStop, getHistory, getState, lockLog, setLogTitle, setProgress, setProgressMax, setState
public static boolean EXTRACT_TITLE
public static boolean EXTRACT_TYPE
public static boolean EXTRACT_KEYWORD
public static boolean EXTRACT_FIRST_AND_LASTNAME
public static boolean EXTRACT_EXACT_MATCH
public static boolean EXTRACT_ALSO_KNOWN_AS
public static boolean EXTRACT_DISAMBIGUATION_HINT
public static final java.lang.String ELAVA_ARKISTO_TERM_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_TYPE_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_KEYWORD_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_LASTNAME_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_FIRSTNAME_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_ALSOKNOWNAS_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_EXACT_MATCH_SI
public static final java.lang.String ELAVA_ARKISTO_TERM_EXACT_MATCH_DISAMBIGUATION_SI
public static final java.lang.String ELAVA_ARKISTO_LASTNAME_TYPE_SI
public static final java.lang.String ELAVA_ARKISTO_FIRSTNAME_TYPE_SI
public static final java.lang.String ELAVA_ARKISTO_ALSOKNOWNAS_TYPE_SI
public static final java.lang.String ELAVA_ARKISTO_KEYWORD_TYPE_SI
public java.lang.String getName()
Description copied from class: AbstractWandoraTool
Specified by: getName in interface WandoraTool
Overrides: getName in class AbstractElavaArkistoExtractor
public java.lang.String getDescription()
Description copied from class: AbstractWandoraTool
Specified by: getDescription in interface WandoraTool
Overrides: getDescription in class AbstractElavaArkistoExtractor
public boolean _extractTopicsFrom(java.lang.String str, TopicMap tm) throws java.lang.Exception
_extractTopicsFrom in class AbstractExtractor
Throws: java.lang.Exception
public boolean _extractTopicsFrom(org.json.JSONArray json, TopicMap tm) throws java.lang.Exception
Throws: java.lang.Exception
public boolean _extractTopicsFrom(org.json.JSONObject json, TopicMap tm) throws java.lang.Exception
Throws: java.lang.Exception
public Topic getElavaArkistoKeywordType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoAlsoKnownAsType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoLastnameType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoFirstnameType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoExactMatchDisambiguationType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoExactMatchType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoExactMatchTopic(java.lang.String id, TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoTermType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoTermTopic(java.lang.String id, TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoTermTypeType(TopicMap tm) throws TopicMapException
Throws: TopicMapException
public Topic getElavaArkistoTermTypeTopic(java.lang.String type, TopicMap tm) throws TopicMapException
Throws: TopicMapException
Copyright 2004-2015 Wandora Team