public class WikipediaRevisionPairReader extends WikipediaRevisionReaderBase
Modifier and Type | Field and Description |
---|---|
static String |
PARAM_MAX_CHANGE
Restrict revision pairs to cases where the lengths of the revisions do not differ by more than
this value (counted in characters).
|
static String |
PARAM_MIN_CHANGE
Restrict revision pairs to cases where the lengths of the revisions differ by more than this
value (counted in characters).
|
static String |
PARAM_SKIP_FIRST_N_PAIRS
The number of revision pairs that should be skipped at the beginning.
|
static String |
REVISION_1 |
static String |
REVISION_2 |
protected int |
skipFirstNPairs |
currentArticle, currentArticleIndex, currentRevisionIndex, nrOfArticles, outputPlainText, pageBuffer, pageIter, PARAM_OUTPUT_PLAIN_TEXT, PARAM_PAGE_BUFFER, PARAM_PATH_TO_REVISION_ID_LIST, PARAM_REVISION_ID_LIST, parser, revIdIterator, revisionApi, revisionIdFile, revisionIdParamArray, revisionIds, timestampIter
dbconfig, PARAM_CREATE_DATABASE_CONFIG_ANNOTATION, PARAM_DB, PARAM_HOST, PARAM_LANGUAGE, PARAM_PASSWORD, PARAM_USER, wiki
Constructor and Description |
---|
WikipediaRevisionPairReader() |
Modifier and Type | Method and Description |
---|---|
void |
getNext(org.apache.uima.jcas.JCas jcas) |
void |
initialize(org.apache.uima.UimaContext context) |
addDocumentMetaData, addRevisionAnnotation, getProgress, getTimestampIter, hasNext
close, getLogger, getNext, initialize
destroy, getCasInitializer, getProcessingResourceMetaData, initialize, isConsuming, reconfigure, setCasInitializer, typeSystemInit
getConfigParameterValue, getConfigParameterValue, setConfigParameterValue, setConfigParameterValue
getCasManager, getMetaData, getRelativePathResolver, getResourceManager, getUimaContext, getUimaContextAdmin, setLogger, setMetaData
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
public static final String REVISION_1
public static final String REVISION_2
public static final String PARAM_MIN_CHANGE
public static final String PARAM_MAX_CHANGE
public static final String PARAM_SKIP_FIRST_N_PAIRS
protected int skipFirstNPairs
public void initialize(org.apache.uima.UimaContext context) throws org.apache.uima.resource.ResourceInitializationException
initialize
in class WikipediaRevisionReaderBase
org.apache.uima.resource.ResourceInitializationException
public void getNext(org.apache.uima.jcas.JCas jcas) throws IOException, org.apache.uima.collection.CollectionException
getNext
in class WikipediaReaderBase
IOException
org.apache.uima.collection.CollectionException
Copyright © 2007–2018 Ubiquitous Knowledge Processing (UKP) Lab, Technische Universität Darmstadt. All rights reserved.