public class HtmlReader
extends org.apache.uima.fit.component.JCasCollectionReader_ImplBase
Modifier and Type | Field and Description |
---|---|
static String | ENCODING_AUTO — Automatically detect encoding. |
static String | PARAM_ENCODING — Name of configuration parameter that contains the character encoding used by the input files. |
static String | PARAM_LANGUAGE — Set this as the language of the produced documents. |
static String | PARAM_SOURCE_LOCATION — URL from which the input is read. |
Constructor and Description |
---|
HtmlReader() |
Modifier and Type | Method and Description |
---|---|
void | getNext(org.apache.uima.jcas.JCas jcas) |
org.apache.uima.util.Progress[] | getProgress() |
boolean | hasNext() |
void | initialize(org.apache.uima.UimaContext context) |
close, getLogger, getNext, initialize
destroy, getCasInitializer, getProcessingResourceMetaData, initialize, isConsuming, reconfigure, setCasInitializer, typeSystemInit
getConfigParameterValue, getConfigParameterValue, setConfigParameterValue, setConfigParameterValue
getCasManager, getMetaData, getResourceManager, getUimaContext, getUimaContextAdmin, setLogger, setMetaData
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
public static final String ENCODING_AUTO
See Also: CharsetDetector, Constant Field Values
public static final String PARAM_ENCODING
public static final String PARAM_SOURCE_LOCATION
public static final String PARAM_LANGUAGE
public void initialize(org.apache.uima.UimaContext context) throws org.apache.uima.resource.ResourceInitializationException
Overrides: initialize in class org.apache.uima.fit.component.JCasCollectionReader_ImplBase
Throws: org.apache.uima.resource.ResourceInitializationException
public boolean hasNext() throws IOException, org.apache.uima.collection.CollectionException
Throws: IOException, org.apache.uima.collection.CollectionException
public org.apache.uima.util.Progress[] getProgress()
public void getNext(org.apache.uima.jcas.JCas jcas) throws IOException, org.apache.uima.collection.CollectionException
Specified by: getNext in class org.apache.uima.fit.component.JCasCollectionReader_ImplBase
Throws: IOException, org.apache.uima.collection.CollectionException
Copyright © 2007–2016 Ubiquitous Knowledge Processing (UKP) Lab, Technische Universität Darmstadt. All rights reserved.