public class Web1TConverter extends Object
Modifier and Type | Field and Description |
---|---|
static String | SENTENCE_END |
static String | SENTENCE_START |
Constructor and Description |
---|
Web1TConverter(String outputPath) |
Web1TConverter(String outputPath, int aMinNGramLength, int aMaxNGramLength) |
Modifier and Type | Method and Description |
---|---|
void | add(ConditionalFrequencyDistribution<Integer,String> cfd) |
void | add(org.apache.uima.jcas.JCas jcas, Set<String> inputPaths, org.apache.uima.cas.Type sentenceType) |
void | createIndex() |
int | getMaxNgramLength() |
int | getMinFrequency() |
int | getMinNgramLength() |
String | getOutputEncoding() |
float | getSplitThreshold() |
boolean | isToLowercase() |
boolean | isWriteIndexes() |
void | setMaxNgramLength(int maxNgramLength) |
void | setMinFrequency(int minFrequency) |
void | setMinNgramLength(int minNgramLength) |
void | setOutputEncoding(String outputEncoding) |
void | setSplitThreshold(float splitThreshold) |
void | setToLowercase(boolean toLowercase) |
void | setWriteIndexes(boolean writeIndexes) |
public static final String SENTENCE_START
public static final String SENTENCE_END
public Web1TConverter(String outputPath) throws IOException
Throws: IOException
public Web1TConverter(String outputPath, int aMinNGramLength, int aMaxNGramLength) throws IOException
Throws: IOException
public void add(org.apache.uima.jcas.JCas jcas, Set<String> inputPaths, org.apache.uima.cas.Type sentenceType) throws IOException
Throws: IOException
public void add(ConditionalFrequencyDistribution<Integer,String> cfd) throws IOException
Throws: IOException
public void createIndex() throws IOException
Throws: IOException
public boolean isWriteIndexes()
public void setWriteIndexes(boolean writeIndexes)
public float getSplitThreshold()
public void setSplitThreshold(float splitThreshold)
public String getOutputEncoding()
public void setOutputEncoding(String outputEncoding)
public int getMinNgramLength()
public void setMinNgramLength(int minNgramLength)
public int getMaxNgramLength()
public void setMaxNgramLength(int maxNgramLength)
public int getMinFrequency()
public void setMinFrequency(int minFrequency)
public boolean isToLowercase()
public void setToLowercase(boolean toLowercase)
Copyright © 2007–2018 Ubiquitous Knowledge Processing (UKP) Lab, Technische Universität Darmstadt. All rights reserved.