de.unihd.dbs.uima.reader.tempeval2reader
public class Tempeval2Reader extends org.apache.uima.collection.CollectionReader_ImplBase
Modifier and Type | Field and Description |
---|---|
static java.lang.String |
FILE_BASE_SEGMENTATION
Parameter for files in the input directory
|
static java.lang.String |
FILE_DCT |
java.util.HashMap<java.lang.String,Dct> |
hmDct
HashMap for all document creation times
|
java.util.HashMap<java.lang.String,Token> |
hmToken
HashMap for all tokens of a document
|
java.lang.Integer |
numberOfDocuments
Number of documents; needed to create CAS objects for all "documents"
|
static java.lang.String |
PARAM_INPUTDIR
Name of configuration parameter that must be set to the path of a directory
containing input files.
|
Constructor and Description |
---|
Tempeval2Reader() |
Modifier and Type | Method and Description |
---|---|
java.lang.Integer |
addSentenceAnnotation(java.lang.String sentenceString,
java.lang.String fileId,
java.lang.Integer sentId,
java.lang.Integer positionCounter,
org.apache.uima.jcas.JCas jcas) |
java.lang.Integer |
addTokenAnnotation(java.lang.String tokenString,
java.lang.String fileId,
java.lang.Integer sentId,
java.lang.Integer tokId,
java.lang.Integer positionCounter,
org.apache.uima.jcas.JCas jcas)
Adds a token annotation to the given JCas.
|
void |
close() |
void |
getNext(org.apache.uima.cas.CAS cas) |
org.apache.uima.util.Progress[] |
getProgress() |
boolean |
hasNext() |
void |
initialize() |
java.lang.String |
resetParentheses(java.lang.String tokenString) |
void |
setDocumentCreationTime(java.lang.String docname,
java.util.List<java.io.File> inputFiles,
org.apache.uima.jcas.JCas jcas) |
void |
setTextSentencesTokens(java.lang.String docname,
java.util.List<java.io.File> inputFiles,
org.apache.uima.jcas.JCas jcas) |
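Methods inherited from class org.apache.uima.collection.CollectionReader_ImplBase: destroy, getCasInitializer, getProcessingResourceMetaData, initialize, isConsuming, reconfigure, setCasInitializer, typeSystemInit
Methods inherited from class org.apache.uima.resource.ConfigurableResource_ImplBase: getConfigParameterValue, getConfigParameterValue, setConfigParameterValue, setConfigParameterValue
Methods inherited from class org.apache.uima.resource.Resource_ImplBase: getCasManager, getLogger, getMetaData, getResourceManager, getUimaContext, getUimaContextAdmin, setLogger
Methods inherited from class java.lang.Object: equals, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait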
public static final java.lang.String FILE_BASE_SEGMENTATION
public static final java.lang.String FILE_DCT
public java.lang.Integer numberOfDocuments
public java.util.HashMap<java.lang.String,Token> hmToken
public java.util.HashMap<java.lang.String,Dct> hmDct
public static final java.lang.String PARAM_INPUTDIR
public void initialize() throws org.apache.uima.resource.ResourceInitializationException
Overrides: initialize in class org.apache.uima.collection.CollectionReader_ImplBase
Throws: org.apache.uima.resource.ResourceInitializationException
public void getNext(org.apache.uima.cas.CAS cas) throws java.io.IOException, org.apache.uima.collection.CollectionException
Throws: java.io.IOException
Throws: org.apache.uima.collection.CollectionException
public boolean hasNext() throws java.io.IOException, org.apache.uima.collection.CollectionException
Throws: java.io.IOException
Throws: org.apache.uima.collection.CollectionException
See Also: BaseCollectionReader.hasNext()
public org.apache.uima.util.Progress[] getProgress()
BaseCollectionReader.getProgress()
public void close() throws java.io.IOException
Throws: java.io.IOException
See Also: BaseCollectionReader.close()
public void setDocumentCreationTime(java.lang.String docname, java.util.List<java.io.File> inputFiles, org.apache.uima.jcas.JCas jcas) throws java.io.IOException
Throws: java.io.IOException
public void setTextSentencesTokens(java.lang.String docname, java.util.List<java.io.File> inputFiles, org.apache.uima.jcas.JCas jcas) throws java.io.IOException
Throws: java.io.IOException
public java.lang.String resetParentheses(java.lang.String tokenString)
public java.lang.Integer addSentenceAnnotation(java.lang.String sentenceString, java.lang.String fileId, java.lang.Integer sentId, java.lang.Integer positionCounter, org.apache.uima.jcas.JCas jcas)
public java.lang.Integer addTokenAnnotation(java.lang.String tokenString, java.lang.String fileId, java.lang.Integer sentId, java.lang.Integer tokId, java.lang.Integer positionCounter, org.apache.uima.jcas.JCas jcas)
Parameters (no descriptions are given in the original documentation): tokenString, fileId, sentId, tokId, positionCounter, jcas