public class BC2GMDataset extends Dataset
Inherited nested classes/interfaces: Dataset.Tag

| Constructor and Description |
|---|
| BC2GMDataset() |
| BC2GMDataset(Tokenizer tokenizer) |

| Modifier and Type | Method and Description |
|---|---|
| protected void | addAlternateMentions(Sentence sentence, HashMap<String,LinkedList<Dataset.Tag>> tags) |
| protected HashMap<String,LinkedList<Dataset.Tag>> | getAlternateTags(BufferedReader tagFile, String geneLabel) |
| protected Sentence | getSentence(String id, String sentenceText, Tokenizer tokenizer, HashMap<String,LinkedList<Dataset.Tag>> tags) |
| protected HashMap<String,LinkedList<Dataset.Tag>> | getTags(BufferedReader tagFile, String geneLabel) |
| protected static int | getTokenIndex(List<Token> tokens, int index) |
| void | load(org.apache.commons.configuration.HierarchicalConfiguration config) |
| void | load(String sentenceFilename, String mentionsFilename, String alternateMentionsFilename, String geneLabel) |
| List<Dataset> | split(int n) |

Inherited methods: getSentences, getTokenCountMention, getTokenCountTotal, getTypeCounts, setTokenizer

public BC2GMDataset(Tokenizer tokenizer)
public BC2GMDataset()
public void load(org.apache.commons.configuration.HierarchicalConfiguration config)
public void load(String sentenceFilename, String mentionsFilename, String alternateMentionsFilename, String geneLabel)
protected HashMap<String,LinkedList<Dataset.Tag>> getTags(BufferedReader tagFile, String geneLabel) throws IOException
Throws: IOException
protected HashMap<String,LinkedList<Dataset.Tag>> getAlternateTags(BufferedReader tagFile, String geneLabel) throws IOException
Throws: IOException
protected Sentence getSentence(String id, String sentenceText, Tokenizer tokenizer, HashMap<String,LinkedList<Dataset.Tag>> tags)
protected void addAlternateMentions(Sentence sentence, HashMap<String,LinkedList<Dataset.Tag>> tags)
Copyright © 2018 JULIE Lab, Germany. All rights reserved.