public class NGramsDependency
extends java.lang.Object
Modifier and Type | Field and Description |
---|---|
protected java.util.List<de.ims.icarus.language.dependency.DependencySentenceData> |
corpus |
protected int |
fringeSize |
protected java.util.Map<java.lang.String,java.util.ArrayList<DependencyItemInNuclei>> |
nGramCache |
protected int |
nGramCount |
protected int |
nGramLimit |
protected java.util.Map<java.lang.Integer,java.util.ArrayList<java.lang.Integer>> |
nilCache |
protected java.util.Map<java.lang.Integer,java.util.ArrayList<java.lang.Integer>> |
nilEqualSentencesCache |
protected java.util.Map<java.lang.String,java.util.ArrayList<java.lang.Integer>> |
nilLexiconCache |
protected de.ims.icarus.util.Options |
options |
protected java.util.List<NGramQAttributes> |
queryList |
protected boolean |
useFringe |
protected boolean |
useNumberWildcard |
Constructor and Description |
---|
NGramsDependency() |
NGramsDependency(int nGramCount,
de.ims.icarus.util.Options options,
de.ims.icarus.search_tools.Search search) |
NGramsDependency(de.ims.icarus.util.Options options,
java.util.List<NGramQAttributes> queryList,
de.ims.icarus.search_tools.Search search) |
Modifier and Type | Method and Description |
---|---|
protected java.lang.String |
ensureValid(java.lang.String input) |
static NGramsDependency |
getInstance() |
java.util.List<java.lang.String> |
getLabelVariation(java.lang.String tag) |
int |
getPasses() |
java.util.Map<java.lang.String,java.util.ArrayList<DependencyItemInNuclei>> |
getResult() |
protected java.lang.String |
getTagQueryDependency(java.lang.String qtag) |
void |
initializeUniGrams(de.ims.icarus.language.dependency.DependencySentenceData dd,
int sentenceNr)
Step 1) Initialize Corpus / Create uniGrams
Loop through the Corpus and add all occurring Words with their specific PoSTags
to the nGramCache.
|
void |
nGramResults()
Print out the resulting nGrams.
|
protected void |
nGramResults(java.util.Map<java.lang.String,java.util.ArrayList<DependencyItemInNuclei>> inputNGram)
Print out the resulting nGrams.
|
void |
outputToFile() |
protected DependencySentenceInfo |
returnDependencySentenceInfoNREqual(java.util.ArrayList<DependencyItemInNuclei> l1,
int sentenceNR) |
protected int nGramCount
protected int nGramLimit
protected boolean useFringe
protected int fringeSize
protected boolean useNumberWildcard
protected java.util.Map<java.lang.String,java.util.ArrayList<DependencyItemInNuclei>> nGramCache
protected java.util.List<NGramQAttributes> queryList
protected de.ims.icarus.util.Options options
protected java.util.Map<java.lang.Integer,java.util.ArrayList<java.lang.Integer>> nilCache
protected java.util.Map<java.lang.Integer,java.util.ArrayList<java.lang.Integer>> nilEqualSentencesCache
protected java.util.Map<java.lang.String,java.util.ArrayList<java.lang.Integer>> nilLexiconCache
protected java.util.List<de.ims.icarus.language.dependency.DependencySentenceData> corpus
public NGramsDependency()
public NGramsDependency(de.ims.icarus.util.Options options, java.util.List<NGramQAttributes> queryList, de.ims.icarus.search_tools.Search search)
public NGramsDependency(int nGramCount, de.ims.icarus.util.Options options, de.ims.icarus.search_tools.Search search)
public static NGramsDependency getInstance()
protected java.lang.String ensureValid(java.lang.String input)
protected DependencySentenceInfo returnDependencySentenceInfoNREqual(java.util.ArrayList<DependencyItemInNuclei> l1, int sentenceNR)
Parameters:
l1 -
sentenceNR -
public java.util.List<java.lang.String> getLabelVariation(java.lang.String tag)
public void initializeUniGrams(de.ims.icarus.language.dependency.DependencySentenceData dd, int sentenceNr)
Parameters:
dd -
sentenceNr -
protected java.lang.String getTagQueryDependency(java.lang.String qtag)
public java.util.Map<java.lang.String,java.util.ArrayList<DependencyItemInNuclei>> getResult()
public int getPasses()
public void outputToFile()
Throws:
javax.xml.parsers.ParserConfigurationException
protected void nGramResults(java.util.Map<java.lang.String,java.util.ArrayList<DependencyItemInNuclei>> inputNGram)
public void nGramResults()