Serialized Form


Package kea.filters

Class kea.filters.KEAFilter extends weka.filters.Filter implements Serializable

serialVersionUID: 1L

Serialized Fields

m_DocumentAtt

int m_DocumentAtt
Index of attribute containing the documents


m_KeyphrasesAtt

int m_KeyphrasesAtt
Index of attribute containing the keyphrases


m_MaxPhraseLength

int m_MaxPhraseLength
The maximum length of phrases


m_MinPhraseLength

int m_MinPhraseLength
The minimum length of phrases


m_max_recall

double m_max_recall

m_numPhrases

int m_numPhrases
The number of phrases to extract.


m_Indexers

int m_Indexers
Experimental! Number of human indexers (times a keyphrase appears in the keyphrase set)


doc

int doc

m_DESCRreplace

boolean m_DESCRreplace
Should non-descriptors be replaced by corresponding descriptors?


m_NODEfeature

boolean m_NODEfeature
Is the node degree (number of related terms in candidate set) being used?


m_LENGTHfeature

boolean m_LENGTHfeature
Is the length of a phrase in words being used?


m_STDEVfeature

boolean m_STDEVfeature
Experimental feature! If m_STDEVused = true, should the standard deviation of position of phrase occurrences be considered? If set to true, the indices of features need to be adjusted in the code manually!


m_KFused

boolean m_KFused
Experimental feature! Is keyphrase frequency attribute being used? If set to true, adjust the indices in the code!


m_Debug

boolean m_Debug
Flag for debugging mode


m_DisallowInternalPeriods

boolean m_DisallowInternalPeriods
Determines whether internal periods are allowed


m_MinNumOccur

int m_MinNumOccur
The minimum number of occurrences of a phrase


m_NumFeatures

int m_NumFeatures
The number of features describing a phrase


m_TfidfIndex

int m_TfidfIndex
Indices of attributes in m_ClassifierData


m_FirstOccurIndex

int m_FirstOccurIndex

m_LengthIndex

int m_LengthIndex
Indices of attributes for new features


m_NodeIndex

int m_NodeIndex

m_STDEVIndex

int m_STDEVIndex

m_KeyFreqIndex

int m_KeyFreqIndex

m_PunctFilter

KEAPhraseFilter m_PunctFilter
The punctuation filter used by this filter


m_NumbersFilter

NumbersFilter m_NumbersFilter
The numbers filter used by this filter


m_Classifier

weka.classifiers.Classifier m_Classifier
The actual classifier used to compute probabilities


m_Dictionary

java.util.HashMap m_Dictionary
The dictionary containing the document frequencies


m_KeyphraseDictionary

java.util.HashMap m_KeyphraseDictionary
The dictionary containing the keyphrases


m_NumDocs

int m_NumDocs
The number of documents in the global frequencies corpus


m_ClassifierData

weka.core.Instances m_ClassifierData
Template for the classifier data


m_Stemmer

Stemmer m_Stemmer
The default stemmer to be used


m_Stopwords

Stopwords m_Stopwords
The list of stop words to be used


m_documentLanguage

java.lang.String m_documentLanguage
The default language to be used


m_vocabulary

java.lang.String m_vocabulary
The Vocabulary name


m_vocabularyFormat

java.lang.String m_vocabularyFormat
The Vocabulary format


m_CheckForProperNouns

boolean m_CheckForProperNouns
Determines whether check for proper nouns is performed

Class kea.filters.KEAPhraseFilter extends weka.filters.Filter implements Serializable

serialVersionUID: 1L

Serialized Fields

m_SelectCols

weka.core.Range m_SelectCols
Stores which columns to select as a funky range


m_DisallowInternalPeriods

boolean m_DisallowInternalPeriods
Determines whether internal periods are allowed

Class kea.filters.NumbersFilter extends weka.filters.Filter implements Serializable

serialVersionUID: 1L


Package kea.stemmers

Class kea.stemmers.FrenchStemmer extends Stemmer implements Serializable

serialVersionUID: 1L

Serialized Fields

sb

java.lang.StringBuffer sb
Buffer for the terms while stemming them.


tb

java.lang.StringBuffer tb
A temporary buffer, used to reconstruct R2


R0

java.lang.String R0
Region R0 is equal to the whole buffer


RV

java.lang.String RV
Region RV "If the word begins with two vowels, RV is the region after the third letter, otherwise the region after the first vowel not at the beginning of the word, or the end of the word if these positions cannot be found."


R1

java.lang.String R1
Region R1 "R1 is the region after the first non-vowel following a vowel or is the null region at the end of the word if there is no such non-vowel"


R2

java.lang.String R2
Region R2 "R2 is the region after the first non-vowel in R1 following a vowel or is the null region at the end of the word if there is no such non-vowel"


suite

boolean suite
Set to true if we need to perform step 2


modified

boolean modified
Set to true if the buffer was modified

Class kea.stemmers.GermanStemmer extends Stemmer implements Serializable

serialVersionUID: 1L

Serialized Fields

sb

java.lang.StringBuffer sb
Buffer for the terms while stemming them.


uppercase

boolean uppercase
Indicates if a term is handled as a noun.


substCount

int substCount
Number of characters that are removed with substitute() while stemming.

Class kea.stemmers.IteratedLovinsStemmer extends LovinsStemmer implements Serializable

serialVersionUID: 1L

Class kea.stemmers.LovinsStemmer extends Stemmer implements Serializable

serialVersionUID: 1L

Class kea.stemmers.NoStemmer extends Stemmer implements Serializable

serialVersionUID: 1L

Class kea.stemmers.PorterStemmer extends Stemmer implements Serializable

serialVersionUID: 1L

Class kea.stemmers.SpanishStemmer extends Stemmer implements Serializable

Serialized Fields

stemmer

SpanishStemmerSB stemmer

Class kea.stemmers.SpanishStemmerSB extends org.tartarus.snowball.SnowballProgram implements Serializable

serialVersionUID: 1L

Serialized Fields

a_0

org.tartarus.snowball.Among[] a_0

a_1

org.tartarus.snowball.Among[] a_1

a_2

org.tartarus.snowball.Among[] a_2

a_3

org.tartarus.snowball.Among[] a_3

a_4

org.tartarus.snowball.Among[] a_4

a_5

org.tartarus.snowball.Among[] a_5

a_6

org.tartarus.snowball.Among[] a_6

a_7

org.tartarus.snowball.Among[] a_7

a_8

org.tartarus.snowball.Among[] a_8

a_9

org.tartarus.snowball.Among[] a_9

I_p2

int I_p2

I_p1

int I_p1

I_pV

int I_pV

Class kea.stemmers.SremovalStemmer extends Stemmer implements Serializable

serialVersionUID: 1L

Class kea.stemmers.Stemmer extends java.lang.Object implements Serializable


Package kea.stopwords

Class kea.stopwords.Stopwords extends java.lang.Object implements Serializable

Class kea.stopwords.StopwordsEnglish extends Stopwords implements Serializable

serialVersionUID: 1L

Class kea.stopwords.StopwordsFrench extends Stopwords implements Serializable

serialVersionUID: 1L

Class kea.stopwords.StopwordsGerman extends Stopwords implements Serializable

serialVersionUID: 1L

Class kea.stopwords.StopwordsSpanish extends Stopwords implements Serializable

serialVersionUID: 1L


Package kea.util

Class kea.util.Counter extends java.lang.Object implements Serializable

serialVersionUID: 1L

Serialized Fields

m_val

int m_val
Integer value stored


Package kea.vocab

Class kea.vocab.Vocabulary extends java.lang.Object implements Serializable

serialVersionUID: 1L

Serialized Fields

useSkos

boolean useSkos
Boolean describing which vocabulary format has been chosen: true if SKOS, false if text.


VocabularyEN

java.util.HashMap VocabularyEN
Vocabulary index


VocabularyENrev

java.util.HashMap VocabularyENrev
Vocabulary reverse index


VocabularyUSE

java.util.HashMap VocabularyUSE
Vocabulary non-descriptors - descriptors list


VocabularyREL

java.util.HashMap VocabularyREL
Vocabulary related terms


VocabularyRT

java.util.HashMap VocabularyRT

m_language

java.lang.String m_language
The document language


m_Stemmer

Stemmer m_Stemmer
The default stemmer to be used


m_Stopwords

Stopwords m_Stopwords
The list of stop words to be used