Constant Field Values


Contents
ca.uottawa.*

ca.uottawa.balie.Balie
public static final boolean DEBUG_ABBREVIATION_LOOKUP false
public static final boolean DEBUG_LANGUAGE_IDENTIFICATION true
public static final boolean DEBUG_LIGATURE false
public static final boolean DEBUG_POS_LOOKUP false
public static final boolean DEBUG_PRINT_SBD_TEST_CORPUS false
public static final boolean DEBUG_PUNCT_LOOKUP false
public static final boolean DEBUG_TOKEN false
public static final boolean DEBUG_TOKENIZER false
public static final boolean DEBUG_UNBREAKABLE_LOOKUP false
public static final java.lang.String ENCODING_DEFAULT "default"
public static final java.lang.String ENCODING_LITTLE_INDIAN "UnicodeLittle"
public static final java.lang.String ENCODING_UTF8 "utf8"
public static final java.lang.String ENGLISH_TOKEN_LIST_ON_DISK "./TokenListEng.sig"
public static final java.lang.String FRENCH_TOKEN_LIST_ON_DISK "./TokenListFre.sig"
public static final java.lang.String GERMAN_TOKEN_LIST_ON_DISK "./TokenListGer.sig"
public static final java.lang.String LANGUAGE_ENGLISH "English"
public static final java.lang.String LANGUAGE_FRENCH "French"
public static final java.lang.String LANGUAGE_GERMAN "German"
public static final java.lang.String LANGUAGE_ID_MODEL "./LanguageIdentificationModel.sig"
public static final java.lang.String LANGUAGE_ID_TESTING_CORPUS "../BaLIECorpora/Corpus - Language Identification/Test"
public static final java.lang.String LANGUAGE_ID_TRAINING_CORPUS "../BaLIECorpora/Corpus - Language Identification/Train"
public static final java.lang.String LANGUAGE_ROMANIAN "Romanian"
public static final java.lang.String LANGUAGE_SPANISH "Spanish"
public static final java.lang.String LANGUAGE_UNKNOWN "Unknown"
public static final java.lang.String OUT_LI_TEST_MODEL "../BaLIECorpora/Arff/LangIDTestModel.arff"
public static final java.lang.String OUT_LI_TRAIN_MODEL "../BaLIECorpora/Arff/LangIDTrainModel.arff"
public static final java.lang.String OUT_SBD_TEST_MODEL "../BaLIECorpora/Arff/SBDTestModel.arff"
public static final java.lang.String OUT_SBD_TRAIN_MODEL "../BaLIECorpora/Arff/SBDTrainModel.arff"
public static final java.lang.String QTAG_ENGLISH "../qTag/qtag-eng"
public static final java.lang.String QTAG_FRENCH "../qTag/qtag-fre"
public static final java.lang.String QTAG_FRENCH_CORPUS "./Corpus - Part-of-Speech/French/french_corpus.txt"
public static final java.lang.String QTAG_GERMAN "../qTag/qtag-ger"
public static final java.lang.String QTAG_ROMANIAN "../qTag/qtag-ro"
public static final java.lang.String QTAG_ROMANIAN_CORPUS "./Corpus - Part-of-Speech/Romanian/romanian_corpus.txt"
public static final java.lang.String QTAG_SPANISH "../qTag/qtag-spa"
public static final java.lang.String QTAG_SPANISH_CORPUS "./Corpus - Part-of-Speech/Spanish/spanish_corpus.txt"
public static final java.lang.String ROMANIAN_TOKEN_LIST_ON_DISK "./TokenListRom.sig"
public static final java.lang.String SBR_MODEL "./SentenceBoundariesRecognition.sig"
public static final java.lang.String SBR_TESTING_CORPUS "../BaLIECorpora/Corpus - Sentence Boundaries/test.xml"
public static final java.lang.String SBR_TRAINING_CORPUS "../BaLIECorpora/Corpus - Sentence Boundaries/train.xml"
public static final java.lang.String SPANISH_TOKEN_LIST_ON_DISK "./TokenListSpa.sig"
public static final java.lang.String UNBREAK_TOKEN_LIST_ON_DISK "./TokenListUnb.sig"

ca.uottawa.balie.Canonizer
public static final int RULE_EXPAND_LIGATURES 8
public static final int RULE_LOWERCASE 1
public static final int RULE_NORMALIZE_PUNCT 2
public static final int RULE_REMOVE_INTERNAL_PUNCT 4

ca.uottawa.balie.HashCodeUtil
public static final int SEED 23

ca.uottawa.balie.TokenConsts
public static final int NE_CAR 8
public static final int NE_END 2048
public static final int NE_LANGUAGE 512
public static final int NE_LOCATION 2
public static final int NE_MONTH 256
public static final int NE_ORGANIZATION 4
public static final int NE_PERSON 1
public static final int NE_START 1024
public static final int POS_ADJECTIVE 4
public static final int POS_ADVERB 16
public static final int POS_CONJUNCTION 32
public static final int POS_DETERMINER 1
public static final int POS_NOUN 2
public static final int POS_NUMBER 536870912
public static final int POS_NUMBER_LIKE 1073741824
public static final int POS_PARTICLE 128
public static final int POS_POSSESSIVE 512
public static final int POS_PREPOSITION 64
public static final int POS_PRONOUN 256
public static final int POS_PROPER_NAME_LIKE 268435456
public static final int POS_UNKNOWN -2147483648
public static final int POS_VERB 8
public static final int PUNCT_AMPERSAND 1048576
public static final int PUNCT_APOSTROPHE 1024
public static final int PUNCT_BACK_SLASH 8192
public static final int PUNCT_CLOSE_BRACKET 131072
public static final int PUNCT_CLOSE_PARENTHESIS 128
public static final int PUNCT_COLON 32
public static final int PUNCT_COMMA 2
public static final int PUNCT_COMMERCIAL_AT 512
public static final int PUNCT_COPYRIGHT 33554432
public static final int PUNCT_CURRENCY 16777216
public static final int PUNCT_DASH 2048
public static final int PUNCT_EXCLAMATION 4
public static final int PUNCT_INTERROGATION 8
public static final int PUNCT_INV_EXCLAMATION 262144
public static final int PUNCT_INV_INTERROGATION 524288
public static final int PUNCT_LINEFEED 536870912
public static final int PUNCT_MISC_ARITHMETIC 16384
public static final int PUNCT_NEWLINE 1073741824
public static final int PUNCT_OPEN_BRACKET 65536
public static final int PUNCT_OPEN_PARENTHESIS 64
public static final int PUNCT_PERCENT 32768
public static final int PUNCT_PERIOD 1
public static final int PUNCT_PIPE 8388608
public static final int PUNCT_QUOTE 256
public static final int PUNCT_SEMI_COLON 16
public static final int PUNCT_SLASH 4096
public static final int PUNCT_TABULATION 268435456
public static final int PUNCT_TILDE 4194304
public static final int PUNCT_UNDERSCORE 2097152
public static final int PUNCT_UNKNOWN -2147483648
public static final int TYPE_PUNCTUATION 1
public static final int TYPE_WORD 2

ca.uottawa.balie.WekaAttributeSelection
public static final int DEFAULT_NUM_ATTRIBUTES 100
public static final int WEKA_CHI_SQUARE 0
public static final int WEKA_INFO_GAIN 1
public static final int WEKA_ONER 6
public static final int WEKA_RELIEF 5
public static final int WEKA_SVM 4
public static final int WEKA_SYM_UNCERT 3
public static final int WEKA_WRAPPER 2

ca.uottawa.balie.WekaPersistance
public static final int PRINT_TESTING_SET 1
public static final int PRINT_TRAINING_SET 0