Parameter optimization.
[Category diff]
+1 194
-1 21
+2 15
-2 1
+3 1
-3 15
+4 152
-4 90
+5 108
-5 197
+6 94
-6 136
+7 28
-7 132

[Weighted category diff]
+1 230
-1 23
+2 15
-2 1
+3 1
-3 15
+4 180
-4 106
+5 122
-5 224
+6 107
-6 158
+7 29
-7 157

show diff for ./en_user_log_phones_2011_08.csv
+1 171
-1 9
+2 7
-2 1
+3 1
-3 7
+4 123
-4 76
+5 84
-5 157
+6 66
-6 119
+7 20
-7 103

Before
---- count ----
Count(1):75.64%, 177913
Count(2):1.06%, 2510
Count(3):0.56%, 1319
Count(4):6.63%, 15612
Count(5):9.87%, 23223
Count(6):2.79%, 6580
Count(7):3.41%, 8038
---- weight ----
Weight(1):96.88%, 2009907
Weight(2):0.24%, 5157
Weight(3):0.09%, 2025
Weight(4):0.77%, 16095
Weight(5):1.11%, 23077
Weight(6):0.39%, 8172
Weight(7):0.48%, 10146
---- score ----
Conservative score = 66.406
Normal score = 81.512
Agressive score = 89.064
Insane score = 92.841

After
---- count ----
Count(1):75.71%, 178087
Count(2):1.07%, 2524
Count(3):0.55%, 1305
Count(4):6.66%, 15677
Count(5):9.83%, 23133
Count(6):2.78%, 6539
Count(7):3.37%, 7930
---- weight ----
Weight(1):96.89%, 2010118
Weight(2):0.24%, 5171
Weight(3):0.09%, 2011
Weight(4):0.78%, 16184
Weight(5):1.1%, 22972
Weight(6):0.39%, 8109
Weight(7):0.48%, 10014
---- score ----
Conservative score = 66.431
Normal score = 81.531
Agressive score = 89.08
Insane score = 92.855

No diffs for 10+ freq user log.

Change-Id: Ica4a7604507a2c91aaa7daf5bacf4fce4039f547
main
parent
a8f4efd013
commit
15b1a0fd14
|
@@ -35,7 +35,7 @@ const float ScoringParams::OMISSION_COST = 0.4676f;
|
||||||
const float ScoringParams::OMISSION_COST_SAME_CHAR = 0.399f;
|
const float ScoringParams::OMISSION_COST_SAME_CHAR = 0.399f;
|
||||||
const float ScoringParams::OMISSION_COST_FIRST_CHAR = 0.5256f;
|
const float ScoringParams::OMISSION_COST_FIRST_CHAR = 0.5256f;
|
||||||
const float ScoringParams::INSERTION_COST = 0.7248f;
|
const float ScoringParams::INSERTION_COST = 0.7248f;
|
||||||
const float ScoringParams::TERMINAL_INSERTION_COST = 0.9828f;
|
const float ScoringParams::TERMINAL_INSERTION_COST = 0.8128f;
|
||||||
const float ScoringParams::INSERTION_COST_SAME_CHAR = 0.5508f;
|
const float ScoringParams::INSERTION_COST_SAME_CHAR = 0.5508f;
|
||||||
const float ScoringParams::INSERTION_COST_PROXIMITY_CHAR = 0.674f;
|
const float ScoringParams::INSERTION_COST_PROXIMITY_CHAR = 0.674f;
|
||||||
const float ScoringParams::INSERTION_COST_FIRST_CHAR = 0.639f;
|
const float ScoringParams::INSERTION_COST_FIRST_CHAR = 0.639f;
|
||||||
|
@@ -43,10 +43,10 @@ const float ScoringParams::TRANSPOSITION_COST = 0.5608f;
|
||||||
const float ScoringParams::SPACE_SUBSTITUTION_COST = 0.339f;
|
const float ScoringParams::SPACE_SUBSTITUTION_COST = 0.339f;
|
||||||
const float ScoringParams::ADDITIONAL_PROXIMITY_COST = 0.4576f;
|
const float ScoringParams::ADDITIONAL_PROXIMITY_COST = 0.4576f;
|
||||||
const float ScoringParams::SUBSTITUTION_COST = 0.3806f;
|
const float ScoringParams::SUBSTITUTION_COST = 0.3806f;
|
||||||
const float ScoringParams::COST_NEW_WORD = 0.0292f;
|
const float ScoringParams::COST_NEW_WORD = 0.0312f;
|
||||||
const float ScoringParams::COST_SECOND_OR_LATER_WORD_FIRST_CHAR_UPPERCASE = 0.3224f;
|
const float ScoringParams::COST_SECOND_OR_LATER_WORD_FIRST_CHAR_UPPERCASE = 0.3224f;
|
||||||
const float ScoringParams::DISTANCE_WEIGHT_LANGUAGE = 1.1214f;
|
const float ScoringParams::DISTANCE_WEIGHT_LANGUAGE = 1.1214f;
|
||||||
const float ScoringParams::COST_FIRST_LOOKAHEAD = 0.4786f;
|
const float ScoringParams::COST_FIRST_LOOKAHEAD = 0.4836f;
|
||||||
const float ScoringParams::COST_LOOKAHEAD = 0.00624f;
|
const float ScoringParams::COST_LOOKAHEAD = 0.00624f;
|
||||||
const float ScoringParams::HAS_PROXIMITY_TERMINAL_COST = 0.06836f;
|
const float ScoringParams::HAS_PROXIMITY_TERMINAL_COST = 0.06836f;
|
||||||
const float ScoringParams::HAS_EDIT_CORRECTION_TERMINAL_COST = 0.0362f;
|
const float ScoringParams::HAS_EDIT_CORRECTION_TERMINAL_COST = 0.0362f;
|
||||||
|
|
Loading…
Reference in New Issue