diff options
Diffstat (limited to 'spellchecker/src/CorpusReader.java')
-rw-r--r-- | spellchecker/src/CorpusReader.java | 3 |
1 files changed, 2 insertions, 1 deletions
diff --git a/spellchecker/src/CorpusReader.java b/spellchecker/src/CorpusReader.java
index 8281210..686f243 100644
--- a/spellchecker/src/CorpusReader.java
+++ b/spellchecker/src/CorpusReader.java
@@ -119,7 +119,8 @@ public class CorpusReader {
         // probability as result.
         if (NGram.indexOf(' ') != -1) {
             // bigram, must be the nominator
-            smoothedCount += 1;
+            // we do not have a lot of bigrams
+            smoothedCount += .01;
         } else {
             // unigram, must be the denominator
             smoothedCount += 1;