diff --git a/CHANGELOG b/CHANGELOG index 68725f3..fec7e5e 100644 --- a/CHANGELOG +++ b/CHANGELOG @@ -15,7 +15,8 @@ v0.2 (unreleased): - Added copyvio detector functionality: specifying a max time for checks; improved exclusion support. URL loading and parsing is parallelized to speed up check times, with a multi-threaded worker model that avoids concurrent - requests to the same domain. Fixed assorted bugs. + requests to the same domain. Improvements to the comparison algorithm. Fixed + assorted bugs. - Added support for Wikimedia Labs when creating a config file. - Added and improved lazy importing for various dependencies. - Fixed a bug in job scheduling. diff --git a/earwigbot/wiki/copyvios/markov.py b/earwigbot/wiki/copyvios/markov.py index 491c875..057fcc1 100644 --- a/earwigbot/wiki/copyvios/markov.py +++ b/earwigbot/wiki/copyvios/markov.py @@ -30,7 +30,7 @@ class MarkovChain(object): """Implements a basic ngram Markov chain of words.""" START = -1 END = -2 - degree = 3 # 2 for bigrams, 3 for trigrams, etc. + degree = 5 # 2 for bigrams, 3 for trigrams, etc. def __init__(self, text): self.text = text