|
@@ -241,6 +241,10 @@ class CopyrightMixin(object): |
|
|
article_chain = _MarkovChain(clean) |
|
|
article_chain = _MarkovChain(clean) |
|
|
last_query = time() |
|
|
last_query = time() |
|
|
|
|
|
|
|
|
|
|
|
if article_chain.size() < 20: # Auto-fail very small articles |
|
|
|
|
|
return _CopyvioCheckResult(False, best_confidence, best_match, |
|
|
|
|
|
num_queries, article_chain, best_chains) |
|
|
|
|
|
|
|
|
while (chunks and best_confidence < min_confidence and |
|
|
while (chunks and best_confidence < min_confidence and |
|
|
(max_queries < 0 or num_queries < max_queries)): |
|
|
(max_queries < 0 or num_queries < max_queries)): |
|
|
urls = search(chunks.pop(0)) |
|
|
urls = search(chunks.pop(0)) |
|
|