From 0f3414c576c4a5252aa768f22cba4db81fc7e6e8 Mon Sep 17 00:00:00 2001 From: Ben Kurtovic Date: Sun, 22 Jul 2012 02:24:59 -0400 Subject: [PATCH] Refactor the last bit of parsing code into support.copyvios. Will clean up in a bit. --- pages/copyvios.mako | 34 +++------------------------------- pages/support/copyvios/__init__.py | 30 ++++++++++++++++++++++++++++++ pages/support/copyvios/checker.py | 2 +- pages/support/copyvios/highlighter.py | 2 +- 4 files changed, 35 insertions(+), 33 deletions(-) diff --git a/pages/copyvios.mako b/pages/copyvios.mako index 48bb056..d114312 100644 --- a/pages/copyvios.mako +++ b/pages/copyvios.mako @@ -1,35 +1,7 @@ -<%! - from urlparse import parse_qs - from earwigbot.bot import Bot -%>\ -<%namespace module="support.copyvios" import="get_results, highlight_delta"/>\ -<%namespace module="support.sites" import="get_site, get_sites"/>\ +<%include file="/support/header.mako" args="environ=environ, title='Copyvio Detector', add_css=('copyvios.css',), add_js=('copyvios.js',)"/>\ +<%namespace module="support.copyvios" import="main, highlight_delta"/>\ <%namespace module="support.misc" import="urlstrip"/>\ -<% - lang = orig_lang = project = name = title = url = None - site = page = result = None - - # Parse the query string. - query = parse_qs(environ["QUERY_STRING"]) - if "lang" in query: - lang = orig_lang = query["lang"][0].decode("utf8").lower() - if "::" in lang: - lang, name = lang.split("::", 1) - if "project" in query: - project = query["project"][0].decode("utf8").lower() - if "title" in query: - title = query["title"][0].decode("utf8") - if "url" in query: - url = query["url"][0].decode("utf8") - - bot = Bot(".earwigbot") - all_langs, all_projects = get_sites(bot) - if lang and project and title: - site = get_site(bot, lang, project, name, all_projects) - if site: - page, result = get_results(bot, site, title, url, query) -%>\ -<%include file="/support/header.mako" args="environ=environ, title='Copyvio Detector', add_css=('copyvios.css',), add_js=('copyvios.js',)"/> +<% lang, project, name, title, url, site, page, result = main(environ) %>

Copyvio Detector

This tool attempts to detect copyright violations in articles. Simply give the title of the page you want to check and hit Submit. The tool will then search for its content elsewhere on the web and display a report if a similar webpage is found. If you also provide a URL, it will not query any search engines and instead display a report comparing the article to that particular webpage, like the Duplication Detector. Check out the FAQ for more information and technical details.

diff --git a/pages/support/copyvios/__init__.py b/pages/support/copyvios/__init__.py index 0908dfe..9d2d27f 100644 --- a/pages/support/copyvios/__init__.py +++ b/pages/support/copyvios/__init__.py @@ -1,4 +1,34 @@ # -*- coding: utf-8 -*- +from urlparse import parse_qs +from earwigbot.bot import Bot + from .checker import get_results from .highlighter import highlight_delta +from ..sites import get_site, get_sites + +def main(context, environ): + lang = orig_lang = project = name = title = url = None + site = page = result = None + + # Parse the query string. + query = parse_qs(environ["QUERY_STRING"]) + if "lang" in query: + lang = orig_lang = query["lang"][0].decode("utf8").lower() + if "::" in lang: + lang, name = lang.split("::", 1) + if "project" in query: + project = query["project"][0].decode("utf8").lower() + if "title" in query: + title = query["title"][0].decode("utf8") + if "url" in query: + url = query["url"][0].decode("utf8") + + bot = Bot(".earwigbot") + all_langs, all_projects = get_sites(bot) + if lang and project and title: + site = get_site(bot, lang, project, name, all_projects) + if site: + page, result = get_results(bot, site, title, url, query) + + return lang, project, name, title, url, site, page, result diff --git a/pages/support/copyvios/checker.py b/pages/support/copyvios/checker.py index 5731ac7..ea39627 100644 --- a/pages/support/copyvios/checker.py +++ b/pages/support/copyvios/checker.py @@ -8,7 +8,7 @@ from earwigbot import exceptions from ..misc import open_sql_connection -def get_results(context, bot, site, title, url, query): +def get_results(bot, site, title, url, query): page = site.get_page(title) try: page.get() # Make sure that the page exists before we check it! diff --git a/pages/support/copyvios/highlighter.py b/pages/support/copyvios/highlighter.py index 0c0b17e..33d78e0 100644 --- a/pages/support/copyvios/highlighter.py +++ b/pages/support/copyvios/highlighter.py @@ -2,7 +2,7 @@ from re import sub, UNICODE -def highlight_delta(context, chain, delta): +def highlight_delta(chain, delta): processed = [] prev_prev = prev = chain.START i = 0