Преглед изворног кода

Add a bunch of temporary debugging code.

tags/v0.2
Ben Kurtovic пре 9 година
родитељ
комит
32ef0fbf1f
1 измењен фајл са 15 додатих и 0 уклоњених редова
  1. +15
    -0
      earwigbot/wiki/copyvios/workers.py

+ 15
- 0
earwigbot/wiki/copyvios/workers.py Прегледај датотеку

@@ -21,6 +21,7 @@
# SOFTWARE.

from gzip import GzipFile
from logging import getLogger
from math import log
from Queue import Empty, Queue
from socket import error
@@ -142,6 +143,8 @@ class _CopyvioWorker(object):
self._queue = None
self._opener = build_opener()

self._logger = None

def _open_url(self, source):
"""Open a URL and return its parsed content, or None.

@@ -202,23 +205,32 @@ class _CopyvioWorker(object):
timeout = None

if self._queue:
self._logger.debug(u"Popping source from existing queue ({0})".format(self._site))
source = self._queue.pop()
self._logger.debug(u"Got URL: {0}".format(source.url))
with self._queues.lock:
if not self._queue:
self._logger.debug(u"Destroying site {0}".format(self._site))
del self._queues.sites[self._site]
self._queue = None
else:
self._logger.debug("Waiting for unassigned URL queue")
site, queue = self._queues.unassigned.get(timeout=timeout)
if site is StopIteration:
return StopIteration
self._logger.debug(u"Got queue: {0}".format(site))
source = queue.pop()
self._logger.debug(u"Got URL: {0}".format(source.url))
with self._queues.lock:
if not queue:
self._logger.debug(u"Destroying site {0}".format(site))
del self._queues.sites[site]
else:
self._logger.debug(u"Saving site {0}".format(site))
self._site = site
self._queue = queue
if not source.active():
self._logger.debug(u"Inactive source; trying again")
return self._dequeue()
return source

@@ -246,6 +258,7 @@ class _CopyvioWorker(object):
thread.name = "cvworker-" + name
thread.daemon = True
thread.start()
self._logger = getLogger("earwigbot.wiki.cvworker." + name)


class CopyvioWorkspace(object):
@@ -358,7 +371,9 @@ class CopyvioWorkspace(object):
"""Wait for the workers to finish handling the sources."""
self._logger.debug("Waiting on {0} sources".format(len(self.sources)))
for source in self.sources:
self._logger.debug("Waiting on source: {0}".format(source.url))
source.join(self._until)
self._logger.debug("Done waiting")

def compare(self, source, source_chain):
"""Compare a source to the article, and update the best known one."""


Loading…
Откажи
Сачувај