Additional IRC commands and bot tasks for EarwigBot https://en.wikipedia.org/wiki/User:EarwigBot
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

afc_undated.py 7.7 KiB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186
  1. # -*- coding: utf-8 -*-
  2. #
  3. # Copyright (C) 2009-2013 Ben Kurtovic <ben.kurtovic@verizon.net>
  4. #
  5. # Permission is hereby granted, free of charge, to any person obtaining a copy
  6. # of this software and associated documentation files (the "Software"), to deal
  7. # in the Software without restriction, including without limitation the rights
  8. # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  9. # copies of the Software, and to permit persons to whom the Software is
  10. # furnished to do so, subject to the following conditions:
  11. #
  12. # The above copyright notice and this permission notice shall be included in
  13. # all copies or substantial portions of the Software.
  14. #
  15. # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  16. # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  17. # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  18. # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  19. # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  20. # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  21. # SOFTWARE.
  22. from datetime import datetime
  23. import mwparserfromhell
  24. from earwigbot.tasks import Task
  25. from earwigbot.wiki.constants import *
  26. class AFCUndated(Task):
  27. """A task to clear [[Category:Undated AfC submissions]]."""
  28. name = "afc_undated"
  29. number = 5
  30. def setup(self):
  31. cfg = self.config.tasks.get(self.name, {})
  32. self.category = cfg.get("category", "Undated AfC submissions")
  33. default_summary = "Adding timestamp to undated [[WP:AFC|Articles for creation]] submission."
  34. self.summary = self.make_summary(cfg.get("summary", default_summary))
  35. self.namespaces = {
  36. "submission": [NS_USER, NS_PROJECT, NS_PROJECT_TALK],
  37. "talk": [NS_TALK, NS_FILE_TALK, NS_TEMPLATE_TALK, NS_HELP_TALK,
  38. NS_CATEGORY_TALK]
  39. }
  40. self.aliases = {
  41. "submission": ["AFC submission"],
  42. "talk": ["WikiProject Articles for creation"]
  43. }
  44. def run(self, **kwargs):
  45. try:
  46. self.statistics = self.bot.tasks.get("afc_statistics")
  47. except KeyError:
  48. err = "Requires afc_statistics task (from earwigbot_plugins)"
  49. self.logger.error(err)
  50. return
  51. self.site = self.bot.wiki.get_site()
  52. category = self.site.get_category(self.category)
  53. logmsg = u"Undated category [[{0}]] has {1} members"
  54. self.logger.info(logmsg.format(category.title, category.size))
  55. if category.size:
  56. self.build_aliases()
  57. counter = 0
  58. for page in category:
  59. if not counter % 10:
  60. if self.shutoff_enabled():
  61. return
  62. self.process_page(page)
  63. counter += 1
  64. def build_aliases(self):
  65. """Build template name aliases for the AFC templates."""
  66. for key in self.aliases:
  67. base = self.aliases[key][0]
  68. aliases = [base, "Template:" + base]
  69. result = self.site.api_query(
  70. action="query", list="backlinks", bllimit=50,
  71. blfilterredir="redirects", bltitle=aliases[1])
  72. for data in result["query"]["backlinks"]:
  73. redir = self.site.get_page(data["title"])
  74. aliases.append(redir.title)
  75. if redir.namespace == NS_TEMPLATE:
  76. aliases.append(redir.title.split(":", 1)[1])
  77. self.aliases[key] = aliases
  78. def process_page(self, page):
  79. """Date the necessary templates inside a page object."""
  80. if not page.check_exclusion():
  81. msg = u"Skipping [[{0}]]; bot excluded from editing"
  82. self.logger.info(msg.format(page.title))
  83. return
  84. is_sub = page.namespace in self.namespaces["submission"]
  85. is_talk = page.namespace in self.namespaces["talk"]
  86. if is_sub:
  87. aliases = self.aliases["subission"]
  88. timestamps = {}
  89. elif is_talk:
  90. aliases = self.aliases["talk"]
  91. timestamp, reviewer = self.get_talkdata(page)
  92. else:
  93. msg = u"[[{0}]] is undated, but in a namespace I don't know how to process"
  94. self.logger.warn(msg.format(page.title))
  95. return
  96. if not timestamp:
  97. return
  98. code = mwparserfromhell.parse(page.get())
  99. changes = 0
  100. for template in code.filter_templates():
  101. has_ts = template.has("ts", ignore_empty=True)
  102. has_reviewer = template.has("reviewer", ignore_empty=True)
  103. if template.name.matches(aliases) and not has_ts:
  104. if is_sub:
  105. status = self.get_status(template)
  106. if status in timestamps:
  107. timestamp = timestamps[status]
  108. else:
  109. timestamp = self.get_timestamp(page, status)
  110. timestamps[status] = timestamp
  111. template.add("ts", timestamp)
  112. if is_talk and not has_reviewer:
  113. template.add("reviewer", reviewer)
  114. changes += 1
  115. if changes:
  116. msg = u"Dating [[{0}]]: {1}x {2}"
  117. self.logger.info(msg.format(page.title, changes, aliases[0]))
  118. page.edit(unicode(code), self.summary)
  119. else:
  120. msg = u"[[{0}]] is undated, but I can't figure out what to replace"
  121. self.logger.warn(msg.format(page.title))
  122. def get_status(self, template):
  123. """Get the status code that corresponds to a given template."""
  124. valid = ["P", "R", "T", "D"]
  125. if template.has(1):
  126. status = template.get(1).value.strip().upper()
  127. if status in valid:
  128. return status
  129. return "P"
  130. def get_timestamp(self, page, chart):
  131. """Get the timestamp associated with a particular submission."""
  132. log = u"[[{0}]]: Getting timestamp for state {1}"
  133. self.logger.debug(log.format(page.title, chart))
  134. search = self.statistics.search_history
  135. user, ts, revid = search(page.pageid, chart, chart, [])
  136. if not ts:
  137. log = u"Couldn't find timestamp in [[{0}]] with state {1}"
  138. self.logger.warn(log.format(page.title, chart))
  139. return None
  140. return ts.strftime("%Y%m%d%H%M%S")
  141. def get_talkdata(self, page):
  142. """Get the timestamp and reviewer associated with a talkpage.
  143. This is the mover for a normal article submission, and the uploader for
  144. a file page.
  145. """
  146. subject = page.toggle_talk()
  147. if subject.namespace == NS_FILE:
  148. return self.get_filedata(subject)
  149. self.logger.debug(u"[[{0}]]: Getting talkdata".format(page.title))
  150. chart = self.statistics.CHART_ACCEPT
  151. user, ts, revid = self.statistics.get_special(subject.pageid, chart)
  152. if not ts:
  153. log = u"Couldn't get talkdata for [[{0}]]"
  154. self.logger.warn(log.format(page.title))
  155. return None, None
  156. return ts.strftime("%Y%m%d%H%M%S"), user
  157. def get_filedata(self, page):
  158. """Get the timestamp and reviewer associated with a file talkpage."""
  159. self.logger.debug(u"[[{0}]]: Getting filedata".format(page.title))
  160. result = self.site.api_query(action="query", prop="imageinfo",
  161. titles=page.title)
  162. data = result["query"]["pages"].values()[0]
  163. if "imageinfo" not in data:
  164. log = u"Couldn't get filedata for [[{0}]]"
  165. self.logger.warn(log.format(page.title))
  166. return None, None
  167. info = data["imageinfo"][0]
  168. ts = datetime.strptime(info["timestamp"], "%Y-%m-%dT%H:%M:%SZ")
  169. return ts.strftime("%Y%m%d%H%M%S"), info["user"]