Compare commits
25 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
| 2f022d9d30 | |||
| 56701107db | |||
| 7ccfb90888 | |||
| 22a2cc5799 | |||
| 9d471bee20 | |||
| 16a774fae5 | |||
| 038dd6e36a | |||
| e468260f7f | |||
| da99dee429 | |||
| b96c5d4a33 | |||
| 73bf26b627 | |||
| df2f13fb66 | |||
| 7b27577915 | |||
| d76f914615 | |||
| d9d385cfe8 | |||
| 2076932cbf | |||
| 9fe1c36482 | |||
| c730d9ba9c | |||
| 3ed67431cf | |||
| 287942e174 | |||
| 4de2116717 | |||
| 3349c9f3d3 | |||
| a250074caa | |||
| 581e043255 | |||
| e932303c40 |
2
.gitignore
vendored
2
.gitignore
vendored
@@ -62,3 +62,5 @@ target/
|
||||
|
||||
# Test
|
||||
test.py
|
||||
|
||||
disabled
|
||||
|
||||
3
.gitmodules
vendored
Normal file
3
.gitmodules
vendored
Normal file
@@ -0,0 +1,3 @@
|
||||
[submodule "jogobot"]
|
||||
path = jogobot
|
||||
url = ../jogobot
|
||||
@@ -1,7 +1,7 @@
|
||||
#!/usr/bin/env python3
|
||||
# -*- coding: utf-8 -*-
|
||||
#
|
||||
# chartsbot.py
|
||||
# charts.py
|
||||
#
|
||||
# original version by:
|
||||
#
|
||||
@@ -11,7 +11,7 @@
|
||||
#
|
||||
# modified by:
|
||||
#
|
||||
# Copyright 2015 GOLDERWEB – Jonathan Golder <jonathan@golderweb.de>
|
||||
# Copyright 2016 GOLDERWEB – Jonathan Golder <jonathan@golderweb.de>
|
||||
#
|
||||
# This program is free software; you can redistribute it and/or modify
|
||||
# it under the terms of the GNU General Public License as published by
|
||||
@@ -46,10 +46,14 @@ The following parameters are supported:
|
||||
|
||||
|
||||
import locale
|
||||
import os
|
||||
import sys
|
||||
|
||||
import pywikibot
|
||||
from pywikibot import pagegenerators
|
||||
|
||||
import jogobot
|
||||
|
||||
from summarypage import SummaryPage
|
||||
|
||||
# This is required for the text that is shown when you run this script
|
||||
@@ -87,6 +91,9 @@ class ChartsBot( ):
|
||||
# Force parsing of countrylist
|
||||
self.force_reload = force_reload
|
||||
|
||||
# Output Information
|
||||
jogobot.output( "Chartsbot invoked" )
|
||||
|
||||
# Set the edit summary message
|
||||
self.site = pywikibot.Site()
|
||||
self.summary = "Bot: Aktualisiere Übersichtsseite Nummer-eins-Hits"
|
||||
@@ -94,14 +101,6 @@ class ChartsBot( ):
|
||||
# Set locale to 'de_DE.UTF-8'
|
||||
locale.setlocale(locale.LC_ALL, 'de_DE.UTF-8')
|
||||
|
||||
# provisional-onwiki-activation
|
||||
page_active = pywikibot.Page( self.site, "Benutzer:JogoBot/active" )
|
||||
text_active = page_active.get()
|
||||
|
||||
if "true" not in text_active.lower():
|
||||
pywikibot.output( "Bot ist deaktiviert!" )
|
||||
return False
|
||||
|
||||
def run(self):
|
||||
"""Process each page from the generator."""
|
||||
for page in self.generator:
|
||||
@@ -126,7 +125,7 @@ class ChartsBot( ):
|
||||
text = sumpage.get_new_text()
|
||||
|
||||
if not self.save(text, page, self.summary, False):
|
||||
pywikibot.output(u'Page %s not saved.' % page.title(asLink=True))
|
||||
jogobot.output(u'Page %s not saved.' % page.title(asLink=True))
|
||||
|
||||
def load(self, page):
|
||||
"""Load the text of the given page."""
|
||||
@@ -134,11 +133,11 @@ class ChartsBot( ):
|
||||
# Load the page
|
||||
text = page.get()
|
||||
except pywikibot.NoPage:
|
||||
pywikibot.output(u"Page %s does not exist; skipping."
|
||||
% page.title(asLink=True))
|
||||
jogobot.output( u"Page %s does not exist; skipping."
|
||||
% page.title(asLink=True), "ERROR" )
|
||||
except pywikibot.IsRedirectPage:
|
||||
pywikibot.output(u"Page %s is a redirect; skipping."
|
||||
% page.title(asLink=True))
|
||||
jogobot.output( u"Page %s is a redirect; skipping."
|
||||
% page.title(asLink=True), "ERROR" )
|
||||
else:
|
||||
return text
|
||||
return None
|
||||
@@ -148,13 +147,17 @@ class ChartsBot( ):
|
||||
"""Update the given page with new text."""
|
||||
# only save if something was changed (and not just revision)
|
||||
if text != page.get():
|
||||
# Show the title of the page we're working on.
|
||||
# Highlight the title in purple.
|
||||
pywikibot.output(u"\n\n>>> \03{lightpurple}%s\03{default} <<<"
|
||||
% page.title())
|
||||
# show what was changed
|
||||
pywikibot.showDiff(page.get(), text)
|
||||
pywikibot.output(u'Comment: %s' % comment)
|
||||
|
||||
# Show diff only in interactive mode or in verbose mode
|
||||
if not self.always or pywikibot.config.verbose_output:
|
||||
|
||||
# Show the title of the page we're working on.
|
||||
# Highlight the title in purple.
|
||||
jogobot.output( u">>> \03{lightpurple}%s\03{default} <<<"
|
||||
% page.title())
|
||||
# show what was changed
|
||||
pywikibot.showDiff(page.get(), text)
|
||||
jogobot.output(u'Comment: %s' % comment)
|
||||
|
||||
if self.always or pywikibot.input_yn(
|
||||
u'Do you want to accept these changes?',
|
||||
@@ -165,17 +168,17 @@ class ChartsBot( ):
|
||||
page.save(summary=comment or self.comment,
|
||||
minor=minorEdit, botflag=botflag)
|
||||
except pywikibot.LockedPage:
|
||||
pywikibot.output(u"Page %s is locked; skipping."
|
||||
% page.title(asLink=True))
|
||||
jogobot.output( u"Page %s is locked; skipping."
|
||||
% page.title(asLink=True), "ERROR" )
|
||||
except pywikibot.EditConflict:
|
||||
pywikibot.output(
|
||||
jogobot.output(
|
||||
u'Skipping %s because of edit conflict'
|
||||
% (page.title()))
|
||||
% (page.title()), "ERROR")
|
||||
except pywikibot.SpamfilterError as error:
|
||||
pywikibot.output(
|
||||
jogobot.output(
|
||||
u'Cannot change %s because of spam blacklist \
|
||||
entry %s'
|
||||
% (page.title(), error.url))
|
||||
% (page.title(), error.url), "ERROR")
|
||||
else:
|
||||
return True
|
||||
return False
|
||||
@@ -190,43 +193,65 @@ def main(*args):
|
||||
@param args: command line arguments
|
||||
@type args: list of unicode
|
||||
"""
|
||||
|
||||
# Process global arguments to determine desired site
|
||||
local_args = pywikibot.handle_args(args)
|
||||
|
||||
# This factory is responsible for processing command line arguments
|
||||
# that are also used by other scripts and that determine on which pages
|
||||
# to work on.
|
||||
genFactory = pagegenerators.GeneratorFactory()
|
||||
# The generator gives the pages that should be worked upon.
|
||||
gen = None
|
||||
# Get the jogobot-task_slug (basename of current file without ending)
|
||||
task_slug = os.path.basename(__file__)[:-len(".py")]
|
||||
|
||||
# If always is True, bot won't ask for confirmation of edit (automode)
|
||||
always = False
|
||||
# Before running, we need to check whether we are currently active or not
|
||||
try:
|
||||
# Will throw Exception if disabled/blocked
|
||||
jogobot.is_active( task_slug )
|
||||
|
||||
# If force_reload is True, bot will always parse Countrylist regardless of
|
||||
# parsing is needed or not
|
||||
force_reload = False
|
||||
except jogobot.jogobot.Blocked:
|
||||
(type, value, traceback) = sys.exc_info()
|
||||
jogobot.output( "\03{lightpurple} %s (%s)" % (value, type ),
|
||||
"CRITICAL" )
|
||||
|
||||
# Parse command line arguments
|
||||
for arg in local_args:
|
||||
if arg.startswith("-always"):
|
||||
always = True
|
||||
elif arg.startswith("-force-reload"):
|
||||
force_reload = True
|
||||
else:
|
||||
genFactory.handleArg(arg)
|
||||
except jogobot.jogobot.Disabled:
|
||||
(type, value, traceback) = sys.exc_info()
|
||||
jogobot.output( "\03{red} %s (%s)" % (value, type ),
|
||||
"ERROR" )
|
||||
|
||||
if not gen:
|
||||
gen = genFactory.getCombinedGenerator()
|
||||
if gen:
|
||||
# The preloading generator is responsible for downloading multiple
|
||||
# pages from the wiki simultaneously.
|
||||
gen = pagegenerators.PreloadingGenerator(gen)
|
||||
bot = ChartsBot(gen, always, force_reload)
|
||||
if bot:
|
||||
bot.run()
|
||||
# Bot/Task is active
|
||||
else:
|
||||
pywikibot.showHelp()
|
||||
# This factory is responsible for processing command line arguments
|
||||
# that are also used by other scripts and that determine on which pages
|
||||
# to work on.
|
||||
genFactory = pagegenerators.GeneratorFactory()
|
||||
# The generator gives the pages that should be worked upon.
|
||||
gen = None
|
||||
|
||||
# If always is True, bot won't ask for confirmation of edit (automode)
|
||||
always = False
|
||||
|
||||
# If force_reload is True, bot will always parse Countrylist regardless
|
||||
# if parsing is needed or not
|
||||
force_reload = False
|
||||
|
||||
# Parse command line arguments
|
||||
for arg in local_args:
|
||||
if arg.startswith("-always"):
|
||||
always = True
|
||||
elif arg.startswith("-force-reload"):
|
||||
force_reload = True
|
||||
else:
|
||||
pass
|
||||
genFactory.handleArg(arg)
|
||||
|
||||
if not gen:
|
||||
gen = genFactory.getCombinedGenerator()
|
||||
if gen:
|
||||
# The preloading generator is responsible for downloading multiple
|
||||
# pages from the wiki simultaneously.
|
||||
gen = pagegenerators.PreloadingGenerator(gen)
|
||||
bot = ChartsBot(gen, always, force_reload)
|
||||
if bot:
|
||||
bot.run()
|
||||
else:
|
||||
pywikibot.showHelp()
|
||||
|
||||
if( __name__ == "__main__" ):
|
||||
main()
|
||||
169
countrylist.py
169
countrylist.py
@@ -25,6 +25,7 @@
|
||||
Provides a class for handling charts list per country and year
|
||||
"""
|
||||
|
||||
import re
|
||||
import locale
|
||||
from datetime import datetime
|
||||
|
||||
@@ -97,15 +98,15 @@ class CountryList():
|
||||
|
||||
def find_year( self ):
|
||||
"""
|
||||
Try to find the year related to CountryList
|
||||
Try to find the year related to CountryList using regex
|
||||
"""
|
||||
self.year = datetime.now().year
|
||||
match = re.search( r"^.+\((\d{4})\)", self.page.title() )
|
||||
|
||||
# Check if year is in page.title, if not try last year
|
||||
if str( self.year ) not in self.page.title():
|
||||
self.year -= 1
|
||||
# If last year does not match, raise YearError
|
||||
if str( self.year ) not in self.page.title():
|
||||
# We matched something
|
||||
if match:
|
||||
self.year = int(match.group(1))
|
||||
|
||||
else:
|
||||
raise CountryListError( "CountryList year is errorneous!" )
|
||||
|
||||
def parse( self ):
|
||||
@@ -113,6 +114,9 @@ class CountryList():
|
||||
Handles the parsing process
|
||||
"""
|
||||
|
||||
# Set revid
|
||||
self.revid = self.page.latest_revision_id
|
||||
|
||||
# Parse page with mwparser
|
||||
self.generate_wikicode()
|
||||
|
||||
@@ -350,6 +354,45 @@ missing!" )
|
||||
for ref in self._interpret_raw.ifilter_tags(matches="ref"):
|
||||
self._interpret_raw.remove( ref )
|
||||
|
||||
# Handle SortKeyName and SortKey
|
||||
for template in self._interpret_raw.ifilter_templates(
|
||||
matches="SortKey" ):
|
||||
|
||||
if template.name == "SortKeyName":
|
||||
# Differing Link-Destination is provided as param 3
|
||||
if template.has(3):
|
||||
# Construct link out of Template, Params:
|
||||
# 1 = Surname
|
||||
# 2 = Name
|
||||
# 3 = Link-Dest
|
||||
interpret_link = mwparser.nodes.wikilink.Wikilink(
|
||||
str(template.get(3).value),
|
||||
str(template.get(1).value) + " " +
|
||||
str(template.get(2).value) )
|
||||
|
||||
# Default Link-Dest [[Surname Name]]
|
||||
else:
|
||||
interpret_link = mwparser.nodes.wikilink.Wikilink(
|
||||
str(template.get(1).value) + " " +
|
||||
str(template.get(2).value) )
|
||||
|
||||
# Replace Template with link
|
||||
self._interpret_raw.replace( template, interpret_link )
|
||||
|
||||
# SortKey
|
||||
else:
|
||||
# Replace SortKey with text from param 2 if present
|
||||
if template.has(2):
|
||||
self._interpret_raw.replace( template,
|
||||
template.get(2).value)
|
||||
# Else Remove SortKey (text should follow behind SortKey)
|
||||
else:
|
||||
self._interpret_raw.replace( template, None)
|
||||
|
||||
# Normally won't be needed as there should be only one
|
||||
# SortKey-Template but ... it's a wiki
|
||||
break
|
||||
|
||||
# Remove whitespace
|
||||
self._interpret_raw = str(self._interpret_raw).strip()
|
||||
else:
|
||||
@@ -409,6 +452,23 @@ missing!" )
|
||||
else:
|
||||
return str(keywords[0])
|
||||
|
||||
def __str__( self ):
    """
    Return a human-readable string representation of this object.

    If ``self.parsed`` is truthy, the string contains the link, revid,
    interpret, titel and chartein attributes; otherwise only the link is
    included.
    """
    # Unparsed objects only know the link they were created for
    if not self.parsed:
        link_only = "CountryList( Link = \"{link}\" )"
        return link_only.format( link=repr(self.wikilink) )

    # Parsed objects report every value extracted from the page
    full_template = (
        "CountryList( Link = \"{link}\", Revid = \"{revid}\", "
        "Interpret = \"{interpret}\", Titel = \"{titel}\", "
        "Chartein = \"{chartein}\" )" )
    fields = {
        "link": repr(self.wikilink),
        "revid": self.revid,
        "interpret": self.interpret,
        "titel": self.titel,
        "chartein": repr(self.chartein),
    }
    return full_template.format( **fields )
|
||||
|
||||
|
||||
class CountryListError( Exception ):
|
||||
"""
|
||||
@@ -422,3 +482,98 @@ class CountryListEntryError( CountryListError ):
|
||||
Handles errors occurring in class CountryList related to entries
|
||||
"""
|
||||
pass
|
||||
|
||||
|
||||
class CountryListUnitTest():
    """
    Test helper for the CountryList module.

    Either parses a single page named by the caller and prints the result
    (manual test), or runs through the predefined ``testcases`` and compares
    the parsed attributes against the expected values (automatic test).
    """

    # Each case maps "Link" to the page to parse; every other key is the
    # name of a CountryList attribute and its expected value after parsing.
    testcases = (
        {
            "Link": mwparser.nodes.Wikilink( "Benutzer:JogoBot/Charts/Tests/Liste der Nummer-eins-Hits in Frankreich (2015)" ),  # noqa
            "revid": 148453827,
            "interpret": "[[Adele (Sängerin)|Adele]]",
            "titel": "[[Hello (Adele-Lied)|Hello]]",
            "chartein": datetime( 2015, 10, 23 ),
        },
        {
            "Link": mwparser.nodes.Wikilink( "Benutzer:JogoBot/Charts/Tests/Liste der Nummer-eins-Hits in Belgien (2015)", "Wallonien"),  # noqa
            "revid": 148455281,
            "interpret": "[[Nicky Jam]] & [[Enrique Iglesias (Sänger)|Enrique Iglesias]]",  # noqa
            "titel": "El perdón",
            "chartein": datetime( 2015, 9, 12 ),
        },
    )

    def __init__( self, page=None ):
        """
        Store the page to test as a wikilink, or None if no page was given.

        @param page: title of the page for a manual test (optional)
        """
        self.page_link = mwparser.nodes.Wikilink( page ) if page else None

    def treat( self ):
        """
        Run the manual test when a page was provided, otherwise run the
        automatic tests against the predefined test cases.
        """
        runner = self.man_test if self.page_link else self.auto_test
        runner()

    def auto_test( self ):
        """
        Run the automatic tests with the predefined test data from the wiki.

        Raises Exception when is_parsing_needed() gives an unexpected answer
        or when a parsed attribute differs from its expected value.
        """
        for expected in type(self).testcases:

            self.countrylist = CountryList( expected["Link"] )
            known_revid = expected["revid"]

            # Must be falsy for the stored revid ...
            if self.countrylist.is_parsing_needed( known_revid ):
                raise Exception(
                    "CountryList.is_parsing_needed() does not work!" )

            # ... and truthy for the next revid
            if not self.countrylist.is_parsing_needed( known_revid + 1 ):
                raise Exception(
                    "CountryList.is_parsing_needed() does not work!" )

            self.countrylist.parse()

            # Compare every expected attribute; "Link" is input, not output
            for attr_name, wanted in expected.items():
                if attr_name == "Link":
                    continue

                actual = getattr( self.countrylist, attr_name )
                if not wanted == actual:
                    raise Exception( attr_name + " – " + str( actual ) )

    def man_test( self ):
        """
        Parse the page given to the constructor and print the result for
        manual inspection.
        """
        self.countrylist = CountryList( self.page_link )
        self.countrylist.parse()

        print( self.countrylist )

        hint = ( "Since we have no data to compare, you need to manually "
                 "check data above against given page to ensure correct "
                 "working of module!" )
        print( hint )
|
||||
|
||||
|
||||
def main(*args):
    """
    Handle direct calls of this module by running the unit test class.

    If a ``-page:<title>`` argument is given, that page is parsed and printed
    for manual inspection. Without it, the predefined automatic test cases of
    CountryListUnitTest are run.

    @param args: command line arguments
    """
    # Process global arguments to determine desired site
    local_args = pywikibot.handle_args(args)

    # Default to None so that calling without "-page:" selects the automatic
    # tests instead of failing on an unassigned local variable
    page = None

    # Parse command line arguments
    for arg in local_args:
        if arg.startswith("-page:"):
            page = arg[ len("-page:"): ]

    # Call unittest-class
    test = CountryListUnitTest( page )
    test.treat()


if __name__ == "__main__":
    main()
|
||||
|
||||
1
jogobot
Submodule
1
jogobot
Submodule
Submodule jogobot added at 2173f2984f
Reference in New Issue
Block a user