4 Commits

Author SHA1 Message Date
33b2e47312 Describe version test-v7 2017-10-28 22:43:53 +02:00
3bd17ce692 Merge branch 'fs#160-urlencoded-chars' into develop 2017-10-28 22:36:55 +02:00
5f4640d5ff Replace urlencoded chars with unicode equivalent
Otherwise we get value errors while marking, since pwb replaces those urlencoded chars

Related Task: [FS#160](https://fs.golderweb.de/index.php?do=details&task_id=160)
2017-10-28 22:35:25 +02:00
7e0456ae4f Merge branch 'test-v6' back into develop 2017-10-28 22:34:30 +02:00
2 changed files with 7 additions and 1 deletions

View File

@@ -18,10 +18,12 @@ Those can be installed using pip and the _requirements.txt_ file provided with t
Versions Versions
-------- --------
* test-v7
- Fixed problem with URL-encoded chars in article title
* test-v6 * test-v6
- jogobot status API enabled (Bot can be disabled onwiki) - jogobot status API enabled (Bot can be disabled onwiki)
- Fixed Problem with space between article title and anchor - Fixed problem with space between article title and anchor
* test-v5 * test-v5
- Feature _markpages_ working in full-automatic mode with _always_-flag - Feature _markpages_ working in full-automatic mode with _always_-flag

View File

@@ -28,6 +28,7 @@ Provides classes for working with RedFams
import hashlib import hashlib
import locale import locale
import re import re
import urllib.parse
from datetime import datetime from datetime import datetime
import mwparserfromhell as mwparser # noqa import mwparserfromhell as mwparser # noqa
@@ -291,6 +292,9 @@ class RedFamParser( RedFam ):
# Make sure first letter is uppercase # Make sure first letter is uppercase
article = article[0].upper() + article[1:] article = article[0].upper() + article[1:]
# Unquote possible url encoded special chars
article = urllib.parse.unquote( article )
# Split in title and anchor part # Split in title and anchor part
article = article.split("#", 1) article = article.split("#", 1)
# Replace underscores in title with spaces # Replace underscores in title with spaces