Merge branch 'fs#160-urlencoded-chars' into develop

This commit is contained in:
2017-10-28 22:36:55 +02:00

View File

@@ -28,6 +28,7 @@ Provides classes for working with RedFams
 import hashlib
 import locale
 import re
+import urllib.parse
 from datetime import datetime
 import mwparserfromhell as mwparser # noqa
@@ -291,6 +292,9 @@ class RedFamParser( RedFam ):
 # Make sure first letter is uppercase
 article = article[0].upper() + article[1:]
+# Unquote possible url encoded special chars
+article = urllib.parse.unquote( article )
 # Split in title and anchor part
 article = article.split("#", 1)
 # Replace underscores in title with spaces