From 8b7dc5dbf28915b4f5efa0558aa75047a3d45c7a Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?GOLDERWEB=20=E2=80=93=20Jonathan=20Golder?= Date: Fri, 11 Sep 2015 16:18:46 +0200 Subject: [PATCH] Improve sectionheading regex to reduce false positives, require at least two links --- red_fam.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/red_fam.py b/red_fam.py index ba550e3..2215dc6 100644 --- a/red_fam.py +++ b/red_fam.py @@ -62,7 +62,7 @@ class RED_FAM_PARSER( RED_FAM ): __timestamp_format2 = "%H:%M, %d. %b %Y (%Z)" # Catch missing point after month abreviation # Define section heading re.pattern - __sectionhead_pat = re.compile( r"={3,4}[^=]*={3,4}" ) + __sectionhead_pat = re.compile( r"^=+.*\[\[.+\]\].*\[\[.+\]\].*=+$" ) # Define timestamp re.pattern __timestamp_pat = re.compile( r"\d{2}:\d{2}, (\d{1,2}. (Jan|Feb|Mär|Apr|Mai|Jun|Jul|Aug|Sep|Okt|Nov|Dez).? \d{4}) \(CES?T\)" )