summary | refs | log | tree | commit | diff | stats
path: root/parsers/logbooks.py
diff options
context:
space:
mode:
Diffstat (limited to 'parsers/logbooks.py')
-rw-r--r-- parsers/logbooks.py 16
1 files changed, 10 insertions, 6 deletions
diff --git a/parsers/logbooks.py b/parsers/logbooks.py
index 11cd70f..aa4ec92 100644
--- a/parsers/logbooks.py
+++ b/parsers/logbooks.py
@@ -52,10 +52,10 @@ data for old logbooks. New design needed, with a mechanism for flagging fixtures
'''
MAX_LOGBOOK_ENTRY_TITLE_LENGTH = 200
BLOG_PARSER_SETTINGS = {
-# "2017": ("ukcavingblog.html", "parser_blog"), # now folded in to logbooks.html
- "2018": ("ukcavingblog.html", "parser_blog"),
+# "2022": ("ukcavingblog.html", "parser_blog"),
"2019": ("ukcavingblog.html", "parser_blog"),
- "2022": ("ukcavingblog.html", "parser_blog"),
+ "2018": ("ukcavingblog.html", "parser_blog"),
+# "2017": ("ukcavingblog.html", "parser_blog"), # now folded in to logbooks.html
}
DEFAULT_LOGBOOK_FILE = "logbook.html"
DEFAULT_LOGBOOK_PARSER = "parser_html"
@@ -86,7 +86,7 @@ LOGBOOK_PARSER_SETTINGS = {
"1982": ("log.htm", "parser_html_01"),
}
-entries = { "2022": 64, "2019": 56, "2018": 75, "2017": 76, "2016": 81, "2015": 79,
+entries = { "2022": 86, "2019": 56, "2018": 86, "2017": 76, "2016": 83, "2015": 79,
"2014": 65, "2013": 51, "2012": 75, "2011": 68, "2010": 22, "2009": 53,
"2008": 49, "2007": 113, "2006": 60, "2005": 55, "2004": 76, "2003": 42, "2002": 31,
"2001": 48, "2000": 54, "1999": 79, "1998": 43, "1997": 53, "1996": 95, "1995": 42,
@@ -510,7 +510,7 @@ def parser_blog(year, expedition, txt, sq=""):
tu = 0
logbook_entry_count = 0
for i in range(0, len(tripparas)):
- trippara = tripparas[i]
+ tripcontent = tripparas[i]
triphead = tripheads[i]
logbook_entry_count += 1
tid = set_trip_id(year,logbook_entry_count) +"_blog" + sq
@@ -550,7 +550,11 @@ def parser_blog(year, expedition, txt, sq=""):
# tripname must have the location then a hyphen at the beginning as it is ignored by export function
location = "Unknown"
tripname = f"Expo - UK Caving Blog{sq} post {logbook_entry_count}" # must be unique for a given date
- tripcontent = f"\n\nBlog Author: {trippeople}" + trippara
+ tripcontent = re.sub(r"(width=\"\d+\")","",tripcontent)
+ tripcontent = re.sub(r"height=\"\d+\"","",tripcontent)
+ tripcontent = re.sub(r"width: \d+px","",tripcontent)
+ tripcontent = re.sub(r"\n\n+","\n\n",tripcontent)
+ tripcontent = f"\n\nBlog Author: {trippeople}" + tripcontent
entrytuple = (tripdate, location, tripname, tripcontent,
trippeople, expedition, tu, tid)