diff options
author | Sam Wenham <sam@wenhams.co.uk> | 2019-07-11 12:29:38 +0100 |
---|---|---|
committer | Sam Wenham <sam@wenhams.co.uk> | 2019-07-11 12:29:38 +0100 |
commit | a26109cb3006dd64e1bec38100397ad636813e98 (patch) | |
tree | aef17c7a0a75a5123500745e62663a5278a02131 /parsers/logbooks.py | |
parent | 6b5b9a531555f3003af3d829979accf0bc103b18 (diff) | |
download | troggle-a26109cb3006dd64e1bec38100397ad636813e98.tar.gz troggle-a26109cb3006dd64e1bec38100397ad636813e98.tar.bz2 troggle-a26109cb3006dd64e1bec38100397ad636813e98.zip |
Allow bracketed comments next to names in logbooks.
Convert accented characters in names to their unaccented equivalents, since that is what people enter in the logbook.
Diffstat (limited to 'parsers/logbooks.py')
-rw-r--r-- | parsers/logbooks.py | 8 |
1 file changed, 5 insertions, 3 deletions
```diff
diff --git a/parsers/logbooks.py b/parsers/logbooks.py
index 12124ca..e5817a6 100644
--- a/parsers/logbooks.py
+++ b/parsers/logbooks.py
@@ -25,9 +25,10 @@ from utils import save_carefully
 #
 # the logbook loading section
 #
-def GetTripPersons(trippeople, expedition, logtime_underground):
+def GetTripPersons(trippeople, expedition, logtime_underground):
     res = [ ]
     author = None
+    round_bracket_regex = re.compile(r"[\(\[].*?[\)\]]")
     for tripperson in re.split(r",|\+|&|&(?!\w+;)| and ", trippeople):
         tripperson = tripperson.strip()
         mul = re.match(r"<u>(.*?)</u>$(?i)", tripperson)
@@ -35,6 +36,7 @@ def GetTripPersons(trippeople, expedition, logtime_underground):
             tripperson = mul.group(1).strip()
         if tripperson and tripperson[0] != '*':
             #assert tripperson in personyearmap, "'%s' << %s\n\n %s" % (tripperson, trippeople, personyearmap)
+            tripperson = re.sub(round_bracket_regex, "", tripperson).strip()
             personyear = GetPersonExpeditionNameLookup(expedition).get(tripperson.lower())
             if not personyear:
                 print(" - No name match for: '%s'" % tripperson)
@@ -172,8 +174,8 @@ def Parseloghtmltxt(year, expedition, txt):
         tripid, tripid1, tripdate, trippeople, triptitle, triptext, tu = s.groups()
         ldate = ParseDate(tripdate.strip(), year)
         #assert tripid[:-1] == "t" + tripdate, (tripid, tripdate)
-        #trippeople = re.sub(r"Ol(?!l)", "Olly", trippeople)
-        #trippeople = re.sub(r"Wook(?!e)", "Wookey", trippeople)
+        #trippeople = re.sub(r"Ol(?!l)", "Olly", trippeople)
+        #trippeople = re.sub(r"Wook(?!e)", "Wookey", trippeople)
         triptitles = triptitle.split(" - ")
         if len(triptitles) >= 2:
             tripcave = triptitles[0]
```