diff options
Diffstat (limited to 'parsers/logbooks.py')
-rw-r--r-- | parsers/logbooks.py | 12 |
1 files changed, 12 insertions, 0 deletions
diff --git a/parsers/logbooks.py b/parsers/logbooks.py index 2ede83f..3d96b3b 100644 --- a/parsers/logbooks.py +++ b/parsers/logbooks.py @@ -139,6 +139,18 @@ def GetTripPersons(trippeople, expedition, logtime_underground, tid=None): # print(f'# {tid}') # print(f" - {tid} '{trippeople}' ") + """ + re.split(r",|\+|&amp;|&(?!\w+;)| and ", trippeople) + + , : The comma character + \+ : The plus sign (+); escaped to treat as a literal character + &amp; : The literal string "&amp;" (HTML-encoded ampersand) + &(?!\w+;) : An ampersand (&) not followed by one or more word characters (\w+) and a semicolon (;) + : Uses negative lookahead assertion (?!...) to ensure it's not part of an HTML entity like "&nbsp;" + and : The literal string " and " (with spaces before and after) + + This will split the 'trippeople' string at any of these delimiters. + """ for tripperson in re.split(r",|\+|&amp;|&(?!\w+;)| and ", trippeople): tripperson = tripperson.strip() # author_u = re.match(r"(?i)<u>(.*?)</u>$", tripperson) |