summaryrefslogtreecommitdiffstats
path: root/parsers/logbooks.py
diff options
context:
space:
mode:
Diffstat (limited to 'parsers/logbooks.py')
-rw-r--r--parsers/logbooks.py12
1 files changed, 12 insertions, 0 deletions
diff --git a/parsers/logbooks.py b/parsers/logbooks.py
index 2ede83f..3d96b3b 100644
--- a/parsers/logbooks.py
+++ b/parsers/logbooks.py
@@ -139,6 +139,18 @@ def GetTripPersons(trippeople, expedition, logtime_underground, tid=None):
# print(f'# {tid}')
# print(f" - {tid} '{trippeople}' ")
+ """
+ re.split(r",|\+|&|&(?!\w+;)| and ", trippeople)
+
+ , : The comma character
+ \+ : The plus sign (+); escaped to treat as a literal character
+ & : The literal string "&" (HTML-encoded ampersand)
+ &(?!\w+;) : An ampersand (&) not followed by one or more word characters (\w+) and a semicolon (;)
+ : Uses negative lookahead assertion (?!...) to ensure it's not part of an HTML entity like " "
+ and : The literal string " and " (with spaces before and after)
+
+ This will split the 'trippeople' string at any of these delimiters.
+ """
for tripperson in re.split(r",|\+|&|&(?!\w+;)| and ", trippeople):
tripperson = tripperson.strip()
# author_u = re.match(r"(?i)<u>(.*?)</u>$", tripperson)