diff --git a/prepare_tei.py b/prepare_tei.py index f99fcf4..f618684 100644 --- a/prepare_tei.py +++ b/prepare_tei.py @@ -88,6 +88,10 @@ def convert_citations(string): """ + inline_citation_pattern = re.compile(r"(§|§|§)(§|§|§)(?P.+?)(\!(?P.*?))?(§|§|§)(§|§|§)") + inline_citations = re.findall(inline_citation_pattern, string) + logging.info("Found %s inline citations." % len(inline_citations)) + string = re.sub(inline_citation_pattern, r"", string) citation_pattern = re.compile(r"(§|§|§)(?P.+?)(\!(?P.*?))?(§|§|§)") citations = re.findall(citation_pattern, string)