diff --git a/fix_tei.py b/fix_tei.py index 9143e4e..da65d39 100644 --- a/fix_tei.py +++ b/fix_tei.py @@ -106,6 +106,7 @@ def convert_citations(string): """ citations = [] + # BUG: a dot as in 197f. is not recognized! year_citations_pattern = re.compile(r"(§|§|§)(§|§|§)(?P.+?)(\!(?P.*?))?(§|§|§)(§|§|§)") year_citations = re.findall(year_citations_pattern, string) logging.info("Found %s year citations." % len(year_citations))