Skip to content

Commit

Permalink
Rudimentary index handling
Browse files Browse the repository at this point in the history
kthoden committed Mar 4, 2020
1 parent a76d0f5 commit 3e2e66f
Showing 1 changed file with 23 additions and 3 deletions.
26 changes: 23 additions & 3 deletions src/tei2imxml.py
Original file line number Diff line number Diff line change
@@ -1085,11 +1085,31 @@ def handle_refs_default(ref):
############
# Indexing #
############
# Convert TEI index markers into EOA index elements. Example input:
# <index indexName="person"><term corresp="https://www.wikidata.org/wiki/Q6882">James Joyce</term></index>
index_entries = xml_tree.xpath("//t:body//t:index", namespaces=NS_MAP)
for entry in index_entries:
    # The "keyword" index uses the bare tag name "EOAindex"; any other
    # index type is appended to it (e.g. "person" -> "EOAindexperson").
    index_type = entry.get("indexName")
    tagname = "EOAindex"
    if index_type != "keyword":
        # NOTE(review): raises TypeError when indexName is absent
        # (index_type is None) -- confirm the attribute is always set.
        tagname += index_type
    entry.tag = tagname
    # clear() below wipes the element, so keep the tail to restore it.
    entry_tail = entry.tail
    entry_content = entry.find("t:term", namespaces=NS_MAP)
    # get() returns None (it does not raise) when the attribute is missing,
    # so normalise both "no <term>" and "no sortKey" to an empty string.
    sortkey = ""
    if entry_content is not None:
        sortkey = entry_content.get("sortKey") or ""
    if sortkey:
        print("sortkey found")
        # The sort key is prepended to the entry text, separated by "@".
        entry_text = f"{sortkey}@"
    else:
        print("no sortkey")
        entry_text = ""
    # markup ignored for now
    # NOTE(review): entry_content is None when the entry has no <term>
    # child -- confirm libeoaconvert.gettext copes with that.
    entry_text += libeoaconvert.gettext(entry_content)
    # re-assemble
    entry.clear()
    entry.text = entry_text
    entry.tail = entry_tail

########
# Math #

0 comments on commit 3e2e66f

Please sign in to comment.