Speed up docx parsing by caching xpaths

2025-06-23 15:30:45 -04:00 · 2013-05-11 17:34:20 +05:30 · 2013-05-11 17:34:20 +05:30 · fab6e1ce7f
commit fab6e1ce7f
parent 90374d24c4
1 changed file with 6 additions and 1 deletion
--- a/src/calibre/ebooks/docx/names.py
+++ b/src/calibre/ebooks/docx/names.py
@@ -45,8 +45,13 @@ namespaces = {
    'dcterms': 'http://purl.org/dc/terms/'
 }

+xpath_cache = {}
+
 def XPath(expr):
-    return X(expr, namespaces=namespaces)
+    ans = xpath_cache.get(expr, None)
+    if ans is None:
+        xpath_cache[expr] = ans = X(expr, namespaces=namespaces)
+    return ans

 def is_tag(x, q):
    tag = getattr(x, 'tag', x)