diff options
author | Bryan Newbold <bnewbold@robocracy.org> | 2021-11-02 18:14:43 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@robocracy.org> | 2021-11-02 18:14:43 -0700 |
commit | 9dc891b8098542bb089c8c47098b60a8beb76a53 (patch) | |
tree | 2c9b1c569b6b9bb4041ef51076d024b6980089c5 /python/fatcat_web/hacks.py | |
parent | 6464631dbe5c4afeb76f2f3c9d63b89f917c9a3b (diff) | |
download | fatcat-9dc891b8098542bb089c8c47098b60a8beb76a53.tar.gz fatcat-9dc891b8098542bb089c8c47098b60a8beb76a53.zip |
fmt (black): fatcat_web/
Diffstat (limited to 'python/fatcat_web/hacks.py')
-rw-r--r-- | python/fatcat_web/hacks.py | 12 |
1 files changed, 9 insertions, 3 deletions
```diff
diff --git a/python/fatcat_web/hacks.py b/python/fatcat_web/hacks.py
index 9e6f6ab5..06350b41 100644
--- a/python/fatcat_web/hacks.py
+++ b/python/fatcat_web/hacks.py
@@ -1,17 +1,23 @@
-
 import re
 
 STRIP_EXTLINK_XML_RE = re.compile(r"<ext-link.*xlink:type=\"simple\">")
 
+
 def strip_extlink_xml(unstr):
     unstr = unstr.replace("</ext-link>", "")
     unstr = STRIP_EXTLINK_XML_RE.sub("", unstr)
     return unstr
 
+
 def test_strip_extlink_xml():
     assert strip_extlink_xml("asdf") == "asdf"
-    assert strip_extlink_xml("""LOCKSS (2014) Available: <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="http://lockss.org/" xlink:type="simple">http://lockss.org/</ext-link>. Accessed: 2014 November 1.""") == \
-        """LOCKSS (2014) Available: http://lockss.org/. Accessed: 2014 November 1."""
+    assert (
+        strip_extlink_xml(
+            """LOCKSS (2014) Available: <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:href="http://lockss.org/" xlink:type="simple">http://lockss.org/</ext-link>. Accessed: 2014 November 1."""
+        )
+        == """LOCKSS (2014) Available: http://lockss.org/. Accessed: 2014 November 1."""
+    )
+
 
 def wayback_suffix(entity):
     """
```