about | summary | refs | log | tree | commit | diff | stats
path: root/fatcat_scholar/hacks.py
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2021-06-11 15:13:17 -0700
committer Bryan Newbold <bnewbold@archive.org> 2021-06-11 15:13:17 -0700
commit 388eeaf4fa137522ec90c96e57581ced33205e57 (patch)
tree ea6832c4fe8026373e9c3b712e1b68687d7e8eb6 /fatcat_scholar/hacks.py
parent 3bae05c4a4cd7d6d9b892b952b7ca35454319479 (diff)
download fatcat-scholar-388eeaf4fa137522ec90c96e57581ced33205e57.tar.gz
fatcat-scholar-388eeaf4fa137522ec90c96e57581ced33205e57.zip
update citation_pdf_url HTML meta tag to new access URL style
Diffstat (limited to 'fatcat_scholar/hacks.py')
-rw-r--r-- fatcat_scholar/hacks.py 29
1 files changed, 18 insertions, 11 deletions
diff --git a/fatcat_scholar/hacks.py b/fatcat_scholar/hacks.py
index 0f16fc7..e7d4566 100644
--- a/fatcat_scholar/hacks.py
+++ b/fatcat_scholar/hacks.py
@@ -126,15 +126,14 @@ def test_wayback_direct_url() -> None:
)
-def make_access_redirect_url(access_type: str, access_url: str) -> str:
+def make_access_redirect_url(work_ident: str, access_type: str, access_url: str) -> str:
if access_type == "wayback" and "://web.archive.org/" in access_url:
segments = access_url.split("/")
- dt = segments[4]
original_url = "/".join(segments[5:])
- return f"https://scholar.archive.org/access/wayback/{dt}/{original_url}"
+ return f"https://scholar.archive.org/work/{work_ident}/access/wayback/{original_url}"
elif access_type == "ia_file" and "://archive.org/download/" in access_url:
suffix = "/".join(access_url.split("/")[4:])
- return f"https://scholar.archive.org/access/ia_file/{suffix}"
+ return f"https://scholar.archive.org/work/{work_ident}/access/ia_file/{suffix}"
else:
return access_url
@@ -142,31 +141,39 @@ def make_access_redirect_url(access_type: str, access_url: str) -> str:
def test_make_access_redirect_url() -> None:
assert (
make_access_redirect_url(
- "wayback", "https://web.archive.org/web/1234/http://fatcat.wiki/thing.pdf"
+ "lmobci36t5aelogzjsazuwxpie",
+ "wayback",
+ "https://web.archive.org/web/1234/http://fatcat.wiki/thing.pdf",
)
- == "https://scholar.archive.org/access/wayback/1234/http://fatcat.wiki/thing.pdf"
+ == "https://scholar.archive.org/work/lmobci36t5aelogzjsazuwxpie/access/wayback/http://fatcat.wiki/thing.pdf"
)
assert (
make_access_redirect_url(
+ "lmobci36t5aelogzjsazuwxpie",
"wayback",
"https://web.archive.org/web/1234/http://fatcat.wiki/thing.pdf?param=asdf",
)
- == "https://scholar.archive.org/access/wayback/1234/http://fatcat.wiki/thing.pdf?param=asdf"
+ == "https://scholar.archive.org/work/lmobci36t5aelogzjsazuwxpie/access/wayback/http://fatcat.wiki/thing.pdf?param=asdf"
)
assert (
make_access_redirect_url(
- "ia_file", "https://archive.org/download/something/file.pdf"
+ "lmobci36t5aelogzjsazuwxpie",
+ "ia_file",
+ "https://archive.org/download/something/file.pdf",
)
- == "https://scholar.archive.org/access/ia_file/something/file.pdf"
+ == "https://scholar.archive.org/work/lmobci36t5aelogzjsazuwxpie/access/ia_file/something/file.pdf"
)
assert (
- make_access_redirect_url("blah", "https://mit.edu/file.pdf")
+ make_access_redirect_url(
+ "lmobci36t5aelogzjsazuwxpie", "blah", "https://mit.edu/file.pdf"
+ )
== "https://mit.edu/file.pdf"
)
assert (
make_access_redirect_url(
+ "lmobci36t5aelogzjsazuwxpie",
"wayback",
"https://web.archive.org/web/20170811115414/http://sudjms.net/issues/5-4/pdf/8)A%20comparison%20study%20of%20histochemical%20staining%20of%20various%20tissues%20after.pdf",
)
- == "https://scholar.archive.org/access/wayback/20170811115414/http://sudjms.net/issues/5-4/pdf/8)A%20comparison%20study%20of%20histochemical%20staining%20of%20various%20tissues%20after.pdf"
+ == "https://scholar.archive.org/work/lmobci36t5aelogzjsazuwxpie/access/wayback/http://sudjms.net/issues/5-4/pdf/8)A%20comparison%20study%20of%20histochemical%20staining%20of%20various%20tissues%20after.pdf"
)