summary | refs | log | tree | commit | diff | stats
path: root/python/fatcat_tools/importers
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@robocracy.org> 2020-02-14 00:12:23 -0800
committer: Bryan Newbold <bnewbold@robocracy.org> 2020-02-14 00:12:23 -0800
commit: 016d6d28c24f616897bdb7587205cfe2cc32ec89 (patch)
tree: 9245e8501418abbb8dc13abe553c103dae27bfaa /python/fatcat_tools/importers
parent: fd86c5ac74512a92bc5cbe25f8ec1f963d6cc1e6 (diff)
download: fatcat-016d6d28c24f616897bdb7587205cfe2cc32ec89.tar.gz
download: fatcat-016d6d28c24f616897bdb7587205cfe2cc32ec89.zip
remove arabesque short wayback URL hack
Diffstat (limited to 'python/fatcat_tools/importers')
-rw-r--r-- python/fatcat_tools/importers/shadow.py | 6
1 file changed, 0 insertions, 6 deletions
diff --git a/python/fatcat_tools/importers/shadow.py b/python/fatcat_tools/importers/shadow.py
index 1a76299e..4cd22775 100644
--- a/python/fatcat_tools/importers/shadow.py
+++ b/python/fatcat_tools/importers/shadow.py
@@ -155,12 +155,6 @@ class ShadowLibraryImporter(EntityImporter):
if u.rel == 'social':
u.rel = 'academicsocial'
- # new wayback URLs, could replace bad old short wayback URLs (from arabesque bug)
- new_wb_urls = [u.url for u in fe.urls]
- new_short_wb_urls = ['https://web.archive.org/web/{}/{}'.format(
- u.split('/')[4][:12], '/'.join(u.split('/')[5:])) for u in new_wb_urls]
- existing.urls = [u for u in existing.urls if not u.url in new_short_wb_urls]
-
# merge the existing into this one and update
merged_urls = {}
for u in fe.urls + existing.urls: