aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@robocracy.org> 2019-06-24 14:07:48 -0700
committer: Bryan Newbold <bnewbold@robocracy.org> 2019-06-24 14:07:50 -0700
commit: fa9e3a2e8992779b80877b19090eaf15c8c7bc0e (patch)
tree: 0a1abcdb17b59258591d27d8c78794b5fa93ac6d
parent: 946fe6872e068de0694040bc04bb0ddf5d5c13b6 (diff)
download: fatcat-fa9e3a2e8992779b80877b19090eaf15c8c7bc0e.tar.gz
fatcat-fa9e3a2e8992779b80877b19090eaf15c8c7bc0e.zip
matched importer: urls, not url
This matches the docs in the header. Previous matched imports were using 'cdx' objects with no 'dt' key, but this makes more sense. As far as I know the old 'url' code path was never actually used (or tested, derp).
-rw-r--r-- python/fatcat_tools/importers/matched.py 2
1 file changed, 1 insertion, 1 deletion
diff --git a/python/fatcat_tools/importers/matched.py b/python/fatcat_tools/importers/matched.py
index 3ef617d3..9cbd071f 100644
--- a/python/fatcat_tools/importers/matched.py
+++ b/python/fatcat_tools/importers/matched.py
@@ -96,7 +96,7 @@ class MatchedImporter(EntityImporter):
# parse URLs and CDX
urls = set()
- for url in obj.get('url', []):
+ for url in obj.get('urls', []):
url = make_rel_url(url, default_link_rel=self.default_link_rel)
if url != None:
urls.add(url)