diff options
author | Bryan Newbold <bnewbold@robocracy.org> | 2019-06-24 14:07:48 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@robocracy.org> | 2019-06-24 14:07:50 -0700 |
commit | fa9e3a2e8992779b80877b19090eaf15c8c7bc0e (patch) | |
tree | 0a1abcdb17b59258591d27d8c78794b5fa93ac6d | |
parent | 946fe6872e068de0694040bc04bb0ddf5d5c13b6 (diff) | |
download | fatcat-fa9e3a2e8992779b80877b19090eaf15c8c7bc0e.tar.gz fatcat-fa9e3a2e8992779b80877b19090eaf15c8c7bc0e.zip |
matched importer: urls, not url
This matches the docs in the header. Previous matched imports were using
'cdx' objects with no 'dt' key, but this makes more sense. As far as I
know the old 'url' code path was never actually used (or tested, derp).
-rw-r--r-- | python/fatcat_tools/importers/matched.py | 2 |
1 file changed, 1 insertion, 1 deletion
diff --git a/python/fatcat_tools/importers/matched.py b/python/fatcat_tools/importers/matched.py
index 3ef617d3..9cbd071f 100644
--- a/python/fatcat_tools/importers/matched.py
+++ b/python/fatcat_tools/importers/matched.py
@@ -96,7 +96,7 @@ class MatchedImporter(EntityImporter):
         # parse URLs and CDX
         urls = set()
-        for url in obj.get('url', []):
+        for url in obj.get('urls', []):
             url = make_rel_url(url, default_link_rel=self.default_link_rel)
             if url != None:
                 urls.add(url)