diff options
author | Bryan Newbold <bnewbold@archive.org> | 2020-01-21 10:59:27 -0800 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2020-01-21 10:59:27 -0800 |
commit | a1b44161e206873be30c0640f5fab7a284023ba1 (patch) | |
tree | 9c5f2aa24a6d000e803b19427eb8a66730cd72be /python/sandcrawler/db.py | |
parent | fb7717ae410f72ff33017c176f64dff556b86f5b (diff) | |
download | sandcrawler-a1b44161e206873be30c0640f5fab7a284023ba1.tar.gz sandcrawler-a1b44161e206873be30c0640f5fab7a284023ba1.zip |
persist: work around GROBID timeouts with no status_code
Diffstat (limited to 'python/sandcrawler/db.py')
-rw-r--r-- | python/sandcrawler/db.py | 2 |
1 files changed, 1 insertions, 1 deletions
diff --git a/python/sandcrawler/db.py b/python/sandcrawler/db.py
index 3ec325e..e1414ba 100644
--- a/python/sandcrawler/db.py
+++ b/python/sandcrawler/db.py
@@ -161,7 +161,7 @@ class SandcrawlerPostgresClient:
                 r['metadata'] = json.dumps(r['metadata'], sort_keys=True)
         batch = [(d['key'],
                   d.get('grobid_version') or None,
-                  d['status_code'],
+                  d.get('status_code') or None,
                   d['status'],
                   d.get('fatcat_release') or None,
                   d.get('updated') or datetime.datetime.now(),