diff options
author | Bryan Newbold <bnewbold@archive.org> | 2020-02-19 11:52:25 -0800 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2020-02-19 11:52:25 -0800 |
commit | af051a2f401b97919d5e073f0962d4147fbfac8b (patch) | |
tree | 831cf5f8cbc50643d22d4c7faa21f6d4085fdbe5 /python/sandcrawler/db.py | |
parent | e6f2a585868b0277145659b9d653a0288f76f5b6 (diff) | |
download | sandcrawler-af051a2f401b97919d5e073f0962d4147fbfac8b.tar.gz sandcrawler-af051a2f401b97919d5e073f0962d4147fbfac8b.zip |
pdf_trio persist fixes from prod
Diffstat (limited to 'python/sandcrawler/db.py')
-rw-r--r-- | python/sandcrawler/db.py | 8 |
1 file changed, 4 insertions, 4 deletions
```diff
diff --git a/python/sandcrawler/db.py b/python/sandcrawler/db.py
index 673912c..03cc15f 100644
--- a/python/sandcrawler/db.py
+++ b/python/sandcrawler/db.py
@@ -219,10 +219,10 @@ class SandcrawlerPostgresClient:
                 d['status'],
                 d.get('versions', {}).get('pdftrio_version') or None,
                 d.get('versions', {}).get('models_date') or None,
-                d.get('ensemble_score') or None,
-                d.get('bert_score') or None,
-                d.get('linear_score') or None,
-                d.get('image_score') or None,
+                d.get('ensemble_score'),
+                d.get('bert_score'),
+                d.get('linear_score'),
+                d.get('image_score'),
             )
             for d in batch]
         # filter out duplicate rows by key (sha1hex)
```