diff options
author | Bryan Newbold <bnewbold@archive.org> | 2020-05-21 20:24:12 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2020-05-21 20:24:12 -0700 |
commit | 383349341a09f9d05f58b6104064af7b0c89dcc1 (patch) | |
tree | 344797bb1fb1c43fb116013ba23a96de7c090389 /fatcat_scholar/work_pipeline.py | |
parent | fee17cf6518e13b6f1c3945dd769aba56d7606d5 (diff) | |
download | fatcat-scholar-383349341a09f9d05f58b6104064af7b0c89dcc1.tar.gz fatcat-scholar-383349341a09f9d05f58b6104064af7b0c89dcc1.zip |
handle petabox read timeouts a bit
Diffstat (limited to 'fatcat_scholar/work_pipeline.py')
-rw-r--r-- | fatcat_scholar/work_pipeline.py | 7 |
1 files changed, 6 insertions, 1 deletions
diff --git a/fatcat_scholar/work_pipeline.py b/fatcat_scholar/work_pipeline.py
index 363535c..f0c0e6f 100644
--- a/fatcat_scholar/work_pipeline.py
+++ b/fatcat_scholar/work_pipeline.py
@@ -3,6 +3,7 @@ import os
 import io
 import sys
 import minio
+import requests
 import argparse
 from pydantic import BaseModel, validator
 from typing import List, Dict, Tuple, Optional, Any, Sequence
@@ -255,7 +256,11 @@ class WorkPipeline():
             if not sim_pub:
                 continue
             # XXX: control flow tweak?
-            sim_fulltext = self.fetch_sim(sim_issue, sim_pub, release.pages, release.ident)
+            try:
+                sim_fulltext = self.fetch_sim(sim_issue, sim_pub, release.pages, release.ident)
+            except requests.exceptions.ReadTimeout as e:
+                print(str(e), file=sys.stderr)
+                continue
             if sim_fulltext:
                 break