summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author: Bryan Newbold <bnewbold@robocracy.org> 2020-03-28 19:57:35 -0700
committer: Bryan Newbold <bnewbold@robocracy.org> 2020-03-28 19:57:41 -0700
commit: 4b75a81cbd0faeefa6a0f04b97ecc6832924ee69 (patch)
tree: e729b83e33cfb686448a24129d010a088e1289dc
parent: 2a3148df02962b84d0409f9f9900324d04404065 (diff)
download: fatcat-4b75a81cbd0faeefa6a0f04b97ecc6832924ee69.tar.gz
fatcat-4b75a81cbd0faeefa6a0f04b97ecc6832924ee69.zip
ingest: more DOI patterns to treat as OA
These are DOI prefix patterns for journals/publishers that we suspect are actually OA, based on the large number of their papers that crawl successfully. The better long-term solution will be to flag containers in some way as OA (or "should crawl"), but this is a good short-term solution.
-rw-r--r-- python/fatcat_tools/workers/changelog.py 26
1 file changed, 26 insertions, 0 deletions
diff --git a/python/fatcat_tools/workers/changelog.py b/python/fatcat_tools/workers/changelog.py
index 5783bbfc..d1e7c2db 100644
--- a/python/fatcat_tools/workers/changelog.py
+++ b/python/fatcat_tools/workers/changelog.py
@@ -110,6 +110,32 @@ class EntityUpdatesWorker(FatcatWorker):
# the lancet (often hybrid OA)
"10.1016/s0140-6736",
"10.1016/s2213-2600",
+ # journal of virology
+ "10.1128/jvi.",
+ # FEBS letters
+ "10.1002/1873-3468.",
+ # Journal of Neuroscience
+ "10.1523/jneurosci.",
+ # Chemical and pharmaceutical bulletin
+ "10.1248/cpb.",
+ # Japanese Journal of Radiological Technology
+ "10.6009/jjrt.",
+ # Seibutsu Butsuri
+ "10.2142/biophys.",
+ # Chemical Communications
+ "10.1039/d0cc",
+ # Yakugaku zasshi
+ "10.1248/yakushi.",
+ # Bulletin of the American Mathematical Society
+ "10.1090/s0002-9904",
+ # Current Biology
+ "10.1016/j.cub.",
+ # Antarctica: A Keystone in a Changing World (USGS Open-File Report series; prefix matches all OFR DOIs)
+ "10.3133/ofr",
+ # Clinical Cancer Research
+ "10.1158/1078-0432.",
+ # Transactions of the Japan Society of Mechanical Engineers
+ "10.1299/kikai",
]
def want_live_ingest(self, release, ingest_request):