diff options
author | Bryan Newbold <bnewbold@robocracy.org> | 2019-07-30 19:34:52 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@robocracy.org> | 2019-07-30 20:48:54 -0700 |
commit | 6a00a6f4ac3a2d1f029bae6402d1dd117a58416e (patch) | |
tree | 6e5ea9cfabbf8948dd6c48e3d689a97fdeb48313 | |
parent | 31f1f306110035f7283ef507eed0fc863407d3df (diff) | |
download | chocula-6a00a6f4ac3a2d1f029bae6402d1dd117a58416e.tar.gz chocula-6a00a6f4ac3a2d1f029bae6402d1dd117a58416e.zip |
chocula: updated fetches, new ISSN-L and DOAJ files
-rwxr-xr-x | chocula.py | 6 | ||||
-rwxr-xr-x | data/fetch.sh | 11 |
2 files changed, 10 insertions, 7 deletions
@@ -56,13 +56,13 @@ import pycountry ################### File Config -ISSNL_FILE = 'data/20190220.ISSN-to-ISSN-L.txt' +ISSNL_FILE = 'data/20190730.ISSN-to-ISSN-L.txt' ENTREZ_FILE = 'data/entrez-journals.csv' ROAD_FILE = 'data/road-2018-01-24.tsv' ROAD_DATE = '2018-01-24' -DOAJ_FILE = 'data/doaj_20190124.csv' -DOAJ_DATE = '2019-01-24' +DOAJ_FILE = 'data/journalcsv__doaj_20190731_0130_utf8.csv' +DOAJ_DATE = '2019-07-31' CROSSREF_FILE = 'data/doi_titles_file_2019-01-24.csv' SHERPA_ROMEO_JOURNAL_FILE = 'data/romeo-journals.csv' SHERPA_ROMEO_POLICY_FILE = 'data/romeo-policies.csv' diff --git a/data/fetch.sh b/data/fetch.sh index 5d315a7..f55f934 100755 --- a/data/fetch.sh +++ b/data/fetch.sh @@ -9,7 +9,7 @@ wget -c https://archive.org/download/road-issn-2018/road-2018-01-24.tsv wget -c https://archive.org/download/doaj_bulk_metadata_2019/doaj_20190124.csv #wget -c https://archive.org/download/issn_issnl_mappings/20190129.ISSN-to-ISSN-L.txt -wget -c https://archive.org/download/issn_issnl_mappings/20190220.ISSN-to-ISSN-L.txt +wget -c https://archive.org/download/issn_issnl_mappings/20190730.ISSN-to-ISSN-L.txt wget -c https://archive.org/download/crossref_doi_titles/doi_titles_file_2019-01-24.csv @@ -38,7 +38,10 @@ wget -c https://archive.org/download/norwegian_register_journals/2018-03-02%20No #wget -c https://archive.org/download/open_academic_graph_2019/mag_venues.zip #unzip mag_venues.zip -#wget -c https://archive.org/download/szczepanski-oa-journal-list-2018/Jan-Szczepanski-Open-Access-Journals-2018_0.docx -#wget -c https://archive.org/download/szczepanski-oa-journal-list-2018/Jan-Szczepanski-Open-Access-Journals-2018_0.converted.csv - wget -c https://archive.org/download/szczepanski-oa-journal-list-2018/Jan-Szczepanski-Open-Access-Journals-2018_0.fixed.json + +wget -c https://archive.org/download/ezb_snapshot_2019-07-11/ezb_metadata.json +wget -c https://archive.org/download/ISSN-GOLD-OA-3/ISSN_Gold-OA_3.0.csv +wget -c https://archive.org/download/openapc-dataset/apc_de.2019-07-30.csv +wget -c https://archive.org/download/wikidata-journal-metadata/wikidata_journals_sparql.2019-07-30.tsv + |