aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@robocracy.org> 2019-02-20 18:30:49 -0800
committer Bryan Newbold <bnewbold@robocracy.org> 2019-02-20 18:30:49 -0800
commit 57ce552a090fbb75ae150c83356ce86656f6432d (patch)
tree 8e6561adbe0aef748bd335c8fa3e06bc7a128a9c
parent 1f534e74c5b16efb47095d5d04d3cd515156c95d (diff)
download chocula-57ce552a090fbb75ae150c83356ce86656f6432d.tar.gz
chocula-57ce552a090fbb75ae150c83356ce86656f6432d.zip
update ISSN-L file
-rwxr-xr-x data/fetch.sh 6
-rwxr-xr-x parse_merge_metadata.py 2
2 files changed, 6 insertions, 2 deletions
diff --git a/data/fetch.sh b/data/fetch.sh
index b56a94e..c289a20 100755
--- a/data/fetch.sh
+++ b/data/fetch.sh
@@ -8,7 +8,8 @@ wget -c https://archive.org/download/road-issn-2018/road-2018-01-24.tsv
wget -c https://archive.org/download/doaj_bulk_metadata_2019/doaj_20190124.csv
-wget -c https://archive.org/download/issn_issnl_mappings/20190129.ISSN-to-ISSN-L.txt
+#wget -c https://archive.org/download/issn_issnl_mappings/20190129.ISSN-to-ISSN-L.txt
+wget -c https://archive.org/download/issn_issnl_mappings/20190220.ISSN-to-ISSN-L.txt
wget -c https://archive.org/download/crossref_doi_titles/doi_titles_file_2019-01-24.csv
@@ -34,5 +35,8 @@ wget -c https://archive.org/download/SerialsOnMicrofilmCollection/MASTER%20TITLE
wget -c https://archive.org/download/norwegian_register_journals/2018-03-02%20Norwegian%20Register%20for%20Scientific%20Journals%20and%20Series.csv
+#wget -c https://archive.org/download/open_academic_graph_2019/mag_venues.zip
+#unzip mag_venues.zip
+
#wget -c https://archive.org/download/szczepanski-oa-journal-list-2018/Jan-Szczepanski-Open-Access-Journals-2018_0.docx
#wget -c https://archive.org/download/szczepanski-oa-journal-list-2018/Jan-Szczepanski-Open-Access-Journals-2018_0.converted.csv
diff --git a/parse_merge_metadata.py b/parse_merge_metadata.py
index c008fd1..bb43bcb 100755
--- a/parse_merge_metadata.py
+++ b/parse_merge_metadata.py
@@ -5,7 +5,7 @@ import ftfy
import pycountry
from collections import Counter
-ISSNL_FILE = 'data/20190129.ISSN-to-ISSN-L.txt'
+ISSNL_FILE = 'data/20190220.ISSN-to-ISSN-L.txt'
ENTREZ_FILE = 'data/entrez-journals.csv'
ROAD_FILE = 'data/road-2018-01-24.tsv'