diff options
author | Bryan Newbold <bnewbold@archive.org> | 2020-04-01 15:27:25 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2020-04-01 15:27:25 -0700 |
commit | 485c8b8432d839bb3cc0bd67152adda4bbf0df20 (patch) | |
tree | be8b0b11c3a9ec722366945bcd880245222cc6c7 /bin/parse_cord19_csv.py | |
parent | 7f30c43cd4955d596ebc51a56aea7996b1005e47 (diff) | |
download | fatcat-covid19-485c8b8432d839bb3cc0bd67152adda4bbf0df20.tar.gz fatcat-covid19-485c8b8432d839bb3cc0bd67152adda4bbf0df20.zip |
move scripts/ to bin/
Diffstat (limited to 'bin/parse_cord19_csv.py')
-rwxr-xr-x | bin/parse_cord19_csv.py | 15 |
1 files changed, 15 insertions, 0 deletions
```diff
diff --git a/bin/parse_cord19_csv.py b/bin/parse_cord19_csv.py
new file mode 100755
index 0000000..536e5d3
--- /dev/null
+++ b/bin/parse_cord19_csv.py
@@ -0,0 +1,15 @@
+#!/usr/bin/env python3
+
+import sys
+import csv
+import json
+
+CSVFILE = sys.argv[1]
+
+with open(CSVFILE, newline='') as csvfile:
+    reader = csv.DictReader(csvfile)
+    for row in reader:
+        row = dict(row)
+        row['mag_id'] = row.pop('Microsoft Academic Paper ID')
+        row['who_covidence_id'] = row.pop('WHO #Covidence').replace('#', '')
+        print(json.dumps(row, sort_keys=True))
```