index
:
sandcrawler
bnewbold-args
bnewbold-backfill
bnewbold-persist-grobid-errors
bnewbold-refactor-loggging
master
trawler
[no description]
about
summary
refs
log
tree
commit
diff
stats
log msg
author
committer
range
path:
root
/
notes
/
ingest
Mode
Name
Size
-rw-r--r--
.gitignore
13
log
stats
plain
-rw-r--r--
2019-10-23_testing.md
219
log
stats
plain
-rw-r--r--
2020-01-14_bulk.md
1533
log
stats
plain
-rw-r--r--
2020-02-04_ingest_backfills.md
7888
log
stats
plain
-rw-r--r--
2020-02-18_ingest_backfills.md
1870
log
stats
plain
-rw-r--r--
2020-02-21_ingest_backfills.md
6096
log
stats
plain
-rw-r--r--
2020-02-22_fixed_domain.txt
13352
log
stats
plain
-rw-r--r--
2020-02_unpaywall.md
28454
log
stats
plain
-rw-r--r--
2020-03-02_ingests.txt
8092
log
stats
plain
-rw-r--r--
2020-03-oa_but_not_marked.md
1040
log
stats
plain
-rw-r--r--
2020-03_mag.md
25212
log
stats
plain
-rw-r--r--
2020-03_s2.md
1781
log
stats
plain
-rw-r--r--
2020-04-13_covid19.md
3312
log
stats
plain
-rw-r--r--
2020-04_datacite.md
6086
log
stats
plain
-rw-r--r--
2020-04_unpaywall.md
14468
log
stats
plain
-rw-r--r--
2020-05_oai_pmh.md
17309
log
stats
plain
-rw-r--r--
2020-05_pubmed.md
446
log
stats
plain
-rw-r--r--
2020-07_mag.md
16379
log
stats
plain
-rw-r--r--
2020-08_daily_improvements.md
9712
log
stats
plain
-rw-r--r--
2020-09_oa_doi.md
16083
log
stats
plain
-rw-r--r--
2020-09_reingest.md
8418
log
stats
plain
-rw-r--r--
2020-09_scielo.md
770
log
stats
plain
-rw-r--r--
2020-10_daily.md
9698
log
stats
plain
-rw-r--r--
2020-10_unpaywall.md
14222
log
stats
plain
-rw-r--r--
2020-11_doaj.md
14273
log
stats
plain
-rw-r--r--
2020-12-08_patch_crawl_notes.md
3913
log
stats
plain
-rw-r--r--
2021-04_unpaywall.md
17620
log
stats
plain
-rw-r--r--
2021-05_daily_improvements.md
17459
log
stats
plain
-rw-r--r--
2021-07_unpaywall.md
14837
log
stats
plain
-rw-r--r--
2021-08_mag.md
18428
log
stats
plain
-rw-r--r--
2021-08_oai_pmh_patch.md
9331
log
stats
plain
-rw-r--r--
NEXT.md
1582
log
stats
plain
-rwxr-xr-x
es_csv_to_json.py
976
log
stats
plain