<feed xmlns='http://www.w3.org/2005/Atom'>
<title>sandcrawler/python/scripts, branch master</title>
<subtitle>[no description]</subtitle>
<id>https://git.bnewbold.net/sandcrawler/atom?h=master</id>
<link rel='self' href='https://git.bnewbold.net/sandcrawler/atom?h=master'/>
<link rel='alternate' type='text/html' href='https://git.bnewbold.net/sandcrawler/'/>
<updated>2022-09-28T22:40:35+00:00</updated>
<entry>
<title>update oai-pmh ingest request transform script</title>
<updated>2022-09-28T22:40:35+00:00</updated>
<author>
<name>Bryan Newbold</name>
<email>bnewbold@archive.org</email>
</author>
<published>2022-09-28T22:40:35+00:00</published>
<link rel='alternate' type='text/html' href='https://git.bnewbold.net/sandcrawler/commit/?id=dfd4605d84712eccb95a63e50b0bcb343642b433'/>
<id>urn:sha1:dfd4605d84712eccb95a63e50b0bcb343642b433</id>
<content type='text'>
</content>
</entry>
<entry>
<title>doaj and unpaywall transforms: more domains to skip</title>
<updated>2022-07-21T01:02:56+00:00</updated>
<author>
<name>Bryan Newbold</name>
<email>bnewbold@archive.org</email>
</author>
<published>2022-07-21T01:02:56+00:00</published>
<link rel='alternate' type='text/html' href='https://git.bnewbold.net/sandcrawler/commit/?id=a72019e6e788be64420719c5045e40614098c106'/>
<id>urn:sha1:a72019e6e788be64420719c5045e40614098c106</id>
<content type='text'>
</content>
</entry>
<entry>
<title>row2json script: fix argument type</title>
<updated>2022-07-15T20:19:12+00:00</updated>
<author>
<name>Bryan Newbold</name>
<email>bnewbold@archive.org</email>
</author>
<published>2022-07-15T20:19:12+00:00</published>
<link rel='alternate' type='text/html' href='https://git.bnewbold.net/sandcrawler/commit/?id=3f8fed325a3dd8d51652dffab89880c1cf25656b'/>
<id>urn:sha1:3f8fed325a3dd8d51652dffab89880c1cf25656b</id>
<content type='text'>
</content>
</entry>
<entry>
<title>row2json script: add flag to enable recrawling</title>
<updated>2022-07-15T20:07:10+00:00</updated>
<author>
<name>Bryan Newbold</name>
<email>bnewbold@archive.org</email>
</author>
<published>2022-07-15T20:07:10+00:00</published>
<link rel='alternate' type='text/html' href='https://git.bnewbold.net/sandcrawler/commit/?id=ce386a7a1f38c2c6289ce9d0bde269b4b1349154'/>
<id>urn:sha1:ce386a7a1f38c2c6289ce9d0bde269b4b1349154</id>
<content type='text'>
</content>
</entry>
<entry>
<title>more sentry config changes</title>
<updated>2022-02-25T19:45:45+00:00</updated>
<author>
<name>Bryan Newbold</name>
<email>bnewbold@archive.org</email>
</author>
<published>2022-02-25T19:45:45+00:00</published>
<link rel='alternate' type='text/html' href='https://git.bnewbold.net/sandcrawler/commit/?id=a0766e6a0100694434ddb2a4a895287806049ed8'/>
<id>urn:sha1:a0766e6a0100694434ddb2a4a895287806049ed8</id>
<content type='text'>
</content>
</entry>
<entry>
<title>switch from 'raven' to 'sentry-sdk'</title>
<updated>2022-02-25T00:35:10+00:00</updated>
<author>
<name>Bryan Newbold</name>
<email>bnewbold@archive.org</email>
</author>
<published>2022-02-25T00:35:10+00:00</published>
<link rel='alternate' type='text/html' href='https://git.bnewbold.net/sandcrawler/commit/?id=7f7846b99042897afd5916b9263320c0e2775706'/>
<id>urn:sha1:7f7846b99042897afd5916b9263320c0e2775706</id>
<content type='text'>
</content>
</entry>
<entry>
<title>add CDX sha1hex lookup/fetch helper script</title>
<updated>2021-11-30T23:29:41+00:00</updated>
<author>
<name>Bryan Newbold</name>
<email>bnewbold@archive.org</email>
</author>
<published>2021-11-30T23:29:41+00:00</published>
<link rel='alternate' type='text/html' href='https://git.bnewbold.net/sandcrawler/commit/?id=0328598e3b643edd0a2033ca97c607f596dfb092'/>
<id>urn:sha1:0328598e3b643edd0a2033ca97c607f596dfb092</id>
<content type='text'>
</content>
</entry>
<entry>
<title>remove grobid2json helper file, replace with grobid_tei_xml</title>
<updated>2021-10-28T02:10:35+00:00</updated>
<author>
<name>Bryan Newbold</name>
<email>bnewbold@archive.org</email>
</author>
<published>2021-10-28T02:10:35+00:00</published>
<link rel='alternate' type='text/html' href='https://git.bnewbold.net/sandcrawler/commit/?id=a0e275a4bad46ef41585f0207d6dfa1e3c38bc35'/>
<id>urn:sha1:a0e275a4bad46ef41585f0207d6dfa1e3c38bc35</id>
<content type='text'>
</content>
</entry>
<entry>
<title>make fmt (black 21.9b0)</title>
<updated>2021-10-28T01:50:17+00:00</updated>
<author>
<name>Bryan Newbold</name>
<email>bnewbold@archive.org</email>
</author>
<published>2021-10-28T01:50:17+00:00</published>
<link rel='alternate' type='text/html' href='https://git.bnewbold.net/sandcrawler/commit/?id=826c7538e091fac14d987a3cd654975da964e240'/>
<id>urn:sha1:826c7538e091fac14d987a3cd654975da964e240</id>
<content type='text'>
</content>
</entry>
<entry>
<title>make fmt</title>
<updated>2021-10-26T19:54:37+00:00</updated>
<author>
<name>Bryan Newbold</name>
<email>bnewbold@archive.org</email>
</author>
<published>2021-10-26T19:54:37+00:00</published>
<link rel='alternate' type='text/html' href='https://git.bnewbold.net/sandcrawler/commit/?id=05bd7cbcc62588e431c5efd533189e246b2a997e'/>
<id>urn:sha1:05bd7cbcc62588e431c5efd533189e246b2a997e</id>
<content type='text'>
</content>
</entry>
</feed>
