summary refs log tree commit diff stats
path: root/extra/sitemap
diff options
context:
space:
mode:
Diffstat (limited to 'extra/sitemap')
-rwxr-xr-x extra/sitemap/release_url_lists.sh 2
1 files changed, 2 insertions, 0 deletions
diff --git a/extra/sitemap/release_url_lists.sh b/extra/sitemap/release_url_lists.sh
index d5c8d4ef..280ecab1 100755
--- a/extra/sitemap/release_url_lists.sh
+++ b/extra/sitemap/release_url_lists.sh
@@ -19,6 +19,8 @@ EXPORT_FILE_GZ="$2"
zcat $EXPORT_FILE_GZ \
| rg '"release_ids"' \
| rg 'archive.org/' \
+ | rg 'application/pdf' \
+ | rg '"url":' \
| rg -v '"stub"' \
| jq -r '[.work_id, .ident] | @tsv' \
| uniq -w 26 \