aboutsummaryrefslogtreecommitdiffstats
path: root/sql
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2020-10-17 17:10:51 -0700
committer Bryan Newbold <bnewbold@archive.org> 2020-10-17 17:10:51 -0700
commit e1698ffa62f0292ad9f8d0e53207dfa3aa23818d (patch)
tree 5e9aab198a5a4b1f91865f72a8a03b2955c7ad83 /sql
parent 4f5c66fd33263a146609efbfcbfde4a344f0ac2d (diff)
download sandcrawler-e1698ffa62f0292ad9f8d0e53207dfa3aa23818d.tar.gz
sandcrawler-e1698ffa62f0292ad9f8d0e53207dfa3aa23818d.zip
update SQL ingest monitoring commands to be past-month by default
Diffstat (limited to 'sql')
-rw-r--r-- sql/monitoring_queries.md 10
1 files changed, 5 insertions, 5 deletions
diff --git a/sql/monitoring_queries.md b/sql/monitoring_queries.md
index fd0ce51..1738731 100644
--- a/sql/monitoring_queries.md
+++ b/sql/monitoring_queries.md
@@ -1,21 +1,21 @@
## fatcat-changelog pipeline
-Overall ingest status, past 3 days:
+Overall ingest status, past 30 days:
SELECT ingest_file_result.ingest_type, ingest_file_result.status, COUNT(*)
FROM ingest_file_result
LEFT JOIN ingest_request
ON ingest_file_result.ingest_type = ingest_request.ingest_type
AND ingest_file_result.base_url = ingest_request.base_url
- WHERE ingest_request.created >= NOW() - '3 day'::INTERVAL
+ WHERE ingest_request.created >= NOW() - '30 day'::INTERVAL
AND ingest_request.ingest_type = 'pdf'
AND ingest_request.ingest_request_source = 'fatcat-changelog'
GROUP BY ingest_file_result.ingest_type, ingest_file_result.status
ORDER BY COUNT DESC
LIMIT 20;
-Broken domains, past 3 days:
+Broken domains, past 30 days:
SELECT domain, status, COUNT((domain, status))
FROM (
@@ -29,7 +29,7 @@ Broken domains, past 3 days:
AND ingest_file_result.base_url = ingest_request.base_url
WHERE
-- ingest_request.created >= NOW() - '3 day'::INTERVAL
- ingest_file_result.updated >= NOW() - '3 day'::INTERVAL
+ ingest_file_result.updated >= NOW() - '30 day'::INTERVAL
AND ingest_request.ingest_type = 'pdf'
AND ingest_request.ingest_request_source = 'fatcat-changelog'
) t1
@@ -39,7 +39,7 @@ Broken domains, past 3 days:
ORDER BY COUNT DESC
LIMIT 25;
-Throughput per day, and success, for past month:
+Throughput per day, and success, for past 30 days:
SELECT ingest_request.ingest_type,
date(ingest_request.created),