aboutsummaryrefslogtreecommitdiffstats
path: root/sql
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2020-11-03 16:24:16 -0800
committer Bryan Newbold <bnewbold@archive.org> 2020-11-03 16:24:16 -0800
commit 644c6abdb424a3759e06df6b2541d41fb353e95c (patch)
tree 9b5f998ea4ded6ea9d09ee266b0e29fef8bdaddf /sql
parent c145488142d4b5413323322dfc1422efdece83f7 (diff)
download sandcrawler-644c6abdb424a3759e06df6b2541d41fb353e95c.tar.gz
sandcrawler-644c6abdb424a3759e06df6b2541d41fb353e95c.zip
tweak html_meta SQL schema
Diffstat (limited to 'sql')
-rw-r--r-- sql/migrations/2019-12-19-060141_init/up.sql | 4
1 files changed, 2 insertions, 2 deletions
diff --git a/sql/migrations/2019-12-19-060141_init/up.sql b/sql/migrations/2019-12-19-060141_init/up.sql
index 6a8c52b..73bd7f1 100644
--- a/sql/migrations/2019-12-19-060141_init/up.sql
+++ b/sql/migrations/2019-12-19-060141_init/up.sql
@@ -118,12 +118,12 @@ CREATE TABLE IF NOT EXISTS html_meta (
sha1hex TEXT PRIMARY KEY CHECK (octet_length(sha1hex) = 40),
updated TIMESTAMP WITH TIME ZONE DEFAULT now() NOT NULL,
status TEXT CHECK (octet_length(status) >= 1) NOT NULL,
+ scope TEXT CHECK (octet_length(scope) >= 1), -- nullable; must be non-empty when set (check validates scope itself, not status)
has_teixml BOOLEAN NOT NULL,
has_thumbnail BOOLEAN NOT NULL,
word_count INT CHECK (word_count >= 0),
- resource_count INT CHECK (resource_count >= 0),
biblio JSONB,
- resources JSONB,
+ resources JSONB
-- biblio JSON fields are similar to fatcat release schema
-- resources JSON object is a list of objects with keys like webcapture CDX schema
);