From 3bcb9c1c318564f92ce91bee88eb29f92670138a Mon Sep 17 00:00:00 2001
From: Bryan Newbold
Date: Wed, 7 Apr 2021 23:13:25 -0700
Subject: SQL snapshot doc update

---
 sql/README.md | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/sql/README.md b/sql/README.md
index 42dba31..e34feec 100644
--- a/sql/README.md
+++ b/sql/README.md
@@ -139,10 +139,13 @@ Questions we might want to answer
     http get :3030/cdx?url=eq.https://coleccionables.mercadolibre.com.ar/arduino-pdf_Installments_NoInterest_BestSellers_YES
     http get :3030/file_meta?sha1hex=eq.120582c855a7cc3c70a8527c560d7f27e6027278
 
-## Full Database Dumps
+
+## Full SQL Database Dumps
 
 Run a dump in compressed, postgres custom format:
 
     export DATESLUG="`date +%Y-%m-%d.%H%M%S`"
-    time sudo -u postgres pg_dump --verbose --format=custom sandcrawler > /sandcrawler-db/snapshots/sandcrawler_full_dbdump_${DATESLUG}.pgdump
+    time sudo -u postgres pg_dump --verbose --format=custom sandcrawler > sandcrawler_full_dbdump_${DATESLUG}.pgdump
 
+As of 2021-04-07, this process runs for about 4 hours and the compressed
+snapshot is 88 GBytes (compared with 551.34G database disk consumption).
-- 
cgit v1.2.3