From 94544a6b32064d299a93025b48297070db2edcd8 Mon Sep 17 00:00:00 2001 From: Bryan Newbold Date: Tue, 7 Apr 2020 16:08:53 -0700 Subject: update bulk export instructions - don't do expanded and regular release dumps - default to sqldump_public for item name (as that is common-case) --- extra/sql_dumps/README.md | 6 ++---- 1 file changed, 2 insertions(+), 4 deletions(-) diff --git a/extra/sql_dumps/README.md b/extra/sql_dumps/README.md index 00639fb9..3871549d 100644 --- a/extra/sql_dumps/README.md +++ b/extra/sql_dumps/README.md @@ -31,15 +31,13 @@ Or, in production: # production, as 'fatcat' user, in /srv/fatcat/src/rust: cat /tmp/fatcat_ident_releases.tsv | ./target/release/fatcat-export release --expand files,filesets,webcaptures,container -j8 | pigz > /srv/fatcat/snapshots/release_export_expanded.json.gz + cat /tmp/fatcat_ident_releases.tsv | ./target/release/fatcat-export release -j8 | pigz > /srv/fatcat/snapshots/release_export.json.gz cat /tmp/fatcat_ident_creators.tsv | ./target/release/fatcat-export creator -j8 | pigz > /srv/fatcat/snapshots/creator_export.json.gz cat /tmp/fatcat_ident_containers.tsv | ./target/release/fatcat-export container -j8 | pigz > /srv/fatcat/snapshots/container_export.json.gz cat /tmp/fatcat_ident_files.tsv | ./target/release/fatcat-export file -j8 | pigz > /srv/fatcat/snapshots/file_export.json.gz cat /tmp/fatcat_ident_filesets.tsv | ./target/release/fatcat-export fileset -j8 | pigz > /srv/fatcat/snapshots/fileset_export.json.gz cat /tmp/fatcat_ident_webcaptures.tsv | ./target/release/fatcat-export webcapture -j8 | pigz > /srv/fatcat/snapshots/webcapture_export.json.gz - # redundant with "release_export_expanded" - cat /tmp/fatcat_ident_releases.tsv | ./target/release/fatcat-export release -j8 | pigz > /srv/fatcat/snapshots/release_export.json.gz - Then usually move all these files to `/srv/fatcat/snapshots/`. 
## HOWTO: Dump abstracts, release identifiers, file hashes, etc @@ -109,7 +107,7 @@ The `./ia_item_exports_readme.md` and `sqldump` files should be included as a `README.md` when appropriate: ia upload fatcat_bulk_exports_YYYY-MM-DD ia_exports_item_readme.md --remote-name=README.md - ia upload fatcat_sqldump_full_YYYY-MM-DD ia_sqldump_item_readme.md --remote-name=README.md + ia upload fatcat_sqldump_public_YYYY-MM-DD ia_sqldump_item_readme.md --remote-name=README.md Uploads should use `--no-derive` to save cluster time. -- cgit v1.2.3