1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
|
#!/usr/bin/env python3
import argparse
import os
import sys
import sentry_sdk
from fatcat_tools import authenticated_api
from fatcat_tools.cleanups import FileCleaner, JsonLinePusher
def run_files(args: argparse.Namespace) -> None:
    """Run the file-entity cleanup over the JSON lines in ``args.json_file``.

    Reads ``api``, ``dry_run``, ``batch_size``,
    ``editgroup_description_override`` and ``json_file`` from ``args``,
    configures a ``FileCleaner`` with them, and runs it through a
    ``JsonLinePusher``.
    """
    api_client = args.api
    cleaner_options = {
        "dry_run_mode": args.dry_run,
        "edit_batch_size": args.batch_size,
        "editgroup_description": args.editgroup_description_override,
    }
    cleaner = FileCleaner(api_client, **cleaner_options)

    pusher = JsonLinePusher(cleaner, args.json_file)
    pusher.run()
def main() -> None:
parser = argparse.ArgumentParser(formatter_class=argparse.ArgumentDefaultsHelpFormatter)
parser.add_argument(
"--fatcat-api-url", default="http://localhost:9411/v0", help="connect to this host/port"
)
parser.add_argument("--batch-size", help="size of batch to send", default=50, type=int)
parser.add_argument(
"--editgroup-description-override",
help="editgroup description override",
default=None,
type=str,
)
parser.add_argument(
"--dry-run", help="dry-run mode (don't actually update)", default=False, type=bool
)
subparsers = parser.add_subparsers()
sub_files = subparsers.add_parser(
"files", help="attempt metadata cleanups over a list of file entities"
)
sub_files.set_defaults(
func=run_files,
auth_var="FATCAT_AUTH_WORKER_CLEANUP",
)
sub_files.add_argument(
"json_file",
help="files JSON file to import from",
default=sys.stdin,
type=argparse.FileType("r"),
)
args = parser.parse_args()
if not args.__dict__.get("func"):
print("tell me what to do!")
sys.exit(-1)
# allow editgroup description override via env variable (but CLI arg takes
# precedence)
if not args.editgroup_description_override and os.environ.get(
"FATCAT_EDITGROUP_DESCRIPTION"
):
args.editgroup_description_override = os.environ.get("FATCAT_EDITGROUP_DESCRIPTION")
args.api = authenticated_api(
args.fatcat_api_url,
# token is an optional kwarg (can be empty string, None, etc)
token=os.environ.get(args.auth_var),
)
sentry_sdk.init(environment=args.env)
args.func(args)
# Run the command-line interface only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()
|