blob: 94102329b94d42cacfe892d2d34237e1dadcbe00 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
|
#!/usr/bin/env bash
#
# Report keys that occur more than once in a gzip-compressed,
# whitespace-delimited dump.
#
# Usage: <this script> HASH_FILE
#
#   HASH_FILE  gzip-compressed text file; columns 1 and 3 of each line are used.
#
# Outputs (both in the current working directory):
#   sha1_ident.dupes.tsv  one "<col3>\t<col1>" line per group of rows whose
#                         first 40 characters are identical (overwritten)
#   counts.txt            the `wc -l` line for the file above (appended)
#
# NOTE(review): the 40-character comparison width and the output name suggest
# column 3 is a 40-hex-digit SHA-1 -- confirm against the dump's schema.
set -e -u -o pipefail

# Byte-wise collation so sort and uniq agree on ordering regardless of the
# caller's locale.
export LC_ALL=C

# Abort with a usage message when the argument is missing or empty, rather
# than relying on the terse "unbound variable" error from `set -u`.
HASH_FILE=${1:?"usage: ${0##*/} HASH_FILE"}

# Pipeline stages:
#   zcat  decompress the dump; the path is quoted and preceded by `--` so
#         names with spaces, globs, or a leading dash are passed through intact
#   awk   re-key each row as "<col3>\t<col1>"
#   rg    drop rows that start with a tab, i.e. rows whose third column is empty
#   sort  order rows so equal keys are adjacent (4G in-memory buffer)
#   uniq  -d prints one row per duplicated group; -w 40 compares only the
#         first 40 characters of each row
zcat -- "$HASH_FILE" \
  | awk '{print $3 "\t" $1}' \
  | rg -v '^\t' \
  | sort -S 4G \
  | uniq -d -w 40 \
  > sha1_ident.dupes.tsv

# Record how many duplicated keys were found.
wc -l sha1_ident.dupes.tsv >> counts.txt
|