aboutsummaryrefslogtreecommitdiffstats
path: root/extra/cleanups/check_hashes.sh
blob: 94102329b94d42cacfe892d2d34237e1dadcbe00 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
#!/usr/bin/env bash
#
# Report rows of a gzip-compressed, whitespace-delimited dump whose third
# column is duplicated.
#
# Usage: check_hashes.sh HASH_FILE
#
# Arguments:
#   HASH_FILE  path to a gzip-compressed text file; column 3 is used as the
#              key and column 1 is carried along as the payload.
#              (presumably column 3 is a 40-hex-char SHA-1, given the output
#              file name and the 40-character compare width -- confirm
#              against the producer of the dump)
#
# Outputs (both written to the current working directory):
#   sha1_ident.dupes.tsv  overwritten; one "key<TAB>col1" line per key that
#                         occurs more than once
#   counts.txt            appended with the `wc -l` line for the file above

set -e -u -o pipefail

# Byte-wise collation so sort and uniq agree on ordering and equality.
export LC_ALL=C

if [[ -z "${1:-}" ]]; then
  printf 'usage: %s HASH_FILE\n' "${0##*/}" >&2
  exit 2
fi

HASH_FILE=$1

# Pipeline stages:
#   awk   - reorder to "col3<TAB>col1" so the key leads each line
#   rg -v - drop rows whose key column is empty (line starts with a tab)
#   sort  - group identical keys together, using a 4G in-memory buffer
#   uniq  - -d emits one line per repeated group; -w 40 compares only the
#           first 40 characters of each line
zcat -- "$HASH_FILE" \
    | awk '{print $3 "\t" $1}' \
    | rg -v '^\t' \
    | sort -S 4G \
    | uniq -d -w 40 \
    > sha1_ident.dupes.tsv

wc -l sha1_ident.dupes.tsv >> counts.txt