aboutsummaryrefslogtreecommitdiffstats
path: root/notes/url_pattern_heuristic_verification.txt
diff options
context:
space:
mode:
authorBryan Newbold <bnewbold@archive.org>2022-07-16 13:08:05 -0700
committerBryan Newbold <bnewbold@archive.org>2022-07-16 13:08:05 -0700
commitda12c99e0d9cdbdc8868a94f8d78b6cd3b2653fa (patch)
tree36075e3f7c275050c3e445332e7d7fd9e5741b46 /notes/url_pattern_heuristic_verification.txt
parentab8f4b0f957fa020f94fbb373e4d41f3cbb94293 (diff)
downloadsandcrawler-da12c99e0d9cdbdc8868a94f8d78b6cd3b2653fa.tar.gz
sandcrawler-da12c99e0d9cdbdc8868a94f8d78b6cd3b2653fa.zip
html ingest: allow fuzzy CDX sha1 match based on encoding/not-encoding
Diffstat (limited to 'notes/url_pattern_heuristic_verification.txt')
0 files changed, 0 insertions, 0 deletions