about summary refs log tree commit diff stats
path: root/python
diff options
context:
space:
mode:
Diffstat (limited to 'python')
-rw-r--r-- python/refcat/tasks.py 5
1 files changed, 1 insertions, 4 deletions
diff --git a/python/refcat/tasks.py b/python/refcat/tasks.py
index 42fa924..792a9c3 100644
--- a/python/refcat/tasks.py
+++ b/python/refcat/tasks.py
@@ -467,15 +467,12 @@ class URLList(Refcat):
List of mostly cleaned, unique URLs from refs.
"""
def requires(self):
- return URLTabs()
+ return URLTabsCleaned()
def run(self):
output = shellout("""
zstdcat -T0 {input} |
cut -f 3 |
- skate-cleanup -X -c url -B -S -f 1 |
- LC_ALL=C sort -u -T {tmpdir} -k1,1 -S25% |
- LC_ALL=C grep -E '^https?://' |
zstd -T0 -c > {output}
""",
n=self.n,