aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r-- python/refcat/tasks.py 3
1 files changed, 2 insertions, 1 deletions
diff --git a/python/refcat/tasks.py b/python/refcat/tasks.py
index 43eb4b2..75a3daa 100644
--- a/python/refcat/tasks.py
+++ b/python/refcat/tasks.py
@@ -337,7 +337,7 @@ class OpenCitations(luigi.ExternalTask, Refcat):
class RefsWithUnstructured(Refcat):
"""
Augment refs with data from biblio.unstructured - do this first, so we can
- use it in all subsequent steps.
+ use it in all subsequent steps. Do some basic cleanup.
"""
def requires(self):
return Refs()
@@ -345,6 +345,7 @@ class RefsWithUnstructured(Refcat):
def run(self):
output = shellout("""
zstdcat -T0 {input} |
+ skate-cleanup -c ref |
skate-from-unstructured |
zstd -T0 -c > {output}
""",