diff options
Diffstat (limited to 'python')
-rw-r--r-- | python/refcat/tasks.py | 5 |
1 files changed, 3 insertions, 2 deletions
diff --git a/python/refcat/tasks.py b/python/refcat/tasks.py
index cf23a55..4880f43 100644
--- a/python/refcat/tasks.py
+++ b/python/refcat/tasks.py
@@ -751,7 +751,7 @@ class OpenLibraryWorksSorted(Refcat):
 class UnmatchedMapped(Refcat):
     """
     Map unmatched refs (in release schema) to titles to do approximate title
-    matches with OL; 29m16.100s.
+    matches with OL; 35m14.801s.
     """
 
     def requires(self):
@@ -760,12 +760,13 @@ class UnmatchedMapped(Refcat):
     def run(self):
         output = shellout("""
                           zstdcat -T0 {input} |
-                          skate-map -m cns |
+                          skate-map -m cns -skip-on-empty 1 |
                           LC_ALL=C sort -T {tmpdir} -S25% -k1,1 --parallel 4 |
                           zstd -T0 -c > {output}
                           """,
                           tmpdir=self.tmpdir,
                           input=self.input().path)
+        luigi.LocalTarget(output).move(self.output().path)
 
     def output(self):
         return luigi.LocalTarget(path=self.path(ext="tsv.zst"), format=Zstd)