diff options
author | Martin Czygan <martin.czygan@gmail.com> | 2021-05-24 21:42:54 +0200 |
---|---|---|
committer | Martin Czygan <martin.czygan@gmail.com> | 2021-05-24 21:42:54 +0200 |
commit | 18846ab86dae4145b91e7cbbfa1be07a0239275e (patch) | |
tree | 39908f5cc20c5c04dd12d426484f0bb4414b1037 /python | |
parent | 7dba9e88abe328e59da73d475b17d627cd190901 (diff) | |
download | refcat-18846ab86dae4145b91e7cbbfa1be07a0239275e.tar.gz refcat-18846ab86dae4145b91e7cbbfa1be07a0239275e.zip |
use container title mapper, cts
Diffstat (limited to 'python')
-rw-r--r-- | python/refcat/tasks.py | 5 |
1 files changed, 3 insertions, 2 deletions
```diff
diff --git a/python/refcat/tasks.py b/python/refcat/tasks.py
index fa72062..8b29f94 100644
--- a/python/refcat/tasks.py
+++ b/python/refcat/tasks.py
@@ -750,7 +750,8 @@ class OpenLibraryWorksSorted(Refcat):
 
 class UnmatchedMapped(Refcat):
     """
-    Map unmatched refs (in release schema) to titles to do approximate title matches with OL.
+    Map unmatched refs (in release schema) to titles to do approximate title
+    matches with OL; 29m16.100s.
     """
 
     def requires(self):
@@ -759,7 +760,7 @@ class UnmatchedMapped(Refcat):
     def run(self):
         output = shellout("""
                           zstdcat -T0 {input} |
-                          skate-map -m ts |
+                          skate-map -m cts |
                           LC_ALL=C sort -T {tmpdir} -S25% -k1,1 --parallel 4 |
                           zstd -T0 -c > {output}
                           """,
```