about | summary | refs | log | tree | commit | diff | stats
path: root/python
diff options
context:
space:
mode:
author: Martin Czygan <martin.czygan@gmail.com> 2021-06-03 11:01:34 +0200
committer: Martin Czygan <martin.czygan@gmail.com> 2021-06-03 11:01:34 +0200
commit: f70b8304afbe0edeb570ecde90f05cf1d36cfffa (patch)
tree: d836aaede521969cae0934a0c263b4bc05024ded /python
parent: 094178acfa32ec913b0adc4655e25a9316e29510 (diff)
download: refcat-f70b8304afbe0edeb570ecde90f05cf1d36cfffa.tar.gz
refcat-f70b8304afbe0edeb570ecde90f05cf1d36cfffa.zip
unmapped: we want normalized container names
Diffstat (limited to 'python')
-rw-r--r-- python/refcat/tasks.py 4
1 files changed, 3 insertions, 1 deletions
diff --git a/python/refcat/tasks.py b/python/refcat/tasks.py
index afa615f..885dc58 100644
--- a/python/refcat/tasks.py
+++ b/python/refcat/tasks.py
@@ -938,6 +938,8 @@ class UnmatchedMapped(Refcat):
"""
Map unmatched refs (converted to release schema on the fly) to container
names to do approximate title matches with OL; 35m14.801s.
+
+ XXX: We want normalized container names.
"""
def requires(self):
return RefsWithoutIdentifiers()
@@ -946,7 +948,7 @@ class UnmatchedMapped(Refcat):
output = shellout("""
zstdcat -T0 {input} |
skate-conv -f ref |
- skate-map -m ff -x container_name -skip-on-empty 1 |
+ skate-map -m rcns -skip-on-empty 1 |
LC_ALL=C sort -T {tmpdir} -S25% -k1,1 --parallel 4 |
zstd -T0 -c > {output}
""",