diff options
Diffstat (limited to 'backfill')
| -rwxr-xr-x | backfill/backfill_hbase_from_cdx.py | 7 | 
1 files changed, 4 insertions, 3 deletions
| diff --git a/backfill/backfill_hbase_from_cdx.py b/backfill/backfill_hbase_from_cdx.py index 04ae7d9..e6596d5 100755 --- a/backfill/backfill_hbase_from_cdx.py +++ b/backfill/backfill_hbase_from_cdx.py @@ -167,17 +167,18 @@ class MRCDXBackfillHBase(MRJob):                  raw_cdx.startswith('#')):              # Skip line +            # XXX: tests don't cover this path; need coverage!              self.increment_counter('lines', 'invalid') -            return _, status +            return _, dict(status="invalid")          info = transform_line(raw_cdx)          if info is None:              self.increment_counter('lines', 'invalid') -            return +            return _, dict(status="invalid")          if info['file:mime'] not in self.mime_filter:              self.increment_counter('lines', 'skip') -            return +            return _, dict(status="skip")          key = info.pop('key')          info['f:c'] = json.dumps(info['f:c'], sort_keys=True, indent=None) | 
