trough dedup - handle case of no warc records written

This commit is contained in:
Noah Levitt 2017-11-30 12:55:39 -08:00
parent 61a7c234e8
commit c5f33bda7a

View File

@@ -292,11 +292,10 @@ class TroughDedupDb(object):
return None return None
def notify(self, recorded_url, records): def notify(self, recorded_url, records):
if (records[0].get_header(warctools.WarcRecord.TYPE) == warctools.WarcRecord.RESPONSE if (records and records[0].type == b'response'
and recorded_url.response_recorder.payload_size() > 0): and recorded_url.response_recorder.payload_size() > 0):
digest_key = warcprox.digest_str( digest_key = warcprox.digest_str(
recorded_url.payload_digest, recorded_url.payload_digest, self.options.base32)
self.options.base32)
if recorded_url.warcprox_meta and 'captures-bucket' in recorded_url.warcprox_meta: if recorded_url.warcprox_meta and 'captures-bucket' in recorded_url.warcprox_meta:
self.save( self.save(
digest_key, records[0], digest_key, records[0],