mirror of
https://github.com/internetarchive/warcprox.git
synced 2025-01-18 13:22:09 +01:00
zlib decompression
This commit is contained in:
parent
c008c2eca7
commit
ee9e375560
4
setup.py
4
setup.py
@ -2,7 +2,7 @@
|
|||||||
'''
|
'''
|
||||||
setup.py - setuptools installation configuration for warcprox
|
setup.py - setuptools installation configuration for warcprox
|
||||||
|
|
||||||
Copyright (C) 2013-2022 Internet Archive
|
Copyright (C) 2013-2021 Internet Archive
|
||||||
|
|
||||||
This program is free software; you can redistribute it and/or
|
This program is free software; you can redistribute it and/or
|
||||||
modify it under the terms of the GNU General Public License
|
modify it under the terms of the GNU General Public License
|
||||||
@ -44,7 +44,7 @@ except:
|
|||||||
|
|
||||||
setuptools.setup(
|
setuptools.setup(
|
||||||
name='warcprox',
|
name='warcprox',
|
||||||
version='2.4.30',
|
version='2.4.29',
|
||||||
description='WARC writing MITM HTTP/S proxy',
|
description='WARC writing MITM HTTP/S proxy',
|
||||||
url='https://github.com/internetarchive/warcprox',
|
url='https://github.com/internetarchive/warcprox',
|
||||||
author='Noah Levitt',
|
author='Noah Levitt',
|
||||||
|
@ -2,7 +2,7 @@
|
|||||||
warcprox/warcproxy.py - recording proxy, extends mitmproxy to record traffic,
|
warcprox/warcproxy.py - recording proxy, extends mitmproxy to record traffic,
|
||||||
enqueue info on the recorded url queue
|
enqueue info on the recorded url queue
|
||||||
|
|
||||||
Copyright (C) 2013-2018 Internet Archive
|
Copyright (C) 2013-2022 Internet Archive
|
||||||
|
|
||||||
This program is free software; you can redistribute it and/or
|
This program is free software; you can redistribute it and/or
|
||||||
modify it under the terms of the GNU General Public License
|
modify it under the terms of the GNU General Public License
|
||||||
@ -46,6 +46,8 @@ import tempfile
|
|||||||
import hashlib
|
import hashlib
|
||||||
import doublethink
|
import doublethink
|
||||||
import re
|
import re
|
||||||
|
import zlib
|
||||||
|
import base64
|
||||||
|
|
||||||
class WarcProxyHandler(warcprox.mitmproxy.MitmProxyHandler):
|
class WarcProxyHandler(warcprox.mitmproxy.MitmProxyHandler):
|
||||||
'''
|
'''
|
||||||
@ -175,6 +177,13 @@ class WarcProxyHandler(warcprox.mitmproxy.MitmProxyHandler):
|
|||||||
warcprox_meta = json.loads(self.headers['Warcprox-Meta'])
|
warcprox_meta = json.loads(self.headers['Warcprox-Meta'])
|
||||||
self._security_check(warcprox_meta)
|
self._security_check(warcprox_meta)
|
||||||
self._enforce_limits(warcprox_meta)
|
self._enforce_limits(warcprox_meta)
|
||||||
|
if 'compressed_blocks' in warcprox_meta:
|
||||||
|
# b64decode and decompress
|
||||||
|
blocks_decompressed = zlib.decompress(base64.b64decode(warcprox_meta['compressed_blocks']))
|
||||||
|
# decode() and json.loads
|
||||||
|
warcprox_meta['blocks'] = json.loads(blocks_decompressed.decode())
|
||||||
|
# delete compressed_blocks (just in case?)
|
||||||
|
del warcprox_meta['compressed_blocks']
|
||||||
self._enforce_blocks(warcprox_meta)
|
self._enforce_blocks(warcprox_meta)
|
||||||
|
|
||||||
def _connect_to_remote_server(self):
|
def _connect_to_remote_server(self):
|
||||||
|
Loading…
x
Reference in New Issue
Block a user