mirror of https://github.com/webrecorder/pywb.git synced 2025-03-23 22:52:25 +01:00
Ilya Kreymer d8b67319e1 rewrite refactoring:
- rewrite headers after content to ensure content-length/content-encoding rewritten if content modified
- header rewriter: remove proxyrewriter, set default rule to 'prefix' or 'keep' if url rewriting or not
- set is_content_rw if record.content_stream(), assume content is modified
- add BufferedRewriter as base for dash, hls, amf rewriting which processes the full stream
- should_rw_content() determines if should attempt content rewriting
- support banner-only insert mode: added HTMLInsertOnlyRewriter, enable if no custom JS rules
- test: enable banner-only test mode
2017-05-22 18:52:17 -07:00

71 lines
2.2 KiB

from contextlib import closing
from io import BytesIO, StringIO
import json
import xml.etree.ElementTree as ET
from pywb.rewrite.content_rewriter import BufferedRewriter
# ============================================================================
class RewriteDASH(BufferedRewriter):
    """Rewrite an MPEG-DASH manifest so each AdaptationSet keeps one Representation.

    For every ``AdaptationSet`` in every ``Period`` of the manifest, the
    ``Representation`` with the highest ``bandwidth`` attribute is kept and
    all other ``Representation`` elements are removed.
    """

    def rewrite_stream(self, stream):
        """Return the rewritten manifest as a binary buffer positioned at 0.

        Thin wrapper around :meth:`rewrite_dash` that drops the list of
        selected representation ids.
        """
        res_buff, _best_ids = self.rewrite_dash(stream)
        return res_buff

    def rewrite_dash(self, stream):
        """Parse the manifest in ``stream`` and strip non-best representations.

        :param stream: readable file-like object containing the MPD XML
        :returns: ``(buff, best_ids)`` where ``buff`` is a ``BytesIO`` holding
            the UTF-8 encoded rewritten manifest (positioned at the start)
            and ``best_ids`` is the list of ``id`` attributes of the kept
            representations, in document order
        :raises xml.etree.ElementTree.ParseError: if the content is not
            well-formed XML
        :raises ValueError: if a ``bandwidth`` attribute is not an integer
        """
        # Register the MPD namespace as the default one so the serialized
        # output does not gain generated 'ns0:' prefixes.
        ET.register_namespace('', 'urn:mpeg:dash:schema:mpd:2011')
        namespaces = {'mpd': 'urn:mpeg:dash:schema:mpd:2011'}

        tree = ET.ElementTree()
        tree.parse(stream)
        root = tree.getroot()

        best_ids = []

        for period in root.findall('mpd:Period', namespaces):
            for adaptset in period.findall('mpd:AdaptationSet', namespaces):
                representations = adaptset.findall('mpd:Representation',
                                                   namespaces)

                best = None
                best_bandwidth = 0
                for repres in representations:
                    bandwidth = int(repres.get('bandwidth', '0'))
                    # Compare against None explicitly: an Element without
                    # children is falsy, so a plain truth test would
                    # wrongly treat a childless Representation as "unset".
                    # Strict '>' keeps the first of equally good entries.
                    if best is None or bandwidth > best_bandwidth:
                        best = repres
                        best_bandwidth = bandwidth

                if best is None:
                    # No representations in this adaptation set.
                    continue

                best_ids.append(best.get('id'))

                # 'representations' is a snapshot list, so removing children
                # from 'adaptset' while iterating over it is safe.
                for repres in representations:
                    if repres is not best:
                        adaptset.remove(repres)

        # Serialize as text first, then encode, so the returned buffer always
        # contains UTF-8 bytes.
        string_io = StringIO()
        tree.write(string_io, encoding='unicode', xml_declaration=True)

        # A BytesIO built from initial bytes starts at position 0, ready to
        # be read by the caller.
        buff_io = BytesIO(string_io.getvalue().encode('utf-8'))
        return buff_io, best_ids
# ============================================================================
def rewrite_fb_dash(string):
    r"""Rewrite a DASH manifest embedded as an escaped string literal.

    The input is searched for the literal marker
    ``\n",dash_prefetched_representation_ids:`` (a backslash followed by
    ``n``, not a newline character).

    * If the marker is absent, ``string`` is returned unchanged.
    * Otherwise the text before the marker is unescaped, passed through
      ``RewriteDASH().rewrite_dash()``, and re-escaped. The result is the
      re-escaped manifest, followed by the marker, followed by the JSON
      list of the selected representation ids. Text that followed the
      marker in the input is not carried over.

    :param string: text containing the escaped manifest
    :returns: the rewritten text, or ``string`` itself if no marker is found
    """
    DASH_SPLIT = r'\n",dash_prefetched_representation_ids:'

    inx = string.find(DASH_SPLIT)
    if inx < 0:
        return string

    escaped_manifest = string[:inx]

    # The 'unicode-escape' codec decodes its input bytes as Latin-1, so the
    # text must be encoded as Latin-1 (with anything outside Latin-1 turned
    # into backslash escapes) rather than UTF-8; otherwise raw non-ASCII
    # characters come back as mojibake.
    manifest = (escaped_manifest
                .encode('latin-1', 'backslashreplace')
                .decode('unicode-escape'))

    rewritten, best_ids = RewriteDASH().rewrite_dash(
        BytesIO(manifest.encode('utf-8')))

    # json.dumps re-escapes the manifest; strip the surrounding quotes it
    # adds, and escape '<' so the result cannot close an enclosing tag.
    result = json.dumps(rewritten.read().decode('utf-8'))
    result = result[1:-1].replace('<', r'\x3C')

    return result + DASH_SPLIT + json.dumps(best_ids)