From fc5d7cc7cd7545651481bd2f37fc0259ea697f58 Mon Sep 17 00:00:00 2001
From: Ilya Kreymer
Date: Thu, 25 Feb 2016 18:49:31 -0800
Subject: [PATCH] rewrite: add rewriting of content="" attribute if it is a url

---
 pywb/rewrite/html_rewriter.py           | 2 ++
 pywb/rewrite/test/test_html_rewriter.py | 6 ++++++
 2 files changed, 8 insertions(+)

diff --git a/pywb/rewrite/html_rewriter.py b/pywb/rewrite/html_rewriter.py
index 50629514..b93efe7a 100644
--- a/pywb/rewrite/html_rewriter.py
+++ b/pywb/rewrite/html_rewriter.py
@@ -294,6 +294,8 @@ class HTMLRewriterMixin(object):
             elif (tag == 'meta') and (attr_name == 'content'):
                 if self.has_attr(tag_attrs, ('http-equiv', 'refresh')):
                     attr_value = self._rewrite_meta_refresh(attr_value)
+                elif attr_value.startswith(self.DATA_RW_PROTOCOLS):
+                    attr_value = self._rewrite_url(attr_value, rw_mod)
 
             # special case: param value, conditional rewrite
             elif (tag == 'param'):
diff --git a/pywb/rewrite/test/test_html_rewriter.py b/pywb/rewrite/test/test_html_rewriter.py
index 0ceface3..002529e6 100644
--- a/pywb/rewrite/test/test_html_rewriter.py
+++ b/pywb/rewrite/test/test_html_rewriter.py
@@ -93,6 +93,12 @@ ur"""
 >>> parse('')
 
 
+>>> parse('')
+
+
+>>> parse('')
+
+
 # Custom -data attribs
 >>> parse('
')