diff --git a/pywb/rewrite/lxml_html_rewriter.py b/pywb/rewrite/lxml_html_rewriter.py index 415334d3..ef809cf8 100644 --- a/pywb/rewrite/lxml_html_rewriter.py +++ b/pywb/rewrite/lxml_html_rewriter.py @@ -77,8 +77,18 @@ class RewriterTarget(object): self.rewriter.parse_data(data) self.rewriter.out.write(u'-->') - def pi(self, data): - self.rewriter.out.write(u'') + def doctype(self, root_tag, public_id, system_id): + self.rewriter.out.write(u'') + + def pi(self, target, data): + self.rewriter.out.write(u'') def close(self): return '' diff --git a/pywb/rewrite/test/test_html_rewriter.py b/pywb/rewrite/test/test_html_rewriter.py index 20b0ad37..9dbe55ed 100644 --- a/pywb/rewrite/test/test_html_rewriter.py +++ b/pywb/rewrite/test/test_html_rewriter.py @@ -46,6 +46,9 @@ ur""" >>> parse('') +>>> parse('') + + >>> parse('') @@ -63,6 +66,7 @@ ur""" >>> parse('
')
+# Style >>> parse('') @@ -77,11 +81,29 @@ ur""" >>> parse('Test', head_insert = '') Test ->>> parse('
SomeTest
', head_insert = '/* Insert */') -/* Insert */
SomeTest
+>>> parse('
SomeTest
', head_insert = '/* Insert */') +/* Insert */
SomeTest
>>> parse('
SomeTest
', head_insert = '')
SomeTest
+ +>>> parse('') + + +# uncommon markup +>>> parse('') + + +# no special cdata treatment, preserved in ') + + +# CDATA outside of ') + + +>>> parse('') + """ from pywb.rewrite.url_rewriter import UrlRewriter