From 0f4d779b00649a6b3e0d2224ee8a90afba5863b7 Mon Sep 17 00:00:00 2001 From: Ilya Kreymer Date: Sat, 18 Jul 2015 18:23:57 -0700 Subject: [PATCH] html rewrite: add 'force_html_decl' option which, if set in rewrite_opts, can be used to force an HTML decl, e.g. if a default one was not provided --- pywb/rewrite/html_rewriter.py | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/pywb/rewrite/html_rewriter.py b/pywb/rewrite/html_rewriter.py index afbeba6c..527b0f07 100644 --- a/pywb/rewrite/html_rewriter.py +++ b/pywb/rewrite/html_rewriter.py @@ -109,6 +109,8 @@ class HTMLRewriterMixin(object): # get opts from urlrewriter self.opts = url_rewriter.rewrite_opts + self.force_decl = self.opts.get('force_html_decl', None) + self.parsed_any = False # =========================== @@ -300,6 +302,10 @@ class HTMLRewriterMixin(object): # Clear buffer to create new one for next rewrite() self.out = None + if self.force_decl: + result = self.force_decl + '\n' + result + self.force_decl = None + return result def close(self): @@ -409,6 +415,7 @@ class HTMLRewriter(HTMLRewriterMixin, HTMLParser): def handle_decl(self, data): self.out.write('') + self.force_decl = None def handle_pi(self, data): self.out.write('')