diff --git a/pywb/framework/wbrequestresponse.py b/pywb/framework/wbrequestresponse.py index a234c76e..991f42a2 100644 --- a/pywb/framework/wbrequestresponse.py +++ b/pywb/framework/wbrequestresponse.py @@ -87,6 +87,17 @@ class WbRequest(object): self._parse_extra() + @property + def is_embed(self): + return (self.wb_url and + self.wb_url.mod and + self.wb_url.mod != 'id_') + + @property + def is_identity(self): + return (self.wb_url and + self.wb_url.mod == 'id_') + def _is_ajax(self): value = self.env.get('HTTP_X_REQUESTED_WITH') if not value: diff --git a/pywb/rewrite/regex_rewriters.py b/pywb/rewrite/regex_rewriters.py index 7970ab48..5f429339 100644 --- a/pywb/rewrite/regex_rewriters.py +++ b/pywb/rewrite/regex_rewriters.py @@ -25,7 +25,7 @@ class RegexRewriter(object): @staticmethod def archival_rewrite(rewriter): - return lambda string: rewriter.rewrite(string) + return lambda string: rewriter.rewrite(string, 'em_') #@staticmethod #def replacer(other): @@ -33,7 +33,7 @@ class RegexRewriter(object): HTTPX_MATCH_STR = r'https?:\\?/\\?/[A-Za-z0-9:_@.-]+' - DEFAULT_OP = add_prefix + #DEFAULT_OP = add_prefix def __init__(self, rules): #rules = self.create_rules(http_prefix) @@ -74,8 +74,8 @@ class RegexRewriter(object): return m.group(0) # Custom func - if not hasattr(op, '__call__'): - op = RegexRewriter.DEFAULT_OP(op) + #if not hasattr(op, '__call__'): + # op = RegexRewriter.DEFAULT_OP(op) result = op(m.group(i)) final_str = result @@ -124,8 +124,8 @@ class JSLinkAndLocationRewriter(JSLinkOnlyRewriter): def __init__(self, rewriter, rules=[], prefix='WB_wombat_'): rules = rules + [ - (r'(?>> parse('') - + # Unterminated script tag, handle but don't auto-terminate >>> parse('') - + >>> parse('
') - + >>> parse('') - + # Unterminated style tag, handle but don't auto-terminate >>> parse('') - + # Unterminated style tag, handle but don't auto-terminate >>> parse('