2014-03-02 21:42:05 -08:00
|
|
|
from wbrequestresponse import WbResponse, WbRequest
|
2014-02-05 13:08:10 -08:00
|
|
|
from archivalrouter import ArchivalRouter
|
|
|
|
import urlparse
|
|
|
|
|
2014-03-09 14:21:32 -07:00
|
|
|
from pywb.rewrite.url_rewriter import HttpsUrlRewriter
|
2014-03-02 21:42:05 -08:00
|
|
|
|
2014-02-05 13:08:10 -08:00
|
|
|
#=================================================================
|
|
|
|
# An experimental router which combines both archival and proxy modes
|
2014-03-02 21:42:05 -08:00
|
|
|
# http proxy mode support is very simple so far:
|
|
|
|
# only latest capture is available currently
|
2014-02-05 13:08:10 -08:00
|
|
|
#=================================================================
|
2014-03-03 10:35:57 -08:00
|
|
|
class ProxyArchivalRouter(ArchivalRouter):
|
2014-03-14 10:46:20 -07:00
|
|
|
def __init__(self, routes, **kwargs):
|
|
|
|
super(ProxyArchivalRouter, self).__init__(routes, **kwargs)
|
|
|
|
request_class = routes[0].request_class
|
|
|
|
self.proxy = ProxyRouter(routes[0].handler,
|
|
|
|
request_class=request_class,
|
|
|
|
**kwargs)
|
2014-02-05 13:08:10 -08:00
|
|
|
|
|
|
|
def __call__(self, env):
|
2014-03-03 10:35:57 -08:00
|
|
|
response = self.proxy(env)
|
2014-02-05 13:08:10 -08:00
|
|
|
if response:
|
|
|
|
return response
|
|
|
|
|
2014-03-03 10:35:57 -08:00
|
|
|
response = super(ProxyArchivalRouter, self).__call__(env)
|
2014-02-05 13:08:10 -08:00
|
|
|
if response:
|
|
|
|
return response
|
|
|
|
|
|
|
|
|
|
|
|
#=================================================================
|
|
|
|
# Simple router which routes http proxy requests
|
|
|
|
# Handles requests of the form: GET http://example.com
|
|
|
|
# Only supports latest capture replay at the moment
|
|
|
|
#=================================================================
|
|
|
|
class ProxyRouter:
|
2014-03-14 10:46:20 -07:00
|
|
|
def __init__(self, handler, **kwargs):
|
2014-02-05 13:08:10 -08:00
|
|
|
self.handler = handler
|
2014-03-14 10:46:20 -07:00
|
|
|
self.hostpaths = kwargs.get('hostpaths')
|
2014-02-05 13:08:10 -08:00
|
|
|
|
2014-03-14 10:46:20 -07:00
|
|
|
self.error_view = kwargs.get('error_view')
|
|
|
|
self.request_class = kwargs.get('request_class')
|
2014-02-05 13:08:10 -08:00
|
|
|
|
|
|
|
def __call__(self, env):
|
|
|
|
url = env['REL_REQUEST_URI']
|
|
|
|
|
|
|
|
if url.endswith('/proxy.pac'):
|
|
|
|
return self.make_pac_response(env)
|
|
|
|
|
|
|
|
if not url.startswith('http://'):
|
|
|
|
return None
|
|
|
|
|
2014-03-14 10:46:20 -07:00
|
|
|
wbrequest = self.request_class(env,
|
2014-02-23 23:31:54 -08:00
|
|
|
request_uri=url,
|
|
|
|
wb_url_str=url,
|
2014-03-07 10:29:11 -08:00
|
|
|
host_prefix=self.hostpaths[0],
|
2014-02-23 23:31:54 -08:00
|
|
|
wburl_class=self.handler.get_wburl_type(),
|
2014-03-09 14:21:32 -07:00
|
|
|
urlrewriter_class=HttpsUrlRewriter,
|
2014-02-23 23:31:54 -08:00
|
|
|
use_abs_prefix=False,
|
|
|
|
is_proxy=True)
|
2014-02-05 13:08:10 -08:00
|
|
|
|
|
|
|
return self.handler(wbrequest)
|
|
|
|
|
|
|
|
# Proxy Auto-Config (PAC) script for the proxy
|
|
|
|
def make_pac_response(self, env):
|
2014-03-07 11:42:09 -08:00
|
|
|
import os
|
|
|
|
hostname = os.environ.get('PYWB_HOST_NAME')
|
|
|
|
if not hostname:
|
|
|
|
server_hostport = env['SERVER_NAME'] + ':' + env['SERVER_PORT']
|
|
|
|
hostonly = env['SERVER_NAME']
|
|
|
|
else:
|
|
|
|
server_hostport = hostname
|
|
|
|
hostonly = hostname.split(':')[0]
|
2014-02-05 13:08:10 -08:00
|
|
|
|
|
|
|
buff = 'function FindProxyForURL (url, host) {\n'
|
|
|
|
|
2014-03-02 21:42:05 -08:00
|
|
|
direct = ' if (shExpMatch(host, "{0}")) {{ return "DIRECT"; }}\n'
|
2014-02-05 13:08:10 -08:00
|
|
|
|
|
|
|
for hostpath in self.hostpaths:
|
|
|
|
parts = urlparse.urlsplit(hostpath).netloc.split(':')
|
2014-03-02 21:42:05 -08:00
|
|
|
buff += direct.format(parts[0])
|
2014-02-05 13:08:10 -08:00
|
|
|
|
2014-03-07 11:42:09 -08:00
|
|
|
buff += direct.format(hostonly)
|
2014-02-05 13:08:10 -08:00
|
|
|
|
|
|
|
#buff += '\n return "PROXY {0}";\n}}\n'.format(self.hostpaths[0])
|
|
|
|
buff += '\n return "PROXY {0}";\n}}\n'.format(server_hostport)
|
|
|
|
|
2014-03-02 21:42:05 -08:00
|
|
|
content_type = 'application/x-ns-proxy-autoconfig'
|
2014-02-05 13:08:10 -08:00
|
|
|
|
2014-03-02 21:42:05 -08:00
|
|
|
return WbResponse.text_response(buff, content_type=content_type)
|