-
Notifications
You must be signed in to change notification settings - Fork 18
/
proxy.py
174 lines (138 loc) · 5.53 KB
/
proxy.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
#!/usr/bin/python
# -*- coding:utf-8 -*-
#############################################
# Flask & werkzeug HTTP Proxy Sample code.
# - Code by Jioh L. Jung (ziozzang@gmail.com)
#############################################
import sys
if sys.version_info[0] < 3:
import httplib
import urlparse
else:
import http.client as httplib
import urllib.parse as urlparse
import re
import urllib
import json
from flask import Flask, Blueprint, request, Response, url_for
from werkzeug.datastructures import Headers
from werkzeug.exceptions import NotFound
app = Flask(__name__)
# Default Configuration
DEBUG_FLAG = True
LISTEN_PORT = 7788
proxy = Blueprint('proxy', __name__)
# You can insert Authentication here.
#proxy.before_request(check_login)
# Filters.
HTML_REGEX = re.compile(r'((?:src|action|href)=["\'])/')
JQUERY_REGEX = re.compile(r'(\$\.(?:get|post)\(["\'])/')
JS_LOCATION_REGEX = re.compile(r'((?:window|document)\.location.*=.*["\'])/')
CSS_REGEX = re.compile(r'(url\(["\']?)/')
REGEXES = [HTML_REGEX, JQUERY_REGEX, JS_LOCATION_REGEX, CSS_REGEX]
def iterform(multidict):
for key in multidict.keys():
for value in multidict.getlist(key):
yield (key.encode("utf8"), value.encode("utf8"))
def parse_host_port(h, proto):
"""Parses strings in the form host[:port]"""
host_port = h.split(":", 1)
if len(host_port) == 1:
if proto.lower() == 'http': return (h, 80)
if proto.lower() == 'https': return (h, 443)
return (h, 443) # Default is HTTPS
else:
host_port[1] = int(host_port[1])
return host_port
# For RESTful Service
@proxy.route('/proxy/<proto>/<host>/', methods=["GET", "POST", "PUT", "DELETE"])
@proxy.route('/proxy/<proto>/<host>/<path:file>', methods=["GET", "POST", "PUT", "DELETE"])
def proxy_request(proto, host, file=""):
hostname, port = parse_host_port(host, proto)
print ("H: '%s' P: %d" % (hostname, port))
print ("F: '%s'" % (file))
# Whitelist a few headers to pass on
request_headers = {}
for h in ["Cookie", "Referer", "X-Csrf-Token"]:
if h in request.headers:
request_headers[h] = request.headers[h]
if request.query_string:
path = "/%s?%s" % (file, request.query_string)
else:
path = "/" + file
if request.method == "POST" or request.method == "PUT":
form_data = list(iterform(request.form))
form_data = urllib.urlencode(form_data)
request_headers["Content-Length"] = len(form_data)
else:
form_data = None
if not ('host' in request_headers.keys()):
request_headers['host'] = hostname
# if target is for HTTP, use HTTPConnection method.
request_method = httplib.HTTPSConnection
if proto.lower() == 'http': request_method = httplib.HTTPConnection
conn = request_method(hostname, port)
conn.request(request.method, path, body=form_data, headers=request_headers)
resp = conn.getresponse()
# Clean up response headers for forwarding
d = {}
response_headers = Headers()
for key, value in resp.getheaders():
print ("HEADER: '%s':'%s'" % (key, value))
d[key.lower()] = value
if key in ["content-length", "connection", "content-type"]:
continue
if key == "set-cookie":
cookies = value.split(",")
[response_headers.add(key, c) for c in cookies]
else:
response_headers.add(key, value)
# If this is a redirect, munge the Location URL
if "location" in response_headers:
redirect = response_headers["location"]
parsed = urlparse.urlparse(request.url)
redirect_parsed = urlparse.urlparse(redirect)
redirect_host = redirect_parsed.netloc
if not redirect_host:
redirect_host = "%s:%d" % (hostname, port)
redirect_path = redirect_parsed.path
if redirect_parsed.query:
redirect_path += "?" + redirect_parsed.query
munged_path = url_for(".proxy_request",
proto=proto,
host=redirect_host,
file=redirect_path[1:])
url = "%s://%s%s" % (parsed.scheme, parsed.netloc, munged_path)
response_headers["location"] = url
# Rewrite URLs in the content to point to our URL schemt.method == " instead.
# Ugly, but seems to mostly work.
root = url_for(".proxy_request", proto=proto, host=host)
contents = resp.read()
# Restructing Contents.
if "content-type" in d.keys():
if d["content-type"].find("application/json") >= 0:
# JSON format conentens will be modified here.
jc = json.loads(contents)
if jc.has_key("nodes"):
del jc["nodes"]
contents = json.dumps(jc)
else:
# Generic HTTP.
pass
# only valid for python2 / cuz, python3's string & byte handling is diffrent from python2
#for regex in REGEXES:
# contents = regex.sub(r'\1%s' % root, contents)
else:
# set default content-type, for error handling
d['content-type'] = 'text/html; charset=utf-8'
# Remove transfer-encoding: chunked header. cuz proxy does not use chunk trnasfer.
if 'transfer-encoding' in d:
if d['transfer-encoding'].lower() == 'chunked':
del(d['transfer-encoding'])
d['content-length'] = len(contents)
flask_response = Response(response=contents,
status=resp.status,
headers=d)
return flask_response
app.register_blueprint(proxy)
app.run(debug=DEBUG_FLAG, host='0.0.0.0', port=LISTEN_PORT)