python: Remove HTTP_CONTENT_{TYPE,LENGTH} from WSGI environment.
[ashd.git] / python3 / ashd-wsgi3
... / ...
CommitLineData
1#!/usr/bin/python3
2
3import sys, os, getopt, threading, logging, time, locale, collections
4import ashd.proto, ashd.util, ashd.perf
5try:
6 import pdm.srv
7except:
8 pdm = None
9
def usage(out):
    """Write the one-line command synopsis to the file-like object `out`."""
    synopsis = "usage: ashd-wsgi3 [-hAL] [-m PDM-SPEC] [-p MODPATH] [-l REQLIMIT] HANDLER-MODULE [ARGS...]\n"
    out.write(synopsis)
12
# Settings with their defaults; each can be overridden from the command line.
reqlimit = 0            # -l: maximum number of concurrent requests; 0 disables the limit
modwsgi_compat = False  # -A: use the module's `application' object instead of calling wmain()
setlog = True           # -L: cleared to skip the default logging configuration
try:
    opts, args = getopt.getopt(sys.argv[1:], "+hALp:l:m:")
except getopt.GetoptError as exc:
    # Report an unknown option or a missing option argument as a usage
    # error rather than dying with a traceback.
    sys.stderr.write("ashd-wsgi3: %s\n" % exc)
    usage(sys.stderr)
    sys.exit(1)
for o, a in opts:
    if o == "-h":
        usage(sys.stdout)
        sys.exit(0)
    elif o == "-p":
        sys.path.insert(0, a)
    elif o == "-L":
        setlog = False
    elif o == "-A":
        modwsgi_compat = True
    elif o == "-l":
        try:
            reqlimit = int(a)
        except ValueError:
            sys.stderr.write("ashd-wsgi3: invalid request limit: %s\n" % a)
            sys.exit(1)
    elif o == "-m":
        # The pdm package is optional; without it the option is ignored.
        if pdm is not None:
            pdm.srv.listen(a)
if not args:
    # The handler module name is mandatory.
    usage(sys.stderr)
    sys.exit(1)
if setlog:
    logging.basicConfig(format="ashd-wsgi3(%(name)s): %(levelname)s: %(message)s")
log = logging.getLogger("ashd-wsgi3")
38
# Import the handler module named by the first positional argument and
# obtain the WSGI callable from it.
try:
    # A non-empty fromlist makes __import__ return the named module
    # itself rather than its top-level package.
    handlermod = __import__(args[0], fromlist = ["dummy"])
except ImportError as exc:
    # An ImportError may have been raised without any arguments; fall
    # back to the exception itself instead of failing with IndexError.
    reason = exc.args[0] if exc.args else exc
    sys.stderr.write("ashd-wsgi3: handler %s not found: %s\n" % (args[0], reason))
    sys.exit(1)
if not modwsgi_compat:
    # Native mode: wmain() receives the remaining command-line arguments
    # and returns the WSGI callable.
    if not hasattr(handlermod, "wmain"):
        sys.stderr.write("ashd-wsgi3: handler %s has no `wmain' function\n" % args[0])
        sys.exit(1)
    handler = handlermod.wmain(*args[1:])
else:
    # Compatibility mode (-A): the module-level `application' object is
    # used as the WSGI callable directly.
    if not hasattr(handlermod, "application"):
        sys.stderr.write("ashd-wsgi3: handler %s has no `application' object\n" % args[0])
        sys.exit(1)
    handler = handlermod.application
54
class closed(IOError):
    """Signals that a write to the client failed because it went away."""
    def __init__(self):
        IOError.__init__(self, "The client has closed the connection.")
58
# Working directory at startup; relative paths are resolved against it.
cwd = os.getcwd()
def absolutify(path):
    """Return `path` as an absolute path.

    A path that already starts with '/' is returned unchanged; anything
    else, including the empty string, is joined onto the working
    directory recorded at startup.
    """
    # startswith() rather than path[0], so that an empty path does not
    # raise IndexError.
    if path.startswith('/'):
        return path
    return os.path.join(cwd, path)
64
def unquoteurl(url):
    """Decode the %XX escapes in the bytes-like `url`.

    Returns a new bytearray in which every '%' followed by two
    hexadecimal digits is replaced by the byte they denote; all other
    bytes are copied as they are.

    Raises ValueError if a '%' is followed by fewer than two bytes, or
    by a byte that is not a hexadecimal digit.
    """
    def hexval(byte):
        # Numeric value of a single ASCII hex digit, given as an integer.
        if ord(b'0') <= byte <= ord(b'9'):
            return byte - ord(b'0')
        if ord(b'a') <= byte <= ord(b'f'):
            return byte - ord(b'a') + 10
        if ord(b'A') <= byte <= ord(b'F'):
            return byte - ord(b'A') + 10
        raise ValueError("Illegal URL escape character")

    out = bytearray()
    pos = 0
    end = len(url)
    while pos < end:
        byte = url[pos]
        pos += 1
        if byte != ord(b'%'):
            out.append(byte)
            continue
        # pos now points just past the '%'; two more bytes must follow.
        if end < pos + 2:
            raise ValueError("Incomplete URL escape character")
        high = hexval(url[pos])
        low = hexval(url[pos + 1])
        out.append((high << 4) | low)
        pos += 2
    return out
97
def dowsgi(req):
    """Serve one request through the WSGI `handler`.

    Builds a CGI/WSGI environment from `req` (its headers, method, URL,
    rest string and protocol version, all given as bytes), calls the
    handler with it, and writes the status line, headers and body that
    the handler produces to `req.sk`.

    A failed write to `req.sk` ends the response quietly.  Any other
    exception, including one raised by the handler itself, propagates
    to the caller.
    """
    env = {}
    env["wsgi.version"] = (1, 0)
    # Every request header becomes an HTTP_* variable.
    for key, val in req.headers:
        env["HTTP_" + key.upper().replace(b"-", b"_").decode("latin-1")] = val.decode("latin-1")
    env["SERVER_SOFTWARE"] = "ashd-wsgi/1"
    env["GATEWAY_INTERFACE"] = "CGI/1.1"
    env["SERVER_PROTOCOL"] = req.ver.decode("latin-1")
    env["REQUEST_METHOD"] = req.method.decode("latin-1")
    # PATH_INFO is the unescaped rest string; if its escapes are
    # malformed, the raw rest string is used instead.
    try:
        rawpi = unquoteurl(req.rest)
    except ValueError:
        rawpi = req.rest
    # Prefer UTF-8 for the URL parts, falling back to latin-1 (which can
    # decode any byte sequence) for all three if any of them is not
    # valid UTF-8.
    try:
        name, rest, pi = (v.decode("utf-8") for v in (req.url, req.rest, rawpi))
        env["wsgi.uri_encoding"] = "utf-8"
    except UnicodeError:
        name, rest, pi = (v.decode("latin-1") for v in (req.url, req.rest, rawpi))
        env["wsgi.uri_encoding"] = "latin-1"
    env["REQUEST_URI"] = name
    p = name.find('?')
    if p >= 0:
        env["QUERY_STRING"] = name[p + 1:]
        name = name[:p]
    else:
        env["QUERY_STRING"] = ""
    if rest and name.endswith(rest):
        # This is the same hack used in call*cgi.
        name = name[:-len(rest)]
    if name == "/":
        # This seems to be normal CGI behavior, but see callcgi.c for
        # details.
        pi = "/" + pi
        name = ""
    env["SCRIPT_NAME"] = name
    env["PATH_INFO"] = pi
    # Copy selected header-derived values to their CGI/WSGI names.
    for src, tgt in [("HTTP_HOST", "SERVER_NAME"), ("HTTP_X_ASH_SERVER_PORT", "SERVER_PORT"),
                     ("HTTP_X_ASH_ADDRESS", "REMOTE_ADDR"), ("HTTP_CONTENT_TYPE", "CONTENT_TYPE"),
                     ("HTTP_CONTENT_LENGTH", "CONTENT_LENGTH"), ("HTTP_X_ASH_PROTOCOL", "wsgi.url_scheme")]:
        if src in env:
            env[tgt] = env[src]
    for key in ["HTTP_CONTENT_TYPE", "HTTP_CONTENT_LENGTH"]:
        # The CGI specification does not strictly require this, but
        # many actual programs and libraries seem to.
        if key in env:
            del env[key]
    if "X-Ash-Protocol" in req and req["X-Ash-Protocol"] == b"https":
        env["HTTPS"] = "on"
    if "X-Ash-File" in req:
        env["SCRIPT_FILENAME"] = absolutify(req["X-Ash-File"].decode(locale.getpreferredencoding()))
    env["wsgi.input"] = req.sk
    env["wsgi.errors"] = sys.stderr
    env["wsgi.multithread"] = True
    env["wsgi.multiprocess"] = False
    env["wsgi.run_once"] = False

    # Lists are used so that the nested functions can update them in
    # place: resp holds [status, headers] once the handler has started a
    # response, and respsent becomes non-empty once they were written.
    resp = []
    respsent = []

    def recode(thing):
        # Pass byte strings through and encode anything else as latin-1.
        # (collections.ByteString, which used to be tested here, is no
        # longer available from Python 3.10 on.)
        if isinstance(thing, (bytes, bytearray)):
            return thing
        return str(thing).encode("latin-1")

    def flushreq():
        # Write the status line and headers, unless already done.
        if respsent:
            return
        if not resp:
            raise Exception("Trying to write data before starting response.")
        status, headers = resp
        respsent[:] = [True]
        buf = bytearray()
        buf += b"HTTP/1.1 " + recode(status) + b"\n"
        for nm, val in headers:
            buf += recode(nm) + b": " + recode(val) + b"\n"
        buf += b"\n"
        try:
            req.sk.write(buf)
        except IOError:
            raise closed()

    def write(data):
        # The write callable returned from startreq; also used for the
        # data yielded by the handler.  Empty data is ignored, so it does
        # not force the headers out.
        if not data:
            return
        flushreq()
        try:
            req.sk.write(data)
            req.sk.flush()
        except IOError:
            raise closed()

    def startreq(status, headers, exc_info = None):
        # The start_response callable handed to the handler.
        if resp:
            if exc_info:
                # A second call carrying exc_info replaces the pending
                # status and headers, unless they have already been
                # written, in which case the error is re-raised.
                try:
                    if respsent:
                        raise exc_info[1]
                finally:
                    # Drop the reference so that the traceback does not
                    # keep this frame alive.
                    exc_info = None
            else:
                raise Exception("Can only start responding once.")
        resp[:] = status, headers
        return write

    with ashd.perf.request(env) as reqevent:
        try:
            respiter = handler(env, startreq)
            try:
                for data in respiter:
                    write(data)
                # Make sure the headers go out even when no body data
                # was produced.
                if resp:
                    flushreq()
            finally:
                if hasattr(respiter, "close"):
                    respiter.close()
        except closed:
            # The client went away; there is nobody left to answer.
            pass
        if resp:
            reqevent.response(resp)
213
# inflight counts the requests currently being handled; it is only
# modified while holding flightlock, which is also used to wake up
# threads waiting for a free slot.
flightlock = threading.Condition()
inflight = 0

class reqthread(threading.Thread):
    """Thread that serves a single request by calling dowsgi() on it."""
    def __init__(self, req):
        super().__init__(name = "Request handler")
        # Work on a duplicate of the request; it is closed at the end
        # of run().
        self.req = req.dup()

    def run(self):
        """Wait for a free request slot, serve the request and clean up.

        Exceptions raised while serving are logged, not propagated.
        """
        global inflight
        try:
            with flightlock:
                if reqlimit != 0:
                    # Measure the wait on the monotonic clock, so that
                    # adjustments of the wall clock can neither trigger
                    # nor suppress the abort below.
                    start = time.monotonic()
                    while inflight >= reqlimit:
                        flightlock.wait(10)
                        # Having waited this long for a slot is treated
                        # as fatal for the whole process.
                        if time.monotonic() - start > 10:
                            os.abort()
                inflight += 1
            try:
                dowsgi(self.req)
            finally:
                with flightlock:
                    inflight -= 1
                    flightlock.notify()
        except BaseException:
            # Deliberate catch-all at the thread boundary: whatever went
            # wrong is logged together with its traceback.
            log.error("exception occurred in handler thread", exc_info=True)
        finally:
            self.req.close()
            sys.stderr.flush()
244
def handle(req):
    """Serve `req` on a freshly started reqthread."""
    worker = reqthread(req)
    worker.start()

# Hand every incoming request to handle().
ashd.util.serveloop(handle)