python: Improved error handling and logging in ashd-wsgi.
[ashd.git] / python3 / ashd-wsgi3
CommitLineData
55fa3f63 1#!/usr/bin/python3
c270f222 2
14640dcc 3import sys, os, getopt, threading, logging, time, locale, collections
d5ee5cde
FT
4import ashd.proto, ashd.util, ashd.perf
5try:
6 import pdm.srv
7except:
8 pdm = None
c270f222
FT
9
def usage(out):
    """Write the one-line command synopsis of ashd-wsgi3 to *out*.

    out -- any object with a write() method that accepts str; this
    script passes sys.stdout (for -h) or sys.stderr (for usage errors).
    """
    synopsis = "usage: ashd-wsgi3 [-hAL] [-m PDM-SPEC] [-p MODPATH] [-l REQLIMIT] HANDLER-MODULE [ARGS...]\n"
    out.write(synopsis)
c270f222 12
# Defaults for the command-line switches parsed below.
reqlimit = 0            # -l: maximum number of concurrent requests; 0 means no limit
modwsgi_compat = False  # -A: use the handler module's `application' object instead of wmain()
setlog = True           # -L clears this, leaving the logging module unconfigured

try:
    # getopt.getopt() stops at the first non-option argument, so anything
    # after HANDLER-MODULE is left untouched in `args' for the handler.
    opts, args = getopt.getopt(sys.argv[1:], "+hALp:l:m:")
except getopt.GetoptError as exc:
    # Report bad switches as a usage error instead of dying with a traceback.
    sys.stderr.write("ashd-wsgi3: %s\n" % exc)
    usage(sys.stderr)
    sys.exit(1)
for o, a in opts:
    if o == "-h":
        usage(sys.stdout)
        sys.exit(0)
    elif o == "-p":
        # Prepend so the given directory wins over the default module path.
        sys.path.insert(0, a)
    elif o == "-L":
        setlog = False
    elif o == "-A":
        modwsgi_compat = True
    elif o == "-l":
        try:
            reqlimit = int(a)
        except ValueError:
            sys.stderr.write("ashd-wsgi3: invalid request limit: %s\n" % a)
            usage(sys.stderr)
            sys.exit(1)
    elif o == "-m":
        # pdm is None when the optional pdm.srv import at the top of the
        # file failed; in that case -m is silently ignored.
        if pdm is not None:
            pdm.srv.listen(a)
if len(args) < 1:
    # HANDLER-MODULE is mandatory.
    usage(sys.stderr)
    sys.exit(1)
if setlog:
    logging.basicConfig(format="ashd-wsgi3(%(name)s): %(levelname)s: %(message)s")
log = logging.getLogger("ashd-wsgi3")
c270f222
FT
38
# Import the handler module named by the first positional argument.  A
# non-empty fromlist makes __import__ return the named (sub)module itself
# rather than the top-level package of a dotted name.
try:
    handlermod = __import__(args[0], fromlist = ["dummy"])
except ImportError as exc:
    # Format the exception itself: exc.args may be empty (e.g. a bare
    # `raise ImportError' inside the handler module), in which case
    # exc.args[0] would raise IndexError and hide the real problem.
    sys.stderr.write("ashd-wsgi3: handler %s not found: %s\n" % (args[0], exc))
    sys.exit(1)
if not modwsgi_compat:
    # Native mode: the module's wmain() is called with the remaining
    # command-line arguments and returns the WSGI callable.
    if not hasattr(handlermod, "wmain"):
        sys.stderr.write("ashd-wsgi3: handler %s has no `wmain' function\n" % args[0])
        sys.exit(1)
    handler = handlermod.wmain(*args[1:])
else:
    # -A mode: the module exposes the WSGI callable directly as `application'.
    if not hasattr(handlermod, "application"):
        sys.stderr.write("ashd-wsgi3: handler %s has no `application' object\n" % args[0])
        sys.exit(1)
    handler = handlermod.application
54
81a0ca30
FT
class closed(IOError):
    """Signals that the client connection went away while responding.

    Takes no constructor arguments; the exception always carries the
    same fixed message.
    """

    def __init__(self):
        IOError.__init__(self, "The client has closed the connection.")
81a0ca30 58
70d942a7
FT
# Working directory captured once when the script starts; relative paths
# are resolved against it.
cwd = os.getcwd()
def absolutify(path):
    """Return *path* as an absolute path.

    path -- a str path.  A path that already starts with '/' is returned
    unchanged; anything else (including the empty string, which used to
    raise IndexError) is joined onto the start-up working directory.
    """
    if not path.startswith('/'):
        return os.path.join(cwd, path)
    return path
64
def _hexval(byte):
    """Return the value (0-15) of the ASCII hex digit *byte*.

    byte -- an int, as obtained by indexing a bytes-like object.
    Raises ValueError if it is not one of 0-9, a-f or A-F.
    """
    if ord(b'0') <= byte <= ord(b'9'):
        return byte - ord(b'0')
    if ord(b'a') <= byte <= ord(b'f'):
        return byte - ord(b'a') + 10
    if ord(b'A') <= byte <= ord(b'F'):
        return byte - ord(b'A') + 10
    raise ValueError("Illegal URL escape character")

def unquoteurl(url):
    """Decode %XX escapes in the bytes-like *url*.

    Every other byte is copied through unchanged ('+' is not treated
    specially).

    Returns a new bytearray with the decoded bytes.
    Raises ValueError if a '%' is followed by fewer than two bytes or by
    a byte that is not a hexadecimal digit.
    """
    buf = bytearray()
    i = 0
    while i < len(url):
        c = url[i]
        i += 1
        if c == ord(b'%'):
            # i now points at the first of the two hex digits.
            if len(url) < i + 2:
                raise ValueError("Incomplete URL escape character")
            c = (_hexval(url[i]) << 4) | _hexval(url[i + 1])
            i += 2
        buf.append(c)
    return buf
81a0ca30 97
c270f222
FT
def dowsgi(req):
    """Run the WSGI handler for one ashd request and write its response.

    Builds a WSGI environ dictionary from *req*, calls the module-level
    `handler' with it, and writes the status line, headers and body
    chunks to req.sk.  If writing fails with IOError the request is
    abandoned quietly (see `closed').

    req -- the ashd request object.  This function reads its `headers',
    `ver', `method', `url', `rest' and `sk' attributes and uses
    `name in req' / `req[name]' for header lookup; those values are
    handled as bytes here.
    """
    env = {}
    env["wsgi.version"] = 1, 0
    # Expose every request header CGI-style: upper-cased, dashes turned
    # into underscores, prefixed with HTTP_ and decoded as latin-1.
    for key, val in req.headers:
        env["HTTP_" + key.upper().replace(b"-", b"_").decode("latin-1")] = val.decode("latin-1")
    env["SERVER_SOFTWARE"] = "ashd-wsgi/1"
    env["GATEWAY_INTERFACE"] = "CGI/1.1"
    env["SERVER_PROTOCOL"] = req.ver.decode("latin-1")
    env["REQUEST_METHOD"] = req.method.decode("latin-1")
    try:
        rawpi = unquoteurl(req.rest)
    except ValueError:
        # Malformed %-escapes: fall back to the still-quoted rest string.
        rawpi = req.rest
    # Prefer UTF-8 for the URL parts; if any of them is not valid UTF-8,
    # decode all of them as latin-1 (which cannot fail) and say so.
    try:
        name, rest, pi = (v.decode("utf-8") for v in (req.url, req.rest, rawpi))
        env["wsgi.uri_encoding"] = "utf-8"
    except UnicodeError:
        name, rest, pi = (v.decode("latin-1") for v in (req.url, req.rest, rawpi))
        env["wsgi.uri_encoding"] = "latin-1"
    env["REQUEST_URI"] = name
    # Split off the query string, if any.
    p = name.find('?')
    if p >= 0:
        env["QUERY_STRING"] = name[p + 1:]
        name = name[:p]
    else:
        env["QUERY_STRING"] = ""
    # NOTE: this must stay a slice comparison.  With an empty `rest',
    # name[-0:] is the whole of `name', so nothing is stripped unless
    # `name' is empty too; str.endswith() would behave differently.
    if name[-len(rest):] == rest:
        # This is the same hack used in call*cgi.
        name = name[:-len(rest)]
    if name == "/":
        # This seems to be normal CGI behavior, but see callcgi.c for
        # details.
        pi = "/" + pi
        name = ""
    env["SCRIPT_NAME"] = name
    env["PATH_INFO"] = pi
    # Copy selected headers to their conventional CGI/WSGI variable names.
    for src, tgt in [("HTTP_HOST", "SERVER_NAME"), ("HTTP_X_ASH_SERVER_PORT", "SERVER_PORT"),
                     ("HTTP_X_ASH_ADDRESS", "REMOTE_ADDR"), ("HTTP_CONTENT_TYPE", "CONTENT_TYPE"),
                     ("HTTP_CONTENT_LENGTH", "CONTENT_LENGTH"), ("HTTP_X_ASH_PROTOCOL", "wsgi.url_scheme")]:
        if src in env: env[tgt] = env[src]
    if "X-Ash-Protocol" in req and req["X-Ash-Protocol"] == b"https": env["HTTPS"] = "on"
    if "X-Ash-File" in req: env["SCRIPT_FILENAME"] = absolutify(req["X-Ash-File"].decode(locale.getpreferredencoding()))
    env["wsgi.input"] = req.sk
    env["wsgi.errors"] = sys.stderr
    env["wsgi.multithread"] = True
    env["wsgi.multiprocess"] = False
    env["wsgi.run_once"] = False

    # Both lists are used as mutable cells shared by the closures below:
    # `resp' holds [status, headers] once startreq() has been called, and
    # `respsent' becomes non-empty once the header block has been written.
    resp = []
    respsent = []

    def recode(thing):
        """Return *thing* as bytes for the wire.

        bytes/bytearray pass through unchanged; anything else is
        converted with str() and encoded as latin-1.
        """
        # collections.ByteString no longer exists (the ABC aliases were
        # removed from `collections' in Python 3.10), so test the
        # concrete byte types directly.
        if isinstance(thing, (bytes, bytearray)):
            return thing
        else:
            return str(thing).encode("latin-1")

    def flushreq():
        """Write the status line and headers to req.sk, once.

        Raises Exception if no response has been started yet, and
        closed if the write fails with IOError.
        """
        if not respsent:
            if not resp:
                raise Exception("Trying to write data before starting response.")
            status, headers = resp
            respsent[:] = [True]
            buf = bytearray()
            buf += b"HTTP/1.1 " + recode(status) + b"\n"
            for nm, val in headers:
                buf += recode(nm) + b": " + recode(val) + b"\n"
            buf += b"\n"
            try:
                req.sk.write(buf)
            except IOError:
                raise closed()

    def write(data):
        """Send one body chunk, emitting the headers first if needed.

        Empty chunks are ignored and do not trigger the headers.
        Raises closed if the write or flush fails with IOError.
        """
        if not data:
            return
        flushreq()
        try:
            req.sk.write(data)
            req.sk.flush()
        except IOError:
            raise closed()

    def startreq(status, headers, exc_info = None):
        """The WSGI start_response callable; returns write().

        A second call is only accepted when exc_info is given; if the
        headers have already been sent by then, the exception in
        exc_info is re-raised (the behavior PEP 3333 asks for).
        """
        if resp:
            if exc_info:                # Interesting, this...
                try:
                    if respsent:
                        raise exc_info[1]
                finally:
                    # Drop the local reference to the exception info
                    # (PEP 3333 recommends this to avoid a reference cycle).
                    exc_info = None     # CPython GC bug?
            else:
                raise Exception("Can only start responding once.")
        resp[:] = status, headers
        return write

    with ashd.perf.request(env) as reqevent:
        try:
            respiter = handler(env, startreq)
            try:
                for data in respiter:
                    write(data)
                # A response with no (non-empty) body chunks still needs
                # its headers sent.
                if resp:
                    flushreq()
            finally:
                # WSGI requires close() to be called on the iterable if
                # it has one, whether or not iteration completed.
                if hasattr(respiter, "close"):
                    respiter.close()
        except closed:
            # The client went away; nothing more can be sent.
            pass
        if resp:
            reqevent.response(resp)
c270f222 209
3e11d7ed
FT
# Condition protecting `inflight'; also used to wake threads that are
# waiting for a free request slot.
flightlock = threading.Condition()
# Number of request threads currently holding a slot.
inflight = 0

class reqthread(threading.Thread):
    """Thread that serves a single request through dowsgi().

    The constructor keeps its own duplicate of the request (req.dup()),
    which run() closes when it is done.
    """

    def __init__(self, req):
        threading.Thread.__init__(self, name = "Request handler")
        self.req = req.dup()

    def _takeslot(self):
        """Claim a request slot, waiting for one if reqlimit is set.

        Aborts the whole process if more than 10 seconds have passed
        since the wait began and the limit is still reached on wake-up.
        """
        global inflight
        with flightlock:
            if reqlimit != 0:
                began = time.time()
                while inflight >= reqlimit:
                    flightlock.wait(10)
                    waited = time.time() - began
                    if waited > 10:
                        os.abort()
            inflight += 1

    def _dropslot(self):
        """Give the slot back and wake one waiting thread."""
        global inflight
        with flightlock:
            inflight -= 1
            flightlock.notify()

    def run(self):
        """Serve the request; log any exception and always close it."""
        try:
            self._takeslot()
            try:
                dowsgi(self.req)
            finally:
                self._dropslot()
        except:
            log.error("exception occurred in handler thread", exc_info=True)
        finally:
            self.req.close()
            sys.stderr.flush()
c270f222
FT
240
def handle(req):
    """Start a new reqthread for *req* and return without waiting for it."""
    worker = reqthread(req)
    worker.start()

# Hand control to the ashd serve loop with handle() as its callback
# (presumably invoked once per incoming request -- see ashd.util).
ashd.util.serveloop(handle)