chiark / gitweb /
hippotat: Convert an explicitly configured URL to ASCII.
[hippotat] / hippotat
CommitLineData
c55f394e 1#!/usr/bin/python3
6b926141
IJ
2#
3# Hippotat - Asinine IP Over HTTP program
4# ./hippotat - client main program
5#
6# Copyright 2017 Ian Jackson
7#
f85d143f 8# GPLv3+
6b926141 9#
f85d143f
IJ
10# This program is free software: you can redistribute it and/or modify
11# it under the terms of the GNU General Public License as published by
12# the Free Software Foundation, either version 3 of the License, or
13# (at your option) any later version.
6b926141 14#
f85d143f
IJ
15# This program is distributed in the hope that it will be useful,
16# but WITHOUT ANY WARRANTY; without even the implied warranty of
17# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18# GNU General Public License for more details.
19#
20# You should have received a copy of the GNU General Public License
21# along with this program, in the file GPLv3. If not,
22# see <http://www.gnu.org/licenses/>.
6b926141 23
1d33eef3 24#@ import sys; sys.path.append('@PYBUILD_INSTALL_DIR@')
5a37bac8 25from hippotatlib import *
c55f394e 26
c0c90673
IJ
27import twisted.web
28import twisted.web.client
e13eca8e 29import urllib.parse
c0c90673 30
dd6665ee
IJ
31import io
32
class GeneralResponseConsumer(twisted.internet.protocol.Protocol):
    """Shared base for the protocols that consume an HTTP response body.

    Stores the owning client (cl), the request (req), the response (resp)
    and a short description (desc) which prefixes every log message.
    """

    def __init__(self, cl, req, resp, desc):
        self._cl = cl
        self._req = req
        self._resp = resp
        self._desc = desc

    def _log(self, dflag, msg, **kwargs):
        """Log msg through the client, prefixed with our description.

        The request is passed as idof=; extra keyword arguments are
        forwarded unchanged to the client's log method.
        """
        prefixed = '%s: %s' % (self._desc, msg)
        self._cl.log(dflag, prefixed, idof=self._req, **kwargs)

    def connectionMade(self):
        self._log(DBG.HTTP_CTRL, 'connectionMade')

    def connectionLostOK(self, reason):
        """Return a true value iff reason is an acceptable end of body.

        reason must offer .check() (presumably a twisted Failure).
        """
        # twisted.web.client.PotentialDataLoss is an entirely daft
        # exception.  It will occur every time if the origin server does
        # not provide a Content-Length.  (hippotatd does, of course, but
        # the HTTP transaction might be proxied.)
        done = reason.check(twisted.web.client.ResponseDone)
        if done:
            return done
        return reason.check(twisted.web.client.PotentialDataLoss)
216519e3 53
class ResponseConsumer(GeneralResponseConsumer):
    """Consumer for the body of a response with status 200.

    Body data is fed to a SlipStreamDecoder, whose output callback is
    queue_inbound bound to the client's ipif.
    """

    def __init__(self, cl, req, resp):
        super().__init__(cl, req, resp, 'RC')
        decoder_desc = '[%s] %s' % (id(req), self._desc)
        deliver = partial(queue_inbound, cl.ipif)
        self._ssd = SlipStreamDecoder(decoder_desc, deliver)
        self._log(DBG.HTTP_CTRL, '__init__')

    def dataReceived(self, data):
        """Pass a chunk of body data to the decoder.

        Any exception from the decoder is reported as a late failure of
        the request rather than propagated.
        """
        self._log(DBG.HTTP, 'dataReceived', d=data)
        try:
            self._ssd.inputdata(data)
        except Exception:
            self._handleexception()

    def connectionLost(self, reason):
        """Finish the request, or fail it if the body ended badly."""
        reason_msg = 'connectionLost ' + str(reason)
        self._log(DBG.HTTP_CTRL, reason_msg)
        if self.connectionLostOK(reason):
            try:
                self._log(DBG.HTTP, 'ResponseDone')
                self._ssd.flush()
                self._cl.req_fin(self._req)
            except Exception:
                self._handleexception()
            # Reached whether or not the flush/req_fin step raised.
            self._cl.report_running()
        else:
            self._latefailure(reason_msg)

    def _handleexception(self):
        """Report the exception currently being handled as a late failure."""
        self._latefailure(traceback.format_exc())

    def _latefailure(self, reason):
        """Log reason and hand it to the client as this request's error."""
        self._log(DBG.HTTP_CTRL, '_latefailure ' + str(reason))
        self._cl.req_err(self._req, reason)
bd9e77fb 88
class ErrorResponseConsumer(GeneralResponseConsumer):
    """Consumer for the body of a response whose status is not 200.

    The whole body is accumulated and, once the connection is lost,
    reported to the client via req_err together with the status code and
    reason phrase.
    """

    def __init__(self, cl, req, resp):
        super().__init__(cl, req, resp, 'ERROR-RC')
        self._m = b''
        # Prefer the phrase as text; fall back to its repr if it cannot
        # be decoded as UTF-8.
        try:
            phrase = resp.phrase.decode('utf-8')
        except Exception:
            phrase = repr(resp.phrase)
        self._phrase = phrase
        self._log(DBG.HTTP_CTRL, '__init__ %d %s' % (resp.code, self._phrase))

    def dataReceived(self, data):
        self._log(DBG.HTTP_CTRL, 'dataReceived ' + repr(data))
        self._m += data

    def connectionLost(self, reason):
        """Report the collected error body to the client as a failure.

        If the body did not end cleanly, the reason is appended to the
        message.
        """
        try:
            body_text = self._m.decode('utf-8')
        except Exception:
            body_text = repr(self._m)
        parts = [body_text]
        if not self.connectionLostOK(reason):
            parts.append(str(reason))
        mbody = ' || '.join(parts)
        message = "FAILED %d %s | %s" % (self._resp.code, self._phrase, mbody)
        self._cl.req_err(self._req, message)
6e4af0a2 113
c7fb640e
IJ
class Client():
    """State and HTTP request machinery for one configured client.

    Methods name their instance parameter `cl' rather than `self'.

    Attributes:
      c                 the configuration object passed to __init__
      outstanding       dict keyed by the object returned from
                        agent.request(); the value is the length of the
                        data sent with that request (an int) while it is
                        pending, or the error text once req_err has
                        dealt with it
      desc              '[ss cs] ' prefix used on all log messages
      running_reported  whether 'running OK' has been logged since the
                        last error
      queue, agent      created by start()
    """

    def __init__(cl, c, ss, cs):
        cl.c = c
        cl.outstanding = {}
        cl.desc = '[%s %s] ' % (ss, cs)
        cl.running_reported = False
        cl.log_info('setting up')

    def log_info(cl, msg):
        log.info(cl.desc + msg, dflag=False)

    def report_running(cl):
        """Log 'running OK' once; req_err re-arms it by clearing the flag."""
        if not cl.running_reported:
            cl.log_info('running OK')
            cl.running_reported = True

    def log(cl, dflag, msg, **kwargs):
        log_debug(dflag, cl.desc + msg, **kwargs)

    def log_outstanding(cl):
        cl.log(DBG.CTRL_DUMP, 'OS %s' % cl.outstanding)

    def start(cl):
        """Create the upbound packet queue and the HTTP agent."""
        cl.queue = PacketQueue('up', cl.c.max_queue_time)
        cl.agent = twisted.web.client.Agent(
            reactor, connectTimeout=cl.c.http_timeout)

    def outbound(cl, packet, saddr, daddr):
        """Queue one outbound packet and try to send.

        saddr and daddr are accepted but not used here.
        """
        cl.queue.append(packet)
        cl.check_outbound()

    def req_ok(cl, req, resp):
        """Callback for a request whose response headers have arrived.

        Hands the body to a ResponseConsumer for status 200, or to an
        ErrorResponseConsumer for anything else.
        """
        cl.log(DBG.HTTP_CTRL,
               'req_ok %d %s %s' % (resp.code, repr(resp.phrase), str(resp)),
               idof=req)
        if resp.code == 200:
            rc = ResponseConsumer(cl, req, resp)
        else:
            rc = ErrorResponseConsumer(cl, req, resp)

        resp.deliverBody(rc)
        # now rc is responsible for calling req_fin

    def req_err(cl, req, err):
        """Record a failed request and schedule its removal.

        Called when the Deferred fails, or (if it completes) later, by
        ResponseConsumer or ErrorResponseConsumer.

        err is either a twisted Failure or a string.  The error is
        printed to stderr and stored in cl.outstanding[req]; req_fin is
        then scheduled after cl.c.http_retry, so the slot stays occupied
        until the retry delay has passed.  Any exception raised while
        doing this is passed to crash().
        """
        try:
            cl.log(DBG.HTTP_CTRL, 'req_err ' + str(err), idof=req)
            cl.running_reported = False
            if isinstance(err, twisted.python.failure.Failure):
                err = err.getTraceback()
            print('%s[%#x] %s' % (cl.desc, id(req),
                                  err.strip('\n').replace('\n', ' / ')),
                  file=sys.stderr)
            # A non-int value means an error was already recorded for
            # this request; being called twice for it is a bug.
            if not isinstance(cl.outstanding[req], int):
                raise RuntimeError('[%#x] previously %s' %
                                   (id(req), cl.outstanding[req]))
            cl.outstanding[req] = err
            cl.log_outstanding()
            reactor.callLater(cl.c.http_retry, partial(cl.req_fin, req))
        except Exception:
            # err may still be a Failure if we failed before converting
            # it above, so coerce it rather than risk a TypeError here.
            crash(traceback.format_exc() + '\n----- handling -----\n'
                  + str(err))

    def req_fin(cl, req):
        """Forget a finished (or failed and timed-out) request."""
        del cl.outstanding[req]
        cl.log(DBG.HTTP_CTRL, 'req_fin OS=%d' % len(cl.outstanding), idof=req)
        cl.check_outbound()

    def check_outbound(cl):
        """Issue POST requests until no more should be started.

        Stops when max_outstanding requests are in flight, or when the
        queue is empty and at least target_requests_outstanding are in
        flight.  While fewer than the target are in flight, a request is
        sent even if there is no data to carry.
        """
        while True:
            if len(cl.outstanding) >= cl.c.max_outstanding:
                break

            if (not cl.queue.nonempty() and
                    len(cl.outstanding) >= cl.c.target_requests_outstanding):
                break

            d = b''

            def moredata(s):
                nonlocal d
                d += s

            # presumably collects queued packets into d, bounded by
            # max_batch_up -- confirm against PacketQueue.process
            cl.queue.process((lambda: len(d)),
                             moredata,
                             cl.c.max_batch_up)

            d = mime_translate(d)

            token = authtoken_make(cl.c.secret)

            # Part "m" carries the metadata, one item per line; part "d"
            # (the data) is included only when there is data to send.
            crlf = b'\r\n'
            mime = (b'--b' + crlf +
                    b'Content-Type: text/plain; charset="utf-8"' + crlf +
                    b'Content-Disposition: form-data; name="m"' + crlf + crlf +
                    str(cl.c.client).encode('ascii') + crlf +
                    token + crlf +
                    str(cl.c.target_requests_outstanding)
                    .encode('ascii') + crlf +
                    str(cl.c.http_timeout).encode('ascii') + crlf +
                    ((
                        b'--b' + crlf +
                        b'Content-Type: application/octet-stream' + crlf +
                        b'Content-Disposition: form-data; name="d"'
                        + crlf + crlf +
                        d + crlf
                    ) if d else b'') +
                    b'--b--' + crlf)

            #df = open('data.dump.dbg', mode='wb')
            #df.write(mime)
            #df.close()
            # POST -use -c 'multipart/form-data; boundary="b"' http://localhost:8099/ <data.dump.dbg

            cl.log(DBG.HTTP_FULL, 'requesting: ' + str(mime))

            hh = {'User-Agent': ['hippotat'],
                  'Content-Type': ['multipart/form-data; boundary="b"']}

            bytesreader = io.BytesIO(mime)
            producer = twisted.web.client.FileBodyProducer(bytesreader)

            req = cl.agent.request(b'POST',
                                   cl.c.url,
                                   twisted.web.client.Headers(hh),
                                   producer)

            cl.outstanding[req] = len(d)
            cl.log(DBG.HTTP_CTRL,
                   'request OS=%d' % len(cl.outstanding),
                   idof=req, d=d)
            req.addTimeout(cl.c.http_timeout, reactor)
            req.addCallback(partial(cl.req_ok, req))
            req.addErrback(partial(cl.req_err, req))

            # NOTE(review): assumed to run once per request issued (i.e.
            # inside the loop) -- confirm; it only affects debug output.
            cl.log_outstanding()
246
# Every Client built from the configuration: process_cfg appends to this
# list and the startup code at the end of the file iterates over it.
clients = [ ]
248
e13eca8e
MW
def encode_url(urlstr):
    """Return urlstr as ASCII-only bytes.

    Oh, this is a disaster.  We're given a URL as a `str', but the
    underlying machinery insists on having `bytes'.  Assume we've been
    given a sensible URL, with escaping in all of the necessary places,
    except that it may contain non-ASCII characters: then encode as UTF-8
    and squash the top-bit-set bytes down to percent escapes.

    ASCII bytes (including any existing `%' escapes) pass through
    unchanged; every byte >= 0x80 becomes `%XX' with upper-case hex.
    """
    # This conses like it's going out of fashion, but it gets the job done.
    #
    # Both arms must yield bytes: b''.join() rejects str items, so the
    # formatted escape is encoded before being joined.
    return b''.join(bytes([b]) if b < 128
                    else ('%%%02X' % b).encode('ascii')
                    for b in urlstr.encode('utf-8'))
259
def process_cfg(_opts, putative_servers, putative_clients):
    """Build a Client for every usable (server, client) combination.

    For each server in putative_servers and each client in
    putative_clients, a ConfigResults is filled in from the applicable
    config sections and a Client made from it is appended to the global
    `clients' list.  Combinations for which cfg_process_client_common
    returns no sections are skipped.  _opts is not used.
    """
    global clients

    for ss in putative_servers.values():
        for ci, cs in putative_clients.items():
            c = ConfigResults()

            sections = cfg_process_client_common(c, ss, cs, ci)
            if not sections:
                continue

            log_debug_config('processing client [%s %s]' % (ss, cs))

            # The grace period is added on top of the http_timeout that
            # c already carries at this point.
            c.http_timeout += cfg_search(cfg.getint, 'http_timeout_grace',
                                         sections)
            c.max_outstanding = cfg_search(cfg.getint,
                                           'max_requests_outstanding',
                                           sections)
            c.max_batch_up = cfg_search(cfg.getint, 'max_batch_up', sections)
            c.http_retry = cfg_search(cfg.getint, 'http_retry', sections)
            c.max_queue_time = cfg_search(cfg.getint, 'max_queue_time',
                                          sections)
            c.vroutes = cfg_search(cfg.get, 'vroutes', sections)

            # ifname_client is optional; when absent c.ifname is left
            # untouched.
            try:
                c.ifname = cfg_search(cfg_get_raw, 'ifname_client', sections)
            except NoOptionError:
                pass

            # An explicitly configured URL wins; otherwise derive one
            # from the first of the server's addresses.
            try:
                configured_url = cfg_search(cfg.get, 'url', sections)
            except NoOptionError:
                cfg_process_saddrs(c, ss)
                c.url = c.saddrs[0].url()
            else:
                c.url = encode_url(configured_url)

            c.client = ci

            cfg_process_vaddr(c, ss)

            ipif_substitutions = (('local', 'client'),
                                  ('peer', 'vaddr'),
                                  ('rnets', 'vroutes'))
            cfg_process_ipif(c, sections, ipif_substitutions)

            clients.append(Client(c, ss, cs))
0accf0d3 300
# Hand our config processor to the shared startup code (presumably it
# reads the options and configuration and then calls process_cfg, which
# populates `clients' -- confirm in hippotatlib).
common_startup(process_cfg)

# Bring up each client: create its queue and HTTP agent, attach its ipif
# with cl.outbound as the packet callback, then start issuing requests.
for cl in clients:
    cl.start()
    cl.ipif = start_ipif(cl.c.ipif_command, cl.outbound)
    cl.check_outbound()

common_run()