chiark / gitweb /
polypath asymmetric routing: Handle data packet dupes
[secnet.git] / site.c
1 /* site.c - manage communication with a remote network site */
2
3 /*
4  * This file is part of secnet.
5  * See README for full list of copyright holders.
6  *
7  * secnet is free software; you can redistribute it and/or modify it
8  * under the terms of the GNU General Public License as published by
9  * the Free Software Foundation; either version 3 of the License, or
10  * (at your option) any later version.
11  * 
12  * secnet is distributed in the hope that it will be useful, but
13  * WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15  * General Public License for more details.
16  * 
17  * You should have received a copy of the GNU General Public License
18  * version 3 along with secnet; if not, see
19  * https://www.gnu.org/licenses/gpl.html.
20  */
21
22 /* The 'site' code doesn't know anything about the structure of the
23    packets it's transmitting.  In fact, under the new netlink
24    configuration scheme it doesn't need to know anything at all about
25    IP addresses, except how to contact its peer.  This means it could
26    potentially be used to tunnel other protocols too (IPv6, IPX, plain
27    old Ethernet frames) if appropriate netlink code can be written
28    (and that ought not to be too hard, eg. using the TUN/TAP device to
29    pretend to be an Ethernet interface).  */
30
31 /* At some point in the future the netlink code will be asked for
32    configuration information to go in the PING/PONG packets at the end
33    of the key exchange. */
34
35 #include "secnet.h"
36 #include <stdio.h>
37 #include <string.h>
38 #include <limits.h>
39 #include <assert.h>
40 #include <sys/socket.h>
41
42 #include <sys/mman.h>
43 #include "util.h"
44 #include "unaligned.h"
45 #include "magic.h"
46
47 #define SETUP_BUFFER_LEN 2048
48
49 #define DEFAULT_KEY_LIFETIME                  (3600*1000) /* [ms] */
50 #define DEFAULT_KEY_RENEGOTIATE_GAP           (5*60*1000) /* [ms] */
51 #define DEFAULT_SETUP_RETRIES 5
52 #define DEFAULT_SETUP_RETRY_INTERVAL             (2*1000) /* [ms] */
53 #define DEFAULT_WAIT_TIME                       (20*1000) /* [ms] */
54
55 #define DEFAULT_MOBILE_KEY_LIFETIME      (2*24*3600*1000) /* [ms] */
56 #define DEFAULT_MOBILE_KEY_RENEGOTIATE_GAP (12*3600*1000) /* [ms] */
57 #define DEFAULT_MOBILE_SETUP_RETRIES 30
58 #define DEFAULT_MOBILE_SETUP_RETRY_INTERVAL      (1*1000) /* [ms] */
59 #define DEFAULT_MOBILE_WAIT_TIME                (10*1000) /* [ms] */
60
61 #define DEFAULT_MOBILE_PEER_EXPIRY            (2*60)      /* [s] */
62
63 /* Each site can be in one of several possible states. */
64
65 /* States:
66    SITE_STOP         - nothing is allowed to happen; tunnel is down;
67                        all session keys have been erased
68      -> SITE_RUN upon external instruction
69    SITE_RUN          - site up, maybe with valid key
70      -> SITE_RESOLVE upon outgoing packet and no valid key
71          we start name resolution for the other end of the tunnel
72      -> SITE_SENTMSG2 upon valid incoming message 1 and suitable time
73          we send an appropriate message 2
74    SITE_RESOLVE      - waiting for name resolution
75      -> SITE_SENTMSG1 upon successful resolution
76          we send an appropriate message 1
77      -> SITE_SENTMSG2 upon valid incoming message 1 (then abort resolution)
78          we abort resolution and 
79      -> SITE_WAIT on timeout or resolution failure
80    SITE_SENTMSG1
81      -> SITE_SENTMSG2 upon valid incoming message 1 from higher priority end
82      -> SITE_SENTMSG3 upon valid incoming message 2
83      -> SITE_WAIT on timeout
84    SITE_SENTMSG2
85      -> SITE_SENTMSG4 upon valid incoming message 3
86      -> SITE_WAIT on timeout
87    SITE_SENTMSG3
88      -> SITE_SENTMSG5 upon valid incoming message 4
89      -> SITE_WAIT on timeout
90    SITE_SENTMSG4
91      -> SITE_RUN upon valid incoming message 5
92      -> SITE_WAIT on timeout
93    SITE_SENTMSG5
94      -> SITE_RUN upon valid incoming message 6
95      -> SITE_WAIT on timeout
96    SITE_WAIT         - failed to establish key; do nothing for a while
97      -> SITE_RUN on timeout
98    */
99
100 #define SITE_STOP     0
101 #define SITE_RUN      1
102 #define SITE_RESOLVE  2
103 #define SITE_SENTMSG1 3
104 #define SITE_SENTMSG2 4
105 #define SITE_SENTMSG3 5
106 #define SITE_SENTMSG4 6
107 #define SITE_SENTMSG5 7
108 #define SITE_WAIT     8
109
110 int32_t site_max_start_pad = 4*4;
111
112 static cstring_t state_name(uint32_t state)
113 {
114     switch (state) {
115     case 0: return "STOP";
116     case 1: return "RUN";
117     case 2: return "RESOLVE";
118     case 3: return "SENTMSG1";
119     case 4: return "SENTMSG2";
120     case 5: return "SENTMSG3";
121     case 6: return "SENTMSG4";
122     case 7: return "SENTMSG5";
123     case 8: return "WAIT";
124     default: return "*bad state*";
125     }
126 }
127
128 #define NONCELEN 8
129
130 #define LOG_UNEXPECTED    0x00000001
131 #define LOG_SETUP_INIT    0x00000002
132 #define LOG_SETUP_TIMEOUT 0x00000004
133 #define LOG_ACTIVATE_KEY  0x00000008
134 #define LOG_TIMEOUT_KEY   0x00000010
135 #define LOG_SEC           0x00000020
136 #define LOG_STATE         0x00000040
137 #define LOG_DROP          0x00000080
138 #define LOG_DUMP          0x00000100
139 #define LOG_ERROR         0x00000400
140 #define LOG_PEER_ADDRS    0x00000800
141
142 static struct flagstr log_event_table[]={
143     { "unexpected", LOG_UNEXPECTED },
144     { "setup-init", LOG_SETUP_INIT },
145     { "setup-timeout", LOG_SETUP_TIMEOUT },
146     { "activate-key", LOG_ACTIVATE_KEY },
147     { "timeout-key", LOG_TIMEOUT_KEY },
148     { "security", LOG_SEC },
149     { "state-change", LOG_STATE },
150     { "packet-drop", LOG_DROP },
151     { "dump-packets", LOG_DUMP },
152     { "errors", LOG_ERROR },
153     { "peer-addrs", LOG_PEER_ADDRS },
154     { "default", LOG_SETUP_INIT|LOG_SETUP_TIMEOUT|
155       LOG_ACTIVATE_KEY|LOG_TIMEOUT_KEY|LOG_SEC|LOG_ERROR },
156     { "all", 0xffffffff },
157     { NULL, 0 }
158 };
159
160
161 /***** TRANSPORT PEERS declarations *****/
162
163 /* Details of "mobile peer" semantics:
164
165    - We use the same data structure for the different configurations,
166      but manage it with different algorithms.
167    
168    - We record up to mobile_peers_max peer address/port numbers
169      ("peers") for key setup, and separately up to mobile_peers_max
170      for data transfer.
171
172    - In general, we make a new set of addrs (see below) when we start
173      a new key exchange; the key setup addrs become the data transport
174      addrs when key setup complets.
175
176    If our peer is mobile:
177
178    - We send to all recent addresses of incoming packets, plus
179      initially all configured addresses (which we also expire).
180
181    - So, we record addrs of good incoming packets, as follows:
182       1. expire any peers last seen >120s ("mobile-peer-expiry") ago
183       2. add the peer of the just received packet to the applicable list
184          (possibly evicting the oldest entries to make room)
185      NB that we do not expire peers until an incoming packet arrives.
186
187    - If the peer has a configured address or name, we record them the
188      same way, but only as a result of our own initiation of key
189      setup.  (We might evict some incoming packet addrs to make room.)
190
191    - The default number of addrs to keep is 3, or 4 if we have a
192      configured name or address.  That's space for two configured
193      addresses (one IPv6 and one IPv4), plus two received addresses.
194
195    - Outgoing packets are sent to every recorded address in the
196      applicable list.  Any unsupported[1] addresses are deleted from
197      the list right away.  (This should only happen to configured
198      addresses, of course, but there is no need to check that.)
199
200    - When we successfully complete a key setup, we merge the key setup
201      peers into the data transfer peers.
202
203    [1] An unsupported address is one for whose AF we don't have a
204      socket (perhaps because we got EAFNOSUPPORT or some such) or for
205      which sendto gives ENETUNREACH.
206
207    If neither end is mobile:
208
209    - When peer initiated the key exchange, we use the incoming packet
210      address.
211
212    - When we initiate the key exchange, we try configured addresses
213      until we get one which isn't unsupported then fixate on that.
214
215    - When we complete a key setup, we replace the data transport peers
216      with those from the key setup.
217
218    If we are mobile:
219
220    - We can't tell when local network setup changes so we can't cache
221      the unsupported addrs and completely remove the spurious calls to
222      sendto, but we can optimise things a bit by deprioritising addrs
223      which seem to be unsupported.
224
225    - Use only configured addresses.  (Except, that if our peer
226      initiated a key exchange we use the incoming packet address until
227      our name resolution completes.)
228
229    - When we send a packet, try each address in turn; if addr
230      supported, put that address to the end of the list for future
231      packets, and go onto the next address.
232
233    - When we complete a key setup, we replace the data transport peers
234      with those from the key setup.
235
236    */
237
238 typedef struct {
239     struct timeval last;
240     struct comm_addr addr;
241 } transport_peer;
242
243 typedef struct {
244 /* configuration information */
245 /* runtime information */
246     int npeers;
247     transport_peer peers[MAX_PEER_ADDRS];
248 } transport_peers;
249
250 /* Basic operations on transport peer address sets */
251 static void transport_peers_clear(struct site *st, transport_peers *peers);
252 static int transport_peers_valid(transport_peers *peers);
253 static void transport_peers_copy(struct site *st, transport_peers *dst,
254                                  const transport_peers *src);
255
256 /* Record address of incoming setup packet; resp. data packet. */
257 static void transport_setup_msgok(struct site *st, const struct comm_addr *a);
258 static void transport_data_msgok(struct site *st, const struct comm_addr *a);
259
260 /* Initialise the setup addresses.  Called before we send the first
261  * packet in a key exchange.  If we are the initiator, as a result of
262  * resolve completing (or being determined not to be relevant) or an
263  * incoming PROD; if we are the responder, as a result of the MSG1. */
264 static bool_t transport_compute_setupinit_peers(struct site *st,
265         const struct comm_addr *configured_addrs /* 0 if none or not found */,
266         int n_configured_addrs /* 0 if none or not found */,
267         const struct comm_addr *incoming_packet_addr /* 0 if none */);
268
269 /* Called if we are the responder in a key setup, when the resolve
270  * completes.  transport_compute_setupinit_peers will hvae been called
271  * earlier.  If _complete is called, we are still doing the key setup
272  * (and we should use the new values for both the rest of the key
273  * setup and the ongoing data exchange); if _tardy is called, the key
274  * setup is done (either completed or not) and only the data peers are
275  * relevant */
276 static void transport_resolve_complete(struct site *st,
277         const struct comm_addr *addrs, int naddrs);
278 static void transport_resolve_complete_tardy(struct site *st,
279         const struct comm_addr *addrs, int naddrs);
280
281 static void transport_xmit(struct site *st, transport_peers *peers,
282                            struct buffer_if *buf, bool_t candebug);
283
284  /***** END of transport peers declarations *****/
285
286
287 struct data_key {
288     struct transform_inst_if *transform;
289     uint64_t key_timeout; /* End of life of current key */
290     uint32_t remote_session_id;
291 };
292
293 struct site {
294     closure_t cl;
295     struct site_if ops;
296 /* configuration information */
297     string_t localname;
298     string_t remotename;
299     bool_t keepalive;
300     bool_t local_mobile, peer_mobile; /* Mobile client support */
301     int32_t transport_peers_max;
302     string_t tunname; /* localname<->remotename by default, used in logs */
303     cstring_t *addresses; /* DNS name or address(es) for bootstrapping, optional */
304     int remoteport; /* Port for bootstrapping, optional */
305     uint32_t mtu_target;
306     struct netlink_if *netlink;
307     struct comm_if **comms;
308     struct comm_clientinfo **commclientinfos;
309     int ncomms;
310     struct resolver_if *resolver;
311     struct log_if *log;
312     struct random_if *random;
313     struct rsaprivkey_if *privkey;
314     struct rsapubkey_if *pubkey;
315     struct transform_if **transforms;
316     int ntransforms;
317     struct dh_if *dh;
318     struct hash_if *hash;
319
320     uint32_t index; /* Index of this site */
321     uint32_t local_capabilities;
322     int32_t setup_retries; /* How many times to send setup packets */
323     int32_t setup_retry_interval; /* Initial timeout for setup packets */
324     int32_t wait_timeout; /* How long to wait if setup unsuccessful */
325     int32_t mobile_peer_expiry; /* How long to remember 2ary addresses */
326     int32_t key_lifetime; /* How long a key lasts once set up */
327     int32_t key_renegotiate_time; /* If we see traffic (or a keepalive)
328                                       after this time, initiate a new
329                                       key exchange */
330
331     bool_t our_name_later; /* our name > peer name */
332     uint32_t log_events;
333
334 /* runtime information */
335     uint32_t state;
336     uint64_t now; /* Most recently seen time */
337     bool_t allow_send_prod;
338     bool_t msg1_crossed_logged;
339     int resolving_count;
340     int resolving_n_results_all;
341     int resolving_n_results_stored;
342     struct comm_addr resolving_results[MAX_PEER_ADDRS];
343
344     /* The currently established session */
345     struct data_key current;
346     struct data_key auxiliary_key;
347     bool_t auxiliary_is_new;
348     uint64_t renegotiate_key_time; /* When we can negotiate a new key */
349     uint64_t auxiliary_renegotiate_key_time;
350     transport_peers peers; /* Current address(es) of peer for data traffic */
351
352     /* The current key setup protocol exchange.  We can only be
353        involved in one of these at a time.  There's a potential for
354        denial of service here (the attacker keeps sending a setup
355        packet; we keep trying to continue the exchange, and have to
356        timeout before we can listen for another setup packet); perhaps
357        we should keep a list of 'bad' sources for setup packets. */
358     uint32_t remote_capabilities;
359     uint16_t remote_adv_mtu;
360     struct transform_if *chosen_transform;
361     uint32_t setup_session_id;
362     transport_peers setup_peers;
363     uint8_t localN[NONCELEN]; /* Nonces for key exchange */
364     uint8_t remoteN[NONCELEN];
365     struct buffer_if buffer; /* Current outgoing key exchange packet */
366     struct buffer_if scratch;
367     int32_t retries; /* Number of retries remaining */
368     uint64_t timeout; /* Timeout for current state */
369     uint8_t *dhsecret;
370     uint8_t *sharedsecret;
371     uint32_t sharedsecretlen, sharedsecretallocd;
372     struct transform_inst_if *new_transform; /* For key setup/verify */
373 };
374
375 static uint32_t event_log_priority(struct site *st, uint32_t event)
376 {
377     if (!(event&st->log_events))
378         return 0;
379     switch(event) {
380     case LOG_UNEXPECTED:    return M_INFO;
381     case LOG_SETUP_INIT:    return M_INFO;
382     case LOG_SETUP_TIMEOUT: return M_NOTICE;
383     case LOG_ACTIVATE_KEY:  return M_INFO;
384     case LOG_TIMEOUT_KEY:   return M_INFO;
385     case LOG_SEC:           return M_SECURITY;
386     case LOG_STATE:         return M_DEBUG;
387     case LOG_DROP:          return M_DEBUG;
388     case LOG_DUMP:          return M_DEBUG;
389     case LOG_ERROR:         return M_ERR;
390     case LOG_PEER_ADDRS:    return M_DEBUG;
391     default:                return M_ERR;
392     }
393 }
394
395 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
396 FORMAT(printf,3,0);
397 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
398 {
399     uint32_t class;
400
401     class=event_log_priority(st, event);
402     if (class) {
403         slilog_part(st->log,class,"%s: ",st->tunname);
404         vslilog_part(st->log,class,msg,ap);
405         slilog_part(st->log,class,"\n");
406     }
407 }
408
409 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
410 FORMAT(printf,3,4);
411 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
412 {
413     va_list ap;
414     va_start(ap,msg);
415     vslog(st,event,msg,ap);
416     va_end(ap);
417 }
418
419 static void logtimeout(struct site *st, const char *fmt, ...)
420 FORMAT(printf,2,3);
421 static void logtimeout(struct site *st, const char *fmt, ...)
422 {
423     uint32_t class=event_log_priority(st,LOG_SETUP_TIMEOUT);
424     if (!class)
425         return;
426
427     va_list ap;
428     va_start(ap,fmt);
429
430     slilog_part(st->log,class,"%s: ",st->tunname);
431     vslilog_part(st->log,class,fmt,ap);
432
433     const char *delim;
434     int i;
435     for (i=0, delim=" (tried ";
436          i<st->setup_peers.npeers;
437          i++, delim=", ") {
438         transport_peer *peer=&st->setup_peers.peers[i];
439         const char *s=comm_addr_to_string(&peer->addr);
440         slilog_part(st->log,class,"%s%s",delim,s);
441     }
442
443     slilog_part(st->log,class,")\n");
444     va_end(ap);
445 }
446
447 static void set_link_quality(struct site *st);
448 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel);
449 static void delete_one_key(struct site *st, struct data_key *key,
450                            const char *reason /* may be 0 meaning don't log*/,
451                            const char *which /* ignored if !reasonn */,
452                            uint32_t loglevel /* ignored if !reasonn */);
453 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
454                                  const struct comm_addr *prod_hint);
455 static void enter_state_run(struct site *st);
456 static bool_t enter_state_resolve(struct site *st);
457 static void decrement_resolving_count(struct site *st, int by);
458 static bool_t enter_new_state(struct site *st,uint32_t next);
459 static void enter_state_wait(struct site *st);
460 static void activate_new_key(struct site *st);
461
462 static bool_t is_transform_valid(struct transform_inst_if *transform)
463 {
464     return transform && transform->valid(transform->st);
465 }
466
467 static bool_t current_valid(struct site *st)
468 {
469     return is_transform_valid(st->current.transform);
470 }
471
472 #define DEFINE_CALL_TRANSFORM(fwdrev)                                   \
473 static transform_apply_return                                           \
474 call_transform_##fwdrev(struct site *st,                                \
475                                    struct transform_inst_if *transform, \
476                                    struct buffer_if *buf,               \
477                                    const char **errmsg)                 \
478 {                                                                       \
479     if (!is_transform_valid(transform)) {                               \
480         *errmsg="transform not set up";                                 \
481         return transform_apply_err;                                     \
482     }                                                                   \
483     return transform->fwdrev(transform->st,buf,errmsg);                 \
484 }
485
486 DEFINE_CALL_TRANSFORM(forwards)
487 DEFINE_CALL_TRANSFORM(reverse)
488
489 static void dispose_transform(struct transform_inst_if **transform_var)
490 {
491     struct transform_inst_if *transform=*transform_var;
492     if (transform) {
493         transform->delkey(transform->st);
494         transform->destroy(transform->st);
495     }
496     *transform_var = 0;
497 }    
498
499 #define CHECK_AVAIL(b,l) do { if ((b)->size<(l)) return False; } while(0)
500 #define CHECK_EMPTY(b) do { if ((b)->size!=0) return False; } while(0)
501 #define CHECK_TYPE(b,t) do { uint32_t type; \
502     CHECK_AVAIL((b),4); \
503     type=buf_unprepend_uint32((b)); \
504     if (type!=(t)) return False; } while(0)
505
506 static _Bool type_is_msg34(uint32_t type)
507 {
508     return
509         type == LABEL_MSG3 ||
510         type == LABEL_MSG3BIS ||
511         type == LABEL_MSG4;
512 }
513
514 struct parsedname {
515     int32_t len;
516     uint8_t *name;
517     struct buffer_if extrainfo;
518 };
519
520 struct msg {
521     uint8_t *hashstart;
522     uint32_t dest;
523     uint32_t source;
524     struct parsedname remote;
525     struct parsedname local;
526     uint32_t remote_capabilities;
527     uint16_t remote_mtu;
528     int capab_transformnum;
529     uint8_t *nR;
530     uint8_t *nL;
531     int32_t pklen;
532     char *pk;
533     int32_t hashlen;
534     int32_t siglen;
535     char *sig;
536 };
537
538 static _Bool set_new_transform(struct site *st, char *pk)
539 {
540     _Bool ok;
541
542     /* Make room for the shared key */
543     st->sharedsecretlen=st->chosen_transform->keylen?:st->dh->ceil_len;
544     assert(st->sharedsecretlen);
545     if (st->sharedsecretlen > st->sharedsecretallocd) {
546         st->sharedsecretallocd=st->sharedsecretlen;
547         st->sharedsecret=safe_realloc_ary(st->sharedsecret,1,
548                                           st->sharedsecretallocd,
549                                           "site:sharedsecret");
550     }
551
552     /* Generate the shared key */
553     st->dh->makeshared(st->dh->st,st->dhsecret,st->dh->len,pk,
554                        st->sharedsecret,st->sharedsecretlen);
555
556     /* Set up the transform */
557     struct transform_if *generator=st->chosen_transform;
558     struct transform_inst_if *generated=generator->create(generator->st);
559     ok = generated->setkey(generated->st,st->sharedsecret,
560                            st->sharedsecretlen,st->our_name_later);
561
562     dispose_transform(&st->new_transform);
563     if (!ok) return False;
564     st->new_transform=generated;
565
566     slog(st,LOG_SETUP_INIT,"key exchange negotiated transform"
567          " %d (capabilities ours=%#"PRIx32" theirs=%#"PRIx32")",
568          st->chosen_transform->capab_transformnum,
569          st->local_capabilities, st->remote_capabilities);
570     return True;
571 }
572
573 struct xinfoadd {
574     int32_t lenpos, afternul;
575 };
576 static void append_string_xinfo_start(struct buffer_if *buf,
577                                       struct xinfoadd *xia,
578                                       const char *str)
579     /* Helps construct one of the names with additional info as found
580      * in MSG1..4.  Call this function first, then append all the
581      * desired extra info (not including the nul byte) to the buffer,
582      * then call append_string_xinfo_done. */
583 {
584     xia->lenpos = buf->size;
585     buf_append_string(buf,str);
586     buf_append_uint8(buf,0);
587     xia->afternul = buf->size;
588 }
589 static void append_string_xinfo_done(struct buffer_if *buf,
590                                      struct xinfoadd *xia)
591 {
592     /* we just need to adjust the string length */
593     if (buf->size == xia->afternul) {
594         /* no extra info, strip the nul too */
595         buf_unappend_uint8(buf);
596     } else {
597         put_uint16(buf->start+xia->lenpos, buf->size-(xia->lenpos+2));
598     }
599 }
600
601 /* Build any of msg1 to msg4. msg5 and msg6 are built from the inside
602    out using a transform of config data supplied by netlink */
603 static bool_t generate_msg(struct site *st, uint32_t type, cstring_t what)
604 {
605     void *hst;
606     uint8_t *hash;
607     string_t dhpub, sig;
608
609     st->retries=st->setup_retries;
610     BUF_ALLOC(&st->buffer,what);
611     buffer_init(&st->buffer,0);
612     buf_append_uint32(&st->buffer,
613         (type==LABEL_MSG1?0:st->setup_session_id));
614     buf_append_uint32(&st->buffer,st->index);
615     buf_append_uint32(&st->buffer,type);
616
617     struct xinfoadd xia;
618     append_string_xinfo_start(&st->buffer,&xia,st->localname);
619     if ((st->local_capabilities & CAPAB_EARLY) || (type != LABEL_MSG1)) {
620         buf_append_uint32(&st->buffer,st->local_capabilities);
621     }
622     if (type_is_msg34(type)) {
623         buf_append_uint16(&st->buffer,st->mtu_target);
624     }
625     append_string_xinfo_done(&st->buffer,&xia);
626
627     buf_append_string(&st->buffer,st->remotename);
628     BUF_ADD_OBJ(append,&st->buffer,st->localN);
629     if (type==LABEL_MSG1) return True;
630     BUF_ADD_OBJ(append,&st->buffer,st->remoteN);
631     if (type==LABEL_MSG2) return True;
632
633     if (hacky_par_mid_failnow()) return False;
634
635     if (type==LABEL_MSG3BIS)
636         buf_append_uint8(&st->buffer,st->chosen_transform->capab_transformnum);
637
638     dhpub=st->dh->makepublic(st->dh->st,st->dhsecret,st->dh->len);
639     buf_append_string(&st->buffer,dhpub);
640     free(dhpub);
641     hash=safe_malloc(st->hash->len, "generate_msg");
642     hst=st->hash->init();
643     st->hash->update(hst,st->buffer.start,st->buffer.size);
644     st->hash->final(hst,hash);
645     sig=st->privkey->sign(st->privkey->st,hash,st->hash->len);
646     buf_append_string(&st->buffer,sig);
647     free(sig);
648     free(hash);
649     return True;
650 }
651
652 static bool_t unpick_name(struct buffer_if *msg, struct parsedname *nm)
653 {
654     CHECK_AVAIL(msg,2);
655     nm->len=buf_unprepend_uint16(msg);
656     CHECK_AVAIL(msg,nm->len);
657     nm->name=buf_unprepend(msg,nm->len);
658     uint8_t *nul=memchr(nm->name,0,nm->len);
659     if (!nul) {
660         buffer_readonly_view(&nm->extrainfo,0,0);
661     } else {
662         buffer_readonly_view(&nm->extrainfo, nul+1, msg->start-(nul+1));
663         nm->len=nul-nm->name;
664     }
665     return True;
666 }
667
668 static bool_t unpick_msg(struct site *st, uint32_t type,
669                          struct buffer_if *msg, struct msg *m)
670 {
671     m->capab_transformnum=-1;
672     m->hashstart=msg->start;
673     CHECK_AVAIL(msg,4);
674     m->dest=buf_unprepend_uint32(msg);
675     CHECK_AVAIL(msg,4);
676     m->source=buf_unprepend_uint32(msg);
677     CHECK_TYPE(msg,type);
678     if (!unpick_name(msg,&m->remote)) return False;
679     m->remote_capabilities=0;
680     m->remote_mtu=0;
681     if (m->remote.extrainfo.size) {
682         CHECK_AVAIL(&m->remote.extrainfo,4);
683         m->remote_capabilities=buf_unprepend_uint32(&m->remote.extrainfo);
684     }
685     if (type_is_msg34(type) && m->remote.extrainfo.size) {
686         CHECK_AVAIL(&m->remote.extrainfo,2);
687         m->remote_mtu=buf_unprepend_uint16(&m->remote.extrainfo);
688     }
689     if (!unpick_name(msg,&m->local)) return False;
690     if (type==LABEL_PROD) {
691         CHECK_EMPTY(msg);
692         return True;
693     }
694     CHECK_AVAIL(msg,NONCELEN);
695     m->nR=buf_unprepend(msg,NONCELEN);
696     if (type==LABEL_MSG1) {
697         CHECK_EMPTY(msg);
698         return True;
699     }
700     CHECK_AVAIL(msg,NONCELEN);
701     m->nL=buf_unprepend(msg,NONCELEN);
702     if (type==LABEL_MSG2) {
703         CHECK_EMPTY(msg);
704         return True;
705     }
706     if (type==LABEL_MSG3BIS) {
707         CHECK_AVAIL(msg,1);
708         m->capab_transformnum = buf_unprepend_uint8(msg);
709     } else {
710         m->capab_transformnum = CAPAB_TRANSFORMNUM_ANCIENT;
711     }
712     CHECK_AVAIL(msg,2);
713     m->pklen=buf_unprepend_uint16(msg);
714     CHECK_AVAIL(msg,m->pklen);
715     m->pk=buf_unprepend(msg,m->pklen);
716     m->hashlen=msg->start-m->hashstart;
717     CHECK_AVAIL(msg,2);
718     m->siglen=buf_unprepend_uint16(msg);
719     CHECK_AVAIL(msg,m->siglen);
720     m->sig=buf_unprepend(msg,m->siglen);
721     CHECK_EMPTY(msg);
722
723     /* In `process_msg3_msg4' below, we assume that we can write a nul
724      * terminator following the signature.  Make sure there's enough space.
725      */
726     if (msg->start >= msg->base + msg->alloclen)
727         return False;
728
729     return True;
730 }
731
732 static bool_t name_matches(const struct parsedname *nm, const char *expected)
733 {
734     int expected_len=strlen(expected);
735     return
736         nm->len == expected_len &&
737         !memcmp(nm->name, expected, expected_len);
738 }    
739
740 static bool_t check_msg(struct site *st, uint32_t type, struct msg *m,
741                         cstring_t *error)
742 {
743     if (type==LABEL_MSG1) return True;
744
745     /* Check that the site names and our nonce have been sent
746        back correctly, and then store our peer's nonce. */ 
747     if (!name_matches(&m->remote,st->remotename)) {
748         *error="wrong remote site name";
749         return False;
750     }
751     if (!name_matches(&m->local,st->localname)) {
752         *error="wrong local site name";
753         return False;
754     }
755     if (memcmp(m->nL,st->localN,NONCELEN)!=0) {
756         *error="wrong locally-generated nonce";
757         return False;
758     }
759     if (type==LABEL_MSG2) return True;
760     if (!consttime_memeq(m->nR,st->remoteN,NONCELEN)!=0) {
761         *error="wrong remotely-generated nonce";
762         return False;
763     }
764     /* MSG3 has complicated rules about capabilities, which are
765      * handled in process_msg3. */
766     if (type==LABEL_MSG3 || type==LABEL_MSG3BIS) return True;
767     if (m->remote_capabilities!=st->remote_capabilities) {
768         *error="remote capabilities changed";
769         return False;
770     }
771     if (type==LABEL_MSG4) return True;
772     *error="unknown message type";
773     return False;
774 }
775
776 static bool_t generate_msg1(struct site *st)
777 {
778     st->random->generate(st->random->st,NONCELEN,st->localN);
779     return generate_msg(st,LABEL_MSG1,"site:MSG1");
780 }
781
782 static bool_t process_msg1(struct site *st, struct buffer_if *msg1,
783                            const struct comm_addr *src, struct msg *m)
784 {
785     /* We've already determined we're in an appropriate state to
786        process an incoming MSG1, and that the MSG1 has correct values
787        of A and B. */
788
789     st->setup_session_id=m->source;
790     st->remote_capabilities=m->remote_capabilities;
791     memcpy(st->remoteN,m->nR,NONCELEN);
792     return True;
793 }
794
795 static bool_t generate_msg2(struct site *st)
796 {
797     st->random->generate(st->random->st,NONCELEN,st->localN);
798     return generate_msg(st,LABEL_MSG2,"site:MSG2");
799 }
800
801 static bool_t process_msg2(struct site *st, struct buffer_if *msg2,
802                            const struct comm_addr *src)
803 {
804     struct msg m;
805     cstring_t err;
806
807     if (!unpick_msg(st,LABEL_MSG2,msg2,&m)) return False;
808     if (!check_msg(st,LABEL_MSG2,&m,&err)) {
809         slog(st,LOG_SEC,"msg2: %s",err);
810         return False;
811     }
812     st->setup_session_id=m.source;
813     st->remote_capabilities=m.remote_capabilities;
814
815     /* Select the transform to use */
816
817     uint32_t remote_transforms = st->remote_capabilities & CAPAB_TRANSFORM_MASK;
818     if (!remote_transforms)
819         /* old secnets only had this one transform */
820         remote_transforms = 1UL << CAPAB_TRANSFORMNUM_ANCIENT;
821
822     struct transform_if *ti;
823     int i;
824     for (i=0; i<st->ntransforms; i++) {
825         ti=st->transforms[i];
826         if ((1UL << ti->capab_transformnum) & remote_transforms)
827             goto transform_found;
828     }
829     slog(st,LOG_ERROR,"no transforms in common"
830          " (us %#"PRIx32"; them: %#"PRIx32")",
831          st->local_capabilities & CAPAB_TRANSFORM_MASK,
832          remote_transforms);
833     return False;
834  transform_found:
835     st->chosen_transform=ti;
836
837     memcpy(st->remoteN,m.nR,NONCELEN);
838     return True;
839 }
840
841 static bool_t generate_msg3(struct site *st)
842 {
843     /* Now we have our nonce and their nonce. Think of a secret key,
844        and create message number 3. */
845     st->random->generate(st->random->st,st->dh->len,st->dhsecret);
846     return generate_msg(st,
847                         (st->remote_capabilities & CAPAB_TRANSFORM_MASK
848                          ? LABEL_MSG3BIS : LABEL_MSG3),
849                         "site:MSG3");
850 }
851
852 static bool_t process_msg3_msg4(struct site *st, struct msg *m)
853 {
854     uint8_t *hash;
855     void *hst;
856
857     /* Check signature and store g^x mod m */
858     hash=safe_malloc(st->hash->len, "process_msg3_msg4");
859     hst=st->hash->init();
860     st->hash->update(hst,m->hashstart,m->hashlen);
861     st->hash->final(hst,hash);
862     /* Terminate signature with a '0' - already checked that this will fit */
863     m->sig[m->siglen]=0;
864     if (!st->pubkey->check(st->pubkey->st,hash,st->hash->len,m->sig)) {
865         slog(st,LOG_SEC,"msg3/msg4 signature failed check!");
866         free(hash);
867         return False;
868     }
869     free(hash);
870
871     st->remote_adv_mtu=m->remote_mtu;
872
873     return True;
874 }
875
876 static bool_t process_msg3(struct site *st, struct buffer_if *msg3,
877                            const struct comm_addr *src, uint32_t msgtype)
878 {
879     struct msg m;
880     cstring_t err;
881
882     assert(msgtype==LABEL_MSG3 || msgtype==LABEL_MSG3BIS);
883
884     if (!unpick_msg(st,msgtype,msg3,&m)) return False;
885     if (!check_msg(st,msgtype,&m,&err)) {
886         slog(st,LOG_SEC,"msg3: %s",err);
887         return False;
888     }
889     uint32_t capab_adv_late = m.remote_capabilities
890         & ~st->remote_capabilities & CAPAB_EARLY;
891     if (capab_adv_late) {
892         slog(st,LOG_SEC,"msg3 impermissibly adds early capability flag(s)"
893              " %#"PRIx32" (was %#"PRIx32", now %#"PRIx32")",
894              capab_adv_late, st->remote_capabilities, m.remote_capabilities);
895         return False;
896     }
897     st->remote_capabilities|=m.remote_capabilities;
898
899     struct transform_if *ti;
900     int i;
901     for (i=0; i<st->ntransforms; i++) {
902         ti=st->transforms[i];
903         if (ti->capab_transformnum == m.capab_transformnum)
904             goto transform_found;
905     }
906     slog(st,LOG_SEC,"peer chose unknown-to-us transform %d!",
907          m.capab_transformnum);
908     return False;
909  transform_found:
910     st->chosen_transform=ti;
911
912     if (!process_msg3_msg4(st,&m))
913         return False;
914
915     /* Terminate their DH public key with a '0' */
916     m.pk[m.pklen]=0;
917     /* Invent our DH secret key */
918     st->random->generate(st->random->st,st->dh->len,st->dhsecret);
919
920     /* Generate the shared key and set up the transform */
921     if (!set_new_transform(st,m.pk)) return False;
922
923     return True;
924 }
925
926 static bool_t generate_msg4(struct site *st)
927 {
928     /* We have both nonces, their public key and our private key. Generate
929        our public key, sign it and send it to them. */
930     return generate_msg(st,LABEL_MSG4,"site:MSG4");
931 }
932
933 static bool_t process_msg4(struct site *st, struct buffer_if *msg4,
934                            const struct comm_addr *src)
935 {
936     struct msg m;
937     cstring_t err;
938
939     if (!unpick_msg(st,LABEL_MSG4,msg4,&m)) return False;
940     if (!check_msg(st,LABEL_MSG4,&m,&err)) {
941         slog(st,LOG_SEC,"msg4: %s",err);
942         return False;
943     }
944     
945     if (!process_msg3_msg4(st,&m))
946         return False;
947
948     /* Terminate their DH public key with a '0' */
949     m.pk[m.pklen]=0;
950
951     /* Generate the shared key and set up the transform */
952     if (!set_new_transform(st,m.pk)) return False;
953
954     return True;
955 }
956
957 struct msg0 {
958     uint32_t dest;
959     uint32_t source;
960     uint32_t type;
961 };
962
963 static bool_t unpick_msg0(struct site *st, struct buffer_if *msg0,
964                           struct msg0 *m)
965 {
966     CHECK_AVAIL(msg0,4);
967     m->dest=buf_unprepend_uint32(msg0);
968     CHECK_AVAIL(msg0,4);
969     m->source=buf_unprepend_uint32(msg0);
970     CHECK_AVAIL(msg0,4);
971     m->type=buf_unprepend_uint32(msg0);
972     return True;
973     /* Leaves transformed part of buffer untouched */
974 }
975
976 static bool_t generate_msg5(struct site *st)
977 {
978     cstring_t transform_err;
979
980     BUF_ALLOC(&st->buffer,"site:MSG5");
981     /* We are going to add four words to the message */
982     buffer_init(&st->buffer,calculate_max_start_pad());
983     /* Give the netlink code an opportunity to put its own stuff in the
984        message (configuration information, etc.) */
985     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
986     if (call_transform_forwards(st,st->new_transform,
987                                 &st->buffer,&transform_err))
988         return False;
989     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
990     buf_prepend_uint32(&st->buffer,st->index);
991     buf_prepend_uint32(&st->buffer,st->setup_session_id);
992
993     st->retries=st->setup_retries;
994     return True;
995 }
996
997 static bool_t process_msg5(struct site *st, struct buffer_if *msg5,
998                            const struct comm_addr *src,
999                            struct transform_inst_if *transform)
1000 {
1001     struct msg0 m;
1002     cstring_t transform_err;
1003
1004     if (!unpick_msg0(st,msg5,&m)) return False;
1005
1006     if (call_transform_reverse(st,transform,msg5,&transform_err)) {
1007         /* There's a problem */
1008         slog(st,LOG_SEC,"process_msg5: transform: %s",transform_err);
1009         return False;
1010     }
1011     /* Buffer should now contain untransformed PING packet data */
1012     CHECK_AVAIL(msg5,4);
1013     if (buf_unprepend_uint32(msg5)!=LABEL_MSG5) {
1014         slog(st,LOG_SEC,"MSG5/PING packet contained wrong label");
1015         return False;
1016     }
1017     /* Older versions of secnet used to write some config data here
1018      * which we ignore.  So we don't CHECK_EMPTY */
1019     return True;
1020 }
1021
1022 static void create_msg6(struct site *st, struct transform_inst_if *transform,
1023                         uint32_t session_id)
1024 {
1025     cstring_t transform_err;
1026
1027     BUF_ALLOC(&st->buffer,"site:MSG6");
1028     /* We are going to add four words to the message */
1029     buffer_init(&st->buffer,calculate_max_start_pad());
1030     /* Give the netlink code an opportunity to put its own stuff in the
1031        message (configuration information, etc.) */
1032     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1033     transform_apply_return problem =
1034         call_transform_forwards(st,transform,
1035                                 &st->buffer,&transform_err);
1036     assert(!problem);
1037     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1038     buf_prepend_uint32(&st->buffer,st->index);
1039     buf_prepend_uint32(&st->buffer,session_id);
1040 }
1041
1042 static bool_t generate_msg6(struct site *st)
1043 {
1044     if (!is_transform_valid(st->new_transform))
1045         return False;
1046     create_msg6(st,st->new_transform,st->setup_session_id);
1047     st->retries=1; /* Peer will retransmit MSG5 if this packet gets lost */
1048     return True;
1049 }
1050
1051 static bool_t process_msg6(struct site *st, struct buffer_if *msg6,
1052                            const struct comm_addr *src)
1053 {
1054     struct msg0 m;
1055     cstring_t transform_err;
1056
1057     if (!unpick_msg0(st,msg6,&m)) return False;
1058
1059     if (call_transform_reverse(st,st->new_transform,msg6,&transform_err)) {
1060         /* There's a problem */
1061         slog(st,LOG_SEC,"process_msg6: transform: %s",transform_err);
1062         return False;
1063     }
1064     /* Buffer should now contain untransformed PING packet data */
1065     CHECK_AVAIL(msg6,4);
1066     if (buf_unprepend_uint32(msg6)!=LABEL_MSG6) {
1067         slog(st,LOG_SEC,"MSG6/PONG packet contained invalid data");
1068         return False;
1069     }
1070     /* Older versions of secnet used to write some config data here
1071      * which we ignore.  So we don't CHECK_EMPTY */
1072     return True;
1073 }
1074
1075 static transform_apply_return
1076 decrypt_msg0(struct site *st, struct buffer_if *msg0,
1077                            const struct comm_addr *src)
1078 {
1079     cstring_t transform_err, auxkey_err, newkey_err="n/a";
1080     struct msg0 m;
1081     transform_apply_return problem;
1082
1083     if (!unpick_msg0(st,msg0,&m)) return False;
1084
1085     /* Keep a copy so we can try decrypting it with multiple keys */
1086     buffer_copy(&st->scratch, msg0);
1087
1088     problem = call_transform_reverse(st,st->current.transform,
1089                                      msg0,&transform_err);
1090     if (!problem) {
1091         if (!st->auxiliary_is_new)
1092             delete_one_key(st,&st->auxiliary_key,
1093                            "peer has used new key","auxiliary key",LOG_SEC);
1094         return 0;
1095     }
1096     if (transform_apply_return_badseq(problem))
1097         goto badseq;
1098
1099     buffer_copy(msg0, &st->scratch);
1100     problem = call_transform_reverse(st,st->auxiliary_key.transform,
1101                                      msg0,&auxkey_err);
1102     if (!problem) {
1103         slog(st,LOG_DROP,"processing packet which uses auxiliary key");
1104         if (st->auxiliary_is_new) {
1105             /* We previously timed out in state SENTMSG5 but it turns
1106              * out that our peer did in fact get our MSG5 and is
1107              * using the new key.  So we should switch to it too. */
1108             /* This is a bit like activate_new_key. */
1109             struct data_key t;
1110             t=st->current;
1111             st->current=st->auxiliary_key;
1112             st->auxiliary_key=t;
1113
1114             delete_one_key(st,&st->auxiliary_key,"peer has used new key",
1115                            "previous key",LOG_SEC);
1116             st->auxiliary_is_new=0;
1117             st->renegotiate_key_time=st->auxiliary_renegotiate_key_time;
1118         }
1119         return 0;
1120     }
1121     if (transform_apply_return_badseq(problem))
1122         goto badseq;
1123
1124     if (st->state==SITE_SENTMSG5) {
1125         buffer_copy(msg0, &st->scratch);
1126         problem = call_transform_reverse(st,st->new_transform,
1127                                          msg0,&newkey_err);
1128         if (!problem) {
1129             /* It looks like we didn't get the peer's MSG6 */
1130             /* This is like a cut-down enter_new_state(SITE_RUN) */
1131             slog(st,LOG_STATE,"will enter state RUN (MSG0 with new key)");
1132             BUF_FREE(&st->buffer);
1133             st->timeout=0;
1134             activate_new_key(st);
1135             return 0; /* do process the data in this packet */
1136         }
1137         if (transform_apply_return_badseq(problem))
1138             goto badseq;
1139     }
1140
1141     slog(st,LOG_SEC,"transform: %s (aux: %s, new: %s)",
1142          transform_err,auxkey_err,newkey_err);
1143     initiate_key_setup(st,"incoming message would not decrypt",0);
1144     send_nak(src,m.dest,m.source,m.type,msg0,"message would not decrypt");
1145     assert(problem);
1146     return problem;
1147
1148  badseq:
1149     slog(st,LOG_DROP,"transform: %s (bad seq.)",transform_err);
1150     assert(problem);
1151     return problem;
1152 }
1153
1154 static bool_t process_msg0(struct site *st, struct buffer_if *msg0,
1155                            const struct comm_addr *src)
1156 {
1157     uint32_t type;
1158     transform_apply_return problem;
1159
1160     problem = decrypt_msg0(st,msg0,src);
1161     if (problem==transform_apply_seqdupe) {
1162         /* We recently received another copy of this packet, maybe due
1163          * to polypath.  That's not a problem; indeed, for the
1164          * purposes of transport address management it is a success.
1165          * But we don't want to process the packet. */
1166         transport_data_msgok(st,src);
1167         return False;
1168     }
1169     if (problem)
1170         return False;
1171
1172     CHECK_AVAIL(msg0,4);
1173     type=buf_unprepend_uint32(msg0);
1174     switch(type) {
1175     case LABEL_MSG7:
1176         /* We must forget about the current session. */
1177         delete_keys(st,"request from peer",LOG_SEC);
1178         /* probably, the peer is shutting down, and this is going to fail,
1179          * but we need to be trying to bring the link up again */
1180         if (st->keepalive)
1181             initiate_key_setup(st,"peer requested key teardown",0);
1182         return True;
1183     case LABEL_MSG9:
1184         /* Deliver to netlink layer */
1185         st->netlink->deliver(st->netlink->st,msg0);
1186         transport_data_msgok(st,src);
1187         /* See whether we should start negotiating a new key */
1188         if (st->now > st->renegotiate_key_time)
1189             initiate_key_setup(st,"incoming packet in renegotiation window",0);
1190         return True;
1191     default:
1192         slog(st,LOG_SEC,"incoming encrypted message of type %08x "
1193              "(unknown)",type);
1194         break;
1195     }
1196     return False;
1197 }
1198
1199 static void dump_packet(struct site *st, struct buffer_if *buf,
1200                         const struct comm_addr *addr, bool_t incoming,
1201                         bool_t ok)
1202 {
1203     uint32_t dest=get_uint32(buf->start);
1204     uint32_t source=get_uint32(buf->start+4);
1205     uint32_t msgtype=get_uint32(buf->start+8);
1206
1207     if (st->log_events & LOG_DUMP)
1208         slilog(st->log,M_DEBUG,"%s: %s: %08x<-%08x: %08x: %s%s",
1209                st->tunname,incoming?"incoming":"outgoing",
1210                dest,source,msgtype,comm_addr_to_string(addr),
1211                ok?"":" - fail");
1212 }
1213
1214 static bool_t comm_addr_sendmsg(struct site *st,
1215                                 const struct comm_addr *dest,
1216                                 struct buffer_if *buf)
1217 {
1218     int i;
1219     struct comm_clientinfo *commclientinfo = 0;
1220
1221     for (i=0; i < st->ncomms; i++) {
1222         if (st->comms[i] == dest->comm) {
1223             commclientinfo = st->commclientinfos[i];
1224             break;
1225         }
1226     }
1227     return dest->comm->sendmsg(dest->comm->st, buf, dest, commclientinfo);
1228 }
1229
1230 static uint32_t site_status(void *st)
1231 {
1232     return 0;
1233 }
1234
1235 static bool_t send_msg(struct site *st)
1236 {
1237     if (st->retries>0) {
1238         transport_xmit(st, &st->setup_peers, &st->buffer, True);
1239         st->timeout=st->now+st->setup_retry_interval;
1240         st->retries--;
1241         return True;
1242     } else if (st->state==SITE_SENTMSG5) {
1243         logtimeout(st,"timed out sending MSG5, stashing new key");
1244         /* We stash the key we have produced, in case it turns out that
1245          * our peer did see our MSG5 after all and starts using it. */
1246         /* This is a bit like some of activate_new_key */
1247         struct transform_inst_if *t;
1248         t=st->auxiliary_key.transform;
1249         st->auxiliary_key.transform=st->new_transform;
1250         st->new_transform=t;
1251         dispose_transform(&st->new_transform);
1252
1253         st->auxiliary_is_new=1;
1254         st->auxiliary_key.key_timeout=st->now+st->key_lifetime;
1255         st->auxiliary_renegotiate_key_time=st->now+st->key_renegotiate_time;
1256         st->auxiliary_key.remote_session_id=st->setup_session_id;
1257
1258         enter_state_wait(st);
1259         return False;
1260     } else {
1261         logtimeout(st,"timed out sending key setup packet "
1262             "(in state %s)",state_name(st->state));
1263         enter_state_wait(st);
1264         return False;
1265     }
1266 }
1267
1268 static void site_resolve_callback(void *sst, const struct comm_addr *addrs,
1269                                   int stored_naddrs, int all_naddrs,
1270                                   const char *address, const char *failwhy)
1271 {
1272     struct site *st=sst;
1273
1274     if (!stored_naddrs) {
1275         slog(st,LOG_ERROR,"resolution of %s failed: %s",address,failwhy);
1276     } else {
1277         slog(st,LOG_PEER_ADDRS,"resolution of %s completed, %d addrs, eg: %s",
1278              address, all_naddrs, comm_addr_to_string(&addrs[0]));;
1279
1280         int space=st->transport_peers_max-st->resolving_n_results_stored;
1281         int n_tocopy=MIN(stored_naddrs,space);
1282         COPY_ARRAY(st->resolving_results + st->resolving_n_results_stored,
1283                    addrs,
1284                    n_tocopy);
1285         st->resolving_n_results_stored += n_tocopy;
1286         st->resolving_n_results_all += all_naddrs;
1287     }
1288
1289     decrement_resolving_count(st,1);
1290 }
1291
1292 static void decrement_resolving_count(struct site *st, int by)
1293 {
1294     assert(st->resolving_count>0);
1295     st->resolving_count-=by;
1296
1297     if (st->resolving_count)
1298         return;
1299
1300     /* OK, we are done with them all.  Handle combined results. */
1301
1302     const struct comm_addr *addrs=st->resolving_results;
1303     int naddrs=st->resolving_n_results_stored;
1304     assert(naddrs<=st->transport_peers_max);
1305
1306     if (naddrs) {
1307         if (naddrs != st->resolving_n_results_all) {
1308             slog(st,LOG_SETUP_INIT,"resolution of supplied addresses/names"
1309                  " yielded too many results (%d > %d), some ignored",
1310                  st->resolving_n_results_all, naddrs);
1311         }
1312         slog(st,LOG_STATE,"resolution completed, %d addrs, eg: %s",
1313              naddrs, iaddr_to_string(&addrs[0].ia));;
1314     }
1315
1316     switch (st->state) {
1317     case SITE_RESOLVE:
1318         if (transport_compute_setupinit_peers(st,addrs,naddrs,0)) {
1319             enter_new_state(st,SITE_SENTMSG1);
1320         } else {
1321             /* Can't figure out who to try to to talk to */
1322             slog(st,LOG_SETUP_INIT,
1323                  "key exchange failed: cannot find peer address");
1324             enter_state_run(st);
1325         }
1326         break;
1327     case SITE_SENTMSG1: case SITE_SENTMSG2:
1328     case SITE_SENTMSG3: case SITE_SENTMSG4:
1329     case SITE_SENTMSG5:
1330         if (naddrs) {
1331             /* We start using the address immediately for data too.
1332              * It's best to store it in st->peers now because we might
1333              * go via SENTMSG5, WAIT, and a MSG0, straight into using
1334              * the new key (without updating the data peer addrs). */
1335             transport_resolve_complete(st,addrs,naddrs);
1336         } else if (st->local_mobile) {
1337             /* We can't let this rest because we may have a peer
1338              * address which will break in the future. */
1339             slog(st,LOG_SETUP_INIT,"resolution failed: "
1340                  "abandoning key exchange");
1341             enter_state_wait(st);
1342         } else {
1343             slog(st,LOG_SETUP_INIT,"resolution failed: "
1344                  " continuing to use source address of peer's packets"
1345                  " for key exchange and ultimately data");
1346         }
1347         break;
1348     case SITE_RUN:
1349         if (naddrs) {
1350             slog(st,LOG_SETUP_INIT,"resolution completed tardily,"
1351                  " updating peer address(es)");
1352             transport_resolve_complete_tardy(st,addrs,naddrs);
1353         } else if (st->local_mobile) {
1354             /* Not very good.  We should queue (another) renegotiation
1355              * so that we can update the peer address. */
1356             st->key_renegotiate_time=st->now+st->wait_timeout;
1357         } else {
1358             slog(st,LOG_SETUP_INIT,"resolution failed: "
1359                  " continuing to use source address of peer's packets");
1360         }
1361         break;
1362     case SITE_WAIT:
1363     case SITE_STOP:
1364         /* oh well */
1365         break;
1366     }
1367 }
1368
1369 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
1370                                  const struct comm_addr *prod_hint)
1371 {
1372     /* Reentrancy hazard: can call enter_new_state/enter_state_* */
1373     if (st->state!=SITE_RUN) return False;
1374     slog(st,LOG_SETUP_INIT,"initiating key exchange (%s)",reason);
1375     if (st->addresses) {
1376         slog(st,LOG_SETUP_INIT,"resolving peer address(es)");
1377         return enter_state_resolve(st);
1378     } else if (transport_compute_setupinit_peers(st,0,0,prod_hint)) {
1379         return enter_new_state(st,SITE_SENTMSG1);
1380     }
1381     slog(st,LOG_SETUP_INIT,"key exchange failed: no address for peer");
1382     return False;
1383 }
1384
1385 static void activate_new_key(struct site *st)
1386 {
1387     struct transform_inst_if *t;
1388
1389     /* We have three transform instances, which we swap between old,
1390        active and setup */
1391     t=st->auxiliary_key.transform;
1392     st->auxiliary_key.transform=st->current.transform;
1393     st->current.transform=st->new_transform;
1394     st->new_transform=t;
1395     dispose_transform(&st->new_transform);
1396
1397     st->timeout=0;
1398     st->auxiliary_is_new=0;
1399     st->auxiliary_key.key_timeout=st->current.key_timeout;
1400     st->current.key_timeout=st->now+st->key_lifetime;
1401     st->renegotiate_key_time=st->now+st->key_renegotiate_time;
1402     transport_peers_copy(st,&st->peers,&st->setup_peers);
1403     st->current.remote_session_id=st->setup_session_id;
1404
1405     /* Compute the inter-site MTU.  This is min( our_mtu, their_mtu ).
1406      * But their mtu be unspecified, in which case we just use ours. */
1407     uint32_t intersite_mtu=
1408         MIN(st->mtu_target, st->remote_adv_mtu ?: ~(uint32_t)0);
1409     st->netlink->set_mtu(st->netlink->st,intersite_mtu);
1410
1411     slog(st,LOG_ACTIVATE_KEY,"new key activated"
1412          " (mtu ours=%"PRId32" theirs=%"PRId32" intersite=%"PRId32")",
1413          st->mtu_target, st->remote_adv_mtu, intersite_mtu);
1414     enter_state_run(st);
1415 }
1416
1417 static void delete_one_key(struct site *st, struct data_key *key,
1418                            cstring_t reason, cstring_t which, uint32_t loglevel)
1419 {
1420     if (!is_transform_valid(key->transform)) return;
1421     if (reason) slog(st,loglevel,"%s deleted (%s)",which,reason);
1422     dispose_transform(&key->transform);
1423     key->key_timeout=0;
1424 }
1425
1426 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel)
1427 {
1428     if (current_valid(st)) {
1429         slog(st,loglevel,"session closed (%s)",reason);
1430
1431         delete_one_key(st,&st->current,0,0,0);
1432         set_link_quality(st);
1433     }
1434     delete_one_key(st,&st->auxiliary_key,0,0,0);
1435 }
1436
1437 static void state_assert(struct site *st, bool_t ok)
1438 {
1439     if (!ok) fatal("site:state_assert");
1440 }
1441
1442 static void enter_state_stop(struct site *st)
1443 {
1444     st->state=SITE_STOP;
1445     st->timeout=0;
1446     delete_keys(st,"entering state STOP",LOG_TIMEOUT_KEY);
1447     dispose_transform(&st->new_transform);
1448 }
1449
1450 static void set_link_quality(struct site *st)
1451 {
1452     uint32_t quality;
1453     if (current_valid(st))
1454         quality=LINK_QUALITY_UP;
1455     else if (st->state==SITE_WAIT || st->state==SITE_STOP)
1456         quality=LINK_QUALITY_DOWN;
1457     else if (st->addresses)
1458         quality=LINK_QUALITY_DOWN_CURRENT_ADDRESS;
1459     else if (transport_peers_valid(&st->peers))
1460         quality=LINK_QUALITY_DOWN_STALE_ADDRESS;
1461     else
1462         quality=LINK_QUALITY_DOWN;
1463
1464     st->netlink->set_quality(st->netlink->st,quality);
1465 }
1466
1467 static void enter_state_run(struct site *st)
1468 {
1469     slog(st,LOG_STATE,"entering state RUN");
1470     st->state=SITE_RUN;
1471     st->timeout=0;
1472
1473     st->setup_session_id=0;
1474     transport_peers_clear(st,&st->setup_peers);
1475     FILLZERO(st->localN);
1476     FILLZERO(st->remoteN);
1477     dispose_transform(&st->new_transform);
1478     memset(st->dhsecret,0,st->dh->len);
1479     if (st->sharedsecret) memset(st->sharedsecret,0,st->sharedsecretlen);
1480     set_link_quality(st);
1481
1482     if (st->keepalive && !current_valid(st))
1483         initiate_key_setup(st, "keepalive", 0);
1484 }
1485
1486 static bool_t ensure_resolving(struct site *st)
1487 {
1488     /* Reentrancy hazard: may call site_resolve_callback and hence
1489      * enter_new_state, enter_state_* and generate_msg*. */
1490     if (st->resolving_count)
1491         return True;
1492
1493     assert(st->addresses);
1494
1495     /* resolver->request might reentrantly call site_resolve_callback
1496      * which will decrement st->resolving, so we need to increment it
1497      * twice beforehand to prevent decrement from thinking we're
1498      * finished, and decrement it ourselves.  Alternatively if
1499      * everything fails then there are no callbacks due and we simply
1500      * set it to 0 and return false.. */
1501     st->resolving_n_results_stored=0;
1502     st->resolving_n_results_all=0;
1503     st->resolving_count+=2;
1504     const char **addrp=st->addresses;
1505     const char *address;
1506     bool_t anyok=False;
1507     for (; (address=*addrp++); ) {
1508         bool_t ok = st->resolver->request(st->resolver->st,address,
1509                                           st->remoteport,st->comms[0],
1510                                           site_resolve_callback,st);
1511         if (ok)
1512             st->resolving_count++;
1513         anyok|=ok;
1514     }
1515     if (!anyok) {
1516         st->resolving_count=0;
1517         return False;
1518     }
1519     decrement_resolving_count(st,2);
1520     return True;
1521 }
1522
1523 static bool_t enter_state_resolve(struct site *st)
1524 {
1525     /* Reentrancy hazard!  See ensure_resolving. */
1526     state_assert(st,st->state==SITE_RUN);
1527     slog(st,LOG_STATE,"entering state RESOLVE");
1528     st->state=SITE_RESOLVE;
1529     return ensure_resolving(st);
1530 }
1531
1532 static bool_t enter_new_state(struct site *st, uint32_t next)
1533 {
1534     bool_t (*gen)(struct site *st);
1535     int r;
1536
1537     slog(st,LOG_STATE,"entering state %s",state_name(next));
1538     switch(next) {
1539     case SITE_SENTMSG1:
1540         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE);
1541         gen=generate_msg1;
1542         st->msg1_crossed_logged = False;
1543         break;
1544     case SITE_SENTMSG2:
1545         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1546                      st->state==SITE_SENTMSG1 || st->state==SITE_WAIT);
1547         gen=generate_msg2;
1548         break;
1549     case SITE_SENTMSG3:
1550         state_assert(st,st->state==SITE_SENTMSG1);
1551         BUF_FREE(&st->buffer);
1552         gen=generate_msg3;
1553         break;
1554     case SITE_SENTMSG4:
1555         state_assert(st,st->state==SITE_SENTMSG2);
1556         BUF_FREE(&st->buffer);
1557         gen=generate_msg4;
1558         break;
1559     case SITE_SENTMSG5:
1560         state_assert(st,st->state==SITE_SENTMSG3);
1561         BUF_FREE(&st->buffer);
1562         gen=generate_msg5;
1563         break;
1564     case SITE_RUN:
1565         state_assert(st,st->state==SITE_SENTMSG4);
1566         BUF_FREE(&st->buffer);
1567         gen=generate_msg6;
1568         break;
1569     default:
1570         gen=NULL;
1571         fatal("enter_new_state(%s): invalid new state",state_name(next));
1572         break;
1573     }
1574
1575     if (hacky_par_start_failnow()) return False;
1576
1577     r= gen(st) && send_msg(st);
1578
1579     hacky_par_end(&r,
1580                   st->setup_retries, st->setup_retry_interval,
1581                   send_msg, st);
1582     
1583     if (r) {
1584         st->state=next;
1585         if (next==SITE_RUN) {
1586             BUF_FREE(&st->buffer); /* Never reused */
1587             st->timeout=0; /* Never retransmit */
1588             activate_new_key(st);
1589         }
1590         return True;
1591     }
1592     slog(st,LOG_ERROR,"error entering state %s",state_name(next));
1593     st->buffer.free=False; /* Unconditionally use the buffer; it may be
1594                               in either state, and enter_state_wait() will
1595                               do a BUF_FREE() */
1596     enter_state_wait(st);
1597     return False;
1598 }
1599
1600 /* msg7 tells our peer that we're about to forget our key */
1601 static bool_t send_msg7(struct site *st, cstring_t reason)
1602 {
1603     cstring_t transform_err;
1604
1605     if (current_valid(st) && st->buffer.free
1606         && transport_peers_valid(&st->peers)) {
1607         BUF_ALLOC(&st->buffer,"site:MSG7");
1608         buffer_init(&st->buffer,calculate_max_start_pad());
1609         buf_append_uint32(&st->buffer,LABEL_MSG7);
1610         buf_append_string(&st->buffer,reason);
1611         if (call_transform_forwards(st, st->current.transform,
1612                                     &st->buffer, &transform_err))
1613             goto free_out;
1614         buf_prepend_uint32(&st->buffer,LABEL_MSG0);
1615         buf_prepend_uint32(&st->buffer,st->index);
1616         buf_prepend_uint32(&st->buffer,st->current.remote_session_id);
1617         transport_xmit(st,&st->peers,&st->buffer,True);
1618         BUF_FREE(&st->buffer);
1619     free_out:
1620         return True;
1621     }
1622     return False;
1623 }
1624
1625 /* We go into this state if our peer becomes uncommunicative. Similar to
1626    the "stop" state, we forget all session keys for a while, before
1627    re-entering the "run" state. */
1628 static void enter_state_wait(struct site *st)
1629 {
1630     slog(st,LOG_STATE,"entering state WAIT");
1631     st->timeout=st->now+st->wait_timeout;
1632     st->state=SITE_WAIT;
1633     set_link_quality(st);
1634     BUF_FREE(&st->buffer); /* will have had an outgoing packet in it */
1635     /* XXX Erase keys etc. */
1636 }
1637
1638 static void generate_prod(struct site *st, struct buffer_if *buf)
1639 {
1640     buffer_init(buf,0);
1641     buf_append_uint32(buf,0);
1642     buf_append_uint32(buf,0);
1643     buf_append_uint32(buf,LABEL_PROD);
1644     buf_append_string(buf,st->localname);
1645     buf_append_string(buf,st->remotename);
1646 }
1647
1648 static void generate_send_prod(struct site *st,
1649                                const struct comm_addr *source)
1650 {
1651     if (!st->allow_send_prod) return; /* too soon */
1652     if (!(st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1653           st->state==SITE_WAIT)) return; /* we'd ignore peer's MSG1 */
1654
1655     slog(st,LOG_SETUP_INIT,"prodding peer for key exchange");
1656     st->allow_send_prod=0;
1657     generate_prod(st,&st->scratch);
1658     bool_t ok = comm_addr_sendmsg(st, source, &st->scratch);
1659     dump_packet(st,&st->scratch,source,False,ok);
1660 }
1661
1662 static inline void site_settimeout(uint64_t timeout, int *timeout_io)
1663 {
1664     if (timeout) {
1665         int64_t offset=timeout-*now;
1666         if (offset<0) offset=0;
1667         if (offset>INT_MAX) offset=INT_MAX;
1668         if (*timeout_io<0 || offset<*timeout_io)
1669             *timeout_io=offset;
1670     }
1671 }
1672
1673 static int site_beforepoll(void *sst, struct pollfd *fds, int *nfds_io,
1674                            int *timeout_io)
1675 {
1676     struct site *st=sst;
1677
1678     BEFOREPOLL_WANT_FDS(0); /* We don't use any file descriptors */
1679     st->now=*now;
1680
1681     /* Work out when our next timeout is. The earlier of 'timeout' or
1682        'current.key_timeout'. A stored value of '0' indicates no timeout
1683        active. */
1684     site_settimeout(st->timeout, timeout_io);
1685     site_settimeout(st->current.key_timeout, timeout_io);
1686     site_settimeout(st->auxiliary_key.key_timeout, timeout_io);
1687
1688     return 0; /* success */
1689 }
1690
1691 static void check_expiry(struct site *st, struct data_key *key,
1692                          const char *which)
1693 {
1694     if (key->key_timeout && *now>key->key_timeout) {
1695         delete_one_key(st,key,"maximum life exceeded",which,LOG_TIMEOUT_KEY);
1696     }
1697 }
1698
1699 /* NB site_afterpoll will be called before site_beforepoll is ever called */
1700 static void site_afterpoll(void *sst, struct pollfd *fds, int nfds)
1701 {
1702     struct site *st=sst;
1703
1704     st->now=*now;
1705     if (st->timeout && *now>st->timeout) {
1706         st->timeout=0;
1707         if (st->state>=SITE_SENTMSG1 && st->state<=SITE_SENTMSG5) {
1708             if (!hacky_par_start_failnow())
1709                 send_msg(st);
1710         } else if (st->state==SITE_WAIT) {
1711             enter_state_run(st);
1712         } else {
1713             slog(st,LOG_ERROR,"site_afterpoll: unexpected timeout, state=%d",
1714                  st->state);
1715         }
1716     }
1717     check_expiry(st,&st->current,"current key");
1718     check_expiry(st,&st->auxiliary_key,"auxiliary key");
1719 }
1720
1721 /* This function is called by the netlink device to deliver packets
1722    intended for the remote network. The packet is in "raw" wire
1723    format, but is guaranteed to be word-aligned. */
1724 static void site_outgoing(void *sst, struct buffer_if *buf)
1725 {
1726     struct site *st=sst;
1727     cstring_t transform_err;
1728     
1729     if (st->state==SITE_STOP) {
1730         BUF_FREE(buf);
1731         return;
1732     }
1733
1734     st->allow_send_prod=1;
1735
1736     /* In all other states we consider delivering the packet if we have
1737        a valid key and a valid address to send it to. */
1738     if (current_valid(st) && transport_peers_valid(&st->peers)) {
1739         /* Transform it and send it */
1740         if (buf->size>0) {
1741             buf_prepend_uint32(buf,LABEL_MSG9);
1742             if (call_transform_forwards(st, st->current.transform,
1743                                         buf, &transform_err))
1744                 goto free_out;
1745             buf_prepend_uint32(buf,LABEL_MSG0);
1746             buf_prepend_uint32(buf,st->index);
1747             buf_prepend_uint32(buf,st->current.remote_session_id);
1748             transport_xmit(st,&st->peers,buf,False);
1749         }
1750     free_out:
1751         BUF_FREE(buf);
1752         return;
1753     }
1754
1755     slog(st,LOG_DROP,"discarding outgoing packet of size %d",buf->size);
1756     BUF_FREE(buf);
1757     initiate_key_setup(st,"outgoing packet",0);
1758 }
1759
1760 static bool_t named_for_us(struct site *st, const struct buffer_if *buf_in,
1761                            uint32_t type, struct msg *m)
1762     /* For packets which are identified by the local and remote names.
1763      * If it has our name and our peer's name in it it's for us. */
1764 {
1765     struct buffer_if buf[1];
1766     buffer_readonly_clone(buf,buf_in);
1767     return unpick_msg(st,type,buf,m)
1768         && name_matches(&m->remote,st->remotename)
1769         && name_matches(&m->local,st->localname);
1770 }
1771
1772 static bool_t we_have_priority(struct site *st, const struct msg *m) {
1773     if ((st->local_capabilities & m->remote_capabilities)
1774         && CAPAB_PRIORITY_MOBILE) {
1775         if (st->local_mobile) return True;
1776         if (st-> peer_mobile) return False;
1777     }
1778     return st->our_name_later;
1779 }
1780
1781 /* This function is called by the communication device to deliver
1782    packets from our peers.
1783    It should return True if the packet is recognised as being for
1784    this current site instance (and should therefore not be processed
1785    by other sites), even if the packet was otherwise ignored. */
1786 static bool_t site_incoming(void *sst, struct buffer_if *buf,
1787                             const struct comm_addr *source)
1788 {
1789     struct site *st=sst;
1790
1791     if (buf->size < 12) return False;
1792
1793     uint32_t dest=get_uint32(buf->start);
1794     uint32_t msgtype=get_uint32(buf->start+8);
1795     struct msg named_msg;
1796
1797     if (msgtype==LABEL_MSG1) {
1798         if (!named_for_us(st,buf,msgtype,&named_msg))
1799             return False;
1800         /* It's a MSG1 addressed to us. Decide what to do about it. */
1801         dump_packet(st,buf,source,True,True);
1802         if (st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1803             st->state==SITE_WAIT) {
1804             /* We should definitely process it */
1805             transport_compute_setupinit_peers(st,0,0,source);
1806             if (process_msg1(st,buf,source,&named_msg)) {
1807                 slog(st,LOG_SETUP_INIT,"key setup initiated by peer");
1808                 bool_t entered=enter_new_state(st,SITE_SENTMSG2);
1809                 if (entered && st->addresses && st->local_mobile)
1810                     /* We must do this as the very last thing, because
1811                        the resolver callback might reenter us. */
1812                     ensure_resolving(st);
1813             } else {
1814                 slog(st,LOG_ERROR,"failed to process incoming msg1");
1815             }
1816             BUF_FREE(buf);
1817             return True;
1818         } else if (st->state==SITE_SENTMSG1) {
1819             /* We've just sent a message 1! They may have crossed on
1820                the wire. If we have priority then we ignore the
1821                incoming one, otherwise we process it as usual. */
1822             if (we_have_priority(st,&named_msg)) {
1823                 BUF_FREE(buf);
1824                 if (!st->msg1_crossed_logged++)
1825                     slog(st,LOG_SETUP_INIT,"crossed msg1s; we are higher "
1826                          "priority => ignore incoming msg1");
1827                 return True;
1828             } else {
1829                 slog(st,LOG_SETUP_INIT,"crossed msg1s; we are lower "
1830                      "priority => use incoming msg1");
1831                 if (process_msg1(st,buf,source,&named_msg)) {
1832                     BUF_FREE(&st->buffer); /* Free our old message 1 */
1833                     transport_setup_msgok(st,source);
1834                     enter_new_state(st,SITE_SENTMSG2);
1835                 } else {
1836                     slog(st,LOG_ERROR,"failed to process an incoming "
1837                          "crossed msg1 (we have low priority)");
1838                 }
1839                 BUF_FREE(buf);
1840                 return True;
1841             }
1842         }
1843         /* The message 1 was received at an unexpected stage of the
1844            key setup. XXX POLICY - what do we do? */
1845         slog(st,LOG_UNEXPECTED,"unexpected incoming message 1");
1846         BUF_FREE(buf);
1847         return True;
1848     }
1849     if (msgtype==LABEL_PROD) {
1850         if (!named_for_us(st,buf,msgtype,&named_msg))
1851             return False;
1852         dump_packet(st,buf,source,True,True);
1853         if (st->state!=SITE_RUN) {
1854             slog(st,LOG_DROP,"ignoring PROD when not in state RUN");
1855         } else if (current_valid(st)) {
1856             slog(st,LOG_DROP,"ignoring PROD when we think we have a key");
1857         } else {
1858             initiate_key_setup(st,"peer sent PROD packet",source);
1859         }
1860         BUF_FREE(buf);
1861         return True;
1862     }
1863     if (dest==st->index) {
1864         /* Explicitly addressed to us */
1865         if (msgtype!=LABEL_MSG0) dump_packet(st,buf,source,True,True);
1866         switch (msgtype) {
1867         case LABEL_NAK:
1868             /* If the source is our current peer then initiate a key setup,
1869                because our peer's forgotten the key */
1870             if (get_uint32(buf->start+4)==st->current.remote_session_id) {
1871                 bool_t initiated;
1872                 initiated = initiate_key_setup(st,"received a NAK",source);
1873                 if (!initiated) generate_send_prod(st,source);
1874             } else {
1875                 slog(st,LOG_SEC,"bad incoming NAK");
1876             }
1877             break;
1878         case LABEL_MSG0:
1879             process_msg0(st,buf,source);
1880             break;
1881         case LABEL_MSG1:
1882             /* Setup packet: should not have been explicitly addressed
1883                to us */
1884             slog(st,LOG_SEC,"incoming explicitly addressed msg1");
1885             break;
1886         case LABEL_MSG2:
1887             /* Setup packet: expected only in state SENTMSG1 */
1888             if (st->state!=SITE_SENTMSG1) {
1889                 slog(st,LOG_UNEXPECTED,"unexpected MSG2");
1890             } else if (process_msg2(st,buf,source)) {
1891                 transport_setup_msgok(st,source);
1892                 enter_new_state(st,SITE_SENTMSG3);
1893             } else {
1894                 slog(st,LOG_SEC,"invalid MSG2");
1895             }
1896             break;
1897         case LABEL_MSG3:
1898         case LABEL_MSG3BIS:
1899             /* Setup packet: expected only in state SENTMSG2 */
1900             if (st->state!=SITE_SENTMSG2) {
1901                 slog(st,LOG_UNEXPECTED,"unexpected MSG3");
1902             } else if (process_msg3(st,buf,source,msgtype)) {
1903                 transport_setup_msgok(st,source);
1904                 enter_new_state(st,SITE_SENTMSG4);
1905             } else {
1906                 slog(st,LOG_SEC,"invalid MSG3");
1907             }
1908             break;
1909         case LABEL_MSG4:
1910             /* Setup packet: expected only in state SENTMSG3 */
1911             if (st->state!=SITE_SENTMSG3) {
1912                 slog(st,LOG_UNEXPECTED,"unexpected MSG4");
1913             } else if (process_msg4(st,buf,source)) {
1914                 transport_setup_msgok(st,source);
1915                 enter_new_state(st,SITE_SENTMSG5);
1916             } else {
1917                 slog(st,LOG_SEC,"invalid MSG4");
1918             }
1919             break;
1920         case LABEL_MSG5:
1921             /* Setup packet: expected only in state SENTMSG4 */
1922             /* (may turn up in state RUN if our return MSG6 was lost
1923                and the new key has already been activated. In that
1924                case we discard it. The peer will realise that we
1925                are using the new key when they see our data packets.
1926                Until then the peer's data packets to us get discarded. */
1927             if (st->state==SITE_SENTMSG4) {
1928                 if (process_msg5(st,buf,source,st->new_transform)) {
1929                     transport_setup_msgok(st,source);
1930                     enter_new_state(st,SITE_RUN);
1931                 } else {
1932                     slog(st,LOG_SEC,"invalid MSG5");
1933                 }
1934             } else if (st->state==SITE_RUN) {
1935                 if (process_msg5(st,buf,source,st->current.transform)) {
1936                     slog(st,LOG_DROP,"got MSG5, retransmitting MSG6");
1937                     transport_setup_msgok(st,source);
1938                     create_msg6(st,st->current.transform,
1939                                 st->current.remote_session_id);
1940                     transport_xmit(st,&st->peers,&st->buffer,True);
1941                     BUF_FREE(&st->buffer);
1942                 } else {
1943                     slog(st,LOG_SEC,"invalid MSG5 (in state RUN)");
1944                 }
1945             } else {
1946                 slog(st,LOG_UNEXPECTED,"unexpected MSG5");
1947             }
1948             break;
1949         case LABEL_MSG6:
1950             /* Setup packet: expected only in state SENTMSG5 */
1951             if (st->state!=SITE_SENTMSG5) {
1952                 slog(st,LOG_UNEXPECTED,"unexpected MSG6");
1953             } else if (process_msg6(st,buf,source)) {
1954                 BUF_FREE(&st->buffer); /* Free message 5 */
1955                 transport_setup_msgok(st,source);
1956                 activate_new_key(st);
1957             } else {
1958                 slog(st,LOG_SEC,"invalid MSG6");
1959             }
1960             break;
1961         default:
1962             slog(st,LOG_SEC,"received message of unknown type 0x%08x",
1963                  msgtype);
1964             break;
1965         }
1966         BUF_FREE(buf);
1967         return True;
1968     }
1969
1970     return False;
1971 }
1972
1973 static void site_control(void *vst, bool_t run)
1974 {
1975     struct site *st=vst;
1976     if (run) enter_state_run(st);
1977     else enter_state_stop(st);
1978 }
1979
1980 static void site_phase_hook(void *sst, uint32_t newphase)
1981 {
1982     struct site *st=sst;
1983
1984     /* The program is shutting down; tell our peer */
1985     send_msg7(st,"shutting down");
1986 }
1987
1988 static void site_childpersist_clearkeys(void *sst, uint32_t newphase)
1989 {
1990     struct site *st=sst;
1991     dispose_transform(&st->current.transform);
1992     dispose_transform(&st->auxiliary_key.transform);
1993     dispose_transform(&st->new_transform);
1994     /* Not much point overwiting the signing key, since we loaded it
1995        from disk, and it is only valid prospectively if at all,
1996        anyway. */
1997     /* XXX it would be best to overwrite the DH state, because that
1998        _is_ relevant to forward secrecy.  However we have no
1999        convenient interface for doing that and in practice gmp has
2000        probably dribbled droppings all over the malloc arena.  A good
2001        way to fix this would be to have a privsep child for asymmetric
2002        crypto operations, but that's a task for another day. */
2003 }
2004
2005 static list_t *site_apply(closure_t *self, struct cloc loc, dict_t *context,
2006                           list_t *args)
2007 {
2008     static uint32_t index_sequence;
2009     struct site *st;
2010     item_t *item;
2011     dict_t *dict;
2012     int i;
2013
2014     NEW(st);
2015
2016     st->cl.description="site";
2017     st->cl.type=CL_SITE;
2018     st->cl.apply=NULL;
2019     st->cl.interface=&st->ops;
2020     st->ops.st=st;
2021     st->ops.control=site_control;
2022     st->ops.status=site_status;
2023
2024     /* First parameter must be a dict */
2025     item=list_elem(args,0);
2026     if (!item || item->type!=t_dict)
2027         cfgfatal(loc,"site","parameter must be a dictionary\n");
2028     
2029     dict=item->data.dict;
2030     st->localname=dict_read_string(dict, "local-name", True, "site", loc);
2031     st->remotename=dict_read_string(dict, "name", True, "site", loc);
2032
2033     st->keepalive=dict_read_bool(dict,"keepalive",False,"site",loc,False);
2034
2035     st->peer_mobile=dict_read_bool(dict,"mobile",False,"site",loc,False);
2036     st->local_mobile=
2037         dict_read_bool(dict,"local-mobile",False,"site",loc,False);
2038
2039     /* Sanity check (which also allows the 'sites' file to include
2040        site() closures for all sites including our own): refuse to
2041        talk to ourselves */
2042     if (strcmp(st->localname,st->remotename)==0) {
2043         Message(M_DEBUG,"site %s: local-name==name -> ignoring this site\n",
2044                 st->localname);
2045         if (st->peer_mobile != st->local_mobile)
2046             cfgfatal(loc,"site","site %s's peer-mobile=%d"
2047                     " but our local-mobile=%d\n",
2048                     st->localname, st->peer_mobile, st->local_mobile);
2049         free(st);
2050         return NULL;
2051     }
2052     if (st->peer_mobile && st->local_mobile) {
2053         Message(M_WARNING,"site %s: site is mobile but so are we"
2054                 " -> ignoring this site\n", st->remotename);
2055         free(st);
2056         return NULL;
2057     }
2058
2059     assert(index_sequence < 0xffffffffUL);
2060     st->index = ++index_sequence;
2061     st->local_capabilities = 0;
2062     st->netlink=find_cl_if(dict,"link",CL_NETLINK,True,"site",loc);
2063
2064 #define GET_CLOSURE_LIST(dictkey,things,nthings,CL_TYPE) do{            \
2065     list_t *things##_cfg=dict_lookup(dict,dictkey);                     \
2066     if (!things##_cfg)                                                  \
2067         cfgfatal(loc,"site","closure list \"%s\" not found\n",dictkey); \
2068     st->nthings=list_length(things##_cfg);                              \
2069     NEW_ARY(st->things,st->nthings);                                    \
2070     assert(st->nthings);                                                \
2071     for (i=0; i<st->nthings; i++) {                                     \
2072         item_t *item=list_elem(things##_cfg,i);                         \
2073         if (item->type!=t_closure)                                      \
2074             cfgfatal(loc,"site","%s is not a closure\n",dictkey);       \
2075         closure_t *cl=item->data.closure;                               \
2076         if (cl->type!=CL_TYPE)                                          \
2077             cfgfatal(loc,"site","%s closure wrong type\n",dictkey);     \
2078         st->things[i]=cl->interface;                                    \
2079     }                                                                   \
2080 }while(0)
2081
2082     GET_CLOSURE_LIST("comm",comms,ncomms,CL_COMM);
2083
2084     NEW_ARY(st->commclientinfos, st->ncomms);
2085     dict_t *comminfo = dict_read_dict(dict,"comm-info",False,"site",loc);
2086     for (i=0; i<st->ncomms; i++) {
2087         st->commclientinfos[i] =
2088             !comminfo ? 0 :
2089             st->comms[i]->clientinfo(st->comms[i],comminfo,loc);
2090     }
2091
2092     st->resolver=find_cl_if(dict,"resolver",CL_RESOLVER,True,"site",loc);
2093     st->log=find_cl_if(dict,"log",CL_LOG,True,"site",loc);
2094     st->random=find_cl_if(dict,"random",CL_RANDOMSRC,True,"site",loc);
2095
2096     st->privkey=find_cl_if(dict,"local-key",CL_RSAPRIVKEY,True,"site",loc);
2097     st->addresses=dict_read_string_array(dict,"address",False,"site",loc,0);
2098     if (st->addresses)
2099         st->remoteport=dict_read_number(dict,"port",True,"site",loc,0);
2100     else st->remoteport=0;
2101     st->pubkey=find_cl_if(dict,"key",CL_RSAPUBKEY,True,"site",loc);
2102
2103     GET_CLOSURE_LIST("transform",transforms,ntransforms,CL_TRANSFORM);
2104
2105     st->dh=find_cl_if(dict,"dh",CL_DH,True,"site",loc);
2106     st->hash=find_cl_if(dict,"hash",CL_HASH,True,"site",loc);
2107
2108 #define DEFAULT(D) (st->peer_mobile || st->local_mobile \
2109                     ? DEFAULT_MOBILE_##D : DEFAULT_##D)
2110 #define CFG_NUMBER(k,D) dict_read_number(dict,(k),False,"site",loc,DEFAULT(D));
2111
2112     st->key_lifetime=         CFG_NUMBER("key-lifetime",  KEY_LIFETIME);
2113     st->setup_retries=        CFG_NUMBER("setup-retries", SETUP_RETRIES);
2114     st->setup_retry_interval= CFG_NUMBER("setup-timeout", SETUP_RETRY_INTERVAL);
2115     st->wait_timeout=         CFG_NUMBER("wait-time",     WAIT_TIME);
2116     st->mtu_target= dict_read_number(dict,"mtu-target",False,"site",loc,0);
2117
2118     st->mobile_peer_expiry= dict_read_number(
2119        dict,"mobile-peer-expiry",False,"site",loc,DEFAULT_MOBILE_PEER_EXPIRY);
2120
2121     const char *peerskey= st->peer_mobile
2122         ? "mobile-peers-max" : "static-peers-max";
2123     st->transport_peers_max= dict_read_number(
2124         dict,peerskey,False,"site",loc, st->addresses ? 4 : 3);
2125     if (st->transport_peers_max<1 ||
2126         st->transport_peers_max>MAX_PEER_ADDRS) {
2127         cfgfatal(loc,"site", "%s must be in range 1.."
2128                  STRING(MAX_PEER_ADDRS) "\n", peerskey);
2129     }
2130
2131     if (st->key_lifetime < DEFAULT(KEY_RENEGOTIATE_GAP)*2)
2132         st->key_renegotiate_time=st->key_lifetime/2;
2133     else
2134         st->key_renegotiate_time=st->key_lifetime-DEFAULT(KEY_RENEGOTIATE_GAP);
2135     st->key_renegotiate_time=dict_read_number(
2136         dict,"renegotiate-time",False,"site",loc,st->key_renegotiate_time);
2137     if (st->key_renegotiate_time > st->key_lifetime) {
2138         cfgfatal(loc,"site",
2139                  "renegotiate-time must be less than key-lifetime\n");
2140     }
2141
2142     st->log_events=string_list_to_word(dict_lookup(dict,"log-events"),
2143                                        log_event_table,"site");
2144
2145     st->resolving_count=0;
2146     st->allow_send_prod=0;
2147
2148     st->tunname=safe_malloc(strlen(st->localname)+strlen(st->remotename)+5,
2149                             "site_apply");
2150     sprintf(st->tunname,"%s<->%s",st->localname,st->remotename);
2151
2152     /* The information we expect to see in incoming messages of type 1 */
2153     /* fixme: lots of unchecked overflows here, but the results are only
2154        corrupted packets rather than undefined behaviour */
2155     st->our_name_later=(strcmp(st->localname,st->remotename)>0);
2156
2157     buffer_new(&st->buffer,SETUP_BUFFER_LEN);
2158
2159     buffer_new(&st->scratch,SETUP_BUFFER_LEN);
2160     BUF_ALLOC(&st->scratch,"site:scratch");
2161
2162     /* We are interested in poll(), but only for timeouts. We don't have
2163        any fds of our own. */
2164     register_for_poll(st, site_beforepoll, site_afterpoll, "site");
2165     st->timeout=0;
2166
2167     st->remote_capabilities=0;
2168     st->chosen_transform=0;
2169     st->current.key_timeout=0;
2170     st->auxiliary_key.key_timeout=0;
2171     transport_peers_clear(st,&st->peers);
2172     transport_peers_clear(st,&st->setup_peers);
2173     /* XXX mlock these */
2174     st->dhsecret=safe_malloc(st->dh->len,"site:dhsecret");
2175     st->sharedsecretlen=st->sharedsecretallocd=0;
2176     st->sharedsecret=0;
2177
2178     for (i=0; i<st->ntransforms; i++) {
2179         struct transform_if *ti=st->transforms[i];
2180         uint32_t capbit = 1UL << ti->capab_transformnum;
2181         if (st->local_capabilities & capbit)
2182             slog(st,LOG_ERROR,"transformnum capability bit"
2183                  " %d (%#"PRIx32") reused", ti->capab_transformnum, capbit);
2184         st->local_capabilities |= capbit;
2185     }
2186
2187     if (st->local_mobile || st->peer_mobile)
2188         st->local_capabilities |= CAPAB_PRIORITY_MOBILE;
2189
2190     /* We need to register the remote networks with the netlink device */
2191     uint32_t netlink_mtu; /* local virtual interface mtu */
2192     st->netlink->reg(st->netlink->st, site_outgoing, st, &netlink_mtu);
2193     if (!st->mtu_target)
2194         st->mtu_target=netlink_mtu;
2195     
2196     for (i=0; i<st->ncomms; i++)
2197         st->comms[i]->request_notify(st->comms[i]->st, st, site_incoming);
2198
2199     st->current.transform=0;
2200     st->auxiliary_key.transform=0;
2201     st->new_transform=0;
2202     st->auxiliary_is_new=0;
2203
2204     enter_state_stop(st);
2205
2206     add_hook(PHASE_SHUTDOWN,site_phase_hook,st);
2207     add_hook(PHASE_CHILDPERSIST,site_childpersist_clearkeys,st);
2208
2209     return new_closure(&st->cl);
2210 }
2211
2212 void site_module(dict_t *dict)
2213 {
2214     add_closure(dict,"site",site_apply);
2215 }
2216
2217
2218 /***** TRANSPORT PEERS definitions *****/
2219
2220 static void transport_peers_debug(struct site *st, transport_peers *dst,
2221                                   const char *didwhat,
2222                                   int nargs, const struct comm_addr *args,
2223                                   size_t stride) {
2224     int i;
2225     char *argp;
2226
2227     if (!(st->log_events & LOG_PEER_ADDRS))
2228         return; /* an optimisation */
2229
2230     slog(st, LOG_PEER_ADDRS, "peers (%s) %s nargs=%d => npeers=%d",
2231          (dst==&st->peers ? "data" :
2232           dst==&st->setup_peers ? "setup" : "UNKNOWN"),
2233          didwhat, nargs, dst->npeers);
2234
2235     for (i=0, argp=(void*)args;
2236          i<nargs;
2237          i++, (argp+=stride?stride:sizeof(*args))) {
2238         const struct comm_addr *ca=(void*)argp;
2239         slog(st, LOG_PEER_ADDRS, " args: addrs[%d]=%s",
2240              i, comm_addr_to_string(ca));
2241     }
2242     for (i=0; i<dst->npeers; i++) {
2243         struct timeval diff;
2244         timersub(tv_now,&dst->peers[i].last,&diff);
2245         const struct comm_addr *ca=&dst->peers[i].addr;
2246         slog(st, LOG_PEER_ADDRS, " peers: addrs[%d]=%s T-%ld.%06ld",
2247              i, comm_addr_to_string(ca),
2248              (unsigned long)diff.tv_sec, (unsigned long)diff.tv_usec);
2249     }
2250 }
2251
2252 static void transport_peers_expire(struct site *st, transport_peers *peers) {
2253     /* peers must be sorted first */
2254     int previous_peers=peers->npeers;
2255     struct timeval oldest;
2256     oldest.tv_sec  = tv_now->tv_sec - st->mobile_peer_expiry;
2257     oldest.tv_usec = tv_now->tv_usec;
2258     while (peers->npeers>1 &&
2259            timercmp(&peers->peers[peers->npeers-1].last, &oldest, <))
2260         peers->npeers--;
2261     if (peers->npeers != previous_peers)
2262         transport_peers_debug(st,peers,"expire", 0,0,0);
2263 }
2264
2265 static bool_t transport_peer_record_one(struct site *st, transport_peers *peers,
2266                                         const struct comm_addr *ca,
2267                                         const struct timeval *tv) {
2268     /* returns false if output is full */
2269     int search;
2270
2271     if (peers->npeers >= st->transport_peers_max)
2272         return 0;
2273
2274     for (search=0; search<peers->npeers; search++)
2275         if (comm_addr_equal(&peers->peers[search].addr, ca))
2276             return 1;
2277
2278     peers->peers[peers->npeers].addr = *ca;
2279     peers->peers[peers->npeers].last = *tv;
2280     peers->npeers++;
2281     return 1;
2282 }
2283
2284 static void transport_record_peers(struct site *st, transport_peers *peers,
2285                                    const struct comm_addr *addrs, int naddrs,
2286                                    const char *m) {
2287     /* We add addrs into peers.  The new entries end up at the front
2288      * and displace entries towards the end (perhaps even off the
2289      * end).  Any existing matching entries are moved up to the front.
2290      *
2291      * Caller must first call transport_peers_expire. */
2292
2293     if (naddrs==1) {
2294         /* avoids debug for uninteresting updates */
2295         int i;
2296         for (i=0; i<peers->npeers; i++) {
2297             if (comm_addr_equal(&addrs[0], &peers->peers[i].addr)) {
2298                 memmove(peers->peers+1, peers->peers,
2299                         sizeof(peers->peers[0]) * i);
2300                 peers->peers[0].addr = addrs[0];
2301                 peers->peers[0].last = *tv_now;
2302                 return;
2303             }
2304         }
2305     }
2306
2307     int old_npeers=peers->npeers;
2308     transport_peer old_peers[old_npeers];
2309     COPY_ARRAY(old_peers,peers->peers,old_npeers);
2310
2311     peers->npeers=0;
2312     int i;
2313     for (i=0; i<naddrs; i++) {
2314         if (!transport_peer_record_one(st,peers, &addrs[i], tv_now))
2315             break;
2316     }
2317     for (i=0; i<old_npeers; i++) {
2318         const transport_peer *old=&old_peers[i];
2319         if (!transport_peer_record_one(st,peers, &old->addr, &old->last))
2320             break;
2321     }
2322
2323     transport_peers_debug(st,peers,m, naddrs,addrs,0);
2324 }
2325
2326 static void transport_expire_record_peers(struct site *st,
2327                                           transport_peers *peers,
2328                                           const struct comm_addr *addrs,
2329                                           int naddrs, const char *m) {
2330     /* Convenience function */
2331     transport_peers_expire(st,peers);
2332     transport_record_peers(st,peers,addrs,naddrs,m);
2333 }
2334
2335 static bool_t transport_compute_setupinit_peers(struct site *st,
2336         const struct comm_addr *configured_addrs /* 0 if none or not found */,
2337         int n_configured_addrs /* 0 if none or not found */,
2338         const struct comm_addr *incoming_packet_addr /* 0 if none */) {
2339     if (!n_configured_addrs && !incoming_packet_addr &&
2340         !transport_peers_valid(&st->peers))
2341         return False;
2342
2343     slog(st,LOG_SETUP_INIT,
2344          "using: %d configured addr(s);%s %d old peer addrs(es)",
2345          n_configured_addrs,
2346          incoming_packet_addr ? " incoming packet address;" : "",
2347          st->peers.npeers);
2348
2349     /* Non-mobile peers try addresses until one is plausible.  The
2350      * effect is that this code always tries first the configured
2351      * address if supplied, or otherwise the address of the incoming
2352      * PROD, or finally the existing data peer if one exists; this is
2353      * as desired. */
2354
2355     transport_peers_copy(st,&st->setup_peers,&st->peers);
2356     transport_peers_expire(st,&st->setup_peers);
2357
2358     if (incoming_packet_addr)
2359         transport_record_peers(st,&st->setup_peers,
2360                                incoming_packet_addr,1, "incoming");
2361
2362     if (n_configured_addrs)
2363         transport_record_peers(st,&st->setup_peers,
2364                               configured_addrs,n_configured_addrs, "setupinit");
2365
2366     assert(transport_peers_valid(&st->setup_peers));
2367     return True;
2368 }
2369
2370 static void transport_setup_msgok(struct site *st, const struct comm_addr *a) {
2371     if (st->peer_mobile)
2372         transport_expire_record_peers(st,&st->setup_peers,a,1,"setupmsg");
2373 }
2374 static void transport_data_msgok(struct site *st, const struct comm_addr *a) {
2375     if (st->peer_mobile)
2376         transport_expire_record_peers(st,&st->peers,a,1,"datamsg");
2377 }
2378
2379 static int transport_peers_valid(transport_peers *peers) {
2380     return peers->npeers;
2381 }
2382 static void transport_peers_clear(struct site *st, transport_peers *peers) {
2383     peers->npeers= 0;
2384     transport_peers_debug(st,peers,"clear",0,0,0);
2385 }
2386 static void transport_peers_copy(struct site *st, transport_peers *dst,
2387                                  const transport_peers *src) {
2388     dst->npeers=src->npeers;
2389     COPY_ARRAY(dst->peers, src->peers, dst->npeers);
2390     transport_peers_debug(st,dst,"copy",
2391                           src->npeers, &src->peers->addr, sizeof(*src->peers));
2392 }
2393
2394 static void transport_resolve_complete(struct site *st,
2395                                        const struct comm_addr *addrs,
2396                                        int naddrs) {
2397     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2398                                   "resolved data");
2399     transport_expire_record_peers(st,&st->setup_peers,addrs,naddrs,
2400                                   "resolved setup");
2401 }
2402
2403 static void transport_resolve_complete_tardy(struct site *st,
2404                                              const struct comm_addr *addrs,
2405                                              int naddrs) {
2406     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2407                                   "resolved tardily");
2408 }
2409
2410 static void transport_peers__copy_by_mask(transport_peer *out, int *nout_io,
2411                                           unsigned mask,
2412                                           const transport_peers *inp) {
2413     /* out and in->peers may be the same region, or nonoverlapping */
2414     const transport_peer *in=inp->peers;
2415     int slot;
2416     for (slot=0; slot<inp->npeers; slot++) {
2417         if (!(mask & (1U << slot)))
2418             continue;
2419         if (!(out==in && slot==*nout_io))
2420             COPY_OBJ(out[*nout_io], in[slot]);
2421         (*nout_io)++;
2422     }
2423 }
2424
2425 void transport_xmit(struct site *st, transport_peers *peers,
2426                     struct buffer_if *buf, bool_t candebug) {
2427     int slot;
2428     transport_peers_expire(st, peers);
2429     unsigned failed=0; /* bitmask */
2430     assert(MAX_PEER_ADDRS < sizeof(unsigned)*CHAR_BIT);
2431
2432     int nfailed=0;
2433     for (slot=0; slot<peers->npeers; slot++) {
2434         transport_peer *peer=&peers->peers[slot];
2435         bool_t ok = comm_addr_sendmsg(st, &peer->addr, buf);
2436         if (candebug)
2437             dump_packet(st, buf, &peer->addr, False, ok);
2438         if (!ok) {
2439             failed |= 1U << slot;
2440             nfailed++;
2441         }
2442         if (ok && !st->peer_mobile)
2443             break;
2444     }
2445     /* Now we need to demote/delete failing addrs: if we are mobile we
2446      * merely demote them; otherwise we delete them. */
2447     if (st->local_mobile) {
2448         unsigned expected = ((1U << nfailed)-1) << (peers->npeers-nfailed);
2449         /* `expected' has all the failures at the end already */
2450         if (failed != expected) {
2451             int fslot=0;
2452             transport_peer failedpeers[nfailed];
2453             transport_peers__copy_by_mask(failedpeers, &fslot, failed,peers);
2454             assert(fslot == nfailed);
2455             int wslot=0;
2456             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2457             assert(wslot+nfailed == peers->npeers);
2458             COPY_ARRAY(peers->peers+wslot, failedpeers, nfailed);
2459             transport_peers_debug(st,peers,"mobile failure reorder",0,0,0);
2460         }
2461     } else {
2462         if (failed && peers->npeers > 1) {
2463             int wslot=0;
2464             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2465             peers->npeers=wslot;
2466             transport_peers_debug(st,peers,"non-mobile failure cleanup",0,0,0);
2467         }
2468     }
2469 }
2470
2471 /***** END of transport peers declarations *****/