chiark / gitweb /
d0dd909d57aac307373df6c3132997f795f1c270
[secnet.git] / site.c
1 /* site.c - manage communication with a remote network site */
2
3 /*
4  * This file is part of secnet.
5  * See README for full list of copyright holders.
6  *
7  * secnet is free software; you can redistribute it and/or modify it
8  * under the terms of the GNU General Public License as published by
9  * the Free Software Foundation; either version 3 of the License, or
10  * (at your option) any later version.
11  * 
12  * secnet is distributed in the hope that it will be useful, but
13  * WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15  * General Public License for more details.
16  * 
17  * You should have received a copy of the GNU General Public License
18  * version 3 along with secnet; if not, see
19  * https://www.gnu.org/licenses/gpl.html.
20  */
21
22 /* The 'site' code doesn't know anything about the structure of the
23    packets it's transmitting.  In fact, under the new netlink
24    configuration scheme it doesn't need to know anything at all about
25    IP addresses, except how to contact its peer.  This means it could
26    potentially be used to tunnel other protocols too (IPv6, IPX, plain
27    old Ethernet frames) if appropriate netlink code can be written
28    (and that ought not to be too hard, eg. using the TUN/TAP device to
29    pretend to be an Ethernet interface).  */
30
31 /* At some point in the future the netlink code will be asked for
32    configuration information to go in the PING/PONG packets at the end
33    of the key exchange. */
34
35 #include "secnet.h"
36 #include <stdio.h>
37 #include <string.h>
38 #include <limits.h>
39 #include <assert.h>
40 #include <sys/socket.h>
41
42 #include <sys/mman.h>
43 #include "util.h"
44 #include "unaligned.h"
45 #include "magic.h"
46
47 #define SETUP_BUFFER_LEN 2048
48
49 #define DEFAULT_KEY_LIFETIME                  (3600*1000) /* [ms] */
50 #define DEFAULT_KEY_RENEGOTIATE_GAP           (5*60*1000) /* [ms] */
51 #define DEFAULT_SETUP_RETRIES 5
52 #define DEFAULT_SETUP_RETRY_INTERVAL             (2*1000) /* [ms] */
53 #define DEFAULT_WAIT_TIME                       (20*1000) /* [ms] */
54
55 #define DEFAULT_MOBILE_KEY_LIFETIME      (2*24*3600*1000) /* [ms] */
56 #define DEFAULT_MOBILE_KEY_RENEGOTIATE_GAP (12*3600*1000) /* [ms] */
57 #define DEFAULT_MOBILE_SETUP_RETRIES 30
58 #define DEFAULT_MOBILE_SETUP_RETRY_INTERVAL      (1*1000) /* [ms] */
59 #define DEFAULT_MOBILE_WAIT_TIME                (10*1000) /* [ms] */
60
61 #define DEFAULT_MOBILE_PEER_EXPIRY            (2*60)      /* [s] */
62
63 /* Each site can be in one of several possible states. */
64
65 /* States:
66    SITE_STOP         - nothing is allowed to happen; tunnel is down;
67                        all session keys have been erased
68      -> SITE_RUN upon external instruction
69    SITE_RUN          - site up, maybe with valid key
70      -> SITE_RESOLVE upon outgoing packet and no valid key
71          we start name resolution for the other end of the tunnel
72      -> SITE_SENTMSG2 upon valid incoming message 1 and suitable time
73          we send an appropriate message 2
74    SITE_RESOLVE      - waiting for name resolution
75      -> SITE_SENTMSG1 upon successful resolution
76          we send an appropriate message 1
77      -> SITE_SENTMSG2 upon valid incoming message 1 (then abort resolution)
78          we abort resolution and 
79      -> SITE_WAIT on timeout or resolution failure
80    SITE_SENTMSG1
81      -> SITE_SENTMSG2 upon valid incoming message 1 from higher priority end
82      -> SITE_SENTMSG3 upon valid incoming message 2
83      -> SITE_WAIT on timeout
84    SITE_SENTMSG2
85      -> SITE_SENTMSG4 upon valid incoming message 3
86      -> SITE_WAIT on timeout
87    SITE_SENTMSG3
88      -> SITE_SENTMSG5 upon valid incoming message 4
89      -> SITE_WAIT on timeout
90    SITE_SENTMSG4
91      -> SITE_RUN upon valid incoming message 5
92      -> SITE_WAIT on timeout
93    SITE_SENTMSG5
94      -> SITE_RUN upon valid incoming message 6
95      -> SITE_WAIT on timeout
96    SITE_WAIT         - failed to establish key; do nothing for a while
97      -> SITE_RUN on timeout
98    */
99
100 #define SITE_STOP     0
101 #define SITE_RUN      1
102 #define SITE_RESOLVE  2
103 #define SITE_SENTMSG1 3
104 #define SITE_SENTMSG2 4
105 #define SITE_SENTMSG3 5
106 #define SITE_SENTMSG4 6
107 #define SITE_SENTMSG5 7
108 #define SITE_WAIT     8
109
110 int32_t site_max_start_pad = 4*4;
111
112 static cstring_t state_name(uint32_t state)
113 {
114     switch (state) {
115     case 0: return "STOP";
116     case 1: return "RUN";
117     case 2: return "RESOLVE";
118     case 3: return "SENTMSG1";
119     case 4: return "SENTMSG2";
120     case 5: return "SENTMSG3";
121     case 6: return "SENTMSG4";
122     case 7: return "SENTMSG5";
123     case 8: return "WAIT";
124     default: return "*bad state*";
125     }
126 }
127
128 #define NONCELEN 8
129
130 #define LOG_UNEXPECTED    0x00000001
131 #define LOG_SETUP_INIT    0x00000002
132 #define LOG_SETUP_TIMEOUT 0x00000004
133 #define LOG_ACTIVATE_KEY  0x00000008
134 #define LOG_TIMEOUT_KEY   0x00000010
135 #define LOG_SEC           0x00000020
136 #define LOG_STATE         0x00000040
137 #define LOG_DROP          0x00000080
138 #define LOG_DUMP          0x00000100
139 #define LOG_ERROR         0x00000400
140 #define LOG_PEER_ADDRS    0x00000800
141
142 static struct flagstr log_event_table[]={
143     { "unexpected", LOG_UNEXPECTED },
144     { "setup-init", LOG_SETUP_INIT },
145     { "setup-timeout", LOG_SETUP_TIMEOUT },
146     { "activate-key", LOG_ACTIVATE_KEY },
147     { "timeout-key", LOG_TIMEOUT_KEY },
148     { "security", LOG_SEC },
149     { "state-change", LOG_STATE },
150     { "packet-drop", LOG_DROP },
151     { "dump-packets", LOG_DUMP },
152     { "errors", LOG_ERROR },
153     { "peer-addrs", LOG_PEER_ADDRS },
154     { "default", LOG_SETUP_INIT|LOG_SETUP_TIMEOUT|
155       LOG_ACTIVATE_KEY|LOG_TIMEOUT_KEY|LOG_SEC|LOG_ERROR },
156     { "all", 0xffffffff },
157     { NULL, 0 }
158 };
159
160
161 /***** TRANSPORT PEERS declarations *****/
162
163 /* Details of "mobile peer" semantics:
164
165    - We use the same data structure for the different configurations,
166      but manage it with different algorithms.
167    
168    - We record up to mobile_peers_max peer address/port numbers
169      ("peers") for key setup, and separately up to mobile_peers_max
170      for data transfer.
171
172    - In general, we make a new set of addrs (see below) when we start
173      a new key exchange; the key setup addrs become the data transport
174      addrs when key setup complets.
175
176    If our peer is mobile:
177
178    - We send to all recent addresses of incoming packets, plus
179      initially all configured addresses (which we also expire).
180
181    - So, we record addrs of good incoming packets, as follows:
182       1. expire any peers last seen >120s ("mobile-peer-expiry") ago
183       2. add the peer of the just received packet to the applicable list
184          (possibly evicting the oldest entries to make room)
185      NB that we do not expire peers until an incoming packet arrives.
186
187    - If the peer has a configured address or name, we record them the
188      same way, but only as a result of our own initiation of key
189      setup.  (We might evict some incoming packet addrs to make room.)
190
191    - The default number of addrs to keep is 3, or 4 if we have a
192      configured name or address.  That's space for two configured
193      addresses (one IPv6 and one IPv4), plus two received addresses.
194
195    - Outgoing packets are sent to every recorded address in the
196      applicable list.  Any unsupported[1] addresses are deleted from
197      the list right away.  (This should only happen to configured
198      addresses, of course, but there is no need to check that.)
199
200    - When we successfully complete a key setup, we merge the key setup
201      peers into the data transfer peers.
202
203    [1] An unsupported address is one for whose AF we don't have a
204      socket (perhaps because we got EAFNOSUPPORT or some such) or for
205      which sendto gives ENETUNREACH.
206
207    If neither end is mobile:
208
209    - When peer initiated the key exchange, we use the incoming packet
210      address.
211
212    - When we initiate the key exchange, we try configured addresses
213      until we get one which isn't unsupported then fixate on that.
214
215    - When we complete a key setup, we replace the data transport peers
216      with those from the key setup.
217
218    If we are mobile:
219
220    - We can't tell when local network setup changes so we can't cache
221      the unsupported addrs and completely remove the spurious calls to
222      sendto, but we can optimise things a bit by deprioritising addrs
223      which seem to be unsupported.
224
225    - Use only configured addresses.  (Except, that if our peer
226      initiated a key exchange we use the incoming packet address until
227      our name resolution completes.)
228
229    - When we send a packet, try each address in turn; if addr
230      supported, put that address to the end of the list for future
231      packets, and go onto the next address.
232
233    - When we complete a key setup, we replace the data transport peers
234      with those from the key setup.
235
236    */
237
238 typedef struct {
239     struct timeval last;
240     struct comm_addr addr;
241 } transport_peer;
242
243 typedef struct {
244 /* configuration information */
245 /* runtime information */
246     int npeers;
247     transport_peer peers[MAX_PEER_ADDRS];
248 } transport_peers;
249
250 /* Basic operations on transport peer address sets */
251 static void transport_peers_clear(struct site *st, transport_peers *peers);
252 static int transport_peers_valid(transport_peers *peers);
253 static void transport_peers_copy(struct site *st, transport_peers *dst,
254                                  const transport_peers *src);
255
256 /* Record address of incoming setup packet; resp. data packet. */
257 static void transport_setup_msgok(struct site *st, const struct comm_addr *a);
258 static void transport_data_msgok(struct site *st, const struct comm_addr *a);
259
260 /* Initialise the setup addresses.  Called before we send the first
261  * packet in a key exchange.  If we are the initiator, as a result of
262  * resolve completing (or being determined not to be relevant) or an
263  * incoming PROD; if we are the responder, as a result of the MSG1. */
264 static bool_t transport_compute_setupinit_peers(struct site *st,
265         const struct comm_addr *configured_addrs /* 0 if none or not found */,
266         int n_configured_addrs /* 0 if none or not found */,
267         const struct comm_addr *incoming_packet_addr /* 0 if none */);
268
269 /* Called if we are the responder in a key setup, when the resolve
270  * completes.  transport_compute_setupinit_peers will hvae been called
271  * earlier.  If _complete is called, we are still doing the key setup
272  * (and we should use the new values for both the rest of the key
273  * setup and the ongoing data exchange); if _tardy is called, the key
274  * setup is done (either completed or not) and only the data peers are
275  * relevant */
276 static void transport_resolve_complete(struct site *st,
277         const struct comm_addr *addrs, int naddrs);
278 static void transport_resolve_complete_tardy(struct site *st,
279         const struct comm_addr *addrs, int naddrs);
280
281 static void transport_xmit(struct site *st, transport_peers *peers,
282                            struct buffer_if *buf, bool_t candebug);
283
284  /***** END of transport peers declarations *****/
285
286
287 struct data_key {
288     struct transform_inst_if *transform;
289     uint64_t key_timeout; /* End of life of current key */
290     uint32_t remote_session_id;
291 };
292
293 struct site {
294     closure_t cl;
295     struct site_if ops;
296 /* configuration information */
297     string_t localname;
298     string_t remotename;
299     bool_t keepalive;
300     bool_t local_mobile, peer_mobile; /* Mobile client support */
301     int32_t transport_peers_max;
302     string_t tunname; /* localname<->remotename by default, used in logs */
303     cstring_t *addresses; /* DNS name or address(es) for bootstrapping, optional */
304     int remoteport; /* Port for bootstrapping, optional */
305     uint32_t mtu_target;
306     struct netlink_if *netlink;
307     struct comm_if **comms;
308     struct comm_clientinfo **commclientinfos;
309     int ncomms;
310     struct resolver_if *resolver;
311     struct log_if *log;
312     struct random_if *random;
313     struct rsaprivkey_if *privkey;
314     struct rsapubkey_if *pubkey;
315     struct transform_if **transforms;
316     int ntransforms;
317     struct dh_if *dh;
318     struct hash_if *hash;
319
320     uint32_t index; /* Index of this site */
321     uint32_t local_capabilities;
322     int32_t setup_retries; /* How many times to send setup packets */
323     int32_t setup_retry_interval; /* Initial timeout for setup packets */
324     int32_t wait_timeout_mean; /* How long to wait if setup unsuccessful */
325     int32_t mobile_peer_expiry; /* How long to remember 2ary addresses */
326     int32_t key_lifetime; /* How long a key lasts once set up */
327     int32_t key_renegotiate_time; /* If we see traffic (or a keepalive)
328                                       after this time, initiate a new
329                                       key exchange */
330
331     bool_t our_name_later; /* our name > peer name */
332     uint32_t log_events;
333
334 /* runtime information */
335     uint32_t state;
336     uint64_t now; /* Most recently seen time */
337     bool_t allow_send_prod;
338     bool_t msg1_crossed_logged;
339     int resolving_count;
340     int resolving_n_results_all;
341     int resolving_n_results_stored;
342     struct comm_addr resolving_results[MAX_PEER_ADDRS];
343
344     /* The currently established session */
345     struct data_key current;
346     struct data_key auxiliary_key;
347     bool_t auxiliary_is_new;
348     uint64_t renegotiate_key_time; /* When we can negotiate a new key */
349     uint64_t auxiliary_renegotiate_key_time;
350     transport_peers peers; /* Current address(es) of peer for data traffic */
351
352     /* The current key setup protocol exchange.  We can only be
353        involved in one of these at a time.  There's a potential for
354        denial of service here (the attacker keeps sending a setup
355        packet; we keep trying to continue the exchange, and have to
356        timeout before we can listen for another setup packet); perhaps
357        we should keep a list of 'bad' sources for setup packets. */
358     uint32_t remote_capabilities;
359     uint16_t remote_adv_mtu;
360     struct transform_if *chosen_transform;
361     uint32_t setup_session_id;
362     transport_peers setup_peers;
363     uint8_t localN[NONCELEN]; /* Nonces for key exchange */
364     uint8_t remoteN[NONCELEN];
365     struct buffer_if buffer; /* Current outgoing key exchange packet */
366     struct buffer_if scratch;
367     int32_t retries; /* Number of retries remaining */
368     uint64_t timeout; /* Timeout for current state */
369     uint8_t *dhsecret;
370     uint8_t *sharedsecret;
371     uint32_t sharedsecretlen, sharedsecretallocd;
372     struct transform_inst_if *new_transform; /* For key setup/verify */
373 };
374
375 static uint32_t event_log_priority(struct site *st, uint32_t event)
376 {
377     if (!(event&st->log_events))
378         return 0;
379     switch(event) {
380     case LOG_UNEXPECTED:    return M_INFO;
381     case LOG_SETUP_INIT:    return M_INFO;
382     case LOG_SETUP_TIMEOUT: return M_NOTICE;
383     case LOG_ACTIVATE_KEY:  return M_INFO;
384     case LOG_TIMEOUT_KEY:   return M_INFO;
385     case LOG_SEC:           return M_SECURITY;
386     case LOG_STATE:         return M_DEBUG;
387     case LOG_DROP:          return M_DEBUG;
388     case LOG_DUMP:          return M_DEBUG;
389     case LOG_ERROR:         return M_ERR;
390     case LOG_PEER_ADDRS:    return M_DEBUG;
391     default:                return M_ERR;
392     }
393 }
394
395 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
396 FORMAT(printf,3,0);
397 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
398 {
399     uint32_t class;
400
401     class=event_log_priority(st, event);
402     if (class) {
403         slilog_part(st->log,class,"%s: ",st->tunname);
404         vslilog_part(st->log,class,msg,ap);
405         slilog_part(st->log,class,"\n");
406     }
407 }
408
409 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
410 FORMAT(printf,3,4);
411 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
412 {
413     va_list ap;
414     va_start(ap,msg);
415     vslog(st,event,msg,ap);
416     va_end(ap);
417 }
418
419 static void logtimeout(struct site *st, const char *fmt, ...)
420 FORMAT(printf,2,3);
421 static void logtimeout(struct site *st, const char *fmt, ...)
422 {
423     uint32_t class=event_log_priority(st,LOG_SETUP_TIMEOUT);
424     if (!class)
425         return;
426
427     va_list ap;
428     va_start(ap,fmt);
429
430     slilog_part(st->log,class,"%s: ",st->tunname);
431     vslilog_part(st->log,class,fmt,ap);
432
433     const char *delim;
434     int i;
435     for (i=0, delim=" (tried ";
436          i<st->setup_peers.npeers;
437          i++, delim=", ") {
438         transport_peer *peer=&st->setup_peers.peers[i];
439         const char *s=comm_addr_to_string(&peer->addr);
440         slilog_part(st->log,class,"%s%s",delim,s);
441     }
442
443     slilog_part(st->log,class,")\n");
444     va_end(ap);
445 }
446
447 static void set_link_quality(struct site *st);
448 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel);
449 static void delete_one_key(struct site *st, struct data_key *key,
450                            const char *reason /* may be 0 meaning don't log*/,
451                            const char *which /* ignored if !reasonn */,
452                            uint32_t loglevel /* ignored if !reasonn */);
453 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
454                                  const struct comm_addr *prod_hint);
455 static void enter_state_run(struct site *st);
456 static bool_t enter_state_resolve(struct site *st);
457 static void decrement_resolving_count(struct site *st, int by);
458 static bool_t enter_new_state(struct site *st,uint32_t next);
459 static void enter_state_wait(struct site *st);
460 static void activate_new_key(struct site *st);
461
462 static bool_t is_transform_valid(struct transform_inst_if *transform)
463 {
464     return transform && transform->valid(transform->st);
465 }
466
467 static bool_t current_valid(struct site *st)
468 {
469     return is_transform_valid(st->current.transform);
470 }
471
472 #define DEFINE_CALL_TRANSFORM(fwdrev)                                   \
473 static transform_apply_return                                           \
474 call_transform_##fwdrev(struct site *st,                                \
475                                    struct transform_inst_if *transform, \
476                                    struct buffer_if *buf,               \
477                                    const char **errmsg)                 \
478 {                                                                       \
479     if (!is_transform_valid(transform)) {                               \
480         *errmsg="transform not set up";                                 \
481         return transform_apply_err;                                     \
482     }                                                                   \
483     return transform->fwdrev(transform->st,buf,errmsg);                 \
484 }
485
486 DEFINE_CALL_TRANSFORM(forwards)
487 DEFINE_CALL_TRANSFORM(reverse)
488
489 static void dispose_transform(struct transform_inst_if **transform_var)
490 {
491     struct transform_inst_if *transform=*transform_var;
492     if (transform) {
493         transform->delkey(transform->st);
494         transform->destroy(transform->st);
495     }
496     *transform_var = 0;
497 }    
498
499 #define CHECK_AVAIL(b,l) do { if ((b)->size<(l)) return False; } while(0)
500 #define CHECK_EMPTY(b) do { if ((b)->size!=0) return False; } while(0)
501 #define CHECK_TYPE(b,t) do { uint32_t type; \
502     CHECK_AVAIL((b),4); \
503     type=buf_unprepend_uint32((b)); \
504     if (type!=(t)) return False; } while(0)
505
506 static _Bool type_is_msg34(uint32_t type)
507 {
508     return
509         type == LABEL_MSG3 ||
510         type == LABEL_MSG3BIS ||
511         type == LABEL_MSG4;
512 }
513
514 struct parsedname {
515     int32_t len;
516     uint8_t *name;
517     struct buffer_if extrainfo;
518 };
519
520 struct msg {
521     uint8_t *hashstart;
522     uint32_t dest;
523     uint32_t source;
524     struct parsedname remote;
525     struct parsedname local;
526     uint32_t remote_capabilities;
527     uint16_t remote_mtu;
528     int capab_transformnum;
529     uint8_t *nR;
530     uint8_t *nL;
531     int32_t pklen;
532     char *pk;
533     int32_t hashlen;
534     int32_t siglen;
535     char *sig;
536 };
537
538 static int32_t wait_timeout(struct site *st) {
539     int32_t t = st->wait_timeout_mean;
540     int8_t factor;
541     if (t < INT_MAX/2) {
542         st->random->generate(st->random->st,sizeof(factor),&factor);
543         t += (t / 256) * factor;
544     }
545     return t;
546 }
547
548 static _Bool set_new_transform(struct site *st, char *pk)
549 {
550     _Bool ok;
551
552     /* Make room for the shared key */
553     st->sharedsecretlen=st->chosen_transform->keylen?:st->dh->ceil_len;
554     assert(st->sharedsecretlen);
555     if (st->sharedsecretlen > st->sharedsecretallocd) {
556         st->sharedsecretallocd=st->sharedsecretlen;
557         st->sharedsecret=safe_realloc_ary(st->sharedsecret,1,
558                                           st->sharedsecretallocd,
559                                           "site:sharedsecret");
560     }
561
562     /* Generate the shared key */
563     st->dh->makeshared(st->dh->st,st->dhsecret,st->dh->len,pk,
564                        st->sharedsecret,st->sharedsecretlen);
565
566     /* Set up the transform */
567     struct transform_if *generator=st->chosen_transform;
568     struct transform_inst_if *generated=generator->create(generator->st);
569     ok = generated->setkey(generated->st,st->sharedsecret,
570                            st->sharedsecretlen,st->our_name_later);
571
572     dispose_transform(&st->new_transform);
573     if (!ok) return False;
574     st->new_transform=generated;
575
576     slog(st,LOG_SETUP_INIT,"key exchange negotiated transform"
577          " %d (capabilities ours=%#"PRIx32" theirs=%#"PRIx32")",
578          st->chosen_transform->capab_transformnum,
579          st->local_capabilities, st->remote_capabilities);
580     return True;
581 }
582
583 struct xinfoadd {
584     int32_t lenpos, afternul;
585 };
586 static void append_string_xinfo_start(struct buffer_if *buf,
587                                       struct xinfoadd *xia,
588                                       const char *str)
589     /* Helps construct one of the names with additional info as found
590      * in MSG1..4.  Call this function first, then append all the
591      * desired extra info (not including the nul byte) to the buffer,
592      * then call append_string_xinfo_done. */
593 {
594     xia->lenpos = buf->size;
595     buf_append_string(buf,str);
596     buf_append_uint8(buf,0);
597     xia->afternul = buf->size;
598 }
599 static void append_string_xinfo_done(struct buffer_if *buf,
600                                      struct xinfoadd *xia)
601 {
602     /* we just need to adjust the string length */
603     if (buf->size == xia->afternul) {
604         /* no extra info, strip the nul too */
605         buf_unappend_uint8(buf);
606     } else {
607         put_uint16(buf->start+xia->lenpos, buf->size-(xia->lenpos+2));
608     }
609 }
610
611 /* Build any of msg1 to msg4. msg5 and msg6 are built from the inside
612    out using a transform of config data supplied by netlink */
613 static bool_t generate_msg(struct site *st, uint32_t type, cstring_t what)
614 {
615     void *hst;
616     uint8_t *hash;
617     string_t dhpub, sig;
618
619     st->retries=st->setup_retries;
620     BUF_ALLOC(&st->buffer,what);
621     buffer_init(&st->buffer,0);
622     buf_append_uint32(&st->buffer,
623         (type==LABEL_MSG1?0:st->setup_session_id));
624     buf_append_uint32(&st->buffer,st->index);
625     buf_append_uint32(&st->buffer,type);
626
627     struct xinfoadd xia;
628     append_string_xinfo_start(&st->buffer,&xia,st->localname);
629     if ((st->local_capabilities & CAPAB_EARLY) || (type != LABEL_MSG1)) {
630         buf_append_uint32(&st->buffer,st->local_capabilities);
631     }
632     if (type_is_msg34(type)) {
633         buf_append_uint16(&st->buffer,st->mtu_target);
634     }
635     append_string_xinfo_done(&st->buffer,&xia);
636
637     buf_append_string(&st->buffer,st->remotename);
638     BUF_ADD_OBJ(append,&st->buffer,st->localN);
639     if (type==LABEL_MSG1) return True;
640     BUF_ADD_OBJ(append,&st->buffer,st->remoteN);
641     if (type==LABEL_MSG2) return True;
642
643     if (hacky_par_mid_failnow()) return False;
644
645     if (type==LABEL_MSG3BIS)
646         buf_append_uint8(&st->buffer,st->chosen_transform->capab_transformnum);
647
648     dhpub=st->dh->makepublic(st->dh->st,st->dhsecret,st->dh->len);
649     buf_append_string(&st->buffer,dhpub);
650     free(dhpub);
651     hash=safe_malloc(st->hash->len, "generate_msg");
652     hst=st->hash->init();
653     st->hash->update(hst,st->buffer.start,st->buffer.size);
654     st->hash->final(hst,hash);
655     sig=st->privkey->sign(st->privkey->st,hash,st->hash->len);
656     buf_append_string(&st->buffer,sig);
657     free(sig);
658     free(hash);
659     return True;
660 }
661
662 static bool_t unpick_name(struct buffer_if *msg, struct parsedname *nm)
663 {
664     CHECK_AVAIL(msg,2);
665     nm->len=buf_unprepend_uint16(msg);
666     CHECK_AVAIL(msg,nm->len);
667     nm->name=buf_unprepend(msg,nm->len);
668     uint8_t *nul=memchr(nm->name,0,nm->len);
669     if (!nul) {
670         buffer_readonly_view(&nm->extrainfo,0,0);
671     } else {
672         buffer_readonly_view(&nm->extrainfo, nul+1, msg->start-(nul+1));
673         nm->len=nul-nm->name;
674     }
675     return True;
676 }
677
678 static bool_t unpick_msg(struct site *st, uint32_t type,
679                          struct buffer_if *msg, struct msg *m)
680 {
681     m->capab_transformnum=-1;
682     m->hashstart=msg->start;
683     CHECK_AVAIL(msg,4);
684     m->dest=buf_unprepend_uint32(msg);
685     CHECK_AVAIL(msg,4);
686     m->source=buf_unprepend_uint32(msg);
687     CHECK_TYPE(msg,type);
688     if (!unpick_name(msg,&m->remote)) return False;
689     m->remote_capabilities=0;
690     m->remote_mtu=0;
691     if (m->remote.extrainfo.size) {
692         CHECK_AVAIL(&m->remote.extrainfo,4);
693         m->remote_capabilities=buf_unprepend_uint32(&m->remote.extrainfo);
694     }
695     if (type_is_msg34(type) && m->remote.extrainfo.size) {
696         CHECK_AVAIL(&m->remote.extrainfo,2);
697         m->remote_mtu=buf_unprepend_uint16(&m->remote.extrainfo);
698     }
699     if (!unpick_name(msg,&m->local)) return False;
700     if (type==LABEL_PROD) {
701         CHECK_EMPTY(msg);
702         return True;
703     }
704     CHECK_AVAIL(msg,NONCELEN);
705     m->nR=buf_unprepend(msg,NONCELEN);
706     if (type==LABEL_MSG1) {
707         CHECK_EMPTY(msg);
708         return True;
709     }
710     CHECK_AVAIL(msg,NONCELEN);
711     m->nL=buf_unprepend(msg,NONCELEN);
712     if (type==LABEL_MSG2) {
713         CHECK_EMPTY(msg);
714         return True;
715     }
716     if (type==LABEL_MSG3BIS) {
717         CHECK_AVAIL(msg,1);
718         m->capab_transformnum = buf_unprepend_uint8(msg);
719     } else {
720         m->capab_transformnum = CAPAB_TRANSFORMNUM_ANCIENT;
721     }
722     CHECK_AVAIL(msg,2);
723     m->pklen=buf_unprepend_uint16(msg);
724     CHECK_AVAIL(msg,m->pklen);
725     m->pk=buf_unprepend(msg,m->pklen);
726     m->hashlen=msg->start-m->hashstart;
727     CHECK_AVAIL(msg,2);
728     m->siglen=buf_unprepend_uint16(msg);
729     CHECK_AVAIL(msg,m->siglen);
730     m->sig=buf_unprepend(msg,m->siglen);
731     CHECK_EMPTY(msg);
732
733     /* In `process_msg3_msg4' below, we assume that we can write a nul
734      * terminator following the signature.  Make sure there's enough space.
735      */
736     if (msg->start >= msg->base + msg->alloclen)
737         return False;
738
739     return True;
740 }
741
742 static bool_t name_matches(const struct parsedname *nm, const char *expected)
743 {
744     int expected_len=strlen(expected);
745     return
746         nm->len == expected_len &&
747         !memcmp(nm->name, expected, expected_len);
748 }    
749
750 static bool_t check_msg(struct site *st, uint32_t type, struct msg *m,
751                         cstring_t *error)
752 {
753     if (type==LABEL_MSG1) return True;
754
755     /* Check that the site names and our nonce have been sent
756        back correctly, and then store our peer's nonce. */ 
757     if (!name_matches(&m->remote,st->remotename)) {
758         *error="wrong remote site name";
759         return False;
760     }
761     if (!name_matches(&m->local,st->localname)) {
762         *error="wrong local site name";
763         return False;
764     }
765     if (memcmp(m->nL,st->localN,NONCELEN)!=0) {
766         *error="wrong locally-generated nonce";
767         return False;
768     }
769     if (type==LABEL_MSG2) return True;
770     if (!consttime_memeq(m->nR,st->remoteN,NONCELEN)) {
771         *error="wrong remotely-generated nonce";
772         return False;
773     }
774     /* MSG3 has complicated rules about capabilities, which are
775      * handled in process_msg3. */
776     if (type==LABEL_MSG3 || type==LABEL_MSG3BIS) return True;
777     if (m->remote_capabilities!=st->remote_capabilities) {
778         *error="remote capabilities changed";
779         return False;
780     }
781     if (type==LABEL_MSG4) return True;
782     *error="unknown message type";
783     return False;
784 }
785
786 static bool_t generate_msg1(struct site *st)
787 {
788     st->random->generate(st->random->st,NONCELEN,st->localN);
789     return generate_msg(st,LABEL_MSG1,"site:MSG1");
790 }
791
792 static bool_t process_msg1(struct site *st, struct buffer_if *msg1,
793                            const struct comm_addr *src, struct msg *m)
794 {
795     /* We've already determined we're in an appropriate state to
796        process an incoming MSG1, and that the MSG1 has correct values
797        of A and B. */
798
799     st->setup_session_id=m->source;
800     st->remote_capabilities=m->remote_capabilities;
801     memcpy(st->remoteN,m->nR,NONCELEN);
802     return True;
803 }
804
805 static bool_t generate_msg2(struct site *st)
806 {
807     st->random->generate(st->random->st,NONCELEN,st->localN);
808     return generate_msg(st,LABEL_MSG2,"site:MSG2");
809 }
810
811 static bool_t process_msg2(struct site *st, struct buffer_if *msg2,
812                            const struct comm_addr *src)
813 {
814     struct msg m;
815     cstring_t err;
816
817     if (!unpick_msg(st,LABEL_MSG2,msg2,&m)) return False;
818     if (!check_msg(st,LABEL_MSG2,&m,&err)) {
819         slog(st,LOG_SEC,"msg2: %s",err);
820         return False;
821     }
822     st->setup_session_id=m.source;
823     st->remote_capabilities=m.remote_capabilities;
824
825     /* Select the transform to use */
826
827     uint32_t remote_transforms = st->remote_capabilities & CAPAB_TRANSFORM_MASK;
828     if (!remote_transforms)
829         /* old secnets only had this one transform */
830         remote_transforms = 1UL << CAPAB_TRANSFORMNUM_ANCIENT;
831
832     struct transform_if *ti;
833     int i;
834     for (i=0; i<st->ntransforms; i++) {
835         ti=st->transforms[i];
836         if ((1UL << ti->capab_transformnum) & remote_transforms)
837             goto transform_found;
838     }
839     slog(st,LOG_ERROR,"no transforms in common"
840          " (us %#"PRIx32"; them: %#"PRIx32")",
841          st->local_capabilities & CAPAB_TRANSFORM_MASK,
842          remote_transforms);
843     return False;
844  transform_found:
845     st->chosen_transform=ti;
846
847     memcpy(st->remoteN,m.nR,NONCELEN);
848     return True;
849 }
850
851 static bool_t generate_msg3(struct site *st)
852 {
853     /* Now we have our nonce and their nonce. Think of a secret key,
854        and create message number 3. */
855     st->random->generate(st->random->st,st->dh->len,st->dhsecret);
856     return generate_msg(st,
857                         (st->remote_capabilities & CAPAB_TRANSFORM_MASK
858                          ? LABEL_MSG3BIS : LABEL_MSG3),
859                         "site:MSG3");
860 }
861
862 static bool_t process_msg3_msg4(struct site *st, struct msg *m)
863 {
864     uint8_t *hash;
865     void *hst;
866
867     /* Check signature and store g^x mod m */
868     hash=safe_malloc(st->hash->len, "process_msg3_msg4");
869     hst=st->hash->init();
870     st->hash->update(hst,m->hashstart,m->hashlen);
871     st->hash->final(hst,hash);
872     /* Terminate signature with a '0' - already checked that this will fit */
873     m->sig[m->siglen]=0;
874     if (!st->pubkey->check(st->pubkey->st,hash,st->hash->len,m->sig)) {
875         slog(st,LOG_SEC,"msg3/msg4 signature failed check!");
876         free(hash);
877         return False;
878     }
879     free(hash);
880
881     st->remote_adv_mtu=m->remote_mtu;
882
883     return True;
884 }
885
886 static bool_t process_msg3(struct site *st, struct buffer_if *msg3,
887                            const struct comm_addr *src, uint32_t msgtype)
888 {
889     struct msg m;
890     cstring_t err;
891
892     assert(msgtype==LABEL_MSG3 || msgtype==LABEL_MSG3BIS);
893
894     if (!unpick_msg(st,msgtype,msg3,&m)) return False;
895     if (!check_msg(st,msgtype,&m,&err)) {
896         slog(st,LOG_SEC,"msg3: %s",err);
897         return False;
898     }
899     uint32_t capab_adv_late = m.remote_capabilities
900         & ~st->remote_capabilities & CAPAB_EARLY;
901     if (capab_adv_late) {
902         slog(st,LOG_SEC,"msg3 impermissibly adds early capability flag(s)"
903              " %#"PRIx32" (was %#"PRIx32", now %#"PRIx32")",
904              capab_adv_late, st->remote_capabilities, m.remote_capabilities);
905         return False;
906     }
907     st->remote_capabilities|=m.remote_capabilities;
908
909     struct transform_if *ti;
910     int i;
911     for (i=0; i<st->ntransforms; i++) {
912         ti=st->transforms[i];
913         if (ti->capab_transformnum == m.capab_transformnum)
914             goto transform_found;
915     }
916     slog(st,LOG_SEC,"peer chose unknown-to-us transform %d!",
917          m.capab_transformnum);
918     return False;
919  transform_found:
920     st->chosen_transform=ti;
921
922     if (!process_msg3_msg4(st,&m))
923         return False;
924
925     /* Terminate their DH public key with a '0' */
926     m.pk[m.pklen]=0;
927     /* Invent our DH secret key */
928     st->random->generate(st->random->st,st->dh->len,st->dhsecret);
929
930     /* Generate the shared key and set up the transform */
931     if (!set_new_transform(st,m.pk)) return False;
932
933     return True;
934 }
935
936 static bool_t generate_msg4(struct site *st)
937 {
938     /* We have both nonces, their public key and our private key. Generate
939        our public key, sign it and send it to them. */
940     return generate_msg(st,LABEL_MSG4,"site:MSG4");
941 }
942
943 static bool_t process_msg4(struct site *st, struct buffer_if *msg4,
944                            const struct comm_addr *src)
945 {
946     struct msg m;
947     cstring_t err;
948
949     if (!unpick_msg(st,LABEL_MSG4,msg4,&m)) return False;
950     if (!check_msg(st,LABEL_MSG4,&m,&err)) {
951         slog(st,LOG_SEC,"msg4: %s",err);
952         return False;
953     }
954     
955     if (!process_msg3_msg4(st,&m))
956         return False;
957
958     /* Terminate their DH public key with a '0' */
959     m.pk[m.pklen]=0;
960
961     /* Generate the shared key and set up the transform */
962     if (!set_new_transform(st,m.pk)) return False;
963
964     return True;
965 }
966
967 struct msg0 {
968     uint32_t dest;
969     uint32_t source;
970     uint32_t type;
971 };
972
973 static bool_t unpick_msg0(struct site *st, struct buffer_if *msg0,
974                           struct msg0 *m)
975 {
976     CHECK_AVAIL(msg0,4);
977     m->dest=buf_unprepend_uint32(msg0);
978     CHECK_AVAIL(msg0,4);
979     m->source=buf_unprepend_uint32(msg0);
980     CHECK_AVAIL(msg0,4);
981     m->type=buf_unprepend_uint32(msg0);
982     return True;
983     /* Leaves transformed part of buffer untouched */
984 }
985
986 static bool_t generate_msg5(struct site *st)
987 {
988     cstring_t transform_err;
989
990     BUF_ALLOC(&st->buffer,"site:MSG5");
991     /* We are going to add four words to the message */
992     buffer_init(&st->buffer,calculate_max_start_pad());
993     /* Give the netlink code an opportunity to put its own stuff in the
994        message (configuration information, etc.) */
995     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
996     if (call_transform_forwards(st,st->new_transform,
997                                 &st->buffer,&transform_err))
998         return False;
999     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
1000     buf_prepend_uint32(&st->buffer,st->index);
1001     buf_prepend_uint32(&st->buffer,st->setup_session_id);
1002
1003     st->retries=st->setup_retries;
1004     return True;
1005 }
1006
1007 static bool_t process_msg5(struct site *st, struct buffer_if *msg5,
1008                            const struct comm_addr *src,
1009                            struct transform_inst_if *transform)
1010 {
1011     struct msg0 m;
1012     cstring_t transform_err;
1013
1014     if (!unpick_msg0(st,msg5,&m)) return False;
1015
1016     if (call_transform_reverse(st,transform,msg5,&transform_err)) {
1017         /* There's a problem */
1018         slog(st,LOG_SEC,"process_msg5: transform: %s",transform_err);
1019         return False;
1020     }
1021     /* Buffer should now contain untransformed PING packet data */
1022     CHECK_AVAIL(msg5,4);
1023     if (buf_unprepend_uint32(msg5)!=LABEL_MSG5) {
1024         slog(st,LOG_SEC,"MSG5/PING packet contained wrong label");
1025         return False;
1026     }
1027     /* Older versions of secnet used to write some config data here
1028      * which we ignore.  So we don't CHECK_EMPTY */
1029     return True;
1030 }
1031
1032 static void create_msg6(struct site *st, struct transform_inst_if *transform,
1033                         uint32_t session_id)
1034 {
1035     cstring_t transform_err;
1036
1037     BUF_ALLOC(&st->buffer,"site:MSG6");
1038     /* We are going to add four words to the message */
1039     buffer_init(&st->buffer,calculate_max_start_pad());
1040     /* Give the netlink code an opportunity to put its own stuff in the
1041        message (configuration information, etc.) */
1042     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1043     transform_apply_return problem =
1044         call_transform_forwards(st,transform,
1045                                 &st->buffer,&transform_err);
1046     assert(!problem);
1047     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1048     buf_prepend_uint32(&st->buffer,st->index);
1049     buf_prepend_uint32(&st->buffer,session_id);
1050 }
1051
1052 static bool_t generate_msg6(struct site *st)
1053 {
1054     if (!is_transform_valid(st->new_transform))
1055         return False;
1056     create_msg6(st,st->new_transform,st->setup_session_id);
1057     st->retries=1; /* Peer will retransmit MSG5 if this packet gets lost */
1058     return True;
1059 }
1060
1061 static bool_t process_msg6(struct site *st, struct buffer_if *msg6,
1062                            const struct comm_addr *src)
1063 {
1064     struct msg0 m;
1065     cstring_t transform_err;
1066
1067     if (!unpick_msg0(st,msg6,&m)) return False;
1068
1069     if (call_transform_reverse(st,st->new_transform,msg6,&transform_err)) {
1070         /* There's a problem */
1071         slog(st,LOG_SEC,"process_msg6: transform: %s",transform_err);
1072         return False;
1073     }
1074     /* Buffer should now contain untransformed PING packet data */
1075     CHECK_AVAIL(msg6,4);
1076     if (buf_unprepend_uint32(msg6)!=LABEL_MSG6) {
1077         slog(st,LOG_SEC,"MSG6/PONG packet contained invalid data");
1078         return False;
1079     }
1080     /* Older versions of secnet used to write some config data here
1081      * which we ignore.  So we don't CHECK_EMPTY */
1082     return True;
1083 }
1084
1085 static transform_apply_return
1086 decrypt_msg0(struct site *st, struct buffer_if *msg0,
1087                            const struct comm_addr *src)
1088 {
1089     cstring_t transform_err, auxkey_err, newkey_err="n/a";
1090     struct msg0 m;
1091     transform_apply_return problem;
1092
1093     if (!unpick_msg0(st,msg0,&m)) return False;
1094
1095     /* Keep a copy so we can try decrypting it with multiple keys */
1096     buffer_copy(&st->scratch, msg0);
1097
1098     problem = call_transform_reverse(st,st->current.transform,
1099                                      msg0,&transform_err);
1100     if (!problem) {
1101         if (!st->auxiliary_is_new)
1102             delete_one_key(st,&st->auxiliary_key,
1103                            "peer has used new key","auxiliary key",LOG_SEC);
1104         return 0;
1105     }
1106     if (transform_apply_return_badseq(problem))
1107         goto badseq;
1108
1109     buffer_copy(msg0, &st->scratch);
1110     problem = call_transform_reverse(st,st->auxiliary_key.transform,
1111                                      msg0,&auxkey_err);
1112     if (!problem) {
1113         slog(st,LOG_DROP,"processing packet which uses auxiliary key");
1114         if (st->auxiliary_is_new) {
1115             /* We previously timed out in state SENTMSG5 but it turns
1116              * out that our peer did in fact get our MSG5 and is
1117              * using the new key.  So we should switch to it too. */
1118             /* This is a bit like activate_new_key. */
1119             struct data_key t;
1120             t=st->current;
1121             st->current=st->auxiliary_key;
1122             st->auxiliary_key=t;
1123
1124             delete_one_key(st,&st->auxiliary_key,"peer has used new key",
1125                            "previous key",LOG_SEC);
1126             st->auxiliary_is_new=0;
1127             st->renegotiate_key_time=st->auxiliary_renegotiate_key_time;
1128         }
1129         return 0;
1130     }
1131     if (transform_apply_return_badseq(problem))
1132         goto badseq;
1133
1134     if (st->state==SITE_SENTMSG5) {
1135         buffer_copy(msg0, &st->scratch);
1136         problem = call_transform_reverse(st,st->new_transform,
1137                                          msg0,&newkey_err);
1138         if (!problem) {
1139             /* It looks like we didn't get the peer's MSG6 */
1140             /* This is like a cut-down enter_new_state(SITE_RUN) */
1141             slog(st,LOG_STATE,"will enter state RUN (MSG0 with new key)");
1142             BUF_FREE(&st->buffer);
1143             st->timeout=0;
1144             activate_new_key(st);
1145             return 0; /* do process the data in this packet */
1146         }
1147         if (transform_apply_return_badseq(problem))
1148             goto badseq;
1149     }
1150
1151     slog(st,LOG_SEC,"transform: %s (aux: %s, new: %s)",
1152          transform_err,auxkey_err,newkey_err);
1153     initiate_key_setup(st,"incoming message would not decrypt",0);
1154     send_nak(src,m.dest,m.source,m.type,msg0,"message would not decrypt");
1155     assert(problem);
1156     return problem;
1157
1158  badseq:
1159     slog(st,LOG_DROP,"transform: %s (bad seq.)",transform_err);
1160     assert(problem);
1161     return problem;
1162 }
1163
1164 static bool_t process_msg0(struct site *st, struct buffer_if *msg0,
1165                            const struct comm_addr *src)
1166 {
1167     uint32_t type;
1168     transform_apply_return problem;
1169
1170     problem = decrypt_msg0(st,msg0,src);
1171     if (problem==transform_apply_seqdupe) {
1172         /* We recently received another copy of this packet, maybe due
1173          * to polypath.  That's not a problem; indeed, for the
1174          * purposes of transport address management it is a success.
1175          * But we don't want to process the packet. */
1176         transport_data_msgok(st,src);
1177         return False;
1178     }
1179     if (problem)
1180         return False;
1181
1182     CHECK_AVAIL(msg0,4);
1183     type=buf_unprepend_uint32(msg0);
1184     switch(type) {
1185     case LABEL_MSG7:
1186         /* We must forget about the current session. */
1187         delete_keys(st,"request from peer",LOG_SEC);
1188         /* probably, the peer is shutting down, and this is going to fail,
1189          * but we need to be trying to bring the link up again */
1190         if (st->keepalive)
1191             initiate_key_setup(st,"peer requested key teardown",0);
1192         return True;
1193     case LABEL_MSG9:
1194         /* Deliver to netlink layer */
1195         st->netlink->deliver(st->netlink->st,msg0);
1196         transport_data_msgok(st,src);
1197         /* See whether we should start negotiating a new key */
1198         if (st->now > st->renegotiate_key_time)
1199             initiate_key_setup(st,"incoming packet in renegotiation window",0);
1200         return True;
1201     default:
1202         slog(st,LOG_SEC,"incoming encrypted message of type %08x "
1203              "(unknown)",type);
1204         break;
1205     }
1206     return False;
1207 }
1208
1209 static void dump_packet(struct site *st, struct buffer_if *buf,
1210                         const struct comm_addr *addr, bool_t incoming,
1211                         bool_t ok)
1212 {
1213     uint32_t dest=get_uint32(buf->start);
1214     uint32_t source=get_uint32(buf->start+4);
1215     uint32_t msgtype=get_uint32(buf->start+8);
1216
1217     if (st->log_events & LOG_DUMP)
1218         slilog(st->log,M_DEBUG,"%s: %s: %08x<-%08x: %08x: %s%s",
1219                st->tunname,incoming?"incoming":"outgoing",
1220                dest,source,msgtype,comm_addr_to_string(addr),
1221                ok?"":" - fail");
1222 }
1223
1224 static bool_t comm_addr_sendmsg(struct site *st,
1225                                 const struct comm_addr *dest,
1226                                 struct buffer_if *buf)
1227 {
1228     int i;
1229     struct comm_clientinfo *commclientinfo = 0;
1230
1231     for (i=0; i < st->ncomms; i++) {
1232         if (st->comms[i] == dest->comm) {
1233             commclientinfo = st->commclientinfos[i];
1234             break;
1235         }
1236     }
1237     return dest->comm->sendmsg(dest->comm->st, buf, dest, commclientinfo);
1238 }
1239
1240 static uint32_t site_status(void *st)
1241 {
1242     return 0;
1243 }
1244
1245 static bool_t send_msg(struct site *st)
1246 {
1247     if (st->retries>0) {
1248         transport_xmit(st, &st->setup_peers, &st->buffer, True);
1249         st->timeout=st->now+st->setup_retry_interval;
1250         st->retries--;
1251         return True;
1252     } else if (st->state==SITE_SENTMSG5) {
1253         logtimeout(st,"timed out sending MSG5, stashing new key");
1254         /* We stash the key we have produced, in case it turns out that
1255          * our peer did see our MSG5 after all and starts using it. */
1256         /* This is a bit like some of activate_new_key */
1257         struct transform_inst_if *t;
1258         t=st->auxiliary_key.transform;
1259         st->auxiliary_key.transform=st->new_transform;
1260         st->new_transform=t;
1261         dispose_transform(&st->new_transform);
1262
1263         st->auxiliary_is_new=1;
1264         st->auxiliary_key.key_timeout=st->now+st->key_lifetime;
1265         st->auxiliary_renegotiate_key_time=st->now+st->key_renegotiate_time;
1266         st->auxiliary_key.remote_session_id=st->setup_session_id;
1267
1268         enter_state_wait(st);
1269         return False;
1270     } else {
1271         logtimeout(st,"timed out sending key setup packet "
1272             "(in state %s)",state_name(st->state));
1273         enter_state_wait(st);
1274         return False;
1275     }
1276 }
1277
1278 static void site_resolve_callback(void *sst, const struct comm_addr *addrs,
1279                                   int stored_naddrs, int all_naddrs,
1280                                   const char *address, const char *failwhy)
1281 {
1282     struct site *st=sst;
1283
1284     if (!stored_naddrs) {
1285         slog(st,LOG_ERROR,"resolution of %s failed: %s",address,failwhy);
1286     } else {
1287         slog(st,LOG_PEER_ADDRS,"resolution of %s completed, %d addrs, eg: %s",
1288              address, all_naddrs, comm_addr_to_string(&addrs[0]));;
1289
1290         int space=st->transport_peers_max-st->resolving_n_results_stored;
1291         int n_tocopy=MIN(stored_naddrs,space);
1292         COPY_ARRAY(st->resolving_results + st->resolving_n_results_stored,
1293                    addrs,
1294                    n_tocopy);
1295         st->resolving_n_results_stored += n_tocopy;
1296         st->resolving_n_results_all += all_naddrs;
1297     }
1298
1299     decrement_resolving_count(st,1);
1300 }
1301
1302 static void decrement_resolving_count(struct site *st, int by)
1303 {
1304     assert(st->resolving_count>0);
1305     st->resolving_count-=by;
1306
1307     if (st->resolving_count)
1308         return;
1309
1310     /* OK, we are done with them all.  Handle combined results. */
1311
1312     const struct comm_addr *addrs=st->resolving_results;
1313     int naddrs=st->resolving_n_results_stored;
1314     assert(naddrs<=st->transport_peers_max);
1315
1316     if (naddrs) {
1317         if (naddrs != st->resolving_n_results_all) {
1318             slog(st,LOG_SETUP_INIT,"resolution of supplied addresses/names"
1319                  " yielded too many results (%d > %d), some ignored",
1320                  st->resolving_n_results_all, naddrs);
1321         }
1322         slog(st,LOG_STATE,"resolution completed, %d addrs, eg: %s",
1323              naddrs, iaddr_to_string(&addrs[0].ia));;
1324     }
1325
1326     switch (st->state) {
1327     case SITE_RESOLVE:
1328         if (transport_compute_setupinit_peers(st,addrs,naddrs,0)) {
1329             enter_new_state(st,SITE_SENTMSG1);
1330         } else {
1331             /* Can't figure out who to try to to talk to */
1332             slog(st,LOG_SETUP_INIT,
1333                  "key exchange failed: cannot find peer address");
1334             enter_state_run(st);
1335         }
1336         break;
1337     case SITE_SENTMSG1: case SITE_SENTMSG2:
1338     case SITE_SENTMSG3: case SITE_SENTMSG4:
1339     case SITE_SENTMSG5:
1340         if (naddrs) {
1341             /* We start using the address immediately for data too.
1342              * It's best to store it in st->peers now because we might
1343              * go via SENTMSG5, WAIT, and a MSG0, straight into using
1344              * the new key (without updating the data peer addrs). */
1345             transport_resolve_complete(st,addrs,naddrs);
1346         } else if (st->local_mobile) {
1347             /* We can't let this rest because we may have a peer
1348              * address which will break in the future. */
1349             slog(st,LOG_SETUP_INIT,"resolution failed: "
1350                  "abandoning key exchange");
1351             enter_state_wait(st);
1352         } else {
1353             slog(st,LOG_SETUP_INIT,"resolution failed: "
1354                  " continuing to use source address of peer's packets"
1355                  " for key exchange and ultimately data");
1356         }
1357         break;
1358     case SITE_RUN:
1359         if (naddrs) {
1360             slog(st,LOG_SETUP_INIT,"resolution completed tardily,"
1361                  " updating peer address(es)");
1362             transport_resolve_complete_tardy(st,addrs,naddrs);
1363         } else if (st->local_mobile) {
1364             /* Not very good.  We should queue (another) renegotiation
1365              * so that we can update the peer address. */
1366             st->key_renegotiate_time=st->now+wait_timeout(st);
1367         } else {
1368             slog(st,LOG_SETUP_INIT,"resolution failed: "
1369                  " continuing to use source address of peer's packets");
1370         }
1371         break;
1372     case SITE_WAIT:
1373     case SITE_STOP:
1374         /* oh well */
1375         break;
1376     }
1377 }
1378
1379 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
1380                                  const struct comm_addr *prod_hint)
1381 {
1382     /* Reentrancy hazard: can call enter_new_state/enter_state_* */
1383     if (st->state!=SITE_RUN) return False;
1384     slog(st,LOG_SETUP_INIT,"initiating key exchange (%s)",reason);
1385     if (st->addresses) {
1386         slog(st,LOG_SETUP_INIT,"resolving peer address(es)");
1387         return enter_state_resolve(st);
1388     } else if (transport_compute_setupinit_peers(st,0,0,prod_hint)) {
1389         return enter_new_state(st,SITE_SENTMSG1);
1390     }
1391     slog(st,LOG_SETUP_INIT,"key exchange failed: no address for peer");
1392     return False;
1393 }
1394
1395 static void activate_new_key(struct site *st)
1396 {
1397     struct transform_inst_if *t;
1398
1399     /* We have three transform instances, which we swap between old,
1400        active and setup */
1401     t=st->auxiliary_key.transform;
1402     st->auxiliary_key.transform=st->current.transform;
1403     st->current.transform=st->new_transform;
1404     st->new_transform=t;
1405     dispose_transform(&st->new_transform);
1406
1407     st->timeout=0;
1408     st->auxiliary_is_new=0;
1409     st->auxiliary_key.key_timeout=st->current.key_timeout;
1410     st->current.key_timeout=st->now+st->key_lifetime;
1411     st->renegotiate_key_time=st->now+st->key_renegotiate_time;
1412     transport_peers_copy(st,&st->peers,&st->setup_peers);
1413     st->current.remote_session_id=st->setup_session_id;
1414
1415     /* Compute the inter-site MTU.  This is min( our_mtu, their_mtu ).
1416      * But their mtu be unspecified, in which case we just use ours. */
1417     uint32_t intersite_mtu=
1418         MIN(st->mtu_target, st->remote_adv_mtu ?: ~(uint32_t)0);
1419     st->netlink->set_mtu(st->netlink->st,intersite_mtu);
1420
1421     slog(st,LOG_ACTIVATE_KEY,"new key activated"
1422          " (mtu ours=%"PRId32" theirs=%"PRId32" intersite=%"PRId32")",
1423          st->mtu_target, st->remote_adv_mtu, intersite_mtu);
1424     enter_state_run(st);
1425 }
1426
1427 static void delete_one_key(struct site *st, struct data_key *key,
1428                            cstring_t reason, cstring_t which, uint32_t loglevel)
1429 {
1430     if (!is_transform_valid(key->transform)) return;
1431     if (reason) slog(st,loglevel,"%s deleted (%s)",which,reason);
1432     dispose_transform(&key->transform);
1433     key->key_timeout=0;
1434 }
1435
1436 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel)
1437 {
1438     if (current_valid(st)) {
1439         slog(st,loglevel,"session closed (%s)",reason);
1440
1441         delete_one_key(st,&st->current,0,0,0);
1442         set_link_quality(st);
1443     }
1444     delete_one_key(st,&st->auxiliary_key,0,0,0);
1445 }
1446
1447 static void state_assert(struct site *st, bool_t ok)
1448 {
1449     if (!ok) fatal("site:state_assert");
1450 }
1451
1452 static void enter_state_stop(struct site *st)
1453 {
1454     st->state=SITE_STOP;
1455     st->timeout=0;
1456     delete_keys(st,"entering state STOP",LOG_TIMEOUT_KEY);
1457     dispose_transform(&st->new_transform);
1458 }
1459
1460 static void set_link_quality(struct site *st)
1461 {
1462     uint32_t quality;
1463     if (current_valid(st))
1464         quality=LINK_QUALITY_UP;
1465     else if (st->state==SITE_WAIT || st->state==SITE_STOP)
1466         quality=LINK_QUALITY_DOWN;
1467     else if (st->addresses)
1468         quality=LINK_QUALITY_DOWN_CURRENT_ADDRESS;
1469     else if (transport_peers_valid(&st->peers))
1470         quality=LINK_QUALITY_DOWN_STALE_ADDRESS;
1471     else
1472         quality=LINK_QUALITY_DOWN;
1473
1474     st->netlink->set_quality(st->netlink->st,quality);
1475 }
1476
1477 static void enter_state_run(struct site *st)
1478 {
1479     slog(st,LOG_STATE,"entering state RUN%s",
1480          current_valid(st) ? " (keyed)" : " (unkeyed)");
1481     st->state=SITE_RUN;
1482     st->timeout=0;
1483
1484     st->setup_session_id=0;
1485     transport_peers_clear(st,&st->setup_peers);
1486     FILLZERO(st->localN);
1487     FILLZERO(st->remoteN);
1488     dispose_transform(&st->new_transform);
1489     memset(st->dhsecret,0,st->dh->len);
1490     if (st->sharedsecret) memset(st->sharedsecret,0,st->sharedsecretlen);
1491     set_link_quality(st);
1492
1493     if (st->keepalive && !current_valid(st))
1494         initiate_key_setup(st, "keepalive", 0);
1495 }
1496
1497 static bool_t ensure_resolving(struct site *st)
1498 {
1499     /* Reentrancy hazard: may call site_resolve_callback and hence
1500      * enter_new_state, enter_state_* and generate_msg*. */
1501     if (st->resolving_count)
1502         return True;
1503
1504     assert(st->addresses);
1505
1506     /* resolver->request might reentrantly call site_resolve_callback
1507      * which will decrement st->resolving, so we need to increment it
1508      * twice beforehand to prevent decrement from thinking we're
1509      * finished, and decrement it ourselves.  Alternatively if
1510      * everything fails then there are no callbacks due and we simply
1511      * set it to 0 and return false.. */
1512     st->resolving_n_results_stored=0;
1513     st->resolving_n_results_all=0;
1514     st->resolving_count+=2;
1515     const char **addrp=st->addresses;
1516     const char *address;
1517     bool_t anyok=False;
1518     for (; (address=*addrp++); ) {
1519         bool_t ok = st->resolver->request(st->resolver->st,address,
1520                                           st->remoteport,st->comms[0],
1521                                           site_resolve_callback,st);
1522         if (ok)
1523             st->resolving_count++;
1524         anyok|=ok;
1525     }
1526     if (!anyok) {
1527         st->resolving_count=0;
1528         return False;
1529     }
1530     decrement_resolving_count(st,2);
1531     return True;
1532 }
1533
1534 static bool_t enter_state_resolve(struct site *st)
1535 {
1536     /* Reentrancy hazard!  See ensure_resolving. */
1537     state_assert(st,st->state==SITE_RUN);
1538     slog(st,LOG_STATE,"entering state RESOLVE");
1539     st->state=SITE_RESOLVE;
1540     return ensure_resolving(st);
1541 }
1542
1543 static bool_t enter_new_state(struct site *st, uint32_t next)
1544 {
1545     bool_t (*gen)(struct site *st);
1546     int r;
1547
1548     slog(st,LOG_STATE,"entering state %s",state_name(next));
1549     switch(next) {
1550     case SITE_SENTMSG1:
1551         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE);
1552         gen=generate_msg1;
1553         st->msg1_crossed_logged = False;
1554         break;
1555     case SITE_SENTMSG2:
1556         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1557                      st->state==SITE_SENTMSG1 || st->state==SITE_WAIT);
1558         gen=generate_msg2;
1559         break;
1560     case SITE_SENTMSG3:
1561         state_assert(st,st->state==SITE_SENTMSG1);
1562         BUF_FREE(&st->buffer);
1563         gen=generate_msg3;
1564         break;
1565     case SITE_SENTMSG4:
1566         state_assert(st,st->state==SITE_SENTMSG2);
1567         BUF_FREE(&st->buffer);
1568         gen=generate_msg4;
1569         break;
1570     case SITE_SENTMSG5:
1571         state_assert(st,st->state==SITE_SENTMSG3);
1572         BUF_FREE(&st->buffer);
1573         gen=generate_msg5;
1574         break;
1575     case SITE_RUN:
1576         state_assert(st,st->state==SITE_SENTMSG4);
1577         BUF_FREE(&st->buffer);
1578         gen=generate_msg6;
1579         break;
1580     default:
1581         gen=NULL;
1582         fatal("enter_new_state(%s): invalid new state",state_name(next));
1583         break;
1584     }
1585
1586     if (hacky_par_start_failnow()) return False;
1587
1588     r= gen(st) && send_msg(st);
1589
1590     hacky_par_end(&r,
1591                   st->setup_retries, st->setup_retry_interval,
1592                   send_msg, st);
1593     
1594     if (r) {
1595         st->state=next;
1596         if (next==SITE_RUN) {
1597             BUF_FREE(&st->buffer); /* Never reused */
1598             st->timeout=0; /* Never retransmit */
1599             activate_new_key(st);
1600         }
1601         return True;
1602     }
1603     slog(st,LOG_ERROR,"error entering state %s",state_name(next));
1604     st->buffer.free=False; /* Unconditionally use the buffer; it may be
1605                               in either state, and enter_state_wait() will
1606                               do a BUF_FREE() */
1607     enter_state_wait(st);
1608     return False;
1609 }
1610
1611 /* msg7 tells our peer that we're about to forget our key */
1612 static bool_t send_msg7(struct site *st, cstring_t reason)
1613 {
1614     cstring_t transform_err;
1615
1616     if (current_valid(st) && st->buffer.free
1617         && transport_peers_valid(&st->peers)) {
1618         BUF_ALLOC(&st->buffer,"site:MSG7");
1619         buffer_init(&st->buffer,calculate_max_start_pad());
1620         buf_append_uint32(&st->buffer,LABEL_MSG7);
1621         buf_append_string(&st->buffer,reason);
1622         if (call_transform_forwards(st, st->current.transform,
1623                                     &st->buffer, &transform_err))
1624             goto free_out;
1625         buf_prepend_uint32(&st->buffer,LABEL_MSG0);
1626         buf_prepend_uint32(&st->buffer,st->index);
1627         buf_prepend_uint32(&st->buffer,st->current.remote_session_id);
1628         transport_xmit(st,&st->peers,&st->buffer,True);
1629         BUF_FREE(&st->buffer);
1630     free_out:
1631         return True;
1632     }
1633     return False;
1634 }
1635
1636 /* We go into this state if our peer becomes uncommunicative. Similar to
1637    the "stop" state, we forget all session keys for a while, before
1638    re-entering the "run" state. */
1639 static void enter_state_wait(struct site *st)
1640 {
1641     slog(st,LOG_STATE,"entering state WAIT");
1642     st->timeout=st->now+wait_timeout(st);
1643     st->state=SITE_WAIT;
1644     set_link_quality(st);
1645     BUF_FREE(&st->buffer); /* will have had an outgoing packet in it */
1646     /* XXX Erase keys etc. */
1647 }
1648
1649 static void generate_prod(struct site *st, struct buffer_if *buf)
1650 {
1651     buffer_init(buf,0);
1652     buf_append_uint32(buf,0);
1653     buf_append_uint32(buf,0);
1654     buf_append_uint32(buf,LABEL_PROD);
1655     buf_append_string(buf,st->localname);
1656     buf_append_string(buf,st->remotename);
1657 }
1658
1659 static void generate_send_prod(struct site *st,
1660                                const struct comm_addr *source)
1661 {
1662     if (!st->allow_send_prod) return; /* too soon */
1663     if (!(st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1664           st->state==SITE_WAIT)) return; /* we'd ignore peer's MSG1 */
1665
1666     slog(st,LOG_SETUP_INIT,"prodding peer for key exchange");
1667     st->allow_send_prod=0;
1668     generate_prod(st,&st->scratch);
1669     bool_t ok = comm_addr_sendmsg(st, source, &st->scratch);
1670     dump_packet(st,&st->scratch,source,False,ok);
1671 }
1672
1673 static inline void site_settimeout(uint64_t timeout, int *timeout_io)
1674 {
1675     if (timeout) {
1676         int64_t offset=timeout-*now;
1677         if (offset<0) offset=0;
1678         if (offset>INT_MAX) offset=INT_MAX;
1679         if (*timeout_io<0 || offset<*timeout_io)
1680             *timeout_io=offset;
1681     }
1682 }
1683
1684 static int site_beforepoll(void *sst, struct pollfd *fds, int *nfds_io,
1685                            int *timeout_io)
1686 {
1687     struct site *st=sst;
1688
1689     BEFOREPOLL_WANT_FDS(0); /* We don't use any file descriptors */
1690     st->now=*now;
1691
1692     /* Work out when our next timeout is. The earlier of 'timeout' or
1693        'current.key_timeout'. A stored value of '0' indicates no timeout
1694        active. */
1695     site_settimeout(st->timeout, timeout_io);
1696     site_settimeout(st->current.key_timeout, timeout_io);
1697     site_settimeout(st->auxiliary_key.key_timeout, timeout_io);
1698
1699     return 0; /* success */
1700 }
1701
1702 static void check_expiry(struct site *st, struct data_key *key,
1703                          const char *which)
1704 {
1705     if (key->key_timeout && *now>key->key_timeout) {
1706         delete_one_key(st,key,"maximum life exceeded",which,LOG_TIMEOUT_KEY);
1707     }
1708 }
1709
1710 /* NB site_afterpoll will be called before site_beforepoll is ever called */
1711 static void site_afterpoll(void *sst, struct pollfd *fds, int nfds)
1712 {
1713     struct site *st=sst;
1714
1715     st->now=*now;
1716     if (st->timeout && *now>st->timeout) {
1717         st->timeout=0;
1718         if (st->state>=SITE_SENTMSG1 && st->state<=SITE_SENTMSG5) {
1719             if (!hacky_par_start_failnow())
1720                 send_msg(st);
1721         } else if (st->state==SITE_WAIT) {
1722             enter_state_run(st);
1723         } else {
1724             slog(st,LOG_ERROR,"site_afterpoll: unexpected timeout, state=%d",
1725                  st->state);
1726         }
1727     }
1728     check_expiry(st,&st->current,"current key");
1729     check_expiry(st,&st->auxiliary_key,"auxiliary key");
1730 }
1731
1732 /* This function is called by the netlink device to deliver packets
1733    intended for the remote network. The packet is in "raw" wire
1734    format, but is guaranteed to be word-aligned. */
1735 static void site_outgoing(void *sst, struct buffer_if *buf)
1736 {
1737     struct site *st=sst;
1738     cstring_t transform_err;
1739     
1740     if (st->state==SITE_STOP) {
1741         BUF_FREE(buf);
1742         return;
1743     }
1744
1745     st->allow_send_prod=1;
1746
1747     /* In all other states we consider delivering the packet if we have
1748        a valid key and a valid address to send it to. */
1749     if (current_valid(st) && transport_peers_valid(&st->peers)) {
1750         /* Transform it and send it */
1751         if (buf->size>0) {
1752             buf_prepend_uint32(buf,LABEL_MSG9);
1753             if (call_transform_forwards(st, st->current.transform,
1754                                         buf, &transform_err))
1755                 goto free_out;
1756             buf_prepend_uint32(buf,LABEL_MSG0);
1757             buf_prepend_uint32(buf,st->index);
1758             buf_prepend_uint32(buf,st->current.remote_session_id);
1759             transport_xmit(st,&st->peers,buf,False);
1760         }
1761     free_out:
1762         BUF_FREE(buf);
1763         return;
1764     }
1765
1766     slog(st,LOG_DROP,"discarding outgoing packet of size %d",buf->size);
1767     BUF_FREE(buf);
1768     initiate_key_setup(st,"outgoing packet",0);
1769 }
1770
1771 static bool_t named_for_us(struct site *st, const struct buffer_if *buf_in,
1772                            uint32_t type, struct msg *m)
1773     /* For packets which are identified by the local and remote names.
1774      * If it has our name and our peer's name in it it's for us. */
1775 {
1776     struct buffer_if buf[1];
1777     buffer_readonly_clone(buf,buf_in);
1778     return unpick_msg(st,type,buf,m)
1779         && name_matches(&m->remote,st->remotename)
1780         && name_matches(&m->local,st->localname);
1781 }
1782
1783 static bool_t we_have_priority(struct site *st, const struct msg *m) {
1784     if (st->local_capabilities & m->remote_capabilities &
1785         CAPAB_PRIORITY_MOBILE) {
1786         if (st->local_mobile) return True;
1787         if (st-> peer_mobile) return False;
1788     }
1789     return st->our_name_later;
1790 }
1791
1792 static bool_t setup_late_msg_ok(struct site *st, 
1793                                 const struct buffer_if *buf_in,
1794                                 uint32_t msgtype,
1795                                 const struct comm_addr *source) {
1796     /* For setup packets which seem from their type like they are
1797      * late.  Maybe they came via a different path.  All we do is make
1798      * a note of the sending address, iff they look like they are part
1799      * of the current key setup attempt. */
1800     struct msg m;
1801     if (!named_for_us(st,buf_in,msgtype,&m))
1802         /* named_for_us calls unpick_msg which gets the nonces */
1803         return False;
1804     if (!consttime_memeq(m.nR,st->remoteN,NONCELEN) ||
1805         !consttime_memeq(m.nL,st->localN, NONCELEN))
1806         /* spoof ?  from stale run ?  who knows */
1807         return False;
1808     transport_setup_msgok(st,source);
1809     return True;
1810 }
1811
1812 /* This function is called by the communication device to deliver
1813    packets from our peers.
1814    It should return True if the packet is recognised as being for
1815    this current site instance (and should therefore not be processed
1816    by other sites), even if the packet was otherwise ignored. */
1817 static bool_t site_incoming(void *sst, struct buffer_if *buf,
1818                             const struct comm_addr *source)
1819 {
1820     struct site *st=sst;
1821
1822     if (buf->size < 12) return False;
1823
1824     uint32_t dest=get_uint32(buf->start);
1825     uint32_t msgtype=get_uint32(buf->start+8);
1826     struct msg named_msg;
1827
1828     if (msgtype==LABEL_MSG1) {
1829         if (!named_for_us(st,buf,msgtype,&named_msg))
1830             return False;
1831         /* It's a MSG1 addressed to us. Decide what to do about it. */
1832         dump_packet(st,buf,source,True,True);
1833         if (st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1834             st->state==SITE_WAIT) {
1835             /* We should definitely process it */
1836             transport_compute_setupinit_peers(st,0,0,source);
1837             if (process_msg1(st,buf,source,&named_msg)) {
1838                 slog(st,LOG_SETUP_INIT,"key setup initiated by peer");
1839                 bool_t entered=enter_new_state(st,SITE_SENTMSG2);
1840                 if (entered && st->addresses && st->local_mobile)
1841                     /* We must do this as the very last thing, because
1842                        the resolver callback might reenter us. */
1843                     ensure_resolving(st);
1844             } else {
1845                 slog(st,LOG_ERROR,"failed to process incoming msg1");
1846             }
1847             BUF_FREE(buf);
1848             return True;
1849         } else if (st->state==SITE_SENTMSG1) {
1850             /* We've just sent a message 1! They may have crossed on
1851                the wire. If we have priority then we ignore the
1852                incoming one, otherwise we process it as usual. */
1853             if (we_have_priority(st,&named_msg)) {
1854                 BUF_FREE(buf);
1855                 if (!st->msg1_crossed_logged++)
1856                     slog(st,LOG_SETUP_INIT,"crossed msg1s; we are higher "
1857                          "priority => ignore incoming msg1");
1858                 return True;
1859             } else {
1860                 slog(st,LOG_SETUP_INIT,"crossed msg1s; we are lower "
1861                      "priority => use incoming msg1");
1862                 if (process_msg1(st,buf,source,&named_msg)) {
1863                     BUF_FREE(&st->buffer); /* Free our old message 1 */
1864                     transport_setup_msgok(st,source);
1865                     enter_new_state(st,SITE_SENTMSG2);
1866                 } else {
1867                     slog(st,LOG_ERROR,"failed to process an incoming "
1868                          "crossed msg1 (we have low priority)");
1869                 }
1870                 BUF_FREE(buf);
1871                 return True;
1872             }
1873         } else if (st->state==SITE_SENTMSG2 ||
1874                    st->state==SITE_SENTMSG4) {
1875             if (consttime_memeq(named_msg.nR,st->remoteN,NONCELEN)) {
1876                 /* We are ahead in the protocol, but that msg1 had the
1877                  * peer's nonce so presumably it is from this key
1878                  * exchange run, via a slower route */
1879                 transport_setup_msgok(st,source);
1880             } else {
1881                 slog(st,LOG_UNEXPECTED,"competing incoming message 1");
1882             }
1883             BUF_FREE(buf);
1884             return True;
1885         }
1886         /* The message 1 was received at an unexpected stage of the
1887            key setup.  Well, they lost the race. */
1888         slog(st,LOG_UNEXPECTED,"unexpected incoming message 1");
1889         BUF_FREE(buf);
1890         return True;
1891     }
1892     if (msgtype==LABEL_PROD) {
1893         if (!named_for_us(st,buf,msgtype,&named_msg))
1894             return False;
1895         dump_packet(st,buf,source,True,True);
1896         if (st->state!=SITE_RUN) {
1897             slog(st,LOG_DROP,"ignoring PROD when not in state RUN");
1898         } else if (current_valid(st)) {
1899             slog(st,LOG_DROP,"ignoring PROD when we think we have a key");
1900         } else {
1901             initiate_key_setup(st,"peer sent PROD packet",source);
1902         }
1903         BUF_FREE(buf);
1904         return True;
1905     }
1906     if (dest==st->index) {
1907         /* Explicitly addressed to us */
1908         if (msgtype!=LABEL_MSG0) dump_packet(st,buf,source,True,True);
1909         switch (msgtype) {
1910         case LABEL_NAK:
1911             /* If the source is our current peer then initiate a key setup,
1912                because our peer's forgotten the key */
1913             if (get_uint32(buf->start+4)==st->current.remote_session_id) {
1914                 bool_t initiated;
1915                 initiated = initiate_key_setup(st,"received a NAK",source);
1916                 if (!initiated) generate_send_prod(st,source);
1917             } else {
1918                 slog(st,LOG_SEC,"bad incoming NAK");
1919             }
1920             break;
1921         case LABEL_MSG0:
1922             process_msg0(st,buf,source);
1923             break;
1924         case LABEL_MSG1:
1925             /* Setup packet: should not have been explicitly addressed
1926                to us */
1927             slog(st,LOG_SEC,"incoming explicitly addressed msg1");
1928             break;
1929         case LABEL_MSG2:
1930             /* Setup packet: expected only in state SENTMSG1 */
1931             if (st->state!=SITE_SENTMSG1) {
1932                 if ((st->state==SITE_SENTMSG3 ||
1933                      st->state==SITE_SENTMSG5) &&
1934                     setup_late_msg_ok(st,buf,msgtype,source))
1935                     break;
1936                 slog(st,LOG_UNEXPECTED,"unexpected MSG2");
1937             } else if (process_msg2(st,buf,source)) {
1938                 transport_setup_msgok(st,source);
1939                 enter_new_state(st,SITE_SENTMSG3);
1940             } else {
1941                 slog(st,LOG_SEC,"invalid MSG2");
1942             }
1943             break;
1944         case LABEL_MSG3:
1945         case LABEL_MSG3BIS:
1946             /* Setup packet: expected only in state SENTMSG2 */
1947             if (st->state!=SITE_SENTMSG2) {
1948                 if ((st->state==SITE_SENTMSG4) &&
1949                     setup_late_msg_ok(st,buf,msgtype,source))
1950                     break;
1951                 slog(st,LOG_UNEXPECTED,"unexpected MSG3");
1952             } else if (process_msg3(st,buf,source,msgtype)) {
1953                 transport_setup_msgok(st,source);
1954                 enter_new_state(st,SITE_SENTMSG4);
1955             } else {
1956                 slog(st,LOG_SEC,"invalid MSG3");
1957             }
1958             break;
1959         case LABEL_MSG4:
1960             /* Setup packet: expected only in state SENTMSG3 */
1961             if (st->state!=SITE_SENTMSG3) {
1962                 if ((st->state==SITE_SENTMSG5) &&
1963                     setup_late_msg_ok(st,buf,msgtype,source))
1964                     break;
1965                 slog(st,LOG_UNEXPECTED,"unexpected MSG4");
1966             } else if (process_msg4(st,buf,source)) {
1967                 transport_setup_msgok(st,source);
1968                 enter_new_state(st,SITE_SENTMSG5);
1969             } else {
1970                 slog(st,LOG_SEC,"invalid MSG4");
1971             }
1972             break;
1973         case LABEL_MSG5:
1974             /* Setup packet: expected only in state SENTMSG4 */
1975             /* (may turn up in state RUN if our return MSG6 was lost
1976                and the new key has already been activated. In that
1977                case we discard it. The peer will realise that we
1978                are using the new key when they see our data packets.
1979                Until then the peer's data packets to us get discarded. */
1980             if (st->state==SITE_SENTMSG4) {
1981                 if (process_msg5(st,buf,source,st->new_transform)) {
1982                     transport_setup_msgok(st,source);
1983                     enter_new_state(st,SITE_RUN);
1984                 } else {
1985                     slog(st,LOG_SEC,"invalid MSG5");
1986                 }
1987             } else if (st->state==SITE_RUN) {
1988                 if (process_msg5(st,buf,source,st->current.transform)) {
1989                     slog(st,LOG_DROP,"got MSG5, retransmitting MSG6");
1990                     transport_setup_msgok(st,source);
1991                     create_msg6(st,st->current.transform,
1992                                 st->current.remote_session_id);
1993                     transport_xmit(st,&st->peers,&st->buffer,True);
1994                     BUF_FREE(&st->buffer);
1995                 } else {
1996                     slog(st,LOG_SEC,"invalid MSG5 (in state RUN)");
1997                 }
1998             } else {
1999                 slog(st,LOG_UNEXPECTED,"unexpected MSG5");
2000             }
2001             break;
2002         case LABEL_MSG6:
2003             /* Setup packet: expected only in state SENTMSG5 */
2004             if (st->state!=SITE_SENTMSG5) {
2005                 slog(st,LOG_UNEXPECTED,"unexpected MSG6");
2006             } else if (process_msg6(st,buf,source)) {
2007                 BUF_FREE(&st->buffer); /* Free message 5 */
2008                 transport_setup_msgok(st,source);
2009                 activate_new_key(st);
2010             } else {
2011                 slog(st,LOG_SEC,"invalid MSG6");
2012             }
2013             break;
2014         default:
2015             slog(st,LOG_SEC,"received message of unknown type 0x%08x",
2016                  msgtype);
2017             break;
2018         }
2019         BUF_FREE(buf);
2020         return True;
2021     }
2022
2023     return False;
2024 }
2025
2026 static void site_control(void *vst, bool_t run)
2027 {
2028     struct site *st=vst;
2029     if (run) enter_state_run(st);
2030     else enter_state_stop(st);
2031 }
2032
2033 static void site_phase_hook(void *sst, uint32_t newphase)
2034 {
2035     struct site *st=sst;
2036
2037     /* The program is shutting down; tell our peer */
2038     send_msg7(st,"shutting down");
2039 }
2040
2041 static void site_childpersist_clearkeys(void *sst, uint32_t newphase)
2042 {
2043     struct site *st=sst;
2044     dispose_transform(&st->current.transform);
2045     dispose_transform(&st->auxiliary_key.transform);
2046     dispose_transform(&st->new_transform);
2047     /* Not much point overwiting the signing key, since we loaded it
2048        from disk, and it is only valid prospectively if at all,
2049        anyway. */
2050     /* XXX it would be best to overwrite the DH state, because that
2051        _is_ relevant to forward secrecy.  However we have no
2052        convenient interface for doing that and in practice gmp has
2053        probably dribbled droppings all over the malloc arena.  A good
2054        way to fix this would be to have a privsep child for asymmetric
2055        crypto operations, but that's a task for another day. */
2056 }
2057
2058 static list_t *site_apply(closure_t *self, struct cloc loc, dict_t *context,
2059                           list_t *args)
2060 {
2061     static uint32_t index_sequence;
2062     struct site *st;
2063     item_t *item;
2064     dict_t *dict;
2065     int i;
2066
2067     NEW(st);
2068
2069     st->cl.description="site";
2070     st->cl.type=CL_SITE;
2071     st->cl.apply=NULL;
2072     st->cl.interface=&st->ops;
2073     st->ops.st=st;
2074     st->ops.control=site_control;
2075     st->ops.status=site_status;
2076
2077     /* First parameter must be a dict */
2078     item=list_elem(args,0);
2079     if (!item || item->type!=t_dict)
2080         cfgfatal(loc,"site","parameter must be a dictionary\n");
2081     
2082     dict=item->data.dict;
2083     st->localname=dict_read_string(dict, "local-name", True, "site", loc);
2084     st->remotename=dict_read_string(dict, "name", True, "site", loc);
2085
2086     st->keepalive=dict_read_bool(dict,"keepalive",False,"site",loc,False);
2087
2088     st->peer_mobile=dict_read_bool(dict,"mobile",False,"site",loc,False);
2089     st->local_mobile=
2090         dict_read_bool(dict,"local-mobile",False,"site",loc,False);
2091
2092     /* Sanity check (which also allows the 'sites' file to include
2093        site() closures for all sites including our own): refuse to
2094        talk to ourselves */
2095     if (strcmp(st->localname,st->remotename)==0) {
2096         Message(M_DEBUG,"site %s: local-name==name -> ignoring this site\n",
2097                 st->localname);
2098         if (st->peer_mobile != st->local_mobile)
2099             cfgfatal(loc,"site","site %s's peer-mobile=%d"
2100                     " but our local-mobile=%d\n",
2101                     st->localname, st->peer_mobile, st->local_mobile);
2102         free(st);
2103         return NULL;
2104     }
2105     if (st->peer_mobile && st->local_mobile) {
2106         Message(M_WARNING,"site %s: site is mobile but so are we"
2107                 " -> ignoring this site\n", st->remotename);
2108         free(st);
2109         return NULL;
2110     }
2111
2112     assert(index_sequence < 0xffffffffUL);
2113     st->index = ++index_sequence;
2114     st->local_capabilities = 0;
2115     st->netlink=find_cl_if(dict,"link",CL_NETLINK,True,"site",loc);
2116
2117 #define GET_CLOSURE_LIST(dictkey,things,nthings,CL_TYPE) do{            \
2118     list_t *things##_cfg=dict_lookup(dict,dictkey);                     \
2119     if (!things##_cfg)                                                  \
2120         cfgfatal(loc,"site","closure list \"%s\" not found\n",dictkey); \
2121     st->nthings=list_length(things##_cfg);                              \
2122     NEW_ARY(st->things,st->nthings);                                    \
2123     assert(st->nthings);                                                \
2124     for (i=0; i<st->nthings; i++) {                                     \
2125         item_t *item=list_elem(things##_cfg,i);                         \
2126         if (item->type!=t_closure)                                      \
2127             cfgfatal(loc,"site","%s is not a closure\n",dictkey);       \
2128         closure_t *cl=item->data.closure;                               \
2129         if (cl->type!=CL_TYPE)                                          \
2130             cfgfatal(loc,"site","%s closure wrong type\n",dictkey);     \
2131         st->things[i]=cl->interface;                                    \
2132     }                                                                   \
2133 }while(0)
2134
2135     GET_CLOSURE_LIST("comm",comms,ncomms,CL_COMM);
2136
2137     NEW_ARY(st->commclientinfos, st->ncomms);
2138     dict_t *comminfo = dict_read_dict(dict,"comm-info",False,"site",loc);
2139     for (i=0; i<st->ncomms; i++) {
2140         st->commclientinfos[i] =
2141             !comminfo ? 0 :
2142             st->comms[i]->clientinfo(st->comms[i],comminfo,loc);
2143     }
2144
2145     st->resolver=find_cl_if(dict,"resolver",CL_RESOLVER,True,"site",loc);
2146     st->log=find_cl_if(dict,"log",CL_LOG,True,"site",loc);
2147     st->random=find_cl_if(dict,"random",CL_RANDOMSRC,True,"site",loc);
2148
2149     st->privkey=find_cl_if(dict,"local-key",CL_RSAPRIVKEY,True,"site",loc);
2150     st->addresses=dict_read_string_array(dict,"address",False,"site",loc,0);
2151     if (st->addresses)
2152         st->remoteport=dict_read_number(dict,"port",True,"site",loc,0);
2153     else st->remoteport=0;
2154     st->pubkey=find_cl_if(dict,"key",CL_RSAPUBKEY,True,"site",loc);
2155
2156     GET_CLOSURE_LIST("transform",transforms,ntransforms,CL_TRANSFORM);
2157
2158     st->dh=find_cl_if(dict,"dh",CL_DH,True,"site",loc);
2159     st->hash=find_cl_if(dict,"hash",CL_HASH,True,"site",loc);
2160
2161 #define DEFAULT(D) (st->peer_mobile || st->local_mobile \
2162                     ? DEFAULT_MOBILE_##D : DEFAULT_##D)
2163 #define CFG_NUMBER(k,D) dict_read_number(dict,(k),False,"site",loc,DEFAULT(D));
2164
2165     st->key_lifetime=         CFG_NUMBER("key-lifetime",  KEY_LIFETIME);
2166     st->setup_retries=        CFG_NUMBER("setup-retries", SETUP_RETRIES);
2167     st->setup_retry_interval= CFG_NUMBER("setup-timeout", SETUP_RETRY_INTERVAL);
2168     st->wait_timeout_mean=    CFG_NUMBER("wait-time",     WAIT_TIME);
2169     st->mtu_target= dict_read_number(dict,"mtu-target",False,"site",loc,0);
2170
2171     st->mobile_peer_expiry= dict_read_number(
2172        dict,"mobile-peer-expiry",False,"site",loc,DEFAULT_MOBILE_PEER_EXPIRY);
2173
2174     const char *peerskey= st->peer_mobile
2175         ? "mobile-peers-max" : "static-peers-max";
2176     st->transport_peers_max= dict_read_number(
2177         dict,peerskey,False,"site",loc, st->addresses ? 4 : 3);
2178     if (st->transport_peers_max<1 ||
2179         st->transport_peers_max>MAX_PEER_ADDRS) {
2180         cfgfatal(loc,"site", "%s must be in range 1.."
2181                  STRING(MAX_PEER_ADDRS) "\n", peerskey);
2182     }
2183
2184     if (st->key_lifetime < DEFAULT(KEY_RENEGOTIATE_GAP)*2)
2185         st->key_renegotiate_time=st->key_lifetime/2;
2186     else
2187         st->key_renegotiate_time=st->key_lifetime-DEFAULT(KEY_RENEGOTIATE_GAP);
2188     st->key_renegotiate_time=dict_read_number(
2189         dict,"renegotiate-time",False,"site",loc,st->key_renegotiate_time);
2190     if (st->key_renegotiate_time > st->key_lifetime) {
2191         cfgfatal(loc,"site",
2192                  "renegotiate-time must be less than key-lifetime\n");
2193     }
2194
2195     st->log_events=string_list_to_word(dict_lookup(dict,"log-events"),
2196                                        log_event_table,"site");
2197
2198     st->resolving_count=0;
2199     st->allow_send_prod=0;
2200
2201     st->tunname=safe_malloc(strlen(st->localname)+strlen(st->remotename)+5,
2202                             "site_apply");
2203     sprintf(st->tunname,"%s<->%s",st->localname,st->remotename);
2204
2205     /* The information we expect to see in incoming messages of type 1 */
2206     /* fixme: lots of unchecked overflows here, but the results are only
2207        corrupted packets rather than undefined behaviour */
2208     st->our_name_later=(strcmp(st->localname,st->remotename)>0);
2209
2210     buffer_new(&st->buffer,SETUP_BUFFER_LEN);
2211
2212     buffer_new(&st->scratch,SETUP_BUFFER_LEN);
2213     BUF_ALLOC(&st->scratch,"site:scratch");
2214
2215     /* We are interested in poll(), but only for timeouts. We don't have
2216        any fds of our own. */
2217     register_for_poll(st, site_beforepoll, site_afterpoll, "site");
2218     st->timeout=0;
2219
2220     st->remote_capabilities=0;
2221     st->chosen_transform=0;
2222     st->current.key_timeout=0;
2223     st->auxiliary_key.key_timeout=0;
2224     transport_peers_clear(st,&st->peers);
2225     transport_peers_clear(st,&st->setup_peers);
2226     /* XXX mlock these */
2227     st->dhsecret=safe_malloc(st->dh->len,"site:dhsecret");
2228     st->sharedsecretlen=st->sharedsecretallocd=0;
2229     st->sharedsecret=0;
2230
2231     for (i=0; i<st->ntransforms; i++) {
2232         struct transform_if *ti=st->transforms[i];
2233         uint32_t capbit = 1UL << ti->capab_transformnum;
2234         if (st->local_capabilities & capbit)
2235             slog(st,LOG_ERROR,"transformnum capability bit"
2236                  " %d (%#"PRIx32") reused", ti->capab_transformnum, capbit);
2237         st->local_capabilities |= capbit;
2238     }
2239
2240     if (st->local_mobile || st->peer_mobile)
2241         st->local_capabilities |= CAPAB_PRIORITY_MOBILE;
2242
2243     /* We need to register the remote networks with the netlink device */
2244     uint32_t netlink_mtu; /* local virtual interface mtu */
2245     st->netlink->reg(st->netlink->st, site_outgoing, st, &netlink_mtu);
2246     if (!st->mtu_target)
2247         st->mtu_target=netlink_mtu;
2248     
2249     for (i=0; i<st->ncomms; i++)
2250         st->comms[i]->request_notify(st->comms[i]->st, st, site_incoming);
2251
2252     st->current.transform=0;
2253     st->auxiliary_key.transform=0;
2254     st->new_transform=0;
2255     st->auxiliary_is_new=0;
2256
2257     enter_state_stop(st);
2258
2259     add_hook(PHASE_SHUTDOWN,site_phase_hook,st);
2260     add_hook(PHASE_CHILDPERSIST,site_childpersist_clearkeys,st);
2261
2262     return new_closure(&st->cl);
2263 }
2264
2265 void site_module(dict_t *dict)
2266 {
2267     add_closure(dict,"site",site_apply);
2268 }
2269
2270
2271 /***** TRANSPORT PEERS definitions *****/
2272
2273 static void transport_peers_debug(struct site *st, transport_peers *dst,
2274                                   const char *didwhat,
2275                                   int nargs, const struct comm_addr *args,
2276                                   size_t stride) {
2277     int i;
2278     char *argp;
2279
2280     if (!(st->log_events & LOG_PEER_ADDRS))
2281         return; /* an optimisation */
2282
2283     slog(st, LOG_PEER_ADDRS, "peers (%s) %s nargs=%d => npeers=%d",
2284          (dst==&st->peers ? "data" :
2285           dst==&st->setup_peers ? "setup" : "UNKNOWN"),
2286          didwhat, nargs, dst->npeers);
2287
2288     for (i=0, argp=(void*)args;
2289          i<nargs;
2290          i++, (argp+=stride?stride:sizeof(*args))) {
2291         const struct comm_addr *ca=(void*)argp;
2292         slog(st, LOG_PEER_ADDRS, " args: addrs[%d]=%s",
2293              i, comm_addr_to_string(ca));
2294     }
2295     for (i=0; i<dst->npeers; i++) {
2296         struct timeval diff;
2297         timersub(tv_now,&dst->peers[i].last,&diff);
2298         const struct comm_addr *ca=&dst->peers[i].addr;
2299         slog(st, LOG_PEER_ADDRS, " peers: addrs[%d]=%s T-%ld.%06ld",
2300              i, comm_addr_to_string(ca),
2301              (unsigned long)diff.tv_sec, (unsigned long)diff.tv_usec);
2302     }
2303 }
2304
2305 static void transport_peers_expire(struct site *st, transport_peers *peers) {
2306     /* peers must be sorted first */
2307     int previous_peers=peers->npeers;
2308     struct timeval oldest;
2309     oldest.tv_sec  = tv_now->tv_sec - st->mobile_peer_expiry;
2310     oldest.tv_usec = tv_now->tv_usec;
2311     while (peers->npeers>1 &&
2312            timercmp(&peers->peers[peers->npeers-1].last, &oldest, <))
2313         peers->npeers--;
2314     if (peers->npeers != previous_peers)
2315         transport_peers_debug(st,peers,"expire", 0,0,0);
2316 }
2317
2318 static bool_t transport_peer_record_one(struct site *st, transport_peers *peers,
2319                                         const struct comm_addr *ca,
2320                                         const struct timeval *tv) {
2321     /* returns false if output is full */
2322     int search;
2323
2324     if (peers->npeers >= st->transport_peers_max)
2325         return 0;
2326
2327     for (search=0; search<peers->npeers; search++)
2328         if (comm_addr_equal(&peers->peers[search].addr, ca))
2329             return 1;
2330
2331     peers->peers[peers->npeers].addr = *ca;
2332     peers->peers[peers->npeers].last = *tv;
2333     peers->npeers++;
2334     return 1;
2335 }
2336
2337 static void transport_record_peers(struct site *st, transport_peers *peers,
2338                                    const struct comm_addr *addrs, int naddrs,
2339                                    const char *m) {
2340     /* We add addrs into peers.  The new entries end up at the front
2341      * and displace entries towards the end (perhaps even off the
2342      * end).  Any existing matching entries are moved up to the front.
2343      *
2344      * Caller must first call transport_peers_expire. */
2345
2346     if (naddrs==1) {
2347         /* avoids debug for uninteresting updates */
2348         int i;
2349         for (i=0; i<peers->npeers; i++) {
2350             if (comm_addr_equal(&addrs[0], &peers->peers[i].addr)) {
2351                 memmove(peers->peers+1, peers->peers,
2352                         sizeof(peers->peers[0]) * i);
2353                 peers->peers[0].addr = addrs[0];
2354                 peers->peers[0].last = *tv_now;
2355                 return;
2356             }
2357         }
2358     }
2359
2360     int old_npeers=peers->npeers;
2361     transport_peer old_peers[old_npeers];
2362     COPY_ARRAY(old_peers,peers->peers,old_npeers);
2363
2364     peers->npeers=0;
2365     int i;
2366     for (i=0; i<naddrs; i++) {
2367         if (!transport_peer_record_one(st,peers, &addrs[i], tv_now))
2368             break;
2369     }
2370     for (i=0; i<old_npeers; i++) {
2371         const transport_peer *old=&old_peers[i];
2372         if (!transport_peer_record_one(st,peers, &old->addr, &old->last))
2373             break;
2374     }
2375
2376     transport_peers_debug(st,peers,m, naddrs,addrs,0);
2377 }
2378
2379 static void transport_expire_record_peers(struct site *st,
2380                                           transport_peers *peers,
2381                                           const struct comm_addr *addrs,
2382                                           int naddrs, const char *m) {
2383     /* Convenience function */
2384     transport_peers_expire(st,peers);
2385     transport_record_peers(st,peers,addrs,naddrs,m);
2386 }
2387
2388 static bool_t transport_compute_setupinit_peers(struct site *st,
2389         const struct comm_addr *configured_addrs /* 0 if none or not found */,
2390         int n_configured_addrs /* 0 if none or not found */,
2391         const struct comm_addr *incoming_packet_addr /* 0 if none */) {
2392     if (!n_configured_addrs && !incoming_packet_addr &&
2393         !transport_peers_valid(&st->peers))
2394         return False;
2395
2396     slog(st,LOG_SETUP_INIT,
2397          "using: %d configured addr(s);%s %d old peer addrs(es)",
2398          n_configured_addrs,
2399          incoming_packet_addr ? " incoming packet address;" : "",
2400          st->peers.npeers);
2401
2402     /* Non-mobile peers try addresses until one is plausible.  The
2403      * effect is that this code always tries first the configured
2404      * address if supplied, or otherwise the address of the incoming
2405      * PROD, or finally the existing data peer if one exists; this is
2406      * as desired. */
2407
2408     transport_peers_copy(st,&st->setup_peers,&st->peers);
2409     transport_peers_expire(st,&st->setup_peers);
2410
2411     if (incoming_packet_addr)
2412         transport_record_peers(st,&st->setup_peers,
2413                                incoming_packet_addr,1, "incoming");
2414
2415     if (n_configured_addrs)
2416         transport_record_peers(st,&st->setup_peers,
2417                               configured_addrs,n_configured_addrs, "setupinit");
2418
2419     assert(transport_peers_valid(&st->setup_peers));
2420     return True;
2421 }
2422
2423 static void transport_setup_msgok(struct site *st, const struct comm_addr *a) {
2424     if (st->peer_mobile)
2425         transport_expire_record_peers(st,&st->setup_peers,a,1,"setupmsg");
2426 }
2427 static void transport_data_msgok(struct site *st, const struct comm_addr *a) {
2428     if (st->peer_mobile)
2429         transport_expire_record_peers(st,&st->peers,a,1,"datamsg");
2430 }
2431
2432 static int transport_peers_valid(transport_peers *peers) {
2433     return peers->npeers;
2434 }
2435 static void transport_peers_clear(struct site *st, transport_peers *peers) {
2436     peers->npeers= 0;
2437     transport_peers_debug(st,peers,"clear",0,0,0);
2438 }
2439 static void transport_peers_copy(struct site *st, transport_peers *dst,
2440                                  const transport_peers *src) {
2441     dst->npeers=src->npeers;
2442     COPY_ARRAY(dst->peers, src->peers, dst->npeers);
2443     transport_peers_debug(st,dst,"copy",
2444                           src->npeers, &src->peers->addr, sizeof(*src->peers));
2445 }
2446
2447 static void transport_resolve_complete(struct site *st,
2448                                        const struct comm_addr *addrs,
2449                                        int naddrs) {
2450     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2451                                   "resolved data");
2452     transport_expire_record_peers(st,&st->setup_peers,addrs,naddrs,
2453                                   "resolved setup");
2454 }
2455
2456 static void transport_resolve_complete_tardy(struct site *st,
2457                                              const struct comm_addr *addrs,
2458                                              int naddrs) {
2459     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2460                                   "resolved tardily");
2461 }
2462
2463 static void transport_peers__copy_by_mask(transport_peer *out, int *nout_io,
2464                                           unsigned mask,
2465                                           const transport_peers *inp) {
2466     /* out and in->peers may be the same region, or nonoverlapping */
2467     const transport_peer *in=inp->peers;
2468     int slot;
2469     for (slot=0; slot<inp->npeers; slot++) {
2470         if (!(mask & (1U << slot)))
2471             continue;
2472         if (!(out==in && slot==*nout_io))
2473             COPY_OBJ(out[*nout_io], in[slot]);
2474         (*nout_io)++;
2475     }
2476 }
2477
2478 void transport_xmit(struct site *st, transport_peers *peers,
2479                     struct buffer_if *buf, bool_t candebug) {
2480     int slot;
2481     transport_peers_expire(st, peers);
2482     unsigned failed=0; /* bitmask */
2483     assert(MAX_PEER_ADDRS < sizeof(unsigned)*CHAR_BIT);
2484
2485     int nfailed=0;
2486     for (slot=0; slot<peers->npeers; slot++) {
2487         transport_peer *peer=&peers->peers[slot];
2488         bool_t ok = comm_addr_sendmsg(st, &peer->addr, buf);
2489         if (candebug)
2490             dump_packet(st, buf, &peer->addr, False, ok);
2491         if (!ok) {
2492             failed |= 1U << slot;
2493             nfailed++;
2494         }
2495         if (ok && !st->peer_mobile)
2496             break;
2497     }
2498     /* Now we need to demote/delete failing addrs: if we are mobile we
2499      * merely demote them; otherwise we delete them. */
2500     if (st->local_mobile) {
2501         unsigned expected = ((1U << nfailed)-1) << (peers->npeers-nfailed);
2502         /* `expected' has all the failures at the end already */
2503         if (failed != expected) {
2504             int fslot=0;
2505             transport_peer failedpeers[nfailed];
2506             transport_peers__copy_by_mask(failedpeers, &fslot, failed,peers);
2507             assert(fslot == nfailed);
2508             int wslot=0;
2509             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2510             assert(wslot+nfailed == peers->npeers);
2511             COPY_ARRAY(peers->peers+wslot, failedpeers, nfailed);
2512             transport_peers_debug(st,peers,"mobile failure reorder",0,0,0);
2513         }
2514     } else {
2515         if (failed && peers->npeers > 1) {
2516             int wslot=0;
2517             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2518             peers->npeers=wslot;
2519             transport_peers_debug(st,peers,"non-mobile failure cleanup",0,0,0);
2520         }
2521     }
2522 }
2523
2524 /***** END of transport peers declarations *****/