chiark / gitweb /
site.c: Abstract out the various parts of capability handling.
[secnet.git] / site.c
1 /* site.c - manage communication with a remote network site */
2
3 /*
4  * This file is part of secnet.
5  * See README for full list of copyright holders.
6  *
7  * secnet is free software; you can redistribute it and/or modify it
8  * under the terms of the GNU General Public License as published by
9  * the Free Software Foundation; either version 3 of the License, or
10  * (at your option) any later version.
11  * 
12  * secnet is distributed in the hope that it will be useful, but
13  * WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15  * General Public License for more details.
16  * 
17  * You should have received a copy of the GNU General Public License
18  * version 3 along with secnet; if not, see
19  * https://www.gnu.org/licenses/gpl.html.
20  */
21
22 /* The 'site' code doesn't know anything about the structure of the
23    packets it's transmitting.  In fact, under the new netlink
24    configuration scheme it doesn't need to know anything at all about
25    IP addresses, except how to contact its peer.  This means it could
26    potentially be used to tunnel other protocols too (IPv6, IPX, plain
27    old Ethernet frames) if appropriate netlink code can be written
28    (and that ought not to be too hard, eg. using the TUN/TAP device to
29    pretend to be an Ethernet interface).  */
30
31 /* At some point in the future the netlink code will be asked for
32    configuration information to go in the PING/PONG packets at the end
33    of the key exchange. */
34
35 #include "secnet.h"
36 #include <stdio.h>
37 #include <string.h>
38 #include <limits.h>
39 #include <assert.h>
40 #include <sys/socket.h>
41
42 #include <sys/mman.h>
43 #include "util.h"
44 #include "unaligned.h"
45 #include "magic.h"
46
47 #define SETUP_BUFFER_LEN 2048
48
49 #define DEFAULT_KEY_LIFETIME                  (3600*1000) /* [ms] */
50 #define DEFAULT_KEY_RENEGOTIATE_GAP           (5*60*1000) /* [ms] */
51 #define DEFAULT_SETUP_RETRIES 5
52 #define DEFAULT_SETUP_RETRY_INTERVAL             (2*1000) /* [ms] */
53 #define DEFAULT_WAIT_TIME                       (20*1000) /* [ms] */
54
55 #define DEFAULT_MOBILE_KEY_LIFETIME      (2*24*3600*1000) /* [ms] */
56 #define DEFAULT_MOBILE_KEY_RENEGOTIATE_GAP (12*3600*1000) /* [ms] */
57 #define DEFAULT_MOBILE_SETUP_RETRIES 30
58 #define DEFAULT_MOBILE_SETUP_RETRY_INTERVAL      (1*1000) /* [ms] */
59 #define DEFAULT_MOBILE_WAIT_TIME                (10*1000) /* [ms] */
60
61 #define DEFAULT_MOBILE_PEER_EXPIRY            (2*60)      /* [s] */
62
63 /* Each site can be in one of several possible states. */
64
65 /* States:
66    SITE_STOP         - nothing is allowed to happen; tunnel is down;
67                        all session keys have been erased
68      -> SITE_RUN upon external instruction
69    SITE_RUN          - site up, maybe with valid key
70      -> SITE_RESOLVE upon outgoing packet and no valid key
71          we start name resolution for the other end of the tunnel
72      -> SITE_SENTMSG2 upon valid incoming message 1 and suitable time
73          we send an appropriate message 2
74    SITE_RESOLVE      - waiting for name resolution
75      -> SITE_SENTMSG1 upon successful resolution
76          we send an appropriate message 1
77      -> SITE_SENTMSG2 upon valid incoming message 1 (then abort resolution)
78          we abort resolution and 
79      -> SITE_WAIT on timeout or resolution failure
80    SITE_SENTMSG1
81      -> SITE_SENTMSG2 upon valid incoming message 1 from higher priority end
82      -> SITE_SENTMSG3 upon valid incoming message 2
83      -> SITE_WAIT on timeout
84    SITE_SENTMSG2
85      -> SITE_SENTMSG4 upon valid incoming message 3
86      -> SITE_WAIT on timeout
87    SITE_SENTMSG3
88      -> SITE_SENTMSG5 upon valid incoming message 4
89      -> SITE_WAIT on timeout
90    SITE_SENTMSG4
91      -> SITE_RUN upon valid incoming message 5
92      -> SITE_WAIT on timeout
93    SITE_SENTMSG5
94      -> SITE_RUN upon valid incoming message 6
95      -> SITE_WAIT on timeout
96    SITE_WAIT         - failed to establish key; do nothing for a while
97      -> SITE_RUN on timeout
98    */
99
100 #define SITE_STOP     0
101 #define SITE_RUN      1
102 #define SITE_RESOLVE  2
103 #define SITE_SENTMSG1 3
104 #define SITE_SENTMSG2 4
105 #define SITE_SENTMSG3 5
106 #define SITE_SENTMSG4 6
107 #define SITE_SENTMSG5 7
108 #define SITE_WAIT     8
109
110 int32_t site_max_start_pad = 4*4;
111
112 static cstring_t state_name(uint32_t state)
113 {
114     switch (state) {
115     case 0: return "STOP";
116     case 1: return "RUN";
117     case 2: return "RESOLVE";
118     case 3: return "SENTMSG1";
119     case 4: return "SENTMSG2";
120     case 5: return "SENTMSG3";
121     case 6: return "SENTMSG4";
122     case 7: return "SENTMSG5";
123     case 8: return "WAIT";
124     default: return "*bad state*";
125     }
126 }
127
128 #define NONCELEN 8
129
130 #define LOG_UNEXPECTED    0x00000001
131 #define LOG_SETUP_INIT    0x00000002
132 #define LOG_SETUP_TIMEOUT 0x00000004
133 #define LOG_ACTIVATE_KEY  0x00000008
134 #define LOG_TIMEOUT_KEY   0x00000010
135 #define LOG_SEC           0x00000020
136 #define LOG_STATE         0x00000040
137 #define LOG_DROP          0x00000080
138 #define LOG_DUMP          0x00000100
139 #define LOG_ERROR         0x00000400
140 #define LOG_PEER_ADDRS    0x00000800
141
142 static struct flagstr log_event_table[]={
143     { "unexpected", LOG_UNEXPECTED },
144     { "setup-init", LOG_SETUP_INIT },
145     { "setup-timeout", LOG_SETUP_TIMEOUT },
146     { "activate-key", LOG_ACTIVATE_KEY },
147     { "timeout-key", LOG_TIMEOUT_KEY },
148     { "security", LOG_SEC },
149     { "state-change", LOG_STATE },
150     { "packet-drop", LOG_DROP },
151     { "dump-packets", LOG_DUMP },
152     { "errors", LOG_ERROR },
153     { "peer-addrs", LOG_PEER_ADDRS },
154     { "default", LOG_SETUP_INIT|LOG_SETUP_TIMEOUT|
155       LOG_ACTIVATE_KEY|LOG_TIMEOUT_KEY|LOG_SEC|LOG_ERROR },
156     { "all", 0xffffffff },
157     { NULL, 0 }
158 };
159
160
161 /***** TRANSPORT PEERS declarations *****/
162
163 /* Details of "mobile peer" semantics:
164
165    - We use the same data structure for the different configurations,
166      but manage it with different algorithms.
167    
168    - We record up to mobile_peers_max peer address/port numbers
169      ("peers") for key setup, and separately up to mobile_peers_max
170      for data transfer.
171
172    - In general, we make a new set of addrs (see below) when we start
173      a new key exchange; the key setup addrs become the data transport
174      addrs when key setup complets.
175
176    If our peer is mobile:
177
178    - We send to all recent addresses of incoming packets, plus
179      initially all configured addresses (which we also expire).
180
181    - So, we record addrs of good incoming packets, as follows:
182       1. expire any peers last seen >120s ("mobile-peer-expiry") ago
183       2. add the peer of the just received packet to the applicable list
184          (possibly evicting the oldest entries to make room)
185      NB that we do not expire peers until an incoming packet arrives.
186
187    - If the peer has a configured address or name, we record them the
188      same way, but only as a result of our own initiation of key
189      setup.  (We might evict some incoming packet addrs to make room.)
190
191    - The default number of addrs to keep is 3, or 4 if we have a
192      configured name or address.  That's space for two configured
193      addresses (one IPv6 and one IPv4), plus two received addresses.
194
195    - Outgoing packets are sent to every recorded address in the
196      applicable list.  Any unsupported[1] addresses are deleted from
197      the list right away.  (This should only happen to configured
198      addresses, of course, but there is no need to check that.)
199
200    - When we successfully complete a key setup, we merge the key setup
201      peers into the data transfer peers.
202
203    [1] An unsupported address is one for whose AF we don't have a
204      socket (perhaps because we got EAFNOSUPPORT or some such) or for
205      which sendto gives ENETUNREACH.
206
207    If neither end is mobile:
208
209    - When peer initiated the key exchange, we use the incoming packet
210      address.
211
212    - When we initiate the key exchange, we try configured addresses
213      until we get one which isn't unsupported then fixate on that.
214
215    - When we complete a key setup, we replace the data transport peers
216      with those from the key setup.
217
218    If we are mobile:
219
220    - We can't tell when local network setup changes so we can't cache
221      the unsupported addrs and completely remove the spurious calls to
222      sendto, but we can optimise things a bit by deprioritising addrs
223      which seem to be unsupported.
224
225    - Use only configured addresses.  (Except, that if our peer
226      initiated a key exchange we use the incoming packet address until
227      our name resolution completes.)
228
229    - When we send a packet, try each address in turn; if addr
230      supported, put that address to the end of the list for future
231      packets, and go onto the next address.
232
233    - When we complete a key setup, we replace the data transport peers
234      with those from the key setup.
235
236    */
237
238 typedef struct {
239     struct timeval last;
240     struct comm_addr addr;
241 } transport_peer;
242
243 typedef struct {
244 /* configuration information */
245 /* runtime information */
246     int npeers;
247     transport_peer peers[MAX_PEER_ADDRS];
248 } transport_peers;
249
250 /* Basic operations on transport peer address sets */
251 static void transport_peers_clear(struct site *st, transport_peers *peers);
252 static int transport_peers_valid(transport_peers *peers);
253 static void transport_peers_copy(struct site *st, transport_peers *dst,
254                                  const transport_peers *src);
255
256 /* Record address of incoming setup packet; resp. data packet. */
257 static void transport_setup_msgok(struct site *st, const struct comm_addr *a);
258 static void transport_data_msgok(struct site *st, const struct comm_addr *a);
259
260 /* Initialise the setup addresses.  Called before we send the first
261  * packet in a key exchange.  If we are the initiator, as a result of
262  * resolve completing (or being determined not to be relevant) or an
263  * incoming PROD; if we are the responder, as a result of the MSG1. */
264 static bool_t transport_compute_setupinit_peers(struct site *st,
265         const struct comm_addr *configured_addrs /* 0 if none or not found */,
266         int n_configured_addrs /* 0 if none or not found */,
267         const struct comm_addr *incoming_packet_addr /* 0 if none */);
268
269 /* Called if we are the responder in a key setup, when the resolve
270  * completes.  transport_compute_setupinit_peers will hvae been called
271  * earlier.  If _complete is called, we are still doing the key setup
272  * (and we should use the new values for both the rest of the key
273  * setup and the ongoing data exchange); if _tardy is called, the key
274  * setup is done (either completed or not) and only the data peers are
275  * relevant */
276 static void transport_resolve_complete(struct site *st,
277         const struct comm_addr *addrs, int naddrs);
278 static void transport_resolve_complete_tardy(struct site *st,
279         const struct comm_addr *addrs, int naddrs);
280
281 static void transport_xmit(struct site *st, transport_peers *peers,
282                            struct buffer_if *buf, bool_t candebug);
283
284  /***** END of transport peers declarations *****/
285
286
287 struct data_key {
288     struct transform_inst_if *transform;
289     uint64_t key_timeout; /* End of life of current key */
290     uint32_t remote_session_id;
291 };
292
293 struct site {
294     closure_t cl;
295     struct site_if ops;
296 /* configuration information */
297     string_t localname;
298     string_t remotename;
299     bool_t keepalive;
300     bool_t local_mobile, peer_mobile; /* Mobile client support */
301     int32_t transport_peers_max;
302     string_t tunname; /* localname<->remotename by default, used in logs */
303     cstring_t *addresses; /* DNS name or address(es) for bootstrapping, optional */
304     int remoteport; /* Port for bootstrapping, optional */
305     uint32_t mtu_target;
306     struct netlink_if *netlink;
307     struct comm_if **comms;
308     struct comm_clientinfo **commclientinfos;
309     int ncomms;
310     struct resolver_if *resolver;
311     struct log_if *log;
312     struct random_if *random;
313     struct rsaprivkey_if *privkey;
314     struct rsapubkey_if *pubkey;
315     struct transform_if **transforms;
316     int ntransforms;
317     struct dh_if *dh;
318     struct hash_if *hash;
319
320     uint32_t index; /* Index of this site */
321     uint32_t local_capabilities;
322     int32_t setup_retries; /* How many times to send setup packets */
323     int32_t setup_retry_interval; /* Initial timeout for setup packets */
324     int32_t wait_timeout_mean; /* How long to wait if setup unsuccessful */
325     int32_t mobile_peer_expiry; /* How long to remember 2ary addresses */
326     int32_t key_lifetime; /* How long a key lasts once set up */
327     int32_t key_renegotiate_time; /* If we see traffic (or a keepalive)
328                                       after this time, initiate a new
329                                       key exchange */
330
331     bool_t our_name_later; /* our name > peer name */
332     uint32_t log_events;
333
334 /* runtime information */
335     uint32_t state;
336     uint64_t now; /* Most recently seen time */
337     bool_t allow_send_prod;
338     bool_t msg1_crossed_logged;
339     int resolving_count;
340     int resolving_n_results_all;
341     int resolving_n_results_stored;
342     struct comm_addr resolving_results[MAX_PEER_ADDRS];
343
344     /* The currently established session */
345     struct data_key current;
346     struct data_key auxiliary_key;
347     bool_t auxiliary_is_new;
348     uint64_t renegotiate_key_time; /* When we can negotiate a new key */
349     uint64_t auxiliary_renegotiate_key_time;
350     transport_peers peers; /* Current address(es) of peer for data traffic */
351
352     /* The current key setup protocol exchange.  We can only be
353        involved in one of these at a time.  There's a potential for
354        denial of service here (the attacker keeps sending a setup
355        packet; we keep trying to continue the exchange, and have to
356        timeout before we can listen for another setup packet); perhaps
357        we should keep a list of 'bad' sources for setup packets. */
358     uint32_t remote_capabilities;
359     uint16_t remote_adv_mtu;
360     struct transform_if *chosen_transform;
361     uint32_t setup_session_id;
362     transport_peers setup_peers;
363     uint8_t localN[NONCELEN]; /* Nonces for key exchange */
364     uint8_t remoteN[NONCELEN];
365     struct buffer_if buffer; /* Current outgoing key exchange packet */
366     struct buffer_if scratch;
367     int32_t retries; /* Number of retries remaining */
368     uint64_t timeout; /* Timeout for current state */
369     uint8_t *dhsecret;
370     uint8_t *sharedsecret;
371     uint32_t sharedsecretlen, sharedsecretallocd;
372     struct transform_inst_if *new_transform; /* For key setup/verify */
373 };
374
375 static uint32_t event_log_priority(struct site *st, uint32_t event)
376 {
377     if (!(event&st->log_events))
378         return 0;
379     switch(event) {
380     case LOG_UNEXPECTED:    return M_INFO;
381     case LOG_SETUP_INIT:    return M_INFO;
382     case LOG_SETUP_TIMEOUT: return M_NOTICE;
383     case LOG_ACTIVATE_KEY:  return M_INFO;
384     case LOG_TIMEOUT_KEY:   return M_INFO;
385     case LOG_SEC:           return M_SECURITY;
386     case LOG_STATE:         return M_DEBUG;
387     case LOG_DROP:          return M_DEBUG;
388     case LOG_DUMP:          return M_DEBUG;
389     case LOG_ERROR:         return M_ERR;
390     case LOG_PEER_ADDRS:    return M_DEBUG;
391     default:                return M_ERR;
392     }
393 }
394
395 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
396 FORMAT(printf,3,0);
397 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
398 {
399     uint32_t class;
400
401     class=event_log_priority(st, event);
402     if (class) {
403         slilog_part(st->log,class,"%s: ",st->tunname);
404         vslilog_part(st->log,class,msg,ap);
405         slilog_part(st->log,class,"\n");
406     }
407 }
408
409 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
410 FORMAT(printf,3,4);
411 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
412 {
413     va_list ap;
414     va_start(ap,msg);
415     vslog(st,event,msg,ap);
416     va_end(ap);
417 }
418
419 static void logtimeout(struct site *st, const char *fmt, ...)
420 FORMAT(printf,2,3);
421 static void logtimeout(struct site *st, const char *fmt, ...)
422 {
423     uint32_t class=event_log_priority(st,LOG_SETUP_TIMEOUT);
424     if (!class)
425         return;
426
427     va_list ap;
428     va_start(ap,fmt);
429
430     slilog_part(st->log,class,"%s: ",st->tunname);
431     vslilog_part(st->log,class,fmt,ap);
432
433     const char *delim;
434     int i;
435     for (i=0, delim=" (tried ";
436          i<st->setup_peers.npeers;
437          i++, delim=", ") {
438         transport_peer *peer=&st->setup_peers.peers[i];
439         const char *s=comm_addr_to_string(&peer->addr);
440         slilog_part(st->log,class,"%s%s",delim,s);
441     }
442
443     slilog_part(st->log,class,")\n");
444     va_end(ap);
445 }
446
447 static void set_link_quality(struct site *st);
448 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel);
449 static void delete_one_key(struct site *st, struct data_key *key,
450                            const char *reason /* may be 0 meaning don't log*/,
451                            const char *which /* ignored if !reasonn */,
452                            uint32_t loglevel /* ignored if !reasonn */);
453 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
454                                  const struct comm_addr *prod_hint);
455 static void enter_state_run(struct site *st);
456 static bool_t enter_state_resolve(struct site *st);
457 static void decrement_resolving_count(struct site *st, int by);
458 static bool_t enter_new_state(struct site *st,uint32_t next);
459 static void enter_state_wait(struct site *st);
460 static void activate_new_key(struct site *st);
461
462 static bool_t is_transform_valid(struct transform_inst_if *transform)
463 {
464     return transform && transform->valid(transform->st);
465 }
466
467 static bool_t current_valid(struct site *st)
468 {
469     return is_transform_valid(st->current.transform);
470 }
471
472 #define DEFINE_CALL_TRANSFORM(fwdrev)                                   \
473 static transform_apply_return                                           \
474 call_transform_##fwdrev(struct site *st,                                \
475                                    struct transform_inst_if *transform, \
476                                    struct buffer_if *buf,               \
477                                    const char **errmsg)                 \
478 {                                                                       \
479     if (!is_transform_valid(transform)) {                               \
480         *errmsg="transform not set up";                                 \
481         return transform_apply_err;                                     \
482     }                                                                   \
483     return transform->fwdrev(transform->st,buf,errmsg);                 \
484 }
485
486 DEFINE_CALL_TRANSFORM(forwards)
487 DEFINE_CALL_TRANSFORM(reverse)
488
489 static void dispose_transform(struct transform_inst_if **transform_var)
490 {
491     struct transform_inst_if *transform=*transform_var;
492     if (transform) {
493         transform->delkey(transform->st);
494         transform->destroy(transform->st);
495     }
496     *transform_var = 0;
497 }    
498
499 #define CHECK_AVAIL(b,l) do { if ((b)->size<(l)) return False; } while(0)
500 #define CHECK_EMPTY(b) do { if ((b)->size!=0) return False; } while(0)
501 #define CHECK_TYPE(b,t) do { uint32_t type; \
502     CHECK_AVAIL((b),4); \
503     type=buf_unprepend_uint32((b)); \
504     if (type!=(t)) return False; } while(0)
505
506 static _Bool type_is_msg34(uint32_t type)
507 {
508     return
509         type == LABEL_MSG3 ||
510         type == LABEL_MSG3BIS ||
511         type == LABEL_MSG4;
512 }
513
514 struct parsedname {
515     int32_t len;
516     uint8_t *name;
517     struct buffer_if extrainfo;
518 };
519
520 struct msg {
521     uint8_t *hashstart;
522     uint32_t dest;
523     uint32_t source;
524     struct parsedname remote;
525     struct parsedname local;
526     uint32_t remote_capabilities;
527     uint16_t remote_mtu;
528     int capab_transformnum;
529     uint8_t *nR;
530     uint8_t *nL;
531     int32_t pklen;
532     char *pk;
533     int32_t hashlen;
534     int32_t siglen;
535     char *sig;
536 };
537
538 static int32_t wait_timeout(struct site *st) {
539     int32_t t = st->wait_timeout_mean;
540     int8_t factor;
541     if (t < INT_MAX/2) {
542         st->random->generate(st->random->st,sizeof(factor),&factor);
543         t += (t / 256) * factor;
544     }
545     return t;
546 }
547
548 static _Bool set_new_transform(struct site *st, char *pk)
549 {
550     _Bool ok;
551
552     /* Make room for the shared key */
553     st->sharedsecretlen=st->chosen_transform->keylen?:st->dh->ceil_len;
554     assert(st->sharedsecretlen);
555     if (st->sharedsecretlen > st->sharedsecretallocd) {
556         st->sharedsecretallocd=st->sharedsecretlen;
557         st->sharedsecret=safe_realloc_ary(st->sharedsecret,1,
558                                           st->sharedsecretallocd,
559                                           "site:sharedsecret");
560     }
561
562     /* Generate the shared key */
563     st->dh->makeshared(st->dh->st,st->dhsecret,st->dh->len,pk,
564                        st->sharedsecret,st->sharedsecretlen);
565
566     /* Set up the transform */
567     struct transform_if *generator=st->chosen_transform;
568     struct transform_inst_if *generated=generator->create(generator->st);
569     ok = generated->setkey(generated->st,st->sharedsecret,
570                            st->sharedsecretlen,st->our_name_later);
571
572     dispose_transform(&st->new_transform);
573     if (!ok) return False;
574     st->new_transform=generated;
575
576     slog(st,LOG_SETUP_INIT,"key exchange negotiated transform"
577          " %d (capabilities ours=%#"PRIx32" theirs=%#"PRIx32")",
578          st->chosen_transform->capab_bit,
579          st->local_capabilities, st->remote_capabilities);
580     return True;
581 }
582
583 struct xinfoadd {
584     int32_t lenpos, afternul;
585 };
586 static void append_string_xinfo_start(struct buffer_if *buf,
587                                       struct xinfoadd *xia,
588                                       const char *str)
589     /* Helps construct one of the names with additional info as found
590      * in MSG1..4.  Call this function first, then append all the
591      * desired extra info (not including the nul byte) to the buffer,
592      * then call append_string_xinfo_done. */
593 {
594     xia->lenpos = buf->size;
595     buf_append_string(buf,str);
596     buf_append_uint8(buf,0);
597     xia->afternul = buf->size;
598 }
599 static void append_string_xinfo_done(struct buffer_if *buf,
600                                      struct xinfoadd *xia)
601 {
602     /* we just need to adjust the string length */
603     if (buf->size == xia->afternul) {
604         /* no extra info, strip the nul too */
605         buf_unappend_uint8(buf);
606     } else {
607         put_uint16(buf->start+xia->lenpos, buf->size-(xia->lenpos+2));
608     }
609 }
610
611 /* Build any of msg1 to msg4. msg5 and msg6 are built from the inside
612    out using a transform of config data supplied by netlink */
613 static bool_t generate_msg(struct site *st, uint32_t type, cstring_t what)
614 {
615     void *hst;
616     uint8_t *hash;
617     string_t dhpub, sig;
618
619     st->retries=st->setup_retries;
620     BUF_ALLOC(&st->buffer,what);
621     buffer_init(&st->buffer,0);
622     buf_append_uint32(&st->buffer,
623         (type==LABEL_MSG1?0:st->setup_session_id));
624     buf_append_uint32(&st->buffer,st->index);
625     buf_append_uint32(&st->buffer,type);
626
627     struct xinfoadd xia;
628     append_string_xinfo_start(&st->buffer,&xia,st->localname);
629     if ((st->local_capabilities & CAPAB_EARLY) || (type != LABEL_MSG1)) {
630         buf_append_uint32(&st->buffer,st->local_capabilities);
631     }
632     if (type_is_msg34(type)) {
633         buf_append_uint16(&st->buffer,st->mtu_target);
634     }
635     append_string_xinfo_done(&st->buffer,&xia);
636
637     buf_append_string(&st->buffer,st->remotename);
638     BUF_ADD_OBJ(append,&st->buffer,st->localN);
639     if (type==LABEL_MSG1) return True;
640     BUF_ADD_OBJ(append,&st->buffer,st->remoteN);
641     if (type==LABEL_MSG2) return True;
642
643     if (hacky_par_mid_failnow()) return False;
644
645     if (type==LABEL_MSG3BIS)
646         buf_append_uint8(&st->buffer,st->chosen_transform->capab_bit);
647
648     dhpub=st->dh->makepublic(st->dh->st,st->dhsecret,st->dh->len);
649     buf_append_string(&st->buffer,dhpub);
650     free(dhpub);
651     hash=safe_malloc(st->hash->len, "generate_msg");
652     hst=st->hash->init();
653     st->hash->update(hst,st->buffer.start,st->buffer.size);
654     st->hash->final(hst,hash);
655     sig=st->privkey->sign(st->privkey->st,hash,st->hash->len);
656     buf_append_string(&st->buffer,sig);
657     free(sig);
658     free(hash);
659     return True;
660 }
661
662 static bool_t unpick_name(struct buffer_if *msg, struct parsedname *nm)
663 {
664     CHECK_AVAIL(msg,2);
665     nm->len=buf_unprepend_uint16(msg);
666     CHECK_AVAIL(msg,nm->len);
667     nm->name=buf_unprepend(msg,nm->len);
668     uint8_t *nul=memchr(nm->name,0,nm->len);
669     if (!nul) {
670         buffer_readonly_view(&nm->extrainfo,0,0);
671     } else {
672         buffer_readonly_view(&nm->extrainfo, nul+1, msg->start-(nul+1));
673         nm->len=nul-nm->name;
674     }
675     return True;
676 }
677
678 static bool_t unpick_msg(struct site *st, uint32_t type,
679                          struct buffer_if *msg, struct msg *m)
680 {
681     m->capab_transformnum=-1;
682     m->hashstart=msg->start;
683     CHECK_AVAIL(msg,4);
684     m->dest=buf_unprepend_uint32(msg);
685     CHECK_AVAIL(msg,4);
686     m->source=buf_unprepend_uint32(msg);
687     CHECK_TYPE(msg,type);
688     if (!unpick_name(msg,&m->remote)) return False;
689     m->remote_capabilities=0;
690     m->remote_mtu=0;
691     if (m->remote.extrainfo.size) {
692         CHECK_AVAIL(&m->remote.extrainfo,4);
693         m->remote_capabilities=buf_unprepend_uint32(&m->remote.extrainfo);
694     }
695     if (type_is_msg34(type) && m->remote.extrainfo.size) {
696         CHECK_AVAIL(&m->remote.extrainfo,2);
697         m->remote_mtu=buf_unprepend_uint16(&m->remote.extrainfo);
698     }
699     if (!unpick_name(msg,&m->local)) return False;
700     if (type==LABEL_PROD) {
701         CHECK_EMPTY(msg);
702         return True;
703     }
704     CHECK_AVAIL(msg,NONCELEN);
705     m->nR=buf_unprepend(msg,NONCELEN);
706     if (type==LABEL_MSG1) {
707         CHECK_EMPTY(msg);
708         return True;
709     }
710     CHECK_AVAIL(msg,NONCELEN);
711     m->nL=buf_unprepend(msg,NONCELEN);
712     if (type==LABEL_MSG2) {
713         CHECK_EMPTY(msg);
714         return True;
715     }
716     if (type==LABEL_MSG3BIS) {
717         CHECK_AVAIL(msg,1);
718         m->capab_transformnum = buf_unprepend_uint8(msg);
719     } else {
720         m->capab_transformnum = CAPAB_BIT_ANCIENTTRANSFORM;
721     }
722     CHECK_AVAIL(msg,2);
723     m->pklen=buf_unprepend_uint16(msg);
724     CHECK_AVAIL(msg,m->pklen);
725     m->pk=buf_unprepend(msg,m->pklen);
726     m->hashlen=msg->start-m->hashstart;
727     CHECK_AVAIL(msg,2);
728     m->siglen=buf_unprepend_uint16(msg);
729     CHECK_AVAIL(msg,m->siglen);
730     m->sig=buf_unprepend(msg,m->siglen);
731     CHECK_EMPTY(msg);
732
733     /* In `process_msg3_msg4' below, we assume that we can write a nul
734      * terminator following the signature.  Make sure there's enough space.
735      */
736     if (msg->start >= msg->base + msg->alloclen)
737         return False;
738
739     return True;
740 }
741
742 static bool_t name_matches(const struct parsedname *nm, const char *expected)
743 {
744     int expected_len=strlen(expected);
745     return
746         nm->len == expected_len &&
747         !memcmp(nm->name, expected, expected_len);
748 }    
749
750 static bool_t check_msg(struct site *st, uint32_t type, struct msg *m,
751                         cstring_t *error)
752 {
753     if (type==LABEL_MSG1) return True;
754
755     /* Check that the site names and our nonce have been sent
756        back correctly, and then store our peer's nonce. */ 
757     if (!name_matches(&m->remote,st->remotename)) {
758         *error="wrong remote site name";
759         return False;
760     }
761     if (!name_matches(&m->local,st->localname)) {
762         *error="wrong local site name";
763         return False;
764     }
765     if (memcmp(m->nL,st->localN,NONCELEN)!=0) {
766         *error="wrong locally-generated nonce";
767         return False;
768     }
769     if (type==LABEL_MSG2) return True;
770     if (!consttime_memeq(m->nR,st->remoteN,NONCELEN)) {
771         *error="wrong remotely-generated nonce";
772         return False;
773     }
774     /* MSG3 has complicated rules about capabilities, which are
775      * handled in process_msg3. */
776     if (type==LABEL_MSG3 || type==LABEL_MSG3BIS) return True;
777     if (m->remote_capabilities!=st->remote_capabilities) {
778         *error="remote capabilities changed";
779         return False;
780     }
781     if (type==LABEL_MSG4) return True;
782     *error="unknown message type";
783     return False;
784 }
785
786 static bool_t generate_msg1(struct site *st)
787 {
788     st->random->generate(st->random->st,NONCELEN,st->localN);
789     return generate_msg(st,LABEL_MSG1,"site:MSG1");
790 }
791
792 static bool_t process_msg1(struct site *st, struct buffer_if *msg1,
793                            const struct comm_addr *src, struct msg *m)
794 {
795     /* We've already determined we're in an appropriate state to
796        process an incoming MSG1, and that the MSG1 has correct values
797        of A and B. */
798
799     st->setup_session_id=m->source;
800     st->remote_capabilities=m->remote_capabilities;
801     memcpy(st->remoteN,m->nR,NONCELEN);
802     return True;
803 }
804
805 static bool_t generate_msg2(struct site *st)
806 {
807     st->random->generate(st->random->st,NONCELEN,st->localN);
808     return generate_msg(st,LABEL_MSG2,"site:MSG2");
809 }
810
811 static bool_t process_msg2(struct site *st, struct buffer_if *msg2,
812                            const struct comm_addr *src)
813 {
814     struct msg m;
815     cstring_t err;
816
817     if (!unpick_msg(st,LABEL_MSG2,msg2,&m)) return False;
818     if (!check_msg(st,LABEL_MSG2,&m,&err)) {
819         slog(st,LOG_SEC,"msg2: %s",err);
820         return False;
821     }
822     st->setup_session_id=m.source;
823     st->remote_capabilities=m.remote_capabilities;
824
825     /* Select the transform to use */
826
827     uint32_t remote_crypto_caps = st->remote_capabilities & CAPAB_TRANSFORM_MASK;
828     if (!remote_crypto_caps)
829         /* old secnets only had this one transform */
830         remote_crypto_caps = 1UL << CAPAB_BIT_ANCIENTTRANSFORM;
831
832 #define CHOOSE_CRYPTO(kind, whats) do {                                 \
833     struct kind##_if *iface;                                            \
834     uint32_t bit, ours = 0;                                             \
835     int i;                                                              \
836     for (i= 0; i < st->n##kind##s; i++) {                               \
837         iface=st->kind##s[i];                                           \
838         bit = 1UL << iface->capab_bit;                                  \
839         if (bit & remote_crypto_caps) goto kind##_found;                \
840         ours |= bit;                                                    \
841     }                                                                   \
842     slog(st,LOG_ERROR,"no " whats " in common"                          \
843          " (us %#"PRIx32"; them: %#"PRIx32")",                          \
844          st->local_capabilities & ours, remote_crypto_caps);            \
845     return False;                                                       \
846 kind##_found:                                                           \
847     st->chosen_##kind = iface;                                          \
848 } while (0)
849
850     CHOOSE_CRYPTO(transform, "transforms");
851
852 #undef CHOOSE_CRYPTO
853
854     memcpy(st->remoteN,m.nR,NONCELEN);
855     return True;
856 }
857
858 static bool_t generate_msg3(struct site *st)
859 {
860     /* Now we have our nonce and their nonce. Think of a secret key,
861        and create message number 3. */
862     st->random->generate(st->random->st,st->dh->len,st->dhsecret);
863     return generate_msg(st,
864                         (st->remote_capabilities & CAPAB_TRANSFORM_MASK
865                          ? LABEL_MSG3BIS : LABEL_MSG3),
866                         "site:MSG3");
867 }
868
869 static bool_t process_msg3_msg4(struct site *st, struct msg *m)
870 {
871     uint8_t *hash;
872     void *hst;
873
874     /* Check signature and store g^x mod m */
875     hash=safe_malloc(st->hash->len, "process_msg3_msg4");
876     hst=st->hash->init();
877     st->hash->update(hst,m->hashstart,m->hashlen);
878     st->hash->final(hst,hash);
879     /* Terminate signature with a '0' - already checked that this will fit */
880     m->sig[m->siglen]=0;
881     if (!st->pubkey->check(st->pubkey->st,hash,st->hash->len,m->sig)) {
882         slog(st,LOG_SEC,"msg3/msg4 signature failed check!");
883         free(hash);
884         return False;
885     }
886     free(hash);
887
888     st->remote_adv_mtu=m->remote_mtu;
889
890     return True;
891 }
892
893 static bool_t process_msg3(struct site *st, struct buffer_if *msg3,
894                            const struct comm_addr *src, uint32_t msgtype)
895 {
896     struct msg m;
897     cstring_t err;
898
899     assert(msgtype==LABEL_MSG3 || msgtype==LABEL_MSG3BIS);
900
901     if (!unpick_msg(st,msgtype,msg3,&m)) return False;
902     if (!check_msg(st,msgtype,&m,&err)) {
903         slog(st,LOG_SEC,"msg3: %s",err);
904         return False;
905     }
906     uint32_t capab_adv_late = m.remote_capabilities
907         & ~st->remote_capabilities & CAPAB_EARLY;
908     if (capab_adv_late) {
909         slog(st,LOG_SEC,"msg3 impermissibly adds early capability flag(s)"
910              " %#"PRIx32" (was %#"PRIx32", now %#"PRIx32")",
911              capab_adv_late, st->remote_capabilities, m.remote_capabilities);
912         return False;
913     }
914     st->remote_capabilities|=m.remote_capabilities;
915
916 #define CHOSE_CRYPTO(kind, what) do {                                   \
917     struct kind##_if *iface;                                            \
918     int i;                                                              \
919     for (i=0; i<st->n##kind##s; i++) {                                  \
920         iface=st->kind##s[i];                                           \
921         if (iface->capab_bit == m.capab_##kind##num)                    \
922             goto kind##_found;                                          \
923     }                                                                   \
924     slog(st,LOG_SEC,"peer chose unknown-to-us " what " %d!",            \
925          m.capab_##kind##num);                                                  \
926     return False;                                                       \
927 kind##_found:                                                           \
928     st->chosen_##kind=iface;                                            \
929 } while (0)
930
931     CHOSE_CRYPTO(transform, "transform");
932
933 #undef CHOSE_CRYPTO
934
935     if (!process_msg3_msg4(st,&m))
936         return False;
937
938     /* Terminate their DH public key with a '0' */
939     m.pk[m.pklen]=0;
940     /* Invent our DH secret key */
941     st->random->generate(st->random->st,st->dh->len,st->dhsecret);
942
943     /* Generate the shared key and set up the transform */
944     if (!set_new_transform(st,m.pk)) return False;
945
946     return True;
947 }
948
949 static bool_t generate_msg4(struct site *st)
950 {
951     /* We have both nonces, their public key and our private key. Generate
952        our public key, sign it and send it to them. */
953     return generate_msg(st,LABEL_MSG4,"site:MSG4");
954 }
955
956 static bool_t process_msg4(struct site *st, struct buffer_if *msg4,
957                            const struct comm_addr *src)
958 {
959     struct msg m;
960     cstring_t err;
961
962     if (!unpick_msg(st,LABEL_MSG4,msg4,&m)) return False;
963     if (!check_msg(st,LABEL_MSG4,&m,&err)) {
964         slog(st,LOG_SEC,"msg4: %s",err);
965         return False;
966     }
967     
968     if (!process_msg3_msg4(st,&m))
969         return False;
970
971     /* Terminate their DH public key with a '0' */
972     m.pk[m.pklen]=0;
973
974     /* Generate the shared key and set up the transform */
975     if (!set_new_transform(st,m.pk)) return False;
976
977     return True;
978 }
979
980 struct msg0 {
981     uint32_t dest;
982     uint32_t source;
983     uint32_t type;
984 };
985
986 static bool_t unpick_msg0(struct site *st, struct buffer_if *msg0,
987                           struct msg0 *m)
988 {
989     CHECK_AVAIL(msg0,4);
990     m->dest=buf_unprepend_uint32(msg0);
991     CHECK_AVAIL(msg0,4);
992     m->source=buf_unprepend_uint32(msg0);
993     CHECK_AVAIL(msg0,4);
994     m->type=buf_unprepend_uint32(msg0);
995     return True;
996     /* Leaves transformed part of buffer untouched */
997 }
998
999 static bool_t generate_msg5(struct site *st)
1000 {
1001     cstring_t transform_err;
1002
1003     BUF_ALLOC(&st->buffer,"site:MSG5");
1004     /* We are going to add four words to the message */
1005     buffer_init(&st->buffer,calculate_max_start_pad());
1006     /* Give the netlink code an opportunity to put its own stuff in the
1007        message (configuration information, etc.) */
1008     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
1009     if (call_transform_forwards(st,st->new_transform,
1010                                 &st->buffer,&transform_err))
1011         return False;
1012     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
1013     buf_prepend_uint32(&st->buffer,st->index);
1014     buf_prepend_uint32(&st->buffer,st->setup_session_id);
1015
1016     st->retries=st->setup_retries;
1017     return True;
1018 }
1019
1020 static bool_t process_msg5(struct site *st, struct buffer_if *msg5,
1021                            const struct comm_addr *src,
1022                            struct transform_inst_if *transform)
1023 {
1024     struct msg0 m;
1025     cstring_t transform_err;
1026
1027     if (!unpick_msg0(st,msg5,&m)) return False;
1028
1029     if (call_transform_reverse(st,transform,msg5,&transform_err)) {
1030         /* There's a problem */
1031         slog(st,LOG_SEC,"process_msg5: transform: %s",transform_err);
1032         return False;
1033     }
1034     /* Buffer should now contain untransformed PING packet data */
1035     CHECK_AVAIL(msg5,4);
1036     if (buf_unprepend_uint32(msg5)!=LABEL_MSG5) {
1037         slog(st,LOG_SEC,"MSG5/PING packet contained wrong label");
1038         return False;
1039     }
1040     /* Older versions of secnet used to write some config data here
1041      * which we ignore.  So we don't CHECK_EMPTY */
1042     return True;
1043 }
1044
1045 static void create_msg6(struct site *st, struct transform_inst_if *transform,
1046                         uint32_t session_id)
1047 {
1048     cstring_t transform_err;
1049
1050     BUF_ALLOC(&st->buffer,"site:MSG6");
1051     /* We are going to add four words to the message */
1052     buffer_init(&st->buffer,calculate_max_start_pad());
1053     /* Give the netlink code an opportunity to put its own stuff in the
1054        message (configuration information, etc.) */
1055     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1056     transform_apply_return problem =
1057         call_transform_forwards(st,transform,
1058                                 &st->buffer,&transform_err);
1059     assert(!problem);
1060     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1061     buf_prepend_uint32(&st->buffer,st->index);
1062     buf_prepend_uint32(&st->buffer,session_id);
1063 }
1064
1065 static bool_t generate_msg6(struct site *st)
1066 {
1067     if (!is_transform_valid(st->new_transform))
1068         return False;
1069     create_msg6(st,st->new_transform,st->setup_session_id);
1070     st->retries=1; /* Peer will retransmit MSG5 if this packet gets lost */
1071     return True;
1072 }
1073
1074 static bool_t process_msg6(struct site *st, struct buffer_if *msg6,
1075                            const struct comm_addr *src)
1076 {
1077     struct msg0 m;
1078     cstring_t transform_err;
1079
1080     if (!unpick_msg0(st,msg6,&m)) return False;
1081
1082     if (call_transform_reverse(st,st->new_transform,msg6,&transform_err)) {
1083         /* There's a problem */
1084         slog(st,LOG_SEC,"process_msg6: transform: %s",transform_err);
1085         return False;
1086     }
1087     /* Buffer should now contain untransformed PING packet data */
1088     CHECK_AVAIL(msg6,4);
1089     if (buf_unprepend_uint32(msg6)!=LABEL_MSG6) {
1090         slog(st,LOG_SEC,"MSG6/PONG packet contained invalid data");
1091         return False;
1092     }
1093     /* Older versions of secnet used to write some config data here
1094      * which we ignore.  So we don't CHECK_EMPTY */
1095     return True;
1096 }
1097
1098 static transform_apply_return
1099 decrypt_msg0(struct site *st, struct buffer_if *msg0,
1100                            const struct comm_addr *src)
1101 {
1102     cstring_t transform_err, auxkey_err, newkey_err="n/a";
1103     struct msg0 m;
1104     transform_apply_return problem;
1105
1106     if (!unpick_msg0(st,msg0,&m)) return False;
1107
1108     /* Keep a copy so we can try decrypting it with multiple keys */
1109     buffer_copy(&st->scratch, msg0);
1110
1111     problem = call_transform_reverse(st,st->current.transform,
1112                                      msg0,&transform_err);
1113     if (!problem) {
1114         if (!st->auxiliary_is_new)
1115             delete_one_key(st,&st->auxiliary_key,
1116                            "peer has used new key","auxiliary key",LOG_SEC);
1117         return 0;
1118     }
1119     if (transform_apply_return_badseq(problem))
1120         goto badseq;
1121
1122     buffer_copy(msg0, &st->scratch);
1123     problem = call_transform_reverse(st,st->auxiliary_key.transform,
1124                                      msg0,&auxkey_err);
1125     if (!problem) {
1126         slog(st,LOG_DROP,"processing packet which uses auxiliary key");
1127         if (st->auxiliary_is_new) {
1128             /* We previously timed out in state SENTMSG5 but it turns
1129              * out that our peer did in fact get our MSG5 and is
1130              * using the new key.  So we should switch to it too. */
1131             /* This is a bit like activate_new_key. */
1132             struct data_key t;
1133             t=st->current;
1134             st->current=st->auxiliary_key;
1135             st->auxiliary_key=t;
1136
1137             delete_one_key(st,&st->auxiliary_key,"peer has used new key",
1138                            "previous key",LOG_SEC);
1139             st->auxiliary_is_new=0;
1140             st->renegotiate_key_time=st->auxiliary_renegotiate_key_time;
1141         }
1142         return 0;
1143     }
1144     if (transform_apply_return_badseq(problem))
1145         goto badseq;
1146
1147     if (st->state==SITE_SENTMSG5) {
1148         buffer_copy(msg0, &st->scratch);
1149         problem = call_transform_reverse(st,st->new_transform,
1150                                          msg0,&newkey_err);
1151         if (!problem) {
1152             /* It looks like we didn't get the peer's MSG6 */
1153             /* This is like a cut-down enter_new_state(SITE_RUN) */
1154             slog(st,LOG_STATE,"will enter state RUN (MSG0 with new key)");
1155             BUF_FREE(&st->buffer);
1156             st->timeout=0;
1157             activate_new_key(st);
1158             return 0; /* do process the data in this packet */
1159         }
1160         if (transform_apply_return_badseq(problem))
1161             goto badseq;
1162     }
1163
1164     slog(st,LOG_SEC,"transform: %s (aux: %s, new: %s)",
1165          transform_err,auxkey_err,newkey_err);
1166     initiate_key_setup(st,"incoming message would not decrypt",0);
1167     send_nak(src,m.dest,m.source,m.type,msg0,"message would not decrypt");
1168     assert(problem);
1169     return problem;
1170
1171  badseq:
1172     slog(st,LOG_DROP,"transform: %s (bad seq.)",transform_err);
1173     assert(problem);
1174     return problem;
1175 }
1176
1177 static bool_t process_msg0(struct site *st, struct buffer_if *msg0,
1178                            const struct comm_addr *src)
1179 {
1180     uint32_t type;
1181     transform_apply_return problem;
1182
1183     problem = decrypt_msg0(st,msg0,src);
1184     if (problem==transform_apply_seqdupe) {
1185         /* We recently received another copy of this packet, maybe due
1186          * to polypath.  That's not a problem; indeed, for the
1187          * purposes of transport address management it is a success.
1188          * But we don't want to process the packet. */
1189         transport_data_msgok(st,src);
1190         return False;
1191     }
1192     if (problem)
1193         return False;
1194
1195     CHECK_AVAIL(msg0,4);
1196     type=buf_unprepend_uint32(msg0);
1197     switch(type) {
1198     case LABEL_MSG7:
1199         /* We must forget about the current session. */
1200         delete_keys(st,"request from peer",LOG_SEC);
1201         /* probably, the peer is shutting down, and this is going to fail,
1202          * but we need to be trying to bring the link up again */
1203         if (st->keepalive)
1204             initiate_key_setup(st,"peer requested key teardown",0);
1205         return True;
1206     case LABEL_MSG9:
1207         /* Deliver to netlink layer */
1208         st->netlink->deliver(st->netlink->st,msg0);
1209         transport_data_msgok(st,src);
1210         /* See whether we should start negotiating a new key */
1211         if (st->now > st->renegotiate_key_time)
1212             initiate_key_setup(st,"incoming packet in renegotiation window",0);
1213         return True;
1214     default:
1215         slog(st,LOG_SEC,"incoming encrypted message of type %08x "
1216              "(unknown)",type);
1217         break;
1218     }
1219     return False;
1220 }
1221
1222 static void dump_packet(struct site *st, struct buffer_if *buf,
1223                         const struct comm_addr *addr, bool_t incoming,
1224                         bool_t ok)
1225 {
1226     uint32_t dest=get_uint32(buf->start);
1227     uint32_t source=get_uint32(buf->start+4);
1228     uint32_t msgtype=get_uint32(buf->start+8);
1229
1230     if (st->log_events & LOG_DUMP)
1231         slilog(st->log,M_DEBUG,"%s: %s: %08x<-%08x: %08x: %s%s",
1232                st->tunname,incoming?"incoming":"outgoing",
1233                dest,source,msgtype,comm_addr_to_string(addr),
1234                ok?"":" - fail");
1235 }
1236
1237 static bool_t comm_addr_sendmsg(struct site *st,
1238                                 const struct comm_addr *dest,
1239                                 struct buffer_if *buf)
1240 {
1241     int i;
1242     struct comm_clientinfo *commclientinfo = 0;
1243
1244     for (i=0; i < st->ncomms; i++) {
1245         if (st->comms[i] == dest->comm) {
1246             commclientinfo = st->commclientinfos[i];
1247             break;
1248         }
1249     }
1250     return dest->comm->sendmsg(dest->comm->st, buf, dest, commclientinfo);
1251 }
1252
1253 static uint32_t site_status(void *st)
1254 {
1255     return 0;
1256 }
1257
1258 static bool_t send_msg(struct site *st)
1259 {
1260     if (st->retries>0) {
1261         transport_xmit(st, &st->setup_peers, &st->buffer, True);
1262         st->timeout=st->now+st->setup_retry_interval;
1263         st->retries--;
1264         return True;
1265     } else if (st->state==SITE_SENTMSG5) {
1266         logtimeout(st,"timed out sending MSG5, stashing new key");
1267         /* We stash the key we have produced, in case it turns out that
1268          * our peer did see our MSG5 after all and starts using it. */
1269         /* This is a bit like some of activate_new_key */
1270         struct transform_inst_if *t;
1271         t=st->auxiliary_key.transform;
1272         st->auxiliary_key.transform=st->new_transform;
1273         st->new_transform=t;
1274         dispose_transform(&st->new_transform);
1275
1276         st->auxiliary_is_new=1;
1277         st->auxiliary_key.key_timeout=st->now+st->key_lifetime;
1278         st->auxiliary_renegotiate_key_time=st->now+st->key_renegotiate_time;
1279         st->auxiliary_key.remote_session_id=st->setup_session_id;
1280
1281         enter_state_wait(st);
1282         return False;
1283     } else {
1284         logtimeout(st,"timed out sending key setup packet "
1285             "(in state %s)",state_name(st->state));
1286         enter_state_wait(st);
1287         return False;
1288     }
1289 }
1290
1291 static void site_resolve_callback(void *sst, const struct comm_addr *addrs,
1292                                   int stored_naddrs, int all_naddrs,
1293                                   const char *address, const char *failwhy)
1294 {
1295     struct site *st=sst;
1296
1297     if (!stored_naddrs) {
1298         slog(st,LOG_ERROR,"resolution of %s failed: %s",address,failwhy);
1299     } else {
1300         slog(st,LOG_PEER_ADDRS,"resolution of %s completed, %d addrs, eg: %s",
1301              address, all_naddrs, comm_addr_to_string(&addrs[0]));;
1302
1303         int space=st->transport_peers_max-st->resolving_n_results_stored;
1304         int n_tocopy=MIN(stored_naddrs,space);
1305         COPY_ARRAY(st->resolving_results + st->resolving_n_results_stored,
1306                    addrs,
1307                    n_tocopy);
1308         st->resolving_n_results_stored += n_tocopy;
1309         st->resolving_n_results_all += all_naddrs;
1310     }
1311
1312     decrement_resolving_count(st,1);
1313 }
1314
1315 static void decrement_resolving_count(struct site *st, int by)
1316 {
1317     assert(st->resolving_count>0);
1318     st->resolving_count-=by;
1319
1320     if (st->resolving_count)
1321         return;
1322
1323     /* OK, we are done with them all.  Handle combined results. */
1324
1325     const struct comm_addr *addrs=st->resolving_results;
1326     int naddrs=st->resolving_n_results_stored;
1327     assert(naddrs<=st->transport_peers_max);
1328
1329     if (naddrs) {
1330         if (naddrs != st->resolving_n_results_all) {
1331             slog(st,LOG_SETUP_INIT,"resolution of supplied addresses/names"
1332                  " yielded too many results (%d > %d), some ignored",
1333                  st->resolving_n_results_all, naddrs);
1334         }
1335         slog(st,LOG_STATE,"resolution completed, %d addrs, eg: %s",
1336              naddrs, iaddr_to_string(&addrs[0].ia));;
1337     }
1338
1339     switch (st->state) {
1340     case SITE_RESOLVE:
1341         if (transport_compute_setupinit_peers(st,addrs,naddrs,0)) {
1342             enter_new_state(st,SITE_SENTMSG1);
1343         } else {
1344             /* Can't figure out who to try to to talk to */
1345             slog(st,LOG_SETUP_INIT,
1346                  "key exchange failed: cannot find peer address");
1347             enter_state_run(st);
1348         }
1349         break;
1350     case SITE_SENTMSG1: case SITE_SENTMSG2:
1351     case SITE_SENTMSG3: case SITE_SENTMSG4:
1352     case SITE_SENTMSG5:
1353         if (naddrs) {
1354             /* We start using the address immediately for data too.
1355              * It's best to store it in st->peers now because we might
1356              * go via SENTMSG5, WAIT, and a MSG0, straight into using
1357              * the new key (without updating the data peer addrs). */
1358             transport_resolve_complete(st,addrs,naddrs);
1359         } else if (st->local_mobile) {
1360             /* We can't let this rest because we may have a peer
1361              * address which will break in the future. */
1362             slog(st,LOG_SETUP_INIT,"resolution failed: "
1363                  "abandoning key exchange");
1364             enter_state_wait(st);
1365         } else {
1366             slog(st,LOG_SETUP_INIT,"resolution failed: "
1367                  " continuing to use source address of peer's packets"
1368                  " for key exchange and ultimately data");
1369         }
1370         break;
1371     case SITE_RUN:
1372         if (naddrs) {
1373             slog(st,LOG_SETUP_INIT,"resolution completed tardily,"
1374                  " updating peer address(es)");
1375             transport_resolve_complete_tardy(st,addrs,naddrs);
1376         } else if (st->local_mobile) {
1377             /* Not very good.  We should queue (another) renegotiation
1378              * so that we can update the peer address. */
1379             st->key_renegotiate_time=st->now+wait_timeout(st);
1380         } else {
1381             slog(st,LOG_SETUP_INIT,"resolution failed: "
1382                  " continuing to use source address of peer's packets");
1383         }
1384         break;
1385     case SITE_WAIT:
1386     case SITE_STOP:
1387         /* oh well */
1388         break;
1389     }
1390 }
1391
1392 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
1393                                  const struct comm_addr *prod_hint)
1394 {
1395     /* Reentrancy hazard: can call enter_new_state/enter_state_* */
1396     if (st->state!=SITE_RUN) return False;
1397     slog(st,LOG_SETUP_INIT,"initiating key exchange (%s)",reason);
1398     if (st->addresses) {
1399         slog(st,LOG_SETUP_INIT,"resolving peer address(es)");
1400         return enter_state_resolve(st);
1401     } else if (transport_compute_setupinit_peers(st,0,0,prod_hint)) {
1402         return enter_new_state(st,SITE_SENTMSG1);
1403     }
1404     slog(st,LOG_SETUP_INIT,"key exchange failed: no address for peer");
1405     return False;
1406 }
1407
1408 static void activate_new_key(struct site *st)
1409 {
1410     struct transform_inst_if *t;
1411
1412     /* We have three transform instances, which we swap between old,
1413        active and setup */
1414     t=st->auxiliary_key.transform;
1415     st->auxiliary_key.transform=st->current.transform;
1416     st->current.transform=st->new_transform;
1417     st->new_transform=t;
1418     dispose_transform(&st->new_transform);
1419
1420     st->timeout=0;
1421     st->auxiliary_is_new=0;
1422     st->auxiliary_key.key_timeout=st->current.key_timeout;
1423     st->current.key_timeout=st->now+st->key_lifetime;
1424     st->renegotiate_key_time=st->now+st->key_renegotiate_time;
1425     transport_peers_copy(st,&st->peers,&st->setup_peers);
1426     st->current.remote_session_id=st->setup_session_id;
1427
1428     /* Compute the inter-site MTU.  This is min( our_mtu, their_mtu ).
1429      * But their mtu be unspecified, in which case we just use ours. */
1430     uint32_t intersite_mtu=
1431         MIN(st->mtu_target, st->remote_adv_mtu ?: ~(uint32_t)0);
1432     st->netlink->set_mtu(st->netlink->st,intersite_mtu);
1433
1434     slog(st,LOG_ACTIVATE_KEY,"new key activated"
1435          " (mtu ours=%"PRId32" theirs=%"PRId32" intersite=%"PRId32")",
1436          st->mtu_target, st->remote_adv_mtu, intersite_mtu);
1437     enter_state_run(st);
1438 }
1439
1440 static void delete_one_key(struct site *st, struct data_key *key,
1441                            cstring_t reason, cstring_t which, uint32_t loglevel)
1442 {
1443     if (!is_transform_valid(key->transform)) return;
1444     if (reason) slog(st,loglevel,"%s deleted (%s)",which,reason);
1445     dispose_transform(&key->transform);
1446     key->key_timeout=0;
1447 }
1448
1449 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel)
1450 {
1451     if (current_valid(st)) {
1452         slog(st,loglevel,"session closed (%s)",reason);
1453
1454         delete_one_key(st,&st->current,0,0,0);
1455         set_link_quality(st);
1456     }
1457     delete_one_key(st,&st->auxiliary_key,0,0,0);
1458 }
1459
1460 static void state_assert(struct site *st, bool_t ok)
1461 {
1462     if (!ok) fatal("site:state_assert");
1463 }
1464
1465 static void enter_state_stop(struct site *st)
1466 {
1467     st->state=SITE_STOP;
1468     st->timeout=0;
1469     delete_keys(st,"entering state STOP",LOG_TIMEOUT_KEY);
1470     dispose_transform(&st->new_transform);
1471 }
1472
1473 static void set_link_quality(struct site *st)
1474 {
1475     uint32_t quality;
1476     if (current_valid(st))
1477         quality=LINK_QUALITY_UP;
1478     else if (st->state==SITE_WAIT || st->state==SITE_STOP)
1479         quality=LINK_QUALITY_DOWN;
1480     else if (st->addresses)
1481         quality=LINK_QUALITY_DOWN_CURRENT_ADDRESS;
1482     else if (transport_peers_valid(&st->peers))
1483         quality=LINK_QUALITY_DOWN_STALE_ADDRESS;
1484     else
1485         quality=LINK_QUALITY_DOWN;
1486
1487     st->netlink->set_quality(st->netlink->st,quality);
1488 }
1489
1490 static void enter_state_run(struct site *st)
1491 {
1492     slog(st,LOG_STATE,"entering state RUN%s",
1493          current_valid(st) ? " (keyed)" : " (unkeyed)");
1494     st->state=SITE_RUN;
1495     st->timeout=0;
1496
1497     st->setup_session_id=0;
1498     transport_peers_clear(st,&st->setup_peers);
1499     FILLZERO(st->localN);
1500     FILLZERO(st->remoteN);
1501     dispose_transform(&st->new_transform);
1502     memset(st->dhsecret,0,st->dh->len);
1503     if (st->sharedsecret) memset(st->sharedsecret,0,st->sharedsecretlen);
1504     set_link_quality(st);
1505
1506     if (st->keepalive && !current_valid(st))
1507         initiate_key_setup(st, "keepalive", 0);
1508 }
1509
1510 static bool_t ensure_resolving(struct site *st)
1511 {
1512     /* Reentrancy hazard: may call site_resolve_callback and hence
1513      * enter_new_state, enter_state_* and generate_msg*. */
1514     if (st->resolving_count)
1515         return True;
1516
1517     assert(st->addresses);
1518
1519     /* resolver->request might reentrantly call site_resolve_callback
1520      * which will decrement st->resolving, so we need to increment it
1521      * twice beforehand to prevent decrement from thinking we're
1522      * finished, and decrement it ourselves.  Alternatively if
1523      * everything fails then there are no callbacks due and we simply
1524      * set it to 0 and return false.. */
1525     st->resolving_n_results_stored=0;
1526     st->resolving_n_results_all=0;
1527     st->resolving_count+=2;
1528     const char **addrp=st->addresses;
1529     const char *address;
1530     bool_t anyok=False;
1531     for (; (address=*addrp++); ) {
1532         bool_t ok = st->resolver->request(st->resolver->st,address,
1533                                           st->remoteport,st->comms[0],
1534                                           site_resolve_callback,st);
1535         if (ok)
1536             st->resolving_count++;
1537         anyok|=ok;
1538     }
1539     if (!anyok) {
1540         st->resolving_count=0;
1541         return False;
1542     }
1543     decrement_resolving_count(st,2);
1544     return True;
1545 }
1546
1547 static bool_t enter_state_resolve(struct site *st)
1548 {
1549     /* Reentrancy hazard!  See ensure_resolving. */
1550     state_assert(st,st->state==SITE_RUN);
1551     slog(st,LOG_STATE,"entering state RESOLVE");
1552     st->state=SITE_RESOLVE;
1553     return ensure_resolving(st);
1554 }
1555
1556 static bool_t enter_new_state(struct site *st, uint32_t next)
1557 {
1558     bool_t (*gen)(struct site *st);
1559     int r;
1560
1561     slog(st,LOG_STATE,"entering state %s",state_name(next));
1562     switch(next) {
1563     case SITE_SENTMSG1:
1564         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE);
1565         gen=generate_msg1;
1566         st->msg1_crossed_logged = False;
1567         break;
1568     case SITE_SENTMSG2:
1569         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1570                      st->state==SITE_SENTMSG1 || st->state==SITE_WAIT);
1571         gen=generate_msg2;
1572         break;
1573     case SITE_SENTMSG3:
1574         state_assert(st,st->state==SITE_SENTMSG1);
1575         BUF_FREE(&st->buffer);
1576         gen=generate_msg3;
1577         break;
1578     case SITE_SENTMSG4:
1579         state_assert(st,st->state==SITE_SENTMSG2);
1580         BUF_FREE(&st->buffer);
1581         gen=generate_msg4;
1582         break;
1583     case SITE_SENTMSG5:
1584         state_assert(st,st->state==SITE_SENTMSG3);
1585         BUF_FREE(&st->buffer);
1586         gen=generate_msg5;
1587         break;
1588     case SITE_RUN:
1589         state_assert(st,st->state==SITE_SENTMSG4);
1590         BUF_FREE(&st->buffer);
1591         gen=generate_msg6;
1592         break;
1593     default:
1594         gen=NULL;
1595         fatal("enter_new_state(%s): invalid new state",state_name(next));
1596         break;
1597     }
1598
1599     if (hacky_par_start_failnow()) return False;
1600
1601     r= gen(st) && send_msg(st);
1602
1603     hacky_par_end(&r,
1604                   st->setup_retries, st->setup_retry_interval,
1605                   send_msg, st);
1606     
1607     if (r) {
1608         st->state=next;
1609         if (next==SITE_RUN) {
1610             BUF_FREE(&st->buffer); /* Never reused */
1611             st->timeout=0; /* Never retransmit */
1612             activate_new_key(st);
1613         }
1614         return True;
1615     }
1616     slog(st,LOG_ERROR,"error entering state %s",state_name(next));
1617     st->buffer.free=False; /* Unconditionally use the buffer; it may be
1618                               in either state, and enter_state_wait() will
1619                               do a BUF_FREE() */
1620     enter_state_wait(st);
1621     return False;
1622 }
1623
1624 /* msg7 tells our peer that we're about to forget our key */
1625 static bool_t send_msg7(struct site *st, cstring_t reason)
1626 {
1627     cstring_t transform_err;
1628
1629     if (current_valid(st) && st->buffer.free
1630         && transport_peers_valid(&st->peers)) {
1631         BUF_ALLOC(&st->buffer,"site:MSG7");
1632         buffer_init(&st->buffer,calculate_max_start_pad());
1633         buf_append_uint32(&st->buffer,LABEL_MSG7);
1634         buf_append_string(&st->buffer,reason);
1635         if (call_transform_forwards(st, st->current.transform,
1636                                     &st->buffer, &transform_err))
1637             goto free_out;
1638         buf_prepend_uint32(&st->buffer,LABEL_MSG0);
1639         buf_prepend_uint32(&st->buffer,st->index);
1640         buf_prepend_uint32(&st->buffer,st->current.remote_session_id);
1641         transport_xmit(st,&st->peers,&st->buffer,True);
1642         BUF_FREE(&st->buffer);
1643     free_out:
1644         return True;
1645     }
1646     return False;
1647 }
1648
1649 /* We go into this state if our peer becomes uncommunicative. Similar to
1650    the "stop" state, we forget all session keys for a while, before
1651    re-entering the "run" state. */
1652 static void enter_state_wait(struct site *st)
1653 {
1654     slog(st,LOG_STATE,"entering state WAIT");
1655     st->timeout=st->now+wait_timeout(st);
1656     st->state=SITE_WAIT;
1657     set_link_quality(st);
1658     BUF_FREE(&st->buffer); /* will have had an outgoing packet in it */
1659     /* XXX Erase keys etc. */
1660 }
1661
1662 static void generate_prod(struct site *st, struct buffer_if *buf)
1663 {
1664     buffer_init(buf,0);
1665     buf_append_uint32(buf,0);
1666     buf_append_uint32(buf,0);
1667     buf_append_uint32(buf,LABEL_PROD);
1668     buf_append_string(buf,st->localname);
1669     buf_append_string(buf,st->remotename);
1670 }
1671
1672 static void generate_send_prod(struct site *st,
1673                                const struct comm_addr *source)
1674 {
1675     if (!st->allow_send_prod) return; /* too soon */
1676     if (!(st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1677           st->state==SITE_WAIT)) return; /* we'd ignore peer's MSG1 */
1678
1679     slog(st,LOG_SETUP_INIT,"prodding peer for key exchange");
1680     st->allow_send_prod=0;
1681     generate_prod(st,&st->scratch);
1682     bool_t ok = comm_addr_sendmsg(st, source, &st->scratch);
1683     dump_packet(st,&st->scratch,source,False,ok);
1684 }
1685
1686 static inline void site_settimeout(uint64_t timeout, int *timeout_io)
1687 {
1688     if (timeout) {
1689         int64_t offset=timeout-*now;
1690         if (offset<0) offset=0;
1691         if (offset>INT_MAX) offset=INT_MAX;
1692         if (*timeout_io<0 || offset<*timeout_io)
1693             *timeout_io=offset;
1694     }
1695 }
1696
1697 static int site_beforepoll(void *sst, struct pollfd *fds, int *nfds_io,
1698                            int *timeout_io)
1699 {
1700     struct site *st=sst;
1701
1702     BEFOREPOLL_WANT_FDS(0); /* We don't use any file descriptors */
1703     st->now=*now;
1704
1705     /* Work out when our next timeout is. The earlier of 'timeout' or
1706        'current.key_timeout'. A stored value of '0' indicates no timeout
1707        active. */
1708     site_settimeout(st->timeout, timeout_io);
1709     site_settimeout(st->current.key_timeout, timeout_io);
1710     site_settimeout(st->auxiliary_key.key_timeout, timeout_io);
1711
1712     return 0; /* success */
1713 }
1714
1715 static void check_expiry(struct site *st, struct data_key *key,
1716                          const char *which)
1717 {
1718     if (key->key_timeout && *now>key->key_timeout) {
1719         delete_one_key(st,key,"maximum life exceeded",which,LOG_TIMEOUT_KEY);
1720     }
1721 }
1722
1723 /* NB site_afterpoll will be called before site_beforepoll is ever called */
1724 static void site_afterpoll(void *sst, struct pollfd *fds, int nfds)
1725 {
1726     struct site *st=sst;
1727
1728     st->now=*now;
1729     if (st->timeout && *now>st->timeout) {
1730         st->timeout=0;
1731         if (st->state>=SITE_SENTMSG1 && st->state<=SITE_SENTMSG5) {
1732             if (!hacky_par_start_failnow())
1733                 send_msg(st);
1734         } else if (st->state==SITE_WAIT) {
1735             enter_state_run(st);
1736         } else {
1737             slog(st,LOG_ERROR,"site_afterpoll: unexpected timeout, state=%d",
1738                  st->state);
1739         }
1740     }
1741     check_expiry(st,&st->current,"current key");
1742     check_expiry(st,&st->auxiliary_key,"auxiliary key");
1743 }
1744
1745 /* This function is called by the netlink device to deliver packets
1746    intended for the remote network. The packet is in "raw" wire
1747    format, but is guaranteed to be word-aligned. */
1748 static void site_outgoing(void *sst, struct buffer_if *buf)
1749 {
1750     struct site *st=sst;
1751     cstring_t transform_err;
1752     
1753     if (st->state==SITE_STOP) {
1754         BUF_FREE(buf);
1755         return;
1756     }
1757
1758     st->allow_send_prod=1;
1759
1760     /* In all other states we consider delivering the packet if we have
1761        a valid key and a valid address to send it to. */
1762     if (current_valid(st) && transport_peers_valid(&st->peers)) {
1763         /* Transform it and send it */
1764         if (buf->size>0) {
1765             buf_prepend_uint32(buf,LABEL_MSG9);
1766             if (call_transform_forwards(st, st->current.transform,
1767                                         buf, &transform_err))
1768                 goto free_out;
1769             buf_prepend_uint32(buf,LABEL_MSG0);
1770             buf_prepend_uint32(buf,st->index);
1771             buf_prepend_uint32(buf,st->current.remote_session_id);
1772             transport_xmit(st,&st->peers,buf,False);
1773         }
1774     free_out:
1775         BUF_FREE(buf);
1776         return;
1777     }
1778
1779     slog(st,LOG_DROP,"discarding outgoing packet of size %d",buf->size);
1780     BUF_FREE(buf);
1781     initiate_key_setup(st,"outgoing packet",0);
1782 }
1783
1784 static bool_t named_for_us(struct site *st, const struct buffer_if *buf_in,
1785                            uint32_t type, struct msg *m)
1786     /* For packets which are identified by the local and remote names.
1787      * If it has our name and our peer's name in it it's for us. */
1788 {
1789     struct buffer_if buf[1];
1790     buffer_readonly_clone(buf,buf_in);
1791     return unpick_msg(st,type,buf,m)
1792         && name_matches(&m->remote,st->remotename)
1793         && name_matches(&m->local,st->localname);
1794 }
1795
1796 static bool_t we_have_priority(struct site *st, const struct msg *m) {
1797     if (st->local_capabilities & m->remote_capabilities &
1798         CAPAB_PRIORITY_MOBILE) {
1799         if (st->local_mobile) return True;
1800         if (st-> peer_mobile) return False;
1801     }
1802     return st->our_name_later;
1803 }
1804
1805 static bool_t setup_late_msg_ok(struct site *st, 
1806                                 const struct buffer_if *buf_in,
1807                                 uint32_t msgtype,
1808                                 const struct comm_addr *source) {
1809     /* For setup packets which seem from their type like they are
1810      * late.  Maybe they came via a different path.  All we do is make
1811      * a note of the sending address, iff they look like they are part
1812      * of the current key setup attempt. */
1813     struct msg m;
1814     if (!named_for_us(st,buf_in,msgtype,&m))
1815         /* named_for_us calls unpick_msg which gets the nonces */
1816         return False;
1817     if (!consttime_memeq(m.nR,st->remoteN,NONCELEN) ||
1818         !consttime_memeq(m.nL,st->localN, NONCELEN))
1819         /* spoof ?  from stale run ?  who knows */
1820         return False;
1821     transport_setup_msgok(st,source);
1822     return True;
1823 }
1824
1825 /* This function is called by the communication device to deliver
1826    packets from our peers.
1827    It should return True if the packet is recognised as being for
1828    this current site instance (and should therefore not be processed
1829    by other sites), even if the packet was otherwise ignored. */
1830 static bool_t site_incoming(void *sst, struct buffer_if *buf,
1831                             const struct comm_addr *source)
1832 {
1833     struct site *st=sst;
1834
1835     if (buf->size < 12) return False;
1836
1837     uint32_t dest=get_uint32(buf->start);
1838     uint32_t msgtype=get_uint32(buf->start+8);
1839     struct msg named_msg;
1840
1841     if (msgtype==LABEL_MSG1) {
1842         if (!named_for_us(st,buf,msgtype,&named_msg))
1843             return False;
1844         /* It's a MSG1 addressed to us. Decide what to do about it. */
1845         dump_packet(st,buf,source,True,True);
1846         if (st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1847             st->state==SITE_WAIT) {
1848             /* We should definitely process it */
1849             transport_compute_setupinit_peers(st,0,0,source);
1850             if (process_msg1(st,buf,source,&named_msg)) {
1851                 slog(st,LOG_SETUP_INIT,"key setup initiated by peer");
1852                 bool_t entered=enter_new_state(st,SITE_SENTMSG2);
1853                 if (entered && st->addresses && st->local_mobile)
1854                     /* We must do this as the very last thing, because
1855                        the resolver callback might reenter us. */
1856                     ensure_resolving(st);
1857             } else {
1858                 slog(st,LOG_ERROR,"failed to process incoming msg1");
1859             }
1860             BUF_FREE(buf);
1861             return True;
1862         } else if (st->state==SITE_SENTMSG1) {
1863             /* We've just sent a message 1! They may have crossed on
1864                the wire. If we have priority then we ignore the
1865                incoming one, otherwise we process it as usual. */
1866             if (we_have_priority(st,&named_msg)) {
1867                 BUF_FREE(buf);
1868                 if (!st->msg1_crossed_logged++)
1869                     slog(st,LOG_SETUP_INIT,"crossed msg1s; we are higher "
1870                          "priority => ignore incoming msg1");
1871                 return True;
1872             } else {
1873                 slog(st,LOG_SETUP_INIT,"crossed msg1s; we are lower "
1874                      "priority => use incoming msg1");
1875                 if (process_msg1(st,buf,source,&named_msg)) {
1876                     BUF_FREE(&st->buffer); /* Free our old message 1 */
1877                     transport_setup_msgok(st,source);
1878                     enter_new_state(st,SITE_SENTMSG2);
1879                 } else {
1880                     slog(st,LOG_ERROR,"failed to process an incoming "
1881                          "crossed msg1 (we have low priority)");
1882                 }
1883                 BUF_FREE(buf);
1884                 return True;
1885             }
1886         } else if (st->state==SITE_SENTMSG2 ||
1887                    st->state==SITE_SENTMSG4) {
1888             if (consttime_memeq(named_msg.nR,st->remoteN,NONCELEN)) {
1889                 /* We are ahead in the protocol, but that msg1 had the
1890                  * peer's nonce so presumably it is from this key
1891                  * exchange run, via a slower route */
1892                 transport_setup_msgok(st,source);
1893             } else {
1894                 slog(st,LOG_UNEXPECTED,"competing incoming message 1");
1895             }
1896             BUF_FREE(buf);
1897             return True;
1898         }
1899         /* The message 1 was received at an unexpected stage of the
1900            key setup.  Well, they lost the race. */
1901         slog(st,LOG_UNEXPECTED,"unexpected incoming message 1");
1902         BUF_FREE(buf);
1903         return True;
1904     }
1905     if (msgtype==LABEL_PROD) {
1906         if (!named_for_us(st,buf,msgtype,&named_msg))
1907             return False;
1908         dump_packet(st,buf,source,True,True);
1909         if (st->state!=SITE_RUN) {
1910             slog(st,LOG_DROP,"ignoring PROD when not in state RUN");
1911         } else if (current_valid(st)) {
1912             slog(st,LOG_DROP,"ignoring PROD when we think we have a key");
1913         } else {
1914             initiate_key_setup(st,"peer sent PROD packet",source);
1915         }
1916         BUF_FREE(buf);
1917         return True;
1918     }
1919     if (dest==st->index) {
1920         /* Explicitly addressed to us */
1921         if (msgtype!=LABEL_MSG0) dump_packet(st,buf,source,True,True);
1922         switch (msgtype) {
1923         case LABEL_NAK:
1924             /* If the source is our current peer then initiate a key setup,
1925                because our peer's forgotten the key */
1926             if (get_uint32(buf->start+4)==st->current.remote_session_id) {
1927                 bool_t initiated;
1928                 initiated = initiate_key_setup(st,"received a NAK",source);
1929                 if (!initiated) generate_send_prod(st,source);
1930             } else {
1931                 slog(st,LOG_SEC,"bad incoming NAK");
1932             }
1933             break;
1934         case LABEL_MSG0:
1935             process_msg0(st,buf,source);
1936             break;
1937         case LABEL_MSG1:
1938             /* Setup packet: should not have been explicitly addressed
1939                to us */
1940             slog(st,LOG_SEC,"incoming explicitly addressed msg1");
1941             break;
1942         case LABEL_MSG2:
1943             /* Setup packet: expected only in state SENTMSG1 */
1944             if (st->state!=SITE_SENTMSG1) {
1945                 if ((st->state==SITE_SENTMSG3 ||
1946                      st->state==SITE_SENTMSG5) &&
1947                     setup_late_msg_ok(st,buf,msgtype,source))
1948                     break;
1949                 slog(st,LOG_UNEXPECTED,"unexpected MSG2");
1950             } else if (process_msg2(st,buf,source)) {
1951                 transport_setup_msgok(st,source);
1952                 enter_new_state(st,SITE_SENTMSG3);
1953             } else {
1954                 slog(st,LOG_SEC,"invalid MSG2");
1955             }
1956             break;
1957         case LABEL_MSG3:
1958         case LABEL_MSG3BIS:
1959             /* Setup packet: expected only in state SENTMSG2 */
1960             if (st->state!=SITE_SENTMSG2) {
1961                 if ((st->state==SITE_SENTMSG4) &&
1962                     setup_late_msg_ok(st,buf,msgtype,source))
1963                     break;
1964                 slog(st,LOG_UNEXPECTED,"unexpected MSG3");
1965             } else if (process_msg3(st,buf,source,msgtype)) {
1966                 transport_setup_msgok(st,source);
1967                 enter_new_state(st,SITE_SENTMSG4);
1968             } else {
1969                 slog(st,LOG_SEC,"invalid MSG3");
1970             }
1971             break;
1972         case LABEL_MSG4:
1973             /* Setup packet: expected only in state SENTMSG3 */
1974             if (st->state!=SITE_SENTMSG3) {
1975                 if ((st->state==SITE_SENTMSG5) &&
1976                     setup_late_msg_ok(st,buf,msgtype,source))
1977                     break;
1978                 slog(st,LOG_UNEXPECTED,"unexpected MSG4");
1979             } else if (process_msg4(st,buf,source)) {
1980                 transport_setup_msgok(st,source);
1981                 enter_new_state(st,SITE_SENTMSG5);
1982             } else {
1983                 slog(st,LOG_SEC,"invalid MSG4");
1984             }
1985             break;
1986         case LABEL_MSG5:
1987             /* Setup packet: expected only in state SENTMSG4 */
1988             /* (may turn up in state RUN if our return MSG6 was lost
1989                and the new key has already been activated. In that
1990                case we discard it. The peer will realise that we
1991                are using the new key when they see our data packets.
1992                Until then the peer's data packets to us get discarded. */
1993             if (st->state==SITE_SENTMSG4) {
1994                 if (process_msg5(st,buf,source,st->new_transform)) {
1995                     transport_setup_msgok(st,source);
1996                     enter_new_state(st,SITE_RUN);
1997                 } else {
1998                     slog(st,LOG_SEC,"invalid MSG5");
1999                 }
2000             } else if (st->state==SITE_RUN) {
2001                 if (process_msg5(st,buf,source,st->current.transform)) {
2002                     slog(st,LOG_DROP,"got MSG5, retransmitting MSG6");
2003                     transport_setup_msgok(st,source);
2004                     create_msg6(st,st->current.transform,
2005                                 st->current.remote_session_id);
2006                     transport_xmit(st,&st->peers,&st->buffer,True);
2007                     BUF_FREE(&st->buffer);
2008                 } else {
2009                     slog(st,LOG_SEC,"invalid MSG5 (in state RUN)");
2010                 }
2011             } else {
2012                 slog(st,LOG_UNEXPECTED,"unexpected MSG5");
2013             }
2014             break;
2015         case LABEL_MSG6:
2016             /* Setup packet: expected only in state SENTMSG5 */
2017             if (st->state!=SITE_SENTMSG5) {
2018                 slog(st,LOG_UNEXPECTED,"unexpected MSG6");
2019             } else if (process_msg6(st,buf,source)) {
2020                 BUF_FREE(&st->buffer); /* Free message 5 */
2021                 transport_setup_msgok(st,source);
2022                 activate_new_key(st);
2023             } else {
2024                 slog(st,LOG_SEC,"invalid MSG6");
2025             }
2026             break;
2027         default:
2028             slog(st,LOG_SEC,"received message of unknown type 0x%08x",
2029                  msgtype);
2030             break;
2031         }
2032         BUF_FREE(buf);
2033         return True;
2034     }
2035
2036     return False;
2037 }
2038
2039 static void site_control(void *vst, bool_t run)
2040 {
2041     struct site *st=vst;
2042     if (run) enter_state_run(st);
2043     else enter_state_stop(st);
2044 }
2045
2046 static void site_phase_hook(void *sst, uint32_t newphase)
2047 {
2048     struct site *st=sst;
2049
2050     /* The program is shutting down; tell our peer */
2051     send_msg7(st,"shutting down");
2052 }
2053
2054 static void site_childpersist_clearkeys(void *sst, uint32_t newphase)
2055 {
2056     struct site *st=sst;
2057     dispose_transform(&st->current.transform);
2058     dispose_transform(&st->auxiliary_key.transform);
2059     dispose_transform(&st->new_transform);
2060     /* Not much point overwiting the signing key, since we loaded it
2061        from disk, and it is only valid prospectively if at all,
2062        anyway. */
2063     /* XXX it would be best to overwrite the DH state, because that
2064        _is_ relevant to forward secrecy.  However we have no
2065        convenient interface for doing that and in practice gmp has
2066        probably dribbled droppings all over the malloc arena.  A good
2067        way to fix this would be to have a privsep child for asymmetric
2068        crypto operations, but that's a task for another day. */
2069 }
2070
2071 static list_t *site_apply(closure_t *self, struct cloc loc, dict_t *context,
2072                           list_t *args)
2073 {
2074     static uint32_t index_sequence;
2075     struct site *st;
2076     item_t *item;
2077     dict_t *dict;
2078     int i;
2079
2080     NEW(st);
2081
2082     st->cl.description="site";
2083     st->cl.type=CL_SITE;
2084     st->cl.apply=NULL;
2085     st->cl.interface=&st->ops;
2086     st->ops.st=st;
2087     st->ops.control=site_control;
2088     st->ops.status=site_status;
2089
2090     /* First parameter must be a dict */
2091     item=list_elem(args,0);
2092     if (!item || item->type!=t_dict)
2093         cfgfatal(loc,"site","parameter must be a dictionary\n");
2094     
2095     dict=item->data.dict;
2096     st->localname=dict_read_string(dict, "local-name", True, "site", loc);
2097     st->remotename=dict_read_string(dict, "name", True, "site", loc);
2098
2099     st->keepalive=dict_read_bool(dict,"keepalive",False,"site",loc,False);
2100
2101     st->peer_mobile=dict_read_bool(dict,"mobile",False,"site",loc,False);
2102     st->local_mobile=
2103         dict_read_bool(dict,"local-mobile",False,"site",loc,False);
2104
2105     /* Sanity check (which also allows the 'sites' file to include
2106        site() closures for all sites including our own): refuse to
2107        talk to ourselves */
2108     if (strcmp(st->localname,st->remotename)==0) {
2109         Message(M_DEBUG,"site %s: local-name==name -> ignoring this site\n",
2110                 st->localname);
2111         if (st->peer_mobile != st->local_mobile)
2112             cfgfatal(loc,"site","site %s's peer-mobile=%d"
2113                     " but our local-mobile=%d\n",
2114                     st->localname, st->peer_mobile, st->local_mobile);
2115         free(st);
2116         return NULL;
2117     }
2118     if (st->peer_mobile && st->local_mobile) {
2119         Message(M_WARNING,"site %s: site is mobile but so are we"
2120                 " -> ignoring this site\n", st->remotename);
2121         free(st);
2122         return NULL;
2123     }
2124
2125     assert(index_sequence < 0xffffffffUL);
2126     st->index = ++index_sequence;
2127     st->local_capabilities = 0;
2128     st->netlink=find_cl_if(dict,"link",CL_NETLINK,True,"site",loc);
2129
2130 #define GET_CLOSURE_LIST(dictkey,things,nthings,CL_TYPE) do{            \
2131     list_t *things##_cfg=dict_lookup(dict,dictkey);                     \
2132     if (!things##_cfg)                                                  \
2133         cfgfatal(loc,"site","closure list \"%s\" not found\n",dictkey); \
2134     st->nthings=list_length(things##_cfg);                              \
2135     NEW_ARY(st->things,st->nthings);                                    \
2136     assert(st->nthings);                                                \
2137     for (i=0; i<st->nthings; i++) {                                     \
2138         item_t *item=list_elem(things##_cfg,i);                         \
2139         if (item->type!=t_closure)                                      \
2140             cfgfatal(loc,"site","%s is not a closure\n",dictkey);       \
2141         closure_t *cl=item->data.closure;                               \
2142         if (cl->type!=CL_TYPE)                                          \
2143             cfgfatal(loc,"site","%s closure wrong type\n",dictkey);     \
2144         st->things[i]=cl->interface;                                    \
2145     }                                                                   \
2146 }while(0)
2147
2148     GET_CLOSURE_LIST("comm",comms,ncomms,CL_COMM);
2149
2150     NEW_ARY(st->commclientinfos, st->ncomms);
2151     dict_t *comminfo = dict_read_dict(dict,"comm-info",False,"site",loc);
2152     for (i=0; i<st->ncomms; i++) {
2153         st->commclientinfos[i] =
2154             !comminfo ? 0 :
2155             st->comms[i]->clientinfo(st->comms[i],comminfo,loc);
2156     }
2157
2158     st->resolver=find_cl_if(dict,"resolver",CL_RESOLVER,True,"site",loc);
2159     st->log=find_cl_if(dict,"log",CL_LOG,True,"site",loc);
2160     st->random=find_cl_if(dict,"random",CL_RANDOMSRC,True,"site",loc);
2161
2162     st->privkey=find_cl_if(dict,"local-key",CL_RSAPRIVKEY,True,"site",loc);
2163     st->addresses=dict_read_string_array(dict,"address",False,"site",loc,0);
2164     if (st->addresses)
2165         st->remoteport=dict_read_number(dict,"port",True,"site",loc,0);
2166     else st->remoteport=0;
2167     st->pubkey=find_cl_if(dict,"key",CL_RSAPUBKEY,True,"site",loc);
2168
2169     GET_CLOSURE_LIST("transform",transforms,ntransforms,CL_TRANSFORM);
2170
2171     st->dh=find_cl_if(dict,"dh",CL_DH,True,"site",loc);
2172     st->hash=find_cl_if(dict,"hash",CL_HASH,True,"site",loc);
2173
2174 #define DEFAULT(D) (st->peer_mobile || st->local_mobile \
2175                     ? DEFAULT_MOBILE_##D : DEFAULT_##D)
2176 #define CFG_NUMBER(k,D) dict_read_number(dict,(k),False,"site",loc,DEFAULT(D));
2177
2178     st->key_lifetime=         CFG_NUMBER("key-lifetime",  KEY_LIFETIME);
2179     st->setup_retries=        CFG_NUMBER("setup-retries", SETUP_RETRIES);
2180     st->setup_retry_interval= CFG_NUMBER("setup-timeout", SETUP_RETRY_INTERVAL);
2181     st->wait_timeout_mean=    CFG_NUMBER("wait-time",     WAIT_TIME);
2182     st->mtu_target= dict_read_number(dict,"mtu-target",False,"site",loc,0);
2183
2184     st->mobile_peer_expiry= dict_read_number(
2185        dict,"mobile-peer-expiry",False,"site",loc,DEFAULT_MOBILE_PEER_EXPIRY);
2186
2187     const char *peerskey= st->peer_mobile
2188         ? "mobile-peers-max" : "static-peers-max";
2189     st->transport_peers_max= dict_read_number(
2190         dict,peerskey,False,"site",loc, st->addresses ? 4 : 3);
2191     if (st->transport_peers_max<1 ||
2192         st->transport_peers_max>MAX_PEER_ADDRS) {
2193         cfgfatal(loc,"site", "%s must be in range 1.."
2194                  STRING(MAX_PEER_ADDRS) "\n", peerskey);
2195     }
2196
2197     if (st->key_lifetime < DEFAULT(KEY_RENEGOTIATE_GAP)*2)
2198         st->key_renegotiate_time=st->key_lifetime/2;
2199     else
2200         st->key_renegotiate_time=st->key_lifetime-DEFAULT(KEY_RENEGOTIATE_GAP);
2201     st->key_renegotiate_time=dict_read_number(
2202         dict,"renegotiate-time",False,"site",loc,st->key_renegotiate_time);
2203     if (st->key_renegotiate_time > st->key_lifetime) {
2204         cfgfatal(loc,"site",
2205                  "renegotiate-time must be less than key-lifetime\n");
2206     }
2207
2208     st->log_events=string_list_to_word(dict_lookup(dict,"log-events"),
2209                                        log_event_table,"site");
2210
2211     st->resolving_count=0;
2212     st->allow_send_prod=0;
2213
2214     st->tunname=safe_malloc(strlen(st->localname)+strlen(st->remotename)+5,
2215                             "site_apply");
2216     sprintf(st->tunname,"%s<->%s",st->localname,st->remotename);
2217
2218     /* The information we expect to see in incoming messages of type 1 */
2219     /* fixme: lots of unchecked overflows here, but the results are only
2220        corrupted packets rather than undefined behaviour */
2221     st->our_name_later=(strcmp(st->localname,st->remotename)>0);
2222
2223     buffer_new(&st->buffer,SETUP_BUFFER_LEN);
2224
2225     buffer_new(&st->scratch,SETUP_BUFFER_LEN);
2226     BUF_ALLOC(&st->scratch,"site:scratch");
2227
2228     /* We are interested in poll(), but only for timeouts. We don't have
2229        any fds of our own. */
2230     register_for_poll(st, site_beforepoll, site_afterpoll, "site");
2231     st->timeout=0;
2232
2233     st->remote_capabilities=0;
2234     st->chosen_transform=0;
2235     st->current.key_timeout=0;
2236     st->auxiliary_key.key_timeout=0;
2237     transport_peers_clear(st,&st->peers);
2238     transport_peers_clear(st,&st->setup_peers);
2239     /* XXX mlock these */
2240     st->dhsecret=safe_malloc(st->dh->len,"site:dhsecret");
2241     st->sharedsecretlen=st->sharedsecretallocd=0;
2242     st->sharedsecret=0;
2243
2244 #define SET_CAPBIT(bit) do {                                            \
2245     uint32_t capflag = 1UL << (bit);                                    \
2246     if (st->local_capabilities & capflag)                               \
2247         slog(st,LOG_ERROR,"capability bit"                              \
2248              " %d (%#"PRIx32") reused", (bit), capflag);                \
2249     st->local_capabilities |= capflag;                                  \
2250 } while (0)
2251
2252     for (i=0; i<st->ntransforms; i++)
2253         SET_CAPBIT(st->transforms[i]->capab_bit);
2254
2255 #undef SET_CAPBIT
2256
2257     if (st->local_mobile || st->peer_mobile)
2258         st->local_capabilities |= CAPAB_PRIORITY_MOBILE;
2259
2260     /* We need to register the remote networks with the netlink device */
2261     uint32_t netlink_mtu; /* local virtual interface mtu */
2262     st->netlink->reg(st->netlink->st, site_outgoing, st, &netlink_mtu);
2263     if (!st->mtu_target)
2264         st->mtu_target=netlink_mtu;
2265     
2266     for (i=0; i<st->ncomms; i++)
2267         st->comms[i]->request_notify(st->comms[i]->st, st, site_incoming);
2268
2269     st->current.transform=0;
2270     st->auxiliary_key.transform=0;
2271     st->new_transform=0;
2272     st->auxiliary_is_new=0;
2273
2274     enter_state_stop(st);
2275
2276     add_hook(PHASE_SHUTDOWN,site_phase_hook,st);
2277     add_hook(PHASE_CHILDPERSIST,site_childpersist_clearkeys,st);
2278
2279     return new_closure(&st->cl);
2280 }
2281
2282 void site_module(dict_t *dict)
2283 {
2284     add_closure(dict,"site",site_apply);
2285 }
2286
2287
2288 /***** TRANSPORT PEERS definitions *****/
2289
2290 static void transport_peers_debug(struct site *st, transport_peers *dst,
2291                                   const char *didwhat,
2292                                   int nargs, const struct comm_addr *args,
2293                                   size_t stride) {
2294     int i;
2295     char *argp;
2296
2297     if (!(st->log_events & LOG_PEER_ADDRS))
2298         return; /* an optimisation */
2299
2300     slog(st, LOG_PEER_ADDRS, "peers (%s) %s nargs=%d => npeers=%d",
2301          (dst==&st->peers ? "data" :
2302           dst==&st->setup_peers ? "setup" : "UNKNOWN"),
2303          didwhat, nargs, dst->npeers);
2304
2305     for (i=0, argp=(void*)args;
2306          i<nargs;
2307          i++, (argp+=stride?stride:sizeof(*args))) {
2308         const struct comm_addr *ca=(void*)argp;
2309         slog(st, LOG_PEER_ADDRS, " args: addrs[%d]=%s",
2310              i, comm_addr_to_string(ca));
2311     }
2312     for (i=0; i<dst->npeers; i++) {
2313         struct timeval diff;
2314         timersub(tv_now,&dst->peers[i].last,&diff);
2315         const struct comm_addr *ca=&dst->peers[i].addr;
2316         slog(st, LOG_PEER_ADDRS, " peers: addrs[%d]=%s T-%ld.%06ld",
2317              i, comm_addr_to_string(ca),
2318              (unsigned long)diff.tv_sec, (unsigned long)diff.tv_usec);
2319     }
2320 }
2321
2322 static void transport_peers_expire(struct site *st, transport_peers *peers) {
2323     /* peers must be sorted first */
2324     int previous_peers=peers->npeers;
2325     struct timeval oldest;
2326     oldest.tv_sec  = tv_now->tv_sec - st->mobile_peer_expiry;
2327     oldest.tv_usec = tv_now->tv_usec;
2328     while (peers->npeers>1 &&
2329            timercmp(&peers->peers[peers->npeers-1].last, &oldest, <))
2330         peers->npeers--;
2331     if (peers->npeers != previous_peers)
2332         transport_peers_debug(st,peers,"expire", 0,0,0);
2333 }
2334
2335 static bool_t transport_peer_record_one(struct site *st, transport_peers *peers,
2336                                         const struct comm_addr *ca,
2337                                         const struct timeval *tv) {
2338     /* returns false if output is full */
2339     int search;
2340
2341     if (peers->npeers >= st->transport_peers_max)
2342         return 0;
2343
2344     for (search=0; search<peers->npeers; search++)
2345         if (comm_addr_equal(&peers->peers[search].addr, ca))
2346             return 1;
2347
2348     peers->peers[peers->npeers].addr = *ca;
2349     peers->peers[peers->npeers].last = *tv;
2350     peers->npeers++;
2351     return 1;
2352 }
2353
2354 static void transport_record_peers(struct site *st, transport_peers *peers,
2355                                    const struct comm_addr *addrs, int naddrs,
2356                                    const char *m) {
2357     /* We add addrs into peers.  The new entries end up at the front
2358      * and displace entries towards the end (perhaps even off the
2359      * end).  Any existing matching entries are moved up to the front.
2360      *
2361      * Caller must first call transport_peers_expire. */
2362
2363     if (naddrs==1) {
2364         /* avoids debug for uninteresting updates */
2365         int i;
2366         for (i=0; i<peers->npeers; i++) {
2367             if (comm_addr_equal(&addrs[0], &peers->peers[i].addr)) {
2368                 memmove(peers->peers+1, peers->peers,
2369                         sizeof(peers->peers[0]) * i);
2370                 peers->peers[0].addr = addrs[0];
2371                 peers->peers[0].last = *tv_now;
2372                 return;
2373             }
2374         }
2375     }
2376
2377     int old_npeers=peers->npeers;
2378     transport_peer old_peers[old_npeers];
2379     COPY_ARRAY(old_peers,peers->peers,old_npeers);
2380
2381     peers->npeers=0;
2382     int i;
2383     for (i=0; i<naddrs; i++) {
2384         if (!transport_peer_record_one(st,peers, &addrs[i], tv_now))
2385             break;
2386     }
2387     for (i=0; i<old_npeers; i++) {
2388         const transport_peer *old=&old_peers[i];
2389         if (!transport_peer_record_one(st,peers, &old->addr, &old->last))
2390             break;
2391     }
2392
2393     transport_peers_debug(st,peers,m, naddrs,addrs,0);
2394 }
2395
2396 static void transport_expire_record_peers(struct site *st,
2397                                           transport_peers *peers,
2398                                           const struct comm_addr *addrs,
2399                                           int naddrs, const char *m) {
2400     /* Convenience function */
2401     transport_peers_expire(st,peers);
2402     transport_record_peers(st,peers,addrs,naddrs,m);
2403 }
2404
2405 static bool_t transport_compute_setupinit_peers(struct site *st,
2406         const struct comm_addr *configured_addrs /* 0 if none or not found */,
2407         int n_configured_addrs /* 0 if none or not found */,
2408         const struct comm_addr *incoming_packet_addr /* 0 if none */) {
2409     if (!n_configured_addrs && !incoming_packet_addr &&
2410         !transport_peers_valid(&st->peers))
2411         return False;
2412
2413     slog(st,LOG_SETUP_INIT,
2414          "using: %d configured addr(s);%s %d old peer addrs(es)",
2415          n_configured_addrs,
2416          incoming_packet_addr ? " incoming packet address;" : "",
2417          st->peers.npeers);
2418
2419     /* Non-mobile peers try addresses until one is plausible.  The
2420      * effect is that this code always tries first the configured
2421      * address if supplied, or otherwise the address of the incoming
2422      * PROD, or finally the existing data peer if one exists; this is
2423      * as desired. */
2424
2425     transport_peers_copy(st,&st->setup_peers,&st->peers);
2426     transport_peers_expire(st,&st->setup_peers);
2427
2428     if (incoming_packet_addr)
2429         transport_record_peers(st,&st->setup_peers,
2430                                incoming_packet_addr,1, "incoming");
2431
2432     if (n_configured_addrs)
2433         transport_record_peers(st,&st->setup_peers,
2434                               configured_addrs,n_configured_addrs, "setupinit");
2435
2436     assert(transport_peers_valid(&st->setup_peers));
2437     return True;
2438 }
2439
2440 static void transport_setup_msgok(struct site *st, const struct comm_addr *a) {
2441     if (st->peer_mobile)
2442         transport_expire_record_peers(st,&st->setup_peers,a,1,"setupmsg");
2443 }
2444 static void transport_data_msgok(struct site *st, const struct comm_addr *a) {
2445     if (st->peer_mobile)
2446         transport_expire_record_peers(st,&st->peers,a,1,"datamsg");
2447 }
2448
2449 static int transport_peers_valid(transport_peers *peers) {
2450     return peers->npeers;
2451 }
2452 static void transport_peers_clear(struct site *st, transport_peers *peers) {
2453     peers->npeers= 0;
2454     transport_peers_debug(st,peers,"clear",0,0,0);
2455 }
2456 static void transport_peers_copy(struct site *st, transport_peers *dst,
2457                                  const transport_peers *src) {
2458     dst->npeers=src->npeers;
2459     COPY_ARRAY(dst->peers, src->peers, dst->npeers);
2460     transport_peers_debug(st,dst,"copy",
2461                           src->npeers, &src->peers->addr, sizeof(*src->peers));
2462 }
2463
2464 static void transport_resolve_complete(struct site *st,
2465                                        const struct comm_addr *addrs,
2466                                        int naddrs) {
2467     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2468                                   "resolved data");
2469     transport_expire_record_peers(st,&st->setup_peers,addrs,naddrs,
2470                                   "resolved setup");
2471 }
2472
2473 static void transport_resolve_complete_tardy(struct site *st,
2474                                              const struct comm_addr *addrs,
2475                                              int naddrs) {
2476     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2477                                   "resolved tardily");
2478 }
2479
2480 static void transport_peers__copy_by_mask(transport_peer *out, int *nout_io,
2481                                           unsigned mask,
2482                                           const transport_peers *inp) {
2483     /* out and in->peers may be the same region, or nonoverlapping */
2484     const transport_peer *in=inp->peers;
2485     int slot;
2486     for (slot=0; slot<inp->npeers; slot++) {
2487         if (!(mask & (1U << slot)))
2488             continue;
2489         if (!(out==in && slot==*nout_io))
2490             COPY_OBJ(out[*nout_io], in[slot]);
2491         (*nout_io)++;
2492     }
2493 }
2494
2495 void transport_xmit(struct site *st, transport_peers *peers,
2496                     struct buffer_if *buf, bool_t candebug) {
2497     int slot;
2498     transport_peers_expire(st, peers);
2499     unsigned failed=0; /* bitmask */
2500     assert(MAX_PEER_ADDRS < sizeof(unsigned)*CHAR_BIT);
2501
2502     int nfailed=0;
2503     for (slot=0; slot<peers->npeers; slot++) {
2504         transport_peer *peer=&peers->peers[slot];
2505         bool_t ok = comm_addr_sendmsg(st, &peer->addr, buf);
2506         if (candebug)
2507             dump_packet(st, buf, &peer->addr, False, ok);
2508         if (!ok) {
2509             failed |= 1U << slot;
2510             nfailed++;
2511         }
2512         if (ok && !st->peer_mobile)
2513             break;
2514     }
2515     /* Now we need to demote/delete failing addrs: if we are mobile we
2516      * merely demote them; otherwise we delete them. */
2517     if (st->local_mobile) {
2518         unsigned expected = ((1U << nfailed)-1) << (peers->npeers-nfailed);
2519         /* `expected' has all the failures at the end already */
2520         if (failed != expected) {
2521             int fslot=0;
2522             transport_peer failedpeers[nfailed];
2523             transport_peers__copy_by_mask(failedpeers, &fslot, failed,peers);
2524             assert(fslot == nfailed);
2525             int wslot=0;
2526             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2527             assert(wslot+nfailed == peers->npeers);
2528             COPY_ARRAY(peers->peers+wslot, failedpeers, nfailed);
2529             transport_peers_debug(st,peers,"mobile failure reorder",0,0,0);
2530         }
2531     } else {
2532         if (failed && peers->npeers > 1) {
2533             int wslot=0;
2534             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2535             peers->npeers=wslot;
2536             transport_peers_debug(st,peers,"non-mobile failure cleanup",0,0,0);
2537         }
2538     }
2539 }
2540
2541 /***** END of transport peers declarations *****/