chiark / gitweb /
dh.c, secnet.8: Allow `diffie-hellman' to take a dictionary of arguments.
[secnet] / site.c
1 /* site.c - manage communication with a remote network site */
2
3 /*
4  * This file is part of secnet.
5  * See README for full list of copyright holders.
6  *
7  * secnet is free software; you can redistribute it and/or modify it
8  * under the terms of the GNU General Public License as published by
9  * the Free Software Foundation; either version 3 of the License, or
10  * (at your option) any later version.
11  * 
12  * secnet is distributed in the hope that it will be useful, but
13  * WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15  * General Public License for more details.
16  * 
17  * You should have received a copy of the GNU General Public License
18  * version 3 along with secnet; if not, see
19  * https://www.gnu.org/licenses/gpl.html.
20  */
21
22 /* The 'site' code doesn't know anything about the structure of the
23    packets it's transmitting.  In fact, under the new netlink
24    configuration scheme it doesn't need to know anything at all about
25    IP addresses, except how to contact its peer.  This means it could
26    potentially be used to tunnel other protocols too (IPv6, IPX, plain
27    old Ethernet frames) if appropriate netlink code can be written
28    (and that ought not to be too hard, eg. using the TUN/TAP device to
29    pretend to be an Ethernet interface).  */
30
31 /* At some point in the future the netlink code will be asked for
32    configuration information to go in the PING/PONG packets at the end
33    of the key exchange. */
34
35 #include "secnet.h"
36 #include <stdio.h>
37 #include <string.h>
38 #include <limits.h>
39 #include <assert.h>
40 #include <sys/socket.h>
41
42 #include <sys/mman.h>
43 #include "util.h"
44 #include "unaligned.h"
45 #include "magic.h"
46
47 #define SETUP_BUFFER_LEN 2048
48
49 #define DEFAULT_KEY_LIFETIME                  (3600*1000) /* [ms] */
50 #define DEFAULT_KEY_RENEGOTIATE_GAP           (5*60*1000) /* [ms] */
51 #define DEFAULT_SETUP_RETRIES 5
52 #define DEFAULT_SETUP_RETRY_INTERVAL             (2*1000) /* [ms] */
53 #define DEFAULT_WAIT_TIME                       (20*1000) /* [ms] */
54
55 #define DEFAULT_MOBILE_KEY_LIFETIME      (2*24*3600*1000) /* [ms] */
56 #define DEFAULT_MOBILE_KEY_RENEGOTIATE_GAP (12*3600*1000) /* [ms] */
57 #define DEFAULT_MOBILE_SETUP_RETRIES 30
58 #define DEFAULT_MOBILE_SETUP_RETRY_INTERVAL      (1*1000) /* [ms] */
59 #define DEFAULT_MOBILE_WAIT_TIME                (10*1000) /* [ms] */
60
61 #define DEFAULT_MOBILE_PEER_EXPIRY            (2*60)      /* [s] */
62
63 /* Each site can be in one of several possible states. */
64
65 /* States:
66    SITE_STOP         - nothing is allowed to happen; tunnel is down;
67                        all session keys have been erased
68      -> SITE_RUN upon external instruction
69    SITE_RUN          - site up, maybe with valid key
70      -> SITE_RESOLVE upon outgoing packet and no valid key
71          we start name resolution for the other end of the tunnel
72      -> SITE_SENTMSG2 upon valid incoming message 1 and suitable time
73          we send an appropriate message 2
74    SITE_RESOLVE      - waiting for name resolution
75      -> SITE_SENTMSG1 upon successful resolution
76          we send an appropriate message 1
77      -> SITE_SENTMSG2 upon valid incoming message 1 (then abort resolution)
78          we abort resolution and 
79      -> SITE_WAIT on timeout or resolution failure
80    SITE_SENTMSG1
81      -> SITE_SENTMSG2 upon valid incoming message 1 from higher priority end
82      -> SITE_SENTMSG3 upon valid incoming message 2
83      -> SITE_WAIT on timeout
84    SITE_SENTMSG2
85      -> SITE_SENTMSG4 upon valid incoming message 3
86      -> SITE_WAIT on timeout
87    SITE_SENTMSG3
88      -> SITE_SENTMSG5 upon valid incoming message 4
89      -> SITE_WAIT on timeout
90    SITE_SENTMSG4
91      -> SITE_RUN upon valid incoming message 5
92      -> SITE_WAIT on timeout
93    SITE_SENTMSG5
94      -> SITE_RUN upon valid incoming message 6
95      -> SITE_WAIT on timeout
96    SITE_WAIT         - failed to establish key; do nothing for a while
97      -> SITE_RUN on timeout
98    */
99
100 #define SITE_STOP     0
101 #define SITE_RUN      1
102 #define SITE_RESOLVE  2
103 #define SITE_SENTMSG1 3
104 #define SITE_SENTMSG2 4
105 #define SITE_SENTMSG3 5
106 #define SITE_SENTMSG4 6
107 #define SITE_SENTMSG5 7
108 #define SITE_WAIT     8
109
110 #define CASES_MSG3_KNOWN LABEL_MSG3: case LABEL_MSG3BIS
111
112 int32_t site_max_start_pad = 4*4;
113
114 static cstring_t state_name(uint32_t state)
115 {
116     switch (state) {
117     case 0: return "STOP";
118     case 1: return "RUN";
119     case 2: return "RESOLVE";
120     case 3: return "SENTMSG1";
121     case 4: return "SENTMSG2";
122     case 5: return "SENTMSG3";
123     case 6: return "SENTMSG4";
124     case 7: return "SENTMSG5";
125     case 8: return "WAIT";
126     default: return "*bad state*";
127     }
128 }
129
130 #define NONCELEN 8
131
132 #define LOG_UNEXPECTED    0x00000001
133 #define LOG_SETUP_INIT    0x00000002
134 #define LOG_SETUP_TIMEOUT 0x00000004
135 #define LOG_ACTIVATE_KEY  0x00000008
136 #define LOG_TIMEOUT_KEY   0x00000010
137 #define LOG_SEC           0x00000020
138 #define LOG_STATE         0x00000040
139 #define LOG_DROP          0x00000080
140 #define LOG_DUMP          0x00000100
141 #define LOG_ERROR         0x00000400
142 #define LOG_PEER_ADDRS    0x00000800
143
144 static struct flagstr log_event_table[]={
145     { "unexpected", LOG_UNEXPECTED },
146     { "setup-init", LOG_SETUP_INIT },
147     { "setup-timeout", LOG_SETUP_TIMEOUT },
148     { "activate-key", LOG_ACTIVATE_KEY },
149     { "timeout-key", LOG_TIMEOUT_KEY },
150     { "security", LOG_SEC },
151     { "state-change", LOG_STATE },
152     { "packet-drop", LOG_DROP },
153     { "dump-packets", LOG_DUMP },
154     { "errors", LOG_ERROR },
155     { "peer-addrs", LOG_PEER_ADDRS },
156     { "default", LOG_SETUP_INIT|LOG_SETUP_TIMEOUT|
157       LOG_ACTIVATE_KEY|LOG_TIMEOUT_KEY|LOG_SEC|LOG_ERROR },
158     { "all", 0xffffffff },
159     { NULL, 0 }
160 };
161
162
163 /***** TRANSPORT PEERS declarations *****/
164
165 /* Details of "mobile peer" semantics:
166
167    - We use the same data structure for the different configurations,
168      but manage it with different algorithms.
169    
170    - We record up to mobile_peers_max peer address/port numbers
171      ("peers") for key setup, and separately up to mobile_peers_max
172      for data transfer.
173
174    - In general, we make a new set of addrs (see below) when we start
175      a new key exchange; the key setup addrs become the data transport
176      addrs when key setup complets.
177
178    If our peer is mobile:
179
180    - We send to all recent addresses of incoming packets, plus
181      initially all configured addresses (which we also expire).
182
183    - So, we record addrs of good incoming packets, as follows:
184       1. expire any peers last seen >120s ("mobile-peer-expiry") ago
185       2. add the peer of the just received packet to the applicable list
186          (possibly evicting the oldest entries to make room)
187      NB that we do not expire peers until an incoming packet arrives.
188
189    - If the peer has a configured address or name, we record them the
190      same way, but only as a result of our own initiation of key
191      setup.  (We might evict some incoming packet addrs to make room.)
192
193    - The default number of addrs to keep is 3, or 4 if we have a
194      configured name or address.  That's space for two configured
195      addresses (one IPv6 and one IPv4), plus two received addresses.
196
197    - Outgoing packets are sent to every recorded address in the
198      applicable list.  Any unsupported[1] addresses are deleted from
199      the list right away.  (This should only happen to configured
200      addresses, of course, but there is no need to check that.)
201
202    - When we successfully complete a key setup, we merge the key setup
203      peers into the data transfer peers.
204
205    [1] An unsupported address is one for whose AF we don't have a
206      socket (perhaps because we got EAFNOSUPPORT or some such) or for
207      which sendto gives ENETUNREACH.
208
209    If neither end is mobile:
210
211    - When peer initiated the key exchange, we use the incoming packet
212      address.
213
214    - When we initiate the key exchange, we try configured addresses
215      until we get one which isn't unsupported then fixate on that.
216
217    - When we complete a key setup, we replace the data transport peers
218      with those from the key setup.
219
220    If we are mobile:
221
222    - We can't tell when local network setup changes so we can't cache
223      the unsupported addrs and completely remove the spurious calls to
224      sendto, but we can optimise things a bit by deprioritising addrs
225      which seem to be unsupported.
226
227    - Use only configured addresses.  (Except, that if our peer
228      initiated a key exchange we use the incoming packet address until
229      our name resolution completes.)
230
231    - When we send a packet, try each address in turn; if addr
232      supported, put that address to the end of the list for future
233      packets, and go onto the next address.
234
235    - When we complete a key setup, we replace the data transport peers
236      with those from the key setup.
237
238    */
239
240 typedef struct {
241     struct timeval last;
242     struct comm_addr addr;
243 } transport_peer;
244
245 typedef struct {
246 /* configuration information */
247 /* runtime information */
248     int npeers;
249     transport_peer peers[MAX_PEER_ADDRS];
250 } transport_peers;
251
252 /* Basic operations on transport peer address sets */
253 static void transport_peers_clear(struct site *st, transport_peers *peers);
254 static int transport_peers_valid(transport_peers *peers);
255 static void transport_peers_copy(struct site *st, transport_peers *dst,
256                                  const transport_peers *src);
257
258 /* Record address of incoming setup packet; resp. data packet. */
259 static void transport_setup_msgok(struct site *st, const struct comm_addr *a);
260 static void transport_data_msgok(struct site *st, const struct comm_addr *a);
261
262 /* Initialise the setup addresses.  Called before we send the first
263  * packet in a key exchange.  If we are the initiator, as a result of
264  * resolve completing (or being determined not to be relevant) or an
265  * incoming PROD; if we are the responder, as a result of the MSG1. */
266 static bool_t transport_compute_setupinit_peers(struct site *st,
267         const struct comm_addr *configured_addrs /* 0 if none or not found */,
268         int n_configured_addrs /* 0 if none or not found */,
269         const struct comm_addr *incoming_packet_addr /* 0 if none */);
270
271 /* Called if we are the responder in a key setup, when the resolve
272  * completes.  transport_compute_setupinit_peers will hvae been called
273  * earlier.  If _complete is called, we are still doing the key setup
274  * (and we should use the new values for both the rest of the key
275  * setup and the ongoing data exchange); if _tardy is called, the key
276  * setup is done (either completed or not) and only the data peers are
277  * relevant */
278 static void transport_resolve_complete(struct site *st,
279         const struct comm_addr *addrs, int naddrs);
280 static void transport_resolve_complete_tardy(struct site *st,
281         const struct comm_addr *addrs, int naddrs);
282
283 static void transport_xmit(struct site *st, transport_peers *peers,
284                            struct buffer_if *buf, bool_t candebug);
285
286  /***** END of transport peers declarations *****/
287
288
289 struct data_key {
290     struct transform_inst_if *transform;
291     uint64_t key_timeout; /* End of life of current key */
292     uint32_t remote_session_id;
293 };
294
295 struct site {
296     closure_t cl;
297     struct site_if ops;
298 /* configuration information */
299     string_t localname;
300     string_t remotename;
301     bool_t keepalive;
302     bool_t local_mobile, peer_mobile; /* Mobile client support */
303     int32_t transport_peers_max;
304     string_t tunname; /* localname<->remotename by default, used in logs */
305     cstring_t *addresses; /* DNS name or address(es) for bootstrapping, optional */
306     int remoteport; /* Port for bootstrapping, optional */
307     uint32_t mtu_target;
308     struct netlink_if *netlink;
309     struct comm_if **comms;
310     struct comm_clientinfo **commclientinfos;
311     int ncomms;
312     struct resolver_if *resolver;
313     struct log_if *log;
314     struct random_if *random;
315     struct rsaprivkey_if *privkey;
316     struct rsapubkey_if *pubkey;
317     struct transform_if **transforms;
318     int ntransforms;
319     struct dh_if *dh;
320     struct hash_if *hash;
321
322     uint32_t index; /* Index of this site */
323     uint32_t early_capabilities;
324     uint32_t local_capabilities;
325     int32_t setup_retries; /* How many times to send setup packets */
326     int32_t setup_retry_interval; /* Initial timeout for setup packets */
327     int32_t wait_timeout_mean; /* How long to wait if setup unsuccessful */
328     int32_t mobile_peer_expiry; /* How long to remember 2ary addresses */
329     int32_t key_lifetime; /* How long a key lasts once set up */
330     int32_t key_renegotiate_time; /* If we see traffic (or a keepalive)
331                                       after this time, initiate a new
332                                       key exchange */
333
334     bool_t our_name_later; /* our name > peer name */
335     uint32_t log_events;
336
337 /* runtime information */
338     uint32_t state;
339     uint64_t now; /* Most recently seen time */
340     bool_t allow_send_prod;
341     bool_t msg1_crossed_logged;
342     int resolving_count;
343     int resolving_n_results_all;
344     int resolving_n_results_stored;
345     struct comm_addr resolving_results[MAX_PEER_ADDRS];
346
347     /* The currently established session */
348     struct data_key current;
349     struct data_key auxiliary_key;
350     bool_t auxiliary_is_new;
351     uint64_t renegotiate_key_time; /* When we can negotiate a new key */
352     uint64_t auxiliary_renegotiate_key_time;
353     transport_peers peers; /* Current address(es) of peer for data traffic */
354
355     /* The current key setup protocol exchange.  We can only be
356        involved in one of these at a time.  There's a potential for
357        denial of service here (the attacker keeps sending a setup
358        packet; we keep trying to continue the exchange, and have to
359        timeout before we can listen for another setup packet); perhaps
360        we should keep a list of 'bad' sources for setup packets. */
361     uint32_t remote_capabilities;
362     uint16_t remote_adv_mtu;
363     struct transform_if *chosen_transform;
364     uint32_t setup_session_id;
365     transport_peers setup_peers;
366     uint8_t localN[NONCELEN]; /* Nonces for key exchange */
367     uint8_t remoteN[NONCELEN];
368     struct buffer_if buffer; /* Current outgoing key exchange packet */
369     struct buffer_if scratch;
370     int32_t retries; /* Number of retries remaining */
371     uint64_t timeout; /* Timeout for current state */
372     uint8_t *dhsecret;
373     uint8_t *sharedsecret;
374     struct transform_inst_if *new_transform; /* For key setup/verify */
375 };
376
377 static uint32_t event_log_priority(struct site *st, uint32_t event)
378 {
379     if (!(event&st->log_events))
380         return 0;
381     switch(event) {
382     case LOG_UNEXPECTED:    return M_INFO;
383     case LOG_SETUP_INIT:    return M_INFO;
384     case LOG_SETUP_TIMEOUT: return M_NOTICE;
385     case LOG_ACTIVATE_KEY:  return M_INFO;
386     case LOG_TIMEOUT_KEY:   return M_INFO;
387     case LOG_SEC:           return M_SECURITY;
388     case LOG_STATE:         return M_DEBUG;
389     case LOG_DROP:          return M_DEBUG;
390     case LOG_DUMP:          return M_DEBUG;
391     case LOG_ERROR:         return M_ERR;
392     case LOG_PEER_ADDRS:    return M_DEBUG;
393     default:                return M_ERR;
394     }
395 }
396
397 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
398 FORMAT(printf,3,0);
399 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
400 {
401     uint32_t class;
402
403     class=event_log_priority(st, event);
404     if (class) {
405         slilog_part(st->log,class,"%s: ",st->tunname);
406         vslilog_part(st->log,class,msg,ap);
407         slilog_part(st->log,class,"\n");
408     }
409 }
410
411 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
412 FORMAT(printf,3,4);
413 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
414 {
415     va_list ap;
416     va_start(ap,msg);
417     vslog(st,event,msg,ap);
418     va_end(ap);
419 }
420
421 static void logtimeout(struct site *st, const char *fmt, ...)
422 FORMAT(printf,2,3);
423 static void logtimeout(struct site *st, const char *fmt, ...)
424 {
425     uint32_t class=event_log_priority(st,LOG_SETUP_TIMEOUT);
426     if (!class)
427         return;
428
429     va_list ap;
430     va_start(ap,fmt);
431
432     slilog_part(st->log,class,"%s: ",st->tunname);
433     vslilog_part(st->log,class,fmt,ap);
434
435     const char *delim;
436     int i;
437     for (i=0, delim=" (tried ";
438          i<st->setup_peers.npeers;
439          i++, delim=", ") {
440         transport_peer *peer=&st->setup_peers.peers[i];
441         const char *s=comm_addr_to_string(&peer->addr);
442         slilog_part(st->log,class,"%s%s",delim,s);
443     }
444
445     slilog_part(st->log,class,")\n");
446     va_end(ap);
447 }
448
449 static void set_link_quality(struct site *st);
450 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel);
451 static void delete_one_key(struct site *st, struct data_key *key,
452                            const char *reason /* may be 0 meaning don't log*/,
453                            const char *which /* ignored if !reasonn */,
454                            uint32_t loglevel /* ignored if !reasonn */);
455 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
456                                  const struct comm_addr *prod_hint);
457 static void enter_state_run(struct site *st);
458 static bool_t enter_state_resolve(struct site *st);
459 static void decrement_resolving_count(struct site *st, int by);
460 static bool_t enter_new_state(struct site *st,uint32_t next);
461 static void enter_state_wait(struct site *st);
462 static void activate_new_key(struct site *st);
463
464 static bool_t is_transform_valid(struct transform_inst_if *transform)
465 {
466     return transform && transform->valid(transform->st);
467 }
468
469 static bool_t current_valid(struct site *st)
470 {
471     return is_transform_valid(st->current.transform);
472 }
473
474 #define DEFINE_CALL_TRANSFORM(fwdrev)                                   \
475 static transform_apply_return                                           \
476 call_transform_##fwdrev(struct site *st,                                \
477                                    struct transform_inst_if *transform, \
478                                    struct buffer_if *buf,               \
479                                    const char **errmsg)                 \
480 {                                                                       \
481     if (!is_transform_valid(transform)) {                               \
482         *errmsg="transform not set up";                                 \
483         return transform_apply_err;                                     \
484     }                                                                   \
485     return transform->fwdrev(transform->st,buf,errmsg);                 \
486 }
487
488 DEFINE_CALL_TRANSFORM(forwards)
489 DEFINE_CALL_TRANSFORM(reverse)
490
491 static void dispose_transform(struct transform_inst_if **transform_var)
492 {
493     struct transform_inst_if *transform=*transform_var;
494     if (transform) {
495         transform->delkey(transform->st);
496         transform->destroy(transform->st);
497     }
498     *transform_var = 0;
499 }    
500
501 #define CHECK_AVAIL(b,l) do { if ((b)->size<(l)) return False; } while(0)
502 #define CHECK_EMPTY(b) do { if ((b)->size!=0) return False; } while(0)
503 #define CHECK_TYPE(b,t) do { uint32_t type; \
504     CHECK_AVAIL((b),4); \
505     type=buf_unprepend_uint32((b)); \
506     if (type!=(t)) return False; } while(0)
507
508 static _Bool type_is_msg34(uint32_t type)
509 {
510     switch (type) {
511         case CASES_MSG3_KNOWN: case LABEL_MSG4: return True;
512         default: return False;
513     }
514 }
515
516 struct parsedname {
517     int32_t len;
518     uint8_t *name;
519     struct buffer_if extrainfo;
520 };
521
522 struct msg {
523     uint8_t *hashstart;
524     uint32_t dest;
525     uint32_t source;
526     struct parsedname remote;
527     struct parsedname local;
528     uint32_t remote_capabilities;
529     uint16_t remote_mtu;
530     int capab_transformnum;
531     uint8_t *nR;
532     uint8_t *nL;
533     int32_t pklen;
534     char *pk;
535     int32_t hashlen;
536     int32_t siglen;
537     char *sig;
538 };
539
540 static int32_t wait_timeout(struct site *st) {
541     int32_t t = st->wait_timeout_mean;
542     int8_t factor;
543     if (t < INT_MAX/2) {
544         st->random->generate(st->random->st,sizeof(factor),&factor);
545         t += (t / 256) * factor;
546     }
547     return t;
548 }
549
550 static _Bool set_new_transform(struct site *st, char *pk)
551 {
552     _Bool ok;
553
554     /* Generate the shared key */
555     if (!st->dh->makeshared(st->dh->st,st->dhsecret,st->dh->secret_len,
556                             pk, st->sharedsecret,st->dh->shared_len))
557         return False;
558
559     /* Set up the transform */
560     struct transform_if *generator=st->chosen_transform;
561     struct transform_inst_if *generated=generator->create(generator->st);
562     ok = generated->setkey(generated->st,st->sharedsecret,
563                            st->dh->shared_len,st->our_name_later);
564
565     dispose_transform(&st->new_transform);
566     if (!ok) return False;
567     st->new_transform=generated;
568
569     slog(st,LOG_SETUP_INIT,"key exchange negotiated transform"
570          " %d (capabilities ours=%#"PRIx32" theirs=%#"PRIx32")",
571          st->chosen_transform->capab_bit,
572          st->local_capabilities, st->remote_capabilities);
573     return True;
574 }
575
576 struct xinfoadd {
577     int32_t lenpos, afternul;
578 };
579 static void append_string_xinfo_start(struct buffer_if *buf,
580                                       struct xinfoadd *xia,
581                                       const char *str)
582     /* Helps construct one of the names with additional info as found
583      * in MSG1..4.  Call this function first, then append all the
584      * desired extra info (not including the nul byte) to the buffer,
585      * then call append_string_xinfo_done. */
586 {
587     xia->lenpos = buf->size;
588     buf_append_string(buf,str);
589     buf_append_uint8(buf,0);
590     xia->afternul = buf->size;
591 }
592 static void append_string_xinfo_done(struct buffer_if *buf,
593                                      struct xinfoadd *xia)
594 {
595     /* we just need to adjust the string length */
596     if (buf->size == xia->afternul) {
597         /* no extra info, strip the nul too */
598         buf_unappend_uint8(buf);
599     } else {
600         put_uint16(buf->start+xia->lenpos, buf->size-(xia->lenpos+2));
601     }
602 }
603
604 /* Build any of msg1 to msg4. msg5 and msg6 are built from the inside
605    out using a transform of config data supplied by netlink */
606 static bool_t generate_msg(struct site *st, uint32_t type, cstring_t what)
607 {
608     void *hst;
609     uint8_t *hash;
610     string_t dhpub, sig;
611     unsigned minor;
612
613     st->retries=st->setup_retries;
614     BUF_ALLOC(&st->buffer,what);
615     buffer_init(&st->buffer,0);
616     buf_append_uint32(&st->buffer,
617         (type==LABEL_MSG1?0:st->setup_session_id));
618     buf_append_uint32(&st->buffer,st->index);
619     buf_append_uint32(&st->buffer,type);
620
621     struct xinfoadd xia;
622     append_string_xinfo_start(&st->buffer,&xia,st->localname);
623     if ((st->local_capabilities & st->early_capabilities) ||
624         (type != LABEL_MSG1)) {
625         buf_append_uint32(&st->buffer,st->local_capabilities);
626     }
627     if (type_is_msg34(type)) {
628         buf_append_uint16(&st->buffer,st->mtu_target);
629     }
630     append_string_xinfo_done(&st->buffer,&xia);
631
632     buf_append_string(&st->buffer,st->remotename);
633     BUF_ADD_OBJ(append,&st->buffer,st->localN);
634     if (type==LABEL_MSG1) return True;
635     BUF_ADD_OBJ(append,&st->buffer,st->remoteN);
636     if (type==LABEL_MSG2) return True;
637
638     if (hacky_par_mid_failnow()) return False;
639
640     if (MSGMAJOR(type) == 3) do {
641         minor = MSGMINOR(type);
642         if (minor < 1) break;
643         buf_append_uint8(&st->buffer,st->chosen_transform->capab_bit);
644     } while (0);
645
646     dhpub=st->dh->makepublic(st->dh->st,st->dhsecret,st->dh->secret_len);
647     buf_append_string(&st->buffer,dhpub);
648     free(dhpub);
649     hash=safe_malloc(st->hash->len, "generate_msg");
650     hst=st->hash->init();
651     st->hash->update(hst,st->buffer.start,st->buffer.size);
652     st->hash->final(hst,hash);
653     sig=st->privkey->sign(st->privkey->st,hash,st->hash->len);
654     buf_append_string(&st->buffer,sig);
655     free(sig);
656     free(hash);
657     return True;
658 }
659
660 static bool_t unpick_name(struct buffer_if *msg, struct parsedname *nm)
661 {
662     CHECK_AVAIL(msg,2);
663     nm->len=buf_unprepend_uint16(msg);
664     CHECK_AVAIL(msg,nm->len);
665     nm->name=buf_unprepend(msg,nm->len);
666     uint8_t *nul=memchr(nm->name,0,nm->len);
667     if (!nul) {
668         buffer_readonly_view(&nm->extrainfo,0,0);
669     } else {
670         buffer_readonly_view(&nm->extrainfo, nul+1, msg->start-(nul+1));
671         nm->len=nul-nm->name;
672     }
673     return True;
674 }
675
676 static bool_t unpick_msg(struct site *st, uint32_t type,
677                          struct buffer_if *msg, struct msg *m)
678 {
679     unsigned minor;
680
681     m->capab_transformnum=-1;
682     m->hashstart=msg->start;
683     CHECK_AVAIL(msg,4);
684     m->dest=buf_unprepend_uint32(msg);
685     CHECK_AVAIL(msg,4);
686     m->source=buf_unprepend_uint32(msg);
687     CHECK_TYPE(msg,type);
688     if (!unpick_name(msg,&m->remote)) return False;
689     m->remote_capabilities=0;
690     m->remote_mtu=0;
691     if (m->remote.extrainfo.size) {
692         CHECK_AVAIL(&m->remote.extrainfo,4);
693         m->remote_capabilities=buf_unprepend_uint32(&m->remote.extrainfo);
694     }
695     if (type_is_msg34(type) && m->remote.extrainfo.size) {
696         CHECK_AVAIL(&m->remote.extrainfo,2);
697         m->remote_mtu=buf_unprepend_uint16(&m->remote.extrainfo);
698     }
699     if (!unpick_name(msg,&m->local)) return False;
700     if (type==LABEL_PROD) {
701         CHECK_EMPTY(msg);
702         return True;
703     }
704     CHECK_AVAIL(msg,NONCELEN);
705     m->nR=buf_unprepend(msg,NONCELEN);
706     if (type==LABEL_MSG1) {
707         CHECK_EMPTY(msg);
708         return True;
709     }
710     CHECK_AVAIL(msg,NONCELEN);
711     m->nL=buf_unprepend(msg,NONCELEN);
712     if (type==LABEL_MSG2) {
713         CHECK_EMPTY(msg);
714         return True;
715     }
716     if (MSGMAJOR(type) == 3) do {
717         minor = MSGMINOR(type);
718 #define MAYBE_READ_CAP(minminor, kind, dflt) do {                       \
719     if (minor < (minminor))                                             \
720         m->capab_##kind##num = (dflt);                                  \
721     else {                                                              \
722         CHECK_AVAIL(msg, 1);                                            \
723         m->capab_##kind##num = buf_unprepend_uint8(msg);                \
724     }                                                                   \
725 } while (0)
726         MAYBE_READ_CAP(1, transform, CAPAB_BIT_ANCIENTTRANSFORM);
727 #undef MAYBE_READ_CAP
728     } while (0);
729     CHECK_AVAIL(msg,2);
730     m->pklen=buf_unprepend_uint16(msg);
731     CHECK_AVAIL(msg,m->pklen);
732     m->pk=buf_unprepend(msg,m->pklen);
733     m->hashlen=msg->start-m->hashstart;
734     CHECK_AVAIL(msg,2);
735     m->siglen=buf_unprepend_uint16(msg);
736     CHECK_AVAIL(msg,m->siglen);
737     m->sig=buf_unprepend(msg,m->siglen);
738     CHECK_EMPTY(msg);
739
740     /* In `process_msg3_msg4' below, we assume that we can write a nul
741      * terminator following the signature.  Make sure there's enough space.
742      */
743     if (msg->start >= msg->base + msg->alloclen)
744         return False;
745
746     return True;
747 }
748
749 static bool_t name_matches(const struct parsedname *nm, const char *expected)
750 {
751     int expected_len=strlen(expected);
752     return
753         nm->len == expected_len &&
754         !memcmp(nm->name, expected, expected_len);
755 }    
756
757 static bool_t check_msg(struct site *st, uint32_t type, struct msg *m,
758                         cstring_t *error)
759 {
760     if (type==LABEL_MSG1) return True;
761
762     /* Check that the site names and our nonce have been sent
763        back correctly, and then store our peer's nonce. */ 
764     if (!name_matches(&m->remote,st->remotename)) {
765         *error="wrong remote site name";
766         return False;
767     }
768     if (!name_matches(&m->local,st->localname)) {
769         *error="wrong local site name";
770         return False;
771     }
772     if (memcmp(m->nL,st->localN,NONCELEN)!=0) {
773         *error="wrong locally-generated nonce";
774         return False;
775     }
776     if (type==LABEL_MSG2) return True;
777     if (!consttime_memeq(m->nR,st->remoteN,NONCELEN)) {
778         *error="wrong remotely-generated nonce";
779         return False;
780     }
781     /* MSG3 has complicated rules about capabilities, which are
782      * handled in process_msg3. */
783     if (MSGMAJOR(type) == 3) return True;
784     if (m->remote_capabilities!=st->remote_capabilities) {
785         *error="remote capabilities changed";
786         return False;
787     }
788     if (type==LABEL_MSG4) return True;
789     *error="unknown message type";
790     return False;
791 }
792
793 static bool_t generate_msg1(struct site *st)
794 {
795     st->random->generate(st->random->st,NONCELEN,st->localN);
796     return generate_msg(st,LABEL_MSG1,"site:MSG1");
797 }
798
799 static bool_t process_msg1(struct site *st, struct buffer_if *msg1,
800                            const struct comm_addr *src, struct msg *m)
801 {
802     /* We've already determined we're in an appropriate state to
803        process an incoming MSG1, and that the MSG1 has correct values
804        of A and B. */
805
806     st->setup_session_id=m->source;
807     st->remote_capabilities=m->remote_capabilities;
808     memcpy(st->remoteN,m->nR,NONCELEN);
809     return True;
810 }
811
812 static bool_t generate_msg2(struct site *st)
813 {
814     st->random->generate(st->random->st,NONCELEN,st->localN);
815     return generate_msg(st,LABEL_MSG2,"site:MSG2");
816 }
817
818 static bool_t process_msg2(struct site *st, struct buffer_if *msg2,
819                            const struct comm_addr *src)
820 {
821     struct msg m;
822     cstring_t err;
823
824     if (!unpick_msg(st,LABEL_MSG2,msg2,&m)) return False;
825     if (!check_msg(st,LABEL_MSG2,&m,&err)) {
826         slog(st,LOG_SEC,"msg2: %s",err);
827         return False;
828     }
829     st->setup_session_id=m.source;
830     st->remote_capabilities=m.remote_capabilities;
831
832     /* Select the transform to use */
833
834     uint32_t remote_crypto_caps = st->remote_capabilities & CAPAB_TRANSFORM_MASK;
835     if (!remote_crypto_caps)
836         /* old secnets only had this one transform */
837         remote_crypto_caps = 1UL << CAPAB_BIT_ANCIENTTRANSFORM;
838
839 #define CHOOSE_CRYPTO(kind, whats) do {                                 \
840     struct kind##_if *iface;                                            \
841     uint32_t bit, ours = 0;                                             \
842     int i;                                                              \
843     for (i= 0; i < st->n##kind##s; i++) {                               \
844         iface=st->kind##s[i];                                           \
845         bit = 1UL << iface->capab_bit;                                  \
846         if (bit & remote_crypto_caps) goto kind##_found;                \
847         ours |= bit;                                                    \
848     }                                                                   \
849     slog(st,LOG_ERROR,"no " whats " in common"                          \
850          " (us %#"PRIx32"; them: %#"PRIx32")",                          \
851          st->local_capabilities & ours, remote_crypto_caps);            \
852     return False;                                                       \
853 kind##_found:                                                           \
854     st->chosen_##kind = iface;                                          \
855 } while (0)
856
857     CHOOSE_CRYPTO(transform, "transforms");
858
859 #undef CHOOSE_CRYPTO
860
861     memcpy(st->remoteN,m.nR,NONCELEN);
862     return True;
863 }
864
865 static bool_t generate_msg3(struct site *st)
866 {
867     /* Now we have our nonce and their nonce. Think of a secret key,
868        and create message number 3. */
869     st->random->generate(st->random->st,st->dh->secret_len,st->dhsecret);
870     return generate_msg(st,
871                         (st->remote_capabilities & CAPAB_TRANSFORM_MASK)
872                         ? LABEL_MSG3BIS
873                         : LABEL_MSG3,
874                         "site:MSG3");
875 }
876
877 static bool_t process_msg3_msg4(struct site *st, struct msg *m)
878 {
879     uint8_t *hash;
880     void *hst;
881
882     /* Check signature and store g^x mod m */
883     hash=safe_malloc(st->hash->len, "process_msg3_msg4");
884     hst=st->hash->init();
885     st->hash->update(hst,m->hashstart,m->hashlen);
886     st->hash->final(hst,hash);
887     /* Terminate signature with a '0' - already checked that this will fit */
888     m->sig[m->siglen]=0;
889     if (!st->pubkey->check(st->pubkey->st,hash,st->hash->len,m->sig)) {
890         slog(st,LOG_SEC,"msg3/msg4 signature failed check!");
891         free(hash);
892         return False;
893     }
894     free(hash);
895
896     st->remote_adv_mtu=m->remote_mtu;
897
898     return True;
899 }
900
901 static bool_t process_msg3(struct site *st, struct buffer_if *msg3,
902                            const struct comm_addr *src, uint32_t msgtype)
903 {
904     struct msg m;
905     cstring_t err;
906
907     switch (msgtype) {
908         case CASES_MSG3_KNOWN: break;
909         default: assert(0);
910     }
911
912     if (!unpick_msg(st,msgtype,msg3,&m)) return False;
913     if (!check_msg(st,msgtype,&m,&err)) {
914         slog(st,LOG_SEC,"msg3: %s",err);
915         return False;
916     }
917     uint32_t capab_adv_late = m.remote_capabilities
918         & ~st->remote_capabilities & st->early_capabilities;
919     if (capab_adv_late) {
920         slog(st,LOG_SEC,"msg3 impermissibly adds early capability flag(s)"
921              " %#"PRIx32" (was %#"PRIx32", now %#"PRIx32")",
922              capab_adv_late, st->remote_capabilities, m.remote_capabilities);
923         return False;
924     }
925     st->remote_capabilities|=m.remote_capabilities;
926
927 #define CHOSE_CRYPTO(kind, what) do {                                   \
928     struct kind##_if *iface;                                            \
929     int i;                                                              \
930     for (i=0; i<st->n##kind##s; i++) {                                  \
931         iface=st->kind##s[i];                                           \
932         if (iface->capab_bit == m.capab_##kind##num)                    \
933             goto kind##_found;                                          \
934     }                                                                   \
935     slog(st,LOG_SEC,"peer chose unknown-to-us " what " %d!",            \
936          m.capab_##kind##num);                                                  \
937     return False;                                                       \
938 kind##_found:                                                           \
939     st->chosen_##kind=iface;                                            \
940 } while (0)
941
942     CHOSE_CRYPTO(transform, "transform");
943
944 #undef CHOSE_CRYPTO
945
946     if (!process_msg3_msg4(st,&m))
947         return False;
948
949     /* Terminate their DH public key with a '0' */
950     m.pk[m.pklen]=0;
951     /* Invent our DH secret key */
952     st->random->generate(st->random->st,st->dh->secret_len,st->dhsecret);
953
954     /* Generate the shared key and set up the transform */
955     if (!set_new_transform(st,m.pk)) return False;
956
957     return True;
958 }
959
960 static bool_t generate_msg4(struct site *st)
961 {
962     /* We have both nonces, their public key and our private key. Generate
963        our public key, sign it and send it to them. */
964     return generate_msg(st,LABEL_MSG4,"site:MSG4");
965 }
966
967 static bool_t process_msg4(struct site *st, struct buffer_if *msg4,
968                            const struct comm_addr *src)
969 {
970     struct msg m;
971     cstring_t err;
972
973     if (!unpick_msg(st,LABEL_MSG4,msg4,&m)) return False;
974     if (!check_msg(st,LABEL_MSG4,&m,&err)) {
975         slog(st,LOG_SEC,"msg4: %s",err);
976         return False;
977     }
978     
979     if (!process_msg3_msg4(st,&m))
980         return False;
981
982     /* Terminate their DH public key with a '0' */
983     m.pk[m.pklen]=0;
984
985     /* Generate the shared key and set up the transform */
986     if (!set_new_transform(st,m.pk)) return False;
987
988     return True;
989 }
990
991 struct msg0 {
992     uint32_t dest;
993     uint32_t source;
994     uint32_t type;
995 };
996
997 static bool_t unpick_msg0(struct site *st, struct buffer_if *msg0,
998                           struct msg0 *m)
999 {
1000     CHECK_AVAIL(msg0,4);
1001     m->dest=buf_unprepend_uint32(msg0);
1002     CHECK_AVAIL(msg0,4);
1003     m->source=buf_unprepend_uint32(msg0);
1004     CHECK_AVAIL(msg0,4);
1005     m->type=buf_unprepend_uint32(msg0);
1006     return True;
1007     /* Leaves transformed part of buffer untouched */
1008 }
1009
1010 static bool_t generate_msg5(struct site *st)
1011 {
1012     cstring_t transform_err;
1013
1014     BUF_ALLOC(&st->buffer,"site:MSG5");
1015     /* We are going to add four words to the message */
1016     buffer_init(&st->buffer,calculate_max_start_pad());
1017     /* Give the netlink code an opportunity to put its own stuff in the
1018        message (configuration information, etc.) */
1019     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
1020     if (call_transform_forwards(st,st->new_transform,
1021                                 &st->buffer,&transform_err))
1022         return False;
1023     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
1024     buf_prepend_uint32(&st->buffer,st->index);
1025     buf_prepend_uint32(&st->buffer,st->setup_session_id);
1026
1027     st->retries=st->setup_retries;
1028     return True;
1029 }
1030
1031 static bool_t process_msg5(struct site *st, struct buffer_if *msg5,
1032                            const struct comm_addr *src,
1033                            struct transform_inst_if *transform)
1034 {
1035     struct msg0 m;
1036     cstring_t transform_err;
1037
1038     if (!unpick_msg0(st,msg5,&m)) return False;
1039
1040     if (call_transform_reverse(st,transform,msg5,&transform_err)) {
1041         /* There's a problem */
1042         slog(st,LOG_SEC,"process_msg5: transform: %s",transform_err);
1043         return False;
1044     }
1045     /* Buffer should now contain untransformed PING packet data */
1046     CHECK_AVAIL(msg5,4);
1047     if (buf_unprepend_uint32(msg5)!=LABEL_MSG5) {
1048         slog(st,LOG_SEC,"MSG5/PING packet contained wrong label");
1049         return False;
1050     }
1051     /* Older versions of secnet used to write some config data here
1052      * which we ignore.  So we don't CHECK_EMPTY */
1053     return True;
1054 }
1055
1056 static void create_msg6(struct site *st, struct transform_inst_if *transform,
1057                         uint32_t session_id)
1058 {
1059     cstring_t transform_err;
1060
1061     BUF_ALLOC(&st->buffer,"site:MSG6");
1062     /* We are going to add four words to the message */
1063     buffer_init(&st->buffer,calculate_max_start_pad());
1064     /* Give the netlink code an opportunity to put its own stuff in the
1065        message (configuration information, etc.) */
1066     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1067     transform_apply_return problem =
1068         call_transform_forwards(st,transform,
1069                                 &st->buffer,&transform_err);
1070     assert(!problem);
1071     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1072     buf_prepend_uint32(&st->buffer,st->index);
1073     buf_prepend_uint32(&st->buffer,session_id);
1074 }
1075
1076 static bool_t generate_msg6(struct site *st)
1077 {
1078     if (!is_transform_valid(st->new_transform))
1079         return False;
1080     create_msg6(st,st->new_transform,st->setup_session_id);
1081     st->retries=1; /* Peer will retransmit MSG5 if this packet gets lost */
1082     return True;
1083 }
1084
1085 static bool_t process_msg6(struct site *st, struct buffer_if *msg6,
1086                            const struct comm_addr *src)
1087 {
1088     struct msg0 m;
1089     cstring_t transform_err;
1090
1091     if (!unpick_msg0(st,msg6,&m)) return False;
1092
1093     if (call_transform_reverse(st,st->new_transform,msg6,&transform_err)) {
1094         /* There's a problem */
1095         slog(st,LOG_SEC,"process_msg6: transform: %s",transform_err);
1096         return False;
1097     }
1098     /* Buffer should now contain untransformed PING packet data */
1099     CHECK_AVAIL(msg6,4);
1100     if (buf_unprepend_uint32(msg6)!=LABEL_MSG6) {
1101         slog(st,LOG_SEC,"MSG6/PONG packet contained invalid data");
1102         return False;
1103     }
1104     /* Older versions of secnet used to write some config data here
1105      * which we ignore.  So we don't CHECK_EMPTY */
1106     return True;
1107 }
1108
1109 static transform_apply_return
1110 decrypt_msg0(struct site *st, struct buffer_if *msg0,
1111                            const struct comm_addr *src)
1112 {
1113     cstring_t transform_err, auxkey_err, newkey_err="n/a";
1114     struct msg0 m;
1115     transform_apply_return problem;
1116
1117     if (!unpick_msg0(st,msg0,&m)) return False;
1118
1119     /* Keep a copy so we can try decrypting it with multiple keys */
1120     buffer_copy(&st->scratch, msg0);
1121
1122     problem = call_transform_reverse(st,st->current.transform,
1123                                      msg0,&transform_err);
1124     if (!problem) {
1125         if (!st->auxiliary_is_new)
1126             delete_one_key(st,&st->auxiliary_key,
1127                            "peer has used new key","auxiliary key",LOG_SEC);
1128         return 0;
1129     }
1130     if (transform_apply_return_badseq(problem))
1131         goto badseq;
1132
1133     buffer_copy(msg0, &st->scratch);
1134     problem = call_transform_reverse(st,st->auxiliary_key.transform,
1135                                      msg0,&auxkey_err);
1136     if (!problem) {
1137         slog(st,LOG_DROP,"processing packet which uses auxiliary key");
1138         if (st->auxiliary_is_new) {
1139             /* We previously timed out in state SENTMSG5 but it turns
1140              * out that our peer did in fact get our MSG5 and is
1141              * using the new key.  So we should switch to it too. */
1142             /* This is a bit like activate_new_key. */
1143             struct data_key t;
1144             t=st->current;
1145             st->current=st->auxiliary_key;
1146             st->auxiliary_key=t;
1147
1148             delete_one_key(st,&st->auxiliary_key,"peer has used new key",
1149                            "previous key",LOG_SEC);
1150             st->auxiliary_is_new=0;
1151             st->renegotiate_key_time=st->auxiliary_renegotiate_key_time;
1152         }
1153         return 0;
1154     }
1155     if (transform_apply_return_badseq(problem))
1156         goto badseq;
1157
1158     if (st->state==SITE_SENTMSG5) {
1159         buffer_copy(msg0, &st->scratch);
1160         problem = call_transform_reverse(st,st->new_transform,
1161                                          msg0,&newkey_err);
1162         if (!problem) {
1163             /* It looks like we didn't get the peer's MSG6 */
1164             /* This is like a cut-down enter_new_state(SITE_RUN) */
1165             slog(st,LOG_STATE,"will enter state RUN (MSG0 with new key)");
1166             BUF_FREE(&st->buffer);
1167             st->timeout=0;
1168             activate_new_key(st);
1169             return 0; /* do process the data in this packet */
1170         }
1171         if (transform_apply_return_badseq(problem))
1172             goto badseq;
1173     }
1174
1175     slog(st,LOG_SEC,"transform: %s (aux: %s, new: %s)",
1176          transform_err,auxkey_err,newkey_err);
1177     initiate_key_setup(st,"incoming message would not decrypt",0);
1178     send_nak(src,m.dest,m.source,m.type,msg0,"message would not decrypt");
1179     assert(problem);
1180     return problem;
1181
1182  badseq:
1183     slog(st,LOG_DROP,"transform: %s (bad seq.)",transform_err);
1184     assert(problem);
1185     return problem;
1186 }
1187
1188 static bool_t process_msg0(struct site *st, struct buffer_if *msg0,
1189                            const struct comm_addr *src)
1190 {
1191     uint32_t type;
1192     transform_apply_return problem;
1193
1194     problem = decrypt_msg0(st,msg0,src);
1195     if (problem==transform_apply_seqdupe) {
1196         /* We recently received another copy of this packet, maybe due
1197          * to polypath.  That's not a problem; indeed, for the
1198          * purposes of transport address management it is a success.
1199          * But we don't want to process the packet. */
1200         transport_data_msgok(st,src);
1201         return False;
1202     }
1203     if (problem)
1204         return False;
1205
1206     CHECK_AVAIL(msg0,4);
1207     type=buf_unprepend_uint32(msg0);
1208     switch(type) {
1209     case LABEL_MSG7:
1210         /* We must forget about the current session. */
1211         delete_keys(st,"request from peer",LOG_SEC);
1212         /* probably, the peer is shutting down, and this is going to fail,
1213          * but we need to be trying to bring the link up again */
1214         if (st->keepalive)
1215             initiate_key_setup(st,"peer requested key teardown",0);
1216         return True;
1217     case LABEL_MSG9:
1218         /* Deliver to netlink layer */
1219         st->netlink->deliver(st->netlink->st,msg0);
1220         transport_data_msgok(st,src);
1221         /* See whether we should start negotiating a new key */
1222         if (st->now > st->renegotiate_key_time)
1223             initiate_key_setup(st,"incoming packet in renegotiation window",0);
1224         return True;
1225     default:
1226         slog(st,LOG_SEC,"incoming encrypted message of type %08x "
1227              "(unknown)",type);
1228         break;
1229     }
1230     return False;
1231 }
1232
1233 static void dump_packet(struct site *st, struct buffer_if *buf,
1234                         const struct comm_addr *addr, bool_t incoming,
1235                         bool_t ok)
1236 {
1237     uint32_t dest=get_uint32(buf->start);
1238     uint32_t source=get_uint32(buf->start+4);
1239     uint32_t msgtype=get_uint32(buf->start+8);
1240
1241     if (st->log_events & LOG_DUMP)
1242         slilog(st->log,M_DEBUG,"%s: %s: %08x<-%08x: %08x: %s%s",
1243                st->tunname,incoming?"incoming":"outgoing",
1244                dest,source,msgtype,comm_addr_to_string(addr),
1245                ok?"":" - fail");
1246 }
1247
1248 static bool_t comm_addr_sendmsg(struct site *st,
1249                                 const struct comm_addr *dest,
1250                                 struct buffer_if *buf)
1251 {
1252     int i;
1253     struct comm_clientinfo *commclientinfo = 0;
1254
1255     for (i=0; i < st->ncomms; i++) {
1256         if (st->comms[i] == dest->comm) {
1257             commclientinfo = st->commclientinfos[i];
1258             break;
1259         }
1260     }
1261     return dest->comm->sendmsg(dest->comm->st, buf, dest, commclientinfo);
1262 }
1263
1264 static uint32_t site_status(void *st)
1265 {
1266     return 0;
1267 }
1268
1269 static bool_t send_msg(struct site *st)
1270 {
1271     if (st->retries>0) {
1272         transport_xmit(st, &st->setup_peers, &st->buffer, True);
1273         st->timeout=st->now+st->setup_retry_interval;
1274         st->retries--;
1275         return True;
1276     } else if (st->state==SITE_SENTMSG5) {
1277         logtimeout(st,"timed out sending MSG5, stashing new key");
1278         /* We stash the key we have produced, in case it turns out that
1279          * our peer did see our MSG5 after all and starts using it. */
1280         /* This is a bit like some of activate_new_key */
1281         struct transform_inst_if *t;
1282         t=st->auxiliary_key.transform;
1283         st->auxiliary_key.transform=st->new_transform;
1284         st->new_transform=t;
1285         dispose_transform(&st->new_transform);
1286
1287         st->auxiliary_is_new=1;
1288         st->auxiliary_key.key_timeout=st->now+st->key_lifetime;
1289         st->auxiliary_renegotiate_key_time=st->now+st->key_renegotiate_time;
1290         st->auxiliary_key.remote_session_id=st->setup_session_id;
1291
1292         enter_state_wait(st);
1293         return False;
1294     } else {
1295         logtimeout(st,"timed out sending key setup packet "
1296             "(in state %s)",state_name(st->state));
1297         enter_state_wait(st);
1298         return False;
1299     }
1300 }
1301
1302 static void site_resolve_callback(void *sst, const struct comm_addr *addrs,
1303                                   int stored_naddrs, int all_naddrs,
1304                                   const char *address, const char *failwhy)
1305 {
1306     struct site *st=sst;
1307
1308     if (!stored_naddrs) {
1309         slog(st,LOG_ERROR,"resolution of %s failed: %s",address,failwhy);
1310     } else {
1311         slog(st,LOG_PEER_ADDRS,"resolution of %s completed, %d addrs, eg: %s",
1312              address, all_naddrs, comm_addr_to_string(&addrs[0]));;
1313
1314         int space=st->transport_peers_max-st->resolving_n_results_stored;
1315         int n_tocopy=MIN(stored_naddrs,space);
1316         COPY_ARRAY(st->resolving_results + st->resolving_n_results_stored,
1317                    addrs,
1318                    n_tocopy);
1319         st->resolving_n_results_stored += n_tocopy;
1320         st->resolving_n_results_all += all_naddrs;
1321     }
1322
1323     decrement_resolving_count(st,1);
1324 }
1325
1326 static void decrement_resolving_count(struct site *st, int by)
1327 {
1328     assert(st->resolving_count>0);
1329     st->resolving_count-=by;
1330
1331     if (st->resolving_count)
1332         return;
1333
1334     /* OK, we are done with them all.  Handle combined results. */
1335
1336     const struct comm_addr *addrs=st->resolving_results;
1337     int naddrs=st->resolving_n_results_stored;
1338     assert(naddrs<=st->transport_peers_max);
1339
1340     if (naddrs) {
1341         if (naddrs != st->resolving_n_results_all) {
1342             slog(st,LOG_SETUP_INIT,"resolution of supplied addresses/names"
1343                  " yielded too many results (%d > %d), some ignored",
1344                  st->resolving_n_results_all, naddrs);
1345         }
1346         slog(st,LOG_STATE,"resolution completed, %d addrs, eg: %s",
1347              naddrs, iaddr_to_string(&addrs[0].ia));;
1348     }
1349
1350     switch (st->state) {
1351     case SITE_RESOLVE:
1352         if (transport_compute_setupinit_peers(st,addrs,naddrs,0)) {
1353             enter_new_state(st,SITE_SENTMSG1);
1354         } else {
1355             /* Can't figure out who to try to to talk to */
1356             slog(st,LOG_SETUP_INIT,
1357                  "key exchange failed: cannot find peer address");
1358             enter_state_run(st);
1359         }
1360         break;
1361     case SITE_SENTMSG1: case SITE_SENTMSG2:
1362     case SITE_SENTMSG3: case SITE_SENTMSG4:
1363     case SITE_SENTMSG5:
1364         if (naddrs) {
1365             /* We start using the address immediately for data too.
1366              * It's best to store it in st->peers now because we might
1367              * go via SENTMSG5, WAIT, and a MSG0, straight into using
1368              * the new key (without updating the data peer addrs). */
1369             transport_resolve_complete(st,addrs,naddrs);
1370         } else if (st->local_mobile) {
1371             /* We can't let this rest because we may have a peer
1372              * address which will break in the future. */
1373             slog(st,LOG_SETUP_INIT,"resolution failed: "
1374                  "abandoning key exchange");
1375             enter_state_wait(st);
1376         } else {
1377             slog(st,LOG_SETUP_INIT,"resolution failed: "
1378                  " continuing to use source address of peer's packets"
1379                  " for key exchange and ultimately data");
1380         }
1381         break;
1382     case SITE_RUN:
1383         if (naddrs) {
1384             slog(st,LOG_SETUP_INIT,"resolution completed tardily,"
1385                  " updating peer address(es)");
1386             transport_resolve_complete_tardy(st,addrs,naddrs);
1387         } else if (st->local_mobile) {
1388             /* Not very good.  We should queue (another) renegotiation
1389              * so that we can update the peer address. */
1390             st->key_renegotiate_time=st->now+wait_timeout(st);
1391         } else {
1392             slog(st,LOG_SETUP_INIT,"resolution failed: "
1393                  " continuing to use source address of peer's packets");
1394         }
1395         break;
1396     case SITE_WAIT:
1397     case SITE_STOP:
1398         /* oh well */
1399         break;
1400     }
1401 }
1402
1403 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
1404                                  const struct comm_addr *prod_hint)
1405 {
1406     /* Reentrancy hazard: can call enter_new_state/enter_state_* */
1407     if (st->state!=SITE_RUN) return False;
1408     slog(st,LOG_SETUP_INIT,"initiating key exchange (%s)",reason);
1409     if (st->addresses) {
1410         slog(st,LOG_SETUP_INIT,"resolving peer address(es)");
1411         return enter_state_resolve(st);
1412     } else if (transport_compute_setupinit_peers(st,0,0,prod_hint)) {
1413         return enter_new_state(st,SITE_SENTMSG1);
1414     }
1415     slog(st,LOG_SETUP_INIT,"key exchange failed: no address for peer");
1416     return False;
1417 }
1418
1419 static void activate_new_key(struct site *st)
1420 {
1421     struct transform_inst_if *t;
1422
1423     /* We have three transform instances, which we swap between old,
1424        active and setup */
1425     t=st->auxiliary_key.transform;
1426     st->auxiliary_key.transform=st->current.transform;
1427     st->current.transform=st->new_transform;
1428     st->new_transform=t;
1429     dispose_transform(&st->new_transform);
1430
1431     st->timeout=0;
1432     st->auxiliary_is_new=0;
1433     st->auxiliary_key.key_timeout=st->current.key_timeout;
1434     st->current.key_timeout=st->now+st->key_lifetime;
1435     st->renegotiate_key_time=st->now+st->key_renegotiate_time;
1436     transport_peers_copy(st,&st->peers,&st->setup_peers);
1437     st->current.remote_session_id=st->setup_session_id;
1438
1439     /* Compute the inter-site MTU.  This is min( our_mtu, their_mtu ).
1440      * But their mtu be unspecified, in which case we just use ours. */
1441     uint32_t intersite_mtu=
1442         MIN(st->mtu_target, st->remote_adv_mtu ?: ~(uint32_t)0);
1443     st->netlink->set_mtu(st->netlink->st,intersite_mtu);
1444
1445     slog(st,LOG_ACTIVATE_KEY,"new key activated"
1446          " (mtu ours=%"PRId32" theirs=%"PRId32" intersite=%"PRId32")",
1447          st->mtu_target, st->remote_adv_mtu, intersite_mtu);
1448     enter_state_run(st);
1449 }
1450
1451 static void delete_one_key(struct site *st, struct data_key *key,
1452                            cstring_t reason, cstring_t which, uint32_t loglevel)
1453 {
1454     if (!is_transform_valid(key->transform)) return;
1455     if (reason) slog(st,loglevel,"%s deleted (%s)",which,reason);
1456     dispose_transform(&key->transform);
1457     key->key_timeout=0;
1458 }
1459
1460 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel)
1461 {
1462     if (current_valid(st)) {
1463         slog(st,loglevel,"session closed (%s)",reason);
1464
1465         delete_one_key(st,&st->current,0,0,0);
1466         set_link_quality(st);
1467     }
1468     delete_one_key(st,&st->auxiliary_key,0,0,0);
1469 }
1470
1471 static void state_assert(struct site *st, bool_t ok)
1472 {
1473     if (!ok) fatal("site:state_assert");
1474 }
1475
1476 static void enter_state_stop(struct site *st)
1477 {
1478     st->state=SITE_STOP;
1479     st->timeout=0;
1480     delete_keys(st,"entering state STOP",LOG_TIMEOUT_KEY);
1481     dispose_transform(&st->new_transform);
1482 }
1483
1484 static void set_link_quality(struct site *st)
1485 {
1486     uint32_t quality;
1487     if (current_valid(st))
1488         quality=LINK_QUALITY_UP;
1489     else if (st->state==SITE_WAIT || st->state==SITE_STOP)
1490         quality=LINK_QUALITY_DOWN;
1491     else if (st->addresses)
1492         quality=LINK_QUALITY_DOWN_CURRENT_ADDRESS;
1493     else if (transport_peers_valid(&st->peers))
1494         quality=LINK_QUALITY_DOWN_STALE_ADDRESS;
1495     else
1496         quality=LINK_QUALITY_DOWN;
1497
1498     st->netlink->set_quality(st->netlink->st,quality);
1499 }
1500
1501 static void enter_state_run(struct site *st)
1502 {
1503     slog(st,LOG_STATE,"entering state RUN%s",
1504          current_valid(st) ? " (keyed)" : " (unkeyed)");
1505     st->state=SITE_RUN;
1506     st->timeout=0;
1507
1508     st->setup_session_id=0;
1509     transport_peers_clear(st,&st->setup_peers);
1510     FILLZERO(st->localN);
1511     FILLZERO(st->remoteN);
1512     dispose_transform(&st->new_transform);
1513     memset(st->dhsecret,0,st->dh->secret_len);
1514     memset(st->sharedsecret,0,st->dh->shared_len);
1515     set_link_quality(st);
1516
1517     if (st->keepalive && !current_valid(st))
1518         initiate_key_setup(st, "keepalive", 0);
1519 }
1520
1521 static bool_t ensure_resolving(struct site *st)
1522 {
1523     /* Reentrancy hazard: may call site_resolve_callback and hence
1524      * enter_new_state, enter_state_* and generate_msg*. */
1525     if (st->resolving_count)
1526         return True;
1527
1528     assert(st->addresses);
1529
1530     /* resolver->request might reentrantly call site_resolve_callback
1531      * which will decrement st->resolving, so we need to increment it
1532      * twice beforehand to prevent decrement from thinking we're
1533      * finished, and decrement it ourselves.  Alternatively if
1534      * everything fails then there are no callbacks due and we simply
1535      * set it to 0 and return false.. */
1536     st->resolving_n_results_stored=0;
1537     st->resolving_n_results_all=0;
1538     st->resolving_count+=2;
1539     const char **addrp=st->addresses;
1540     const char *address;
1541     bool_t anyok=False;
1542     for (; (address=*addrp++); ) {
1543         bool_t ok = st->resolver->request(st->resolver->st,address,
1544                                           st->remoteport,st->comms[0],
1545                                           site_resolve_callback,st);
1546         if (ok)
1547             st->resolving_count++;
1548         anyok|=ok;
1549     }
1550     if (!anyok) {
1551         st->resolving_count=0;
1552         return False;
1553     }
1554     decrement_resolving_count(st,2);
1555     return True;
1556 }
1557
1558 static bool_t enter_state_resolve(struct site *st)
1559 {
1560     /* Reentrancy hazard!  See ensure_resolving. */
1561     state_assert(st,st->state==SITE_RUN);
1562     slog(st,LOG_STATE,"entering state RESOLVE");
1563     st->state=SITE_RESOLVE;
1564     return ensure_resolving(st);
1565 }
1566
1567 static bool_t enter_new_state(struct site *st, uint32_t next)
1568 {
1569     bool_t (*gen)(struct site *st);
1570     int r;
1571
1572     slog(st,LOG_STATE,"entering state %s",state_name(next));
1573     switch(next) {
1574     case SITE_SENTMSG1:
1575         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE);
1576         gen=generate_msg1;
1577         st->msg1_crossed_logged = False;
1578         break;
1579     case SITE_SENTMSG2:
1580         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1581                      st->state==SITE_SENTMSG1 || st->state==SITE_WAIT);
1582         gen=generate_msg2;
1583         break;
1584     case SITE_SENTMSG3:
1585         state_assert(st,st->state==SITE_SENTMSG1);
1586         BUF_FREE(&st->buffer);
1587         gen=generate_msg3;
1588         break;
1589     case SITE_SENTMSG4:
1590         state_assert(st,st->state==SITE_SENTMSG2);
1591         BUF_FREE(&st->buffer);
1592         gen=generate_msg4;
1593         break;
1594     case SITE_SENTMSG5:
1595         state_assert(st,st->state==SITE_SENTMSG3);
1596         BUF_FREE(&st->buffer);
1597         gen=generate_msg5;
1598         break;
1599     case SITE_RUN:
1600         state_assert(st,st->state==SITE_SENTMSG4);
1601         BUF_FREE(&st->buffer);
1602         gen=generate_msg6;
1603         break;
1604     default:
1605         gen=NULL;
1606         fatal("enter_new_state(%s): invalid new state",state_name(next));
1607         break;
1608     }
1609
1610     if (hacky_par_start_failnow()) return False;
1611
1612     r= gen(st) && send_msg(st);
1613
1614     hacky_par_end(&r,
1615                   st->setup_retries, st->setup_retry_interval,
1616                   send_msg, st);
1617     
1618     if (r) {
1619         st->state=next;
1620         if (next==SITE_RUN) {
1621             BUF_FREE(&st->buffer); /* Never reused */
1622             st->timeout=0; /* Never retransmit */
1623             activate_new_key(st);
1624         }
1625         return True;
1626     }
1627     slog(st,LOG_ERROR,"error entering state %s",state_name(next));
1628     st->buffer.free=False; /* Unconditionally use the buffer; it may be
1629                               in either state, and enter_state_wait() will
1630                               do a BUF_FREE() */
1631     enter_state_wait(st);
1632     return False;
1633 }
1634
1635 /* msg7 tells our peer that we're about to forget our key */
1636 static bool_t send_msg7(struct site *st, cstring_t reason)
1637 {
1638     cstring_t transform_err;
1639
1640     if (current_valid(st) && st->buffer.free
1641         && transport_peers_valid(&st->peers)) {
1642         BUF_ALLOC(&st->buffer,"site:MSG7");
1643         buffer_init(&st->buffer,calculate_max_start_pad());
1644         buf_append_uint32(&st->buffer,LABEL_MSG7);
1645         buf_append_string(&st->buffer,reason);
1646         if (call_transform_forwards(st, st->current.transform,
1647                                     &st->buffer, &transform_err))
1648             goto free_out;
1649         buf_prepend_uint32(&st->buffer,LABEL_MSG0);
1650         buf_prepend_uint32(&st->buffer,st->index);
1651         buf_prepend_uint32(&st->buffer,st->current.remote_session_id);
1652         transport_xmit(st,&st->peers,&st->buffer,True);
1653         BUF_FREE(&st->buffer);
1654     free_out:
1655         return True;
1656     }
1657     return False;
1658 }
1659
1660 /* We go into this state if our peer becomes uncommunicative. Similar to
1661    the "stop" state, we forget all session keys for a while, before
1662    re-entering the "run" state. */
1663 static void enter_state_wait(struct site *st)
1664 {
1665     slog(st,LOG_STATE,"entering state WAIT");
1666     st->timeout=st->now+wait_timeout(st);
1667     st->state=SITE_WAIT;
1668     set_link_quality(st);
1669     BUF_FREE(&st->buffer); /* will have had an outgoing packet in it */
1670     /* XXX Erase keys etc. */
1671 }
1672
1673 static void generate_prod(struct site *st, struct buffer_if *buf)
1674 {
1675     buffer_init(buf,0);
1676     buf_append_uint32(buf,0);
1677     buf_append_uint32(buf,0);
1678     buf_append_uint32(buf,LABEL_PROD);
1679     buf_append_string(buf,st->localname);
1680     buf_append_string(buf,st->remotename);
1681 }
1682
1683 static void generate_send_prod(struct site *st,
1684                                const struct comm_addr *source)
1685 {
1686     if (!st->allow_send_prod) return; /* too soon */
1687     if (!(st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1688           st->state==SITE_WAIT)) return; /* we'd ignore peer's MSG1 */
1689
1690     slog(st,LOG_SETUP_INIT,"prodding peer for key exchange");
1691     st->allow_send_prod=0;
1692     generate_prod(st,&st->scratch);
1693     bool_t ok = comm_addr_sendmsg(st, source, &st->scratch);
1694     dump_packet(st,&st->scratch,source,False,ok);
1695 }
1696
1697 static inline void site_settimeout(uint64_t timeout, int *timeout_io)
1698 {
1699     if (timeout) {
1700         int64_t offset=timeout-*now;
1701         if (offset<0) offset=0;
1702         if (offset>INT_MAX) offset=INT_MAX;
1703         if (*timeout_io<0 || offset<*timeout_io)
1704             *timeout_io=offset;
1705     }
1706 }
1707
1708 static int site_beforepoll(void *sst, struct pollfd *fds, int *nfds_io,
1709                            int *timeout_io)
1710 {
1711     struct site *st=sst;
1712
1713     BEFOREPOLL_WANT_FDS(0); /* We don't use any file descriptors */
1714     st->now=*now;
1715
1716     /* Work out when our next timeout is. The earlier of 'timeout' or
1717        'current.key_timeout'. A stored value of '0' indicates no timeout
1718        active. */
1719     site_settimeout(st->timeout, timeout_io);
1720     site_settimeout(st->current.key_timeout, timeout_io);
1721     site_settimeout(st->auxiliary_key.key_timeout, timeout_io);
1722
1723     return 0; /* success */
1724 }
1725
1726 static void check_expiry(struct site *st, struct data_key *key,
1727                          const char *which)
1728 {
1729     if (key->key_timeout && *now>key->key_timeout) {
1730         delete_one_key(st,key,"maximum life exceeded",which,LOG_TIMEOUT_KEY);
1731     }
1732 }
1733
1734 /* NB site_afterpoll will be called before site_beforepoll is ever called */
1735 static void site_afterpoll(void *sst, struct pollfd *fds, int nfds)
1736 {
1737     struct site *st=sst;
1738
1739     st->now=*now;
1740     if (st->timeout && *now>st->timeout) {
1741         st->timeout=0;
1742         if (st->state>=SITE_SENTMSG1 && st->state<=SITE_SENTMSG5) {
1743             if (!hacky_par_start_failnow())
1744                 send_msg(st);
1745         } else if (st->state==SITE_WAIT) {
1746             enter_state_run(st);
1747         } else {
1748             slog(st,LOG_ERROR,"site_afterpoll: unexpected timeout, state=%d",
1749                  st->state);
1750         }
1751     }
1752     check_expiry(st,&st->current,"current key");
1753     check_expiry(st,&st->auxiliary_key,"auxiliary key");
1754 }
1755
1756 /* This function is called by the netlink device to deliver packets
1757    intended for the remote network. The packet is in "raw" wire
1758    format, but is guaranteed to be word-aligned. */
1759 static void site_outgoing(void *sst, struct buffer_if *buf)
1760 {
1761     struct site *st=sst;
1762     cstring_t transform_err;
1763     
1764     if (st->state==SITE_STOP) {
1765         BUF_FREE(buf);
1766         return;
1767     }
1768
1769     st->allow_send_prod=1;
1770
1771     /* In all other states we consider delivering the packet if we have
1772        a valid key and a valid address to send it to. */
1773     if (current_valid(st) && transport_peers_valid(&st->peers)) {
1774         /* Transform it and send it */
1775         if (buf->size>0) {
1776             buf_prepend_uint32(buf,LABEL_MSG9);
1777             if (call_transform_forwards(st, st->current.transform,
1778                                         buf, &transform_err))
1779                 goto free_out;
1780             buf_prepend_uint32(buf,LABEL_MSG0);
1781             buf_prepend_uint32(buf,st->index);
1782             buf_prepend_uint32(buf,st->current.remote_session_id);
1783             transport_xmit(st,&st->peers,buf,False);
1784         }
1785     free_out:
1786         BUF_FREE(buf);
1787         return;
1788     }
1789
1790     slog(st,LOG_DROP,"discarding outgoing packet of size %d",buf->size);
1791     BUF_FREE(buf);
1792     initiate_key_setup(st,"outgoing packet",0);
1793 }
1794
1795 static bool_t named_for_us(struct site *st, const struct buffer_if *buf_in,
1796                            uint32_t type, struct msg *m)
1797     /* For packets which are identified by the local and remote names.
1798      * If it has our name and our peer's name in it it's for us. */
1799 {
1800     struct buffer_if buf[1];
1801     buffer_readonly_clone(buf,buf_in);
1802     return unpick_msg(st,type,buf,m)
1803         && name_matches(&m->remote,st->remotename)
1804         && name_matches(&m->local,st->localname);
1805 }
1806
1807 static bool_t we_have_priority(struct site *st, const struct msg *m) {
1808     if (st->local_capabilities & m->remote_capabilities &
1809         CAPAB_PRIORITY_MOBILE) {
1810         if (st->local_mobile) return True;
1811         if (st-> peer_mobile) return False;
1812     }
1813     return st->our_name_later;
1814 }
1815
1816 static bool_t setup_late_msg_ok(struct site *st, 
1817                                 const struct buffer_if *buf_in,
1818                                 uint32_t msgtype,
1819                                 const struct comm_addr *source) {
1820     /* For setup packets which seem from their type like they are
1821      * late.  Maybe they came via a different path.  All we do is make
1822      * a note of the sending address, iff they look like they are part
1823      * of the current key setup attempt. */
1824     struct msg m;
1825     if (!named_for_us(st,buf_in,msgtype,&m))
1826         /* named_for_us calls unpick_msg which gets the nonces */
1827         return False;
1828     if (!consttime_memeq(m.nR,st->remoteN,NONCELEN) ||
1829         !consttime_memeq(m.nL,st->localN, NONCELEN))
1830         /* spoof ?  from stale run ?  who knows */
1831         return False;
1832     transport_setup_msgok(st,source);
1833     return True;
1834 }
1835
1836 /* This function is called by the communication device to deliver
1837    packets from our peers.
1838    It should return True if the packet is recognised as being for
1839    this current site instance (and should therefore not be processed
1840    by other sites), even if the packet was otherwise ignored. */
1841 static bool_t site_incoming(void *sst, struct buffer_if *buf,
1842                             const struct comm_addr *source)
1843 {
1844     struct site *st=sst;
1845
1846     if (buf->size < 12) return False;
1847
1848     uint32_t dest=get_uint32(buf->start);
1849     uint32_t msgtype=get_uint32(buf->start+8);
1850     struct msg named_msg;
1851
1852     if (msgtype==LABEL_MSG1) {
1853         if (!named_for_us(st,buf,msgtype,&named_msg))
1854             return False;
1855         /* It's a MSG1 addressed to us. Decide what to do about it. */
1856         dump_packet(st,buf,source,True,True);
1857         if (st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1858             st->state==SITE_WAIT) {
1859             /* We should definitely process it */
1860             transport_compute_setupinit_peers(st,0,0,source);
1861             if (process_msg1(st,buf,source,&named_msg)) {
1862                 slog(st,LOG_SETUP_INIT,"key setup initiated by peer");
1863                 bool_t entered=enter_new_state(st,SITE_SENTMSG2);
1864                 if (entered && st->addresses && st->local_mobile)
1865                     /* We must do this as the very last thing, because
1866                        the resolver callback might reenter us. */
1867                     ensure_resolving(st);
1868             } else {
1869                 slog(st,LOG_ERROR,"failed to process incoming msg1");
1870             }
1871             BUF_FREE(buf);
1872             return True;
1873         } else if (st->state==SITE_SENTMSG1) {
1874             /* We've just sent a message 1! They may have crossed on
1875                the wire. If we have priority then we ignore the
1876                incoming one, otherwise we process it as usual. */
1877             if (we_have_priority(st,&named_msg)) {
1878                 BUF_FREE(buf);
1879                 if (!st->msg1_crossed_logged++)
1880                     slog(st,LOG_SETUP_INIT,"crossed msg1s; we are higher "
1881                          "priority => ignore incoming msg1");
1882                 return True;
1883             } else {
1884                 slog(st,LOG_SETUP_INIT,"crossed msg1s; we are lower "
1885                      "priority => use incoming msg1");
1886                 if (process_msg1(st,buf,source,&named_msg)) {
1887                     BUF_FREE(&st->buffer); /* Free our old message 1 */
1888                     transport_setup_msgok(st,source);
1889                     enter_new_state(st,SITE_SENTMSG2);
1890                 } else {
1891                     slog(st,LOG_ERROR,"failed to process an incoming "
1892                          "crossed msg1 (we have low priority)");
1893                 }
1894                 BUF_FREE(buf);
1895                 return True;
1896             }
1897         } else if (st->state==SITE_SENTMSG2 ||
1898                    st->state==SITE_SENTMSG4) {
1899             if (consttime_memeq(named_msg.nR,st->remoteN,NONCELEN)) {
1900                 /* We are ahead in the protocol, but that msg1 had the
1901                  * peer's nonce so presumably it is from this key
1902                  * exchange run, via a slower route */
1903                 transport_setup_msgok(st,source);
1904             } else {
1905                 slog(st,LOG_UNEXPECTED,"competing incoming message 1");
1906             }
1907             BUF_FREE(buf);
1908             return True;
1909         }
1910         /* The message 1 was received at an unexpected stage of the
1911            key setup.  Well, they lost the race. */
1912         slog(st,LOG_UNEXPECTED,"unexpected incoming message 1");
1913         BUF_FREE(buf);
1914         return True;
1915     }
1916     if (msgtype==LABEL_PROD) {
1917         if (!named_for_us(st,buf,msgtype,&named_msg))
1918             return False;
1919         dump_packet(st,buf,source,True,True);
1920         if (st->state!=SITE_RUN) {
1921             slog(st,LOG_DROP,"ignoring PROD when not in state RUN");
1922         } else if (current_valid(st)) {
1923             slog(st,LOG_DROP,"ignoring PROD when we think we have a key");
1924         } else {
1925             initiate_key_setup(st,"peer sent PROD packet",source);
1926         }
1927         BUF_FREE(buf);
1928         return True;
1929     }
1930     if (dest==st->index) {
1931         /* Explicitly addressed to us */
1932         if (msgtype!=LABEL_MSG0) dump_packet(st,buf,source,True,True);
1933         switch (msgtype) {
1934         case LABEL_NAK:
1935             /* If the source is our current peer then initiate a key setup,
1936                because our peer's forgotten the key */
1937             if (get_uint32(buf->start+4)==st->current.remote_session_id) {
1938                 bool_t initiated;
1939                 initiated = initiate_key_setup(st,"received a NAK",source);
1940                 if (!initiated) generate_send_prod(st,source);
1941             } else {
1942                 slog(st,LOG_SEC,"bad incoming NAK");
1943             }
1944             break;
1945         case LABEL_MSG0:
1946             process_msg0(st,buf,source);
1947             break;
1948         case LABEL_MSG1:
1949             /* Setup packet: should not have been explicitly addressed
1950                to us */
1951             slog(st,LOG_SEC,"incoming explicitly addressed msg1");
1952             break;
1953         case LABEL_MSG2:
1954             /* Setup packet: expected only in state SENTMSG1 */
1955             if (st->state!=SITE_SENTMSG1) {
1956                 if ((st->state==SITE_SENTMSG3 ||
1957                      st->state==SITE_SENTMSG5) &&
1958                     setup_late_msg_ok(st,buf,msgtype,source))
1959                     break;
1960                 slog(st,LOG_UNEXPECTED,"unexpected MSG2");
1961             } else if (process_msg2(st,buf,source)) {
1962                 transport_setup_msgok(st,source);
1963                 enter_new_state(st,SITE_SENTMSG3);
1964             } else {
1965                 slog(st,LOG_SEC,"invalid MSG2");
1966             }
1967             break;
1968         case CASES_MSG3_KNOWN:
1969             /* Setup packet: expected only in state SENTMSG2 */
1970             if (st->state!=SITE_SENTMSG2) {
1971                 if ((st->state==SITE_SENTMSG4) &&
1972                     setup_late_msg_ok(st,buf,msgtype,source))
1973                     break;
1974                 slog(st,LOG_UNEXPECTED,"unexpected MSG3");
1975             } else if (process_msg3(st,buf,source,msgtype)) {
1976                 transport_setup_msgok(st,source);
1977                 enter_new_state(st,SITE_SENTMSG4);
1978             } else {
1979                 slog(st,LOG_SEC,"invalid MSG3");
1980             }
1981             break;
1982         case LABEL_MSG4:
1983             /* Setup packet: expected only in state SENTMSG3 */
1984             if (st->state!=SITE_SENTMSG3) {
1985                 if ((st->state==SITE_SENTMSG5) &&
1986                     setup_late_msg_ok(st,buf,msgtype,source))
1987                     break;
1988                 slog(st,LOG_UNEXPECTED,"unexpected MSG4");
1989             } else if (process_msg4(st,buf,source)) {
1990                 transport_setup_msgok(st,source);
1991                 enter_new_state(st,SITE_SENTMSG5);
1992             } else {
1993                 slog(st,LOG_SEC,"invalid MSG4");
1994             }
1995             break;
1996         case LABEL_MSG5:
1997             /* Setup packet: expected only in state SENTMSG4 */
1998             /* (may turn up in state RUN if our return MSG6 was lost
1999                and the new key has already been activated. In that
2000                case we discard it. The peer will realise that we
2001                are using the new key when they see our data packets.
2002                Until then the peer's data packets to us get discarded. */
2003             if (st->state==SITE_SENTMSG4) {
2004                 if (process_msg5(st,buf,source,st->new_transform)) {
2005                     transport_setup_msgok(st,source);
2006                     enter_new_state(st,SITE_RUN);
2007                 } else {
2008                     slog(st,LOG_SEC,"invalid MSG5");
2009                 }
2010             } else if (st->state==SITE_RUN) {
2011                 if (process_msg5(st,buf,source,st->current.transform)) {
2012                     slog(st,LOG_DROP,"got MSG5, retransmitting MSG6");
2013                     transport_setup_msgok(st,source);
2014                     create_msg6(st,st->current.transform,
2015                                 st->current.remote_session_id);
2016                     transport_xmit(st,&st->peers,&st->buffer,True);
2017                     BUF_FREE(&st->buffer);
2018                 } else {
2019                     slog(st,LOG_SEC,"invalid MSG5 (in state RUN)");
2020                 }
2021             } else {
2022                 slog(st,LOG_UNEXPECTED,"unexpected MSG5");
2023             }
2024             break;
2025         case LABEL_MSG6:
2026             /* Setup packet: expected only in state SENTMSG5 */
2027             if (st->state!=SITE_SENTMSG5) {
2028                 slog(st,LOG_UNEXPECTED,"unexpected MSG6");
2029             } else if (process_msg6(st,buf,source)) {
2030                 BUF_FREE(&st->buffer); /* Free message 5 */
2031                 transport_setup_msgok(st,source);
2032                 activate_new_key(st);
2033             } else {
2034                 slog(st,LOG_SEC,"invalid MSG6");
2035             }
2036             break;
2037         default:
2038             slog(st,LOG_SEC,"received message of unknown type 0x%08x",
2039                  msgtype);
2040             break;
2041         }
2042         BUF_FREE(buf);
2043         return True;
2044     }
2045
2046     return False;
2047 }
2048
2049 static void site_control(void *vst, bool_t run)
2050 {
2051     struct site *st=vst;
2052     if (run) enter_state_run(st);
2053     else enter_state_stop(st);
2054 }
2055
2056 static void site_phase_hook(void *sst, uint32_t newphase)
2057 {
2058     struct site *st=sst;
2059
2060     /* The program is shutting down; tell our peer */
2061     send_msg7(st,"shutting down");
2062 }
2063
2064 static void site_childpersist_clearkeys(void *sst, uint32_t newphase)
2065 {
2066     struct site *st=sst;
2067     dispose_transform(&st->current.transform);
2068     dispose_transform(&st->auxiliary_key.transform);
2069     dispose_transform(&st->new_transform);
2070     /* Not much point overwiting the signing key, since we loaded it
2071        from disk, and it is only valid prospectively if at all,
2072        anyway. */
2073     /* XXX it would be best to overwrite the DH state, because that
2074        _is_ relevant to forward secrecy.  However we have no
2075        convenient interface for doing that and in practice gmp has
2076        probably dribbled droppings all over the malloc arena.  A good
2077        way to fix this would be to have a privsep child for asymmetric
2078        crypto operations, but that's a task for another day. */
2079 }
2080
2081 static list_t *site_apply(closure_t *self, struct cloc loc, dict_t *context,
2082                           list_t *args)
2083 {
2084     static uint32_t index_sequence;
2085     struct site *st;
2086     item_t *item;
2087     dict_t *dict;
2088     int i;
2089
2090     NEW(st);
2091
2092     st->cl.description="site";
2093     st->cl.type=CL_SITE;
2094     st->cl.apply=NULL;
2095     st->cl.interface=&st->ops;
2096     st->ops.st=st;
2097     st->ops.control=site_control;
2098     st->ops.status=site_status;
2099
2100     /* First parameter must be a dict */
2101     item=list_elem(args,0);
2102     if (!item || item->type!=t_dict)
2103         cfgfatal(loc,"site","parameter must be a dictionary\n");
2104     
2105     dict=item->data.dict;
2106     st->localname=dict_read_string(dict, "local-name", True, "site", loc);
2107     st->remotename=dict_read_string(dict, "name", True, "site", loc);
2108
2109     st->keepalive=dict_read_bool(dict,"keepalive",False,"site",loc,False);
2110
2111     st->peer_mobile=dict_read_bool(dict,"mobile",False,"site",loc,False);
2112     st->local_mobile=
2113         dict_read_bool(dict,"local-mobile",False,"site",loc,False);
2114
2115     /* Sanity check (which also allows the 'sites' file to include
2116        site() closures for all sites including our own): refuse to
2117        talk to ourselves */
2118     if (strcmp(st->localname,st->remotename)==0) {
2119         Message(M_DEBUG,"site %s: local-name==name -> ignoring this site\n",
2120                 st->localname);
2121         if (st->peer_mobile != st->local_mobile)
2122             cfgfatal(loc,"site","site %s's peer-mobile=%d"
2123                     " but our local-mobile=%d\n",
2124                     st->localname, st->peer_mobile, st->local_mobile);
2125         free(st);
2126         return NULL;
2127     }
2128     if (st->peer_mobile && st->local_mobile) {
2129         Message(M_WARNING,"site %s: site is mobile but so are we"
2130                 " -> ignoring this site\n", st->remotename);
2131         free(st);
2132         return NULL;
2133     }
2134
2135     assert(index_sequence < 0xffffffffUL);
2136     st->index = ++index_sequence;
2137     st->local_capabilities = 0;
2138     st->early_capabilities = CAPAB_PRIORITY_MOBILE;
2139     st->netlink=find_cl_if(dict,"link",CL_NETLINK,True,"site",loc);
2140
2141 #define GET_CLOSURE_LIST(dictkey,things,nthings,CL_TYPE) do{            \
2142     list_t *things##_cfg=dict_lookup(dict,dictkey);                     \
2143     if (!things##_cfg)                                                  \
2144         cfgfatal(loc,"site","closure list \"%s\" not found\n",dictkey); \
2145     st->nthings=list_length(things##_cfg);                              \
2146     NEW_ARY(st->things,st->nthings);                                    \
2147     assert(st->nthings);                                                \
2148     for (i=0; i<st->nthings; i++) {                                     \
2149         item_t *item=list_elem(things##_cfg,i);                         \
2150         if (item->type!=t_closure)                                      \
2151             cfgfatal(loc,"site","%s is not a closure\n",dictkey);       \
2152         closure_t *cl=item->data.closure;                               \
2153         if (cl->type!=CL_TYPE)                                          \
2154             cfgfatal(loc,"site","%s closure wrong type\n",dictkey);     \
2155         st->things[i]=cl->interface;                                    \
2156     }                                                                   \
2157 }while(0)
2158
2159     GET_CLOSURE_LIST("comm",comms,ncomms,CL_COMM);
2160
2161     NEW_ARY(st->commclientinfos, st->ncomms);
2162     dict_t *comminfo = dict_read_dict(dict,"comm-info",False,"site",loc);
2163     for (i=0; i<st->ncomms; i++) {
2164         st->commclientinfos[i] =
2165             !comminfo ? 0 :
2166             st->comms[i]->clientinfo(st->comms[i],comminfo,loc);
2167     }
2168
2169     st->resolver=find_cl_if(dict,"resolver",CL_RESOLVER,True,"site",loc);
2170     st->log=find_cl_if(dict,"log",CL_LOG,True,"site",loc);
2171     st->random=find_cl_if(dict,"random",CL_RANDOMSRC,True,"site",loc);
2172
2173     st->privkey=find_cl_if(dict,"local-key",CL_RSAPRIVKEY,True,"site",loc);
2174     st->addresses=dict_read_string_array(dict,"address",False,"site",loc,0);
2175     if (st->addresses)
2176         st->remoteport=dict_read_number(dict,"port",True,"site",loc,0);
2177     else st->remoteport=0;
2178     st->pubkey=find_cl_if(dict,"key",CL_RSAPUBKEY,True,"site",loc);
2179
2180     GET_CLOSURE_LIST("transform",transforms,ntransforms,CL_TRANSFORM);
2181
2182     st->dh=find_cl_if(dict,"dh",CL_DH,True,"site",loc);
2183     st->hash=find_cl_if(dict,"hash",CL_HASH,True,"site",loc);
2184
2185 #define DEFAULT(D) (st->peer_mobile || st->local_mobile \
2186                     ? DEFAULT_MOBILE_##D : DEFAULT_##D)
2187 #define CFG_NUMBER(k,D) dict_read_number(dict,(k),False,"site",loc,DEFAULT(D));
2188
2189     st->key_lifetime=         CFG_NUMBER("key-lifetime",  KEY_LIFETIME);
2190     st->setup_retries=        CFG_NUMBER("setup-retries", SETUP_RETRIES);
2191     st->setup_retry_interval= CFG_NUMBER("setup-timeout", SETUP_RETRY_INTERVAL);
2192     st->wait_timeout_mean=    CFG_NUMBER("wait-time",     WAIT_TIME);
2193     st->mtu_target= dict_read_number(dict,"mtu-target",False,"site",loc,0);
2194
2195     st->mobile_peer_expiry= dict_read_number(
2196        dict,"mobile-peer-expiry",False,"site",loc,DEFAULT_MOBILE_PEER_EXPIRY);
2197
2198     const char *peerskey= st->peer_mobile
2199         ? "mobile-peers-max" : "static-peers-max";
2200     st->transport_peers_max= dict_read_number(
2201         dict,peerskey,False,"site",loc, st->addresses ? 4 : 3);
2202     if (st->transport_peers_max<1 ||
2203         st->transport_peers_max>MAX_PEER_ADDRS) {
2204         cfgfatal(loc,"site", "%s must be in range 1.."
2205                  STRING(MAX_PEER_ADDRS) "\n", peerskey);
2206     }
2207
2208     if (st->key_lifetime < DEFAULT(KEY_RENEGOTIATE_GAP)*2)
2209         st->key_renegotiate_time=st->key_lifetime/2;
2210     else
2211         st->key_renegotiate_time=st->key_lifetime-DEFAULT(KEY_RENEGOTIATE_GAP);
2212     st->key_renegotiate_time=dict_read_number(
2213         dict,"renegotiate-time",False,"site",loc,st->key_renegotiate_time);
2214     if (st->key_renegotiate_time > st->key_lifetime) {
2215         cfgfatal(loc,"site",
2216                  "renegotiate-time must be less than key-lifetime\n");
2217     }
2218
2219     st->log_events=string_list_to_word(dict_lookup(dict,"log-events"),
2220                                        log_event_table,"site");
2221
2222     st->resolving_count=0;
2223     st->allow_send_prod=0;
2224
2225     st->tunname=safe_malloc(strlen(st->localname)+strlen(st->remotename)+5,
2226                             "site_apply");
2227     sprintf(st->tunname,"%s<->%s",st->localname,st->remotename);
2228
2229     /* The information we expect to see in incoming messages of type 1 */
2230     /* fixme: lots of unchecked overflows here, but the results are only
2231        corrupted packets rather than undefined behaviour */
2232     st->our_name_later=(strcmp(st->localname,st->remotename)>0);
2233
2234     buffer_new(&st->buffer,SETUP_BUFFER_LEN);
2235
2236     buffer_new(&st->scratch,SETUP_BUFFER_LEN);
2237     BUF_ALLOC(&st->scratch,"site:scratch");
2238
2239     /* We are interested in poll(), but only for timeouts. We don't have
2240        any fds of our own. */
2241     register_for_poll(st, site_beforepoll, site_afterpoll, "site");
2242     st->timeout=0;
2243
2244     st->remote_capabilities=0;
2245     st->chosen_transform=0;
2246     st->current.key_timeout=0;
2247     st->auxiliary_key.key_timeout=0;
2248     transport_peers_clear(st,&st->peers);
2249     transport_peers_clear(st,&st->setup_peers);
2250     /* XXX mlock these */
2251     st->dhsecret=safe_malloc(st->dh->secret_len,"site:dhsecret");
2252     st->sharedsecret=safe_malloc(st->dh->shared_len, "site:sharedsecret");
2253
2254 #define SET_CAPBIT(bit) do {                                            \
2255     uint32_t capflag = 1UL << (bit);                                    \
2256     if (st->local_capabilities & capflag)                               \
2257         slog(st,LOG_ERROR,"capability bit"                              \
2258              " %d (%#"PRIx32") reused", (bit), capflag);                \
2259     st->local_capabilities |= capflag;                                  \
2260 } while (0)
2261
2262     for (i=0; i<st->ntransforms; i++)
2263         SET_CAPBIT(st->transforms[i]->capab_bit);
2264
2265 #undef SET_CAPBIT
2266
2267     if (st->local_mobile || st->peer_mobile)
2268         st->local_capabilities |= CAPAB_PRIORITY_MOBILE;
2269
2270     /* We need to register the remote networks with the netlink device */
2271     uint32_t netlink_mtu; /* local virtual interface mtu */
2272     st->netlink->reg(st->netlink->st, site_outgoing, st, &netlink_mtu);
2273     if (!st->mtu_target)
2274         st->mtu_target=netlink_mtu;
2275     
2276     for (i=0; i<st->ncomms; i++)
2277         st->comms[i]->request_notify(st->comms[i]->st, st, site_incoming);
2278
2279     st->current.transform=0;
2280     st->auxiliary_key.transform=0;
2281     st->new_transform=0;
2282     st->auxiliary_is_new=0;
2283
2284     enter_state_stop(st);
2285
2286     add_hook(PHASE_SHUTDOWN,site_phase_hook,st);
2287     add_hook(PHASE_CHILDPERSIST,site_childpersist_clearkeys,st);
2288
2289     return new_closure(&st->cl);
2290 }
2291
2292 void site_module(dict_t *dict)
2293 {
2294     add_closure(dict,"site",site_apply);
2295 }
2296
2297
2298 /***** TRANSPORT PEERS definitions *****/
2299
2300 static void transport_peers_debug(struct site *st, transport_peers *dst,
2301                                   const char *didwhat,
2302                                   int nargs, const struct comm_addr *args,
2303                                   size_t stride) {
2304     int i;
2305     char *argp;
2306
2307     if (!(st->log_events & LOG_PEER_ADDRS))
2308         return; /* an optimisation */
2309
2310     slog(st, LOG_PEER_ADDRS, "peers (%s) %s nargs=%d => npeers=%d",
2311          (dst==&st->peers ? "data" :
2312           dst==&st->setup_peers ? "setup" : "UNKNOWN"),
2313          didwhat, nargs, dst->npeers);
2314
2315     for (i=0, argp=(void*)args;
2316          i<nargs;
2317          i++, (argp+=stride?stride:sizeof(*args))) {
2318         const struct comm_addr *ca=(void*)argp;
2319         slog(st, LOG_PEER_ADDRS, " args: addrs[%d]=%s",
2320              i, comm_addr_to_string(ca));
2321     }
2322     for (i=0; i<dst->npeers; i++) {
2323         struct timeval diff;
2324         timersub(tv_now,&dst->peers[i].last,&diff);
2325         const struct comm_addr *ca=&dst->peers[i].addr;
2326         slog(st, LOG_PEER_ADDRS, " peers: addrs[%d]=%s T-%ld.%06ld",
2327              i, comm_addr_to_string(ca),
2328              (unsigned long)diff.tv_sec, (unsigned long)diff.tv_usec);
2329     }
2330 }
2331
2332 static void transport_peers_expire(struct site *st, transport_peers *peers) {
2333     /* peers must be sorted first */
2334     int previous_peers=peers->npeers;
2335     struct timeval oldest;
2336     oldest.tv_sec  = tv_now->tv_sec - st->mobile_peer_expiry;
2337     oldest.tv_usec = tv_now->tv_usec;
2338     while (peers->npeers>1 &&
2339            timercmp(&peers->peers[peers->npeers-1].last, &oldest, <))
2340         peers->npeers--;
2341     if (peers->npeers != previous_peers)
2342         transport_peers_debug(st,peers,"expire", 0,0,0);
2343 }
2344
2345 static bool_t transport_peer_record_one(struct site *st, transport_peers *peers,
2346                                         const struct comm_addr *ca,
2347                                         const struct timeval *tv) {
2348     /* returns false if output is full */
2349     int search;
2350
2351     if (peers->npeers >= st->transport_peers_max)
2352         return 0;
2353
2354     for (search=0; search<peers->npeers; search++)
2355         if (comm_addr_equal(&peers->peers[search].addr, ca))
2356             return 1;
2357
2358     peers->peers[peers->npeers].addr = *ca;
2359     peers->peers[peers->npeers].last = *tv;
2360     peers->npeers++;
2361     return 1;
2362 }
2363
2364 static void transport_record_peers(struct site *st, transport_peers *peers,
2365                                    const struct comm_addr *addrs, int naddrs,
2366                                    const char *m) {
2367     /* We add addrs into peers.  The new entries end up at the front
2368      * and displace entries towards the end (perhaps even off the
2369      * end).  Any existing matching entries are moved up to the front.
2370      *
2371      * Caller must first call transport_peers_expire. */
2372
2373     if (naddrs==1) {
2374         /* avoids debug for uninteresting updates */
2375         int i;
2376         for (i=0; i<peers->npeers; i++) {
2377             if (comm_addr_equal(&addrs[0], &peers->peers[i].addr)) {
2378                 memmove(peers->peers+1, peers->peers,
2379                         sizeof(peers->peers[0]) * i);
2380                 peers->peers[0].addr = addrs[0];
2381                 peers->peers[0].last = *tv_now;
2382                 return;
2383             }
2384         }
2385     }
2386
2387     int old_npeers=peers->npeers;
2388     transport_peer old_peers[old_npeers];
2389     COPY_ARRAY(old_peers,peers->peers,old_npeers);
2390
2391     peers->npeers=0;
2392     int i;
2393     for (i=0; i<naddrs; i++) {
2394         if (!transport_peer_record_one(st,peers, &addrs[i], tv_now))
2395             break;
2396     }
2397     for (i=0; i<old_npeers; i++) {
2398         const transport_peer *old=&old_peers[i];
2399         if (!transport_peer_record_one(st,peers, &old->addr, &old->last))
2400             break;
2401     }
2402
2403     transport_peers_debug(st,peers,m, naddrs,addrs,0);
2404 }
2405
2406 static void transport_expire_record_peers(struct site *st,
2407                                           transport_peers *peers,
2408                                           const struct comm_addr *addrs,
2409                                           int naddrs, const char *m) {
2410     /* Convenience function */
2411     transport_peers_expire(st,peers);
2412     transport_record_peers(st,peers,addrs,naddrs,m);
2413 }
2414
2415 static bool_t transport_compute_setupinit_peers(struct site *st,
2416         const struct comm_addr *configured_addrs /* 0 if none or not found */,
2417         int n_configured_addrs /* 0 if none or not found */,
2418         const struct comm_addr *incoming_packet_addr /* 0 if none */) {
2419     if (!n_configured_addrs && !incoming_packet_addr &&
2420         !transport_peers_valid(&st->peers))
2421         return False;
2422
2423     slog(st,LOG_SETUP_INIT,
2424          "using: %d configured addr(s);%s %d old peer addrs(es)",
2425          n_configured_addrs,
2426          incoming_packet_addr ? " incoming packet address;" : "",
2427          st->peers.npeers);
2428
2429     /* Non-mobile peers try addresses until one is plausible.  The
2430      * effect is that this code always tries first the configured
2431      * address if supplied, or otherwise the address of the incoming
2432      * PROD, or finally the existing data peer if one exists; this is
2433      * as desired. */
2434
2435     transport_peers_copy(st,&st->setup_peers,&st->peers);
2436     transport_peers_expire(st,&st->setup_peers);
2437
2438     if (incoming_packet_addr)
2439         transport_record_peers(st,&st->setup_peers,
2440                                incoming_packet_addr,1, "incoming");
2441
2442     if (n_configured_addrs)
2443         transport_record_peers(st,&st->setup_peers,
2444                               configured_addrs,n_configured_addrs, "setupinit");
2445
2446     assert(transport_peers_valid(&st->setup_peers));
2447     return True;
2448 }
2449
2450 static void transport_setup_msgok(struct site *st, const struct comm_addr *a) {
2451     if (st->peer_mobile)
2452         transport_expire_record_peers(st,&st->setup_peers,a,1,"setupmsg");
2453 }
2454 static void transport_data_msgok(struct site *st, const struct comm_addr *a) {
2455     if (st->peer_mobile)
2456         transport_expire_record_peers(st,&st->peers,a,1,"datamsg");
2457 }
2458
2459 static int transport_peers_valid(transport_peers *peers) {
2460     return peers->npeers;
2461 }
2462 static void transport_peers_clear(struct site *st, transport_peers *peers) {
2463     peers->npeers= 0;
2464     transport_peers_debug(st,peers,"clear",0,0,0);
2465 }
2466 static void transport_peers_copy(struct site *st, transport_peers *dst,
2467                                  const transport_peers *src) {
2468     dst->npeers=src->npeers;
2469     COPY_ARRAY(dst->peers, src->peers, dst->npeers);
2470     transport_peers_debug(st,dst,"copy",
2471                           src->npeers, &src->peers->addr, sizeof(*src->peers));
2472 }
2473
2474 static void transport_resolve_complete(struct site *st,
2475                                        const struct comm_addr *addrs,
2476                                        int naddrs) {
2477     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2478                                   "resolved data");
2479     transport_expire_record_peers(st,&st->setup_peers,addrs,naddrs,
2480                                   "resolved setup");
2481 }
2482
2483 static void transport_resolve_complete_tardy(struct site *st,
2484                                              const struct comm_addr *addrs,
2485                                              int naddrs) {
2486     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2487                                   "resolved tardily");
2488 }
2489
2490 static void transport_peers__copy_by_mask(transport_peer *out, int *nout_io,
2491                                           unsigned mask,
2492                                           const transport_peers *inp) {
2493     /* out and in->peers may be the same region, or nonoverlapping */
2494     const transport_peer *in=inp->peers;
2495     int slot;
2496     for (slot=0; slot<inp->npeers; slot++) {
2497         if (!(mask & (1U << slot)))
2498             continue;
2499         if (!(out==in && slot==*nout_io))
2500             COPY_OBJ(out[*nout_io], in[slot]);
2501         (*nout_io)++;
2502     }
2503 }
2504
2505 void transport_xmit(struct site *st, transport_peers *peers,
2506                     struct buffer_if *buf, bool_t candebug) {
2507     int slot;
2508     transport_peers_expire(st, peers);
2509     unsigned failed=0; /* bitmask */
2510     assert(MAX_PEER_ADDRS < sizeof(unsigned)*CHAR_BIT);
2511
2512     int nfailed=0;
2513     for (slot=0; slot<peers->npeers; slot++) {
2514         transport_peer *peer=&peers->peers[slot];
2515         bool_t ok = comm_addr_sendmsg(st, &peer->addr, buf);
2516         if (candebug)
2517             dump_packet(st, buf, &peer->addr, False, ok);
2518         if (!ok) {
2519             failed |= 1U << slot;
2520             nfailed++;
2521         }
2522         if (ok && !st->peer_mobile)
2523             break;
2524     }
2525     /* Now we need to demote/delete failing addrs: if we are mobile we
2526      * merely demote them; otherwise we delete them. */
2527     if (st->local_mobile) {
2528         unsigned expected = ((1U << nfailed)-1) << (peers->npeers-nfailed);
2529         /* `expected' has all the failures at the end already */
2530         if (failed != expected) {
2531             int fslot=0;
2532             transport_peer failedpeers[nfailed];
2533             transport_peers__copy_by_mask(failedpeers, &fslot, failed,peers);
2534             assert(fslot == nfailed);
2535             int wslot=0;
2536             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2537             assert(wslot+nfailed == peers->npeers);
2538             COPY_ARRAY(peers->peers+wslot, failedpeers, nfailed);
2539             transport_peers_debug(st,peers,"mobile failure reorder",0,0,0);
2540         }
2541     } else {
2542         if (failed && peers->npeers > 1) {
2543             int wslot=0;
2544             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2545             peers->npeers=wslot;
2546             transport_peers_debug(st,peers,"non-mobile failure cleanup",0,0,0);
2547         }
2548     }
2549 }
2550
2551 /***** END of transport peers declarations *****/