chiark / gitweb /
db1452394bf67b7f173cb8133dd2793c573f24eb
[secnet.git] / site.c
1 /* site.c - manage communication with a remote network site */
2
3 /*
4  * This file is part of secnet.
5  * See README for full list of copyright holders.
6  *
7  * secnet is free software; you can redistribute it and/or modify it
8  * under the terms of the GNU General Public License as published by
9  * the Free Software Foundation; either version 3 of the License, or
10  * (at your option) any later version.
11  * 
12  * secnet is distributed in the hope that it will be useful, but
13  * WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15  * General Public License for more details.
16  * 
17  * You should have received a copy of the GNU General Public License
18  * version 3 along with secnet; if not, see
19  * https://www.gnu.org/licenses/gpl.html.
20  */
21
22 /* The 'site' code doesn't know anything about the structure of the
23    packets it's transmitting.  In fact, under the new netlink
24    configuration scheme it doesn't need to know anything at all about
25    IP addresses, except how to contact its peer.  This means it could
26    potentially be used to tunnel other protocols too (IPv6, IPX, plain
27    old Ethernet frames) if appropriate netlink code can be written
28    (and that ought not to be too hard, eg. using the TUN/TAP device to
29    pretend to be an Ethernet interface).  */
30
31 /* At some point in the future the netlink code will be asked for
32    configuration information to go in the PING/PONG packets at the end
33    of the key exchange. */
34
35 #include "secnet.h"
36 #include <stdio.h>
37 #include <string.h>
38 #include <limits.h>
39 #include <assert.h>
40 #include <sys/socket.h>
41
42 #include <sys/mman.h>
43 #include "util.h"
44 #include "unaligned.h"
45 #include "magic.h"
46
47 #define SETUP_BUFFER_LEN 2048
48
49 #define DEFAULT_KEY_LIFETIME                  (3600*1000) /* [ms] */
50 #define DEFAULT_KEY_RENEGOTIATE_GAP           (5*60*1000) /* [ms] */
51 #define DEFAULT_SETUP_RETRIES 5
52 #define DEFAULT_SETUP_RETRY_INTERVAL             (2*1000) /* [ms] */
53 #define DEFAULT_WAIT_TIME                       (20*1000) /* [ms] */
54
55 #define DEFAULT_MOBILE_KEY_LIFETIME      (2*24*3600*1000) /* [ms] */
56 #define DEFAULT_MOBILE_KEY_RENEGOTIATE_GAP (12*3600*1000) /* [ms] */
57 #define DEFAULT_MOBILE_SETUP_RETRIES 30
58 #define DEFAULT_MOBILE_SETUP_RETRY_INTERVAL      (1*1000) /* [ms] */
59 #define DEFAULT_MOBILE_WAIT_TIME                (10*1000) /* [ms] */
60
61 #define DEFAULT_MOBILE_PEER_EXPIRY            (2*60)      /* [s] */
62
63 /* Each site can be in one of several possible states. */
64
65 /* States:
66    SITE_STOP         - nothing is allowed to happen; tunnel is down;
67                        all session keys have been erased
68      -> SITE_RUN upon external instruction
69    SITE_RUN          - site up, maybe with valid key
70      -> SITE_RESOLVE upon outgoing packet and no valid key
71          we start name resolution for the other end of the tunnel
72      -> SITE_SENTMSG2 upon valid incoming message 1 and suitable time
73          we send an appropriate message 2
74    SITE_RESOLVE      - waiting for name resolution
75      -> SITE_SENTMSG1 upon successful resolution
76          we send an appropriate message 1
77      -> SITE_SENTMSG2 upon valid incoming message 1 (then abort resolution)
78          we abort resolution and 
79      -> SITE_WAIT on timeout or resolution failure
80    SITE_SENTMSG1
81      -> SITE_SENTMSG2 upon valid incoming message 1 from higher priority end
82      -> SITE_SENTMSG3 upon valid incoming message 2
83      -> SITE_WAIT on timeout
84    SITE_SENTMSG2
85      -> SITE_SENTMSG4 upon valid incoming message 3
86      -> SITE_WAIT on timeout
87    SITE_SENTMSG3
88      -> SITE_SENTMSG5 upon valid incoming message 4
89      -> SITE_WAIT on timeout
90    SITE_SENTMSG4
91      -> SITE_RUN upon valid incoming message 5
92      -> SITE_WAIT on timeout
93    SITE_SENTMSG5
94      -> SITE_RUN upon valid incoming message 6
95      -> SITE_WAIT on timeout
96    SITE_WAIT         - failed to establish key; do nothing for a while
97      -> SITE_RUN on timeout
98    */
99
100 #define SITE_STOP     0
101 #define SITE_RUN      1
102 #define SITE_RESOLVE  2
103 #define SITE_SENTMSG1 3
104 #define SITE_SENTMSG2 4
105 #define SITE_SENTMSG3 5
106 #define SITE_SENTMSG4 6
107 #define SITE_SENTMSG5 7
108 #define SITE_WAIT     8
109
110 int32_t site_max_start_pad = 4*4;
111
112 static cstring_t state_name(uint32_t state)
113 {
114     switch (state) {
115     case 0: return "STOP";
116     case 1: return "RUN";
117     case 2: return "RESOLVE";
118     case 3: return "SENTMSG1";
119     case 4: return "SENTMSG2";
120     case 5: return "SENTMSG3";
121     case 6: return "SENTMSG4";
122     case 7: return "SENTMSG5";
123     case 8: return "WAIT";
124     default: return "*bad state*";
125     }
126 }
127
128 #define NONCELEN 8
129
130 #define LOG_UNEXPECTED    0x00000001
131 #define LOG_SETUP_INIT    0x00000002
132 #define LOG_SETUP_TIMEOUT 0x00000004
133 #define LOG_ACTIVATE_KEY  0x00000008
134 #define LOG_TIMEOUT_KEY   0x00000010
135 #define LOG_SEC           0x00000020
136 #define LOG_STATE         0x00000040
137 #define LOG_DROP          0x00000080
138 #define LOG_DUMP          0x00000100
139 #define LOG_ERROR         0x00000400
140 #define LOG_PEER_ADDRS    0x00000800
141
142 static struct flagstr log_event_table[]={
143     { "unexpected", LOG_UNEXPECTED },
144     { "setup-init", LOG_SETUP_INIT },
145     { "setup-timeout", LOG_SETUP_TIMEOUT },
146     { "activate-key", LOG_ACTIVATE_KEY },
147     { "timeout-key", LOG_TIMEOUT_KEY },
148     { "security", LOG_SEC },
149     { "state-change", LOG_STATE },
150     { "packet-drop", LOG_DROP },
151     { "dump-packets", LOG_DUMP },
152     { "errors", LOG_ERROR },
153     { "peer-addrs", LOG_PEER_ADDRS },
154     { "default", LOG_SETUP_INIT|LOG_SETUP_TIMEOUT|
155       LOG_ACTIVATE_KEY|LOG_TIMEOUT_KEY|LOG_SEC|LOG_ERROR },
156     { "all", 0xffffffff },
157     { NULL, 0 }
158 };
159
160
161 /***** TRANSPORT PEERS declarations *****/
162
163 /* Details of "mobile peer" semantics:
164
165    - We use the same data structure for the different configurations,
166      but manage it with different algorithms.
167    
168    - We record up to mobile_peers_max peer address/port numbers
169      ("peers") for key setup, and separately up to mobile_peers_max
170      for data transfer.
171
172    - In general, we make a new set of addrs (see below) when we start
173      a new key exchange; the key setup addrs become the data transport
174      addrs when key setup complets.
175
176    If our peer is mobile:
177
178    - We send to all recent addresses of incoming packets, plus
179      initially all configured addresses (which we also expire).
180
181    - So, we record addrs of good incoming packets, as follows:
182       1. expire any peers last seen >120s ("mobile-peer-expiry") ago
183       2. add the peer of the just received packet to the applicable list
184          (possibly evicting the oldest entries to make room)
185      NB that we do not expire peers until an incoming packet arrives.
186
187    - If the peer has a configured address or name, we record them the
188      same way, but only as a result of our own initiation of key
189      setup.  (We might evict some incoming packet addrs to make room.)
190
191    - The default number of addrs to keep is 3, or 4 if we have a
192      configured name or address.  That's space for two configured
193      addresses (one IPv6 and one IPv4), plus two received addresses.
194
195    - Outgoing packets are sent to every recorded address in the
196      applicable list.  Any unsupported[1] addresses are deleted from
197      the list right away.  (This should only happen to configured
198      addresses, of course, but there is no need to check that.)
199
200    - When we successfully complete a key setup, we merge the key setup
201      peers into the data transfer peers.
202
203    [1] An unsupported address is one for whose AF we don't have a
204      socket (perhaps because we got EAFNOSUPPORT or some such) or for
205      which sendto gives ENETUNREACH.
206
207    If neither end is mobile:
208
209    - When peer initiated the key exchange, we use the incoming packet
210      address.
211
212    - When we initiate the key exchange, we try configured addresses
213      until we get one which isn't unsupported then fixate on that.
214
215    - When we complete a key setup, we replace the data transport peers
216      with those from the key setup.
217
218    If we are mobile:
219
220    - We can't tell when local network setup changes so we can't cache
221      the unsupported addrs and completely remove the spurious calls to
222      sendto, but we can optimise things a bit by deprioritising addrs
223      which seem to be unsupported.
224
225    - Use only configured addresses.  (Except, that if our peer
226      initiated a key exchange we use the incoming packet address until
227      our name resolution completes.)
228
229    - When we send a packet, try each address in turn; if addr
230      supported, put that address to the end of the list for future
231      packets, and go onto the next address.
232
233    - When we complete a key setup, we replace the data transport peers
234      with those from the key setup.
235
236    */
237
238 typedef struct {
239     struct timeval last;
240     struct comm_addr addr;
241 } transport_peer;
242
243 typedef struct {
244 /* configuration information */
245 /* runtime information */
246     int npeers;
247     transport_peer peers[MAX_PEER_ADDRS];
248 } transport_peers;
249
250 /* Basic operations on transport peer address sets */
251 static void transport_peers_clear(struct site *st, transport_peers *peers);
252 static int transport_peers_valid(transport_peers *peers);
253 static void transport_peers_copy(struct site *st, transport_peers *dst,
254                                  const transport_peers *src);
255
256 /* Record address of incoming setup packet; resp. data packet. */
257 static void transport_setup_msgok(struct site *st, const struct comm_addr *a);
258 static void transport_data_msgok(struct site *st, const struct comm_addr *a);
259
260 /* Initialise the setup addresses.  Called before we send the first
261  * packet in a key exchange.  If we are the initiator, as a result of
262  * resolve completing (or being determined not to be relevant) or an
263  * incoming PROD; if we are the responder, as a result of the MSG1. */
264 static bool_t transport_compute_setupinit_peers(struct site *st,
265         const struct comm_addr *configured_addrs /* 0 if none or not found */,
266         int n_configured_addrs /* 0 if none or not found */,
267         const struct comm_addr *incoming_packet_addr /* 0 if none */);
268
269 /* Called if we are the responder in a key setup, when the resolve
270  * completes.  transport_compute_setupinit_peers will hvae been called
271  * earlier.  If _complete is called, we are still doing the key setup
272  * (and we should use the new values for both the rest of the key
273  * setup and the ongoing data exchange); if _tardy is called, the key
274  * setup is done (either completed or not) and only the data peers are
275  * relevant */
276 static void transport_resolve_complete(struct site *st,
277         const struct comm_addr *addrs, int naddrs);
278 static void transport_resolve_complete_tardy(struct site *st,
279         const struct comm_addr *addrs, int naddrs);
280
281 static void transport_xmit(struct site *st, transport_peers *peers,
282                            struct buffer_if *buf, bool_t candebug);
283
284  /***** END of transport peers declarations *****/
285
286
287 struct data_key {
288     struct transform_inst_if *transform;
289     uint64_t key_timeout; /* End of life of current key */
290     uint32_t remote_session_id;
291 };
292
293 struct site {
294     closure_t cl;
295     struct site_if ops;
296 /* configuration information */
297     string_t localname;
298     string_t remotename;
299     bool_t keepalive;
300     bool_t local_mobile, peer_mobile; /* Mobile client support */
301     int32_t transport_peers_max;
302     string_t tunname; /* localname<->remotename by default, used in logs */
303     cstring_t *addresses; /* DNS name or address(es) for bootstrapping, optional */
304     int remoteport; /* Port for bootstrapping, optional */
305     uint32_t mtu_target;
306     struct netlink_if *netlink;
307     struct comm_if **comms;
308     struct comm_clientinfo **commclientinfos;
309     int ncomms;
310     struct resolver_if *resolver;
311     struct log_if *log;
312     struct random_if *random;
313     struct rsaprivkey_if *privkey;
314     struct rsapubkey_if *pubkey;
315     struct transform_if **transforms;
316     int ntransforms;
317     struct dh_if *dh;
318     struct hash_if *hash;
319
320     uint32_t index; /* Index of this site */
321     uint32_t local_capabilities;
322     int32_t setup_retries; /* How many times to send setup packets */
323     int32_t setup_retry_interval; /* Initial timeout for setup packets */
324     int32_t wait_timeout; /* How long to wait if setup unsuccessful */
325     int32_t mobile_peer_expiry; /* How long to remember 2ary addresses */
326     int32_t key_lifetime; /* How long a key lasts once set up */
327     int32_t key_renegotiate_time; /* If we see traffic (or a keepalive)
328                                       after this time, initiate a new
329                                       key exchange */
330
331     bool_t our_name_later; /* our name > peer name */
332     uint32_t log_events;
333
334 /* runtime information */
335     uint32_t state;
336     uint64_t now; /* Most recently seen time */
337     bool_t allow_send_prod;
338     bool_t msg1_crossed_logged;
339     int resolving_count;
340     int resolving_n_results_all;
341     int resolving_n_results_stored;
342     struct comm_addr resolving_results[MAX_PEER_ADDRS];
343
344     /* The currently established session */
345     struct data_key current;
346     struct data_key auxiliary_key;
347     bool_t auxiliary_is_new;
348     uint64_t renegotiate_key_time; /* When we can negotiate a new key */
349     uint64_t auxiliary_renegotiate_key_time;
350     transport_peers peers; /* Current address(es) of peer for data traffic */
351
352     /* The current key setup protocol exchange.  We can only be
353        involved in one of these at a time.  There's a potential for
354        denial of service here (the attacker keeps sending a setup
355        packet; we keep trying to continue the exchange, and have to
356        timeout before we can listen for another setup packet); perhaps
357        we should keep a list of 'bad' sources for setup packets. */
358     uint32_t remote_capabilities;
359     uint16_t remote_adv_mtu;
360     struct transform_if *chosen_transform;
361     uint32_t setup_session_id;
362     transport_peers setup_peers;
363     uint8_t localN[NONCELEN]; /* Nonces for key exchange */
364     uint8_t remoteN[NONCELEN];
365     struct buffer_if buffer; /* Current outgoing key exchange packet */
366     struct buffer_if scratch;
367     int32_t retries; /* Number of retries remaining */
368     uint64_t timeout; /* Timeout for current state */
369     uint8_t *dhsecret;
370     uint8_t *sharedsecret;
371     uint32_t sharedsecretlen, sharedsecretallocd;
372     struct transform_inst_if *new_transform; /* For key setup/verify */
373 };
374
375 static uint32_t event_log_priority(struct site *st, uint32_t event)
376 {
377     if (!(event&st->log_events))
378         return 0;
379     switch(event) {
380     case LOG_UNEXPECTED:    return M_INFO;
381     case LOG_SETUP_INIT:    return M_INFO;
382     case LOG_SETUP_TIMEOUT: return M_NOTICE;
383     case LOG_ACTIVATE_KEY:  return M_INFO;
384     case LOG_TIMEOUT_KEY:   return M_INFO;
385     case LOG_SEC:           return M_SECURITY;
386     case LOG_STATE:         return M_DEBUG;
387     case LOG_DROP:          return M_DEBUG;
388     case LOG_DUMP:          return M_DEBUG;
389     case LOG_ERROR:         return M_ERR;
390     case LOG_PEER_ADDRS:    return M_DEBUG;
391     default:                return M_ERR;
392     }
393 }
394
395 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
396 FORMAT(printf,3,0);
397 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
398 {
399     uint32_t class;
400
401     class=event_log_priority(st, event);
402     if (class) {
403         slilog_part(st->log,class,"%s: ",st->tunname);
404         vslilog_part(st->log,class,msg,ap);
405         slilog_part(st->log,class,"\n");
406     }
407 }
408
409 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
410 FORMAT(printf,3,4);
411 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
412 {
413     va_list ap;
414     va_start(ap,msg);
415     vslog(st,event,msg,ap);
416     va_end(ap);
417 }
418
419 static void logtimeout(struct site *st, const char *fmt, ...)
420 FORMAT(printf,2,3);
421 static void logtimeout(struct site *st, const char *fmt, ...)
422 {
423     uint32_t class=event_log_priority(st,LOG_SETUP_TIMEOUT);
424     if (!class)
425         return;
426
427     va_list ap;
428     va_start(ap,fmt);
429
430     slilog_part(st->log,class,"%s: ",st->tunname);
431     vslilog_part(st->log,class,fmt,ap);
432
433     const char *delim;
434     int i;
435     for (i=0, delim=" (tried ";
436          i<st->setup_peers.npeers;
437          i++, delim=", ") {
438         transport_peer *peer=&st->setup_peers.peers[i];
439         const char *s=comm_addr_to_string(&peer->addr);
440         slilog_part(st->log,class,"%s%s",delim,s);
441     }
442
443     slilog_part(st->log,class,")\n");
444     va_end(ap);
445 }
446
447 static void set_link_quality(struct site *st);
448 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel);
449 static void delete_one_key(struct site *st, struct data_key *key,
450                            const char *reason /* may be 0 meaning don't log*/,
451                            const char *which /* ignored if !reasonn */,
452                            uint32_t loglevel /* ignored if !reasonn */);
453 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
454                                  const struct comm_addr *prod_hint);
455 static void enter_state_run(struct site *st);
456 static bool_t enter_state_resolve(struct site *st);
457 static void decrement_resolving_count(struct site *st, int by);
458 static bool_t enter_new_state(struct site *st,uint32_t next);
459 static void enter_state_wait(struct site *st);
460 static void activate_new_key(struct site *st);
461
462 static bool_t is_transform_valid(struct transform_inst_if *transform)
463 {
464     return transform && transform->valid(transform->st);
465 }
466
467 static bool_t current_valid(struct site *st)
468 {
469     return is_transform_valid(st->current.transform);
470 }
471
472 #define DEFINE_CALL_TRANSFORM(fwdrev)                                   \
473 static int call_transform_##fwdrev(struct site *st,                     \
474                                    struct transform_inst_if *transform, \
475                                    struct buffer_if *buf,               \
476                                    const char **errmsg)                 \
477 {                                                                       \
478     if (!is_transform_valid(transform)) {                               \
479         *errmsg="transform not set up";                                 \
480         return 1;                                                       \
481     }                                                                   \
482     return transform->fwdrev(transform->st,buf,errmsg);                 \
483 }
484
485 DEFINE_CALL_TRANSFORM(forwards)
486 DEFINE_CALL_TRANSFORM(reverse)
487
488 static void dispose_transform(struct transform_inst_if **transform_var)
489 {
490     struct transform_inst_if *transform=*transform_var;
491     if (transform) {
492         transform->delkey(transform->st);
493         transform->destroy(transform->st);
494     }
495     *transform_var = 0;
496 }    
497
498 #define CHECK_AVAIL(b,l) do { if ((b)->size<(l)) return False; } while(0)
499 #define CHECK_EMPTY(b) do { if ((b)->size!=0) return False; } while(0)
500 #define CHECK_TYPE(b,t) do { uint32_t type; \
501     CHECK_AVAIL((b),4); \
502     type=buf_unprepend_uint32((b)); \
503     if (type!=(t)) return False; } while(0)
504
505 static _Bool type_is_msg34(uint32_t type)
506 {
507     return
508         type == LABEL_MSG3 ||
509         type == LABEL_MSG3BIS ||
510         type == LABEL_MSG4;
511 }
512
513 struct parsedname {
514     int32_t len;
515     uint8_t *name;
516     struct buffer_if extrainfo;
517 };
518
519 struct msg {
520     uint8_t *hashstart;
521     uint32_t dest;
522     uint32_t source;
523     struct parsedname remote;
524     struct parsedname local;
525     uint32_t remote_capabilities;
526     uint16_t remote_mtu;
527     int capab_transformnum;
528     uint8_t *nR;
529     uint8_t *nL;
530     int32_t pklen;
531     char *pk;
532     int32_t hashlen;
533     int32_t siglen;
534     char *sig;
535 };
536
537 static _Bool set_new_transform(struct site *st, char *pk)
538 {
539     _Bool ok;
540
541     /* Make room for the shared key */
542     st->sharedsecretlen=st->chosen_transform->keylen?:st->dh->ceil_len;
543     assert(st->sharedsecretlen);
544     if (st->sharedsecretlen > st->sharedsecretallocd) {
545         st->sharedsecretallocd=st->sharedsecretlen;
546         st->sharedsecret=safe_realloc_ary(st->sharedsecret,1,
547                                           st->sharedsecretallocd,
548                                           "site:sharedsecret");
549     }
550
551     /* Generate the shared key */
552     st->dh->makeshared(st->dh->st,st->dhsecret,st->dh->len,pk,
553                        st->sharedsecret,st->sharedsecretlen);
554
555     /* Set up the transform */
556     struct transform_if *generator=st->chosen_transform;
557     struct transform_inst_if *generated=generator->create(generator->st);
558     ok = generated->setkey(generated->st,st->sharedsecret,
559                            st->sharedsecretlen,st->our_name_later);
560
561     dispose_transform(&st->new_transform);
562     if (!ok) return False;
563     st->new_transform=generated;
564
565     slog(st,LOG_SETUP_INIT,"key exchange negotiated transform"
566          " %d (capabilities ours=%#"PRIx32" theirs=%#"PRIx32")",
567          st->chosen_transform->capab_transformnum,
568          st->local_capabilities, st->remote_capabilities);
569     return True;
570 }
571
572 struct xinfoadd {
573     int32_t lenpos, afternul;
574 };
575 static void append_string_xinfo_start(struct buffer_if *buf,
576                                       struct xinfoadd *xia,
577                                       const char *str)
578     /* Helps construct one of the names with additional info as found
579      * in MSG1..4.  Call this function first, then append all the
580      * desired extra info (not including the nul byte) to the buffer,
581      * then call append_string_xinfo_done. */
582 {
583     xia->lenpos = buf->size;
584     buf_append_string(buf,str);
585     buf_append_uint8(buf,0);
586     xia->afternul = buf->size;
587 }
588 static void append_string_xinfo_done(struct buffer_if *buf,
589                                      struct xinfoadd *xia)
590 {
591     /* we just need to adjust the string length */
592     if (buf->size == xia->afternul) {
593         /* no extra info, strip the nul too */
594         buf_unappend_uint8(buf);
595     } else {
596         put_uint16(buf->start+xia->lenpos, buf->size-(xia->lenpos+2));
597     }
598 }
599
600 /* Build any of msg1 to msg4. msg5 and msg6 are built from the inside
601    out using a transform of config data supplied by netlink */
602 static bool_t generate_msg(struct site *st, uint32_t type, cstring_t what)
603 {
604     void *hst;
605     uint8_t *hash;
606     string_t dhpub, sig;
607
608     st->retries=st->setup_retries;
609     BUF_ALLOC(&st->buffer,what);
610     buffer_init(&st->buffer,0);
611     buf_append_uint32(&st->buffer,
612         (type==LABEL_MSG1?0:st->setup_session_id));
613     buf_append_uint32(&st->buffer,st->index);
614     buf_append_uint32(&st->buffer,type);
615
616     struct xinfoadd xia;
617     append_string_xinfo_start(&st->buffer,&xia,st->localname);
618     if ((st->local_capabilities & CAPAB_EARLY) || (type != LABEL_MSG1)) {
619         buf_append_uint32(&st->buffer,st->local_capabilities);
620     }
621     if (type_is_msg34(type)) {
622         buf_append_uint16(&st->buffer,st->mtu_target);
623     }
624     append_string_xinfo_done(&st->buffer,&xia);
625
626     buf_append_string(&st->buffer,st->remotename);
627     BUF_ADD_OBJ(append,&st->buffer,st->localN);
628     if (type==LABEL_MSG1) return True;
629     BUF_ADD_OBJ(append,&st->buffer,st->remoteN);
630     if (type==LABEL_MSG2) return True;
631
632     if (hacky_par_mid_failnow()) return False;
633
634     if (type==LABEL_MSG3BIS)
635         buf_append_uint8(&st->buffer,st->chosen_transform->capab_transformnum);
636
637     dhpub=st->dh->makepublic(st->dh->st,st->dhsecret,st->dh->len);
638     buf_append_string(&st->buffer,dhpub);
639     free(dhpub);
640     hash=safe_malloc(st->hash->len, "generate_msg");
641     hst=st->hash->init();
642     st->hash->update(hst,st->buffer.start,st->buffer.size);
643     st->hash->final(hst,hash);
644     sig=st->privkey->sign(st->privkey->st,hash,st->hash->len);
645     buf_append_string(&st->buffer,sig);
646     free(sig);
647     free(hash);
648     return True;
649 }
650
651 static bool_t unpick_name(struct buffer_if *msg, struct parsedname *nm)
652 {
653     CHECK_AVAIL(msg,2);
654     nm->len=buf_unprepend_uint16(msg);
655     CHECK_AVAIL(msg,nm->len);
656     nm->name=buf_unprepend(msg,nm->len);
657     uint8_t *nul=memchr(nm->name,0,nm->len);
658     if (!nul) {
659         buffer_readonly_view(&nm->extrainfo,0,0);
660     } else {
661         buffer_readonly_view(&nm->extrainfo, nul+1, msg->start-(nul+1));
662         nm->len=nul-nm->name;
663     }
664     return True;
665 }
666
667 static bool_t unpick_msg(struct site *st, uint32_t type,
668                          struct buffer_if *msg, struct msg *m)
669 {
670     m->capab_transformnum=-1;
671     m->hashstart=msg->start;
672     CHECK_AVAIL(msg,4);
673     m->dest=buf_unprepend_uint32(msg);
674     CHECK_AVAIL(msg,4);
675     m->source=buf_unprepend_uint32(msg);
676     CHECK_TYPE(msg,type);
677     if (!unpick_name(msg,&m->remote)) return False;
678     m->remote_capabilities=0;
679     m->remote_mtu=0;
680     if (m->remote.extrainfo.size) {
681         CHECK_AVAIL(&m->remote.extrainfo,4);
682         m->remote_capabilities=buf_unprepend_uint32(&m->remote.extrainfo);
683     }
684     if (type_is_msg34(type) && m->remote.extrainfo.size) {
685         CHECK_AVAIL(&m->remote.extrainfo,2);
686         m->remote_mtu=buf_unprepend_uint16(&m->remote.extrainfo);
687     }
688     if (!unpick_name(msg,&m->local)) return False;
689     if (type==LABEL_PROD) {
690         CHECK_EMPTY(msg);
691         return True;
692     }
693     CHECK_AVAIL(msg,NONCELEN);
694     m->nR=buf_unprepend(msg,NONCELEN);
695     if (type==LABEL_MSG1) {
696         CHECK_EMPTY(msg);
697         return True;
698     }
699     CHECK_AVAIL(msg,NONCELEN);
700     m->nL=buf_unprepend(msg,NONCELEN);
701     if (type==LABEL_MSG2) {
702         CHECK_EMPTY(msg);
703         return True;
704     }
705     if (type==LABEL_MSG3BIS) {
706         CHECK_AVAIL(msg,1);
707         m->capab_transformnum = buf_unprepend_uint8(msg);
708     } else {
709         m->capab_transformnum = CAPAB_TRANSFORMNUM_ANCIENT;
710     }
711     CHECK_AVAIL(msg,2);
712     m->pklen=buf_unprepend_uint16(msg);
713     CHECK_AVAIL(msg,m->pklen);
714     m->pk=buf_unprepend(msg,m->pklen);
715     m->hashlen=msg->start-m->hashstart;
716     CHECK_AVAIL(msg,2);
717     m->siglen=buf_unprepend_uint16(msg);
718     CHECK_AVAIL(msg,m->siglen);
719     m->sig=buf_unprepend(msg,m->siglen);
720     CHECK_EMPTY(msg);
721
722     /* In `process_msg3_msg4' below, we assume that we can write a nul
723      * terminator following the signature.  Make sure there's enough space.
724      */
725     if (msg->start >= msg->base + msg->alloclen)
726         return False;
727
728     return True;
729 }
730
731 static bool_t name_matches(const struct parsedname *nm, const char *expected)
732 {
733     int expected_len=strlen(expected);
734     return
735         nm->len == expected_len &&
736         !memcmp(nm->name, expected, expected_len);
737 }    
738
739 static bool_t check_msg(struct site *st, uint32_t type, struct msg *m,
740                         cstring_t *error)
741 {
742     if (type==LABEL_MSG1) return True;
743
744     /* Check that the site names and our nonce have been sent
745        back correctly, and then store our peer's nonce. */ 
746     if (!name_matches(&m->remote,st->remotename)) {
747         *error="wrong remote site name";
748         return False;
749     }
750     if (!name_matches(&m->local,st->localname)) {
751         *error="wrong local site name";
752         return False;
753     }
754     if (memcmp(m->nL,st->localN,NONCELEN)!=0) {
755         *error="wrong locally-generated nonce";
756         return False;
757     }
758     if (type==LABEL_MSG2) return True;
759     if (!consttime_memeq(m->nR,st->remoteN,NONCELEN)!=0) {
760         *error="wrong remotely-generated nonce";
761         return False;
762     }
763     /* MSG3 has complicated rules about capabilities, which are
764      * handled in process_msg3. */
765     if (type==LABEL_MSG3 || type==LABEL_MSG3BIS) return True;
766     if (m->remote_capabilities!=st->remote_capabilities) {
767         *error="remote capabilities changed";
768         return False;
769     }
770     if (type==LABEL_MSG4) return True;
771     *error="unknown message type";
772     return False;
773 }
774
775 static bool_t generate_msg1(struct site *st)
776 {
777     st->random->generate(st->random->st,NONCELEN,st->localN);
778     return generate_msg(st,LABEL_MSG1,"site:MSG1");
779 }
780
781 static bool_t process_msg1(struct site *st, struct buffer_if *msg1,
782                            const struct comm_addr *src, struct msg *m)
783 {
784     /* We've already determined we're in an appropriate state to
785        process an incoming MSG1, and that the MSG1 has correct values
786        of A and B. */
787
788     st->setup_session_id=m->source;
789     st->remote_capabilities=m->remote_capabilities;
790     memcpy(st->remoteN,m->nR,NONCELEN);
791     return True;
792 }
793
794 static bool_t generate_msg2(struct site *st)
795 {
796     st->random->generate(st->random->st,NONCELEN,st->localN);
797     return generate_msg(st,LABEL_MSG2,"site:MSG2");
798 }
799
800 static bool_t process_msg2(struct site *st, struct buffer_if *msg2,
801                            const struct comm_addr *src)
802 {
803     struct msg m;
804     cstring_t err;
805
806     if (!unpick_msg(st,LABEL_MSG2,msg2,&m)) return False;
807     if (!check_msg(st,LABEL_MSG2,&m,&err)) {
808         slog(st,LOG_SEC,"msg2: %s",err);
809         return False;
810     }
811     st->setup_session_id=m.source;
812     st->remote_capabilities=m.remote_capabilities;
813
814     /* Select the transform to use */
815
816     uint32_t remote_transforms = st->remote_capabilities & CAPAB_TRANSFORM_MASK;
817     if (!remote_transforms)
818         /* old secnets only had this one transform */
819         remote_transforms = 1UL << CAPAB_TRANSFORMNUM_ANCIENT;
820
821     struct transform_if *ti;
822     int i;
823     for (i=0; i<st->ntransforms; i++) {
824         ti=st->transforms[i];
825         if ((1UL << ti->capab_transformnum) & remote_transforms)
826             goto transform_found;
827     }
828     slog(st,LOG_ERROR,"no transforms in common"
829          " (us %#"PRIx32"; them: %#"PRIx32")",
830          st->local_capabilities & CAPAB_TRANSFORM_MASK,
831          remote_transforms);
832     return False;
833  transform_found:
834     st->chosen_transform=ti;
835
836     memcpy(st->remoteN,m.nR,NONCELEN);
837     return True;
838 }
839
840 static bool_t generate_msg3(struct site *st)
841 {
842     /* Now we have our nonce and their nonce. Think of a secret key,
843        and create message number 3. */
844     st->random->generate(st->random->st,st->dh->len,st->dhsecret);
845     return generate_msg(st,
846                         (st->remote_capabilities & CAPAB_TRANSFORM_MASK
847                          ? LABEL_MSG3BIS : LABEL_MSG3),
848                         "site:MSG3");
849 }
850
851 static bool_t process_msg3_msg4(struct site *st, struct msg *m)
852 {
853     uint8_t *hash;
854     void *hst;
855
856     /* Check signature and store g^x mod m */
857     hash=safe_malloc(st->hash->len, "process_msg3_msg4");
858     hst=st->hash->init();
859     st->hash->update(hst,m->hashstart,m->hashlen);
860     st->hash->final(hst,hash);
861     /* Terminate signature with a '0' - already checked that this will fit */
862     m->sig[m->siglen]=0;
863     if (!st->pubkey->check(st->pubkey->st,hash,st->hash->len,m->sig)) {
864         slog(st,LOG_SEC,"msg3/msg4 signature failed check!");
865         free(hash);
866         return False;
867     }
868     free(hash);
869
870     st->remote_adv_mtu=m->remote_mtu;
871
872     return True;
873 }
874
875 static bool_t process_msg3(struct site *st, struct buffer_if *msg3,
876                            const struct comm_addr *src, uint32_t msgtype)
877 {
878     struct msg m;
879     cstring_t err;
880
881     assert(msgtype==LABEL_MSG3 || msgtype==LABEL_MSG3BIS);
882
883     if (!unpick_msg(st,msgtype,msg3,&m)) return False;
884     if (!check_msg(st,msgtype,&m,&err)) {
885         slog(st,LOG_SEC,"msg3: %s",err);
886         return False;
887     }
888     uint32_t capab_adv_late = m.remote_capabilities
889         & ~st->remote_capabilities & CAPAB_EARLY;
890     if (capab_adv_late) {
891         slog(st,LOG_SEC,"msg3 impermissibly adds early capability flag(s)"
892              " %#"PRIx32" (was %#"PRIx32", now %#"PRIx32")",
893              capab_adv_late, st->remote_capabilities, m.remote_capabilities);
894         return False;
895     }
896     st->remote_capabilities|=m.remote_capabilities;
897
898     struct transform_if *ti;
899     int i;
900     for (i=0; i<st->ntransforms; i++) {
901         ti=st->transforms[i];
902         if (ti->capab_transformnum == m.capab_transformnum)
903             goto transform_found;
904     }
905     slog(st,LOG_SEC,"peer chose unknown-to-us transform %d!",
906          m.capab_transformnum);
907     return False;
908  transform_found:
909     st->chosen_transform=ti;
910
911     if (!process_msg3_msg4(st,&m))
912         return False;
913
914     /* Terminate their DH public key with a '0' */
915     m.pk[m.pklen]=0;
916     /* Invent our DH secret key */
917     st->random->generate(st->random->st,st->dh->len,st->dhsecret);
918
919     /* Generate the shared key and set up the transform */
920     if (!set_new_transform(st,m.pk)) return False;
921
922     return True;
923 }
924
925 static bool_t generate_msg4(struct site *st)
926 {
927     /* We have both nonces, their public key and our private key. Generate
928        our public key, sign it and send it to them. */
929     return generate_msg(st,LABEL_MSG4,"site:MSG4");
930 }
931
932 static bool_t process_msg4(struct site *st, struct buffer_if *msg4,
933                            const struct comm_addr *src)
934 {
935     struct msg m;
936     cstring_t err;
937
938     if (!unpick_msg(st,LABEL_MSG4,msg4,&m)) return False;
939     if (!check_msg(st,LABEL_MSG4,&m,&err)) {
940         slog(st,LOG_SEC,"msg4: %s",err);
941         return False;
942     }
943     
944     if (!process_msg3_msg4(st,&m))
945         return False;
946
947     /* Terminate their DH public key with a '0' */
948     m.pk[m.pklen]=0;
949
950     /* Generate the shared key and set up the transform */
951     if (!set_new_transform(st,m.pk)) return False;
952
953     return True;
954 }
955
956 struct msg0 {
957     uint32_t dest;
958     uint32_t source;
959     uint32_t type;
960 };
961
962 static bool_t unpick_msg0(struct site *st, struct buffer_if *msg0,
963                           struct msg0 *m)
964 {
965     CHECK_AVAIL(msg0,4);
966     m->dest=buf_unprepend_uint32(msg0);
967     CHECK_AVAIL(msg0,4);
968     m->source=buf_unprepend_uint32(msg0);
969     CHECK_AVAIL(msg0,4);
970     m->type=buf_unprepend_uint32(msg0);
971     return True;
972     /* Leaves transformed part of buffer untouched */
973 }
974
975 static bool_t generate_msg5(struct site *st)
976 {
977     cstring_t transform_err;
978
979     BUF_ALLOC(&st->buffer,"site:MSG5");
980     /* We are going to add four words to the message */
981     buffer_init(&st->buffer,calculate_max_start_pad());
982     /* Give the netlink code an opportunity to put its own stuff in the
983        message (configuration information, etc.) */
984     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
985     if (call_transform_forwards(st,st->new_transform,
986                                 &st->buffer,&transform_err))
987         return False;
988     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
989     buf_prepend_uint32(&st->buffer,st->index);
990     buf_prepend_uint32(&st->buffer,st->setup_session_id);
991
992     st->retries=st->setup_retries;
993     return True;
994 }
995
996 static bool_t process_msg5(struct site *st, struct buffer_if *msg5,
997                            const struct comm_addr *src,
998                            struct transform_inst_if *transform)
999 {
1000     struct msg0 m;
1001     cstring_t transform_err;
1002
1003     if (!unpick_msg0(st,msg5,&m)) return False;
1004
1005     if (call_transform_reverse(st,transform,msg5,&transform_err)) {
1006         /* There's a problem */
1007         slog(st,LOG_SEC,"process_msg5: transform: %s",transform_err);
1008         return False;
1009     }
1010     /* Buffer should now contain untransformed PING packet data */
1011     CHECK_AVAIL(msg5,4);
1012     if (buf_unprepend_uint32(msg5)!=LABEL_MSG5) {
1013         slog(st,LOG_SEC,"MSG5/PING packet contained wrong label");
1014         return False;
1015     }
1016     /* Older versions of secnet used to write some config data here
1017      * which we ignore.  So we don't CHECK_EMPTY */
1018     return True;
1019 }
1020
1021 static void create_msg6(struct site *st, struct transform_inst_if *transform,
1022                         uint32_t session_id)
1023 {
1024     cstring_t transform_err;
1025
1026     BUF_ALLOC(&st->buffer,"site:MSG6");
1027     /* We are going to add four words to the message */
1028     buffer_init(&st->buffer,calculate_max_start_pad());
1029     /* Give the netlink code an opportunity to put its own stuff in the
1030        message (configuration information, etc.) */
1031     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1032     int problem = call_transform_forwards(st,transform,
1033                                           &st->buffer,&transform_err);
1034     assert(!problem);
1035     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1036     buf_prepend_uint32(&st->buffer,st->index);
1037     buf_prepend_uint32(&st->buffer,session_id);
1038 }
1039
1040 static bool_t generate_msg6(struct site *st)
1041 {
1042     if (!is_transform_valid(st->new_transform))
1043         return False;
1044     create_msg6(st,st->new_transform,st->setup_session_id);
1045     st->retries=1; /* Peer will retransmit MSG5 if this packet gets lost */
1046     return True;
1047 }
1048
1049 static bool_t process_msg6(struct site *st, struct buffer_if *msg6,
1050                            const struct comm_addr *src)
1051 {
1052     struct msg0 m;
1053     cstring_t transform_err;
1054
1055     if (!unpick_msg0(st,msg6,&m)) return False;
1056
1057     if (call_transform_reverse(st,st->new_transform,msg6,&transform_err)) {
1058         /* There's a problem */
1059         slog(st,LOG_SEC,"process_msg6: transform: %s",transform_err);
1060         return False;
1061     }
1062     /* Buffer should now contain untransformed PING packet data */
1063     CHECK_AVAIL(msg6,4);
1064     if (buf_unprepend_uint32(msg6)!=LABEL_MSG6) {
1065         slog(st,LOG_SEC,"MSG6/PONG packet contained invalid data");
1066         return False;
1067     }
1068     /* Older versions of secnet used to write some config data here
1069      * which we ignore.  So we don't CHECK_EMPTY */
1070     return True;
1071 }
1072
1073 static bool_t decrypt_msg0(struct site *st, struct buffer_if *msg0,
1074                            const struct comm_addr *src)
1075 {
1076     cstring_t transform_err, auxkey_err, newkey_err="n/a";
1077     struct msg0 m;
1078     uint32_t problem;
1079
1080     if (!unpick_msg0(st,msg0,&m)) return False;
1081
1082     /* Keep a copy so we can try decrypting it with multiple keys */
1083     buffer_copy(&st->scratch, msg0);
1084
1085     problem = call_transform_reverse(st,st->current.transform,
1086                                      msg0,&transform_err);
1087     if (!problem) {
1088         if (!st->auxiliary_is_new)
1089             delete_one_key(st,&st->auxiliary_key,
1090                            "peer has used new key","auxiliary key",LOG_SEC);
1091         return True;
1092     }
1093     if (problem==2)
1094         goto skew;
1095
1096     buffer_copy(msg0, &st->scratch);
1097     problem = call_transform_reverse(st,st->auxiliary_key.transform,
1098                                      msg0,&auxkey_err);
1099     if (problem==0) {
1100         slog(st,LOG_DROP,"processing packet which uses auxiliary key");
1101         if (st->auxiliary_is_new) {
1102             /* We previously timed out in state SENTMSG5 but it turns
1103              * out that our peer did in fact get our MSG5 and is
1104              * using the new key.  So we should switch to it too. */
1105             /* This is a bit like activate_new_key. */
1106             struct data_key t;
1107             t=st->current;
1108             st->current=st->auxiliary_key;
1109             st->auxiliary_key=t;
1110
1111             delete_one_key(st,&st->auxiliary_key,"peer has used new key",
1112                            "previous key",LOG_SEC);
1113             st->auxiliary_is_new=0;
1114             st->renegotiate_key_time=st->auxiliary_renegotiate_key_time;
1115         }
1116         return True;
1117     }
1118     if (problem==2)
1119         goto skew;
1120
1121     if (st->state==SITE_SENTMSG5) {
1122         buffer_copy(msg0, &st->scratch);
1123         problem = call_transform_reverse(st,st->new_transform,
1124                                          msg0,&newkey_err);
1125         if (!problem) {
1126             /* It looks like we didn't get the peer's MSG6 */
1127             /* This is like a cut-down enter_new_state(SITE_RUN) */
1128             slog(st,LOG_STATE,"will enter state RUN (MSG0 with new key)");
1129             BUF_FREE(&st->buffer);
1130             st->timeout=0;
1131             activate_new_key(st);
1132             return True; /* do process the data in this packet */
1133         }
1134         if (problem==2)
1135             goto skew;
1136     }
1137
1138     slog(st,LOG_SEC,"transform: %s (aux: %s, new: %s)",
1139          transform_err,auxkey_err,newkey_err);
1140     initiate_key_setup(st,"incoming message would not decrypt",0);
1141     send_nak(src,m.dest,m.source,m.type,msg0,"message would not decrypt");
1142     return False;
1143
1144  skew:
1145     slog(st,LOG_DROP,"transform: %s (merely skew)",transform_err);
1146     assert(problem);
1147     return problem;
1148 }
1149
1150 static bool_t process_msg0(struct site *st, struct buffer_if *msg0,
1151                            const struct comm_addr *src)
1152 {
1153     uint32_t type;
1154
1155     if (!decrypt_msg0(st,msg0,src))
1156         return False;
1157
1158     CHECK_AVAIL(msg0,4);
1159     type=buf_unprepend_uint32(msg0);
1160     switch(type) {
1161     case LABEL_MSG7:
1162         /* We must forget about the current session. */
1163         delete_keys(st,"request from peer",LOG_SEC);
1164         /* probably, the peer is shutting down, and this is going to fail,
1165          * but we need to be trying to bring the link up again */
1166         if (st->keepalive)
1167             initiate_key_setup(st,"peer requested key teardown",0);
1168         return True;
1169     case LABEL_MSG9:
1170         /* Deliver to netlink layer */
1171         st->netlink->deliver(st->netlink->st,msg0);
1172         transport_data_msgok(st,src);
1173         /* See whether we should start negotiating a new key */
1174         if (st->now > st->renegotiate_key_time)
1175             initiate_key_setup(st,"incoming packet in renegotiation window",0);
1176         return True;
1177     default:
1178         slog(st,LOG_SEC,"incoming encrypted message of type %08x "
1179              "(unknown)",type);
1180         break;
1181     }
1182     return False;
1183 }
1184
1185 static void dump_packet(struct site *st, struct buffer_if *buf,
1186                         const struct comm_addr *addr, bool_t incoming,
1187                         bool_t ok)
1188 {
1189     uint32_t dest=get_uint32(buf->start);
1190     uint32_t source=get_uint32(buf->start+4);
1191     uint32_t msgtype=get_uint32(buf->start+8);
1192
1193     if (st->log_events & LOG_DUMP)
1194         slilog(st->log,M_DEBUG,"%s: %s: %08x<-%08x: %08x: %s%s",
1195                st->tunname,incoming?"incoming":"outgoing",
1196                dest,source,msgtype,comm_addr_to_string(addr),
1197                ok?"":" - fail");
1198 }
1199
1200 static bool_t comm_addr_sendmsg(struct site *st,
1201                                 const struct comm_addr *dest,
1202                                 struct buffer_if *buf)
1203 {
1204     int i;
1205     struct comm_clientinfo *commclientinfo = 0;
1206
1207     for (i=0; i < st->ncomms; i++) {
1208         if (st->comms[i] == dest->comm) {
1209             commclientinfo = st->commclientinfos[i];
1210             break;
1211         }
1212     }
1213     return dest->comm->sendmsg(dest->comm->st, buf, dest, commclientinfo);
1214 }
1215
1216 static uint32_t site_status(void *st)
1217 {
1218     return 0;
1219 }
1220
1221 static bool_t send_msg(struct site *st)
1222 {
1223     if (st->retries>0) {
1224         transport_xmit(st, &st->setup_peers, &st->buffer, True);
1225         st->timeout=st->now+st->setup_retry_interval;
1226         st->retries--;
1227         return True;
1228     } else if (st->state==SITE_SENTMSG5) {
1229         logtimeout(st,"timed out sending MSG5, stashing new key");
1230         /* We stash the key we have produced, in case it turns out that
1231          * our peer did see our MSG5 after all and starts using it. */
1232         /* This is a bit like some of activate_new_key */
1233         struct transform_inst_if *t;
1234         t=st->auxiliary_key.transform;
1235         st->auxiliary_key.transform=st->new_transform;
1236         st->new_transform=t;
1237         dispose_transform(&st->new_transform);
1238
1239         st->auxiliary_is_new=1;
1240         st->auxiliary_key.key_timeout=st->now+st->key_lifetime;
1241         st->auxiliary_renegotiate_key_time=st->now+st->key_renegotiate_time;
1242         st->auxiliary_key.remote_session_id=st->setup_session_id;
1243
1244         enter_state_wait(st);
1245         return False;
1246     } else {
1247         logtimeout(st,"timed out sending key setup packet "
1248             "(in state %s)",state_name(st->state));
1249         enter_state_wait(st);
1250         return False;
1251     }
1252 }
1253
1254 static void site_resolve_callback(void *sst, const struct comm_addr *addrs,
1255                                   int stored_naddrs, int all_naddrs,
1256                                   const char *address, const char *failwhy)
1257 {
1258     struct site *st=sst;
1259
1260     if (!stored_naddrs) {
1261         slog(st,LOG_ERROR,"resolution of %s failed: %s",address,failwhy);
1262     } else {
1263         slog(st,LOG_PEER_ADDRS,"resolution of %s completed, %d addrs, eg: %s",
1264              address, all_naddrs, comm_addr_to_string(&addrs[0]));;
1265
1266         int space=st->transport_peers_max-st->resolving_n_results_stored;
1267         int n_tocopy=MIN(stored_naddrs,space);
1268         COPY_ARRAY(st->resolving_results + st->resolving_n_results_stored,
1269                    addrs,
1270                    n_tocopy);
1271         st->resolving_n_results_stored += n_tocopy;
1272         st->resolving_n_results_all += all_naddrs;
1273     }
1274
1275     decrement_resolving_count(st,1);
1276 }
1277
1278 static void decrement_resolving_count(struct site *st, int by)
1279 {
1280     assert(st->resolving_count>0);
1281     st->resolving_count-=by;
1282
1283     if (st->resolving_count)
1284         return;
1285
1286     /* OK, we are done with them all.  Handle combined results. */
1287
1288     const struct comm_addr *addrs=st->resolving_results;
1289     int naddrs=st->resolving_n_results_stored;
1290     assert(naddrs<=st->transport_peers_max);
1291
1292     if (naddrs) {
1293         if (naddrs != st->resolving_n_results_all) {
1294             slog(st,LOG_SETUP_INIT,"resolution of supplied addresses/names"
1295                  " yielded too many results (%d > %d), some ignored",
1296                  st->resolving_n_results_all, naddrs);
1297         }
1298         slog(st,LOG_STATE,"resolution completed, %d addrs, eg: %s",
1299              naddrs, iaddr_to_string(&addrs[0].ia));;
1300     }
1301
1302     switch (st->state) {
1303     case SITE_RESOLVE:
1304         if (transport_compute_setupinit_peers(st,addrs,naddrs,0)) {
1305             enter_new_state(st,SITE_SENTMSG1);
1306         } else {
1307             /* Can't figure out who to try to to talk to */
1308             slog(st,LOG_SETUP_INIT,
1309                  "key exchange failed: cannot find peer address");
1310             enter_state_run(st);
1311         }
1312         break;
1313     case SITE_SENTMSG1: case SITE_SENTMSG2:
1314     case SITE_SENTMSG3: case SITE_SENTMSG4:
1315     case SITE_SENTMSG5:
1316         if (naddrs) {
1317             /* We start using the address immediately for data too.
1318              * It's best to store it in st->peers now because we might
1319              * go via SENTMSG5, WAIT, and a MSG0, straight into using
1320              * the new key (without updating the data peer addrs). */
1321             transport_resolve_complete(st,addrs,naddrs);
1322         } else if (st->local_mobile) {
1323             /* We can't let this rest because we may have a peer
1324              * address which will break in the future. */
1325             slog(st,LOG_SETUP_INIT,"resolution failed: "
1326                  "abandoning key exchange");
1327             enter_state_wait(st);
1328         } else {
1329             slog(st,LOG_SETUP_INIT,"resolution failed: "
1330                  " continuing to use source address of peer's packets"
1331                  " for key exchange and ultimately data");
1332         }
1333         break;
1334     case SITE_RUN:
1335         if (naddrs) {
1336             slog(st,LOG_SETUP_INIT,"resolution completed tardily,"
1337                  " updating peer address(es)");
1338             transport_resolve_complete_tardy(st,addrs,naddrs);
1339         } else if (st->local_mobile) {
1340             /* Not very good.  We should queue (another) renegotiation
1341              * so that we can update the peer address. */
1342             st->key_renegotiate_time=st->now+st->wait_timeout;
1343         } else {
1344             slog(st,LOG_SETUP_INIT,"resolution failed: "
1345                  " continuing to use source address of peer's packets");
1346         }
1347         break;
1348     case SITE_WAIT:
1349     case SITE_STOP:
1350         /* oh well */
1351         break;
1352     }
1353 }
1354
1355 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
1356                                  const struct comm_addr *prod_hint)
1357 {
1358     /* Reentrancy hazard: can call enter_new_state/enter_state_* */
1359     if (st->state!=SITE_RUN) return False;
1360     slog(st,LOG_SETUP_INIT,"initiating key exchange (%s)",reason);
1361     if (st->addresses) {
1362         slog(st,LOG_SETUP_INIT,"resolving peer address(es)");
1363         return enter_state_resolve(st);
1364     } else if (transport_compute_setupinit_peers(st,0,0,prod_hint)) {
1365         return enter_new_state(st,SITE_SENTMSG1);
1366     }
1367     slog(st,LOG_SETUP_INIT,"key exchange failed: no address for peer");
1368     return False;
1369 }
1370
1371 static void activate_new_key(struct site *st)
1372 {
1373     struct transform_inst_if *t;
1374
1375     /* We have three transform instances, which we swap between old,
1376        active and setup */
1377     t=st->auxiliary_key.transform;
1378     st->auxiliary_key.transform=st->current.transform;
1379     st->current.transform=st->new_transform;
1380     st->new_transform=t;
1381     dispose_transform(&st->new_transform);
1382
1383     st->timeout=0;
1384     st->auxiliary_is_new=0;
1385     st->auxiliary_key.key_timeout=st->current.key_timeout;
1386     st->current.key_timeout=st->now+st->key_lifetime;
1387     st->renegotiate_key_time=st->now+st->key_renegotiate_time;
1388     transport_peers_copy(st,&st->peers,&st->setup_peers);
1389     st->current.remote_session_id=st->setup_session_id;
1390
1391     /* Compute the inter-site MTU.  This is min( our_mtu, their_mtu ).
1392      * But their mtu be unspecified, in which case we just use ours. */
1393     uint32_t intersite_mtu=
1394         MIN(st->mtu_target, st->remote_adv_mtu ?: ~(uint32_t)0);
1395     st->netlink->set_mtu(st->netlink->st,intersite_mtu);
1396
1397     slog(st,LOG_ACTIVATE_KEY,"new key activated"
1398          " (mtu ours=%"PRId32" theirs=%"PRId32" intersite=%"PRId32")",
1399          st->mtu_target, st->remote_adv_mtu, intersite_mtu);
1400     enter_state_run(st);
1401 }
1402
1403 static void delete_one_key(struct site *st, struct data_key *key,
1404                            cstring_t reason, cstring_t which, uint32_t loglevel)
1405 {
1406     if (!is_transform_valid(key->transform)) return;
1407     if (reason) slog(st,loglevel,"%s deleted (%s)",which,reason);
1408     dispose_transform(&key->transform);
1409     key->key_timeout=0;
1410 }
1411
1412 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel)
1413 {
1414     if (current_valid(st)) {
1415         slog(st,loglevel,"session closed (%s)",reason);
1416
1417         delete_one_key(st,&st->current,0,0,0);
1418         set_link_quality(st);
1419     }
1420     delete_one_key(st,&st->auxiliary_key,0,0,0);
1421 }
1422
1423 static void state_assert(struct site *st, bool_t ok)
1424 {
1425     if (!ok) fatal("site:state_assert");
1426 }
1427
1428 static void enter_state_stop(struct site *st)
1429 {
1430     st->state=SITE_STOP;
1431     st->timeout=0;
1432     delete_keys(st,"entering state STOP",LOG_TIMEOUT_KEY);
1433     dispose_transform(&st->new_transform);
1434 }
1435
1436 static void set_link_quality(struct site *st)
1437 {
1438     uint32_t quality;
1439     if (current_valid(st))
1440         quality=LINK_QUALITY_UP;
1441     else if (st->state==SITE_WAIT || st->state==SITE_STOP)
1442         quality=LINK_QUALITY_DOWN;
1443     else if (st->addresses)
1444         quality=LINK_QUALITY_DOWN_CURRENT_ADDRESS;
1445     else if (transport_peers_valid(&st->peers))
1446         quality=LINK_QUALITY_DOWN_STALE_ADDRESS;
1447     else
1448         quality=LINK_QUALITY_DOWN;
1449
1450     st->netlink->set_quality(st->netlink->st,quality);
1451 }
1452
1453 static void enter_state_run(struct site *st)
1454 {
1455     slog(st,LOG_STATE,"entering state RUN");
1456     st->state=SITE_RUN;
1457     st->timeout=0;
1458
1459     st->setup_session_id=0;
1460     transport_peers_clear(st,&st->setup_peers);
1461     FILLZERO(st->localN);
1462     FILLZERO(st->remoteN);
1463     dispose_transform(&st->new_transform);
1464     memset(st->dhsecret,0,st->dh->len);
1465     if (st->sharedsecret) memset(st->sharedsecret,0,st->sharedsecretlen);
1466     set_link_quality(st);
1467
1468     if (st->keepalive && !current_valid(st))
1469         initiate_key_setup(st, "keepalive", 0);
1470 }
1471
1472 static bool_t ensure_resolving(struct site *st)
1473 {
1474     /* Reentrancy hazard: may call site_resolve_callback and hence
1475      * enter_new_state, enter_state_* and generate_msg*. */
1476     if (st->resolving_count)
1477         return True;
1478
1479     assert(st->addresses);
1480
1481     /* resolver->request might reentrantly call site_resolve_callback
1482      * which will decrement st->resolving, so we need to increment it
1483      * twice beforehand to prevent decrement from thinking we're
1484      * finished, and decrement it ourselves.  Alternatively if
1485      * everything fails then there are no callbacks due and we simply
1486      * set it to 0 and return false.. */
1487     st->resolving_n_results_stored=0;
1488     st->resolving_n_results_all=0;
1489     st->resolving_count+=2;
1490     const char **addrp=st->addresses;
1491     const char *address;
1492     bool_t anyok=False;
1493     for (; (address=*addrp++); ) {
1494         bool_t ok = st->resolver->request(st->resolver->st,address,
1495                                           st->remoteport,st->comms[0],
1496                                           site_resolve_callback,st);
1497         if (ok)
1498             st->resolving_count++;
1499         anyok|=ok;
1500     }
1501     if (!anyok) {
1502         st->resolving_count=0;
1503         return False;
1504     }
1505     decrement_resolving_count(st,2);
1506     return True;
1507 }
1508
1509 static bool_t enter_state_resolve(struct site *st)
1510 {
1511     /* Reentrancy hazard!  See ensure_resolving. */
1512     state_assert(st,st->state==SITE_RUN);
1513     slog(st,LOG_STATE,"entering state RESOLVE");
1514     st->state=SITE_RESOLVE;
1515     return ensure_resolving(st);
1516 }
1517
1518 static bool_t enter_new_state(struct site *st, uint32_t next)
1519 {
1520     bool_t (*gen)(struct site *st);
1521     int r;
1522
1523     slog(st,LOG_STATE,"entering state %s",state_name(next));
1524     switch(next) {
1525     case SITE_SENTMSG1:
1526         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE);
1527         gen=generate_msg1;
1528         st->msg1_crossed_logged = False;
1529         break;
1530     case SITE_SENTMSG2:
1531         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1532                      st->state==SITE_SENTMSG1 || st->state==SITE_WAIT);
1533         gen=generate_msg2;
1534         break;
1535     case SITE_SENTMSG3:
1536         state_assert(st,st->state==SITE_SENTMSG1);
1537         BUF_FREE(&st->buffer);
1538         gen=generate_msg3;
1539         break;
1540     case SITE_SENTMSG4:
1541         state_assert(st,st->state==SITE_SENTMSG2);
1542         BUF_FREE(&st->buffer);
1543         gen=generate_msg4;
1544         break;
1545     case SITE_SENTMSG5:
1546         state_assert(st,st->state==SITE_SENTMSG3);
1547         BUF_FREE(&st->buffer);
1548         gen=generate_msg5;
1549         break;
1550     case SITE_RUN:
1551         state_assert(st,st->state==SITE_SENTMSG4);
1552         BUF_FREE(&st->buffer);
1553         gen=generate_msg6;
1554         break;
1555     default:
1556         gen=NULL;
1557         fatal("enter_new_state(%s): invalid new state",state_name(next));
1558         break;
1559     }
1560
1561     if (hacky_par_start_failnow()) return False;
1562
1563     r= gen(st) && send_msg(st);
1564
1565     hacky_par_end(&r,
1566                   st->setup_retries, st->setup_retry_interval,
1567                   send_msg, st);
1568     
1569     if (r) {
1570         st->state=next;
1571         if (next==SITE_RUN) {
1572             BUF_FREE(&st->buffer); /* Never reused */
1573             st->timeout=0; /* Never retransmit */
1574             activate_new_key(st);
1575         }
1576         return True;
1577     }
1578     slog(st,LOG_ERROR,"error entering state %s",state_name(next));
1579     st->buffer.free=False; /* Unconditionally use the buffer; it may be
1580                               in either state, and enter_state_wait() will
1581                               do a BUF_FREE() */
1582     enter_state_wait(st);
1583     return False;
1584 }
1585
1586 /* msg7 tells our peer that we're about to forget our key */
1587 static bool_t send_msg7(struct site *st, cstring_t reason)
1588 {
1589     cstring_t transform_err;
1590
1591     if (current_valid(st) && st->buffer.free
1592         && transport_peers_valid(&st->peers)) {
1593         BUF_ALLOC(&st->buffer,"site:MSG7");
1594         buffer_init(&st->buffer,calculate_max_start_pad());
1595         buf_append_uint32(&st->buffer,LABEL_MSG7);
1596         buf_append_string(&st->buffer,reason);
1597         if (call_transform_forwards(st, st->current.transform,
1598                                     &st->buffer, &transform_err))
1599             goto free_out;
1600         buf_prepend_uint32(&st->buffer,LABEL_MSG0);
1601         buf_prepend_uint32(&st->buffer,st->index);
1602         buf_prepend_uint32(&st->buffer,st->current.remote_session_id);
1603         transport_xmit(st,&st->peers,&st->buffer,True);
1604         BUF_FREE(&st->buffer);
1605     free_out:
1606         return True;
1607     }
1608     return False;
1609 }
1610
1611 /* We go into this state if our peer becomes uncommunicative. Similar to
1612    the "stop" state, we forget all session keys for a while, before
1613    re-entering the "run" state. */
1614 static void enter_state_wait(struct site *st)
1615 {
1616     slog(st,LOG_STATE,"entering state WAIT");
1617     st->timeout=st->now+st->wait_timeout;
1618     st->state=SITE_WAIT;
1619     set_link_quality(st);
1620     BUF_FREE(&st->buffer); /* will have had an outgoing packet in it */
1621     /* XXX Erase keys etc. */
1622 }
1623
1624 static void generate_prod(struct site *st, struct buffer_if *buf)
1625 {
1626     buffer_init(buf,0);
1627     buf_append_uint32(buf,0);
1628     buf_append_uint32(buf,0);
1629     buf_append_uint32(buf,LABEL_PROD);
1630     buf_append_string(buf,st->localname);
1631     buf_append_string(buf,st->remotename);
1632 }
1633
1634 static void generate_send_prod(struct site *st,
1635                                const struct comm_addr *source)
1636 {
1637     if (!st->allow_send_prod) return; /* too soon */
1638     if (!(st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1639           st->state==SITE_WAIT)) return; /* we'd ignore peer's MSG1 */
1640
1641     slog(st,LOG_SETUP_INIT,"prodding peer for key exchange");
1642     st->allow_send_prod=0;
1643     generate_prod(st,&st->scratch);
1644     bool_t ok = comm_addr_sendmsg(st, source, &st->scratch);
1645     dump_packet(st,&st->scratch,source,False,ok);
1646 }
1647
1648 static inline void site_settimeout(uint64_t timeout, int *timeout_io)
1649 {
1650     if (timeout) {
1651         int64_t offset=timeout-*now;
1652         if (offset<0) offset=0;
1653         if (offset>INT_MAX) offset=INT_MAX;
1654         if (*timeout_io<0 || offset<*timeout_io)
1655             *timeout_io=offset;
1656     }
1657 }
1658
1659 static int site_beforepoll(void *sst, struct pollfd *fds, int *nfds_io,
1660                            int *timeout_io)
1661 {
1662     struct site *st=sst;
1663
1664     BEFOREPOLL_WANT_FDS(0); /* We don't use any file descriptors */
1665     st->now=*now;
1666
1667     /* Work out when our next timeout is. The earlier of 'timeout' or
1668        'current.key_timeout'. A stored value of '0' indicates no timeout
1669        active. */
1670     site_settimeout(st->timeout, timeout_io);
1671     site_settimeout(st->current.key_timeout, timeout_io);
1672     site_settimeout(st->auxiliary_key.key_timeout, timeout_io);
1673
1674     return 0; /* success */
1675 }
1676
1677 static void check_expiry(struct site *st, struct data_key *key,
1678                          const char *which)
1679 {
1680     if (key->key_timeout && *now>key->key_timeout) {
1681         delete_one_key(st,key,"maximum life exceeded",which,LOG_TIMEOUT_KEY);
1682     }
1683 }
1684
1685 /* NB site_afterpoll will be called before site_beforepoll is ever called */
1686 static void site_afterpoll(void *sst, struct pollfd *fds, int nfds)
1687 {
1688     struct site *st=sst;
1689
1690     st->now=*now;
1691     if (st->timeout && *now>st->timeout) {
1692         st->timeout=0;
1693         if (st->state>=SITE_SENTMSG1 && st->state<=SITE_SENTMSG5) {
1694             if (!hacky_par_start_failnow())
1695                 send_msg(st);
1696         } else if (st->state==SITE_WAIT) {
1697             enter_state_run(st);
1698         } else {
1699             slog(st,LOG_ERROR,"site_afterpoll: unexpected timeout, state=%d",
1700                  st->state);
1701         }
1702     }
1703     check_expiry(st,&st->current,"current key");
1704     check_expiry(st,&st->auxiliary_key,"auxiliary key");
1705 }
1706
1707 /* This function is called by the netlink device to deliver packets
1708    intended for the remote network. The packet is in "raw" wire
1709    format, but is guaranteed to be word-aligned. */
1710 static void site_outgoing(void *sst, struct buffer_if *buf)
1711 {
1712     struct site *st=sst;
1713     cstring_t transform_err;
1714     
1715     if (st->state==SITE_STOP) {
1716         BUF_FREE(buf);
1717         return;
1718     }
1719
1720     st->allow_send_prod=1;
1721
1722     /* In all other states we consider delivering the packet if we have
1723        a valid key and a valid address to send it to. */
1724     if (current_valid(st) && transport_peers_valid(&st->peers)) {
1725         /* Transform it and send it */
1726         if (buf->size>0) {
1727             buf_prepend_uint32(buf,LABEL_MSG9);
1728             if (call_transform_forwards(st, st->current.transform,
1729                                         buf, &transform_err))
1730                 goto free_out;
1731             buf_prepend_uint32(buf,LABEL_MSG0);
1732             buf_prepend_uint32(buf,st->index);
1733             buf_prepend_uint32(buf,st->current.remote_session_id);
1734             transport_xmit(st,&st->peers,buf,False);
1735         }
1736     free_out:
1737         BUF_FREE(buf);
1738         return;
1739     }
1740
1741     slog(st,LOG_DROP,"discarding outgoing packet of size %d",buf->size);
1742     BUF_FREE(buf);
1743     initiate_key_setup(st,"outgoing packet",0);
1744 }
1745
1746 static bool_t named_for_us(struct site *st, const struct buffer_if *buf_in,
1747                            uint32_t type, struct msg *m)
1748     /* For packets which are identified by the local and remote names.
1749      * If it has our name and our peer's name in it it's for us. */
1750 {
1751     struct buffer_if buf[1];
1752     buffer_readonly_clone(buf,buf_in);
1753     return unpick_msg(st,type,buf,m)
1754         && name_matches(&m->remote,st->remotename)
1755         && name_matches(&m->local,st->localname);
1756 }
1757
1758 static bool_t we_have_priority(struct site *st, const struct msg *m) {
1759     if ((st->local_capabilities & m->remote_capabilities)
1760         && CAPAB_PRIORITY_MOBILE) {
1761         if (st->local_mobile) return True;
1762         if (st-> peer_mobile) return False;
1763     }
1764     return st->our_name_later;
1765 }
1766
1767 /* This function is called by the communication device to deliver
1768    packets from our peers.
1769    It should return True if the packet is recognised as being for
1770    this current site instance (and should therefore not be processed
1771    by other sites), even if the packet was otherwise ignored. */
1772 static bool_t site_incoming(void *sst, struct buffer_if *buf,
1773                             const struct comm_addr *source)
1774 {
1775     struct site *st=sst;
1776
1777     if (buf->size < 12) return False;
1778
1779     uint32_t dest=get_uint32(buf->start);
1780     uint32_t msgtype=get_uint32(buf->start+8);
1781     struct msg named_msg;
1782
1783     if (msgtype==LABEL_MSG1) {
1784         if (!named_for_us(st,buf,msgtype,&named_msg))
1785             return False;
1786         /* It's a MSG1 addressed to us. Decide what to do about it. */
1787         dump_packet(st,buf,source,True,True);
1788         if (st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1789             st->state==SITE_WAIT) {
1790             /* We should definitely process it */
1791             transport_compute_setupinit_peers(st,0,0,source);
1792             if (process_msg1(st,buf,source,&named_msg)) {
1793                 slog(st,LOG_SETUP_INIT,"key setup initiated by peer");
1794                 bool_t entered=enter_new_state(st,SITE_SENTMSG2);
1795                 if (entered && st->addresses && st->local_mobile)
1796                     /* We must do this as the very last thing, because
1797                        the resolver callback might reenter us. */
1798                     ensure_resolving(st);
1799             } else {
1800                 slog(st,LOG_ERROR,"failed to process incoming msg1");
1801             }
1802             BUF_FREE(buf);
1803             return True;
1804         } else if (st->state==SITE_SENTMSG1) {
1805             /* We've just sent a message 1! They may have crossed on
1806                the wire. If we have priority then we ignore the
1807                incoming one, otherwise we process it as usual. */
1808             if (we_have_priority(st,&named_msg)) {
1809                 BUF_FREE(buf);
1810                 if (!st->msg1_crossed_logged++)
1811                     slog(st,LOG_SETUP_INIT,"crossed msg1s; we are higher "
1812                          "priority => ignore incoming msg1");
1813                 return True;
1814             } else {
1815                 slog(st,LOG_SETUP_INIT,"crossed msg1s; we are lower "
1816                      "priority => use incoming msg1");
1817                 if (process_msg1(st,buf,source,&named_msg)) {
1818                     BUF_FREE(&st->buffer); /* Free our old message 1 */
1819                     transport_setup_msgok(st,source);
1820                     enter_new_state(st,SITE_SENTMSG2);
1821                 } else {
1822                     slog(st,LOG_ERROR,"failed to process an incoming "
1823                          "crossed msg1 (we have low priority)");
1824                 }
1825                 BUF_FREE(buf);
1826                 return True;
1827             }
1828         }
1829         /* The message 1 was received at an unexpected stage of the
1830            key setup. XXX POLICY - what do we do? */
1831         slog(st,LOG_UNEXPECTED,"unexpected incoming message 1");
1832         BUF_FREE(buf);
1833         return True;
1834     }
1835     if (msgtype==LABEL_PROD) {
1836         if (!named_for_us(st,buf,msgtype,&named_msg))
1837             return False;
1838         dump_packet(st,buf,source,True,True);
1839         if (st->state!=SITE_RUN) {
1840             slog(st,LOG_DROP,"ignoring PROD when not in state RUN");
1841         } else if (current_valid(st)) {
1842             slog(st,LOG_DROP,"ignoring PROD when we think we have a key");
1843         } else {
1844             initiate_key_setup(st,"peer sent PROD packet",source);
1845         }
1846         BUF_FREE(buf);
1847         return True;
1848     }
1849     if (dest==st->index) {
1850         /* Explicitly addressed to us */
1851         if (msgtype!=LABEL_MSG0) dump_packet(st,buf,source,True,True);
1852         switch (msgtype) {
1853         case LABEL_NAK:
1854             /* If the source is our current peer then initiate a key setup,
1855                because our peer's forgotten the key */
1856             if (get_uint32(buf->start+4)==st->current.remote_session_id) {
1857                 bool_t initiated;
1858                 initiated = initiate_key_setup(st,"received a NAK",source);
1859                 if (!initiated) generate_send_prod(st,source);
1860             } else {
1861                 slog(st,LOG_SEC,"bad incoming NAK");
1862             }
1863             break;
1864         case LABEL_MSG0:
1865             process_msg0(st,buf,source);
1866             break;
1867         case LABEL_MSG1:
1868             /* Setup packet: should not have been explicitly addressed
1869                to us */
1870             slog(st,LOG_SEC,"incoming explicitly addressed msg1");
1871             break;
1872         case LABEL_MSG2:
1873             /* Setup packet: expected only in state SENTMSG1 */
1874             if (st->state!=SITE_SENTMSG1) {
1875                 slog(st,LOG_UNEXPECTED,"unexpected MSG2");
1876             } else if (process_msg2(st,buf,source)) {
1877                 transport_setup_msgok(st,source);
1878                 enter_new_state(st,SITE_SENTMSG3);
1879             } else {
1880                 slog(st,LOG_SEC,"invalid MSG2");
1881             }
1882             break;
1883         case LABEL_MSG3:
1884         case LABEL_MSG3BIS:
1885             /* Setup packet: expected only in state SENTMSG2 */
1886             if (st->state!=SITE_SENTMSG2) {
1887                 slog(st,LOG_UNEXPECTED,"unexpected MSG3");
1888             } else if (process_msg3(st,buf,source,msgtype)) {
1889                 transport_setup_msgok(st,source);
1890                 enter_new_state(st,SITE_SENTMSG4);
1891             } else {
1892                 slog(st,LOG_SEC,"invalid MSG3");
1893             }
1894             break;
1895         case LABEL_MSG4:
1896             /* Setup packet: expected only in state SENTMSG3 */
1897             if (st->state!=SITE_SENTMSG3) {
1898                 slog(st,LOG_UNEXPECTED,"unexpected MSG4");
1899             } else if (process_msg4(st,buf,source)) {
1900                 transport_setup_msgok(st,source);
1901                 enter_new_state(st,SITE_SENTMSG5);
1902             } else {
1903                 slog(st,LOG_SEC,"invalid MSG4");
1904             }
1905             break;
1906         case LABEL_MSG5:
1907             /* Setup packet: expected only in state SENTMSG4 */
1908             /* (may turn up in state RUN if our return MSG6 was lost
1909                and the new key has already been activated. In that
1910                case we discard it. The peer will realise that we
1911                are using the new key when they see our data packets.
1912                Until then the peer's data packets to us get discarded. */
1913             if (st->state==SITE_SENTMSG4) {
1914                 if (process_msg5(st,buf,source,st->new_transform)) {
1915                     transport_setup_msgok(st,source);
1916                     enter_new_state(st,SITE_RUN);
1917                 } else {
1918                     slog(st,LOG_SEC,"invalid MSG5");
1919                 }
1920             } else if (st->state==SITE_RUN) {
1921                 if (process_msg5(st,buf,source,st->current.transform)) {
1922                     slog(st,LOG_DROP,"got MSG5, retransmitting MSG6");
1923                     transport_setup_msgok(st,source);
1924                     create_msg6(st,st->current.transform,
1925                                 st->current.remote_session_id);
1926                     transport_xmit(st,&st->peers,&st->buffer,True);
1927                     BUF_FREE(&st->buffer);
1928                 } else {
1929                     slog(st,LOG_SEC,"invalid MSG5 (in state RUN)");
1930                 }
1931             } else {
1932                 slog(st,LOG_UNEXPECTED,"unexpected MSG5");
1933             }
1934             break;
1935         case LABEL_MSG6:
1936             /* Setup packet: expected only in state SENTMSG5 */
1937             if (st->state!=SITE_SENTMSG5) {
1938                 slog(st,LOG_UNEXPECTED,"unexpected MSG6");
1939             } else if (process_msg6(st,buf,source)) {
1940                 BUF_FREE(&st->buffer); /* Free message 5 */
1941                 transport_setup_msgok(st,source);
1942                 activate_new_key(st);
1943             } else {
1944                 slog(st,LOG_SEC,"invalid MSG6");
1945             }
1946             break;
1947         default:
1948             slog(st,LOG_SEC,"received message of unknown type 0x%08x",
1949                  msgtype);
1950             break;
1951         }
1952         BUF_FREE(buf);
1953         return True;
1954     }
1955
1956     return False;
1957 }
1958
1959 static void site_control(void *vst, bool_t run)
1960 {
1961     struct site *st=vst;
1962     if (run) enter_state_run(st);
1963     else enter_state_stop(st);
1964 }
1965
1966 static void site_phase_hook(void *sst, uint32_t newphase)
1967 {
1968     struct site *st=sst;
1969
1970     /* The program is shutting down; tell our peer */
1971     send_msg7(st,"shutting down");
1972 }
1973
1974 static void site_childpersist_clearkeys(void *sst, uint32_t newphase)
1975 {
1976     struct site *st=sst;
1977     dispose_transform(&st->current.transform);
1978     dispose_transform(&st->auxiliary_key.transform);
1979     dispose_transform(&st->new_transform);
1980     /* Not much point overwiting the signing key, since we loaded it
1981        from disk, and it is only valid prospectively if at all,
1982        anyway. */
1983     /* XXX it would be best to overwrite the DH state, because that
1984        _is_ relevant to forward secrecy.  However we have no
1985        convenient interface for doing that and in practice gmp has
1986        probably dribbled droppings all over the malloc arena.  A good
1987        way to fix this would be to have a privsep child for asymmetric
1988        crypto operations, but that's a task for another day. */
1989 }
1990
1991 static list_t *site_apply(closure_t *self, struct cloc loc, dict_t *context,
1992                           list_t *args)
1993 {
1994     static uint32_t index_sequence;
1995     struct site *st;
1996     item_t *item;
1997     dict_t *dict;
1998     int i;
1999
2000     NEW(st);
2001
2002     st->cl.description="site";
2003     st->cl.type=CL_SITE;
2004     st->cl.apply=NULL;
2005     st->cl.interface=&st->ops;
2006     st->ops.st=st;
2007     st->ops.control=site_control;
2008     st->ops.status=site_status;
2009
2010     /* First parameter must be a dict */
2011     item=list_elem(args,0);
2012     if (!item || item->type!=t_dict)
2013         cfgfatal(loc,"site","parameter must be a dictionary\n");
2014     
2015     dict=item->data.dict;
2016     st->localname=dict_read_string(dict, "local-name", True, "site", loc);
2017     st->remotename=dict_read_string(dict, "name", True, "site", loc);
2018
2019     st->keepalive=dict_read_bool(dict,"keepalive",False,"site",loc,False);
2020
2021     st->peer_mobile=dict_read_bool(dict,"mobile",False,"site",loc,False);
2022     st->local_mobile=
2023         dict_read_bool(dict,"local-mobile",False,"site",loc,False);
2024
2025     /* Sanity check (which also allows the 'sites' file to include
2026        site() closures for all sites including our own): refuse to
2027        talk to ourselves */
2028     if (strcmp(st->localname,st->remotename)==0) {
2029         Message(M_DEBUG,"site %s: local-name==name -> ignoring this site\n",
2030                 st->localname);
2031         if (st->peer_mobile != st->local_mobile)
2032             cfgfatal(loc,"site","site %s's peer-mobile=%d"
2033                     " but our local-mobile=%d\n",
2034                     st->localname, st->peer_mobile, st->local_mobile);
2035         free(st);
2036         return NULL;
2037     }
2038     if (st->peer_mobile && st->local_mobile) {
2039         Message(M_WARNING,"site %s: site is mobile but so are we"
2040                 " -> ignoring this site\n", st->remotename);
2041         free(st);
2042         return NULL;
2043     }
2044
2045     assert(index_sequence < 0xffffffffUL);
2046     st->index = ++index_sequence;
2047     st->local_capabilities = 0;
2048     st->netlink=find_cl_if(dict,"link",CL_NETLINK,True,"site",loc);
2049
2050 #define GET_CLOSURE_LIST(dictkey,things,nthings,CL_TYPE) do{            \
2051     list_t *things##_cfg=dict_lookup(dict,dictkey);                     \
2052     if (!things##_cfg)                                                  \
2053         cfgfatal(loc,"site","closure list \"%s\" not found\n",dictkey); \
2054     st->nthings=list_length(things##_cfg);                              \
2055     NEW_ARY(st->things,st->nthings);                                    \
2056     assert(st->nthings);                                                \
2057     for (i=0; i<st->nthings; i++) {                                     \
2058         item_t *item=list_elem(things##_cfg,i);                         \
2059         if (item->type!=t_closure)                                      \
2060             cfgfatal(loc,"site","%s is not a closure\n",dictkey);       \
2061         closure_t *cl=item->data.closure;                               \
2062         if (cl->type!=CL_TYPE)                                          \
2063             cfgfatal(loc,"site","%s closure wrong type\n",dictkey);     \
2064         st->things[i]=cl->interface;                                    \
2065     }                                                                   \
2066 }while(0)
2067
2068     GET_CLOSURE_LIST("comm",comms,ncomms,CL_COMM);
2069
2070     NEW_ARY(st->commclientinfos, st->ncomms);
2071     dict_t *comminfo = dict_read_dict(dict,"comm-info",False,"site",loc);
2072     for (i=0; i<st->ncomms; i++) {
2073         st->commclientinfos[i] =
2074             !comminfo ? 0 :
2075             st->comms[i]->clientinfo(st->comms[i],comminfo,loc);
2076     }
2077
2078     st->resolver=find_cl_if(dict,"resolver",CL_RESOLVER,True,"site",loc);
2079     st->log=find_cl_if(dict,"log",CL_LOG,True,"site",loc);
2080     st->random=find_cl_if(dict,"random",CL_RANDOMSRC,True,"site",loc);
2081
2082     st->privkey=find_cl_if(dict,"local-key",CL_RSAPRIVKEY,True,"site",loc);
2083     st->addresses=dict_read_string_array(dict,"address",False,"site",loc,0);
2084     if (st->addresses)
2085         st->remoteport=dict_read_number(dict,"port",True,"site",loc,0);
2086     else st->remoteport=0;
2087     st->pubkey=find_cl_if(dict,"key",CL_RSAPUBKEY,True,"site",loc);
2088
2089     GET_CLOSURE_LIST("transform",transforms,ntransforms,CL_TRANSFORM);
2090
2091     st->dh=find_cl_if(dict,"dh",CL_DH,True,"site",loc);
2092     st->hash=find_cl_if(dict,"hash",CL_HASH,True,"site",loc);
2093
2094 #define DEFAULT(D) (st->peer_mobile || st->local_mobile \
2095                     ? DEFAULT_MOBILE_##D : DEFAULT_##D)
2096 #define CFG_NUMBER(k,D) dict_read_number(dict,(k),False,"site",loc,DEFAULT(D));
2097
2098     st->key_lifetime=         CFG_NUMBER("key-lifetime",  KEY_LIFETIME);
2099     st->setup_retries=        CFG_NUMBER("setup-retries", SETUP_RETRIES);
2100     st->setup_retry_interval= CFG_NUMBER("setup-timeout", SETUP_RETRY_INTERVAL);
2101     st->wait_timeout=         CFG_NUMBER("wait-time",     WAIT_TIME);
2102     st->mtu_target= dict_read_number(dict,"mtu-target",False,"site",loc,0);
2103
2104     st->mobile_peer_expiry= dict_read_number(
2105        dict,"mobile-peer-expiry",False,"site",loc,DEFAULT_MOBILE_PEER_EXPIRY);
2106
2107     const char *peerskey= st->peer_mobile
2108         ? "mobile-peers-max" : "static-peers-max";
2109     st->transport_peers_max= dict_read_number(
2110         dict,peerskey,False,"site",loc, st->addresses ? 4 : 3);
2111     if (st->transport_peers_max<1 ||
2112         st->transport_peers_max>MAX_PEER_ADDRS) {
2113         cfgfatal(loc,"site", "%s must be in range 1.."
2114                  STRING(MAX_PEER_ADDRS) "\n", peerskey);
2115     }
2116
2117     if (st->key_lifetime < DEFAULT(KEY_RENEGOTIATE_GAP)*2)
2118         st->key_renegotiate_time=st->key_lifetime/2;
2119     else
2120         st->key_renegotiate_time=st->key_lifetime-DEFAULT(KEY_RENEGOTIATE_GAP);
2121     st->key_renegotiate_time=dict_read_number(
2122         dict,"renegotiate-time",False,"site",loc,st->key_renegotiate_time);
2123     if (st->key_renegotiate_time > st->key_lifetime) {
2124         cfgfatal(loc,"site",
2125                  "renegotiate-time must be less than key-lifetime\n");
2126     }
2127
2128     st->log_events=string_list_to_word(dict_lookup(dict,"log-events"),
2129                                        log_event_table,"site");
2130
2131     st->resolving_count=0;
2132     st->allow_send_prod=0;
2133
2134     st->tunname=safe_malloc(strlen(st->localname)+strlen(st->remotename)+5,
2135                             "site_apply");
2136     sprintf(st->tunname,"%s<->%s",st->localname,st->remotename);
2137
2138     /* The information we expect to see in incoming messages of type 1 */
2139     /* fixme: lots of unchecked overflows here, but the results are only
2140        corrupted packets rather than undefined behaviour */
2141     st->our_name_later=(strcmp(st->localname,st->remotename)>0);
2142
2143     buffer_new(&st->buffer,SETUP_BUFFER_LEN);
2144
2145     buffer_new(&st->scratch,SETUP_BUFFER_LEN);
2146     BUF_ALLOC(&st->scratch,"site:scratch");
2147
2148     /* We are interested in poll(), but only for timeouts. We don't have
2149        any fds of our own. */
2150     register_for_poll(st, site_beforepoll, site_afterpoll, "site");
2151     st->timeout=0;
2152
2153     st->remote_capabilities=0;
2154     st->chosen_transform=0;
2155     st->current.key_timeout=0;
2156     st->auxiliary_key.key_timeout=0;
2157     transport_peers_clear(st,&st->peers);
2158     transport_peers_clear(st,&st->setup_peers);
2159     /* XXX mlock these */
2160     st->dhsecret=safe_malloc(st->dh->len,"site:dhsecret");
2161     st->sharedsecretlen=st->sharedsecretallocd=0;
2162     st->sharedsecret=0;
2163
2164     for (i=0; i<st->ntransforms; i++) {
2165         struct transform_if *ti=st->transforms[i];
2166         uint32_t capbit = 1UL << ti->capab_transformnum;
2167         if (st->local_capabilities & capbit)
2168             slog(st,LOG_ERROR,"transformnum capability bit"
2169                  " %d (%#"PRIx32") reused", ti->capab_transformnum, capbit);
2170         st->local_capabilities |= capbit;
2171     }
2172
2173     if (st->local_mobile || st->peer_mobile)
2174         st->local_capabilities |= CAPAB_PRIORITY_MOBILE;
2175
2176     /* We need to register the remote networks with the netlink device */
2177     uint32_t netlink_mtu; /* local virtual interface mtu */
2178     st->netlink->reg(st->netlink->st, site_outgoing, st, &netlink_mtu);
2179     if (!st->mtu_target)
2180         st->mtu_target=netlink_mtu;
2181     
2182     for (i=0; i<st->ncomms; i++)
2183         st->comms[i]->request_notify(st->comms[i]->st, st, site_incoming);
2184
2185     st->current.transform=0;
2186     st->auxiliary_key.transform=0;
2187     st->new_transform=0;
2188     st->auxiliary_is_new=0;
2189
2190     enter_state_stop(st);
2191
2192     add_hook(PHASE_SHUTDOWN,site_phase_hook,st);
2193     add_hook(PHASE_CHILDPERSIST,site_childpersist_clearkeys,st);
2194
2195     return new_closure(&st->cl);
2196 }
2197
2198 void site_module(dict_t *dict)
2199 {
2200     add_closure(dict,"site",site_apply);
2201 }
2202
2203
2204 /***** TRANSPORT PEERS definitions *****/
2205
2206 static void transport_peers_debug(struct site *st, transport_peers *dst,
2207                                   const char *didwhat,
2208                                   int nargs, const struct comm_addr *args,
2209                                   size_t stride) {
2210     int i;
2211     char *argp;
2212
2213     if (!(st->log_events & LOG_PEER_ADDRS))
2214         return; /* an optimisation */
2215
2216     slog(st, LOG_PEER_ADDRS, "peers (%s) %s nargs=%d => npeers=%d",
2217          (dst==&st->peers ? "data" :
2218           dst==&st->setup_peers ? "setup" : "UNKNOWN"),
2219          didwhat, nargs, dst->npeers);
2220
2221     for (i=0, argp=(void*)args;
2222          i<nargs;
2223          i++, (argp+=stride?stride:sizeof(*args))) {
2224         const struct comm_addr *ca=(void*)argp;
2225         slog(st, LOG_PEER_ADDRS, " args: addrs[%d]=%s",
2226              i, comm_addr_to_string(ca));
2227     }
2228     for (i=0; i<dst->npeers; i++) {
2229         struct timeval diff;
2230         timersub(tv_now,&dst->peers[i].last,&diff);
2231         const struct comm_addr *ca=&dst->peers[i].addr;
2232         slog(st, LOG_PEER_ADDRS, " peers: addrs[%d]=%s T-%ld.%06ld",
2233              i, comm_addr_to_string(ca),
2234              (unsigned long)diff.tv_sec, (unsigned long)diff.tv_usec);
2235     }
2236 }
2237
2238 static void transport_peers_expire(struct site *st, transport_peers *peers) {
2239     /* peers must be sorted first */
2240     int previous_peers=peers->npeers;
2241     struct timeval oldest;
2242     oldest.tv_sec  = tv_now->tv_sec - st->mobile_peer_expiry;
2243     oldest.tv_usec = tv_now->tv_usec;
2244     while (peers->npeers>1 &&
2245            timercmp(&peers->peers[peers->npeers-1].last, &oldest, <))
2246         peers->npeers--;
2247     if (peers->npeers != previous_peers)
2248         transport_peers_debug(st,peers,"expire", 0,0,0);
2249 }
2250
2251 static bool_t transport_peer_record_one(struct site *st, transport_peers *peers,
2252                                         const struct comm_addr *ca,
2253                                         const struct timeval *tv) {
2254     /* returns false if output is full */
2255     int search;
2256
2257     if (peers->npeers >= st->transport_peers_max)
2258         return 0;
2259
2260     for (search=0; search<peers->npeers; search++)
2261         if (comm_addr_equal(&peers->peers[search].addr, ca))
2262             return 1;
2263
2264     peers->peers[peers->npeers].addr = *ca;
2265     peers->peers[peers->npeers].last = *tv;
2266     peers->npeers++;
2267     return 1;
2268 }
2269
2270 static void transport_record_peers(struct site *st, transport_peers *peers,
2271                                    const struct comm_addr *addrs, int naddrs,
2272                                    const char *m) {
2273     /* We add addrs into peers.  The new entries end up at the front
2274      * and displace entries towards the end (perhaps even off the
2275      * end).  Any existing matching entries are moved up to the front.
2276      *
2277      * Caller must first call transport_peers_expire. */
2278
2279     if (naddrs==1) {
2280         /* avoids debug for uninteresting updates */
2281         int i;
2282         for (i=0; i<peers->npeers; i++) {
2283             if (comm_addr_equal(&addrs[0], &peers->peers[i].addr)) {
2284                 memmove(peers->peers+1, peers->peers,
2285                         sizeof(peers->peers[0]) * i);
2286                 peers->peers[0].addr = addrs[0];
2287                 peers->peers[0].last = *tv_now;
2288                 return;
2289             }
2290         }
2291     }
2292
2293     int old_npeers=peers->npeers;
2294     transport_peer old_peers[old_npeers];
2295     COPY_ARRAY(old_peers,peers->peers,old_npeers);
2296
2297     peers->npeers=0;
2298     int i;
2299     for (i=0; i<naddrs; i++) {
2300         if (!transport_peer_record_one(st,peers, &addrs[i], tv_now))
2301             break;
2302     }
2303     for (i=0; i<old_npeers; i++) {
2304         const transport_peer *old=&old_peers[i];
2305         if (!transport_peer_record_one(st,peers, &old->addr, &old->last))
2306             break;
2307     }
2308
2309     transport_peers_debug(st,peers,m, naddrs,addrs,0);
2310 }
2311
2312 static void transport_expire_record_peers(struct site *st,
2313                                           transport_peers *peers,
2314                                           const struct comm_addr *addrs,
2315                                           int naddrs, const char *m) {
2316     /* Convenience function */
2317     transport_peers_expire(st,peers);
2318     transport_record_peers(st,peers,addrs,naddrs,m);
2319 }
2320
2321 static bool_t transport_compute_setupinit_peers(struct site *st,
2322         const struct comm_addr *configured_addrs /* 0 if none or not found */,
2323         int n_configured_addrs /* 0 if none or not found */,
2324         const struct comm_addr *incoming_packet_addr /* 0 if none */) {
2325     if (!n_configured_addrs && !incoming_packet_addr &&
2326         !transport_peers_valid(&st->peers))
2327         return False;
2328
2329     slog(st,LOG_SETUP_INIT,
2330          "using: %d configured addr(s);%s %d old peer addrs(es)",
2331          n_configured_addrs,
2332          incoming_packet_addr ? " incoming packet address;" : "",
2333          st->peers.npeers);
2334
2335     /* Non-mobile peers try addresses until one is plausible.  The
2336      * effect is that this code always tries first the configured
2337      * address if supplied, or otherwise the address of the incoming
2338      * PROD, or finally the existing data peer if one exists; this is
2339      * as desired. */
2340
2341     transport_peers_copy(st,&st->setup_peers,&st->peers);
2342     transport_peers_expire(st,&st->setup_peers);
2343
2344     if (incoming_packet_addr)
2345         transport_record_peers(st,&st->setup_peers,
2346                                incoming_packet_addr,1, "incoming");
2347
2348     if (n_configured_addrs)
2349         transport_record_peers(st,&st->setup_peers,
2350                               configured_addrs,n_configured_addrs, "setupinit");
2351
2352     assert(transport_peers_valid(&st->setup_peers));
2353     return True;
2354 }
2355
2356 static void transport_setup_msgok(struct site *st, const struct comm_addr *a) {
2357     if (st->peer_mobile)
2358         transport_expire_record_peers(st,&st->setup_peers,a,1,"setupmsg");
2359 }
2360 static void transport_data_msgok(struct site *st, const struct comm_addr *a) {
2361     if (st->peer_mobile)
2362         transport_expire_record_peers(st,&st->peers,a,1,"datamsg");
2363 }
2364
2365 static int transport_peers_valid(transport_peers *peers) {
2366     return peers->npeers;
2367 }
2368 static void transport_peers_clear(struct site *st, transport_peers *peers) {
2369     peers->npeers= 0;
2370     transport_peers_debug(st,peers,"clear",0,0,0);
2371 }
2372 static void transport_peers_copy(struct site *st, transport_peers *dst,
2373                                  const transport_peers *src) {
2374     dst->npeers=src->npeers;
2375     COPY_ARRAY(dst->peers, src->peers, dst->npeers);
2376     transport_peers_debug(st,dst,"copy",
2377                           src->npeers, &src->peers->addr, sizeof(*src->peers));
2378 }
2379
2380 static void transport_resolve_complete(struct site *st,
2381                                        const struct comm_addr *addrs,
2382                                        int naddrs) {
2383     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2384                                   "resolved data");
2385     transport_expire_record_peers(st,&st->setup_peers,addrs,naddrs,
2386                                   "resolved setup");
2387 }
2388
2389 static void transport_resolve_complete_tardy(struct site *st,
2390                                              const struct comm_addr *addrs,
2391                                              int naddrs) {
2392     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2393                                   "resolved tardily");
2394 }
2395
2396 static void transport_peers__copy_by_mask(transport_peer *out, int *nout_io,
2397                                           unsigned mask,
2398                                           const transport_peers *inp) {
2399     /* out and in->peers may be the same region, or nonoverlapping */
2400     const transport_peer *in=inp->peers;
2401     int slot;
2402     for (slot=0; slot<inp->npeers; slot++) {
2403         if (!(mask & (1U << slot)))
2404             continue;
2405         if (!(out==in && slot==*nout_io))
2406             COPY_OBJ(out[*nout_io], in[slot]);
2407         (*nout_io)++;
2408     }
2409 }
2410
2411 void transport_xmit(struct site *st, transport_peers *peers,
2412                     struct buffer_if *buf, bool_t candebug) {
2413     int slot;
2414     transport_peers_expire(st, peers);
2415     unsigned failed=0; /* bitmask */
2416     assert(MAX_PEER_ADDRS < sizeof(unsigned)*CHAR_BIT);
2417
2418     int nfailed=0;
2419     for (slot=0; slot<peers->npeers; slot++) {
2420         transport_peer *peer=&peers->peers[slot];
2421         bool_t ok = comm_addr_sendmsg(st, &peer->addr, buf);
2422         if (candebug)
2423             dump_packet(st, buf, &peer->addr, False, ok);
2424         if (!ok) {
2425             failed |= 1U << slot;
2426             nfailed++;
2427         }
2428         if (ok && !st->peer_mobile)
2429             break;
2430     }
2431     /* Now we need to demote/delete failing addrs: if we are mobile we
2432      * merely demote them; otherwise we delete them. */
2433     if (st->local_mobile) {
2434         unsigned expected = ((1U << nfailed)-1) << (peers->npeers-nfailed);
2435         /* `expected' has all the failures at the end already */
2436         if (failed != expected) {
2437             int fslot=0;
2438             transport_peer failedpeers[nfailed];
2439             transport_peers__copy_by_mask(failedpeers, &fslot, failed,peers);
2440             assert(fslot == nfailed);
2441             int wslot=0;
2442             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2443             assert(wslot+nfailed == peers->npeers);
2444             COPY_ARRAY(peers->peers+wslot, failedpeers, nfailed);
2445             transport_peers_debug(st,peers,"mobile failure reorder",0,0,0);
2446         }
2447     } else {
2448         if (failed && peers->npeers > 1) {
2449             int wslot=0;
2450             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2451             peers->npeers=wslot;
2452             transport_peers_debug(st,peers,"non-mobile failure cleanup",0,0,0);
2453         }
2454     }
2455 }
2456
2457 /***** END of transport peers declarations *****/