chiark / gitweb /
site.c: Abstract out generation of the Diffie--Hellman private secret.
[secnet] / site.c
1 /* site.c - manage communication with a remote network site */
2
3 /*
4  * This file is part of secnet.
5  * See README for full list of copyright holders.
6  *
7  * secnet is free software; you can redistribute it and/or modify it
8  * under the terms of the GNU General Public License as published by
9  * the Free Software Foundation; either version 3 of the License, or
10  * (at your option) any later version.
11  * 
12  * secnet is distributed in the hope that it will be useful, but
13  * WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15  * General Public License for more details.
16  * 
17  * You should have received a copy of the GNU General Public License
18  * version 3 along with secnet; if not, see
19  * https://www.gnu.org/licenses/gpl.html.
20  */
21
22 /* The 'site' code doesn't know anything about the structure of the
23    packets it's transmitting.  In fact, under the new netlink
24    configuration scheme it doesn't need to know anything at all about
25    IP addresses, except how to contact its peer.  This means it could
26    potentially be used to tunnel other protocols too (IPv6, IPX, plain
27    old Ethernet frames) if appropriate netlink code can be written
28    (and that ought not to be too hard, eg. using the TUN/TAP device to
29    pretend to be an Ethernet interface).  */
30
31 /* At some point in the future the netlink code will be asked for
32    configuration information to go in the PING/PONG packets at the end
33    of the key exchange. */
34
35 #include "secnet.h"
36 #include <stdio.h>
37 #include <string.h>
38 #include <limits.h>
39 #include <assert.h>
40 #include <sys/socket.h>
41
42 #include <sys/mman.h>
43 #include "util.h"
44 #include "unaligned.h"
45 #include "magic.h"
46
47 #define SETUP_BUFFER_LEN 2048
48
49 #define DEFAULT_KEY_LIFETIME                  (3600*1000) /* [ms] */
50 #define DEFAULT_KEY_RENEGOTIATE_GAP           (5*60*1000) /* [ms] */
51 #define DEFAULT_SETUP_RETRIES 5
52 #define DEFAULT_SETUP_RETRY_INTERVAL             (2*1000) /* [ms] */
53 #define DEFAULT_WAIT_TIME                       (20*1000) /* [ms] */
54
55 #define DEFAULT_MOBILE_KEY_LIFETIME      (2*24*3600*1000) /* [ms] */
56 #define DEFAULT_MOBILE_KEY_RENEGOTIATE_GAP (12*3600*1000) /* [ms] */
57 #define DEFAULT_MOBILE_SETUP_RETRIES 30
58 #define DEFAULT_MOBILE_SETUP_RETRY_INTERVAL      (1*1000) /* [ms] */
59 #define DEFAULT_MOBILE_WAIT_TIME                (10*1000) /* [ms] */
60
61 #define DEFAULT_MOBILE_PEER_EXPIRY            (2*60)      /* [s] */
62
63 /* Each site can be in one of several possible states. */
64
65 /* States:
66    SITE_STOP         - nothing is allowed to happen; tunnel is down;
67                        all session keys have been erased
68      -> SITE_RUN upon external instruction
69    SITE_RUN          - site up, maybe with valid key
70      -> SITE_RESOLVE upon outgoing packet and no valid key
71          we start name resolution for the other end of the tunnel
72      -> SITE_SENTMSG2 upon valid incoming message 1 and suitable time
73          we send an appropriate message 2
74    SITE_RESOLVE      - waiting for name resolution
75      -> SITE_SENTMSG1 upon successful resolution
76          we send an appropriate message 1
77      -> SITE_SENTMSG2 upon valid incoming message 1 (then abort resolution)
78          we abort resolution and 
79      -> SITE_WAIT on timeout or resolution failure
80    SITE_SENTMSG1
81      -> SITE_SENTMSG2 upon valid incoming message 1 from higher priority end
82      -> SITE_SENTMSG3 upon valid incoming message 2
83      -> SITE_WAIT on timeout
84    SITE_SENTMSG2
85      -> SITE_SENTMSG4 upon valid incoming message 3
86      -> SITE_WAIT on timeout
87    SITE_SENTMSG3
88      -> SITE_SENTMSG5 upon valid incoming message 4
89      -> SITE_WAIT on timeout
90    SITE_SENTMSG4
91      -> SITE_RUN upon valid incoming message 5
92      -> SITE_WAIT on timeout
93    SITE_SENTMSG5
94      -> SITE_RUN upon valid incoming message 6
95      -> SITE_WAIT on timeout
96    SITE_WAIT         - failed to establish key; do nothing for a while
97      -> SITE_RUN on timeout
98    */
99
100 #define SITE_STOP     0
101 #define SITE_RUN      1
102 #define SITE_RESOLVE  2
103 #define SITE_SENTMSG1 3
104 #define SITE_SENTMSG2 4
105 #define SITE_SENTMSG3 5
106 #define SITE_SENTMSG4 6
107 #define SITE_SENTMSG5 7
108 #define SITE_WAIT     8
109
110 #define CASES_MSG3_KNOWN LABEL_MSG3: case LABEL_MSG3BIS
111
112 int32_t site_max_start_pad = 4*4;
113
114 static cstring_t state_name(uint32_t state)
115 {
116     switch (state) {
117     case 0: return "STOP";
118     case 1: return "RUN";
119     case 2: return "RESOLVE";
120     case 3: return "SENTMSG1";
121     case 4: return "SENTMSG2";
122     case 5: return "SENTMSG3";
123     case 6: return "SENTMSG4";
124     case 7: return "SENTMSG5";
125     case 8: return "WAIT";
126     default: return "*bad state*";
127     }
128 }
129
130 #define NONCELEN 8
131
132 #define LOG_UNEXPECTED    0x00000001
133 #define LOG_SETUP_INIT    0x00000002
134 #define LOG_SETUP_TIMEOUT 0x00000004
135 #define LOG_ACTIVATE_KEY  0x00000008
136 #define LOG_TIMEOUT_KEY   0x00000010
137 #define LOG_SEC           0x00000020
138 #define LOG_STATE         0x00000040
139 #define LOG_DROP          0x00000080
140 #define LOG_DUMP          0x00000100
141 #define LOG_ERROR         0x00000400
142 #define LOG_PEER_ADDRS    0x00000800
143
144 static struct flagstr log_event_table[]={
145     { "unexpected", LOG_UNEXPECTED },
146     { "setup-init", LOG_SETUP_INIT },
147     { "setup-timeout", LOG_SETUP_TIMEOUT },
148     { "activate-key", LOG_ACTIVATE_KEY },
149     { "timeout-key", LOG_TIMEOUT_KEY },
150     { "security", LOG_SEC },
151     { "state-change", LOG_STATE },
152     { "packet-drop", LOG_DROP },
153     { "dump-packets", LOG_DUMP },
154     { "errors", LOG_ERROR },
155     { "peer-addrs", LOG_PEER_ADDRS },
156     { "default", LOG_SETUP_INIT|LOG_SETUP_TIMEOUT|
157       LOG_ACTIVATE_KEY|LOG_TIMEOUT_KEY|LOG_SEC|LOG_ERROR },
158     { "all", 0xffffffff },
159     { NULL, 0 }
160 };
161
162
163 /***** TRANSPORT PEERS declarations *****/
164
165 /* Details of "mobile peer" semantics:
166
167    - We use the same data structure for the different configurations,
168      but manage it with different algorithms.
169    
170    - We record up to mobile_peers_max peer address/port numbers
171      ("peers") for key setup, and separately up to mobile_peers_max
172      for data transfer.
173
174    - In general, we make a new set of addrs (see below) when we start
175      a new key exchange; the key setup addrs become the data transport
176      addrs when key setup complets.
177
178    If our peer is mobile:
179
180    - We send to all recent addresses of incoming packets, plus
181      initially all configured addresses (which we also expire).
182
183    - So, we record addrs of good incoming packets, as follows:
184       1. expire any peers last seen >120s ("mobile-peer-expiry") ago
185       2. add the peer of the just received packet to the applicable list
186          (possibly evicting the oldest entries to make room)
187      NB that we do not expire peers until an incoming packet arrives.
188
189    - If the peer has a configured address or name, we record them the
190      same way, but only as a result of our own initiation of key
191      setup.  (We might evict some incoming packet addrs to make room.)
192
193    - The default number of addrs to keep is 3, or 4 if we have a
194      configured name or address.  That's space for two configured
195      addresses (one IPv6 and one IPv4), plus two received addresses.
196
197    - Outgoing packets are sent to every recorded address in the
198      applicable list.  Any unsupported[1] addresses are deleted from
199      the list right away.  (This should only happen to configured
200      addresses, of course, but there is no need to check that.)
201
202    - When we successfully complete a key setup, we merge the key setup
203      peers into the data transfer peers.
204
205    [1] An unsupported address is one for whose AF we don't have a
206      socket (perhaps because we got EAFNOSUPPORT or some such) or for
207      which sendto gives ENETUNREACH.
208
209    If neither end is mobile:
210
211    - When peer initiated the key exchange, we use the incoming packet
212      address.
213
214    - When we initiate the key exchange, we try configured addresses
215      until we get one which isn't unsupported then fixate on that.
216
217    - When we complete a key setup, we replace the data transport peers
218      with those from the key setup.
219
220    If we are mobile:
221
222    - We can't tell when local network setup changes so we can't cache
223      the unsupported addrs and completely remove the spurious calls to
224      sendto, but we can optimise things a bit by deprioritising addrs
225      which seem to be unsupported.
226
227    - Use only configured addresses.  (Except, that if our peer
228      initiated a key exchange we use the incoming packet address until
229      our name resolution completes.)
230
231    - When we send a packet, try each address in turn; if addr
232      supported, put that address to the end of the list for future
233      packets, and go onto the next address.
234
235    - When we complete a key setup, we replace the data transport peers
236      with those from the key setup.
237
238    */
239
240 typedef struct {
241     struct timeval last;
242     struct comm_addr addr;
243 } transport_peer;
244
245 typedef struct {
246 /* configuration information */
247 /* runtime information */
248     int npeers;
249     transport_peer peers[MAX_PEER_ADDRS];
250 } transport_peers;
251
252 /* Basic operations on transport peer address sets */
253 static void transport_peers_clear(struct site *st, transport_peers *peers);
254 static int transport_peers_valid(transport_peers *peers);
255 static void transport_peers_copy(struct site *st, transport_peers *dst,
256                                  const transport_peers *src);
257
258 /* Record address of incoming setup packet; resp. data packet. */
259 static void transport_setup_msgok(struct site *st, const struct comm_addr *a);
260 static void transport_data_msgok(struct site *st, const struct comm_addr *a);
261
262 /* Initialise the setup addresses.  Called before we send the first
263  * packet in a key exchange.  If we are the initiator, as a result of
264  * resolve completing (or being determined not to be relevant) or an
265  * incoming PROD; if we are the responder, as a result of the MSG1. */
266 static bool_t transport_compute_setupinit_peers(struct site *st,
267         const struct comm_addr *configured_addrs /* 0 if none or not found */,
268         int n_configured_addrs /* 0 if none or not found */,
269         const struct comm_addr *incoming_packet_addr /* 0 if none */);
270
271 /* Called if we are the responder in a key setup, when the resolve
272  * completes.  transport_compute_setupinit_peers will hvae been called
273  * earlier.  If _complete is called, we are still doing the key setup
274  * (and we should use the new values for both the rest of the key
275  * setup and the ongoing data exchange); if _tardy is called, the key
276  * setup is done (either completed or not) and only the data peers are
277  * relevant */
278 static void transport_resolve_complete(struct site *st,
279         const struct comm_addr *addrs, int naddrs);
280 static void transport_resolve_complete_tardy(struct site *st,
281         const struct comm_addr *addrs, int naddrs);
282
283 static void transport_xmit(struct site *st, transport_peers *peers,
284                            struct buffer_if *buf, bool_t candebug);
285
286  /***** END of transport peers declarations *****/
287
288
289 struct data_key {
290     struct transform_inst_if *transform;
291     uint64_t key_timeout; /* End of life of current key */
292     uint32_t remote_session_id;
293 };
294
295 struct site {
296     closure_t cl;
297     struct site_if ops;
298 /* configuration information */
299     string_t localname;
300     string_t remotename;
301     bool_t keepalive;
302     bool_t local_mobile, peer_mobile; /* Mobile client support */
303     int32_t transport_peers_max;
304     string_t tunname; /* localname<->remotename by default, used in logs */
305     cstring_t *addresses; /* DNS name or address(es) for bootstrapping, optional */
306     int remoteport; /* Port for bootstrapping, optional */
307     uint32_t mtu_target;
308     struct netlink_if *netlink;
309     struct comm_if **comms;
310     struct comm_clientinfo **commclientinfos;
311     int ncomms;
312     struct resolver_if *resolver;
313     struct log_if *log;
314     struct random_if *random;
315     struct rsaprivkey_if *privkey;
316     struct rsapubkey_if *pubkey;
317     struct transform_if **transforms;
318     int ntransforms;
319     struct dh_if *dh;
320     struct hash_if *hash;
321
322     uint32_t index; /* Index of this site */
323     uint32_t early_capabilities;
324     uint32_t local_capabilities;
325     int32_t setup_retries; /* How many times to send setup packets */
326     int32_t setup_retry_interval; /* Initial timeout for setup packets */
327     int32_t wait_timeout_mean; /* How long to wait if setup unsuccessful */
328     int32_t mobile_peer_expiry; /* How long to remember 2ary addresses */
329     int32_t key_lifetime; /* How long a key lasts once set up */
330     int32_t key_renegotiate_time; /* If we see traffic (or a keepalive)
331                                       after this time, initiate a new
332                                       key exchange */
333
334     bool_t our_name_later; /* our name > peer name */
335     uint32_t log_events;
336
337 /* runtime information */
338     uint32_t state;
339     uint64_t now; /* Most recently seen time */
340     bool_t allow_send_prod;
341     bool_t msg1_crossed_logged;
342     int resolving_count;
343     int resolving_n_results_all;
344     int resolving_n_results_stored;
345     struct comm_addr resolving_results[MAX_PEER_ADDRS];
346
347     /* The currently established session */
348     struct data_key current;
349     struct data_key auxiliary_key;
350     bool_t auxiliary_is_new;
351     uint64_t renegotiate_key_time; /* When we can negotiate a new key */
352     uint64_t auxiliary_renegotiate_key_time;
353     transport_peers peers; /* Current address(es) of peer for data traffic */
354
355     /* The current key setup protocol exchange.  We can only be
356        involved in one of these at a time.  There's a potential for
357        denial of service here (the attacker keeps sending a setup
358        packet; we keep trying to continue the exchange, and have to
359        timeout before we can listen for another setup packet); perhaps
360        we should keep a list of 'bad' sources for setup packets. */
361     uint32_t remote_capabilities;
362     uint16_t remote_adv_mtu;
363     struct transform_if *chosen_transform;
364     uint32_t setup_session_id;
365     transport_peers setup_peers;
366     uint8_t localN[NONCELEN]; /* Nonces for key exchange */
367     uint8_t remoteN[NONCELEN];
368     struct buffer_if buffer; /* Current outgoing key exchange packet */
369     struct buffer_if scratch;
370     int32_t retries; /* Number of retries remaining */
371     uint64_t timeout; /* Timeout for current state */
372     uint8_t *dhsecret;
373     uint8_t *sharedsecret;
374     struct transform_inst_if *new_transform; /* For key setup/verify */
375 };
376
377 static uint32_t event_log_priority(struct site *st, uint32_t event)
378 {
379     if (!(event&st->log_events))
380         return 0;
381     switch(event) {
382     case LOG_UNEXPECTED:    return M_INFO;
383     case LOG_SETUP_INIT:    return M_INFO;
384     case LOG_SETUP_TIMEOUT: return M_NOTICE;
385     case LOG_ACTIVATE_KEY:  return M_INFO;
386     case LOG_TIMEOUT_KEY:   return M_INFO;
387     case LOG_SEC:           return M_SECURITY;
388     case LOG_STATE:         return M_DEBUG;
389     case LOG_DROP:          return M_DEBUG;
390     case LOG_DUMP:          return M_DEBUG;
391     case LOG_ERROR:         return M_ERR;
392     case LOG_PEER_ADDRS:    return M_DEBUG;
393     default:                return M_ERR;
394     }
395 }
396
397 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
398 FORMAT(printf,3,0);
399 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
400 {
401     uint32_t class;
402
403     class=event_log_priority(st, event);
404     if (class) {
405         slilog_part(st->log,class,"%s: ",st->tunname);
406         vslilog_part(st->log,class,msg,ap);
407         slilog_part(st->log,class,"\n");
408     }
409 }
410
411 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
412 FORMAT(printf,3,4);
413 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
414 {
415     va_list ap;
416     va_start(ap,msg);
417     vslog(st,event,msg,ap);
418     va_end(ap);
419 }
420
421 static void logtimeout(struct site *st, const char *fmt, ...)
422 FORMAT(printf,2,3);
423 static void logtimeout(struct site *st, const char *fmt, ...)
424 {
425     uint32_t class=event_log_priority(st,LOG_SETUP_TIMEOUT);
426     if (!class)
427         return;
428
429     va_list ap;
430     va_start(ap,fmt);
431
432     slilog_part(st->log,class,"%s: ",st->tunname);
433     vslilog_part(st->log,class,fmt,ap);
434
435     const char *delim;
436     int i;
437     for (i=0, delim=" (tried ";
438          i<st->setup_peers.npeers;
439          i++, delim=", ") {
440         transport_peer *peer=&st->setup_peers.peers[i];
441         const char *s=comm_addr_to_string(&peer->addr);
442         slilog_part(st->log,class,"%s%s",delim,s);
443     }
444
445     slilog_part(st->log,class,")\n");
446     va_end(ap);
447 }
448
449 static void set_link_quality(struct site *st);
450 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel);
451 static void delete_one_key(struct site *st, struct data_key *key,
452                            const char *reason /* may be 0 meaning don't log*/,
453                            const char *which /* ignored if !reasonn */,
454                            uint32_t loglevel /* ignored if !reasonn */);
455 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
456                                  const struct comm_addr *prod_hint);
457 static void enter_state_run(struct site *st);
458 static bool_t enter_state_resolve(struct site *st);
459 static void decrement_resolving_count(struct site *st, int by);
460 static bool_t enter_new_state(struct site *st,uint32_t next);
461 static void enter_state_wait(struct site *st);
462 static void activate_new_key(struct site *st);
463
464 static bool_t is_transform_valid(struct transform_inst_if *transform)
465 {
466     return transform && transform->valid(transform->st);
467 }
468
469 static bool_t current_valid(struct site *st)
470 {
471     return is_transform_valid(st->current.transform);
472 }
473
474 #define DEFINE_CALL_TRANSFORM(fwdrev)                                   \
475 static transform_apply_return                                           \
476 call_transform_##fwdrev(struct site *st,                                \
477                                    struct transform_inst_if *transform, \
478                                    struct buffer_if *buf,               \
479                                    const char **errmsg)                 \
480 {                                                                       \
481     if (!is_transform_valid(transform)) {                               \
482         *errmsg="transform not set up";                                 \
483         return transform_apply_err;                                     \
484     }                                                                   \
485     return transform->fwdrev(transform->st,buf,errmsg);                 \
486 }
487
488 DEFINE_CALL_TRANSFORM(forwards)
489 DEFINE_CALL_TRANSFORM(reverse)
490
491 static void dispose_transform(struct transform_inst_if **transform_var)
492 {
493     struct transform_inst_if *transform=*transform_var;
494     if (transform) {
495         transform->delkey(transform->st);
496         transform->destroy(transform->st);
497     }
498     *transform_var = 0;
499 }    
500
501 #define CHECK_AVAIL(b,l) do { if ((b)->size<(l)) return False; } while(0)
502 #define CHECK_EMPTY(b) do { if ((b)->size!=0) return False; } while(0)
503 #define CHECK_TYPE(b,t) do { uint32_t type; \
504     CHECK_AVAIL((b),4); \
505     type=buf_unprepend_uint32((b)); \
506     if (type!=(t)) return False; } while(0)
507
508 static _Bool type_is_msg34(uint32_t type)
509 {
510     switch (type) {
511         case CASES_MSG3_KNOWN: case LABEL_MSG4: return True;
512         default: return False;
513     }
514 }
515
516 struct parsedname {
517     int32_t len;
518     uint8_t *name;
519     struct buffer_if extrainfo;
520 };
521
522 struct msg {
523     uint8_t *hashstart;
524     uint32_t dest;
525     uint32_t source;
526     struct parsedname remote;
527     struct parsedname local;
528     uint32_t remote_capabilities;
529     uint16_t remote_mtu;
530     int capab_transformnum;
531     uint8_t *nR;
532     uint8_t *nL;
533     int32_t pklen;
534     char *pk;
535     int32_t hashlen;
536     int32_t siglen;
537     char *sig;
538 };
539
540 static int32_t wait_timeout(struct site *st) {
541     int32_t t = st->wait_timeout_mean;
542     int8_t factor;
543     if (t < INT_MAX/2) {
544         st->random->generate(st->random->st,sizeof(factor),&factor);
545         t += (t / 256) * factor;
546     }
547     return t;
548 }
549
550 static _Bool set_new_transform(struct site *st, char *pk)
551 {
552     _Bool ok;
553
554     /* Generate the shared key */
555     if (!st->dh->makeshared(st->dh->st,st->dhsecret,st->dh->secret_len,
556                             pk, st->sharedsecret,st->dh->shared_len))
557         return False;
558
559     /* Set up the transform */
560     struct transform_if *generator=st->chosen_transform;
561     struct transform_inst_if *generated=generator->create(generator->st);
562     ok = generated->setkey(generated->st,st->sharedsecret,
563                            st->dh->shared_len,st->our_name_later);
564
565     dispose_transform(&st->new_transform);
566     if (!ok) return False;
567     st->new_transform=generated;
568
569     slog(st,LOG_SETUP_INIT,"key exchange negotiated transform"
570          " %d (capabilities ours=%#"PRIx32" theirs=%#"PRIx32")",
571          st->chosen_transform->capab_bit,
572          st->local_capabilities, st->remote_capabilities);
573     return True;
574 }
575
576 struct xinfoadd {
577     int32_t lenpos, afternul;
578 };
579 static void append_string_xinfo_start(struct buffer_if *buf,
580                                       struct xinfoadd *xia,
581                                       const char *str)
582     /* Helps construct one of the names with additional info as found
583      * in MSG1..4.  Call this function first, then append all the
584      * desired extra info (not including the nul byte) to the buffer,
585      * then call append_string_xinfo_done. */
586 {
587     xia->lenpos = buf->size;
588     buf_append_string(buf,str);
589     buf_append_uint8(buf,0);
590     xia->afternul = buf->size;
591 }
592 static void append_string_xinfo_done(struct buffer_if *buf,
593                                      struct xinfoadd *xia)
594 {
595     /* we just need to adjust the string length */
596     if (buf->size == xia->afternul) {
597         /* no extra info, strip the nul too */
598         buf_unappend_uint8(buf);
599     } else {
600         put_uint16(buf->start+xia->lenpos, buf->size-(xia->lenpos+2));
601     }
602 }
603
604 /* Build any of msg1 to msg4. msg5 and msg6 are built from the inside
605    out using a transform of config data supplied by netlink */
606 static bool_t generate_msg(struct site *st, uint32_t type, cstring_t what)
607 {
608     void *hst;
609     uint8_t *hash;
610     string_t dhpub, sig;
611     unsigned minor;
612
613     st->retries=st->setup_retries;
614     BUF_ALLOC(&st->buffer,what);
615     buffer_init(&st->buffer,0);
616     buf_append_uint32(&st->buffer,
617         (type==LABEL_MSG1?0:st->setup_session_id));
618     buf_append_uint32(&st->buffer,st->index);
619     buf_append_uint32(&st->buffer,type);
620
621     struct xinfoadd xia;
622     append_string_xinfo_start(&st->buffer,&xia,st->localname);
623     if ((st->local_capabilities & st->early_capabilities) ||
624         (type != LABEL_MSG1)) {
625         buf_append_uint32(&st->buffer,st->local_capabilities);
626     }
627     if (type_is_msg34(type)) {
628         buf_append_uint16(&st->buffer,st->mtu_target);
629     }
630     append_string_xinfo_done(&st->buffer,&xia);
631
632     buf_append_string(&st->buffer,st->remotename);
633     BUF_ADD_OBJ(append,&st->buffer,st->localN);
634     if (type==LABEL_MSG1) return True;
635     BUF_ADD_OBJ(append,&st->buffer,st->remoteN);
636     if (type==LABEL_MSG2) return True;
637
638     if (hacky_par_mid_failnow()) return False;
639
640     if (MSGMAJOR(type) == 3) do {
641         minor = MSGMINOR(type);
642         if (minor < 1) break;
643         buf_append_uint8(&st->buffer,st->chosen_transform->capab_bit);
644     } while (0);
645
646     dhpub=st->dh->makepublic(st->dh->st,st->dhsecret,st->dh->secret_len);
647     buf_append_string(&st->buffer,dhpub);
648     free(dhpub);
649     hash=safe_malloc(st->hash->len, "generate_msg");
650     hst=st->hash->init();
651     st->hash->update(hst,st->buffer.start,st->buffer.size);
652     st->hash->final(hst,hash);
653     sig=st->privkey->sign(st->privkey->st,hash,st->hash->len);
654     buf_append_string(&st->buffer,sig);
655     free(sig);
656     free(hash);
657     return True;
658 }
659
660 static bool_t unpick_name(struct buffer_if *msg, struct parsedname *nm)
661 {
662     CHECK_AVAIL(msg,2);
663     nm->len=buf_unprepend_uint16(msg);
664     CHECK_AVAIL(msg,nm->len);
665     nm->name=buf_unprepend(msg,nm->len);
666     uint8_t *nul=memchr(nm->name,0,nm->len);
667     if (!nul) {
668         buffer_readonly_view(&nm->extrainfo,0,0);
669     } else {
670         buffer_readonly_view(&nm->extrainfo, nul+1, msg->start-(nul+1));
671         nm->len=nul-nm->name;
672     }
673     return True;
674 }
675
676 static bool_t unpick_msg(struct site *st, uint32_t type,
677                          struct buffer_if *msg, struct msg *m)
678 {
679     unsigned minor;
680
681     m->capab_transformnum=-1;
682     m->hashstart=msg->start;
683     CHECK_AVAIL(msg,4);
684     m->dest=buf_unprepend_uint32(msg);
685     CHECK_AVAIL(msg,4);
686     m->source=buf_unprepend_uint32(msg);
687     CHECK_TYPE(msg,type);
688     if (!unpick_name(msg,&m->remote)) return False;
689     m->remote_capabilities=0;
690     m->remote_mtu=0;
691     if (m->remote.extrainfo.size) {
692         CHECK_AVAIL(&m->remote.extrainfo,4);
693         m->remote_capabilities=buf_unprepend_uint32(&m->remote.extrainfo);
694     }
695     if (type_is_msg34(type) && m->remote.extrainfo.size) {
696         CHECK_AVAIL(&m->remote.extrainfo,2);
697         m->remote_mtu=buf_unprepend_uint16(&m->remote.extrainfo);
698     }
699     if (!unpick_name(msg,&m->local)) return False;
700     if (type==LABEL_PROD) {
701         CHECK_EMPTY(msg);
702         return True;
703     }
704     CHECK_AVAIL(msg,NONCELEN);
705     m->nR=buf_unprepend(msg,NONCELEN);
706     if (type==LABEL_MSG1) {
707         CHECK_EMPTY(msg);
708         return True;
709     }
710     CHECK_AVAIL(msg,NONCELEN);
711     m->nL=buf_unprepend(msg,NONCELEN);
712     if (type==LABEL_MSG2) {
713         CHECK_EMPTY(msg);
714         return True;
715     }
716     if (MSGMAJOR(type) == 3) do {
717         minor = MSGMINOR(type);
718 #define MAYBE_READ_CAP(minminor, kind, dflt) do {                       \
719     if (minor < (minminor))                                             \
720         m->capab_##kind##num = (dflt);                                  \
721     else {                                                              \
722         CHECK_AVAIL(msg, 1);                                            \
723         m->capab_##kind##num = buf_unprepend_uint8(msg);                \
724     }                                                                   \
725 } while (0)
726         MAYBE_READ_CAP(1, transform, CAPAB_BIT_ANCIENTTRANSFORM);
727 #undef MAYBE_READ_CAP
728     } while (0);
729     CHECK_AVAIL(msg,2);
730     m->pklen=buf_unprepend_uint16(msg);
731     CHECK_AVAIL(msg,m->pklen);
732     m->pk=buf_unprepend(msg,m->pklen);
733     m->hashlen=msg->start-m->hashstart;
734     CHECK_AVAIL(msg,2);
735     m->siglen=buf_unprepend_uint16(msg);
736     CHECK_AVAIL(msg,m->siglen);
737     m->sig=buf_unprepend(msg,m->siglen);
738     CHECK_EMPTY(msg);
739
740     /* In `process_msg3_msg4' below, we assume that we can write a nul
741      * terminator following the signature.  Make sure there's enough space.
742      */
743     if (msg->start >= msg->base + msg->alloclen)
744         return False;
745
746     return True;
747 }
748
749 static bool_t name_matches(const struct parsedname *nm, const char *expected)
750 {
751     int expected_len=strlen(expected);
752     return
753         nm->len == expected_len &&
754         !memcmp(nm->name, expected, expected_len);
755 }    
756
757 static bool_t check_msg(struct site *st, uint32_t type, struct msg *m,
758                         cstring_t *error)
759 {
760     if (type==LABEL_MSG1) return True;
761
762     /* Check that the site names and our nonce have been sent
763        back correctly, and then store our peer's nonce. */ 
764     if (!name_matches(&m->remote,st->remotename)) {
765         *error="wrong remote site name";
766         return False;
767     }
768     if (!name_matches(&m->local,st->localname)) {
769         *error="wrong local site name";
770         return False;
771     }
772     if (memcmp(m->nL,st->localN,NONCELEN)!=0) {
773         *error="wrong locally-generated nonce";
774         return False;
775     }
776     if (type==LABEL_MSG2) return True;
777     if (!consttime_memeq(m->nR,st->remoteN,NONCELEN)) {
778         *error="wrong remotely-generated nonce";
779         return False;
780     }
781     /* MSG3 has complicated rules about capabilities, which are
782      * handled in process_msg3. */
783     if (MSGMAJOR(type) == 3) return True;
784     if (m->remote_capabilities!=st->remote_capabilities) {
785         *error="remote capabilities changed";
786         return False;
787     }
788     if (type==LABEL_MSG4) return True;
789     *error="unknown message type";
790     return False;
791 }
792
793 static bool_t generate_msg1(struct site *st)
794 {
795     st->random->generate(st->random->st,NONCELEN,st->localN);
796     return generate_msg(st,LABEL_MSG1,"site:MSG1");
797 }
798
799 static bool_t process_msg1(struct site *st, struct buffer_if *msg1,
800                            const struct comm_addr *src, struct msg *m)
801 {
802     /* We've already determined we're in an appropriate state to
803        process an incoming MSG1, and that the MSG1 has correct values
804        of A and B. */
805
806     st->setup_session_id=m->source;
807     st->remote_capabilities=m->remote_capabilities;
808     memcpy(st->remoteN,m->nR,NONCELEN);
809     return True;
810 }
811
812 static bool_t generate_msg2(struct site *st)
813 {
814     st->random->generate(st->random->st,NONCELEN,st->localN);
815     return generate_msg(st,LABEL_MSG2,"site:MSG2");
816 }
817
818 static bool_t process_msg2(struct site *st, struct buffer_if *msg2,
819                            const struct comm_addr *src)
820 {
821     struct msg m;
822     cstring_t err;
823
824     if (!unpick_msg(st,LABEL_MSG2,msg2,&m)) return False;
825     if (!check_msg(st,LABEL_MSG2,&m,&err)) {
826         slog(st,LOG_SEC,"msg2: %s",err);
827         return False;
828     }
829     st->setup_session_id=m.source;
830     st->remote_capabilities=m.remote_capabilities;
831
832     /* Select the transform to use */
833
834     uint32_t remote_crypto_caps = st->remote_capabilities & CAPAB_TRANSFORM_MASK;
835     if (!remote_crypto_caps)
836         /* old secnets only had this one transform */
837         remote_crypto_caps = 1UL << CAPAB_BIT_ANCIENTTRANSFORM;
838
839 #define CHOOSE_CRYPTO(kind, whats) do {                                 \
840     struct kind##_if *iface;                                            \
841     uint32_t bit, ours = 0;                                             \
842     int i;                                                              \
843     for (i= 0; i < st->n##kind##s; i++) {                               \
844         iface=st->kind##s[i];                                           \
845         bit = 1UL << iface->capab_bit;                                  \
846         if (bit & remote_crypto_caps) goto kind##_found;                \
847         ours |= bit;                                                    \
848     }                                                                   \
849     slog(st,LOG_ERROR,"no " whats " in common"                          \
850          " (us %#"PRIx32"; them: %#"PRIx32")",                          \
851          st->local_capabilities & ours, remote_crypto_caps);            \
852     return False;                                                       \
853 kind##_found:                                                           \
854     st->chosen_##kind = iface;                                          \
855 } while (0)
856
857     CHOOSE_CRYPTO(transform, "transforms");
858
859 #undef CHOOSE_CRYPTO
860
861     memcpy(st->remoteN,m.nR,NONCELEN);
862     return True;
863 }
864
865 static void generate_dhsecret(struct site *st)
866 {
867     st->random->generate(st->random->st, st->dh->secret_len,st->dhsecret);
868 }
869
870 static bool_t generate_msg3(struct site *st)
871 {
872     /* Now we have our nonce and their nonce. Think of a secret key,
873        and create message number 3. */
874     generate_dhsecret(st);
875     return generate_msg(st,
876                         (st->remote_capabilities & CAPAB_TRANSFORM_MASK)
877                         ? LABEL_MSG3BIS
878                         : LABEL_MSG3,
879                         "site:MSG3");
880 }
881
882 static bool_t process_msg3_msg4(struct site *st, struct msg *m)
883 {
884     uint8_t *hash;
885     void *hst;
886
887     /* Check signature and store g^x mod m */
888     hash=safe_malloc(st->hash->len, "process_msg3_msg4");
889     hst=st->hash->init();
890     st->hash->update(hst,m->hashstart,m->hashlen);
891     st->hash->final(hst,hash);
892     /* Terminate signature with a '0' - already checked that this will fit */
893     m->sig[m->siglen]=0;
894     if (!st->pubkey->check(st->pubkey->st,hash,st->hash->len,m->sig)) {
895         slog(st,LOG_SEC,"msg3/msg4 signature failed check!");
896         free(hash);
897         return False;
898     }
899     free(hash);
900
901     st->remote_adv_mtu=m->remote_mtu;
902
903     return True;
904 }
905
906 static bool_t process_msg3(struct site *st, struct buffer_if *msg3,
907                            const struct comm_addr *src, uint32_t msgtype)
908 {
909     struct msg m;
910     cstring_t err;
911
912     switch (msgtype) {
913         case CASES_MSG3_KNOWN: break;
914         default: assert(0);
915     }
916
917     if (!unpick_msg(st,msgtype,msg3,&m)) return False;
918     if (!check_msg(st,msgtype,&m,&err)) {
919         slog(st,LOG_SEC,"msg3: %s",err);
920         return False;
921     }
922     uint32_t capab_adv_late = m.remote_capabilities
923         & ~st->remote_capabilities & st->early_capabilities;
924     if (capab_adv_late) {
925         slog(st,LOG_SEC,"msg3 impermissibly adds early capability flag(s)"
926              " %#"PRIx32" (was %#"PRIx32", now %#"PRIx32")",
927              capab_adv_late, st->remote_capabilities, m.remote_capabilities);
928         return False;
929     }
930     st->remote_capabilities|=m.remote_capabilities;
931
932 #define CHOSE_CRYPTO(kind, what) do {                                   \
933     struct kind##_if *iface;                                            \
934     int i;                                                              \
935     for (i=0; i<st->n##kind##s; i++) {                                  \
936         iface=st->kind##s[i];                                           \
937         if (iface->capab_bit == m.capab_##kind##num)                    \
938             goto kind##_found;                                          \
939     }                                                                   \
940     slog(st,LOG_SEC,"peer chose unknown-to-us " what " %d!",            \
941          m.capab_##kind##num);                                                  \
942     return False;                                                       \
943 kind##_found:                                                           \
944     st->chosen_##kind=iface;                                            \
945 } while (0)
946
947     CHOSE_CRYPTO(transform, "transform");
948
949 #undef CHOSE_CRYPTO
950
951     if (!process_msg3_msg4(st,&m))
952         return False;
953
954     /* Terminate their DH public key with a '0' */
955     m.pk[m.pklen]=0;
956     /* Invent our DH secret key */
957     generate_dhsecret(st);
958
959     /* Generate the shared key and set up the transform */
960     if (!set_new_transform(st,m.pk)) return False;
961
962     return True;
963 }
964
965 static bool_t generate_msg4(struct site *st)
966 {
967     /* We have both nonces, their public key and our private key. Generate
968        our public key, sign it and send it to them. */
969     return generate_msg(st,LABEL_MSG4,"site:MSG4");
970 }
971
972 static bool_t process_msg4(struct site *st, struct buffer_if *msg4,
973                            const struct comm_addr *src)
974 {
975     struct msg m;
976     cstring_t err;
977
978     if (!unpick_msg(st,LABEL_MSG4,msg4,&m)) return False;
979     if (!check_msg(st,LABEL_MSG4,&m,&err)) {
980         slog(st,LOG_SEC,"msg4: %s",err);
981         return False;
982     }
983     
984     if (!process_msg3_msg4(st,&m))
985         return False;
986
987     /* Terminate their DH public key with a '0' */
988     m.pk[m.pklen]=0;
989
990     /* Generate the shared key and set up the transform */
991     if (!set_new_transform(st,m.pk)) return False;
992
993     return True;
994 }
995
996 struct msg0 {
997     uint32_t dest;
998     uint32_t source;
999     uint32_t type;
1000 };
1001
1002 static bool_t unpick_msg0(struct site *st, struct buffer_if *msg0,
1003                           struct msg0 *m)
1004 {
1005     CHECK_AVAIL(msg0,4);
1006     m->dest=buf_unprepend_uint32(msg0);
1007     CHECK_AVAIL(msg0,4);
1008     m->source=buf_unprepend_uint32(msg0);
1009     CHECK_AVAIL(msg0,4);
1010     m->type=buf_unprepend_uint32(msg0);
1011     return True;
1012     /* Leaves transformed part of buffer untouched */
1013 }
1014
1015 static bool_t generate_msg5(struct site *st)
1016 {
1017     cstring_t transform_err;
1018
1019     BUF_ALLOC(&st->buffer,"site:MSG5");
1020     /* We are going to add four words to the message */
1021     buffer_init(&st->buffer,calculate_max_start_pad());
1022     /* Give the netlink code an opportunity to put its own stuff in the
1023        message (configuration information, etc.) */
1024     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
1025     if (call_transform_forwards(st,st->new_transform,
1026                                 &st->buffer,&transform_err))
1027         return False;
1028     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
1029     buf_prepend_uint32(&st->buffer,st->index);
1030     buf_prepend_uint32(&st->buffer,st->setup_session_id);
1031
1032     st->retries=st->setup_retries;
1033     return True;
1034 }
1035
1036 static bool_t process_msg5(struct site *st, struct buffer_if *msg5,
1037                            const struct comm_addr *src,
1038                            struct transform_inst_if *transform)
1039 {
1040     struct msg0 m;
1041     cstring_t transform_err;
1042
1043     if (!unpick_msg0(st,msg5,&m)) return False;
1044
1045     if (call_transform_reverse(st,transform,msg5,&transform_err)) {
1046         /* There's a problem */
1047         slog(st,LOG_SEC,"process_msg5: transform: %s",transform_err);
1048         return False;
1049     }
1050     /* Buffer should now contain untransformed PING packet data */
1051     CHECK_AVAIL(msg5,4);
1052     if (buf_unprepend_uint32(msg5)!=LABEL_MSG5) {
1053         slog(st,LOG_SEC,"MSG5/PING packet contained wrong label");
1054         return False;
1055     }
1056     /* Older versions of secnet used to write some config data here
1057      * which we ignore.  So we don't CHECK_EMPTY */
1058     return True;
1059 }
1060
1061 static void create_msg6(struct site *st, struct transform_inst_if *transform,
1062                         uint32_t session_id)
1063 {
1064     cstring_t transform_err;
1065
1066     BUF_ALLOC(&st->buffer,"site:MSG6");
1067     /* We are going to add four words to the message */
1068     buffer_init(&st->buffer,calculate_max_start_pad());
1069     /* Give the netlink code an opportunity to put its own stuff in the
1070        message (configuration information, etc.) */
1071     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1072     transform_apply_return problem =
1073         call_transform_forwards(st,transform,
1074                                 &st->buffer,&transform_err);
1075     assert(!problem);
1076     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1077     buf_prepend_uint32(&st->buffer,st->index);
1078     buf_prepend_uint32(&st->buffer,session_id);
1079 }
1080
1081 static bool_t generate_msg6(struct site *st)
1082 {
1083     if (!is_transform_valid(st->new_transform))
1084         return False;
1085     create_msg6(st,st->new_transform,st->setup_session_id);
1086     st->retries=1; /* Peer will retransmit MSG5 if this packet gets lost */
1087     return True;
1088 }
1089
1090 static bool_t process_msg6(struct site *st, struct buffer_if *msg6,
1091                            const struct comm_addr *src)
1092 {
1093     struct msg0 m;
1094     cstring_t transform_err;
1095
1096     if (!unpick_msg0(st,msg6,&m)) return False;
1097
1098     if (call_transform_reverse(st,st->new_transform,msg6,&transform_err)) {
1099         /* There's a problem */
1100         slog(st,LOG_SEC,"process_msg6: transform: %s",transform_err);
1101         return False;
1102     }
1103     /* Buffer should now contain untransformed PING packet data */
1104     CHECK_AVAIL(msg6,4);
1105     if (buf_unprepend_uint32(msg6)!=LABEL_MSG6) {
1106         slog(st,LOG_SEC,"MSG6/PONG packet contained invalid data");
1107         return False;
1108     }
1109     /* Older versions of secnet used to write some config data here
1110      * which we ignore.  So we don't CHECK_EMPTY */
1111     return True;
1112 }
1113
1114 static transform_apply_return
1115 decrypt_msg0(struct site *st, struct buffer_if *msg0,
1116                            const struct comm_addr *src)
1117 {
1118     cstring_t transform_err, auxkey_err, newkey_err="n/a";
1119     struct msg0 m;
1120     transform_apply_return problem;
1121
1122     if (!unpick_msg0(st,msg0,&m)) return False;
1123
1124     /* Keep a copy so we can try decrypting it with multiple keys */
1125     buffer_copy(&st->scratch, msg0);
1126
1127     problem = call_transform_reverse(st,st->current.transform,
1128                                      msg0,&transform_err);
1129     if (!problem) {
1130         if (!st->auxiliary_is_new)
1131             delete_one_key(st,&st->auxiliary_key,
1132                            "peer has used new key","auxiliary key",LOG_SEC);
1133         return 0;
1134     }
1135     if (transform_apply_return_badseq(problem))
1136         goto badseq;
1137
1138     buffer_copy(msg0, &st->scratch);
1139     problem = call_transform_reverse(st,st->auxiliary_key.transform,
1140                                      msg0,&auxkey_err);
1141     if (!problem) {
1142         slog(st,LOG_DROP,"processing packet which uses auxiliary key");
1143         if (st->auxiliary_is_new) {
1144             /* We previously timed out in state SENTMSG5 but it turns
1145              * out that our peer did in fact get our MSG5 and is
1146              * using the new key.  So we should switch to it too. */
1147             /* This is a bit like activate_new_key. */
1148             struct data_key t;
1149             t=st->current;
1150             st->current=st->auxiliary_key;
1151             st->auxiliary_key=t;
1152
1153             delete_one_key(st,&st->auxiliary_key,"peer has used new key",
1154                            "previous key",LOG_SEC);
1155             st->auxiliary_is_new=0;
1156             st->renegotiate_key_time=st->auxiliary_renegotiate_key_time;
1157         }
1158         return 0;
1159     }
1160     if (transform_apply_return_badseq(problem))
1161         goto badseq;
1162
1163     if (st->state==SITE_SENTMSG5) {
1164         buffer_copy(msg0, &st->scratch);
1165         problem = call_transform_reverse(st,st->new_transform,
1166                                          msg0,&newkey_err);
1167         if (!problem) {
1168             /* It looks like we didn't get the peer's MSG6 */
1169             /* This is like a cut-down enter_new_state(SITE_RUN) */
1170             slog(st,LOG_STATE,"will enter state RUN (MSG0 with new key)");
1171             BUF_FREE(&st->buffer);
1172             st->timeout=0;
1173             activate_new_key(st);
1174             return 0; /* do process the data in this packet */
1175         }
1176         if (transform_apply_return_badseq(problem))
1177             goto badseq;
1178     }
1179
1180     slog(st,LOG_SEC,"transform: %s (aux: %s, new: %s)",
1181          transform_err,auxkey_err,newkey_err);
1182     initiate_key_setup(st,"incoming message would not decrypt",0);
1183     send_nak(src,m.dest,m.source,m.type,msg0,"message would not decrypt");
1184     assert(problem);
1185     return problem;
1186
1187  badseq:
1188     slog(st,LOG_DROP,"transform: %s (bad seq.)",transform_err);
1189     assert(problem);
1190     return problem;
1191 }
1192
1193 static bool_t process_msg0(struct site *st, struct buffer_if *msg0,
1194                            const struct comm_addr *src)
1195 {
1196     uint32_t type;
1197     transform_apply_return problem;
1198
1199     problem = decrypt_msg0(st,msg0,src);
1200     if (problem==transform_apply_seqdupe) {
1201         /* We recently received another copy of this packet, maybe due
1202          * to polypath.  That's not a problem; indeed, for the
1203          * purposes of transport address management it is a success.
1204          * But we don't want to process the packet. */
1205         transport_data_msgok(st,src);
1206         return False;
1207     }
1208     if (problem)
1209         return False;
1210
1211     CHECK_AVAIL(msg0,4);
1212     type=buf_unprepend_uint32(msg0);
1213     switch(type) {
1214     case LABEL_MSG7:
1215         /* We must forget about the current session. */
1216         delete_keys(st,"request from peer",LOG_SEC);
1217         /* probably, the peer is shutting down, and this is going to fail,
1218          * but we need to be trying to bring the link up again */
1219         if (st->keepalive)
1220             initiate_key_setup(st,"peer requested key teardown",0);
1221         return True;
1222     case LABEL_MSG9:
1223         /* Deliver to netlink layer */
1224         st->netlink->deliver(st->netlink->st,msg0);
1225         transport_data_msgok(st,src);
1226         /* See whether we should start negotiating a new key */
1227         if (st->now > st->renegotiate_key_time)
1228             initiate_key_setup(st,"incoming packet in renegotiation window",0);
1229         return True;
1230     default:
1231         slog(st,LOG_SEC,"incoming encrypted message of type %08x "
1232              "(unknown)",type);
1233         break;
1234     }
1235     return False;
1236 }
1237
1238 static void dump_packet(struct site *st, struct buffer_if *buf,
1239                         const struct comm_addr *addr, bool_t incoming,
1240                         bool_t ok)
1241 {
1242     uint32_t dest=get_uint32(buf->start);
1243     uint32_t source=get_uint32(buf->start+4);
1244     uint32_t msgtype=get_uint32(buf->start+8);
1245
1246     if (st->log_events & LOG_DUMP)
1247         slilog(st->log,M_DEBUG,"%s: %s: %08x<-%08x: %08x: %s%s",
1248                st->tunname,incoming?"incoming":"outgoing",
1249                dest,source,msgtype,comm_addr_to_string(addr),
1250                ok?"":" - fail");
1251 }
1252
1253 static bool_t comm_addr_sendmsg(struct site *st,
1254                                 const struct comm_addr *dest,
1255                                 struct buffer_if *buf)
1256 {
1257     int i;
1258     struct comm_clientinfo *commclientinfo = 0;
1259
1260     for (i=0; i < st->ncomms; i++) {
1261         if (st->comms[i] == dest->comm) {
1262             commclientinfo = st->commclientinfos[i];
1263             break;
1264         }
1265     }
1266     return dest->comm->sendmsg(dest->comm->st, buf, dest, commclientinfo);
1267 }
1268
1269 static uint32_t site_status(void *st)
1270 {
1271     return 0;
1272 }
1273
1274 static bool_t send_msg(struct site *st)
1275 {
1276     if (st->retries>0) {
1277         transport_xmit(st, &st->setup_peers, &st->buffer, True);
1278         st->timeout=st->now+st->setup_retry_interval;
1279         st->retries--;
1280         return True;
1281     } else if (st->state==SITE_SENTMSG5) {
1282         logtimeout(st,"timed out sending MSG5, stashing new key");
1283         /* We stash the key we have produced, in case it turns out that
1284          * our peer did see our MSG5 after all and starts using it. */
1285         /* This is a bit like some of activate_new_key */
1286         struct transform_inst_if *t;
1287         t=st->auxiliary_key.transform;
1288         st->auxiliary_key.transform=st->new_transform;
1289         st->new_transform=t;
1290         dispose_transform(&st->new_transform);
1291
1292         st->auxiliary_is_new=1;
1293         st->auxiliary_key.key_timeout=st->now+st->key_lifetime;
1294         st->auxiliary_renegotiate_key_time=st->now+st->key_renegotiate_time;
1295         st->auxiliary_key.remote_session_id=st->setup_session_id;
1296
1297         enter_state_wait(st);
1298         return False;
1299     } else {
1300         logtimeout(st,"timed out sending key setup packet "
1301             "(in state %s)",state_name(st->state));
1302         enter_state_wait(st);
1303         return False;
1304     }
1305 }
1306
1307 static void site_resolve_callback(void *sst, const struct comm_addr *addrs,
1308                                   int stored_naddrs, int all_naddrs,
1309                                   const char *address, const char *failwhy)
1310 {
1311     struct site *st=sst;
1312
1313     if (!stored_naddrs) {
1314         slog(st,LOG_ERROR,"resolution of %s failed: %s",address,failwhy);
1315     } else {
1316         slog(st,LOG_PEER_ADDRS,"resolution of %s completed, %d addrs, eg: %s",
1317              address, all_naddrs, comm_addr_to_string(&addrs[0]));;
1318
1319         int space=st->transport_peers_max-st->resolving_n_results_stored;
1320         int n_tocopy=MIN(stored_naddrs,space);
1321         COPY_ARRAY(st->resolving_results + st->resolving_n_results_stored,
1322                    addrs,
1323                    n_tocopy);
1324         st->resolving_n_results_stored += n_tocopy;
1325         st->resolving_n_results_all += all_naddrs;
1326     }
1327
1328     decrement_resolving_count(st,1);
1329 }
1330
1331 static void decrement_resolving_count(struct site *st, int by)
1332 {
1333     assert(st->resolving_count>0);
1334     st->resolving_count-=by;
1335
1336     if (st->resolving_count)
1337         return;
1338
1339     /* OK, we are done with them all.  Handle combined results. */
1340
1341     const struct comm_addr *addrs=st->resolving_results;
1342     int naddrs=st->resolving_n_results_stored;
1343     assert(naddrs<=st->transport_peers_max);
1344
1345     if (naddrs) {
1346         if (naddrs != st->resolving_n_results_all) {
1347             slog(st,LOG_SETUP_INIT,"resolution of supplied addresses/names"
1348                  " yielded too many results (%d > %d), some ignored",
1349                  st->resolving_n_results_all, naddrs);
1350         }
1351         slog(st,LOG_STATE,"resolution completed, %d addrs, eg: %s",
1352              naddrs, iaddr_to_string(&addrs[0].ia));;
1353     }
1354
1355     switch (st->state) {
1356     case SITE_RESOLVE:
1357         if (transport_compute_setupinit_peers(st,addrs,naddrs,0)) {
1358             enter_new_state(st,SITE_SENTMSG1);
1359         } else {
1360             /* Can't figure out who to try to to talk to */
1361             slog(st,LOG_SETUP_INIT,
1362                  "key exchange failed: cannot find peer address");
1363             enter_state_run(st);
1364         }
1365         break;
1366     case SITE_SENTMSG1: case SITE_SENTMSG2:
1367     case SITE_SENTMSG3: case SITE_SENTMSG4:
1368     case SITE_SENTMSG5:
1369         if (naddrs) {
1370             /* We start using the address immediately for data too.
1371              * It's best to store it in st->peers now because we might
1372              * go via SENTMSG5, WAIT, and a MSG0, straight into using
1373              * the new key (without updating the data peer addrs). */
1374             transport_resolve_complete(st,addrs,naddrs);
1375         } else if (st->local_mobile) {
1376             /* We can't let this rest because we may have a peer
1377              * address which will break in the future. */
1378             slog(st,LOG_SETUP_INIT,"resolution failed: "
1379                  "abandoning key exchange");
1380             enter_state_wait(st);
1381         } else {
1382             slog(st,LOG_SETUP_INIT,"resolution failed: "
1383                  " continuing to use source address of peer's packets"
1384                  " for key exchange and ultimately data");
1385         }
1386         break;
1387     case SITE_RUN:
1388         if (naddrs) {
1389             slog(st,LOG_SETUP_INIT,"resolution completed tardily,"
1390                  " updating peer address(es)");
1391             transport_resolve_complete_tardy(st,addrs,naddrs);
1392         } else if (st->local_mobile) {
1393             /* Not very good.  We should queue (another) renegotiation
1394              * so that we can update the peer address. */
1395             st->key_renegotiate_time=st->now+wait_timeout(st);
1396         } else {
1397             slog(st,LOG_SETUP_INIT,"resolution failed: "
1398                  " continuing to use source address of peer's packets");
1399         }
1400         break;
1401     case SITE_WAIT:
1402     case SITE_STOP:
1403         /* oh well */
1404         break;
1405     }
1406 }
1407
1408 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
1409                                  const struct comm_addr *prod_hint)
1410 {
1411     /* Reentrancy hazard: can call enter_new_state/enter_state_* */
1412     if (st->state!=SITE_RUN) return False;
1413     slog(st,LOG_SETUP_INIT,"initiating key exchange (%s)",reason);
1414     if (st->addresses) {
1415         slog(st,LOG_SETUP_INIT,"resolving peer address(es)");
1416         return enter_state_resolve(st);
1417     } else if (transport_compute_setupinit_peers(st,0,0,prod_hint)) {
1418         return enter_new_state(st,SITE_SENTMSG1);
1419     }
1420     slog(st,LOG_SETUP_INIT,"key exchange failed: no address for peer");
1421     return False;
1422 }
1423
1424 static void activate_new_key(struct site *st)
1425 {
1426     struct transform_inst_if *t;
1427
1428     /* We have three transform instances, which we swap between old,
1429        active and setup */
1430     t=st->auxiliary_key.transform;
1431     st->auxiliary_key.transform=st->current.transform;
1432     st->current.transform=st->new_transform;
1433     st->new_transform=t;
1434     dispose_transform(&st->new_transform);
1435
1436     st->timeout=0;
1437     st->auxiliary_is_new=0;
1438     st->auxiliary_key.key_timeout=st->current.key_timeout;
1439     st->current.key_timeout=st->now+st->key_lifetime;
1440     st->renegotiate_key_time=st->now+st->key_renegotiate_time;
1441     transport_peers_copy(st,&st->peers,&st->setup_peers);
1442     st->current.remote_session_id=st->setup_session_id;
1443
1444     /* Compute the inter-site MTU.  This is min( our_mtu, their_mtu ).
1445      * But their mtu be unspecified, in which case we just use ours. */
1446     uint32_t intersite_mtu=
1447         MIN(st->mtu_target, st->remote_adv_mtu ?: ~(uint32_t)0);
1448     st->netlink->set_mtu(st->netlink->st,intersite_mtu);
1449
1450     slog(st,LOG_ACTIVATE_KEY,"new key activated"
1451          " (mtu ours=%"PRId32" theirs=%"PRId32" intersite=%"PRId32")",
1452          st->mtu_target, st->remote_adv_mtu, intersite_mtu);
1453     enter_state_run(st);
1454 }
1455
1456 static void delete_one_key(struct site *st, struct data_key *key,
1457                            cstring_t reason, cstring_t which, uint32_t loglevel)
1458 {
1459     if (!is_transform_valid(key->transform)) return;
1460     if (reason) slog(st,loglevel,"%s deleted (%s)",which,reason);
1461     dispose_transform(&key->transform);
1462     key->key_timeout=0;
1463 }
1464
1465 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel)
1466 {
1467     if (current_valid(st)) {
1468         slog(st,loglevel,"session closed (%s)",reason);
1469
1470         delete_one_key(st,&st->current,0,0,0);
1471         set_link_quality(st);
1472     }
1473     delete_one_key(st,&st->auxiliary_key,0,0,0);
1474 }
1475
1476 static void state_assert(struct site *st, bool_t ok)
1477 {
1478     if (!ok) fatal("site:state_assert");
1479 }
1480
1481 static void enter_state_stop(struct site *st)
1482 {
1483     st->state=SITE_STOP;
1484     st->timeout=0;
1485     delete_keys(st,"entering state STOP",LOG_TIMEOUT_KEY);
1486     dispose_transform(&st->new_transform);
1487 }
1488
1489 static void set_link_quality(struct site *st)
1490 {
1491     uint32_t quality;
1492     if (current_valid(st))
1493         quality=LINK_QUALITY_UP;
1494     else if (st->state==SITE_WAIT || st->state==SITE_STOP)
1495         quality=LINK_QUALITY_DOWN;
1496     else if (st->addresses)
1497         quality=LINK_QUALITY_DOWN_CURRENT_ADDRESS;
1498     else if (transport_peers_valid(&st->peers))
1499         quality=LINK_QUALITY_DOWN_STALE_ADDRESS;
1500     else
1501         quality=LINK_QUALITY_DOWN;
1502
1503     st->netlink->set_quality(st->netlink->st,quality);
1504 }
1505
1506 static void enter_state_run(struct site *st)
1507 {
1508     slog(st,LOG_STATE,"entering state RUN%s",
1509          current_valid(st) ? " (keyed)" : " (unkeyed)");
1510     st->state=SITE_RUN;
1511     st->timeout=0;
1512
1513     st->setup_session_id=0;
1514     transport_peers_clear(st,&st->setup_peers);
1515     FILLZERO(st->localN);
1516     FILLZERO(st->remoteN);
1517     dispose_transform(&st->new_transform);
1518     memset(st->dhsecret,0,st->dh->secret_len);
1519     memset(st->sharedsecret,0,st->dh->shared_len);
1520     set_link_quality(st);
1521
1522     if (st->keepalive && !current_valid(st))
1523         initiate_key_setup(st, "keepalive", 0);
1524 }
1525
1526 static bool_t ensure_resolving(struct site *st)
1527 {
1528     /* Reentrancy hazard: may call site_resolve_callback and hence
1529      * enter_new_state, enter_state_* and generate_msg*. */
1530     if (st->resolving_count)
1531         return True;
1532
1533     assert(st->addresses);
1534
1535     /* resolver->request might reentrantly call site_resolve_callback
1536      * which will decrement st->resolving, so we need to increment it
1537      * twice beforehand to prevent decrement from thinking we're
1538      * finished, and decrement it ourselves.  Alternatively if
1539      * everything fails then there are no callbacks due and we simply
1540      * set it to 0 and return false.. */
1541     st->resolving_n_results_stored=0;
1542     st->resolving_n_results_all=0;
1543     st->resolving_count+=2;
1544     const char **addrp=st->addresses;
1545     const char *address;
1546     bool_t anyok=False;
1547     for (; (address=*addrp++); ) {
1548         bool_t ok = st->resolver->request(st->resolver->st,address,
1549                                           st->remoteport,st->comms[0],
1550                                           site_resolve_callback,st);
1551         if (ok)
1552             st->resolving_count++;
1553         anyok|=ok;
1554     }
1555     if (!anyok) {
1556         st->resolving_count=0;
1557         return False;
1558     }
1559     decrement_resolving_count(st,2);
1560     return True;
1561 }
1562
1563 static bool_t enter_state_resolve(struct site *st)
1564 {
1565     /* Reentrancy hazard!  See ensure_resolving. */
1566     state_assert(st,st->state==SITE_RUN);
1567     slog(st,LOG_STATE,"entering state RESOLVE");
1568     st->state=SITE_RESOLVE;
1569     return ensure_resolving(st);
1570 }
1571
1572 static bool_t enter_new_state(struct site *st, uint32_t next)
1573 {
1574     bool_t (*gen)(struct site *st);
1575     int r;
1576
1577     slog(st,LOG_STATE,"entering state %s",state_name(next));
1578     switch(next) {
1579     case SITE_SENTMSG1:
1580         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE);
1581         gen=generate_msg1;
1582         st->msg1_crossed_logged = False;
1583         break;
1584     case SITE_SENTMSG2:
1585         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1586                      st->state==SITE_SENTMSG1 || st->state==SITE_WAIT);
1587         gen=generate_msg2;
1588         break;
1589     case SITE_SENTMSG3:
1590         state_assert(st,st->state==SITE_SENTMSG1);
1591         BUF_FREE(&st->buffer);
1592         gen=generate_msg3;
1593         break;
1594     case SITE_SENTMSG4:
1595         state_assert(st,st->state==SITE_SENTMSG2);
1596         BUF_FREE(&st->buffer);
1597         gen=generate_msg4;
1598         break;
1599     case SITE_SENTMSG5:
1600         state_assert(st,st->state==SITE_SENTMSG3);
1601         BUF_FREE(&st->buffer);
1602         gen=generate_msg5;
1603         break;
1604     case SITE_RUN:
1605         state_assert(st,st->state==SITE_SENTMSG4);
1606         BUF_FREE(&st->buffer);
1607         gen=generate_msg6;
1608         break;
1609     default:
1610         gen=NULL;
1611         fatal("enter_new_state(%s): invalid new state",state_name(next));
1612         break;
1613     }
1614
1615     if (hacky_par_start_failnow()) return False;
1616
1617     r= gen(st) && send_msg(st);
1618
1619     hacky_par_end(&r,
1620                   st->setup_retries, st->setup_retry_interval,
1621                   send_msg, st);
1622     
1623     if (r) {
1624         st->state=next;
1625         if (next==SITE_RUN) {
1626             BUF_FREE(&st->buffer); /* Never reused */
1627             st->timeout=0; /* Never retransmit */
1628             activate_new_key(st);
1629         }
1630         return True;
1631     }
1632     slog(st,LOG_ERROR,"error entering state %s",state_name(next));
1633     st->buffer.free=False; /* Unconditionally use the buffer; it may be
1634                               in either state, and enter_state_wait() will
1635                               do a BUF_FREE() */
1636     enter_state_wait(st);
1637     return False;
1638 }
1639
1640 /* msg7 tells our peer that we're about to forget our key */
1641 static bool_t send_msg7(struct site *st, cstring_t reason)
1642 {
1643     cstring_t transform_err;
1644
1645     if (current_valid(st) && st->buffer.free
1646         && transport_peers_valid(&st->peers)) {
1647         BUF_ALLOC(&st->buffer,"site:MSG7");
1648         buffer_init(&st->buffer,calculate_max_start_pad());
1649         buf_append_uint32(&st->buffer,LABEL_MSG7);
1650         buf_append_string(&st->buffer,reason);
1651         if (call_transform_forwards(st, st->current.transform,
1652                                     &st->buffer, &transform_err))
1653             goto free_out;
1654         buf_prepend_uint32(&st->buffer,LABEL_MSG0);
1655         buf_prepend_uint32(&st->buffer,st->index);
1656         buf_prepend_uint32(&st->buffer,st->current.remote_session_id);
1657         transport_xmit(st,&st->peers,&st->buffer,True);
1658         BUF_FREE(&st->buffer);
1659     free_out:
1660         return True;
1661     }
1662     return False;
1663 }
1664
1665 /* We go into this state if our peer becomes uncommunicative. Similar to
1666    the "stop" state, we forget all session keys for a while, before
1667    re-entering the "run" state. */
1668 static void enter_state_wait(struct site *st)
1669 {
1670     slog(st,LOG_STATE,"entering state WAIT");
1671     st->timeout=st->now+wait_timeout(st);
1672     st->state=SITE_WAIT;
1673     set_link_quality(st);
1674     BUF_FREE(&st->buffer); /* will have had an outgoing packet in it */
1675     /* XXX Erase keys etc. */
1676 }
1677
1678 static void generate_prod(struct site *st, struct buffer_if *buf)
1679 {
1680     buffer_init(buf,0);
1681     buf_append_uint32(buf,0);
1682     buf_append_uint32(buf,0);
1683     buf_append_uint32(buf,LABEL_PROD);
1684     buf_append_string(buf,st->localname);
1685     buf_append_string(buf,st->remotename);
1686 }
1687
1688 static void generate_send_prod(struct site *st,
1689                                const struct comm_addr *source)
1690 {
1691     if (!st->allow_send_prod) return; /* too soon */
1692     if (!(st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1693           st->state==SITE_WAIT)) return; /* we'd ignore peer's MSG1 */
1694
1695     slog(st,LOG_SETUP_INIT,"prodding peer for key exchange");
1696     st->allow_send_prod=0;
1697     generate_prod(st,&st->scratch);
1698     bool_t ok = comm_addr_sendmsg(st, source, &st->scratch);
1699     dump_packet(st,&st->scratch,source,False,ok);
1700 }
1701
1702 static inline void site_settimeout(uint64_t timeout, int *timeout_io)
1703 {
1704     if (timeout) {
1705         int64_t offset=timeout-*now;
1706         if (offset<0) offset=0;
1707         if (offset>INT_MAX) offset=INT_MAX;
1708         if (*timeout_io<0 || offset<*timeout_io)
1709             *timeout_io=offset;
1710     }
1711 }
1712
1713 static int site_beforepoll(void *sst, struct pollfd *fds, int *nfds_io,
1714                            int *timeout_io)
1715 {
1716     struct site *st=sst;
1717
1718     BEFOREPOLL_WANT_FDS(0); /* We don't use any file descriptors */
1719     st->now=*now;
1720
1721     /* Work out when our next timeout is. The earlier of 'timeout' or
1722        'current.key_timeout'. A stored value of '0' indicates no timeout
1723        active. */
1724     site_settimeout(st->timeout, timeout_io);
1725     site_settimeout(st->current.key_timeout, timeout_io);
1726     site_settimeout(st->auxiliary_key.key_timeout, timeout_io);
1727
1728     return 0; /* success */
1729 }
1730
1731 static void check_expiry(struct site *st, struct data_key *key,
1732                          const char *which)
1733 {
1734     if (key->key_timeout && *now>key->key_timeout) {
1735         delete_one_key(st,key,"maximum life exceeded",which,LOG_TIMEOUT_KEY);
1736     }
1737 }
1738
1739 /* NB site_afterpoll will be called before site_beforepoll is ever called */
1740 static void site_afterpoll(void *sst, struct pollfd *fds, int nfds)
1741 {
1742     struct site *st=sst;
1743
1744     st->now=*now;
1745     if (st->timeout && *now>st->timeout) {
1746         st->timeout=0;
1747         if (st->state>=SITE_SENTMSG1 && st->state<=SITE_SENTMSG5) {
1748             if (!hacky_par_start_failnow())
1749                 send_msg(st);
1750         } else if (st->state==SITE_WAIT) {
1751             enter_state_run(st);
1752         } else {
1753             slog(st,LOG_ERROR,"site_afterpoll: unexpected timeout, state=%d",
1754                  st->state);
1755         }
1756     }
1757     check_expiry(st,&st->current,"current key");
1758     check_expiry(st,&st->auxiliary_key,"auxiliary key");
1759 }
1760
1761 /* This function is called by the netlink device to deliver packets
1762    intended for the remote network. The packet is in "raw" wire
1763    format, but is guaranteed to be word-aligned. */
1764 static void site_outgoing(void *sst, struct buffer_if *buf)
1765 {
1766     struct site *st=sst;
1767     cstring_t transform_err;
1768     
1769     if (st->state==SITE_STOP) {
1770         BUF_FREE(buf);
1771         return;
1772     }
1773
1774     st->allow_send_prod=1;
1775
1776     /* In all other states we consider delivering the packet if we have
1777        a valid key and a valid address to send it to. */
1778     if (current_valid(st) && transport_peers_valid(&st->peers)) {
1779         /* Transform it and send it */
1780         if (buf->size>0) {
1781             buf_prepend_uint32(buf,LABEL_MSG9);
1782             if (call_transform_forwards(st, st->current.transform,
1783                                         buf, &transform_err))
1784                 goto free_out;
1785             buf_prepend_uint32(buf,LABEL_MSG0);
1786             buf_prepend_uint32(buf,st->index);
1787             buf_prepend_uint32(buf,st->current.remote_session_id);
1788             transport_xmit(st,&st->peers,buf,False);
1789         }
1790     free_out:
1791         BUF_FREE(buf);
1792         return;
1793     }
1794
1795     slog(st,LOG_DROP,"discarding outgoing packet of size %d",buf->size);
1796     BUF_FREE(buf);
1797     initiate_key_setup(st,"outgoing packet",0);
1798 }
1799
1800 static bool_t named_for_us(struct site *st, const struct buffer_if *buf_in,
1801                            uint32_t type, struct msg *m)
1802     /* For packets which are identified by the local and remote names.
1803      * If it has our name and our peer's name in it it's for us. */
1804 {
1805     struct buffer_if buf[1];
1806     buffer_readonly_clone(buf,buf_in);
1807     return unpick_msg(st,type,buf,m)
1808         && name_matches(&m->remote,st->remotename)
1809         && name_matches(&m->local,st->localname);
1810 }
1811
1812 static bool_t we_have_priority(struct site *st, const struct msg *m) {
1813     if (st->local_capabilities & m->remote_capabilities &
1814         CAPAB_PRIORITY_MOBILE) {
1815         if (st->local_mobile) return True;
1816         if (st-> peer_mobile) return False;
1817     }
1818     return st->our_name_later;
1819 }
1820
1821 static bool_t setup_late_msg_ok(struct site *st, 
1822                                 const struct buffer_if *buf_in,
1823                                 uint32_t msgtype,
1824                                 const struct comm_addr *source) {
1825     /* For setup packets which seem from their type like they are
1826      * late.  Maybe they came via a different path.  All we do is make
1827      * a note of the sending address, iff they look like they are part
1828      * of the current key setup attempt. */
1829     struct msg m;
1830     if (!named_for_us(st,buf_in,msgtype,&m))
1831         /* named_for_us calls unpick_msg which gets the nonces */
1832         return False;
1833     if (!consttime_memeq(m.nR,st->remoteN,NONCELEN) ||
1834         !consttime_memeq(m.nL,st->localN, NONCELEN))
1835         /* spoof ?  from stale run ?  who knows */
1836         return False;
1837     transport_setup_msgok(st,source);
1838     return True;
1839 }
1840
1841 /* This function is called by the communication device to deliver
1842    packets from our peers.
1843    It should return True if the packet is recognised as being for
1844    this current site instance (and should therefore not be processed
1845    by other sites), even if the packet was otherwise ignored. */
1846 static bool_t site_incoming(void *sst, struct buffer_if *buf,
1847                             const struct comm_addr *source)
1848 {
1849     struct site *st=sst;
1850
1851     if (buf->size < 12) return False;
1852
1853     uint32_t dest=get_uint32(buf->start);
1854     uint32_t msgtype=get_uint32(buf->start+8);
1855     struct msg named_msg;
1856
1857     if (msgtype==LABEL_MSG1) {
1858         if (!named_for_us(st,buf,msgtype,&named_msg))
1859             return False;
1860         /* It's a MSG1 addressed to us. Decide what to do about it. */
1861         dump_packet(st,buf,source,True,True);
1862         if (st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1863             st->state==SITE_WAIT) {
1864             /* We should definitely process it */
1865             transport_compute_setupinit_peers(st,0,0,source);
1866             if (process_msg1(st,buf,source,&named_msg)) {
1867                 slog(st,LOG_SETUP_INIT,"key setup initiated by peer");
1868                 bool_t entered=enter_new_state(st,SITE_SENTMSG2);
1869                 if (entered && st->addresses && st->local_mobile)
1870                     /* We must do this as the very last thing, because
1871                        the resolver callback might reenter us. */
1872                     ensure_resolving(st);
1873             } else {
1874                 slog(st,LOG_ERROR,"failed to process incoming msg1");
1875             }
1876             BUF_FREE(buf);
1877             return True;
1878         } else if (st->state==SITE_SENTMSG1) {
1879             /* We've just sent a message 1! They may have crossed on
1880                the wire. If we have priority then we ignore the
1881                incoming one, otherwise we process it as usual. */
1882             if (we_have_priority(st,&named_msg)) {
1883                 BUF_FREE(buf);
1884                 if (!st->msg1_crossed_logged++)
1885                     slog(st,LOG_SETUP_INIT,"crossed msg1s; we are higher "
1886                          "priority => ignore incoming msg1");
1887                 return True;
1888             } else {
1889                 slog(st,LOG_SETUP_INIT,"crossed msg1s; we are lower "
1890                      "priority => use incoming msg1");
1891                 if (process_msg1(st,buf,source,&named_msg)) {
1892                     BUF_FREE(&st->buffer); /* Free our old message 1 */
1893                     transport_setup_msgok(st,source);
1894                     enter_new_state(st,SITE_SENTMSG2);
1895                 } else {
1896                     slog(st,LOG_ERROR,"failed to process an incoming "
1897                          "crossed msg1 (we have low priority)");
1898                 }
1899                 BUF_FREE(buf);
1900                 return True;
1901             }
1902         } else if (st->state==SITE_SENTMSG2 ||
1903                    st->state==SITE_SENTMSG4) {
1904             if (consttime_memeq(named_msg.nR,st->remoteN,NONCELEN)) {
1905                 /* We are ahead in the protocol, but that msg1 had the
1906                  * peer's nonce so presumably it is from this key
1907                  * exchange run, via a slower route */
1908                 transport_setup_msgok(st,source);
1909             } else {
1910                 slog(st,LOG_UNEXPECTED,"competing incoming message 1");
1911             }
1912             BUF_FREE(buf);
1913             return True;
1914         }
1915         /* The message 1 was received at an unexpected stage of the
1916            key setup.  Well, they lost the race. */
1917         slog(st,LOG_UNEXPECTED,"unexpected incoming message 1");
1918         BUF_FREE(buf);
1919         return True;
1920     }
1921     if (msgtype==LABEL_PROD) {
1922         if (!named_for_us(st,buf,msgtype,&named_msg))
1923             return False;
1924         dump_packet(st,buf,source,True,True);
1925         if (st->state!=SITE_RUN) {
1926             slog(st,LOG_DROP,"ignoring PROD when not in state RUN");
1927         } else if (current_valid(st)) {
1928             slog(st,LOG_DROP,"ignoring PROD when we think we have a key");
1929         } else {
1930             initiate_key_setup(st,"peer sent PROD packet",source);
1931         }
1932         BUF_FREE(buf);
1933         return True;
1934     }
1935     if (dest==st->index) {
1936         /* Explicitly addressed to us */
1937         if (msgtype!=LABEL_MSG0) dump_packet(st,buf,source,True,True);
1938         switch (msgtype) {
1939         case LABEL_NAK:
1940             /* If the source is our current peer then initiate a key setup,
1941                because our peer's forgotten the key */
1942             if (get_uint32(buf->start+4)==st->current.remote_session_id) {
1943                 bool_t initiated;
1944                 initiated = initiate_key_setup(st,"received a NAK",source);
1945                 if (!initiated) generate_send_prod(st,source);
1946             } else {
1947                 slog(st,LOG_SEC,"bad incoming NAK");
1948             }
1949             break;
1950         case LABEL_MSG0:
1951             process_msg0(st,buf,source);
1952             break;
1953         case LABEL_MSG1:
1954             /* Setup packet: should not have been explicitly addressed
1955                to us */
1956             slog(st,LOG_SEC,"incoming explicitly addressed msg1");
1957             break;
1958         case LABEL_MSG2:
1959             /* Setup packet: expected only in state SENTMSG1 */
1960             if (st->state!=SITE_SENTMSG1) {
1961                 if ((st->state==SITE_SENTMSG3 ||
1962                      st->state==SITE_SENTMSG5) &&
1963                     setup_late_msg_ok(st,buf,msgtype,source))
1964                     break;
1965                 slog(st,LOG_UNEXPECTED,"unexpected MSG2");
1966             } else if (process_msg2(st,buf,source)) {
1967                 transport_setup_msgok(st,source);
1968                 enter_new_state(st,SITE_SENTMSG3);
1969             } else {
1970                 slog(st,LOG_SEC,"invalid MSG2");
1971             }
1972             break;
1973         case CASES_MSG3_KNOWN:
1974             /* Setup packet: expected only in state SENTMSG2 */
1975             if (st->state!=SITE_SENTMSG2) {
1976                 if ((st->state==SITE_SENTMSG4) &&
1977                     setup_late_msg_ok(st,buf,msgtype,source))
1978                     break;
1979                 slog(st,LOG_UNEXPECTED,"unexpected MSG3");
1980             } else if (process_msg3(st,buf,source,msgtype)) {
1981                 transport_setup_msgok(st,source);
1982                 enter_new_state(st,SITE_SENTMSG4);
1983             } else {
1984                 slog(st,LOG_SEC,"invalid MSG3");
1985             }
1986             break;
1987         case LABEL_MSG4:
1988             /* Setup packet: expected only in state SENTMSG3 */
1989             if (st->state!=SITE_SENTMSG3) {
1990                 if ((st->state==SITE_SENTMSG5) &&
1991                     setup_late_msg_ok(st,buf,msgtype,source))
1992                     break;
1993                 slog(st,LOG_UNEXPECTED,"unexpected MSG4");
1994             } else if (process_msg4(st,buf,source)) {
1995                 transport_setup_msgok(st,source);
1996                 enter_new_state(st,SITE_SENTMSG5);
1997             } else {
1998                 slog(st,LOG_SEC,"invalid MSG4");
1999             }
2000             break;
2001         case LABEL_MSG5:
2002             /* Setup packet: expected only in state SENTMSG4 */
2003             /* (may turn up in state RUN if our return MSG6 was lost
2004                and the new key has already been activated. In that
2005                case we discard it. The peer will realise that we
2006                are using the new key when they see our data packets.
2007                Until then the peer's data packets to us get discarded. */
2008             if (st->state==SITE_SENTMSG4) {
2009                 if (process_msg5(st,buf,source,st->new_transform)) {
2010                     transport_setup_msgok(st,source);
2011                     enter_new_state(st,SITE_RUN);
2012                 } else {
2013                     slog(st,LOG_SEC,"invalid MSG5");
2014                 }
2015             } else if (st->state==SITE_RUN) {
2016                 if (process_msg5(st,buf,source,st->current.transform)) {
2017                     slog(st,LOG_DROP,"got MSG5, retransmitting MSG6");
2018                     transport_setup_msgok(st,source);
2019                     create_msg6(st,st->current.transform,
2020                                 st->current.remote_session_id);
2021                     transport_xmit(st,&st->peers,&st->buffer,True);
2022                     BUF_FREE(&st->buffer);
2023                 } else {
2024                     slog(st,LOG_SEC,"invalid MSG5 (in state RUN)");
2025                 }
2026             } else {
2027                 slog(st,LOG_UNEXPECTED,"unexpected MSG5");
2028             }
2029             break;
2030         case LABEL_MSG6:
2031             /* Setup packet: expected only in state SENTMSG5 */
2032             if (st->state!=SITE_SENTMSG5) {
2033                 slog(st,LOG_UNEXPECTED,"unexpected MSG6");
2034             } else if (process_msg6(st,buf,source)) {
2035                 BUF_FREE(&st->buffer); /* Free message 5 */
2036                 transport_setup_msgok(st,source);
2037                 activate_new_key(st);
2038             } else {
2039                 slog(st,LOG_SEC,"invalid MSG6");
2040             }
2041             break;
2042         default:
2043             slog(st,LOG_SEC,"received message of unknown type 0x%08x",
2044                  msgtype);
2045             break;
2046         }
2047         BUF_FREE(buf);
2048         return True;
2049     }
2050
2051     return False;
2052 }
2053
2054 static void site_control(void *vst, bool_t run)
2055 {
2056     struct site *st=vst;
2057     if (run) enter_state_run(st);
2058     else enter_state_stop(st);
2059 }
2060
2061 static void site_phase_hook(void *sst, uint32_t newphase)
2062 {
2063     struct site *st=sst;
2064
2065     /* The program is shutting down; tell our peer */
2066     send_msg7(st,"shutting down");
2067 }
2068
2069 static void site_childpersist_clearkeys(void *sst, uint32_t newphase)
2070 {
2071     struct site *st=sst;
2072     dispose_transform(&st->current.transform);
2073     dispose_transform(&st->auxiliary_key.transform);
2074     dispose_transform(&st->new_transform);
2075     /* Not much point overwiting the signing key, since we loaded it
2076        from disk, and it is only valid prospectively if at all,
2077        anyway. */
2078     /* XXX it would be best to overwrite the DH state, because that
2079        _is_ relevant to forward secrecy.  However we have no
2080        convenient interface for doing that and in practice gmp has
2081        probably dribbled droppings all over the malloc arena.  A good
2082        way to fix this would be to have a privsep child for asymmetric
2083        crypto operations, but that's a task for another day. */
2084 }
2085
2086 static list_t *site_apply(closure_t *self, struct cloc loc, dict_t *context,
2087                           list_t *args)
2088 {
2089     static uint32_t index_sequence;
2090     struct site *st;
2091     item_t *item;
2092     dict_t *dict;
2093     int i;
2094
2095     NEW(st);
2096
2097     st->cl.description="site";
2098     st->cl.type=CL_SITE;
2099     st->cl.apply=NULL;
2100     st->cl.interface=&st->ops;
2101     st->ops.st=st;
2102     st->ops.control=site_control;
2103     st->ops.status=site_status;
2104
2105     /* First parameter must be a dict */
2106     item=list_elem(args,0);
2107     if (!item || item->type!=t_dict)
2108         cfgfatal(loc,"site","parameter must be a dictionary\n");
2109     
2110     dict=item->data.dict;
2111     st->localname=dict_read_string(dict, "local-name", True, "site", loc);
2112     st->remotename=dict_read_string(dict, "name", True, "site", loc);
2113
2114     st->keepalive=dict_read_bool(dict,"keepalive",False,"site",loc,False);
2115
2116     st->peer_mobile=dict_read_bool(dict,"mobile",False,"site",loc,False);
2117     st->local_mobile=
2118         dict_read_bool(dict,"local-mobile",False,"site",loc,False);
2119
2120     /* Sanity check (which also allows the 'sites' file to include
2121        site() closures for all sites including our own): refuse to
2122        talk to ourselves */
2123     if (strcmp(st->localname,st->remotename)==0) {
2124         Message(M_DEBUG,"site %s: local-name==name -> ignoring this site\n",
2125                 st->localname);
2126         if (st->peer_mobile != st->local_mobile)
2127             cfgfatal(loc,"site","site %s's peer-mobile=%d"
2128                     " but our local-mobile=%d\n",
2129                     st->localname, st->peer_mobile, st->local_mobile);
2130         free(st);
2131         return NULL;
2132     }
2133     if (st->peer_mobile && st->local_mobile) {
2134         Message(M_WARNING,"site %s: site is mobile but so are we"
2135                 " -> ignoring this site\n", st->remotename);
2136         free(st);
2137         return NULL;
2138     }
2139
2140     assert(index_sequence < 0xffffffffUL);
2141     st->index = ++index_sequence;
2142     st->local_capabilities = 0;
2143     st->early_capabilities = CAPAB_PRIORITY_MOBILE;
2144     st->netlink=find_cl_if(dict,"link",CL_NETLINK,True,"site",loc);
2145
2146 #define GET_CLOSURE_LIST(dictkey,things,nthings,CL_TYPE) do{            \
2147     list_t *things##_cfg=dict_lookup(dict,dictkey);                     \
2148     if (!things##_cfg)                                                  \
2149         cfgfatal(loc,"site","closure list \"%s\" not found\n",dictkey); \
2150     st->nthings=list_length(things##_cfg);                              \
2151     NEW_ARY(st->things,st->nthings);                                    \
2152     assert(st->nthings);                                                \
2153     for (i=0; i<st->nthings; i++) {                                     \
2154         item_t *item=list_elem(things##_cfg,i);                         \
2155         if (item->type!=t_closure)                                      \
2156             cfgfatal(loc,"site","%s is not a closure\n",dictkey);       \
2157         closure_t *cl=item->data.closure;                               \
2158         if (cl->type!=CL_TYPE)                                          \
2159             cfgfatal(loc,"site","%s closure wrong type\n",dictkey);     \
2160         st->things[i]=cl->interface;                                    \
2161     }                                                                   \
2162 }while(0)
2163
2164     GET_CLOSURE_LIST("comm",comms,ncomms,CL_COMM);
2165
2166     NEW_ARY(st->commclientinfos, st->ncomms);
2167     dict_t *comminfo = dict_read_dict(dict,"comm-info",False,"site",loc);
2168     for (i=0; i<st->ncomms; i++) {
2169         st->commclientinfos[i] =
2170             !comminfo ? 0 :
2171             st->comms[i]->clientinfo(st->comms[i],comminfo,loc);
2172     }
2173
2174     st->resolver=find_cl_if(dict,"resolver",CL_RESOLVER,True,"site",loc);
2175     st->log=find_cl_if(dict,"log",CL_LOG,True,"site",loc);
2176     st->random=find_cl_if(dict,"random",CL_RANDOMSRC,True,"site",loc);
2177
2178     st->privkey=find_cl_if(dict,"local-key",CL_RSAPRIVKEY,True,"site",loc);
2179     st->addresses=dict_read_string_array(dict,"address",False,"site",loc,0);
2180     if (st->addresses)
2181         st->remoteport=dict_read_number(dict,"port",True,"site",loc,0);
2182     else st->remoteport=0;
2183     st->pubkey=find_cl_if(dict,"key",CL_RSAPUBKEY,True,"site",loc);
2184
2185     GET_CLOSURE_LIST("transform",transforms,ntransforms,CL_TRANSFORM);
2186
2187     st->dh=find_cl_if(dict,"dh",CL_DH,True,"site",loc);
2188     st->hash=find_cl_if(dict,"hash",CL_HASH,True,"site",loc);
2189
2190 #define DEFAULT(D) (st->peer_mobile || st->local_mobile \
2191                     ? DEFAULT_MOBILE_##D : DEFAULT_##D)
2192 #define CFG_NUMBER(k,D) dict_read_number(dict,(k),False,"site",loc,DEFAULT(D));
2193
2194     st->key_lifetime=         CFG_NUMBER("key-lifetime",  KEY_LIFETIME);
2195     st->setup_retries=        CFG_NUMBER("setup-retries", SETUP_RETRIES);
2196     st->setup_retry_interval= CFG_NUMBER("setup-timeout", SETUP_RETRY_INTERVAL);
2197     st->wait_timeout_mean=    CFG_NUMBER("wait-time",     WAIT_TIME);
2198     st->mtu_target= dict_read_number(dict,"mtu-target",False,"site",loc,0);
2199
2200     st->mobile_peer_expiry= dict_read_number(
2201        dict,"mobile-peer-expiry",False,"site",loc,DEFAULT_MOBILE_PEER_EXPIRY);
2202
2203     const char *peerskey= st->peer_mobile
2204         ? "mobile-peers-max" : "static-peers-max";
2205     st->transport_peers_max= dict_read_number(
2206         dict,peerskey,False,"site",loc, st->addresses ? 4 : 3);
2207     if (st->transport_peers_max<1 ||
2208         st->transport_peers_max>MAX_PEER_ADDRS) {
2209         cfgfatal(loc,"site", "%s must be in range 1.."
2210                  STRING(MAX_PEER_ADDRS) "\n", peerskey);
2211     }
2212
2213     if (st->key_lifetime < DEFAULT(KEY_RENEGOTIATE_GAP)*2)
2214         st->key_renegotiate_time=st->key_lifetime/2;
2215     else
2216         st->key_renegotiate_time=st->key_lifetime-DEFAULT(KEY_RENEGOTIATE_GAP);
2217     st->key_renegotiate_time=dict_read_number(
2218         dict,"renegotiate-time",False,"site",loc,st->key_renegotiate_time);
2219     if (st->key_renegotiate_time > st->key_lifetime) {
2220         cfgfatal(loc,"site",
2221                  "renegotiate-time must be less than key-lifetime\n");
2222     }
2223
2224     st->log_events=string_list_to_word(dict_lookup(dict,"log-events"),
2225                                        log_event_table,"site");
2226
2227     st->resolving_count=0;
2228     st->allow_send_prod=0;
2229
2230     st->tunname=safe_malloc(strlen(st->localname)+strlen(st->remotename)+5,
2231                             "site_apply");
2232     sprintf(st->tunname,"%s<->%s",st->localname,st->remotename);
2233
2234     /* The information we expect to see in incoming messages of type 1 */
2235     /* fixme: lots of unchecked overflows here, but the results are only
2236        corrupted packets rather than undefined behaviour */
2237     st->our_name_later=(strcmp(st->localname,st->remotename)>0);
2238
2239     buffer_new(&st->buffer,SETUP_BUFFER_LEN);
2240
2241     buffer_new(&st->scratch,SETUP_BUFFER_LEN);
2242     BUF_ALLOC(&st->scratch,"site:scratch");
2243
2244     /* We are interested in poll(), but only for timeouts. We don't have
2245        any fds of our own. */
2246     register_for_poll(st, site_beforepoll, site_afterpoll, "site");
2247     st->timeout=0;
2248
2249     st->remote_capabilities=0;
2250     st->chosen_transform=0;
2251     st->current.key_timeout=0;
2252     st->auxiliary_key.key_timeout=0;
2253     transport_peers_clear(st,&st->peers);
2254     transport_peers_clear(st,&st->setup_peers);
2255     /* XXX mlock these */
2256     st->dhsecret=safe_malloc(st->dh->secret_len,"site:dhsecret");
2257     st->sharedsecret=safe_malloc(st->dh->shared_len, "site:sharedsecret");
2258
2259 #define SET_CAPBIT(bit) do {                                            \
2260     uint32_t capflag = 1UL << (bit);                                    \
2261     if (st->local_capabilities & capflag)                               \
2262         slog(st,LOG_ERROR,"capability bit"                              \
2263              " %d (%#"PRIx32") reused", (bit), capflag);                \
2264     st->local_capabilities |= capflag;                                  \
2265 } while (0)
2266
2267     for (i=0; i<st->ntransforms; i++)
2268         SET_CAPBIT(st->transforms[i]->capab_bit);
2269
2270 #undef SET_CAPBIT
2271
2272     if (st->local_mobile || st->peer_mobile)
2273         st->local_capabilities |= CAPAB_PRIORITY_MOBILE;
2274
2275     /* We need to register the remote networks with the netlink device */
2276     uint32_t netlink_mtu; /* local virtual interface mtu */
2277     st->netlink->reg(st->netlink->st, site_outgoing, st, &netlink_mtu);
2278     if (!st->mtu_target)
2279         st->mtu_target=netlink_mtu;
2280     
2281     for (i=0; i<st->ncomms; i++)
2282         st->comms[i]->request_notify(st->comms[i]->st, st, site_incoming);
2283
2284     st->current.transform=0;
2285     st->auxiliary_key.transform=0;
2286     st->new_transform=0;
2287     st->auxiliary_is_new=0;
2288
2289     enter_state_stop(st);
2290
2291     add_hook(PHASE_SHUTDOWN,site_phase_hook,st);
2292     add_hook(PHASE_CHILDPERSIST,site_childpersist_clearkeys,st);
2293
2294     return new_closure(&st->cl);
2295 }
2296
2297 void site_module(dict_t *dict)
2298 {
2299     add_closure(dict,"site",site_apply);
2300 }
2301
2302
2303 /***** TRANSPORT PEERS definitions *****/
2304
2305 static void transport_peers_debug(struct site *st, transport_peers *dst,
2306                                   const char *didwhat,
2307                                   int nargs, const struct comm_addr *args,
2308                                   size_t stride) {
2309     int i;
2310     char *argp;
2311
2312     if (!(st->log_events & LOG_PEER_ADDRS))
2313         return; /* an optimisation */
2314
2315     slog(st, LOG_PEER_ADDRS, "peers (%s) %s nargs=%d => npeers=%d",
2316          (dst==&st->peers ? "data" :
2317           dst==&st->setup_peers ? "setup" : "UNKNOWN"),
2318          didwhat, nargs, dst->npeers);
2319
2320     for (i=0, argp=(void*)args;
2321          i<nargs;
2322          i++, (argp+=stride?stride:sizeof(*args))) {
2323         const struct comm_addr *ca=(void*)argp;
2324         slog(st, LOG_PEER_ADDRS, " args: addrs[%d]=%s",
2325              i, comm_addr_to_string(ca));
2326     }
2327     for (i=0; i<dst->npeers; i++) {
2328         struct timeval diff;
2329         timersub(tv_now,&dst->peers[i].last,&diff);
2330         const struct comm_addr *ca=&dst->peers[i].addr;
2331         slog(st, LOG_PEER_ADDRS, " peers: addrs[%d]=%s T-%ld.%06ld",
2332              i, comm_addr_to_string(ca),
2333              (unsigned long)diff.tv_sec, (unsigned long)diff.tv_usec);
2334     }
2335 }
2336
2337 static void transport_peers_expire(struct site *st, transport_peers *peers) {
2338     /* peers must be sorted first */
2339     int previous_peers=peers->npeers;
2340     struct timeval oldest;
2341     oldest.tv_sec  = tv_now->tv_sec - st->mobile_peer_expiry;
2342     oldest.tv_usec = tv_now->tv_usec;
2343     while (peers->npeers>1 &&
2344            timercmp(&peers->peers[peers->npeers-1].last, &oldest, <))
2345         peers->npeers--;
2346     if (peers->npeers != previous_peers)
2347         transport_peers_debug(st,peers,"expire", 0,0,0);
2348 }
2349
2350 static bool_t transport_peer_record_one(struct site *st, transport_peers *peers,
2351                                         const struct comm_addr *ca,
2352                                         const struct timeval *tv) {
2353     /* returns false if output is full */
2354     int search;
2355
2356     if (peers->npeers >= st->transport_peers_max)
2357         return 0;
2358
2359     for (search=0; search<peers->npeers; search++)
2360         if (comm_addr_equal(&peers->peers[search].addr, ca))
2361             return 1;
2362
2363     peers->peers[peers->npeers].addr = *ca;
2364     peers->peers[peers->npeers].last = *tv;
2365     peers->npeers++;
2366     return 1;
2367 }
2368
2369 static void transport_record_peers(struct site *st, transport_peers *peers,
2370                                    const struct comm_addr *addrs, int naddrs,
2371                                    const char *m) {
2372     /* We add addrs into peers.  The new entries end up at the front
2373      * and displace entries towards the end (perhaps even off the
2374      * end).  Any existing matching entries are moved up to the front.
2375      *
2376      * Caller must first call transport_peers_expire. */
2377
2378     if (naddrs==1) {
2379         /* avoids debug for uninteresting updates */
2380         int i;
2381         for (i=0; i<peers->npeers; i++) {
2382             if (comm_addr_equal(&addrs[0], &peers->peers[i].addr)) {
2383                 memmove(peers->peers+1, peers->peers,
2384                         sizeof(peers->peers[0]) * i);
2385                 peers->peers[0].addr = addrs[0];
2386                 peers->peers[0].last = *tv_now;
2387                 return;
2388             }
2389         }
2390     }
2391
2392     int old_npeers=peers->npeers;
2393     transport_peer old_peers[old_npeers];
2394     COPY_ARRAY(old_peers,peers->peers,old_npeers);
2395
2396     peers->npeers=0;
2397     int i;
2398     for (i=0; i<naddrs; i++) {
2399         if (!transport_peer_record_one(st,peers, &addrs[i], tv_now))
2400             break;
2401     }
2402     for (i=0; i<old_npeers; i++) {
2403         const transport_peer *old=&old_peers[i];
2404         if (!transport_peer_record_one(st,peers, &old->addr, &old->last))
2405             break;
2406     }
2407
2408     transport_peers_debug(st,peers,m, naddrs,addrs,0);
2409 }
2410
2411 static void transport_expire_record_peers(struct site *st,
2412                                           transport_peers *peers,
2413                                           const struct comm_addr *addrs,
2414                                           int naddrs, const char *m) {
2415     /* Convenience function */
2416     transport_peers_expire(st,peers);
2417     transport_record_peers(st,peers,addrs,naddrs,m);
2418 }
2419
2420 static bool_t transport_compute_setupinit_peers(struct site *st,
2421         const struct comm_addr *configured_addrs /* 0 if none or not found */,
2422         int n_configured_addrs /* 0 if none or not found */,
2423         const struct comm_addr *incoming_packet_addr /* 0 if none */) {
2424     if (!n_configured_addrs && !incoming_packet_addr &&
2425         !transport_peers_valid(&st->peers))
2426         return False;
2427
2428     slog(st,LOG_SETUP_INIT,
2429          "using: %d configured addr(s);%s %d old peer addrs(es)",
2430          n_configured_addrs,
2431          incoming_packet_addr ? " incoming packet address;" : "",
2432          st->peers.npeers);
2433
2434     /* Non-mobile peers try addresses until one is plausible.  The
2435      * effect is that this code always tries first the configured
2436      * address if supplied, or otherwise the address of the incoming
2437      * PROD, or finally the existing data peer if one exists; this is
2438      * as desired. */
2439
2440     transport_peers_copy(st,&st->setup_peers,&st->peers);
2441     transport_peers_expire(st,&st->setup_peers);
2442
2443     if (incoming_packet_addr)
2444         transport_record_peers(st,&st->setup_peers,
2445                                incoming_packet_addr,1, "incoming");
2446
2447     if (n_configured_addrs)
2448         transport_record_peers(st,&st->setup_peers,
2449                               configured_addrs,n_configured_addrs, "setupinit");
2450
2451     assert(transport_peers_valid(&st->setup_peers));
2452     return True;
2453 }
2454
2455 static void transport_setup_msgok(struct site *st, const struct comm_addr *a) {
2456     if (st->peer_mobile)
2457         transport_expire_record_peers(st,&st->setup_peers,a,1,"setupmsg");
2458 }
2459 static void transport_data_msgok(struct site *st, const struct comm_addr *a) {
2460     if (st->peer_mobile)
2461         transport_expire_record_peers(st,&st->peers,a,1,"datamsg");
2462 }
2463
2464 static int transport_peers_valid(transport_peers *peers) {
2465     return peers->npeers;
2466 }
2467 static void transport_peers_clear(struct site *st, transport_peers *peers) {
2468     peers->npeers= 0;
2469     transport_peers_debug(st,peers,"clear",0,0,0);
2470 }
2471 static void transport_peers_copy(struct site *st, transport_peers *dst,
2472                                  const transport_peers *src) {
2473     dst->npeers=src->npeers;
2474     COPY_ARRAY(dst->peers, src->peers, dst->npeers);
2475     transport_peers_debug(st,dst,"copy",
2476                           src->npeers, &src->peers->addr, sizeof(*src->peers));
2477 }
2478
2479 static void transport_resolve_complete(struct site *st,
2480                                        const struct comm_addr *addrs,
2481                                        int naddrs) {
2482     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2483                                   "resolved data");
2484     transport_expire_record_peers(st,&st->setup_peers,addrs,naddrs,
2485                                   "resolved setup");
2486 }
2487
2488 static void transport_resolve_complete_tardy(struct site *st,
2489                                              const struct comm_addr *addrs,
2490                                              int naddrs) {
2491     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2492                                   "resolved tardily");
2493 }
2494
2495 static void transport_peers__copy_by_mask(transport_peer *out, int *nout_io,
2496                                           unsigned mask,
2497                                           const transport_peers *inp) {
2498     /* out and in->peers may be the same region, or nonoverlapping */
2499     const transport_peer *in=inp->peers;
2500     int slot;
2501     for (slot=0; slot<inp->npeers; slot++) {
2502         if (!(mask & (1U << slot)))
2503             continue;
2504         if (!(out==in && slot==*nout_io))
2505             COPY_OBJ(out[*nout_io], in[slot]);
2506         (*nout_io)++;
2507     }
2508 }
2509
2510 void transport_xmit(struct site *st, transport_peers *peers,
2511                     struct buffer_if *buf, bool_t candebug) {
2512     int slot;
2513     transport_peers_expire(st, peers);
2514     unsigned failed=0; /* bitmask */
2515     assert(MAX_PEER_ADDRS < sizeof(unsigned)*CHAR_BIT);
2516
2517     int nfailed=0;
2518     for (slot=0; slot<peers->npeers; slot++) {
2519         transport_peer *peer=&peers->peers[slot];
2520         bool_t ok = comm_addr_sendmsg(st, &peer->addr, buf);
2521         if (candebug)
2522             dump_packet(st, buf, &peer->addr, False, ok);
2523         if (!ok) {
2524             failed |= 1U << slot;
2525             nfailed++;
2526         }
2527         if (ok && !st->peer_mobile)
2528             break;
2529     }
2530     /* Now we need to demote/delete failing addrs: if we are mobile we
2531      * merely demote them; otherwise we delete them. */
2532     if (st->local_mobile) {
2533         unsigned expected = ((1U << nfailed)-1) << (peers->npeers-nfailed);
2534         /* `expected' has all the failures at the end already */
2535         if (failed != expected) {
2536             int fslot=0;
2537             transport_peer failedpeers[nfailed];
2538             transport_peers__copy_by_mask(failedpeers, &fslot, failed,peers);
2539             assert(fslot == nfailed);
2540             int wslot=0;
2541             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2542             assert(wslot+nfailed == peers->npeers);
2543             COPY_ARRAY(peers->peers+wslot, failedpeers, nfailed);
2544             transport_peers_debug(st,peers,"mobile failure reorder",0,0,0);
2545         }
2546     } else {
2547         if (failed && peers->npeers > 1) {
2548             int wslot=0;
2549             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2550             peers->npeers=wslot;
2551             transport_peers_debug(st,peers,"non-mobile failure cleanup",0,0,0);
2552         }
2553     }
2554 }
2555
2556 /***** END of transport peers declarations *****/