chiark / gitweb /
polypath: Close parent's socket in child
[secnet.git] / site.c
1 /* site.c - manage communication with a remote network site */
2
3 /* The 'site' code doesn't know anything about the structure of the
4    packets it's transmitting.  In fact, under the new netlink
5    configuration scheme it doesn't need to know anything at all about
6    IP addresses, except how to contact its peer.  This means it could
7    potentially be used to tunnel other protocols too (IPv6, IPX, plain
8    old Ethernet frames) if appropriate netlink code can be written
9    (and that ought not to be too hard, eg. using the TUN/TAP device to
10    pretend to be an Ethernet interface).  */
11
12 /* At some point in the future the netlink code will be asked for
13    configuration information to go in the PING/PONG packets at the end
14    of the key exchange. */
15
16 #include "secnet.h"
17 #include <stdio.h>
18 #include <string.h>
19 #include <limits.h>
20 #include <assert.h>
21 #include <sys/socket.h>
22
23 #include <sys/mman.h>
24 #include "util.h"
25 #include "unaligned.h"
26 #include "magic.h"
27
28 #define SETUP_BUFFER_LEN 2048
29
30 #define DEFAULT_KEY_LIFETIME                  (3600*1000) /* [ms] */
31 #define DEFAULT_KEY_RENEGOTIATE_GAP           (5*60*1000) /* [ms] */
32 #define DEFAULT_SETUP_RETRIES 5
33 #define DEFAULT_SETUP_RETRY_INTERVAL             (2*1000) /* [ms] */
34 #define DEFAULT_WAIT_TIME                       (20*1000) /* [ms] */
35
36 #define DEFAULT_MOBILE_KEY_LIFETIME      (2*24*3600*1000) /* [ms] */
37 #define DEFAULT_MOBILE_KEY_RENEGOTIATE_GAP (12*3600*1000) /* [ms] */
38 #define DEFAULT_MOBILE_SETUP_RETRIES 30
39 #define DEFAULT_MOBILE_SETUP_RETRY_INTERVAL      (1*1000) /* [ms] */
40 #define DEFAULT_MOBILE_WAIT_TIME                (10*1000) /* [ms] */
41
42 #define DEFAULT_MOBILE_PEER_EXPIRY            (2*60)      /* [s] */
43 #define DEFAULT_MOBILE_PEERS_MAX 3 /* send at most this many copies (default) */
44 #define DEFAULT_STATIC_PEERS_MAX 3 /* retain at most this many peer addresses */
45
46 /* Each site can be in one of several possible states. */
47
48 /* States:
49    SITE_STOP         - nothing is allowed to happen; tunnel is down;
50                        all session keys have been erased
51      -> SITE_RUN upon external instruction
52    SITE_RUN          - site up, maybe with valid key
53      -> SITE_RESOLVE upon outgoing packet and no valid key
54          we start name resolution for the other end of the tunnel
55      -> SITE_SENTMSG2 upon valid incoming message 1 and suitable time
56          we send an appropriate message 2
57    SITE_RESOLVE      - waiting for name resolution
58      -> SITE_SENTMSG1 upon successful resolution
59          we send an appropriate message 1
60      -> SITE_SENTMSG2 upon valid incoming message 1 (then abort resolution)
61          we abort resolution and 
62      -> SITE_WAIT on timeout or resolution failure
63    SITE_SENTMSG1
64      -> SITE_SENTMSG2 upon valid incoming message 1 from higher priority end
65      -> SITE_SENTMSG3 upon valid incoming message 2
66      -> SITE_WAIT on timeout
67    SITE_SENTMSG2
68      -> SITE_SENTMSG4 upon valid incoming message 3
69      -> SITE_WAIT on timeout
70    SITE_SENTMSG3
71      -> SITE_SENTMSG5 upon valid incoming message 4
72      -> SITE_WAIT on timeout
73    SITE_SENTMSG4
74      -> SITE_RUN upon valid incoming message 5
75      -> SITE_WAIT on timeout
76    SITE_SENTMSG5
77      -> SITE_RUN upon valid incoming message 6
78      -> SITE_WAIT on timeout
79    SITE_WAIT         - failed to establish key; do nothing for a while
80      -> SITE_RUN on timeout
81    */
82
83 #define SITE_STOP     0
84 #define SITE_RUN      1
85 #define SITE_RESOLVE  2
86 #define SITE_SENTMSG1 3
87 #define SITE_SENTMSG2 4
88 #define SITE_SENTMSG3 5
89 #define SITE_SENTMSG4 6
90 #define SITE_SENTMSG5 7
91 #define SITE_WAIT     8
92
93 int32_t site_max_start_pad = 4*4;
94
95 static cstring_t state_name(uint32_t state)
96 {
97     switch (state) {
98     case 0: return "STOP";
99     case 1: return "RUN";
100     case 2: return "RESOLVE";
101     case 3: return "SENTMSG1";
102     case 4: return "SENTMSG2";
103     case 5: return "SENTMSG3";
104     case 6: return "SENTMSG4";
105     case 7: return "SENTMSG5";
106     case 8: return "WAIT";
107     default: return "*bad state*";
108     }
109 }
110
111 #define NONCELEN 8
112
113 #define LOG_UNEXPECTED    0x00000001
114 #define LOG_SETUP_INIT    0x00000002
115 #define LOG_SETUP_TIMEOUT 0x00000004
116 #define LOG_ACTIVATE_KEY  0x00000008
117 #define LOG_TIMEOUT_KEY   0x00000010
118 #define LOG_SEC           0x00000020
119 #define LOG_STATE         0x00000040
120 #define LOG_DROP          0x00000080
121 #define LOG_DUMP          0x00000100
122 #define LOG_ERROR         0x00000400
123 #define LOG_PEER_ADDRS    0x00000800
124
125 static struct flagstr log_event_table[]={
126     { "unexpected", LOG_UNEXPECTED },
127     { "setup-init", LOG_SETUP_INIT },
128     { "setup-timeout", LOG_SETUP_TIMEOUT },
129     { "activate-key", LOG_ACTIVATE_KEY },
130     { "timeout-key", LOG_TIMEOUT_KEY },
131     { "security", LOG_SEC },
132     { "state-change", LOG_STATE },
133     { "packet-drop", LOG_DROP },
134     { "dump-packets", LOG_DUMP },
135     { "errors", LOG_ERROR },
136     { "peer-addrs", LOG_PEER_ADDRS },
137     { "default", LOG_SETUP_INIT|LOG_SETUP_TIMEOUT|
138       LOG_ACTIVATE_KEY|LOG_TIMEOUT_KEY|LOG_SEC|LOG_ERROR },
139     { "all", 0xffffffff },
140     { NULL, 0 }
141 };
142
143
144 /***** TRANSPORT PEERS declarations *****/
145
146 /* Details of "mobile peer" semantics:
147
148    - We use the same data structure for the different configurations,
149      but manage it with different algorithms.
150    
151    - We record up to mobile_peers_max peer address/port numbers
152      ("peers") for key setup, and separately up to mobile_peers_max
153      for data transfer.
154
155    - In general, we make a new set of addrs (see below) when we start
156      a new key exchange; the key setup addrs become the data transport
157      addrs when key setup complets.
158
159    If our peer is mobile:
160
161    - We send to all recent addresses of incoming packets, plus
162      initially all configured addresses (which we also expire).
163
164    - So, we record addrs of good incoming packets, as follows:
165       1. expire any peers last seen >120s ("mobile-peer-expiry") ago
166       2. add the peer of the just received packet to the applicable list
167          (possibly evicting the oldest entries to make room)
168      NB that we do not expire peers until an incoming packet arrives.
169
170    - If the peer has a configured address or name, we record them the
171      same way, but only as a result of our own initiation of key
172      setup.  (We might evict some incoming packet addrs to make room.)
173
174    - The default number of addrs to keep is 3, or 4 if we have a
175      configured name or address.  That's space for two configured
176      addresses (one IPv6 and one IPv4), plus two received addresses.
177
178    - Outgoing packets are sent to every recorded address in the
179      applicable list.  Any unsupported[1] addresses are deleted from
180      the list right away.  (This should only happen to configured
181      addresses, of course, but there is no need to check that.)
182
183    - When we successfully complete a key setup, we merge the key setup
184      peers into the data transfer peers.
185
186    [1] An unsupported address is one for whose AF we don't have a
187      socket (perhaps because we got EAFNOSUPPORT or some such) or for
188      which sendto gives ENETUNREACH.
189
190    If neither end is mobile:
191
192    - When peer initiated the key exchange, we use the incoming packet
193      address.
194
195    - When we initiate the key exchange, we try configured addresses
196      until we get one which isn't unsupported then fixate on that.
197
198    - When we complete a key setup, we replace the data transport peers
199      with those from the key setup.
200
201    If we are mobile:
202
203    - We can't tell when local network setup changes so we can't cache
204      the unsupported addrs and completely remove the spurious calls to
205      sendto, but we can optimise things a bit by deprioritising addrs
206      which seem to be unsupported.
207
208    - Use only configured addresses.  (Except, that if our peer
209      initiated a key exchange we use the incoming packet address until
210      our name resolution completes.)
211
212    - When we send a packet, try each address in turn; if addr
213      supported, put that address to the end of the list for future
214      packets, and go onto the next address.
215
216    - When we complete a key setup, we replace the data transport peers
217      with those from the key setup.
218
219    */
220
221 typedef struct {
222     struct timeval last;
223     struct comm_addr addr;
224 } transport_peer;
225
226 typedef struct {
227 /* configuration information */
228 /* runtime information */
229     int npeers;
230     transport_peer peers[MAX_PEER_ADDRS];
231 } transport_peers;
232
233 /* Basic operations on transport peer address sets */
234 static void transport_peers_clear(struct site *st, transport_peers *peers);
235 static int transport_peers_valid(transport_peers *peers);
236 static void transport_peers_copy(struct site *st, transport_peers *dst,
237                                  const transport_peers *src);
238
239 /* Record address of incoming setup packet; resp. data packet. */
240 static void transport_setup_msgok(struct site *st, const struct comm_addr *a);
241 static void transport_data_msgok(struct site *st, const struct comm_addr *a);
242
243 /* Initialise the setup addresses.  Called before we send the first
244  * packet in a key exchange.  If we are the initiator, as a result of
245  * resolve completing (or being determined not to be relevant) or an
246  * incoming PROD; if we are the responder, as a result of the MSG1. */
247 static bool_t transport_compute_setupinit_peers(struct site *st,
248         const struct comm_addr *configured_addrs /* 0 if none or not found */,
249         int n_configured_addrs /* 0 if none or not found */,
250         const struct comm_addr *incoming_packet_addr /* 0 if none */);
251
252 /* Called if we are the responder in a key setup, when the resolve
253  * completes.  transport_compute_setupinit_peers will hvae been called
254  * earlier.  If _complete is called, we are still doing the key setup
255  * (and we should use the new values for both the rest of the key
256  * setup and the ongoing data exchange); if _tardy is called, the key
257  * setup is done (either completed or not) and only the data peers are
258  * relevant */
259 static void transport_resolve_complete(struct site *st,
260         const struct comm_addr *addrs, int naddrs);
261 static void transport_resolve_complete_tardy(struct site *st,
262         const struct comm_addr *addrs, int naddrs);
263
264 static void transport_xmit(struct site *st, transport_peers *peers,
265                            struct buffer_if *buf, bool_t candebug);
266
267  /***** END of transport peers declarations *****/
268
269
270 struct data_key {
271     struct transform_inst_if *transform;
272     uint64_t key_timeout; /* End of life of current key */
273     uint32_t remote_session_id;
274 };
275
276 struct site {
277     closure_t cl;
278     struct site_if ops;
279 /* configuration information */
280     string_t localname;
281     string_t remotename;
282     bool_t local_mobile, peer_mobile; /* Mobile client support */
283     int32_t transport_peers_max;
284     string_t tunname; /* localname<->remotename by default, used in logs */
285     cstring_t *addresses; /* DNS name or address(es) for bootstrapping, optional */
286     int remoteport; /* Port for bootstrapping, optional */
287     uint32_t mtu_target;
288     struct netlink_if *netlink;
289     struct comm_if **comms;
290     int ncomms;
291     struct resolver_if *resolver;
292     struct log_if *log;
293     struct random_if *random;
294     struct rsaprivkey_if *privkey;
295     struct rsapubkey_if *pubkey;
296     struct transform_if **transforms;
297     int ntransforms;
298     struct dh_if *dh;
299     struct hash_if *hash;
300
301     uint32_t index; /* Index of this site */
302     uint32_t local_capabilities;
303     int32_t setup_retries; /* How many times to send setup packets */
304     int32_t setup_retry_interval; /* Initial timeout for setup packets */
305     int32_t wait_timeout; /* How long to wait if setup unsuccessful */
306     int32_t mobile_peer_expiry; /* How long to remember 2ary addresses */
307     int32_t key_lifetime; /* How long a key lasts once set up */
308     int32_t key_renegotiate_time; /* If we see traffic (or a keepalive)
309                                       after this time, initiate a new
310                                       key exchange */
311
312     bool_t setup_priority; /* Do we have precedence if both sites emit
313                               message 1 simultaneously? */
314     uint32_t log_events;
315
316 /* runtime information */
317     uint32_t state;
318     uint64_t now; /* Most recently seen time */
319     bool_t allow_send_prod;
320     int resolving_count;
321     int resolving_n_results;
322     struct comm_addr resolving_results[MAX_PEER_ADDRS];
323
324     /* The currently established session */
325     struct data_key current;
326     struct data_key auxiliary_key;
327     bool_t auxiliary_is_new;
328     uint64_t renegotiate_key_time; /* When we can negotiate a new key */
329     uint64_t auxiliary_renegotiate_key_time;
330     transport_peers peers; /* Current address(es) of peer for data traffic */
331
332     /* The current key setup protocol exchange.  We can only be
333        involved in one of these at a time.  There's a potential for
334        denial of service here (the attacker keeps sending a setup
335        packet; we keep trying to continue the exchange, and have to
336        timeout before we can listen for another setup packet); perhaps
337        we should keep a list of 'bad' sources for setup packets. */
338     uint32_t remote_capabilities;
339     uint16_t remote_adv_mtu;
340     struct transform_if *chosen_transform;
341     uint32_t setup_session_id;
342     transport_peers setup_peers;
343     uint8_t localN[NONCELEN]; /* Nonces for key exchange */
344     uint8_t remoteN[NONCELEN];
345     struct buffer_if buffer; /* Current outgoing key exchange packet */
346     struct buffer_if scratch;
347     int32_t retries; /* Number of retries remaining */
348     uint64_t timeout; /* Timeout for current state */
349     uint8_t *dhsecret;
350     uint8_t *sharedsecret;
351     uint32_t sharedsecretlen, sharedsecretallocd;
352     struct transform_inst_if *new_transform; /* For key setup/verify */
353 };
354
355 static uint32_t event_log_priority(struct site *st, uint32_t event)
356 {
357     if (!(event&st->log_events))
358         return 0;
359     switch(event) {
360     case LOG_UNEXPECTED:    return M_INFO;
361     case LOG_SETUP_INIT:    return M_INFO;
362     case LOG_SETUP_TIMEOUT: return M_NOTICE;
363     case LOG_ACTIVATE_KEY:  return M_INFO;
364     case LOG_TIMEOUT_KEY:   return M_INFO;
365     case LOG_SEC:           return M_SECURITY;
366     case LOG_STATE:         return M_DEBUG;
367     case LOG_DROP:          return M_DEBUG;
368     case LOG_DUMP:          return M_DEBUG;
369     case LOG_ERROR:         return M_ERR;
370     case LOG_PEER_ADDRS:    return M_DEBUG;
371     default:                return M_ERR;
372     }
373 }
374
375 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
376 FORMAT(printf,3,0);
377 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
378 {
379     uint32_t class;
380
381     class=event_log_priority(st, event);
382     if (class) {
383         slilog_part(st->log,class,"%s: ",st->tunname);
384         vslilog_part(st->log,class,msg,ap);
385         slilog_part(st->log,class,"\n");
386     }
387 }
388
389 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
390 FORMAT(printf,3,4);
391 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
392 {
393     va_list ap;
394     va_start(ap,msg);
395     vslog(st,event,msg,ap);
396     va_end(ap);
397 }
398
399 static void logtimeout(struct site *st, const char *fmt, ...)
400 FORMAT(printf,2,3);
401 static void logtimeout(struct site *st, const char *fmt, ...)
402 {
403     uint32_t class=event_log_priority(st,LOG_SETUP_TIMEOUT);
404     if (!class)
405         return;
406
407     va_list ap;
408     va_start(ap,fmt);
409
410     slilog_part(st->log,class,"%s: ",st->tunname);
411     vslilog_part(st->log,class,fmt,ap);
412
413     const char *delim;
414     int i;
415     for (i=0, delim=" (tried ";
416          i<st->setup_peers.npeers;
417          i++, delim=", ") {
418         transport_peer *peer=&st->setup_peers.peers[i];
419         const char *s=comm_addr_to_string(&peer->addr);
420         slilog_part(st->log,class,"%s%s",delim,s);
421     }
422
423     slilog_part(st->log,class,")\n");
424     va_end(ap);
425 }
426
427 static void set_link_quality(struct site *st);
428 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel);
429 static void delete_one_key(struct site *st, struct data_key *key,
430                            const char *reason /* may be 0 meaning don't log*/,
431                            const char *which /* ignored if !reasonn */,
432                            uint32_t loglevel /* ignored if !reasonn */);
433 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
434                                  const struct comm_addr *prod_hint);
435 static void enter_state_run(struct site *st);
436 static bool_t enter_state_resolve(struct site *st);
437 static void decrement_resolving_count(struct site *st, int by);
438 static bool_t enter_new_state(struct site *st,uint32_t next);
439 static void enter_state_wait(struct site *st);
440 static void activate_new_key(struct site *st);
441
442 static bool_t is_transform_valid(struct transform_inst_if *transform)
443 {
444     return transform && transform->valid(transform->st);
445 }
446
447 static bool_t current_valid(struct site *st)
448 {
449     return is_transform_valid(st->current.transform);
450 }
451
452 #define DEFINE_CALL_TRANSFORM(fwdrev)                                   \
453 static int call_transform_##fwdrev(struct site *st,                     \
454                                    struct transform_inst_if *transform, \
455                                    struct buffer_if *buf,               \
456                                    const char **errmsg)                 \
457 {                                                                       \
458     if (!is_transform_valid(transform)) {                               \
459         *errmsg="transform not set up";                                 \
460         return 1;                                                       \
461     }                                                                   \
462     return transform->fwdrev(transform->st,buf,errmsg);                 \
463 }
464
465 DEFINE_CALL_TRANSFORM(forwards)
466 DEFINE_CALL_TRANSFORM(reverse)
467
468 static void dispose_transform(struct transform_inst_if **transform_var)
469 {
470     struct transform_inst_if *transform=*transform_var;
471     if (transform) {
472         transform->delkey(transform->st);
473         transform->destroy(transform->st);
474     }
475     *transform_var = 0;
476 }    
477
478 #define CHECK_AVAIL(b,l) do { if ((b)->size<(l)) return False; } while(0)
479 #define CHECK_EMPTY(b) do { if ((b)->size!=0) return False; } while(0)
480 #define CHECK_TYPE(b,t) do { uint32_t type; \
481     CHECK_AVAIL((b),4); \
482     type=buf_unprepend_uint32((b)); \
483     if (type!=(t)) return False; } while(0)
484
485 static _Bool type_is_msg34(uint32_t type)
486 {
487     return
488         type == LABEL_MSG3 ||
489         type == LABEL_MSG3BIS ||
490         type == LABEL_MSG4;
491 }
492
493 struct parsedname {
494     int32_t len;
495     uint8_t *name;
496     struct buffer_if extrainfo;
497 };
498
499 struct msg {
500     uint8_t *hashstart;
501     uint32_t dest;
502     uint32_t source;
503     struct parsedname remote;
504     struct parsedname local;
505     uint32_t remote_capabilities;
506     uint16_t remote_mtu;
507     int capab_transformnum;
508     uint8_t *nR;
509     uint8_t *nL;
510     int32_t pklen;
511     char *pk;
512     int32_t hashlen;
513     int32_t siglen;
514     char *sig;
515 };
516
517 static void set_new_transform(struct site *st, char *pk)
518 {
519     /* Make room for the shared key */
520     st->sharedsecretlen=st->chosen_transform->keylen?:st->dh->ceil_len;
521     assert(st->sharedsecretlen);
522     if (st->sharedsecretlen > st->sharedsecretallocd) {
523         st->sharedsecretallocd=st->sharedsecretlen;
524         st->sharedsecret=safe_realloc_ary(st->sharedsecret,1,
525                                           st->sharedsecretallocd,
526                                           "site:sharedsecret");
527     }
528
529     /* Generate the shared key */
530     st->dh->makeshared(st->dh->st,st->dhsecret,st->dh->len,pk,
531                        st->sharedsecret,st->sharedsecretlen);
532
533     /* Set up the transform */
534     struct transform_if *generator=st->chosen_transform;
535     struct transform_inst_if *generated=generator->create(generator->st);
536     generated->setkey(generated->st,st->sharedsecret,
537                       st->sharedsecretlen,st->setup_priority);
538     dispose_transform(&st->new_transform);
539     st->new_transform=generated;
540
541     slog(st,LOG_SETUP_INIT,"key exchange negotiated transform"
542          " %d (capabilities ours=%#"PRIx32" theirs=%#"PRIx32")",
543          st->chosen_transform->capab_transformnum,
544          st->local_capabilities, st->remote_capabilities);
545 }
546
547 struct xinfoadd {
548     int32_t lenpos, afternul;
549 };
550 static void append_string_xinfo_start(struct buffer_if *buf,
551                                       struct xinfoadd *xia,
552                                       const char *str)
553     /* Helps construct one of the names with additional info as found
554      * in MSG1..4.  Call this function first, then append all the
555      * desired extra info (not including the nul byte) to the buffer,
556      * then call append_string_xinfo_done. */
557 {
558     xia->lenpos = buf->size;
559     buf_append_string(buf,str);
560     buf_append_uint8(buf,0);
561     xia->afternul = buf->size;
562 }
563 static void append_string_xinfo_done(struct buffer_if *buf,
564                                      struct xinfoadd *xia)
565 {
566     /* we just need to adjust the string length */
567     if (buf->size == xia->afternul) {
568         /* no extra info, strip the nul too */
569         buf_unappend_uint8(buf);
570     } else {
571         put_uint16(buf->start+xia->lenpos, buf->size-(xia->lenpos+2));
572     }
573 }
574
575 /* Build any of msg1 to msg4. msg5 and msg6 are built from the inside
576    out using a transform of config data supplied by netlink */
577 static bool_t generate_msg(struct site *st, uint32_t type, cstring_t what)
578 {
579     void *hst;
580     uint8_t *hash;
581     string_t dhpub, sig;
582
583     st->retries=st->setup_retries;
584     BUF_ALLOC(&st->buffer,what);
585     buffer_init(&st->buffer,0);
586     buf_append_uint32(&st->buffer,
587         (type==LABEL_MSG1?0:st->setup_session_id));
588     buf_append_uint32(&st->buffer,st->index);
589     buf_append_uint32(&st->buffer,type);
590
591     struct xinfoadd xia;
592     append_string_xinfo_start(&st->buffer,&xia,st->localname);
593     if ((st->local_capabilities & CAPAB_EARLY) || (type != LABEL_MSG1)) {
594         buf_append_uint32(&st->buffer,st->local_capabilities);
595     }
596     if (type_is_msg34(type)) {
597         buf_append_uint16(&st->buffer,st->mtu_target);
598     }
599     append_string_xinfo_done(&st->buffer,&xia);
600
601     buf_append_string(&st->buffer,st->remotename);
602     BUF_ADD_OBJ(append,&st->buffer,st->localN);
603     if (type==LABEL_MSG1) return True;
604     BUF_ADD_OBJ(append,&st->buffer,st->remoteN);
605     if (type==LABEL_MSG2) return True;
606
607     if (hacky_par_mid_failnow()) return False;
608
609     if (type==LABEL_MSG3BIS)
610         buf_append_uint8(&st->buffer,st->chosen_transform->capab_transformnum);
611
612     dhpub=st->dh->makepublic(st->dh->st,st->dhsecret,st->dh->len);
613     buf_append_string(&st->buffer,dhpub);
614     free(dhpub);
615     hash=safe_malloc(st->hash->len, "generate_msg");
616     hst=st->hash->init();
617     st->hash->update(hst,st->buffer.start,st->buffer.size);
618     st->hash->final(hst,hash);
619     sig=st->privkey->sign(st->privkey->st,hash,st->hash->len);
620     buf_append_string(&st->buffer,sig);
621     free(sig);
622     free(hash);
623     return True;
624 }
625
626 static bool_t unpick_name(struct buffer_if *msg, struct parsedname *nm)
627 {
628     CHECK_AVAIL(msg,2);
629     nm->len=buf_unprepend_uint16(msg);
630     CHECK_AVAIL(msg,nm->len);
631     nm->name=buf_unprepend(msg,nm->len);
632     uint8_t *nul=memchr(nm->name,0,nm->len);
633     if (!nul) {
634         buffer_readonly_view(&nm->extrainfo,0,0);
635     } else {
636         buffer_readonly_view(&nm->extrainfo, nul+1, msg->start-(nul+1));
637         nm->len=nul-nm->name;
638     }
639     return True;
640 }
641
642 static bool_t unpick_msg(struct site *st, uint32_t type,
643                          struct buffer_if *msg, struct msg *m)
644 {
645     m->capab_transformnum=-1;
646     m->hashstart=msg->start;
647     CHECK_AVAIL(msg,4);
648     m->dest=buf_unprepend_uint32(msg);
649     CHECK_AVAIL(msg,4);
650     m->source=buf_unprepend_uint32(msg);
651     CHECK_TYPE(msg,type);
652     if (!unpick_name(msg,&m->remote)) return False;
653     m->remote_capabilities=0;
654     m->remote_mtu=0;
655     if (m->remote.extrainfo.size) {
656         CHECK_AVAIL(&m->remote.extrainfo,4);
657         m->remote_capabilities=buf_unprepend_uint32(&m->remote.extrainfo);
658     }
659     if (type_is_msg34(type) && m->remote.extrainfo.size) {
660         CHECK_AVAIL(&m->remote.extrainfo,2);
661         m->remote_mtu=buf_unprepend_uint16(&m->remote.extrainfo);
662     }
663     if (!unpick_name(msg,&m->local)) return False;
664     if (type==LABEL_PROD) {
665         CHECK_EMPTY(msg);
666         return True;
667     }
668     CHECK_AVAIL(msg,NONCELEN);
669     m->nR=buf_unprepend(msg,NONCELEN);
670     if (type==LABEL_MSG1) {
671         CHECK_EMPTY(msg);
672         return True;
673     }
674     CHECK_AVAIL(msg,NONCELEN);
675     m->nL=buf_unprepend(msg,NONCELEN);
676     if (type==LABEL_MSG2) {
677         CHECK_EMPTY(msg);
678         return True;
679     }
680     if (type==LABEL_MSG3BIS) {
681         CHECK_AVAIL(msg,1);
682         m->capab_transformnum = buf_unprepend_uint8(msg);
683     } else {
684         m->capab_transformnum = CAPAB_TRANSFORMNUM_ANCIENT;
685     }
686     CHECK_AVAIL(msg,2);
687     m->pklen=buf_unprepend_uint16(msg);
688     CHECK_AVAIL(msg,m->pklen);
689     m->pk=buf_unprepend(msg,m->pklen);
690     m->hashlen=msg->start-m->hashstart;
691     CHECK_AVAIL(msg,2);
692     m->siglen=buf_unprepend_uint16(msg);
693     CHECK_AVAIL(msg,m->siglen);
694     m->sig=buf_unprepend(msg,m->siglen);
695     CHECK_EMPTY(msg);
696     return True;
697 }
698
699 static bool_t name_matches(const struct parsedname *nm, const char *expected)
700 {
701     int expected_len=strlen(expected);
702     return
703         nm->len == expected_len &&
704         !memcmp(nm->name, expected, expected_len);
705 }    
706
707 static bool_t check_msg(struct site *st, uint32_t type, struct msg *m,
708                         cstring_t *error)
709 {
710     if (type==LABEL_MSG1) return True;
711
712     /* Check that the site names and our nonce have been sent
713        back correctly, and then store our peer's nonce. */ 
714     if (!name_matches(&m->remote,st->remotename)) {
715         *error="wrong remote site name";
716         return False;
717     }
718     if (!name_matches(&m->local,st->localname)) {
719         *error="wrong local site name";
720         return False;
721     }
722     if (memcmp(m->nL,st->localN,NONCELEN)!=0) {
723         *error="wrong locally-generated nonce";
724         return False;
725     }
726     if (type==LABEL_MSG2) return True;
727     if (!consttime_memeq(m->nR,st->remoteN,NONCELEN)!=0) {
728         *error="wrong remotely-generated nonce";
729         return False;
730     }
731     /* MSG3 has complicated rules about capabilities, which are
732      * handled in process_msg3. */
733     if (type==LABEL_MSG3 || type==LABEL_MSG3BIS) return True;
734     if (m->remote_capabilities!=st->remote_capabilities) {
735         *error="remote capabilities changed";
736         return False;
737     }
738     if (type==LABEL_MSG4) return True;
739     *error="unknown message type";
740     return False;
741 }
742
743 static bool_t generate_msg1(struct site *st)
744 {
745     st->random->generate(st->random->st,NONCELEN,st->localN);
746     return generate_msg(st,LABEL_MSG1,"site:MSG1");
747 }
748
749 static bool_t process_msg1(struct site *st, struct buffer_if *msg1,
750                            const struct comm_addr *src, struct msg *m)
751 {
752     /* We've already determined we're in an appropriate state to
753        process an incoming MSG1, and that the MSG1 has correct values
754        of A and B. */
755
756     st->setup_session_id=m->source;
757     st->remote_capabilities=m->remote_capabilities;
758     memcpy(st->remoteN,m->nR,NONCELEN);
759     return True;
760 }
761
762 static bool_t generate_msg2(struct site *st)
763 {
764     st->random->generate(st->random->st,NONCELEN,st->localN);
765     return generate_msg(st,LABEL_MSG2,"site:MSG2");
766 }
767
768 static bool_t process_msg2(struct site *st, struct buffer_if *msg2,
769                            const struct comm_addr *src)
770 {
771     struct msg m;
772     cstring_t err;
773
774     if (!unpick_msg(st,LABEL_MSG2,msg2,&m)) return False;
775     if (!check_msg(st,LABEL_MSG2,&m,&err)) {
776         slog(st,LOG_SEC,"msg2: %s",err);
777         return False;
778     }
779     st->setup_session_id=m.source;
780     st->remote_capabilities=m.remote_capabilities;
781
782     /* Select the transform to use */
783
784     uint32_t remote_transforms = st->remote_capabilities & CAPAB_TRANSFORM_MASK;
785     if (!remote_transforms)
786         /* old secnets only had this one transform */
787         remote_transforms = 1UL << CAPAB_TRANSFORMNUM_ANCIENT;
788
789     struct transform_if *ti;
790     int i;
791     for (i=0; i<st->ntransforms; i++) {
792         ti=st->transforms[i];
793         if ((1UL << ti->capab_transformnum) & remote_transforms)
794             goto transform_found;
795     }
796     slog(st,LOG_ERROR,"no transforms in common"
797          " (us %#"PRIx32"; them: %#"PRIx32")",
798          st->local_capabilities & CAPAB_TRANSFORM_MASK,
799          remote_transforms);
800     return False;
801  transform_found:
802     st->chosen_transform=ti;
803
804     memcpy(st->remoteN,m.nR,NONCELEN);
805     return True;
806 }
807
808 static bool_t generate_msg3(struct site *st)
809 {
810     /* Now we have our nonce and their nonce. Think of a secret key,
811        and create message number 3. */
812     st->random->generate(st->random->st,st->dh->len,st->dhsecret);
813     return generate_msg(st,
814                         (st->remote_capabilities & CAPAB_TRANSFORM_MASK
815                          ? LABEL_MSG3BIS : LABEL_MSG3),
816                         "site:MSG3");
817 }
818
819 static bool_t process_msg3_msg4(struct site *st, struct msg *m)
820 {
821     uint8_t *hash;
822     void *hst;
823
824     /* Check signature and store g^x mod m */
825     hash=safe_malloc(st->hash->len, "process_msg3_msg4");
826     hst=st->hash->init();
827     st->hash->update(hst,m->hashstart,m->hashlen);
828     st->hash->final(hst,hash);
829     /* Terminate signature with a '0' - cheating, but should be ok */
830     m->sig[m->siglen]=0;
831     if (!st->pubkey->check(st->pubkey->st,hash,st->hash->len,m->sig)) {
832         slog(st,LOG_SEC,"msg3/msg4 signature failed check!");
833         free(hash);
834         return False;
835     }
836     free(hash);
837
838     st->remote_adv_mtu=m->remote_mtu;
839
840     return True;
841 }
842
843 static bool_t process_msg3(struct site *st, struct buffer_if *msg3,
844                            const struct comm_addr *src, uint32_t msgtype)
845 {
846     struct msg m;
847     cstring_t err;
848
849     assert(msgtype==LABEL_MSG3 || msgtype==LABEL_MSG3BIS);
850
851     if (!unpick_msg(st,msgtype,msg3,&m)) return False;
852     if (!check_msg(st,msgtype,&m,&err)) {
853         slog(st,LOG_SEC,"msg3: %s",err);
854         return False;
855     }
856     uint32_t capab_adv_late = m.remote_capabilities
857         & ~st->remote_capabilities & CAPAB_EARLY;
858     if (capab_adv_late) {
859         slog(st,LOG_SEC,"msg3 impermissibly adds early capability flag(s)"
860              " %#"PRIx32" (was %#"PRIx32", now %#"PRIx32")",
861              capab_adv_late, st->remote_capabilities, m.remote_capabilities);
862         return False;
863     }
864     st->remote_capabilities|=m.remote_capabilities;
865
866     struct transform_if *ti;
867     int i;
868     for (i=0; i<st->ntransforms; i++) {
869         ti=st->transforms[i];
870         if (ti->capab_transformnum == m.capab_transformnum)
871             goto transform_found;
872     }
873     slog(st,LOG_SEC,"peer chose unknown-to-us transform %d!",
874          m.capab_transformnum);
875     return False;
876  transform_found:
877     st->chosen_transform=ti;
878
879     if (!process_msg3_msg4(st,&m))
880         return False;
881
882     /* Terminate their DH public key with a '0' */
883     m.pk[m.pklen]=0;
884     /* Invent our DH secret key */
885     st->random->generate(st->random->st,st->dh->len,st->dhsecret);
886
887     /* Generate the shared key and set up the transform */
888     set_new_transform(st,m.pk);
889
890     return True;
891 }
892
893 static bool_t generate_msg4(struct site *st)
894 {
895     /* We have both nonces, their public key and our private key. Generate
896        our public key, sign it and send it to them. */
897     return generate_msg(st,LABEL_MSG4,"site:MSG4");
898 }
899
900 static bool_t process_msg4(struct site *st, struct buffer_if *msg4,
901                            const struct comm_addr *src)
902 {
903     struct msg m;
904     cstring_t err;
905
906     if (!unpick_msg(st,LABEL_MSG4,msg4,&m)) return False;
907     if (!check_msg(st,LABEL_MSG4,&m,&err)) {
908         slog(st,LOG_SEC,"msg4: %s",err);
909         return False;
910     }
911     
912     if (!process_msg3_msg4(st,&m))
913         return False;
914
915     /* Terminate their DH public key with a '0' */
916     m.pk[m.pklen]=0;
917
918     /* Generate the shared key and set up the transform */
919     set_new_transform(st,m.pk);
920
921     return True;
922 }
923
924 struct msg0 {
925     uint32_t dest;
926     uint32_t source;
927     uint32_t type;
928 };
929
930 static bool_t unpick_msg0(struct site *st, struct buffer_if *msg0,
931                           struct msg0 *m)
932 {
933     CHECK_AVAIL(msg0,4);
934     m->dest=buf_unprepend_uint32(msg0);
935     CHECK_AVAIL(msg0,4);
936     m->source=buf_unprepend_uint32(msg0);
937     CHECK_AVAIL(msg0,4);
938     m->type=buf_unprepend_uint32(msg0);
939     return True;
940     /* Leaves transformed part of buffer untouched */
941 }
942
943 static bool_t generate_msg5(struct site *st)
944 {
945     cstring_t transform_err;
946
947     BUF_ALLOC(&st->buffer,"site:MSG5");
948     /* We are going to add four words to the message */
949     buffer_init(&st->buffer,calculate_max_start_pad());
950     /* Give the netlink code an opportunity to put its own stuff in the
951        message (configuration information, etc.) */
952     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
953     if (call_transform_forwards(st,st->new_transform,
954                                 &st->buffer,&transform_err))
955         return False;
956     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
957     buf_prepend_uint32(&st->buffer,st->index);
958     buf_prepend_uint32(&st->buffer,st->setup_session_id);
959
960     st->retries=st->setup_retries;
961     return True;
962 }
963
964 static bool_t process_msg5(struct site *st, struct buffer_if *msg5,
965                            const struct comm_addr *src,
966                            struct transform_inst_if *transform)
967 {
968     struct msg0 m;
969     cstring_t transform_err;
970
971     if (!unpick_msg0(st,msg5,&m)) return False;
972
973     if (call_transform_reverse(st,transform,msg5,&transform_err)) {
974         /* There's a problem */
975         slog(st,LOG_SEC,"process_msg5: transform: %s",transform_err);
976         return False;
977     }
978     /* Buffer should now contain untransformed PING packet data */
979     CHECK_AVAIL(msg5,4);
980     if (buf_unprepend_uint32(msg5)!=LABEL_MSG5) {
981         slog(st,LOG_SEC,"MSG5/PING packet contained wrong label");
982         return False;
983     }
984     /* Older versions of secnet used to write some config data here
985      * which we ignore.  So we don't CHECK_EMPTY */
986     return True;
987 }
988
989 static void create_msg6(struct site *st, struct transform_inst_if *transform,
990                         uint32_t session_id)
991 {
992     cstring_t transform_err;
993
994     BUF_ALLOC(&st->buffer,"site:MSG6");
995     /* We are going to add four words to the message */
996     buffer_init(&st->buffer,calculate_max_start_pad());
997     /* Give the netlink code an opportunity to put its own stuff in the
998        message (configuration information, etc.) */
999     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1000     int problem = call_transform_forwards(st,transform,
1001                                           &st->buffer,&transform_err);
1002     assert(!problem);
1003     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1004     buf_prepend_uint32(&st->buffer,st->index);
1005     buf_prepend_uint32(&st->buffer,session_id);
1006 }
1007
1008 static bool_t generate_msg6(struct site *st)
1009 {
1010     if (!is_transform_valid(st->new_transform))
1011         return False;
1012     create_msg6(st,st->new_transform,st->setup_session_id);
1013     st->retries=1; /* Peer will retransmit MSG5 if this packet gets lost */
1014     return True;
1015 }
1016
1017 static bool_t process_msg6(struct site *st, struct buffer_if *msg6,
1018                            const struct comm_addr *src)
1019 {
1020     struct msg0 m;
1021     cstring_t transform_err;
1022
1023     if (!unpick_msg0(st,msg6,&m)) return False;
1024
1025     if (call_transform_reverse(st,st->new_transform,msg6,&transform_err)) {
1026         /* There's a problem */
1027         slog(st,LOG_SEC,"process_msg6: transform: %s",transform_err);
1028         return False;
1029     }
1030     /* Buffer should now contain untransformed PING packet data */
1031     CHECK_AVAIL(msg6,4);
1032     if (buf_unprepend_uint32(msg6)!=LABEL_MSG6) {
1033         slog(st,LOG_SEC,"MSG6/PONG packet contained invalid data");
1034         return False;
1035     }
1036     /* Older versions of secnet used to write some config data here
1037      * which we ignore.  So we don't CHECK_EMPTY */
1038     return True;
1039 }
1040
1041 static bool_t decrypt_msg0(struct site *st, struct buffer_if *msg0,
1042                            const struct comm_addr *src)
1043 {
1044     cstring_t transform_err, auxkey_err, newkey_err="n/a";
1045     struct msg0 m;
1046     uint32_t problem;
1047
1048     if (!unpick_msg0(st,msg0,&m)) return False;
1049
1050     /* Keep a copy so we can try decrypting it with multiple keys */
1051     buffer_copy(&st->scratch, msg0);
1052
1053     problem = call_transform_reverse(st,st->current.transform,
1054                                      msg0,&transform_err);
1055     if (!problem) {
1056         if (!st->auxiliary_is_new)
1057             delete_one_key(st,&st->auxiliary_key,
1058                            "peer has used new key","auxiliary key",LOG_SEC);
1059         return True;
1060     }
1061     if (problem==2)
1062         goto skew;
1063
1064     buffer_copy(msg0, &st->scratch);
1065     problem = call_transform_reverse(st,st->auxiliary_key.transform,
1066                                      msg0,&auxkey_err);
1067     if (problem==0) {
1068         slog(st,LOG_DROP,"processing packet which uses auxiliary key");
1069         if (st->auxiliary_is_new) {
1070             /* We previously timed out in state SENTMSG5 but it turns
1071              * out that our peer did in fact get our MSG5 and is
1072              * using the new key.  So we should switch to it too. */
1073             /* This is a bit like activate_new_key. */
1074             struct data_key t;
1075             t=st->current;
1076             st->current=st->auxiliary_key;
1077             st->auxiliary_key=t;
1078
1079             delete_one_key(st,&st->auxiliary_key,"peer has used new key",
1080                            "previous key",LOG_SEC);
1081             st->auxiliary_is_new=0;
1082             st->renegotiate_key_time=st->auxiliary_renegotiate_key_time;
1083         }
1084         return True;
1085     }
1086     if (problem==2)
1087         goto skew;
1088
1089     if (st->state==SITE_SENTMSG5) {
1090         buffer_copy(msg0, &st->scratch);
1091         problem = call_transform_reverse(st,st->new_transform,
1092                                          msg0,&newkey_err);
1093         if (!problem) {
1094             /* It looks like we didn't get the peer's MSG6 */
1095             /* This is like a cut-down enter_new_state(SITE_RUN) */
1096             slog(st,LOG_STATE,"will enter state RUN (MSG0 with new key)");
1097             BUF_FREE(&st->buffer);
1098             st->timeout=0;
1099             activate_new_key(st);
1100             return True; /* do process the data in this packet */
1101         }
1102         if (problem==2)
1103             goto skew;
1104     }
1105
1106     slog(st,LOG_SEC,"transform: %s (aux: %s, new: %s)",
1107          transform_err,auxkey_err,newkey_err);
1108     initiate_key_setup(st,"incoming message would not decrypt",0);
1109     send_nak(src,m.dest,m.source,m.type,msg0,"message would not decrypt");
1110     return False;
1111
1112  skew:
1113     slog(st,LOG_DROP,"transform: %s (merely skew)",transform_err);
1114     return False;
1115 }
1116
1117 static bool_t process_msg0(struct site *st, struct buffer_if *msg0,
1118                            const struct comm_addr *src)
1119 {
1120     uint32_t type;
1121
1122     if (!decrypt_msg0(st,msg0,src))
1123         return False;
1124
1125     CHECK_AVAIL(msg0,4);
1126     type=buf_unprepend_uint32(msg0);
1127     switch(type) {
1128     case LABEL_MSG7:
1129         /* We must forget about the current session. */
1130         delete_keys(st,"request from peer",LOG_SEC);
1131         return True;
1132     case LABEL_MSG9:
1133         /* Deliver to netlink layer */
1134         st->netlink->deliver(st->netlink->st,msg0);
1135         transport_data_msgok(st,src);
1136         /* See whether we should start negotiating a new key */
1137         if (st->now > st->renegotiate_key_time)
1138             initiate_key_setup(st,"incoming packet in renegotiation window",0);
1139         return True;
1140     default:
1141         slog(st,LOG_SEC,"incoming encrypted message of type %08x "
1142              "(unknown)",type);
1143         break;
1144     }
1145     return False;
1146 }
1147
1148 static void dump_packet(struct site *st, struct buffer_if *buf,
1149                         const struct comm_addr *addr, bool_t incoming)
1150 {
1151     uint32_t dest=get_uint32(buf->start);
1152     uint32_t source=get_uint32(buf->start+4);
1153     uint32_t msgtype=get_uint32(buf->start+8);
1154
1155     if (st->log_events & LOG_DUMP)
1156         slilog(st->log,M_DEBUG,"%s: %s: %08x<-%08x: %08x:",
1157                st->tunname,incoming?"incoming":"outgoing",
1158                dest,source,msgtype);
1159 }
1160
1161 static uint32_t site_status(void *st)
1162 {
1163     return 0;
1164 }
1165
1166 static bool_t send_msg(struct site *st)
1167 {
1168     if (st->retries>0) {
1169         transport_xmit(st, &st->setup_peers, &st->buffer, True);
1170         st->timeout=st->now+st->setup_retry_interval;
1171         st->retries--;
1172         return True;
1173     } else if (st->state==SITE_SENTMSG5) {
1174         logtimeout(st,"timed out sending MSG5, stashing new key");
1175         /* We stash the key we have produced, in case it turns out that
1176          * our peer did see our MSG5 after all and starts using it. */
1177         /* This is a bit like some of activate_new_key */
1178         struct transform_inst_if *t;
1179         t=st->auxiliary_key.transform;
1180         st->auxiliary_key.transform=st->new_transform;
1181         st->new_transform=t;
1182         dispose_transform(&st->new_transform);
1183
1184         st->auxiliary_is_new=1;
1185         st->auxiliary_key.key_timeout=st->now+st->key_lifetime;
1186         st->auxiliary_renegotiate_key_time=st->now+st->key_renegotiate_time;
1187         st->auxiliary_key.remote_session_id=st->setup_session_id;
1188
1189         enter_state_wait(st);
1190         return False;
1191     } else {
1192         logtimeout(st,"timed out sending key setup packet "
1193             "(in state %s)",state_name(st->state));
1194         enter_state_wait(st);
1195         return False;
1196     }
1197 }
1198
1199 static void site_resolve_callback(void *sst, const struct comm_addr *addrs,
1200                                   int naddrs, const char *address,
1201                                   const char *failwhy)
1202 {
1203     struct site *st=sst;
1204
1205     if (!naddrs) {
1206         slog(st,LOG_ERROR,"resolution of %s failed: %s",address,failwhy);
1207     } else {
1208         slog(st,LOG_PEER_ADDRS,"resolution of %s completed, %d addrs, eg: %s",
1209              address, naddrs, comm_addr_to_string(&addrs[0]));;
1210
1211         int n_tocopy = MIN(st->transport_peers_max - st->resolving_n_results,
1212                            naddrs);
1213         COPY_ARRAY(st->resolving_results + st->resolving_n_results,
1214                    addrs,
1215                    n_tocopy);
1216         st->resolving_n_results += naddrs;
1217     }
1218
1219     decrement_resolving_count(st,1);
1220 }
1221
1222 static void decrement_resolving_count(struct site *st, int by)
1223 {
1224     assert(st->resolving_count>0);
1225     st->resolving_count-=by;
1226
1227     if (st->resolving_count)
1228         return;
1229
1230     /* OK, we are done with them all.  Handle combined results. */
1231
1232     const struct comm_addr *addrs=st->resolving_results;
1233     int naddrs=st->resolving_n_results;
1234
1235     if (naddrs) {
1236         slog(st,LOG_STATE,"resolution completed, %d addrs, eg: %s",
1237              naddrs, comm_addr_to_string(&addrs[0]));;
1238         if (st->resolving_n_results > st->transport_peers_max) {
1239             slog(st,LOG_STATE,"resolution of supplied addresses/names"
1240                  " yielded too many results (%d > %d), some ignored",
1241                  st->resolving_n_results, st->transport_peers_max);
1242             st->resolving_n_results=st->transport_peers_max;
1243         }
1244     }
1245
1246     switch (st->state) {
1247     case SITE_RESOLVE:
1248         if (transport_compute_setupinit_peers(st,addrs,naddrs,0)) {
1249             enter_new_state(st,SITE_SENTMSG1);
1250         } else {
1251             /* Can't figure out who to try to to talk to */
1252             slog(st,LOG_SETUP_INIT,
1253                  "key exchange failed: cannot find peer address");
1254             enter_state_run(st);
1255         }
1256         break;
1257     case SITE_SENTMSG1: case SITE_SENTMSG2:
1258     case SITE_SENTMSG3: case SITE_SENTMSG4:
1259     case SITE_SENTMSG5:
1260         if (naddrs) {
1261             /* We start using the address immediately for data too.
1262              * It's best to store it in st->peers now because we might
1263              * go via SENTMSG5, WAIT, and a MSG0, straight into using
1264              * the new key (without updating the data peer addrs). */
1265             transport_resolve_complete(st,addrs,naddrs);
1266         } else if (st->local_mobile) {
1267             /* We can't let this rest because we may have a peer
1268              * address which will break in the future. */
1269             slog(st,LOG_SETUP_INIT,"resolution failed: "
1270                  "abandoning key exchange");
1271             enter_state_wait(st);
1272         } else {
1273             slog(st,LOG_SETUP_INIT,"resolution failed: "
1274                  " continuing to use source address of peer's packets"
1275                  " for key exchange and ultimately data");
1276         }
1277         break;
1278     case SITE_RUN:
1279         if (naddrs) {
1280             slog(st,LOG_SETUP_INIT,"resolution completed tardily,"
1281                  " updating peer address(es)");
1282             transport_resolve_complete_tardy(st,addrs,naddrs);
1283         } else if (st->local_mobile) {
1284             /* Not very good.  We should queue (another) renegotiation
1285              * so that we can update the peer address. */
1286             st->key_renegotiate_time=st->now+st->wait_timeout;
1287         } else {
1288             slog(st,LOG_SETUP_INIT,"resolution failed: "
1289                  " continuing to use source address of peer's packets");
1290         }
1291         break;
1292     case SITE_WAIT:
1293     case SITE_STOP:
1294         /* oh well */
1295         break;
1296     }
1297 }
1298
1299 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
1300                                  const struct comm_addr *prod_hint)
1301 {
1302     /* Reentrancy hazard: can call enter_new_state/enter_state_* */
1303     if (st->state!=SITE_RUN) return False;
1304     slog(st,LOG_SETUP_INIT,"initiating key exchange (%s)",reason);
1305     if (st->addresses) {
1306         slog(st,LOG_SETUP_INIT,"resolving peer address(es)");
1307         return enter_state_resolve(st);
1308     } else if (transport_compute_setupinit_peers(st,0,0,prod_hint)) {
1309         return enter_new_state(st,SITE_SENTMSG1);
1310     }
1311     slog(st,LOG_SETUP_INIT,"key exchange failed: no address for peer");
1312     return False;
1313 }
1314
1315 static void activate_new_key(struct site *st)
1316 {
1317     struct transform_inst_if *t;
1318
1319     /* We have three transform instances, which we swap between old,
1320        active and setup */
1321     t=st->auxiliary_key.transform;
1322     st->auxiliary_key.transform=st->current.transform;
1323     st->current.transform=st->new_transform;
1324     st->new_transform=t;
1325     dispose_transform(&st->new_transform);
1326
1327     st->timeout=0;
1328     st->auxiliary_is_new=0;
1329     st->auxiliary_key.key_timeout=st->current.key_timeout;
1330     st->current.key_timeout=st->now+st->key_lifetime;
1331     st->renegotiate_key_time=st->now+st->key_renegotiate_time;
1332     transport_peers_copy(st,&st->peers,&st->setup_peers);
1333     st->current.remote_session_id=st->setup_session_id;
1334
1335     /* Compute the inter-site MTU.  This is min( our_mtu, their_mtu ).
1336      * But their mtu be unspecified, in which case we just use ours. */
1337     uint32_t intersite_mtu=
1338         MIN(st->mtu_target, st->remote_adv_mtu ?: ~(uint32_t)0);
1339     st->netlink->set_mtu(st->netlink->st,intersite_mtu);
1340
1341     slog(st,LOG_ACTIVATE_KEY,"new key activated"
1342          " (mtu ours=%"PRId32" theirs=%"PRId32" intersite=%"PRId32")",
1343          st->mtu_target, st->remote_adv_mtu, intersite_mtu);
1344     enter_state_run(st);
1345 }
1346
1347 static void delete_one_key(struct site *st, struct data_key *key,
1348                            cstring_t reason, cstring_t which, uint32_t loglevel)
1349 {
1350     if (!is_transform_valid(key->transform)) return;
1351     if (reason) slog(st,loglevel,"%s deleted (%s)",which,reason);
1352     dispose_transform(&key->transform);
1353     key->key_timeout=0;
1354 }
1355
1356 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel)
1357 {
1358     if (current_valid(st)) {
1359         slog(st,loglevel,"session closed (%s)",reason);
1360
1361         delete_one_key(st,&st->current,0,0,0);
1362         set_link_quality(st);
1363     }
1364     delete_one_key(st,&st->auxiliary_key,0,0,0);
1365 }
1366
1367 static void state_assert(struct site *st, bool_t ok)
1368 {
1369     if (!ok) fatal("site:state_assert");
1370 }
1371
1372 static void enter_state_stop(struct site *st)
1373 {
1374     st->state=SITE_STOP;
1375     st->timeout=0;
1376     delete_keys(st,"entering state STOP",LOG_TIMEOUT_KEY);
1377     dispose_transform(&st->new_transform);
1378 }
1379
1380 static void set_link_quality(struct site *st)
1381 {
1382     uint32_t quality;
1383     if (current_valid(st))
1384         quality=LINK_QUALITY_UP;
1385     else if (st->state==SITE_WAIT || st->state==SITE_STOP)
1386         quality=LINK_QUALITY_DOWN;
1387     else if (st->addresses)
1388         quality=LINK_QUALITY_DOWN_CURRENT_ADDRESS;
1389     else if (transport_peers_valid(&st->peers))
1390         quality=LINK_QUALITY_DOWN_STALE_ADDRESS;
1391     else
1392         quality=LINK_QUALITY_DOWN;
1393
1394     st->netlink->set_quality(st->netlink->st,quality);
1395 }
1396
1397 static void enter_state_run(struct site *st)
1398 {
1399     slog(st,LOG_STATE,"entering state RUN");
1400     st->state=SITE_RUN;
1401     st->timeout=0;
1402
1403     st->setup_session_id=0;
1404     transport_peers_clear(st,&st->setup_peers);
1405     FILLZERO(st->localN);
1406     FILLZERO(st->remoteN);
1407     dispose_transform(&st->new_transform);
1408     memset(st->dhsecret,0,st->dh->len);
1409     memset(st->sharedsecret,0,st->sharedsecretlen);
1410     set_link_quality(st);
1411 }
1412
1413 static bool_t ensure_resolving(struct site *st)
1414 {
1415     /* Reentrancy hazard: may call site_resolve_callback and hence
1416      * enter_new_state, enter_state_* and generate_msg*. */
1417     if (st->resolving_count)
1418         return True;
1419
1420     assert(st->addresses);
1421
1422     /* resolver->request might reentrantly call site_resolve_callback
1423      * which will decrement st->resolving, so we need to increment it
1424      * twice beforehand to prevent decrement from thinking we're
1425      * finished, and decrement it ourselves.  Alternatively if
1426      * everything fails then there are no callbacks due and we simply
1427      * set it to 0 and return false.. */
1428     st->resolving_n_results=0;
1429     st->resolving_count+=2;
1430     const char **addrp=st->addresses;
1431     const char *address;
1432     bool_t anyok=False;
1433     for (; (address=*addrp++); ) {
1434         bool_t ok = st->resolver->request(st->resolver->st,address,
1435                                           st->remoteport,st->comms[0],
1436                                           site_resolve_callback,st);
1437         if (ok)
1438             st->resolving_count++;
1439         anyok|=ok;
1440     }
1441     if (!anyok) {
1442         st->resolving_count=0;
1443         return False;
1444     }
1445     decrement_resolving_count(st,2);
1446     return True;
1447 }
1448
1449 static bool_t enter_state_resolve(struct site *st)
1450 {
1451     /* Reentrancy hazard!  See ensure_resolving. */
1452     state_assert(st,st->state==SITE_RUN);
1453     slog(st,LOG_STATE,"entering state RESOLVE");
1454     st->state=SITE_RESOLVE;
1455     return ensure_resolving(st);
1456 }
1457
1458 static bool_t enter_new_state(struct site *st, uint32_t next)
1459 {
1460     bool_t (*gen)(struct site *st);
1461     int r;
1462
1463     slog(st,LOG_STATE,"entering state %s",state_name(next));
1464     switch(next) {
1465     case SITE_SENTMSG1:
1466         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE);
1467         gen=generate_msg1;
1468         break;
1469     case SITE_SENTMSG2:
1470         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1471                      st->state==SITE_SENTMSG1 || st->state==SITE_WAIT);
1472         gen=generate_msg2;
1473         break;
1474     case SITE_SENTMSG3:
1475         state_assert(st,st->state==SITE_SENTMSG1);
1476         BUF_FREE(&st->buffer);
1477         gen=generate_msg3;
1478         break;
1479     case SITE_SENTMSG4:
1480         state_assert(st,st->state==SITE_SENTMSG2);
1481         BUF_FREE(&st->buffer);
1482         gen=generate_msg4;
1483         break;
1484     case SITE_SENTMSG5:
1485         state_assert(st,st->state==SITE_SENTMSG3);
1486         BUF_FREE(&st->buffer);
1487         gen=generate_msg5;
1488         break;
1489     case SITE_RUN:
1490         state_assert(st,st->state==SITE_SENTMSG4);
1491         BUF_FREE(&st->buffer);
1492         gen=generate_msg6;
1493         break;
1494     default:
1495         gen=NULL;
1496         fatal("enter_new_state(%s): invalid new state",state_name(next));
1497         break;
1498     }
1499
1500     if (hacky_par_start_failnow()) return False;
1501
1502     r= gen(st) && send_msg(st);
1503
1504     hacky_par_end(&r,
1505                   st->setup_retries, st->setup_retry_interval,
1506                   send_msg, st);
1507     
1508     if (r) {
1509         st->state=next;
1510         if (next==SITE_RUN) {
1511             BUF_FREE(&st->buffer); /* Never reused */
1512             st->timeout=0; /* Never retransmit */
1513             activate_new_key(st);
1514         }
1515         return True;
1516     }
1517     slog(st,LOG_ERROR,"error entering state %s",state_name(next));
1518     st->buffer.free=False; /* Unconditionally use the buffer; it may be
1519                               in either state, and enter_state_wait() will
1520                               do a BUF_FREE() */
1521     enter_state_wait(st);
1522     return False;
1523 }
1524
1525 /* msg7 tells our peer that we're about to forget our key */
1526 static bool_t send_msg7(struct site *st, cstring_t reason)
1527 {
1528     cstring_t transform_err;
1529
1530     if (current_valid(st) && st->buffer.free
1531         && transport_peers_valid(&st->peers)) {
1532         BUF_ALLOC(&st->buffer,"site:MSG7");
1533         buffer_init(&st->buffer,calculate_max_start_pad());
1534         buf_append_uint32(&st->buffer,LABEL_MSG7);
1535         buf_append_string(&st->buffer,reason);
1536         if (call_transform_forwards(st, st->current.transform,
1537                                     &st->buffer, &transform_err))
1538             goto free_out;
1539         buf_prepend_uint32(&st->buffer,LABEL_MSG0);
1540         buf_prepend_uint32(&st->buffer,st->index);
1541         buf_prepend_uint32(&st->buffer,st->current.remote_session_id);
1542         transport_xmit(st,&st->peers,&st->buffer,True);
1543         BUF_FREE(&st->buffer);
1544     free_out:
1545         return True;
1546     }
1547     return False;
1548 }
1549
1550 /* We go into this state if our peer becomes uncommunicative. Similar to
1551    the "stop" state, we forget all session keys for a while, before
1552    re-entering the "run" state. */
1553 static void enter_state_wait(struct site *st)
1554 {
1555     slog(st,LOG_STATE,"entering state WAIT");
1556     st->timeout=st->now+st->wait_timeout;
1557     st->state=SITE_WAIT;
1558     set_link_quality(st);
1559     BUF_FREE(&st->buffer); /* will have had an outgoing packet in it */
1560     /* XXX Erase keys etc. */
1561 }
1562
1563 static void generate_prod(struct site *st, struct buffer_if *buf)
1564 {
1565     buffer_init(buf,0);
1566     buf_append_uint32(buf,0);
1567     buf_append_uint32(buf,0);
1568     buf_append_uint32(buf,LABEL_PROD);
1569     buf_append_string(buf,st->localname);
1570     buf_append_string(buf,st->remotename);
1571 }
1572
1573 static void generate_send_prod(struct site *st,
1574                                const struct comm_addr *source)
1575 {
1576     if (!st->allow_send_prod) return; /* too soon */
1577     if (!(st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1578           st->state==SITE_WAIT)) return; /* we'd ignore peer's MSG1 */
1579
1580     slog(st,LOG_SETUP_INIT,"prodding peer for key exchange");
1581     st->allow_send_prod=0;
1582     generate_prod(st,&st->scratch);
1583     dump_packet(st,&st->scratch,source,False);
1584     source->comm->sendmsg(source->comm->st, &st->scratch, source);
1585 }
1586
1587 static inline void site_settimeout(uint64_t timeout, int *timeout_io)
1588 {
1589     if (timeout) {
1590         int64_t offset=timeout-*now;
1591         if (offset<0) offset=0;
1592         if (offset>INT_MAX) offset=INT_MAX;
1593         if (*timeout_io<0 || offset<*timeout_io)
1594             *timeout_io=offset;
1595     }
1596 }
1597
1598 static int site_beforepoll(void *sst, struct pollfd *fds, int *nfds_io,
1599                            int *timeout_io)
1600 {
1601     struct site *st=sst;
1602
1603     BEFOREPOLL_WANT_FDS(0); /* We don't use any file descriptors */
1604     st->now=*now;
1605
1606     /* Work out when our next timeout is. The earlier of 'timeout' or
1607        'current.key_timeout'. A stored value of '0' indicates no timeout
1608        active. */
1609     site_settimeout(st->timeout, timeout_io);
1610     site_settimeout(st->current.key_timeout, timeout_io);
1611     site_settimeout(st->auxiliary_key.key_timeout, timeout_io);
1612
1613     return 0; /* success */
1614 }
1615
1616 static void check_expiry(struct site *st, struct data_key *key,
1617                          const char *which)
1618 {
1619     if (key->key_timeout && *now>key->key_timeout) {
1620         delete_one_key(st,key,"maximum life exceeded",which,LOG_TIMEOUT_KEY);
1621     }
1622 }
1623
1624 /* NB site_afterpoll will be called before site_beforepoll is ever called */
1625 static void site_afterpoll(void *sst, struct pollfd *fds, int nfds)
1626 {
1627     struct site *st=sst;
1628
1629     st->now=*now;
1630     if (st->timeout && *now>st->timeout) {
1631         st->timeout=0;
1632         if (st->state>=SITE_SENTMSG1 && st->state<=SITE_SENTMSG5) {
1633             if (!hacky_par_start_failnow())
1634                 send_msg(st);
1635         } else if (st->state==SITE_WAIT) {
1636             enter_state_run(st);
1637         } else {
1638             slog(st,LOG_ERROR,"site_afterpoll: unexpected timeout, state=%d",
1639                  st->state);
1640         }
1641     }
1642     check_expiry(st,&st->current,"current key");
1643     check_expiry(st,&st->auxiliary_key,"auxiliary key");
1644 }
1645
1646 /* This function is called by the netlink device to deliver packets
1647    intended for the remote network. The packet is in "raw" wire
1648    format, but is guaranteed to be word-aligned. */
1649 static void site_outgoing(void *sst, struct buffer_if *buf)
1650 {
1651     struct site *st=sst;
1652     cstring_t transform_err;
1653     
1654     if (st->state==SITE_STOP) {
1655         BUF_FREE(buf);
1656         return;
1657     }
1658
1659     st->allow_send_prod=1;
1660
1661     /* In all other states we consider delivering the packet if we have
1662        a valid key and a valid address to send it to. */
1663     if (current_valid(st) && transport_peers_valid(&st->peers)) {
1664         /* Transform it and send it */
1665         if (buf->size>0) {
1666             buf_prepend_uint32(buf,LABEL_MSG9);
1667             if (call_transform_forwards(st, st->current.transform,
1668                                         buf, &transform_err))
1669                 goto free_out;
1670             buf_prepend_uint32(buf,LABEL_MSG0);
1671             buf_prepend_uint32(buf,st->index);
1672             buf_prepend_uint32(buf,st->current.remote_session_id);
1673             transport_xmit(st,&st->peers,buf,False);
1674         }
1675     free_out:
1676         BUF_FREE(buf);
1677         return;
1678     }
1679
1680     slog(st,LOG_DROP,"discarding outgoing packet of size %d",buf->size);
1681     BUF_FREE(buf);
1682     initiate_key_setup(st,"outgoing packet",0);
1683 }
1684
1685 static bool_t named_for_us(struct site *st, const struct buffer_if *buf_in,
1686                            uint32_t type, struct msg *m)
1687     /* For packets which are identified by the local and remote names.
1688      * If it has our name and our peer's name in it it's for us. */
1689 {
1690     struct buffer_if buf[1];
1691     buffer_readonly_clone(buf,buf_in);
1692     return unpick_msg(st,type,buf,m)
1693         && name_matches(&m->remote,st->remotename)
1694         && name_matches(&m->local,st->localname);
1695 }
1696
1697 /* This function is called by the communication device to deliver
1698    packets from our peers.
1699    It should return True if the packet is recognised as being for
1700    this current site instance (and should therefore not be processed
1701    by other sites), even if the packet was otherwise ignored. */
1702 static bool_t site_incoming(void *sst, struct buffer_if *buf,
1703                             const struct comm_addr *source)
1704 {
1705     struct site *st=sst;
1706
1707     if (buf->size < 12) return False;
1708
1709     uint32_t dest=get_uint32(buf->start);
1710     uint32_t msgtype=get_uint32(buf->start+8);
1711     struct msg named_msg;
1712
1713     if (msgtype==LABEL_MSG1) {
1714         if (!named_for_us(st,buf,msgtype,&named_msg))
1715             return False;
1716         /* It's a MSG1 addressed to us. Decide what to do about it. */
1717         dump_packet(st,buf,source,True);
1718         if (st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1719             st->state==SITE_WAIT) {
1720             /* We should definitely process it */
1721             transport_compute_setupinit_peers(st,0,0,source);
1722             if (process_msg1(st,buf,source,&named_msg)) {
1723                 slog(st,LOG_SETUP_INIT,"key setup initiated by peer");
1724                 bool_t entered=enter_new_state(st,SITE_SENTMSG2);
1725                 if (entered && st->addresses && st->local_mobile)
1726                     /* We must do this as the very last thing, because
1727                        the resolver callback might reenter us. */
1728                     ensure_resolving(st);
1729             } else {
1730                 slog(st,LOG_ERROR,"failed to process incoming msg1");
1731             }
1732             BUF_FREE(buf);
1733             return True;
1734         } else if (st->state==SITE_SENTMSG1) {
1735             /* We've just sent a message 1! They may have crossed on
1736                the wire. If we have priority then we ignore the
1737                incoming one, otherwise we process it as usual. */
1738             if (st->setup_priority) {
1739                 BUF_FREE(buf);
1740                 slog(st,LOG_DUMP,"crossed msg1s; we are higher "
1741                      "priority => ignore incoming msg1");
1742                 return True;
1743             } else {
1744                 slog(st,LOG_DUMP,"crossed msg1s; we are lower "
1745                      "priority => use incoming msg1");
1746                 if (process_msg1(st,buf,source,&named_msg)) {
1747                     BUF_FREE(&st->buffer); /* Free our old message 1 */
1748                     transport_setup_msgok(st,source);
1749                     enter_new_state(st,SITE_SENTMSG2);
1750                 } else {
1751                     slog(st,LOG_ERROR,"failed to process an incoming "
1752                          "crossed msg1 (we have low priority)");
1753                 }
1754                 BUF_FREE(buf);
1755                 return True;
1756             }
1757         }
1758         /* The message 1 was received at an unexpected stage of the
1759            key setup. XXX POLICY - what do we do? */
1760         slog(st,LOG_UNEXPECTED,"unexpected incoming message 1");
1761         BUF_FREE(buf);
1762         return True;
1763     }
1764     if (msgtype==LABEL_PROD) {
1765         if (!named_for_us(st,buf,msgtype,&named_msg))
1766             return False;
1767         dump_packet(st,buf,source,True);
1768         if (st->state!=SITE_RUN) {
1769             slog(st,LOG_DROP,"ignoring PROD when not in state RUN");
1770         } else if (current_valid(st)) {
1771             slog(st,LOG_DROP,"ignoring PROD when we think we have a key");
1772         } else {
1773             initiate_key_setup(st,"peer sent PROD packet",source);
1774         }
1775         BUF_FREE(buf);
1776         return True;
1777     }
1778     if (dest==st->index) {
1779         /* Explicitly addressed to us */
1780         if (msgtype!=LABEL_MSG0) dump_packet(st,buf,source,True);
1781         switch (msgtype) {
1782         case LABEL_NAK:
1783             /* If the source is our current peer then initiate a key setup,
1784                because our peer's forgotten the key */
1785             if (get_uint32(buf->start+4)==st->current.remote_session_id) {
1786                 bool_t initiated;
1787                 initiated = initiate_key_setup(st,"received a NAK",source);
1788                 if (!initiated) generate_send_prod(st,source);
1789             } else {
1790                 slog(st,LOG_SEC,"bad incoming NAK");
1791             }
1792             break;
1793         case LABEL_MSG0:
1794             process_msg0(st,buf,source);
1795             break;
1796         case LABEL_MSG1:
1797             /* Setup packet: should not have been explicitly addressed
1798                to us */
1799             slog(st,LOG_SEC,"incoming explicitly addressed msg1");
1800             break;
1801         case LABEL_MSG2:
1802             /* Setup packet: expected only in state SENTMSG1 */
1803             if (st->state!=SITE_SENTMSG1) {
1804                 slog(st,LOG_UNEXPECTED,"unexpected MSG2");
1805             } else if (process_msg2(st,buf,source)) {
1806                 transport_setup_msgok(st,source);
1807                 enter_new_state(st,SITE_SENTMSG3);
1808             } else {
1809                 slog(st,LOG_SEC,"invalid MSG2");
1810             }
1811             break;
1812         case LABEL_MSG3:
1813         case LABEL_MSG3BIS:
1814             /* Setup packet: expected only in state SENTMSG2 */
1815             if (st->state!=SITE_SENTMSG2) {
1816                 slog(st,LOG_UNEXPECTED,"unexpected MSG3");
1817             } else if (process_msg3(st,buf,source,msgtype)) {
1818                 transport_setup_msgok(st,source);
1819                 enter_new_state(st,SITE_SENTMSG4);
1820             } else {
1821                 slog(st,LOG_SEC,"invalid MSG3");
1822             }
1823             break;
1824         case LABEL_MSG4:
1825             /* Setup packet: expected only in state SENTMSG3 */
1826             if (st->state!=SITE_SENTMSG3) {
1827                 slog(st,LOG_UNEXPECTED,"unexpected MSG4");
1828             } else if (process_msg4(st,buf,source)) {
1829                 transport_setup_msgok(st,source);
1830                 enter_new_state(st,SITE_SENTMSG5);
1831             } else {
1832                 slog(st,LOG_SEC,"invalid MSG4");
1833             }
1834             break;
1835         case LABEL_MSG5:
1836             /* Setup packet: expected only in state SENTMSG4 */
1837             /* (may turn up in state RUN if our return MSG6 was lost
1838                and the new key has already been activated. In that
1839                case we discard it. The peer will realise that we
1840                are using the new key when they see our data packets.
1841                Until then the peer's data packets to us get discarded. */
1842             if (st->state==SITE_SENTMSG4) {
1843                 if (process_msg5(st,buf,source,st->new_transform)) {
1844                     transport_setup_msgok(st,source);
1845                     enter_new_state(st,SITE_RUN);
1846                 } else {
1847                     slog(st,LOG_SEC,"invalid MSG5");
1848                 }
1849             } else if (st->state==SITE_RUN) {
1850                 if (process_msg5(st,buf,source,st->current.transform)) {
1851                     slog(st,LOG_DROP,"got MSG5, retransmitting MSG6");
1852                     transport_setup_msgok(st,source);
1853                     create_msg6(st,st->current.transform,
1854                                 st->current.remote_session_id);
1855                     transport_xmit(st,&st->peers,&st->buffer,True);
1856                     BUF_FREE(&st->buffer);
1857                 } else {
1858                     slog(st,LOG_SEC,"invalid MSG5 (in state RUN)");
1859                 }
1860             } else {
1861                 slog(st,LOG_UNEXPECTED,"unexpected MSG5");
1862             }
1863             break;
1864         case LABEL_MSG6:
1865             /* Setup packet: expected only in state SENTMSG5 */
1866             if (st->state!=SITE_SENTMSG5) {
1867                 slog(st,LOG_UNEXPECTED,"unexpected MSG6");
1868             } else if (process_msg6(st,buf,source)) {
1869                 BUF_FREE(&st->buffer); /* Free message 5 */
1870                 transport_setup_msgok(st,source);
1871                 activate_new_key(st);
1872             } else {
1873                 slog(st,LOG_SEC,"invalid MSG6");
1874             }
1875             break;
1876         default:
1877             slog(st,LOG_SEC,"received message of unknown type 0x%08x",
1878                  msgtype);
1879             break;
1880         }
1881         BUF_FREE(buf);
1882         return True;
1883     }
1884
1885     return False;
1886 }
1887
1888 static void site_control(void *vst, bool_t run)
1889 {
1890     struct site *st=vst;
1891     if (run) enter_state_run(st);
1892     else enter_state_stop(st);
1893 }
1894
1895 static void site_phase_hook(void *sst, uint32_t newphase)
1896 {
1897     struct site *st=sst;
1898
1899     /* The program is shutting down; tell our peer */
1900     send_msg7(st,"shutting down");
1901 }
1902
1903 static list_t *site_apply(closure_t *self, struct cloc loc, dict_t *context,
1904                           list_t *args)
1905 {
1906     static uint32_t index_sequence;
1907     struct site *st;
1908     item_t *item;
1909     dict_t *dict;
1910     int i;
1911
1912     st=safe_malloc(sizeof(*st),"site_apply");
1913
1914     st->cl.description="site";
1915     st->cl.type=CL_SITE;
1916     st->cl.apply=NULL;
1917     st->cl.interface=&st->ops;
1918     st->ops.st=st;
1919     st->ops.control=site_control;
1920     st->ops.status=site_status;
1921
1922     /* First parameter must be a dict */
1923     item=list_elem(args,0);
1924     if (!item || item->type!=t_dict)
1925         cfgfatal(loc,"site","parameter must be a dictionary\n");
1926     
1927     dict=item->data.dict;
1928     st->localname=dict_read_string(dict, "local-name", True, "site", loc);
1929     st->remotename=dict_read_string(dict, "name", True, "site", loc);
1930
1931     st->peer_mobile=dict_read_bool(dict,"mobile",False,"site",loc,False);
1932     st->local_mobile=
1933         dict_read_bool(dict,"local-mobile",False,"site",loc,False);
1934
1935     /* Sanity check (which also allows the 'sites' file to include
1936        site() closures for all sites including our own): refuse to
1937        talk to ourselves */
1938     if (strcmp(st->localname,st->remotename)==0) {
1939         Message(M_DEBUG,"site %s: local-name==name -> ignoring this site\n",
1940                 st->localname);
1941         if (st->peer_mobile != st->local_mobile)
1942             cfgfatal(loc,"site","site %s's peer-mobile=%d"
1943                     " but our local-mobile=%d\n",
1944                     st->localname, st->peer_mobile, st->local_mobile);
1945         free(st);
1946         return NULL;
1947     }
1948     if (st->peer_mobile && st->local_mobile) {
1949         Message(M_WARNING,"site %s: site is mobile but so are we"
1950                 " -> ignoring this site\n", st->remotename);
1951         free(st);
1952         return NULL;
1953     }
1954
1955     assert(index_sequence < 0xffffffffUL);
1956     st->index = ++index_sequence;
1957     st->local_capabilities = 0;
1958     st->netlink=find_cl_if(dict,"link",CL_NETLINK,True,"site",loc);
1959
1960 #define GET_CLOSURE_LIST(dictkey,things,nthings,CL_TYPE) do{            \
1961     list_t *things##_cfg=dict_lookup(dict,dictkey);                     \
1962     if (!things##_cfg)                                                  \
1963         cfgfatal(loc,"site","closure list \"%s\" not found\n",dictkey); \
1964     st->nthings=list_length(things##_cfg);                              \
1965     st->things=safe_malloc_ary(sizeof(*st->things),st->nthings,dictkey "s"); \
1966     assert(st->nthings);                                                \
1967     for (i=0; i<st->nthings; i++) {                                     \
1968         item_t *item=list_elem(things##_cfg,i);                         \
1969         if (item->type!=t_closure)                                      \
1970             cfgfatal(loc,"site","%s is not a closure\n",dictkey);       \
1971         closure_t *cl=item->data.closure;                               \
1972         if (cl->type!=CL_TYPE)                                          \
1973             cfgfatal(loc,"site","%s closure wrong type\n",dictkey);     \
1974         st->things[i]=cl->interface;                                    \
1975     }                                                                   \
1976 }while(0)
1977
1978     GET_CLOSURE_LIST("comm",comms,ncomms,CL_COMM);
1979
1980     st->resolver=find_cl_if(dict,"resolver",CL_RESOLVER,True,"site",loc);
1981     st->log=find_cl_if(dict,"log",CL_LOG,True,"site",loc);
1982     st->random=find_cl_if(dict,"random",CL_RANDOMSRC,True,"site",loc);
1983
1984     st->privkey=find_cl_if(dict,"local-key",CL_RSAPRIVKEY,True,"site",loc);
1985     st->addresses=dict_read_string_array(dict,"address",False,"site",loc,0);
1986     if (st->addresses)
1987         st->remoteport=dict_read_number(dict,"port",True,"site",loc,0);
1988     else st->remoteport=0;
1989     st->pubkey=find_cl_if(dict,"key",CL_RSAPUBKEY,True,"site",loc);
1990
1991     GET_CLOSURE_LIST("transform",transforms,ntransforms,CL_TRANSFORM);
1992
1993     st->dh=find_cl_if(dict,"dh",CL_DH,True,"site",loc);
1994     st->hash=find_cl_if(dict,"hash",CL_HASH,True,"site",loc);
1995
1996 #define DEFAULT(D) (st->peer_mobile || st->local_mobile \
1997                     ? DEFAULT_MOBILE_##D : DEFAULT_##D)
1998 #define CFG_NUMBER(k,D) dict_read_number(dict,(k),False,"site",loc,DEFAULT(D));
1999
2000     st->key_lifetime=         CFG_NUMBER("key-lifetime",  KEY_LIFETIME);
2001     st->setup_retries=        CFG_NUMBER("setup-retries", SETUP_RETRIES);
2002     st->setup_retry_interval= CFG_NUMBER("setup-timeout", SETUP_RETRY_INTERVAL);
2003     st->wait_timeout=         CFG_NUMBER("wait-time",     WAIT_TIME);
2004     st->mtu_target= dict_read_number(dict,"mtu-target",False,"site",loc,0);
2005
2006     st->mobile_peer_expiry= dict_read_number(
2007        dict,"mobile-peer-expiry",False,"site",loc,DEFAULT_MOBILE_PEER_EXPIRY);
2008
2009     const char *peerskey= st->peer_mobile
2010         ? "mobile-peers-max" : "static-peers-max";
2011     st->transport_peers_max= dict_read_number(
2012         dict,peerskey,False,"site",loc,DEFAULT_MOBILE_PEERS_MAX);
2013     if (st->transport_peers_max<1 ||
2014         st->transport_peers_max>=MAX_PEER_ADDRS) {
2015         cfgfatal(loc,"site", "%s must be in range 1.."
2016                  STRING(MAX_PEER_ADDRS) "\n", peerskey);
2017     }
2018
2019     if (st->key_lifetime < DEFAULT(KEY_RENEGOTIATE_GAP)*2)
2020         st->key_renegotiate_time=st->key_lifetime/2;
2021     else
2022         st->key_renegotiate_time=st->key_lifetime-DEFAULT(KEY_RENEGOTIATE_GAP);
2023     st->key_renegotiate_time=dict_read_number(
2024         dict,"renegotiate-time",False,"site",loc,st->key_renegotiate_time);
2025     if (st->key_renegotiate_time > st->key_lifetime) {
2026         cfgfatal(loc,"site",
2027                  "renegotiate-time must be less than key-lifetime\n");
2028     }
2029
2030     st->log_events=string_list_to_word(dict_lookup(dict,"log-events"),
2031                                        log_event_table,"site");
2032
2033     st->resolving_count=0;
2034     st->allow_send_prod=0;
2035
2036     st->tunname=safe_malloc(strlen(st->localname)+strlen(st->remotename)+5,
2037                             "site_apply");
2038     sprintf(st->tunname,"%s<->%s",st->localname,st->remotename);
2039
2040     /* The information we expect to see in incoming messages of type 1 */
2041     /* fixme: lots of unchecked overflows here, but the results are only
2042        corrupted packets rather than undefined behaviour */
2043     st->setup_priority=(strcmp(st->localname,st->remotename)>0);
2044
2045     buffer_new(&st->buffer,SETUP_BUFFER_LEN);
2046
2047     buffer_new(&st->scratch,SETUP_BUFFER_LEN);
2048     BUF_ALLOC(&st->scratch,"site:scratch");
2049
2050     /* We are interested in poll(), but only for timeouts. We don't have
2051        any fds of our own. */
2052     register_for_poll(st, site_beforepoll, site_afterpoll, "site");
2053     st->timeout=0;
2054
2055     st->remote_capabilities=0;
2056     st->chosen_transform=0;
2057     st->current.key_timeout=0;
2058     st->auxiliary_key.key_timeout=0;
2059     transport_peers_clear(st,&st->peers);
2060     transport_peers_clear(st,&st->setup_peers);
2061     /* XXX mlock these */
2062     st->dhsecret=safe_malloc(st->dh->len,"site:dhsecret");
2063     st->sharedsecretlen=st->sharedsecretallocd=0;
2064     st->sharedsecret=0;
2065
2066     for (i=0; i<st->ntransforms; i++) {
2067         struct transform_if *ti=st->transforms[i];
2068         uint32_t capbit = 1UL << ti->capab_transformnum;
2069         if (st->local_capabilities & capbit)
2070             slog(st,LOG_ERROR,"transformnum capability bit"
2071                  " %d (%#"PRIx32") reused", ti->capab_transformnum, capbit);
2072         st->local_capabilities |= capbit;
2073     }
2074
2075     /* We need to register the remote networks with the netlink device */
2076     uint32_t netlink_mtu; /* local virtual interface mtu */
2077     st->netlink->reg(st->netlink->st, site_outgoing, st, &netlink_mtu);
2078     if (!st->mtu_target)
2079         st->mtu_target=netlink_mtu;
2080     
2081     for (i=0; i<st->ncomms; i++)
2082         st->comms[i]->request_notify(st->comms[i]->st, st, site_incoming);
2083
2084     st->current.transform=0;
2085     st->auxiliary_key.transform=0;
2086     st->new_transform=0;
2087     st->auxiliary_is_new=0;
2088
2089     enter_state_stop(st);
2090
2091     add_hook(PHASE_SHUTDOWN,site_phase_hook,st);
2092
2093     return new_closure(&st->cl);
2094 }
2095
2096 void site_module(dict_t *dict)
2097 {
2098     add_closure(dict,"site",site_apply);
2099 }
2100
2101
2102 /***** TRANSPORT PEERS definitions *****/
2103
2104 static void transport_peers_debug(struct site *st, transport_peers *dst,
2105                                   const char *didwhat,
2106                                   int nargs, const struct comm_addr *args,
2107                                   size_t stride) {
2108     int i;
2109     char *argp;
2110
2111     if (!(st->log_events & LOG_PEER_ADDRS))
2112         return; /* an optimisation */
2113
2114     slog(st, LOG_PEER_ADDRS, "peers (%s) %s nargs=%d => npeers=%d",
2115          (dst==&st->peers ? "data" :
2116           dst==&st->setup_peers ? "setup" : "UNKNOWN"),
2117          didwhat, nargs, dst->npeers);
2118
2119     for (i=0, argp=(void*)args;
2120          i<nargs;
2121          i++, (argp+=stride?stride:sizeof(*args))) {
2122         const struct comm_addr *ca=(void*)argp;
2123         slog(st, LOG_PEER_ADDRS, " args: addrs[%d]=%s",
2124              i, comm_addr_to_string(ca));
2125     }
2126     for (i=0; i<dst->npeers; i++) {
2127         struct timeval diff;
2128         timersub(tv_now,&dst->peers[i].last,&diff);
2129         const struct comm_addr *ca=&dst->peers[i].addr;
2130         slog(st, LOG_PEER_ADDRS, " peers: addrs[%d]=%s T-%ld.%06ld",
2131              i, comm_addr_to_string(ca),
2132              (unsigned long)diff.tv_sec, (unsigned long)diff.tv_usec);
2133     }
2134 }
2135
2136 static bool_t transport_addrs_equal(const struct comm_addr *a,
2137                                     const struct comm_addr *b) {
2138     return !memcmp(a,b,sizeof(*a));
2139 }
2140
2141 static void transport_peers_expire(struct site *st, transport_peers *peers) {
2142     /* peers must be sorted first */
2143     int previous_peers=peers->npeers;
2144     struct timeval oldest;
2145     oldest.tv_sec  = tv_now->tv_sec - st->mobile_peer_expiry;
2146     oldest.tv_usec = tv_now->tv_usec;
2147     while (peers->npeers>1 &&
2148            timercmp(&peers->peers[peers->npeers-1].last, &oldest, <))
2149         peers->npeers--;
2150     if (peers->npeers != previous_peers)
2151         transport_peers_debug(st,peers,"expire", 0,0,0);
2152 }
2153
2154 static bool_t transport_peer_record_one(struct site *st, transport_peers *peers,
2155                                         const struct comm_addr *ca,
2156                                         const struct timeval *tv) {
2157     /* returns false if output is full */
2158     int search;
2159
2160     if (peers->npeers > st->transport_peers_max)
2161         return 0;
2162
2163     for (search=0; search<peers->npeers; search++)
2164         if (transport_addrs_equal(&peers->peers[search].addr, ca))
2165             return 1;
2166
2167     peers->peers[peers->npeers].addr = *ca;
2168     peers->peers[peers->npeers].last = *tv;
2169     peers->npeers++;
2170     return 1;
2171 }
2172
2173 static void transport_record_peers(struct site *st, transport_peers *peers,
2174                                    const struct comm_addr *addrs, int naddrs,
2175                                    const char *m) {
2176     /* We add addrs into peers.  The new entries end up at the front
2177      * and displace entries towards the end (perhaps even off the end).
2178      * Any existing matching entries are moved up to the front.
2179      * Caller must first call transport_peers_expire. */
2180
2181     if (naddrs==1 && peers->npeers>=1 &&
2182         transport_addrs_equal(&addrs[0], &peers->peers[0].addr)) {
2183         /* optimisation, also avoids debug for trivial updates */
2184         peers->peers[0].last = *tv_now;
2185         return;
2186     }
2187
2188     int old_npeers=peers->npeers;
2189     transport_peer old_peers[old_npeers];
2190     COPY_ARRAY(old_peers,peers->peers,old_npeers);
2191
2192     peers->npeers=0;
2193     int i;
2194     for (i=0; i<naddrs; i++) {
2195         if (!transport_peer_record_one(st,peers, &addrs[i], tv_now))
2196             break;
2197     }
2198     for (i=0; i<old_npeers; i++) {
2199         const transport_peer *old=&old_peers[i];
2200         if (!transport_peer_record_one(st,peers, &old->addr, &old->last))
2201             break;
2202     }
2203
2204     transport_peers_debug(st,peers,m, naddrs,addrs,0);
2205 }
2206
2207 static bool_t transport_compute_setupinit_peers(struct site *st,
2208         const struct comm_addr *configured_addrs /* 0 if none or not found */,
2209         int n_configured_addrs /* 0 if none or not found */,
2210         const struct comm_addr *incoming_packet_addr /* 0 if none */) {
2211     if (!n_configured_addrs && !incoming_packet_addr &&
2212         !transport_peers_valid(&st->peers))
2213         return False;
2214
2215     slog(st,LOG_SETUP_INIT,
2216          "using: %d configured addr(s);%s %d old peer addrs(es)",
2217          n_configured_addrs,
2218          incoming_packet_addr ? " incoming packet address;" : "",
2219          st->peers.npeers);
2220
2221     /* Non-mobile peers try addresses until one is plausible.  The
2222      * effect is that this code always tries first the configured
2223      * address if supplied, or otherwise the address of the incoming
2224      * PROD, or finally the existing data peer if one exists; this is
2225      * as desired. */
2226
2227     transport_peers_copy(st,&st->setup_peers,&st->peers);
2228     transport_peers_expire(st,&st->setup_peers);
2229
2230     if (incoming_packet_addr)
2231         transport_record_peers(st,&st->setup_peers,
2232                                incoming_packet_addr,1, "incoming");
2233
2234     if (n_configured_addrs)
2235         transport_record_peers(st,&st->setup_peers,
2236                               configured_addrs,n_configured_addrs, "setupinit");
2237
2238     assert(transport_peers_valid(&st->setup_peers));
2239     return True;
2240 }
2241
2242 static void transport_setup_msgok(struct site *st, const struct comm_addr *a) {
2243     if (st->peer_mobile) {
2244         transport_peers_expire(st,&st->setup_peers);
2245         transport_record_peers(st,&st->setup_peers,a,1,"setupmsg");
2246     }
2247 }
2248 static void transport_data_msgok(struct site *st, const struct comm_addr *a) {
2249     if (st->peer_mobile) {
2250         transport_peers_expire(st,&st->setup_peers);
2251         transport_record_peers(st,&st->peers,a,1,"datamsg");
2252     }
2253 }
2254
2255 static int transport_peers_valid(transport_peers *peers) {
2256     return peers->npeers;
2257 }
2258 static void transport_peers_clear(struct site *st, transport_peers *peers) {
2259     peers->npeers= 0;
2260     transport_peers_debug(st,peers,"clear",0,0,0);
2261 }
2262 static void transport_peers_copy(struct site *st, transport_peers *dst,
2263                                  const transport_peers *src) {
2264     dst->npeers=src->npeers;
2265     COPY_ARRAY(dst->peers, src->peers, dst->npeers);
2266     transport_peers_debug(st,dst,"copy",
2267                           src->npeers, &src->peers->addr, sizeof(*src->peers));
2268 }
2269
2270 static void transport_resolve_complete(struct site *st,
2271                                        const struct comm_addr *addrs,
2272                                        int naddrs) {
2273     transport_peers_expire(st,&st->peers);
2274     transport_record_peers(st,&st->peers,addrs,naddrs,"resolved data");
2275     transport_peers_expire(st,&st->setup_peers);
2276     transport_record_peers(st,&st->setup_peers,addrs,naddrs,"resolved setup");
2277 }
2278
2279 static void transport_resolve_complete_tardy(struct site *st,
2280                                              const struct comm_addr *addrs,
2281                                              int naddrs) {
2282     transport_peers_expire(st,&st->peers);
2283     transport_record_peers(st,&st->peers,addrs,naddrs,"resolved tardily");
2284 }
2285
2286 static void transport_peers__copy_by_mask(transport_peer *out, int *nout_io,
2287                                           unsigned mask,
2288                                           const transport_peers *inp) {
2289     /* out and in->peers may be the same region, or nonoverlapping */
2290     const transport_peer *in=inp->peers;
2291     int slot;
2292     for (slot=0; slot<inp->npeers; slot++) {
2293         if (!(mask & (1U << slot)))
2294             continue;
2295         if (!(out==in && slot==*nout_io))
2296             COPY_OBJ(out[*nout_io], in[slot]);
2297         (*nout_io)++;
2298     }
2299 }
2300
2301 void transport_xmit(struct site *st, transport_peers *peers,
2302                     struct buffer_if *buf, bool_t candebug) {
2303     int slot;
2304     transport_peers_expire(st, peers);
2305     unsigned failed=0; /* bitmask */
2306     assert(MAX_PEER_ADDRS < sizeof(unsigned)*CHAR_BIT);
2307
2308     int nfailed=0;
2309     for (slot=0; slot<peers->npeers; slot++) {
2310         transport_peer *peer=&peers->peers[slot];
2311         if (candebug)
2312             dump_packet(st, buf, &peer->addr, False);
2313         bool_t ok =
2314             peer->addr.comm->sendmsg(peer->addr.comm->st, buf, &peer->addr);
2315         if (!ok) {
2316             failed |= 1U << slot;
2317             nfailed++;
2318         }
2319         if (ok && !st->peer_mobile)
2320             break;
2321     }
2322     /* Now we need to demote/delete failing addrs: if we are mobile we
2323      * merely demote them; otherwise we delete them. */
2324     if (st->local_mobile) {
2325         unsigned expected = ((1U << nfailed)-1) << (peers->npeers-nfailed);
2326         /* `expected' has all the failures at the end already */
2327         if (failed != expected) {
2328             int fslot=0;
2329             transport_peer failedpeers[nfailed];
2330             transport_peers__copy_by_mask(failedpeers, &fslot, failed,peers);
2331             assert(fslot == nfailed);
2332             int wslot=0;
2333             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2334             assert(wslot+nfailed == peers->npeers);
2335             COPY_ARRAY(peers->peers+wslot, failedpeers, nfailed);
2336         }
2337     } else {
2338         if (failed && peers->npeers > 1) {
2339             int wslot=0;
2340             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2341             peers->npeers=wslot;
2342         }
2343     }
2344 }
2345
2346 /***** END of transport peers declarations *****/