chiark / gitweb /
15dace88d3c74f0e22a35b891d91a061c311877e
[secnet.git] / site.c
1 /* site.c - manage communication with a remote network site */
2
3 /* The 'site' code doesn't know anything about the structure of the
4    packets it's transmitting.  In fact, under the new netlink
5    configuration scheme it doesn't need to know anything at all about
6    IP addresses, except how to contact its peer.  This means it could
7    potentially be used to tunnel other protocols too (IPv6, IPX, plain
8    old Ethernet frames) if appropriate netlink code can be written
9    (and that ought not to be too hard, eg. using the TUN/TAP device to
10    pretend to be an Ethernet interface).  */
11
12 /* At some point in the future the netlink code will be asked for
13    configuration information to go in the PING/PONG packets at the end
14    of the key exchange. */
15
16 #include "secnet.h"
17 #include <stdio.h>
18 #include <string.h>
19 #include <limits.h>
20 #include <assert.h>
21 #include <sys/socket.h>
22
23 #include <sys/mman.h>
24 #include "util.h"
25 #include "unaligned.h"
26 #include "magic.h"
27
28 #define SETUP_BUFFER_LEN 2048
29
30 #define DEFAULT_KEY_LIFETIME                  (3600*1000) /* [ms] */
31 #define DEFAULT_KEY_RENEGOTIATE_GAP           (5*60*1000) /* [ms] */
32 #define DEFAULT_SETUP_RETRIES 5
33 #define DEFAULT_SETUP_RETRY_INTERVAL             (2*1000) /* [ms] */
34 #define DEFAULT_WAIT_TIME                       (20*1000) /* [ms] */
35
36 #define DEFAULT_MOBILE_KEY_LIFETIME      (2*24*3600*1000) /* [ms] */
37 #define DEFAULT_MOBILE_KEY_RENEGOTIATE_GAP (12*3600*1000) /* [ms] */
38 #define DEFAULT_MOBILE_SETUP_RETRIES 30
39 #define DEFAULT_MOBILE_SETUP_RETRY_INTERVAL      (1*1000) /* [ms] */
40 #define DEFAULT_MOBILE_WAIT_TIME                (10*1000) /* [ms] */
41
42 #define DEFAULT_MOBILE_PEER_EXPIRY            (2*60)      /* [s] */
43
44 /* Each site can be in one of several possible states. */
45
46 /* States:
47    SITE_STOP         - nothing is allowed to happen; tunnel is down;
48                        all session keys have been erased
49      -> SITE_RUN upon external instruction
50    SITE_RUN          - site up, maybe with valid key
51      -> SITE_RESOLVE upon outgoing packet and no valid key
52          we start name resolution for the other end of the tunnel
53      -> SITE_SENTMSG2 upon valid incoming message 1 and suitable time
54          we send an appropriate message 2
55    SITE_RESOLVE      - waiting for name resolution
56      -> SITE_SENTMSG1 upon successful resolution
57          we send an appropriate message 1
58      -> SITE_SENTMSG2 upon valid incoming message 1 (then abort resolution)
59          we abort resolution and 
60      -> SITE_WAIT on timeout or resolution failure
61    SITE_SENTMSG1
62      -> SITE_SENTMSG2 upon valid incoming message 1 from higher priority end
63      -> SITE_SENTMSG3 upon valid incoming message 2
64      -> SITE_WAIT on timeout
65    SITE_SENTMSG2
66      -> SITE_SENTMSG4 upon valid incoming message 3
67      -> SITE_WAIT on timeout
68    SITE_SENTMSG3
69      -> SITE_SENTMSG5 upon valid incoming message 4
70      -> SITE_WAIT on timeout
71    SITE_SENTMSG4
72      -> SITE_RUN upon valid incoming message 5
73      -> SITE_WAIT on timeout
74    SITE_SENTMSG5
75      -> SITE_RUN upon valid incoming message 6
76      -> SITE_WAIT on timeout
77    SITE_WAIT         - failed to establish key; do nothing for a while
78      -> SITE_RUN on timeout
79    */
80
81 #define SITE_STOP     0
82 #define SITE_RUN      1
83 #define SITE_RESOLVE  2
84 #define SITE_SENTMSG1 3
85 #define SITE_SENTMSG2 4
86 #define SITE_SENTMSG3 5
87 #define SITE_SENTMSG4 6
88 #define SITE_SENTMSG5 7
89 #define SITE_WAIT     8
90
91 int32_t site_max_start_pad = 4*4;
92
93 static cstring_t state_name(uint32_t state)
94 {
95     switch (state) {
96     case 0: return "STOP";
97     case 1: return "RUN";
98     case 2: return "RESOLVE";
99     case 3: return "SENTMSG1";
100     case 4: return "SENTMSG2";
101     case 5: return "SENTMSG3";
102     case 6: return "SENTMSG4";
103     case 7: return "SENTMSG5";
104     case 8: return "WAIT";
105     default: return "*bad state*";
106     }
107 }
108
109 #define NONCELEN 8
110
111 #define LOG_UNEXPECTED    0x00000001
112 #define LOG_SETUP_INIT    0x00000002
113 #define LOG_SETUP_TIMEOUT 0x00000004
114 #define LOG_ACTIVATE_KEY  0x00000008
115 #define LOG_TIMEOUT_KEY   0x00000010
116 #define LOG_SEC           0x00000020
117 #define LOG_STATE         0x00000040
118 #define LOG_DROP          0x00000080
119 #define LOG_DUMP          0x00000100
120 #define LOG_ERROR         0x00000400
121 #define LOG_PEER_ADDRS    0x00000800
122
123 static struct flagstr log_event_table[]={
124     { "unexpected", LOG_UNEXPECTED },
125     { "setup-init", LOG_SETUP_INIT },
126     { "setup-timeout", LOG_SETUP_TIMEOUT },
127     { "activate-key", LOG_ACTIVATE_KEY },
128     { "timeout-key", LOG_TIMEOUT_KEY },
129     { "security", LOG_SEC },
130     { "state-change", LOG_STATE },
131     { "packet-drop", LOG_DROP },
132     { "dump-packets", LOG_DUMP },
133     { "errors", LOG_ERROR },
134     { "peer-addrs", LOG_PEER_ADDRS },
135     { "default", LOG_SETUP_INIT|LOG_SETUP_TIMEOUT|
136       LOG_ACTIVATE_KEY|LOG_TIMEOUT_KEY|LOG_SEC|LOG_ERROR },
137     { "all", 0xffffffff },
138     { NULL, 0 }
139 };
140
141
142 /***** TRANSPORT PEERS declarations *****/
143
144 /* Details of "mobile peer" semantics:
145
146    - We use the same data structure for the different configurations,
147      but manage it with different algorithms.
148    
149    - We record up to mobile_peers_max peer address/port numbers
150      ("peers") for key setup, and separately up to mobile_peers_max
151      for data transfer.
152
153    - In general, we make a new set of addrs (see below) when we start
154      a new key exchange; the key setup addrs become the data transport
155      addrs when key setup complets.
156
157    If our peer is mobile:
158
159    - We send to all recent addresses of incoming packets, plus
160      initially all configured addresses (which we also expire).
161
162    - So, we record addrs of good incoming packets, as follows:
163       1. expire any peers last seen >120s ("mobile-peer-expiry") ago
164       2. add the peer of the just received packet to the applicable list
165          (possibly evicting the oldest entries to make room)
166      NB that we do not expire peers until an incoming packet arrives.
167
168    - If the peer has a configured address or name, we record them the
169      same way, but only as a result of our own initiation of key
170      setup.  (We might evict some incoming packet addrs to make room.)
171
172    - The default number of addrs to keep is 3, or 4 if we have a
173      configured name or address.  That's space for two configured
174      addresses (one IPv6 and one IPv4), plus two received addresses.
175
176    - Outgoing packets are sent to every recorded address in the
177      applicable list.  Any unsupported[1] addresses are deleted from
178      the list right away.  (This should only happen to configured
179      addresses, of course, but there is no need to check that.)
180
181    - When we successfully complete a key setup, we merge the key setup
182      peers into the data transfer peers.
183
184    [1] An unsupported address is one for whose AF we don't have a
185      socket (perhaps because we got EAFNOSUPPORT or some such) or for
186      which sendto gives ENETUNREACH.
187
188    If neither end is mobile:
189
190    - When peer initiated the key exchange, we use the incoming packet
191      address.
192
193    - When we initiate the key exchange, we try configured addresses
194      until we get one which isn't unsupported then fixate on that.
195
196    - When we complete a key setup, we replace the data transport peers
197      with those from the key setup.
198
199    If we are mobile:
200
201    - We can't tell when local network setup changes so we can't cache
202      the unsupported addrs and completely remove the spurious calls to
203      sendto, but we can optimise things a bit by deprioritising addrs
204      which seem to be unsupported.
205
206    - Use only configured addresses.  (Except, that if our peer
207      initiated a key exchange we use the incoming packet address until
208      our name resolution completes.)
209
210    - When we send a packet, try each address in turn; if addr
211      supported, put that address to the end of the list for future
212      packets, and go onto the next address.
213
214    - When we complete a key setup, we replace the data transport peers
215      with those from the key setup.
216
217    */
218
219 typedef struct {
220     struct timeval last;
221     struct comm_addr addr;
222 } transport_peer;
223
224 typedef struct {
225 /* configuration information */
226 /* runtime information */
227     int npeers;
228     transport_peer peers[MAX_PEER_ADDRS];
229 } transport_peers;
230
231 /* Basic operations on transport peer address sets */
232 static void transport_peers_clear(struct site *st, transport_peers *peers);
233 static int transport_peers_valid(transport_peers *peers);
234 static void transport_peers_copy(struct site *st, transport_peers *dst,
235                                  const transport_peers *src);
236
237 /* Record address of incoming setup packet; resp. data packet. */
238 static void transport_setup_msgok(struct site *st, const struct comm_addr *a);
239 static void transport_data_msgok(struct site *st, const struct comm_addr *a);
240
241 /* Initialise the setup addresses.  Called before we send the first
242  * packet in a key exchange.  If we are the initiator, as a result of
243  * resolve completing (or being determined not to be relevant) or an
244  * incoming PROD; if we are the responder, as a result of the MSG1. */
245 static bool_t transport_compute_setupinit_peers(struct site *st,
246         const struct comm_addr *configured_addrs /* 0 if none or not found */,
247         int n_configured_addrs /* 0 if none or not found */,
248         const struct comm_addr *incoming_packet_addr /* 0 if none */);
249
250 /* Called if we are the responder in a key setup, when the resolve
251  * completes.  transport_compute_setupinit_peers will hvae been called
252  * earlier.  If _complete is called, we are still doing the key setup
253  * (and we should use the new values for both the rest of the key
254  * setup and the ongoing data exchange); if _tardy is called, the key
255  * setup is done (either completed or not) and only the data peers are
256  * relevant */
257 static void transport_resolve_complete(struct site *st,
258         const struct comm_addr *addrs, int naddrs);
259 static void transport_resolve_complete_tardy(struct site *st,
260         const struct comm_addr *addrs, int naddrs);
261
262 static void transport_xmit(struct site *st, transport_peers *peers,
263                            struct buffer_if *buf, bool_t candebug);
264
265  /***** END of transport peers declarations *****/
266
267
268 struct data_key {
269     struct transform_inst_if *transform;
270     uint64_t key_timeout; /* End of life of current key */
271     uint32_t remote_session_id;
272 };
273
274 struct site {
275     closure_t cl;
276     struct site_if ops;
277 /* configuration information */
278     string_t localname;
279     string_t remotename;
280     bool_t local_mobile, peer_mobile; /* Mobile client support */
281     int32_t transport_peers_max;
282     string_t tunname; /* localname<->remotename by default, used in logs */
283     string_t address; /* DNS name for bootstrapping, optional */
284     int remoteport; /* Port for bootstrapping, optional */
285     uint32_t mtu_target;
286     struct netlink_if *netlink;
287     struct comm_if **comms;
288     int ncomms;
289     struct resolver_if *resolver;
290     struct log_if *log;
291     struct random_if *random;
292     struct rsaprivkey_if *privkey;
293     struct rsapubkey_if *pubkey;
294     struct transform_if **transforms;
295     int ntransforms;
296     struct dh_if *dh;
297     struct hash_if *hash;
298
299     uint32_t index; /* Index of this site */
300     uint32_t local_capabilities;
301     int32_t setup_retries; /* How many times to send setup packets */
302     int32_t setup_retry_interval; /* Initial timeout for setup packets */
303     int32_t wait_timeout; /* How long to wait if setup unsuccessful */
304     int32_t mobile_peer_expiry; /* How long to remember 2ary addresses */
305     int32_t key_lifetime; /* How long a key lasts once set up */
306     int32_t key_renegotiate_time; /* If we see traffic (or a keepalive)
307                                       after this time, initiate a new
308                                       key exchange */
309
310     bool_t setup_priority; /* Do we have precedence if both sites emit
311                               message 1 simultaneously? */
312     uint32_t log_events;
313
314 /* runtime information */
315     uint32_t state;
316     uint64_t now; /* Most recently seen time */
317     bool_t allow_send_prod;
318     bool_t resolving;
319
320     /* The currently established session */
321     struct data_key current;
322     struct data_key auxiliary_key;
323     bool_t auxiliary_is_new;
324     uint64_t renegotiate_key_time; /* When we can negotiate a new key */
325     uint64_t auxiliary_renegotiate_key_time;
326     transport_peers peers; /* Current address(es) of peer for data traffic */
327
328     /* The current key setup protocol exchange.  We can only be
329        involved in one of these at a time.  There's a potential for
330        denial of service here (the attacker keeps sending a setup
331        packet; we keep trying to continue the exchange, and have to
332        timeout before we can listen for another setup packet); perhaps
333        we should keep a list of 'bad' sources for setup packets. */
334     uint32_t remote_capabilities;
335     uint16_t remote_adv_mtu;
336     struct transform_if *chosen_transform;
337     uint32_t setup_session_id;
338     transport_peers setup_peers;
339     uint8_t localN[NONCELEN]; /* Nonces for key exchange */
340     uint8_t remoteN[NONCELEN];
341     struct buffer_if buffer; /* Current outgoing key exchange packet */
342     struct buffer_if scratch;
343     int32_t retries; /* Number of retries remaining */
344     uint64_t timeout; /* Timeout for current state */
345     uint8_t *dhsecret;
346     uint8_t *sharedsecret;
347     uint32_t sharedsecretlen, sharedsecretallocd;
348     struct transform_inst_if *new_transform; /* For key setup/verify */
349 };
350
351 static uint32_t event_log_priority(struct site *st, uint32_t event)
352 {
353     if (!(event&st->log_events))
354         return 0;
355     switch(event) {
356     case LOG_UNEXPECTED:    return M_INFO;
357     case LOG_SETUP_INIT:    return M_INFO;
358     case LOG_SETUP_TIMEOUT: return M_NOTICE;
359     case LOG_ACTIVATE_KEY:  return M_INFO;
360     case LOG_TIMEOUT_KEY:   return M_INFO;
361     case LOG_SEC:           return M_SECURITY;
362     case LOG_STATE:         return M_DEBUG;
363     case LOG_DROP:          return M_DEBUG;
364     case LOG_DUMP:          return M_DEBUG;
365     case LOG_ERROR:         return M_ERR;
366     case LOG_PEER_ADDRS:    return M_DEBUG;
367     default:                return M_ERR;
368     }
369 }
370
371 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
372 FORMAT(printf,3,0);
373 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
374 {
375     uint32_t class;
376
377     class=event_log_priority(st, event);
378     if (class) {
379         slilog_part(st->log,class,"%s: ",st->tunname);
380         vslilog_part(st->log,class,msg,ap);
381         slilog_part(st->log,class,"\n");
382     }
383 }
384
385 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
386 FORMAT(printf,3,4);
387 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
388 {
389     va_list ap;
390     va_start(ap,msg);
391     vslog(st,event,msg,ap);
392     va_end(ap);
393 }
394
395 static void logtimeout(struct site *st, const char *fmt, ...)
396 FORMAT(printf,2,3);
397 static void logtimeout(struct site *st, const char *fmt, ...)
398 {
399     uint32_t class=event_log_priority(st,LOG_SETUP_TIMEOUT);
400     if (!class)
401         return;
402
403     va_list ap;
404     va_start(ap,fmt);
405
406     slilog_part(st->log,class,"%s: ",st->tunname);
407     vslilog_part(st->log,class,fmt,ap);
408
409     const char *delim;
410     int i;
411     for (i=0, delim=" (tried ";
412          i<st->setup_peers.npeers;
413          i++, delim=", ") {
414         transport_peer *peer=&st->setup_peers.peers[i];
415         const char *s=comm_addr_to_string(&peer->addr);
416         slilog_part(st->log,class,"%s%s",delim,s);
417     }
418
419     slilog_part(st->log,class,")\n");
420     va_end(ap);
421 }
422
423 static void set_link_quality(struct site *st);
424 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel);
425 static void delete_one_key(struct site *st, struct data_key *key,
426                            const char *reason /* may be 0 meaning don't log*/,
427                            const char *which /* ignored if !reasonn */,
428                            uint32_t loglevel /* ignored if !reasonn */);
429 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
430                                  const struct comm_addr *prod_hint);
431 static void enter_state_run(struct site *st);
432 static bool_t enter_state_resolve(struct site *st);
433 static bool_t enter_new_state(struct site *st,uint32_t next);
434 static void enter_state_wait(struct site *st);
435 static void activate_new_key(struct site *st);
436
437 static bool_t is_transform_valid(struct transform_inst_if *transform)
438 {
439     return transform && transform->valid(transform->st);
440 }
441
442 static bool_t current_valid(struct site *st)
443 {
444     return is_transform_valid(st->current.transform);
445 }
446
447 #define DEFINE_CALL_TRANSFORM(fwdrev)                                   \
448 static int call_transform_##fwdrev(struct site *st,                     \
449                                    struct transform_inst_if *transform, \
450                                    struct buffer_if *buf,               \
451                                    const char **errmsg)                 \
452 {                                                                       \
453     if (!is_transform_valid(transform)) {                               \
454         *errmsg="transform not set up";                                 \
455         return 1;                                                       \
456     }                                                                   \
457     return transform->fwdrev(transform->st,buf,errmsg);                 \
458 }
459
460 DEFINE_CALL_TRANSFORM(forwards)
461 DEFINE_CALL_TRANSFORM(reverse)
462
463 static void dispose_transform(struct transform_inst_if **transform_var)
464 {
465     struct transform_inst_if *transform=*transform_var;
466     if (transform) {
467         transform->delkey(transform->st);
468         transform->destroy(transform->st);
469     }
470     *transform_var = 0;
471 }    
472
473 #define CHECK_AVAIL(b,l) do { if ((b)->size<(l)) return False; } while(0)
474 #define CHECK_EMPTY(b) do { if ((b)->size!=0) return False; } while(0)
475 #define CHECK_TYPE(b,t) do { uint32_t type; \
476     CHECK_AVAIL((b),4); \
477     type=buf_unprepend_uint32((b)); \
478     if (type!=(t)) return False; } while(0)
479
480 static _Bool type_is_msg34(uint32_t type)
481 {
482     return
483         type == LABEL_MSG3 ||
484         type == LABEL_MSG3BIS ||
485         type == LABEL_MSG4;
486 }
487
488 struct parsedname {
489     int32_t len;
490     uint8_t *name;
491     struct buffer_if extrainfo;
492 };
493
494 struct msg {
495     uint8_t *hashstart;
496     uint32_t dest;
497     uint32_t source;
498     struct parsedname remote;
499     struct parsedname local;
500     uint32_t remote_capabilities;
501     uint16_t remote_mtu;
502     int capab_transformnum;
503     uint8_t *nR;
504     uint8_t *nL;
505     int32_t pklen;
506     char *pk;
507     int32_t hashlen;
508     int32_t siglen;
509     char *sig;
510 };
511
512 static void set_new_transform(struct site *st, char *pk)
513 {
514     /* Make room for the shared key */
515     st->sharedsecretlen=st->chosen_transform->keylen?:st->dh->ceil_len;
516     assert(st->sharedsecretlen);
517     if (st->sharedsecretlen > st->sharedsecretallocd) {
518         st->sharedsecretallocd=st->sharedsecretlen;
519         st->sharedsecret=realloc(st->sharedsecret,st->sharedsecretallocd);
520     }
521     if (!st->sharedsecret) fatal_perror("site:sharedsecret");
522
523     /* Generate the shared key */
524     st->dh->makeshared(st->dh->st,st->dhsecret,st->dh->len,pk,
525                        st->sharedsecret,st->sharedsecretlen);
526
527     /* Set up the transform */
528     struct transform_if *generator=st->chosen_transform;
529     struct transform_inst_if *generated=generator->create(generator->st);
530     generated->setkey(generated->st,st->sharedsecret,
531                       st->sharedsecretlen,st->setup_priority);
532     dispose_transform(&st->new_transform);
533     st->new_transform=generated;
534
535     slog(st,LOG_SETUP_INIT,"key exchange negotiated transform"
536          " %d (capabilities ours=%#"PRIx32" theirs=%#"PRIx32")",
537          st->chosen_transform->capab_transformnum,
538          st->local_capabilities, st->remote_capabilities);
539 }
540
541 struct xinfoadd {
542     int32_t lenpos, afternul;
543 };
544 static void append_string_xinfo_start(struct buffer_if *buf,
545                                       struct xinfoadd *xia,
546                                       const char *str)
547     /* Helps construct one of the names with additional info as found
548      * in MSG1..4.  Call this function first, then append all the
549      * desired extra info (not including the nul byte) to the buffer,
550      * then call append_string_xinfo_done. */
551 {
552     xia->lenpos = buf->size;
553     buf_append_string(buf,str);
554     buf_append_uint8(buf,0);
555     xia->afternul = buf->size;
556 }
557 static void append_string_xinfo_done(struct buffer_if *buf,
558                                      struct xinfoadd *xia)
559 {
560     /* we just need to adjust the string length */
561     if (buf->size == xia->afternul) {
562         /* no extra info, strip the nul too */
563         buf_unappend_uint8(buf);
564     } else {
565         put_uint16(buf->start+xia->lenpos, buf->size-(xia->lenpos+2));
566     }
567 }
568
569 /* Build any of msg1 to msg4. msg5 and msg6 are built from the inside
570    out using a transform of config data supplied by netlink */
571 static bool_t generate_msg(struct site *st, uint32_t type, cstring_t what)
572 {
573     void *hst;
574     uint8_t *hash;
575     string_t dhpub, sig;
576
577     st->retries=st->setup_retries;
578     BUF_ALLOC(&st->buffer,what);
579     buffer_init(&st->buffer,0);
580     buf_append_uint32(&st->buffer,
581         (type==LABEL_MSG1?0:st->setup_session_id));
582     buf_append_uint32(&st->buffer,st->index);
583     buf_append_uint32(&st->buffer,type);
584
585     struct xinfoadd xia;
586     append_string_xinfo_start(&st->buffer,&xia,st->localname);
587     if ((st->local_capabilities & CAPAB_EARLY) || (type != LABEL_MSG1)) {
588         buf_append_uint32(&st->buffer,st->local_capabilities);
589     }
590     if (type_is_msg34(type)) {
591         buf_append_uint16(&st->buffer,st->mtu_target);
592     }
593     append_string_xinfo_done(&st->buffer,&xia);
594
595     buf_append_string(&st->buffer,st->remotename);
596     BUF_ADD_OBJ(append,&st->buffer,st->localN);
597     if (type==LABEL_MSG1) return True;
598     BUF_ADD_OBJ(append,&st->buffer,st->remoteN);
599     if (type==LABEL_MSG2) return True;
600
601     if (hacky_par_mid_failnow()) return False;
602
603     if (type==LABEL_MSG3BIS)
604         buf_append_uint8(&st->buffer,st->chosen_transform->capab_transformnum);
605
606     dhpub=st->dh->makepublic(st->dh->st,st->dhsecret,st->dh->len);
607     buf_append_string(&st->buffer,dhpub);
608     free(dhpub);
609     hash=safe_malloc(st->hash->len, "generate_msg");
610     hst=st->hash->init();
611     st->hash->update(hst,st->buffer.start,st->buffer.size);
612     st->hash->final(hst,hash);
613     sig=st->privkey->sign(st->privkey->st,hash,st->hash->len);
614     buf_append_string(&st->buffer,sig);
615     free(sig);
616     free(hash);
617     return True;
618 }
619
620 static bool_t unpick_name(struct buffer_if *msg, struct parsedname *nm)
621 {
622     CHECK_AVAIL(msg,2);
623     nm->len=buf_unprepend_uint16(msg);
624     CHECK_AVAIL(msg,nm->len);
625     nm->name=buf_unprepend(msg,nm->len);
626     uint8_t *nul=memchr(nm->name,0,nm->len);
627     if (!nul) {
628         buffer_readonly_view(&nm->extrainfo,0,0);
629     } else {
630         buffer_readonly_view(&nm->extrainfo, nul+1, msg->start-(nul+1));
631         nm->len=nul-nm->name;
632     }
633     return True;
634 }
635
636 static bool_t unpick_msg(struct site *st, uint32_t type,
637                          struct buffer_if *msg, struct msg *m)
638 {
639     m->capab_transformnum=-1;
640     m->hashstart=msg->start;
641     CHECK_AVAIL(msg,4);
642     m->dest=buf_unprepend_uint32(msg);
643     CHECK_AVAIL(msg,4);
644     m->source=buf_unprepend_uint32(msg);
645     CHECK_TYPE(msg,type);
646     if (!unpick_name(msg,&m->remote)) return False;
647     m->remote_capabilities=0;
648     m->remote_mtu=0;
649     if (m->remote.extrainfo.size) {
650         CHECK_AVAIL(&m->remote.extrainfo,4);
651         m->remote_capabilities=buf_unprepend_uint32(&m->remote.extrainfo);
652     }
653     if (type_is_msg34(type) && m->remote.extrainfo.size) {
654         CHECK_AVAIL(&m->remote.extrainfo,2);
655         m->remote_mtu=buf_unprepend_uint16(&m->remote.extrainfo);
656     }
657     if (!unpick_name(msg,&m->local)) return False;
658     if (type==LABEL_PROD) {
659         CHECK_EMPTY(msg);
660         return True;
661     }
662     CHECK_AVAIL(msg,NONCELEN);
663     m->nR=buf_unprepend(msg,NONCELEN);
664     if (type==LABEL_MSG1) {
665         CHECK_EMPTY(msg);
666         return True;
667     }
668     CHECK_AVAIL(msg,NONCELEN);
669     m->nL=buf_unprepend(msg,NONCELEN);
670     if (type==LABEL_MSG2) {
671         CHECK_EMPTY(msg);
672         return True;
673     }
674     if (type==LABEL_MSG3BIS) {
675         CHECK_AVAIL(msg,1);
676         m->capab_transformnum = buf_unprepend_uint8(msg);
677     } else {
678         m->capab_transformnum = CAPAB_TRANSFORMNUM_ANCIENT;
679     }
680     CHECK_AVAIL(msg,2);
681     m->pklen=buf_unprepend_uint16(msg);
682     CHECK_AVAIL(msg,m->pklen);
683     m->pk=buf_unprepend(msg,m->pklen);
684     m->hashlen=msg->start-m->hashstart;
685     CHECK_AVAIL(msg,2);
686     m->siglen=buf_unprepend_uint16(msg);
687     CHECK_AVAIL(msg,m->siglen);
688     m->sig=buf_unprepend(msg,m->siglen);
689     CHECK_EMPTY(msg);
690     return True;
691 }
692
693 static bool_t name_matches(const struct parsedname *nm, const char *expected)
694 {
695     int expected_len=strlen(expected);
696     return
697         nm->len == expected_len &&
698         !memcmp(nm->name, expected, expected_len);
699 }    
700
701 static bool_t check_msg(struct site *st, uint32_t type, struct msg *m,
702                         cstring_t *error)
703 {
704     if (type==LABEL_MSG1) return True;
705
706     /* Check that the site names and our nonce have been sent
707        back correctly, and then store our peer's nonce. */ 
708     if (!name_matches(&m->remote,st->remotename)) {
709         *error="wrong remote site name";
710         return False;
711     }
712     if (!name_matches(&m->local,st->localname)) {
713         *error="wrong local site name";
714         return False;
715     }
716     if (memcmp(m->nL,st->localN,NONCELEN)!=0) {
717         *error="wrong locally-generated nonce";
718         return False;
719     }
720     if (type==LABEL_MSG2) return True;
721     if (!consttime_memeq(m->nR,st->remoteN,NONCELEN)!=0) {
722         *error="wrong remotely-generated nonce";
723         return False;
724     }
725     /* MSG3 has complicated rules about capabilities, which are
726      * handled in process_msg3. */
727     if (type==LABEL_MSG3 || type==LABEL_MSG3BIS) return True;
728     if (m->remote_capabilities!=st->remote_capabilities) {
729         *error="remote capabilities changed";
730         return False;
731     }
732     if (type==LABEL_MSG4) return True;
733     *error="unknown message type";
734     return False;
735 }
736
737 static bool_t generate_msg1(struct site *st)
738 {
739     st->random->generate(st->random->st,NONCELEN,st->localN);
740     return generate_msg(st,LABEL_MSG1,"site:MSG1");
741 }
742
743 static bool_t process_msg1(struct site *st, struct buffer_if *msg1,
744                            const struct comm_addr *src, struct msg *m)
745 {
746     /* We've already determined we're in an appropriate state to
747        process an incoming MSG1, and that the MSG1 has correct values
748        of A and B. */
749
750     st->setup_session_id=m->source;
751     st->remote_capabilities=m->remote_capabilities;
752     memcpy(st->remoteN,m->nR,NONCELEN);
753     return True;
754 }
755
756 static bool_t generate_msg2(struct site *st)
757 {
758     st->random->generate(st->random->st,NONCELEN,st->localN);
759     return generate_msg(st,LABEL_MSG2,"site:MSG2");
760 }
761
762 static bool_t process_msg2(struct site *st, struct buffer_if *msg2,
763                            const struct comm_addr *src)
764 {
765     struct msg m;
766     cstring_t err;
767
768     if (!unpick_msg(st,LABEL_MSG2,msg2,&m)) return False;
769     if (!check_msg(st,LABEL_MSG2,&m,&err)) {
770         slog(st,LOG_SEC,"msg2: %s",err);
771         return False;
772     }
773     st->setup_session_id=m.source;
774     st->remote_capabilities=m.remote_capabilities;
775
776     /* Select the transform to use */
777
778     uint32_t remote_transforms = st->remote_capabilities & CAPAB_TRANSFORM_MASK;
779     if (!remote_transforms)
780         /* old secnets only had this one transform */
781         remote_transforms = 1UL << CAPAB_TRANSFORMNUM_ANCIENT;
782
783     struct transform_if *ti;
784     int i;
785     for (i=0; i<st->ntransforms; i++) {
786         ti=st->transforms[i];
787         if ((1UL << ti->capab_transformnum) & remote_transforms)
788             goto transform_found;
789     }
790     slog(st,LOG_ERROR,"no transforms in common"
791          " (us %#"PRIx32"; them: %#"PRIx32")",
792          st->local_capabilities & CAPAB_TRANSFORM_MASK,
793          remote_transforms);
794     return False;
795  transform_found:
796     st->chosen_transform=ti;
797
798     memcpy(st->remoteN,m.nR,NONCELEN);
799     return True;
800 }
801
802 static bool_t generate_msg3(struct site *st)
803 {
804     /* Now we have our nonce and their nonce. Think of a secret key,
805        and create message number 3. */
806     st->random->generate(st->random->st,st->dh->len,st->dhsecret);
807     return generate_msg(st,
808                         (st->remote_capabilities & CAPAB_TRANSFORM_MASK
809                          ? LABEL_MSG3BIS : LABEL_MSG3),
810                         "site:MSG3");
811 }
812
813 static bool_t process_msg3_msg4(struct site *st, struct msg *m)
814 {
815     uint8_t *hash;
816     void *hst;
817
818     /* Check signature and store g^x mod m */
819     hash=safe_malloc(st->hash->len, "process_msg3_msg4");
820     hst=st->hash->init();
821     st->hash->update(hst,m->hashstart,m->hashlen);
822     st->hash->final(hst,hash);
823     /* Terminate signature with a '0' - cheating, but should be ok */
824     m->sig[m->siglen]=0;
825     if (!st->pubkey->check(st->pubkey->st,hash,st->hash->len,m->sig)) {
826         slog(st,LOG_SEC,"msg3/msg4 signature failed check!");
827         free(hash);
828         return False;
829     }
830     free(hash);
831
832     st->remote_adv_mtu=m->remote_mtu;
833
834     return True;
835 }
836
837 static bool_t process_msg3(struct site *st, struct buffer_if *msg3,
838                            const struct comm_addr *src, uint32_t msgtype)
839 {
840     struct msg m;
841     cstring_t err;
842
843     assert(msgtype==LABEL_MSG3 || msgtype==LABEL_MSG3BIS);
844
845     if (!unpick_msg(st,msgtype,msg3,&m)) return False;
846     if (!check_msg(st,msgtype,&m,&err)) {
847         slog(st,LOG_SEC,"msg3: %s",err);
848         return False;
849     }
850     uint32_t capab_adv_late = m.remote_capabilities
851         & ~st->remote_capabilities & CAPAB_EARLY;
852     if (capab_adv_late) {
853         slog(st,LOG_SEC,"msg3 impermissibly adds early capability flag(s)"
854              " %#"PRIx32" (was %#"PRIx32", now %#"PRIx32")",
855              capab_adv_late, st->remote_capabilities, m.remote_capabilities);
856         return False;
857     }
858     st->remote_capabilities|=m.remote_capabilities;
859
860     struct transform_if *ti;
861     int i;
862     for (i=0; i<st->ntransforms; i++) {
863         ti=st->transforms[i];
864         if (ti->capab_transformnum == m.capab_transformnum)
865             goto transform_found;
866     }
867     slog(st,LOG_SEC,"peer chose unknown-to-us transform %d!",
868          m.capab_transformnum);
869     return False;
870  transform_found:
871     st->chosen_transform=ti;
872
873     if (!process_msg3_msg4(st,&m))
874         return False;
875
876     /* Terminate their DH public key with a '0' */
877     m.pk[m.pklen]=0;
878     /* Invent our DH secret key */
879     st->random->generate(st->random->st,st->dh->len,st->dhsecret);
880
881     /* Generate the shared key and set up the transform */
882     set_new_transform(st,m.pk);
883
884     return True;
885 }
886
887 static bool_t generate_msg4(struct site *st)
888 {
889     /* We have both nonces, their public key and our private key. Generate
890        our public key, sign it and send it to them. */
891     return generate_msg(st,LABEL_MSG4,"site:MSG4");
892 }
893
894 static bool_t process_msg4(struct site *st, struct buffer_if *msg4,
895                            const struct comm_addr *src)
896 {
897     struct msg m;
898     cstring_t err;
899
900     if (!unpick_msg(st,LABEL_MSG4,msg4,&m)) return False;
901     if (!check_msg(st,LABEL_MSG4,&m,&err)) {
902         slog(st,LOG_SEC,"msg4: %s",err);
903         return False;
904     }
905     
906     if (!process_msg3_msg4(st,&m))
907         return False;
908
909     /* Terminate their DH public key with a '0' */
910     m.pk[m.pklen]=0;
911
912     /* Generate the shared key and set up the transform */
913     set_new_transform(st,m.pk);
914
915     return True;
916 }
917
918 struct msg0 {
919     uint32_t dest;
920     uint32_t source;
921     uint32_t type;
922 };
923
924 static bool_t unpick_msg0(struct site *st, struct buffer_if *msg0,
925                           struct msg0 *m)
926 {
927     CHECK_AVAIL(msg0,4);
928     m->dest=buf_unprepend_uint32(msg0);
929     CHECK_AVAIL(msg0,4);
930     m->source=buf_unprepend_uint32(msg0);
931     CHECK_AVAIL(msg0,4);
932     m->type=buf_unprepend_uint32(msg0);
933     return True;
934     /* Leaves transformed part of buffer untouched */
935 }
936
937 static bool_t generate_msg5(struct site *st)
938 {
939     cstring_t transform_err;
940
941     BUF_ALLOC(&st->buffer,"site:MSG5");
942     /* We are going to add four words to the message */
943     buffer_init(&st->buffer,calculate_max_start_pad());
944     /* Give the netlink code an opportunity to put its own stuff in the
945        message (configuration information, etc.) */
946     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
947     if (call_transform_forwards(st,st->new_transform,
948                                 &st->buffer,&transform_err))
949         return False;
950     buf_prepend_uint32(&st->buffer,LABEL_MSG5);
951     buf_prepend_uint32(&st->buffer,st->index);
952     buf_prepend_uint32(&st->buffer,st->setup_session_id);
953
954     st->retries=st->setup_retries;
955     return True;
956 }
957
958 static bool_t process_msg5(struct site *st, struct buffer_if *msg5,
959                            const struct comm_addr *src,
960                            struct transform_inst_if *transform)
961 {
962     struct msg0 m;
963     cstring_t transform_err;
964
965     if (!unpick_msg0(st,msg5,&m)) return False;
966
967     if (call_transform_reverse(st,transform,msg5,&transform_err)) {
968         /* There's a problem */
969         slog(st,LOG_SEC,"process_msg5: transform: %s",transform_err);
970         return False;
971     }
972     /* Buffer should now contain untransformed PING packet data */
973     CHECK_AVAIL(msg5,4);
974     if (buf_unprepend_uint32(msg5)!=LABEL_MSG5) {
975         slog(st,LOG_SEC,"MSG5/PING packet contained wrong label");
976         return False;
977     }
978     /* Older versions of secnet used to write some config data here
979      * which we ignore.  So we don't CHECK_EMPTY */
980     return True;
981 }
982
983 static void create_msg6(struct site *st, struct transform_inst_if *transform,
984                         uint32_t session_id)
985 {
986     cstring_t transform_err;
987
988     BUF_ALLOC(&st->buffer,"site:MSG6");
989     /* We are going to add four words to the message */
990     buffer_init(&st->buffer,calculate_max_start_pad());
991     /* Give the netlink code an opportunity to put its own stuff in the
992        message (configuration information, etc.) */
993     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
994     int problem = call_transform_forwards(st,transform,
995                                           &st->buffer,&transform_err);
996     assert(!problem);
997     buf_prepend_uint32(&st->buffer,LABEL_MSG6);
998     buf_prepend_uint32(&st->buffer,st->index);
999     buf_prepend_uint32(&st->buffer,session_id);
1000 }
1001
1002 static bool_t generate_msg6(struct site *st)
1003 {
1004     if (!is_transform_valid(st->new_transform))
1005         return False;
1006     create_msg6(st,st->new_transform,st->setup_session_id);
1007     st->retries=1; /* Peer will retransmit MSG5 if this packet gets lost */
1008     return True;
1009 }
1010
1011 static bool_t process_msg6(struct site *st, struct buffer_if *msg6,
1012                            const struct comm_addr *src)
1013 {
1014     struct msg0 m;
1015     cstring_t transform_err;
1016
1017     if (!unpick_msg0(st,msg6,&m)) return False;
1018
1019     if (call_transform_reverse(st,st->new_transform,msg6,&transform_err)) {
1020         /* There's a problem */
1021         slog(st,LOG_SEC,"process_msg6: transform: %s",transform_err);
1022         return False;
1023     }
1024     /* Buffer should now contain untransformed PING packet data */
1025     CHECK_AVAIL(msg6,4);
1026     if (buf_unprepend_uint32(msg6)!=LABEL_MSG6) {
1027         slog(st,LOG_SEC,"MSG6/PONG packet contained invalid data");
1028         return False;
1029     }
1030     /* Older versions of secnet used to write some config data here
1031      * which we ignore.  So we don't CHECK_EMPTY */
1032     return True;
1033 }
1034
1035 static bool_t decrypt_msg0(struct site *st, struct buffer_if *msg0,
1036                            const struct comm_addr *src)
1037 {
1038     cstring_t transform_err, auxkey_err, newkey_err="n/a";
1039     struct msg0 m;
1040     uint32_t problem;
1041
1042     if (!unpick_msg0(st,msg0,&m)) return False;
1043
1044     /* Keep a copy so we can try decrypting it with multiple keys */
1045     buffer_copy(&st->scratch, msg0);
1046
1047     problem = call_transform_reverse(st,st->current.transform,
1048                                      msg0,&transform_err);
1049     if (!problem) {
1050         if (!st->auxiliary_is_new)
1051             delete_one_key(st,&st->auxiliary_key,
1052                            "peer has used new key","auxiliary key",LOG_SEC);
1053         return True;
1054     }
1055     if (problem==2)
1056         goto skew;
1057
1058     buffer_copy(msg0, &st->scratch);
1059     problem = call_transform_reverse(st,st->auxiliary_key.transform,
1060                                      msg0,&auxkey_err);
1061     if (problem==0) {
1062         slog(st,LOG_DROP,"processing packet which uses auxiliary key");
1063         if (st->auxiliary_is_new) {
1064             /* We previously timed out in state SENTMSG5 but it turns
1065              * out that our peer did in fact get our MSG5 and is
1066              * using the new key.  So we should switch to it too. */
1067             /* This is a bit like activate_new_key. */
1068             struct data_key t;
1069             t=st->current;
1070             st->current=st->auxiliary_key;
1071             st->auxiliary_key=t;
1072
1073             delete_one_key(st,&st->auxiliary_key,"peer has used new key",
1074                            "previous key",LOG_SEC);
1075             st->auxiliary_is_new=0;
1076             st->renegotiate_key_time=st->auxiliary_renegotiate_key_time;
1077         }
1078         return True;
1079     }
1080     if (problem==2)
1081         goto skew;
1082
1083     if (st->state==SITE_SENTMSG5) {
1084         buffer_copy(msg0, &st->scratch);
1085         problem = call_transform_reverse(st,st->new_transform,
1086                                          msg0,&newkey_err);
1087         if (!problem) {
1088             /* It looks like we didn't get the peer's MSG6 */
1089             /* This is like a cut-down enter_new_state(SITE_RUN) */
1090             slog(st,LOG_STATE,"will enter state RUN (MSG0 with new key)");
1091             BUF_FREE(&st->buffer);
1092             st->timeout=0;
1093             activate_new_key(st);
1094             return True; /* do process the data in this packet */
1095         }
1096         if (problem==2)
1097             goto skew;
1098     }
1099
1100     slog(st,LOG_SEC,"transform: %s (aux: %s, new: %s)",
1101          transform_err,auxkey_err,newkey_err);
1102     initiate_key_setup(st,"incoming message would not decrypt",0);
1103     send_nak(src,m.dest,m.source,m.type,msg0,"message would not decrypt");
1104     return False;
1105
1106  skew:
1107     slog(st,LOG_DROP,"transform: %s (merely skew)",transform_err);
1108     return False;
1109 }
1110
1111 static bool_t process_msg0(struct site *st, struct buffer_if *msg0,
1112                            const struct comm_addr *src)
1113 {
1114     uint32_t type;
1115
1116     if (!decrypt_msg0(st,msg0,src))
1117         return False;
1118
1119     CHECK_AVAIL(msg0,4);
1120     type=buf_unprepend_uint32(msg0);
1121     switch(type) {
1122     case LABEL_MSG7:
1123         /* We must forget about the current session. */
1124         delete_keys(st,"request from peer",LOG_SEC);
1125         return True;
1126     case LABEL_MSG9:
1127         /* Deliver to netlink layer */
1128         st->netlink->deliver(st->netlink->st,msg0);
1129         transport_data_msgok(st,src);
1130         /* See whether we should start negotiating a new key */
1131         if (st->now > st->renegotiate_key_time)
1132             initiate_key_setup(st,"incoming packet in renegotiation window",0);
1133         return True;
1134     default:
1135         slog(st,LOG_SEC,"incoming encrypted message of type %08x "
1136              "(unknown)",type);
1137         break;
1138     }
1139     return False;
1140 }
1141
1142 static void dump_packet(struct site *st, struct buffer_if *buf,
1143                         const struct comm_addr *addr, bool_t incoming)
1144 {
1145     uint32_t dest=get_uint32(buf->start);
1146     uint32_t source=get_uint32(buf->start+4);
1147     uint32_t msgtype=get_uint32(buf->start+8);
1148
1149     if (st->log_events & LOG_DUMP)
1150         slilog(st->log,M_DEBUG,"%s: %s: %08x<-%08x: %08x:",
1151                st->tunname,incoming?"incoming":"outgoing",
1152                dest,source,msgtype);
1153 }
1154
1155 static uint32_t site_status(void *st)
1156 {
1157     return 0;
1158 }
1159
1160 static bool_t send_msg(struct site *st)
1161 {
1162     if (st->retries>0) {
1163         transport_xmit(st, &st->setup_peers, &st->buffer, True);
1164         st->timeout=st->now+st->setup_retry_interval;
1165         st->retries--;
1166         return True;
1167     } else if (st->state==SITE_SENTMSG5) {
1168         logtimeout(st,"timed out sending MSG5, stashing new key");
1169         /* We stash the key we have produced, in case it turns out that
1170          * our peer did see our MSG5 after all and starts using it. */
1171         /* This is a bit like some of activate_new_key */
1172         struct transform_inst_if *t;
1173         t=st->auxiliary_key.transform;
1174         st->auxiliary_key.transform=st->new_transform;
1175         st->new_transform=t;
1176         dispose_transform(&st->new_transform);
1177
1178         st->auxiliary_is_new=1;
1179         st->auxiliary_key.key_timeout=st->now+st->key_lifetime;
1180         st->auxiliary_renegotiate_key_time=st->now+st->key_renegotiate_time;
1181         st->auxiliary_key.remote_session_id=st->setup_session_id;
1182
1183         enter_state_wait(st);
1184         return False;
1185     } else {
1186         logtimeout(st,"timed out sending key setup packet "
1187             "(in state %s)",state_name(st->state));
1188         enter_state_wait(st);
1189         return False;
1190     }
1191 }
1192
1193 static void site_resolve_callback(void *sst, const struct comm_addr *addrs,
1194                                   int naddrs, int was_naddrs,
1195                                   const char *failwhy)
1196 {
1197     struct site *st=sst;
1198
1199     st->resolving=False;
1200
1201     if (naddrs) {
1202         slog(st,LOG_STATE,"resolution of %s completed, %d addrs, eg: %s",
1203              st->address, was_naddrs, comm_addr_to_string(&addrs[0]));;
1204         if (naddrs != was_naddrs) {
1205             slog(st,LOG_SETUP_INIT,"resolution of supplied addresses/names"
1206                  " yielded too many results (%d > %d), some ignored",
1207                  was_naddrs, naddrs);
1208         }
1209     } else {
1210         slog(st,LOG_ERROR,"resolution of %s failed: %s",st->address,failwhy);
1211     }
1212
1213     switch (st->state) {
1214     case SITE_RESOLVE:
1215         if (transport_compute_setupinit_peers(st,addrs,naddrs,0)) {
1216             enter_new_state(st,SITE_SENTMSG1);
1217         } else {
1218             /* Can't figure out who to try to to talk to */
1219             slog(st,LOG_SETUP_INIT,
1220                  "key exchange failed: cannot find peer address");
1221             enter_state_run(st);
1222         }
1223         break;
1224     case SITE_SENTMSG1: case SITE_SENTMSG2:
1225     case SITE_SENTMSG3: case SITE_SENTMSG4:
1226     case SITE_SENTMSG5:
1227         if (naddrs) {
1228             /* We start using the address immediately for data too.
1229              * It's best to store it in st->peers now because we might
1230              * go via SENTMSG5, WAIT, and a MSG0, straight into using
1231              * the new key (without updating the data peer addrs). */
1232             transport_resolve_complete(st,addrs,naddrs);
1233         } else if (st->local_mobile) {
1234             /* We can't let this rest because we may have a peer
1235              * address which will break in the future. */
1236             slog(st,LOG_SETUP_INIT,"resolution of %s failed: "
1237                  "abandoning key exchange",st->address);
1238             enter_state_wait(st);
1239         } else {
1240             slog(st,LOG_SETUP_INIT,"resolution of %s failed: "
1241                  " continuing to use source address of peer's packets"
1242                  " for key exchange and ultimately data",
1243                  st->address);
1244         }
1245         break;
1246     case SITE_RUN:
1247         if (naddrs) {
1248             slog(st,LOG_SETUP_INIT,"resolution of %s completed tardily,"
1249                  " updating peer address(es)",st->address);
1250             transport_resolve_complete_tardy(st,addrs,naddrs);
1251         } else if (st->local_mobile) {
1252             /* Not very good.  We should queue (another) renegotiation
1253              * so that we can update the peer address. */
1254             st->key_renegotiate_time=st->now+st->wait_timeout;
1255         } else {
1256             slog(st,LOG_SETUP_INIT,"resolution of %s failed: "
1257                  " continuing to use source address of peer's packets",
1258                  st->address);
1259         }
1260         break;
1261     case SITE_WAIT:
1262     case SITE_STOP:
1263         /* oh well */
1264         break;
1265     }
1266 }
1267
1268 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
1269                                  const struct comm_addr *prod_hint)
1270 {
1271     /* Reentrancy hazard: can call enter_new_state/enter_state_* */
1272     if (st->state!=SITE_RUN) return False;
1273     slog(st,LOG_SETUP_INIT,"initiating key exchange (%s)",reason);
1274     if (st->address) {
1275         slog(st,LOG_SETUP_INIT,"resolving peer address");
1276         return enter_state_resolve(st);
1277     } else if (transport_compute_setupinit_peers(st,0,0,prod_hint)) {
1278         return enter_new_state(st,SITE_SENTMSG1);
1279     }
1280     slog(st,LOG_SETUP_INIT,"key exchange failed: no address for peer");
1281     return False;
1282 }
1283
1284 static void activate_new_key(struct site *st)
1285 {
1286     struct transform_inst_if *t;
1287
1288     /* We have three transform instances, which we swap between old,
1289        active and setup */
1290     t=st->auxiliary_key.transform;
1291     st->auxiliary_key.transform=st->current.transform;
1292     st->current.transform=st->new_transform;
1293     st->new_transform=t;
1294     dispose_transform(&st->new_transform);
1295
1296     st->timeout=0;
1297     st->auxiliary_is_new=0;
1298     st->auxiliary_key.key_timeout=st->current.key_timeout;
1299     st->current.key_timeout=st->now+st->key_lifetime;
1300     st->renegotiate_key_time=st->now+st->key_renegotiate_time;
1301     transport_peers_copy(st,&st->peers,&st->setup_peers);
1302     st->current.remote_session_id=st->setup_session_id;
1303
1304     /* Compute the inter-site MTU.  This is min( our_mtu, their_mtu ).
1305      * But their mtu be unspecified, in which case we just use ours. */
1306     uint32_t intersite_mtu=
1307         MIN(st->mtu_target, st->remote_adv_mtu ?: ~(uint32_t)0);
1308     st->netlink->set_mtu(st->netlink->st,intersite_mtu);
1309
1310     slog(st,LOG_ACTIVATE_KEY,"new key activated"
1311          " (mtu ours=%"PRId32" theirs=%"PRId32" intersite=%"PRId32")",
1312          st->mtu_target, st->remote_adv_mtu, intersite_mtu);
1313     enter_state_run(st);
1314 }
1315
1316 static void delete_one_key(struct site *st, struct data_key *key,
1317                            cstring_t reason, cstring_t which, uint32_t loglevel)
1318 {
1319     if (!is_transform_valid(key->transform)) return;
1320     if (reason) slog(st,loglevel,"%s deleted (%s)",which,reason);
1321     dispose_transform(&key->transform);
1322     key->key_timeout=0;
1323 }
1324
1325 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel)
1326 {
1327     if (current_valid(st)) {
1328         slog(st,loglevel,"session closed (%s)",reason);
1329
1330         delete_one_key(st,&st->current,0,0,0);
1331         set_link_quality(st);
1332     }
1333     delete_one_key(st,&st->auxiliary_key,0,0,0);
1334 }
1335
1336 static void state_assert(struct site *st, bool_t ok)
1337 {
1338     if (!ok) fatal("site:state_assert");
1339 }
1340
1341 static void enter_state_stop(struct site *st)
1342 {
1343     st->state=SITE_STOP;
1344     st->timeout=0;
1345     delete_keys(st,"entering state STOP",LOG_TIMEOUT_KEY);
1346     dispose_transform(&st->new_transform);
1347 }
1348
1349 static void set_link_quality(struct site *st)
1350 {
1351     uint32_t quality;
1352     if (current_valid(st))
1353         quality=LINK_QUALITY_UP;
1354     else if (st->state==SITE_WAIT || st->state==SITE_STOP)
1355         quality=LINK_QUALITY_DOWN;
1356     else if (st->address)
1357         quality=LINK_QUALITY_DOWN_CURRENT_ADDRESS;
1358     else if (transport_peers_valid(&st->peers))
1359         quality=LINK_QUALITY_DOWN_STALE_ADDRESS;
1360     else
1361         quality=LINK_QUALITY_DOWN;
1362
1363     st->netlink->set_quality(st->netlink->st,quality);
1364 }
1365
1366 static void enter_state_run(struct site *st)
1367 {
1368     slog(st,LOG_STATE,"entering state RUN");
1369     st->state=SITE_RUN;
1370     st->timeout=0;
1371
1372     st->setup_session_id=0;
1373     transport_peers_clear(st,&st->setup_peers);
1374     FILLZERO(st->localN);
1375     FILLZERO(st->remoteN);
1376     dispose_transform(&st->new_transform);
1377     memset(st->dhsecret,0,st->dh->len);
1378     memset(st->sharedsecret,0,st->sharedsecretlen);
1379     set_link_quality(st);
1380 }
1381
1382 static bool_t ensure_resolving(struct site *st)
1383 {
1384     /* Reentrancy hazard: may call site_resolve_callback and hence
1385      * enter_new_state, enter_state_* and generate_msg*. */
1386     if (st->resolving)
1387         return True;
1388
1389     assert(st->address);
1390
1391     /* resolver->request might reentrantly call site_resolve_callback
1392      * which will clear st->resolving, so we need to set it beforehand
1393      * rather than afterwards; also, it might return False, in which
1394      * case we have to clear ->resolving again. */
1395     st->resolving=True;
1396     bool_t ok = st->resolver->request(st->resolver->st,st->address,
1397                                       st->remoteport,st->comms[0],
1398                                       site_resolve_callback,st);
1399     if (!ok)
1400         st->resolving=False;
1401
1402     return ok;
1403 }
1404
1405 static bool_t enter_state_resolve(struct site *st)
1406 {
1407     /* Reentrancy hazard!  See ensure_resolving. */
1408     state_assert(st,st->state==SITE_RUN);
1409     slog(st,LOG_STATE,"entering state RESOLVE");
1410     st->state=SITE_RESOLVE;
1411     return ensure_resolving(st);
1412 }
1413
1414 static bool_t enter_new_state(struct site *st, uint32_t next)
1415 {
1416     bool_t (*gen)(struct site *st);
1417     int r;
1418
1419     slog(st,LOG_STATE,"entering state %s",state_name(next));
1420     switch(next) {
1421     case SITE_SENTMSG1:
1422         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE);
1423         gen=generate_msg1;
1424         break;
1425     case SITE_SENTMSG2:
1426         state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1427                      st->state==SITE_SENTMSG1 || st->state==SITE_WAIT);
1428         gen=generate_msg2;
1429         break;
1430     case SITE_SENTMSG3:
1431         state_assert(st,st->state==SITE_SENTMSG1);
1432         BUF_FREE(&st->buffer);
1433         gen=generate_msg3;
1434         break;
1435     case SITE_SENTMSG4:
1436         state_assert(st,st->state==SITE_SENTMSG2);
1437         BUF_FREE(&st->buffer);
1438         gen=generate_msg4;
1439         break;
1440     case SITE_SENTMSG5:
1441         state_assert(st,st->state==SITE_SENTMSG3);
1442         BUF_FREE(&st->buffer);
1443         gen=generate_msg5;
1444         break;
1445     case SITE_RUN:
1446         state_assert(st,st->state==SITE_SENTMSG4);
1447         BUF_FREE(&st->buffer);
1448         gen=generate_msg6;
1449         break;
1450     default:
1451         gen=NULL;
1452         fatal("enter_new_state(%s): invalid new state",state_name(next));
1453         break;
1454     }
1455
1456     if (hacky_par_start_failnow()) return False;
1457
1458     r= gen(st) && send_msg(st);
1459
1460     hacky_par_end(&r,
1461                   st->setup_retries, st->setup_retry_interval,
1462                   send_msg, st);
1463     
1464     if (r) {
1465         st->state=next;
1466         if (next==SITE_RUN) {
1467             BUF_FREE(&st->buffer); /* Never reused */
1468             st->timeout=0; /* Never retransmit */
1469             activate_new_key(st);
1470         }
1471         return True;
1472     }
1473     slog(st,LOG_ERROR,"error entering state %s",state_name(next));
1474     st->buffer.free=False; /* Unconditionally use the buffer; it may be
1475                               in either state, and enter_state_wait() will
1476                               do a BUF_FREE() */
1477     enter_state_wait(st);
1478     return False;
1479 }
1480
1481 /* msg7 tells our peer that we're about to forget our key */
1482 static bool_t send_msg7(struct site *st, cstring_t reason)
1483 {
1484     cstring_t transform_err;
1485
1486     if (current_valid(st) && st->buffer.free
1487         && transport_peers_valid(&st->peers)) {
1488         BUF_ALLOC(&st->buffer,"site:MSG7");
1489         buffer_init(&st->buffer,calculate_max_start_pad());
1490         buf_append_uint32(&st->buffer,LABEL_MSG7);
1491         buf_append_string(&st->buffer,reason);
1492         if (call_transform_forwards(st, st->current.transform,
1493                                     &st->buffer, &transform_err))
1494             goto free_out;
1495         buf_prepend_uint32(&st->buffer,LABEL_MSG0);
1496         buf_prepend_uint32(&st->buffer,st->index);
1497         buf_prepend_uint32(&st->buffer,st->current.remote_session_id);
1498         transport_xmit(st,&st->peers,&st->buffer,True);
1499         BUF_FREE(&st->buffer);
1500     free_out:
1501         return True;
1502     }
1503     return False;
1504 }
1505
1506 /* We go into this state if our peer becomes uncommunicative. Similar to
1507    the "stop" state, we forget all session keys for a while, before
1508    re-entering the "run" state. */
1509 static void enter_state_wait(struct site *st)
1510 {
1511     slog(st,LOG_STATE,"entering state WAIT");
1512     st->timeout=st->now+st->wait_timeout;
1513     st->state=SITE_WAIT;
1514     set_link_quality(st);
1515     BUF_FREE(&st->buffer); /* will have had an outgoing packet in it */
1516     /* XXX Erase keys etc. */
1517 }
1518
1519 static void generate_prod(struct site *st, struct buffer_if *buf)
1520 {
1521     buffer_init(buf,0);
1522     buf_append_uint32(buf,0);
1523     buf_append_uint32(buf,0);
1524     buf_append_uint32(buf,LABEL_PROD);
1525     buf_append_string(buf,st->localname);
1526     buf_append_string(buf,st->remotename);
1527 }
1528
1529 static void generate_send_prod(struct site *st,
1530                                const struct comm_addr *source)
1531 {
1532     if (!st->allow_send_prod) return; /* too soon */
1533     if (!(st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1534           st->state==SITE_WAIT)) return; /* we'd ignore peer's MSG1 */
1535
1536     slog(st,LOG_SETUP_INIT,"prodding peer for key exchange");
1537     st->allow_send_prod=0;
1538     generate_prod(st,&st->scratch);
1539     dump_packet(st,&st->scratch,source,False);
1540     source->comm->sendmsg(source->comm->st, &st->scratch, source);
1541 }
1542
1543 static inline void site_settimeout(uint64_t timeout, int *timeout_io)
1544 {
1545     if (timeout) {
1546         int64_t offset=timeout-*now;
1547         if (offset<0) offset=0;
1548         if (offset>INT_MAX) offset=INT_MAX;
1549         if (*timeout_io<0 || offset<*timeout_io)
1550             *timeout_io=offset;
1551     }
1552 }
1553
1554 static int site_beforepoll(void *sst, struct pollfd *fds, int *nfds_io,
1555                            int *timeout_io)
1556 {
1557     struct site *st=sst;
1558
1559     *nfds_io=0; /* We don't use any file descriptors */
1560     st->now=*now;
1561
1562     /* Work out when our next timeout is. The earlier of 'timeout' or
1563        'current.key_timeout'. A stored value of '0' indicates no timeout
1564        active. */
1565     site_settimeout(st->timeout, timeout_io);
1566     site_settimeout(st->current.key_timeout, timeout_io);
1567     site_settimeout(st->auxiliary_key.key_timeout, timeout_io);
1568
1569     return 0; /* success */
1570 }
1571
1572 static void check_expiry(struct site *st, struct data_key *key,
1573                          const char *which)
1574 {
1575     if (key->key_timeout && *now>key->key_timeout) {
1576         delete_one_key(st,key,"maximum life exceeded",which,LOG_TIMEOUT_KEY);
1577     }
1578 }
1579
1580 /* NB site_afterpoll will be called before site_beforepoll is ever called */
1581 static void site_afterpoll(void *sst, struct pollfd *fds, int nfds)
1582 {
1583     struct site *st=sst;
1584
1585     st->now=*now;
1586     if (st->timeout && *now>st->timeout) {
1587         st->timeout=0;
1588         if (st->state>=SITE_SENTMSG1 && st->state<=SITE_SENTMSG5) {
1589             if (!hacky_par_start_failnow())
1590                 send_msg(st);
1591         } else if (st->state==SITE_WAIT) {
1592             enter_state_run(st);
1593         } else {
1594             slog(st,LOG_ERROR,"site_afterpoll: unexpected timeout, state=%d",
1595                  st->state);
1596         }
1597     }
1598     check_expiry(st,&st->current,"current key");
1599     check_expiry(st,&st->auxiliary_key,"auxiliary key");
1600 }
1601
1602 /* This function is called by the netlink device to deliver packets
1603    intended for the remote network. The packet is in "raw" wire
1604    format, but is guaranteed to be word-aligned. */
1605 static void site_outgoing(void *sst, struct buffer_if *buf)
1606 {
1607     struct site *st=sst;
1608     cstring_t transform_err;
1609     
1610     if (st->state==SITE_STOP) {
1611         BUF_FREE(buf);
1612         return;
1613     }
1614
1615     st->allow_send_prod=1;
1616
1617     /* In all other states we consider delivering the packet if we have
1618        a valid key and a valid address to send it to. */
1619     if (current_valid(st) && transport_peers_valid(&st->peers)) {
1620         /* Transform it and send it */
1621         if (buf->size>0) {
1622             buf_prepend_uint32(buf,LABEL_MSG9);
1623             if (call_transform_forwards(st, st->current.transform,
1624                                         buf, &transform_err))
1625                 goto free_out;
1626             buf_prepend_uint32(buf,LABEL_MSG0);
1627             buf_prepend_uint32(buf,st->index);
1628             buf_prepend_uint32(buf,st->current.remote_session_id);
1629             transport_xmit(st,&st->peers,buf,False);
1630         }
1631     free_out:
1632         BUF_FREE(buf);
1633         return;
1634     }
1635
1636     slog(st,LOG_DROP,"discarding outgoing packet of size %d",buf->size);
1637     BUF_FREE(buf);
1638     initiate_key_setup(st,"outgoing packet",0);
1639 }
1640
1641 static bool_t named_for_us(struct site *st, const struct buffer_if *buf_in,
1642                            uint32_t type, struct msg *m)
1643     /* For packets which are identified by the local and remote names.
1644      * If it has our name and our peer's name in it it's for us. */
1645 {
1646     struct buffer_if buf[1];
1647     buffer_readonly_clone(buf,buf_in);
1648     return unpick_msg(st,type,buf,m)
1649         && name_matches(&m->remote,st->remotename)
1650         && name_matches(&m->local,st->localname);
1651 }
1652
1653 /* This function is called by the communication device to deliver
1654    packets from our peers.
1655    It should return True if the packet is recognised as being for
1656    this current site instance (and should therefore not be processed
1657    by other sites), even if the packet was otherwise ignored. */
1658 static bool_t site_incoming(void *sst, struct buffer_if *buf,
1659                             const struct comm_addr *source)
1660 {
1661     struct site *st=sst;
1662
1663     if (buf->size < 12) return False;
1664
1665     uint32_t dest=get_uint32(buf->start);
1666     uint32_t msgtype=get_uint32(buf->start+8);
1667     struct msg named_msg;
1668
1669     if (msgtype==LABEL_MSG1) {
1670         if (!named_for_us(st,buf,msgtype,&named_msg))
1671             return False;
1672         /* It's a MSG1 addressed to us. Decide what to do about it. */
1673         dump_packet(st,buf,source,True);
1674         if (st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1675             st->state==SITE_WAIT) {
1676             /* We should definitely process it */
1677             transport_compute_setupinit_peers(st,0,0,source);
1678             if (process_msg1(st,buf,source,&named_msg)) {
1679                 slog(st,LOG_SETUP_INIT,"key setup initiated by peer");
1680                 bool_t entered=enter_new_state(st,SITE_SENTMSG2);
1681                 if (entered && st->address && st->local_mobile)
1682                     /* We must do this as the very last thing, because
1683                        the resolver callback might reenter us. */
1684                     ensure_resolving(st);
1685             } else {
1686                 slog(st,LOG_ERROR,"failed to process incoming msg1");
1687             }
1688             BUF_FREE(buf);
1689             return True;
1690         } else if (st->state==SITE_SENTMSG1) {
1691             /* We've just sent a message 1! They may have crossed on
1692                the wire. If we have priority then we ignore the
1693                incoming one, otherwise we process it as usual. */
1694             if (st->setup_priority) {
1695                 BUF_FREE(buf);
1696                 slog(st,LOG_DUMP,"crossed msg1s; we are higher "
1697                      "priority => ignore incoming msg1");
1698                 return True;
1699             } else {
1700                 slog(st,LOG_DUMP,"crossed msg1s; we are lower "
1701                      "priority => use incoming msg1");
1702                 if (process_msg1(st,buf,source,&named_msg)) {
1703                     BUF_FREE(&st->buffer); /* Free our old message 1 */
1704                     transport_setup_msgok(st,source);
1705                     enter_new_state(st,SITE_SENTMSG2);
1706                 } else {
1707                     slog(st,LOG_ERROR,"failed to process an incoming "
1708                          "crossed msg1 (we have low priority)");
1709                 }
1710                 BUF_FREE(buf);
1711                 return True;
1712             }
1713         }
1714         /* The message 1 was received at an unexpected stage of the
1715            key setup. XXX POLICY - what do we do? */
1716         slog(st,LOG_UNEXPECTED,"unexpected incoming message 1");
1717         BUF_FREE(buf);
1718         return True;
1719     }
1720     if (msgtype==LABEL_PROD) {
1721         if (!named_for_us(st,buf,msgtype,&named_msg))
1722             return False;
1723         dump_packet(st,buf,source,True);
1724         if (st->state!=SITE_RUN) {
1725             slog(st,LOG_DROP,"ignoring PROD when not in state RUN");
1726         } else if (current_valid(st)) {
1727             slog(st,LOG_DROP,"ignoring PROD when we think we have a key");
1728         } else {
1729             initiate_key_setup(st,"peer sent PROD packet",source);
1730         }
1731         BUF_FREE(buf);
1732         return True;
1733     }
1734     if (dest==st->index) {
1735         /* Explicitly addressed to us */
1736         if (msgtype!=LABEL_MSG0) dump_packet(st,buf,source,True);
1737         switch (msgtype) {
1738         case LABEL_NAK:
1739             /* If the source is our current peer then initiate a key setup,
1740                because our peer's forgotten the key */
1741             if (get_uint32(buf->start+4)==st->current.remote_session_id) {
1742                 bool_t initiated;
1743                 initiated = initiate_key_setup(st,"received a NAK",source);
1744                 if (!initiated) generate_send_prod(st,source);
1745             } else {
1746                 slog(st,LOG_SEC,"bad incoming NAK");
1747             }
1748             break;
1749         case LABEL_MSG0:
1750             process_msg0(st,buf,source);
1751             break;
1752         case LABEL_MSG1:
1753             /* Setup packet: should not have been explicitly addressed
1754                to us */
1755             slog(st,LOG_SEC,"incoming explicitly addressed msg1");
1756             break;
1757         case LABEL_MSG2:
1758             /* Setup packet: expected only in state SENTMSG1 */
1759             if (st->state!=SITE_SENTMSG1) {
1760                 slog(st,LOG_UNEXPECTED,"unexpected MSG2");
1761             } else if (process_msg2(st,buf,source)) {
1762                 transport_setup_msgok(st,source);
1763                 enter_new_state(st,SITE_SENTMSG3);
1764             } else {
1765                 slog(st,LOG_SEC,"invalid MSG2");
1766             }
1767             break;
1768         case LABEL_MSG3:
1769         case LABEL_MSG3BIS:
1770             /* Setup packet: expected only in state SENTMSG2 */
1771             if (st->state!=SITE_SENTMSG2) {
1772                 slog(st,LOG_UNEXPECTED,"unexpected MSG3");
1773             } else if (process_msg3(st,buf,source,msgtype)) {
1774                 transport_setup_msgok(st,source);
1775                 enter_new_state(st,SITE_SENTMSG4);
1776             } else {
1777                 slog(st,LOG_SEC,"invalid MSG3");
1778             }
1779             break;
1780         case LABEL_MSG4:
1781             /* Setup packet: expected only in state SENTMSG3 */
1782             if (st->state!=SITE_SENTMSG3) {
1783                 slog(st,LOG_UNEXPECTED,"unexpected MSG4");
1784             } else if (process_msg4(st,buf,source)) {
1785                 transport_setup_msgok(st,source);
1786                 enter_new_state(st,SITE_SENTMSG5);
1787             } else {
1788                 slog(st,LOG_SEC,"invalid MSG4");
1789             }
1790             break;
1791         case LABEL_MSG5:
1792             /* Setup packet: expected only in state SENTMSG4 */
1793             /* (may turn up in state RUN if our return MSG6 was lost
1794                and the new key has already been activated. In that
1795                case we discard it. The peer will realise that we
1796                are using the new key when they see our data packets.
1797                Until then the peer's data packets to us get discarded. */
1798             if (st->state==SITE_SENTMSG4) {
1799                 if (process_msg5(st,buf,source,st->new_transform)) {
1800                     transport_setup_msgok(st,source);
1801                     enter_new_state(st,SITE_RUN);
1802                 } else {
1803                     slog(st,LOG_SEC,"invalid MSG5");
1804                 }
1805             } else if (st->state==SITE_RUN) {
1806                 if (process_msg5(st,buf,source,st->current.transform)) {
1807                     slog(st,LOG_DROP,"got MSG5, retransmitting MSG6");
1808                     transport_setup_msgok(st,source);
1809                     create_msg6(st,st->current.transform,
1810                                 st->current.remote_session_id);
1811                     transport_xmit(st,&st->peers,&st->buffer,True);
1812                     BUF_FREE(&st->buffer);
1813                 } else {
1814                     slog(st,LOG_SEC,"invalid MSG5 (in state RUN)");
1815                 }
1816             } else {
1817                 slog(st,LOG_UNEXPECTED,"unexpected MSG5");
1818             }
1819             break;
1820         case LABEL_MSG6:
1821             /* Setup packet: expected only in state SENTMSG5 */
1822             if (st->state!=SITE_SENTMSG5) {
1823                 slog(st,LOG_UNEXPECTED,"unexpected MSG6");
1824             } else if (process_msg6(st,buf,source)) {
1825                 BUF_FREE(&st->buffer); /* Free message 5 */
1826                 transport_setup_msgok(st,source);
1827                 activate_new_key(st);
1828             } else {
1829                 slog(st,LOG_SEC,"invalid MSG6");
1830             }
1831             break;
1832         default:
1833             slog(st,LOG_SEC,"received message of unknown type 0x%08x",
1834                  msgtype);
1835             break;
1836         }
1837         BUF_FREE(buf);
1838         return True;
1839     }
1840
1841     return False;
1842 }
1843
1844 static void site_control(void *vst, bool_t run)
1845 {
1846     struct site *st=vst;
1847     if (run) enter_state_run(st);
1848     else enter_state_stop(st);
1849 }
1850
1851 static void site_phase_hook(void *sst, uint32_t newphase)
1852 {
1853     struct site *st=sst;
1854
1855     /* The program is shutting down; tell our peer */
1856     send_msg7(st,"shutting down");
1857 }
1858
1859 static list_t *site_apply(closure_t *self, struct cloc loc, dict_t *context,
1860                           list_t *args)
1861 {
1862     static uint32_t index_sequence;
1863     struct site *st;
1864     item_t *item;
1865     dict_t *dict;
1866     int i;
1867
1868     st=safe_malloc(sizeof(*st),"site_apply");
1869
1870     st->cl.description="site";
1871     st->cl.type=CL_SITE;
1872     st->cl.apply=NULL;
1873     st->cl.interface=&st->ops;
1874     st->ops.st=st;
1875     st->ops.control=site_control;
1876     st->ops.status=site_status;
1877
1878     /* First parameter must be a dict */
1879     item=list_elem(args,0);
1880     if (!item || item->type!=t_dict)
1881         cfgfatal(loc,"site","parameter must be a dictionary\n");
1882     
1883     dict=item->data.dict;
1884     st->localname=dict_read_string(dict, "local-name", True, "site", loc);
1885     st->remotename=dict_read_string(dict, "name", True, "site", loc);
1886
1887     st->peer_mobile=dict_read_bool(dict,"mobile",False,"site",loc,False);
1888     st->local_mobile=
1889         dict_read_bool(dict,"local-mobile",False,"site",loc,False);
1890
1891     /* Sanity check (which also allows the 'sites' file to include
1892        site() closures for all sites including our own): refuse to
1893        talk to ourselves */
1894     if (strcmp(st->localname,st->remotename)==0) {
1895         Message(M_DEBUG,"site %s: local-name==name -> ignoring this site\n",
1896                 st->localname);
1897         if (st->peer_mobile != st->local_mobile)
1898             cfgfatal(loc,"site","site %s's peer-mobile=%d"
1899                     " but our local-mobile=%d\n",
1900                     st->localname, st->peer_mobile, st->local_mobile);
1901         free(st);
1902         return NULL;
1903     }
1904     if (st->peer_mobile && st->local_mobile) {
1905         Message(M_WARNING,"site %s: site is mobile but so are we"
1906                 " -> ignoring this site\n", st->remotename);
1907         free(st);
1908         return NULL;
1909     }
1910
1911     assert(index_sequence < 0xffffffffUL);
1912     st->index = ++index_sequence;
1913     st->local_capabilities = 0;
1914     st->netlink=find_cl_if(dict,"link",CL_NETLINK,True,"site",loc);
1915
1916 #define GET_CLOSURE_LIST(dictkey,things,nthings,CL_TYPE) do{            \
1917     list_t *things##_cfg=dict_lookup(dict,dictkey);                     \
1918     if (!things##_cfg)                                                  \
1919         cfgfatal(loc,"site","closure list \"%s\" not found\n",dictkey); \
1920     st->nthings=list_length(things##_cfg);                              \
1921     st->things=safe_malloc_ary(sizeof(*st->things),st->nthings,dictkey "s"); \
1922     assert(st->nthings);                                                \
1923     for (i=0; i<st->nthings; i++) {                                     \
1924         item_t *item=list_elem(things##_cfg,i);                         \
1925         if (item->type!=t_closure)                                      \
1926             cfgfatal(loc,"site","%s is not a closure\n",dictkey);       \
1927         closure_t *cl=item->data.closure;                               \
1928         if (cl->type!=CL_TYPE)                                          \
1929             cfgfatal(loc,"site","%s closure wrong type\n",dictkey);     \
1930         st->things[i]=cl->interface;                                    \
1931     }                                                                   \
1932 }while(0)
1933
1934     GET_CLOSURE_LIST("comm",comms,ncomms,CL_COMM);
1935
1936     st->resolver=find_cl_if(dict,"resolver",CL_RESOLVER,True,"site",loc);
1937     st->log=find_cl_if(dict,"log",CL_LOG,True,"site",loc);
1938     st->random=find_cl_if(dict,"random",CL_RANDOMSRC,True,"site",loc);
1939
1940     st->privkey=find_cl_if(dict,"local-key",CL_RSAPRIVKEY,True,"site",loc);
1941     st->address=dict_read_string(dict, "address", False, "site", loc);
1942     if (st->address)
1943         st->remoteport=dict_read_number(dict,"port",True,"site",loc,0);
1944     else st->remoteport=0;
1945     st->pubkey=find_cl_if(dict,"key",CL_RSAPUBKEY,True,"site",loc);
1946
1947     GET_CLOSURE_LIST("transform",transforms,ntransforms,CL_TRANSFORM);
1948
1949     st->dh=find_cl_if(dict,"dh",CL_DH,True,"site",loc);
1950     st->hash=find_cl_if(dict,"hash",CL_HASH,True,"site",loc);
1951
1952 #define DEFAULT(D) (st->peer_mobile || st->local_mobile \
1953                     ? DEFAULT_MOBILE_##D : DEFAULT_##D)
1954 #define CFG_NUMBER(k,D) dict_read_number(dict,(k),False,"site",loc,DEFAULT(D));
1955
1956     st->key_lifetime=         CFG_NUMBER("key-lifetime",  KEY_LIFETIME);
1957     st->setup_retries=        CFG_NUMBER("setup-retries", SETUP_RETRIES);
1958     st->setup_retry_interval= CFG_NUMBER("setup-timeout", SETUP_RETRY_INTERVAL);
1959     st->wait_timeout=         CFG_NUMBER("wait-time",     WAIT_TIME);
1960     st->mtu_target= dict_read_number(dict,"mtu-target",False,"site",loc,0);
1961
1962     st->mobile_peer_expiry= dict_read_number(
1963        dict,"mobile-peer-expiry",False,"site",loc,DEFAULT_MOBILE_PEER_EXPIRY);
1964
1965     const char *peerskey= st->peer_mobile
1966         ? "mobile-peers-max" : "static-peers-max";
1967     st->transport_peers_max= dict_read_number(
1968         dict,peerskey,False,"site",loc, st->address ? 4 : 3);
1969     if (st->transport_peers_max<1 ||
1970         st->transport_peers_max>MAX_PEER_ADDRS) {
1971         cfgfatal(loc,"site", "%s must be in range 1.."
1972                  STRING(MAX_PEER_ADDRS) "\n", peerskey);
1973     }
1974
1975     if (st->key_lifetime < DEFAULT(KEY_RENEGOTIATE_GAP)*2)
1976         st->key_renegotiate_time=st->key_lifetime/2;
1977     else
1978         st->key_renegotiate_time=st->key_lifetime-DEFAULT(KEY_RENEGOTIATE_GAP);
1979     st->key_renegotiate_time=dict_read_number(
1980         dict,"renegotiate-time",False,"site",loc,st->key_renegotiate_time);
1981     if (st->key_renegotiate_time > st->key_lifetime) {
1982         cfgfatal(loc,"site",
1983                  "renegotiate-time must be less than key-lifetime\n");
1984     }
1985
1986     st->log_events=string_list_to_word(dict_lookup(dict,"log-events"),
1987                                        log_event_table,"site");
1988
1989     st->resolving=False;
1990     st->allow_send_prod=0;
1991
1992     st->tunname=safe_malloc(strlen(st->localname)+strlen(st->remotename)+5,
1993                             "site_apply");
1994     sprintf(st->tunname,"%s<->%s",st->localname,st->remotename);
1995
1996     /* The information we expect to see in incoming messages of type 1 */
1997     /* fixme: lots of unchecked overflows here, but the results are only
1998        corrupted packets rather than undefined behaviour */
1999     st->setup_priority=(strcmp(st->localname,st->remotename)>0);
2000
2001     buffer_new(&st->buffer,SETUP_BUFFER_LEN);
2002
2003     buffer_new(&st->scratch,SETUP_BUFFER_LEN);
2004     BUF_ALLOC(&st->scratch,"site:scratch");
2005
2006     /* We are interested in poll(), but only for timeouts. We don't have
2007        any fds of our own. */
2008     register_for_poll(st, site_beforepoll, site_afterpoll, 0, "site");
2009     st->timeout=0;
2010
2011     st->remote_capabilities=0;
2012     st->chosen_transform=0;
2013     st->current.key_timeout=0;
2014     st->auxiliary_key.key_timeout=0;
2015     transport_peers_clear(st,&st->peers);
2016     transport_peers_clear(st,&st->setup_peers);
2017     /* XXX mlock these */
2018     st->dhsecret=safe_malloc(st->dh->len,"site:dhsecret");
2019     st->sharedsecretlen=st->sharedsecretallocd=0;
2020     st->sharedsecret=0;
2021
2022     for (i=0; i<st->ntransforms; i++) {
2023         struct transform_if *ti=st->transforms[i];
2024         uint32_t capbit = 1UL << ti->capab_transformnum;
2025         if (st->local_capabilities & capbit)
2026             slog(st,LOG_ERROR,"transformnum capability bit"
2027                  " %d (%#"PRIx32") reused", ti->capab_transformnum, capbit);
2028         st->local_capabilities |= capbit;
2029     }
2030
2031     /* We need to register the remote networks with the netlink device */
2032     uint32_t netlink_mtu; /* local virtual interface mtu */
2033     st->netlink->reg(st->netlink->st, site_outgoing, st, &netlink_mtu);
2034     if (!st->mtu_target)
2035         st->mtu_target=netlink_mtu;
2036     
2037     for (i=0; i<st->ncomms; i++)
2038         st->comms[i]->request_notify(st->comms[i]->st, st, site_incoming);
2039
2040     st->current.transform=0;
2041     st->auxiliary_key.transform=0;
2042     st->new_transform=0;
2043     st->auxiliary_is_new=0;
2044
2045     enter_state_stop(st);
2046
2047     add_hook(PHASE_SHUTDOWN,site_phase_hook,st);
2048
2049     return new_closure(&st->cl);
2050 }
2051
2052 void site_module(dict_t *dict)
2053 {
2054     add_closure(dict,"site",site_apply);
2055 }
2056
2057
2058 /***** TRANSPORT PEERS definitions *****/
2059
2060 static void transport_peers_debug(struct site *st, transport_peers *dst,
2061                                   const char *didwhat,
2062                                   int nargs, const struct comm_addr *args,
2063                                   size_t stride) {
2064     int i;
2065     char *argp;
2066
2067     if (!(st->log_events & LOG_PEER_ADDRS))
2068         return; /* an optimisation */
2069
2070     slog(st, LOG_PEER_ADDRS, "peers (%s) %s nargs=%d => npeers=%d",
2071          (dst==&st->peers ? "data" :
2072           dst==&st->setup_peers ? "setup" : "UNKNOWN"),
2073          didwhat, nargs, dst->npeers);
2074
2075     for (i=0, argp=(void*)args;
2076          i<nargs;
2077          i++, (argp+=stride?stride:sizeof(*args))) {
2078         const struct comm_addr *ca=(void*)argp;
2079         slog(st, LOG_PEER_ADDRS, " args: addrs[%d]=%s",
2080              i, comm_addr_to_string(ca));
2081     }
2082     for (i=0; i<dst->npeers; i++) {
2083         struct timeval diff;
2084         timersub(tv_now,&dst->peers[i].last,&diff);
2085         const struct comm_addr *ca=&dst->peers[i].addr;
2086         slog(st, LOG_PEER_ADDRS, " peers: addrs[%d]=%s T-%ld.%06ld",
2087              i, comm_addr_to_string(ca),
2088              (unsigned long)diff.tv_sec, (unsigned long)diff.tv_usec);
2089     }
2090 }
2091
2092 static void transport_peers_expire(struct site *st, transport_peers *peers) {
2093     /* peers must be sorted first */
2094     int previous_peers=peers->npeers;
2095     struct timeval oldest;
2096     oldest.tv_sec  = tv_now->tv_sec - st->mobile_peer_expiry;
2097     oldest.tv_usec = tv_now->tv_usec;
2098     while (peers->npeers>1 &&
2099            timercmp(&peers->peers[peers->npeers-1].last, &oldest, <))
2100         peers->npeers--;
2101     if (peers->npeers != previous_peers)
2102         transport_peers_debug(st,peers,"expire", 0,0,0);
2103 }
2104
2105 static bool_t transport_peer_record_one(struct site *st, transport_peers *peers,
2106                                         const struct comm_addr *ca,
2107                                         const struct timeval *tv) {
2108     /* returns false if output is full */
2109     int search;
2110
2111     if (peers->npeers >= st->transport_peers_max)
2112         return 0;
2113
2114     for (search=0; search<peers->npeers; search++)
2115         if (comm_addr_equal(&peers->peers[search].addr, ca))
2116             return 1;
2117
2118     peers->peers[peers->npeers].addr = *ca;
2119     peers->peers[peers->npeers].last = *tv;
2120     peers->npeers++;
2121     return 1;
2122 }
2123
2124 static void transport_record_peers(struct site *st, transport_peers *peers,
2125                                    const struct comm_addr *addrs, int naddrs,
2126                                    const char *m) {
2127     /* We add addrs into peers.  The new entries end up at the front
2128      * and displace entries towards the end (perhaps even off the
2129      * end).  Any existing matching entries are moved up to the front.
2130      *
2131      * Caller must first call transport_peers_expire. */
2132
2133     if (naddrs==1 && peers->npeers>=1 &&
2134         comm_addr_equal(&addrs[0], &peers->peers[0].addr)) {
2135         /* optimisation, also avoids debug for trivial updates */
2136         peers->peers[0].last = *tv_now;
2137         return;
2138     }
2139
2140     int old_npeers=peers->npeers;
2141     transport_peer old_peers[old_npeers];
2142     COPY_ARRAY(old_peers,peers->peers,old_npeers);
2143
2144     peers->npeers=0;
2145     int i;
2146     for (i=0; i<naddrs; i++) {
2147         if (!transport_peer_record_one(st,peers, &addrs[i], tv_now))
2148             break;
2149     }
2150     for (i=0; i<old_npeers; i++) {
2151         const transport_peer *old=&old_peers[i];
2152         if (!transport_peer_record_one(st,peers, &old->addr, &old->last))
2153             break;
2154     }
2155
2156     transport_peers_debug(st,peers,m, naddrs,addrs,0);
2157 }
2158
2159 static void transport_expire_record_peers(struct site *st,
2160                                           transport_peers *peers,
2161                                           const struct comm_addr *addrs,
2162                                           int naddrs, const char *m) {
2163     /* Convenience function */
2164     transport_peers_expire(st,peers);
2165     transport_record_peers(st,peers,addrs,naddrs,m);
2166 }
2167
2168 static bool_t transport_compute_setupinit_peers(struct site *st,
2169         const struct comm_addr *configured_addrs /* 0 if none or not found */,
2170         int n_configured_addrs /* 0 if none or not found */,
2171         const struct comm_addr *incoming_packet_addr /* 0 if none */) {
2172     if (!n_configured_addrs && !incoming_packet_addr &&
2173         !transport_peers_valid(&st->peers))
2174         return False;
2175
2176     slog(st,LOG_SETUP_INIT,
2177          "using: %d configured addr(s);%s %d old peer addrs(es)",
2178          n_configured_addrs,
2179          incoming_packet_addr ? " incoming packet address;" : "",
2180          st->peers.npeers);
2181
2182     /* Non-mobile peers try addresses until one is plausible.  The
2183      * effect is that this code always tries first the configured
2184      * address if supplied, or otherwise the address of the incoming
2185      * PROD, or finally the existing data peer if one exists; this is
2186      * as desired. */
2187
2188     transport_peers_copy(st,&st->setup_peers,&st->peers);
2189     transport_peers_expire(st,&st->setup_peers);
2190
2191     if (incoming_packet_addr)
2192         transport_record_peers(st,&st->setup_peers,
2193                                incoming_packet_addr,1, "incoming");
2194
2195     if (n_configured_addrs)
2196         transport_record_peers(st,&st->setup_peers,
2197                               configured_addrs,n_configured_addrs, "setupinit");
2198
2199     assert(transport_peers_valid(&st->setup_peers));
2200     return True;
2201 }
2202
2203 static void transport_setup_msgok(struct site *st, const struct comm_addr *a) {
2204     if (st->peer_mobile)
2205         transport_expire_record_peers(st,&st->setup_peers,a,1,"setupmsg");
2206 }
2207 static void transport_data_msgok(struct site *st, const struct comm_addr *a) {
2208     if (st->peer_mobile)
2209         transport_expire_record_peers(st,&st->peers,a,1,"datamsg");
2210 }
2211
2212 static int transport_peers_valid(transport_peers *peers) {
2213     return peers->npeers;
2214 }
2215 static void transport_peers_clear(struct site *st, transport_peers *peers) {
2216     peers->npeers= 0;
2217     transport_peers_debug(st,peers,"clear",0,0,0);
2218 }
2219 static void transport_peers_copy(struct site *st, transport_peers *dst,
2220                                  const transport_peers *src) {
2221     dst->npeers=src->npeers;
2222     COPY_ARRAY(dst->peers, src->peers, dst->npeers);
2223     transport_peers_debug(st,dst,"copy",
2224                           src->npeers, &src->peers->addr, sizeof(*src->peers));
2225 }
2226
2227 static void transport_resolve_complete(struct site *st,
2228                                        const struct comm_addr *addrs,
2229                                        int naddrs) {
2230     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2231                                   "resolved data");
2232     transport_expire_record_peers(st,&st->setup_peers,addrs,naddrs,
2233                                   "resolved setup");
2234 }
2235
2236 static void transport_resolve_complete_tardy(struct site *st,
2237                                              const struct comm_addr *addrs,
2238                                              int naddrs) {
2239     transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2240                                   "resolved tardily");
2241 }
2242
2243 static void transport_peers__copy_by_mask(transport_peer *out, int *nout_io,
2244                                           unsigned mask,
2245                                           const transport_peers *inp) {
2246     /* out and in->peers may be the same region, or nonoverlapping */
2247     const transport_peer *in=inp->peers;
2248     int slot;
2249     for (slot=0; slot<inp->npeers; slot++) {
2250         if (!(mask & (1U << slot)))
2251             continue;
2252         if (!(out==in && slot==*nout_io))
2253             COPY_OBJ(out[*nout_io], in[slot]);
2254         (*nout_io)++;
2255     }
2256 }
2257
2258 void transport_xmit(struct site *st, transport_peers *peers,
2259                     struct buffer_if *buf, bool_t candebug) {
2260     int slot;
2261     transport_peers_expire(st, peers);
2262     unsigned failed=0; /* bitmask */
2263     assert(MAX_PEER_ADDRS < sizeof(unsigned)*CHAR_BIT);
2264
2265     int nfailed=0;
2266     for (slot=0; slot<peers->npeers; slot++) {
2267         transport_peer *peer=&peers->peers[slot];
2268         if (candebug)
2269             dump_packet(st, buf, &peer->addr, False);
2270         bool_t ok =
2271             peer->addr.comm->sendmsg(peer->addr.comm->st, buf, &peer->addr);
2272         if (!ok) {
2273             failed |= 1U << slot;
2274             nfailed++;
2275         }
2276         if (ok && !st->peer_mobile)
2277             break;
2278     }
2279     /* Now we need to demote/delete failing addrs: if we are mobile we
2280      * merely demote them; otherwise we delete them. */
2281     if (st->local_mobile) {
2282         unsigned expected = ((1U << nfailed)-1) << (peers->npeers-nfailed);
2283         /* `expected' has all the failures at the end already */
2284         if (failed != expected) {
2285             int fslot=0;
2286             transport_peer failedpeers[nfailed];
2287             transport_peers__copy_by_mask(failedpeers, &fslot, failed,peers);
2288             assert(fslot == nfailed);
2289             int wslot=0;
2290             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2291             assert(wslot+nfailed == peers->npeers);
2292             COPY_ARRAY(peers->peers+wslot, failedpeers, nfailed);
2293         }
2294     } else {
2295         if (failed && peers->npeers > 1) {
2296             int wslot=0;
2297             transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2298             peers->npeers=wslot;
2299         }
2300     }
2301 }
2302
2303 /***** END of transport peers declarations *****/