site: Introduce comm_addr_sendmsg
[secnet] / site.c
1 /* site.c - manage communication with a remote network site */
2
3 /*
4 * This file is part of secnet.
5 * See README for full list of copyright holders.
6 *
7 * secnet is free software; you can redistribute it and/or modify it
8 * under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version d of the License, or
10 * (at your option) any later version.
11 *
12 * secnet is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * version 3 along with secnet; if not, see
19 * https://www.gnu.org/licenses/gpl.html.
20 */
21
22 /* The 'site' code doesn't know anything about the structure of the
23 packets it's transmitting. In fact, under the new netlink
24 configuration scheme it doesn't need to know anything at all about
25 IP addresses, except how to contact its peer. This means it could
26 potentially be used to tunnel other protocols too (IPv6, IPX, plain
27 old Ethernet frames) if appropriate netlink code can be written
28 (and that ought not to be too hard, eg. using the TUN/TAP device to
29 pretend to be an Ethernet interface). */
30
31 /* At some point in the future the netlink code will be asked for
32 configuration information to go in the PING/PONG packets at the end
33 of the key exchange. */
34
35 #include "secnet.h"
36 #include <stdio.h>
37 #include <string.h>
38 #include <limits.h>
39 #include <assert.h>
40 #include <sys/socket.h>
41
42 #include <sys/mman.h>
43 #include "util.h"
44 #include "unaligned.h"
45 #include "magic.h"
46
47 #define SETUP_BUFFER_LEN 2048
48
49 #define DEFAULT_KEY_LIFETIME (3600*1000) /* [ms] */
50 #define DEFAULT_KEY_RENEGOTIATE_GAP (5*60*1000) /* [ms] */
51 #define DEFAULT_SETUP_RETRIES 5
52 #define DEFAULT_SETUP_RETRY_INTERVAL (2*1000) /* [ms] */
53 #define DEFAULT_WAIT_TIME (20*1000) /* [ms] */
54
55 #define DEFAULT_MOBILE_KEY_LIFETIME (2*24*3600*1000) /* [ms] */
56 #define DEFAULT_MOBILE_KEY_RENEGOTIATE_GAP (12*3600*1000) /* [ms] */
57 #define DEFAULT_MOBILE_SETUP_RETRIES 30
58 #define DEFAULT_MOBILE_SETUP_RETRY_INTERVAL (1*1000) /* [ms] */
59 #define DEFAULT_MOBILE_WAIT_TIME (10*1000) /* [ms] */
60
61 #define DEFAULT_MOBILE_PEER_EXPIRY (2*60) /* [s] */
62
63 /* Each site can be in one of several possible states. */
64
65 /* States:
66 SITE_STOP - nothing is allowed to happen; tunnel is down;
67 all session keys have been erased
68 -> SITE_RUN upon external instruction
69 SITE_RUN - site up, maybe with valid key
70 -> SITE_RESOLVE upon outgoing packet and no valid key
71 we start name resolution for the other end of the tunnel
72 -> SITE_SENTMSG2 upon valid incoming message 1 and suitable time
73 we send an appropriate message 2
74 SITE_RESOLVE - waiting for name resolution
75 -> SITE_SENTMSG1 upon successful resolution
76 we send an appropriate message 1
77 -> SITE_SENTMSG2 upon valid incoming message 1 (then abort resolution)
78 we abort resolution and
79 -> SITE_WAIT on timeout or resolution failure
80 SITE_SENTMSG1
81 -> SITE_SENTMSG2 upon valid incoming message 1 from higher priority end
82 -> SITE_SENTMSG3 upon valid incoming message 2
83 -> SITE_WAIT on timeout
84 SITE_SENTMSG2
85 -> SITE_SENTMSG4 upon valid incoming message 3
86 -> SITE_WAIT on timeout
87 SITE_SENTMSG3
88 -> SITE_SENTMSG5 upon valid incoming message 4
89 -> SITE_WAIT on timeout
90 SITE_SENTMSG4
91 -> SITE_RUN upon valid incoming message 5
92 -> SITE_WAIT on timeout
93 SITE_SENTMSG5
94 -> SITE_RUN upon valid incoming message 6
95 -> SITE_WAIT on timeout
96 SITE_WAIT - failed to establish key; do nothing for a while
97 -> SITE_RUN on timeout
98 */
99
100 #define SITE_STOP 0
101 #define SITE_RUN 1
102 #define SITE_RESOLVE 2
103 #define SITE_SENTMSG1 3
104 #define SITE_SENTMSG2 4
105 #define SITE_SENTMSG3 5
106 #define SITE_SENTMSG4 6
107 #define SITE_SENTMSG5 7
108 #define SITE_WAIT 8
109
110 int32_t site_max_start_pad = 4*4;
111
112 static cstring_t state_name(uint32_t state)
113 {
114 switch (state) {
115 case 0: return "STOP";
116 case 1: return "RUN";
117 case 2: return "RESOLVE";
118 case 3: return "SENTMSG1";
119 case 4: return "SENTMSG2";
120 case 5: return "SENTMSG3";
121 case 6: return "SENTMSG4";
122 case 7: return "SENTMSG5";
123 case 8: return "WAIT";
124 default: return "*bad state*";
125 }
126 }
127
128 #define NONCELEN 8
129
130 #define LOG_UNEXPECTED 0x00000001
131 #define LOG_SETUP_INIT 0x00000002
132 #define LOG_SETUP_TIMEOUT 0x00000004
133 #define LOG_ACTIVATE_KEY 0x00000008
134 #define LOG_TIMEOUT_KEY 0x00000010
135 #define LOG_SEC 0x00000020
136 #define LOG_STATE 0x00000040
137 #define LOG_DROP 0x00000080
138 #define LOG_DUMP 0x00000100
139 #define LOG_ERROR 0x00000400
140 #define LOG_PEER_ADDRS 0x00000800
141
142 static struct flagstr log_event_table[]={
143 { "unexpected", LOG_UNEXPECTED },
144 { "setup-init", LOG_SETUP_INIT },
145 { "setup-timeout", LOG_SETUP_TIMEOUT },
146 { "activate-key", LOG_ACTIVATE_KEY },
147 { "timeout-key", LOG_TIMEOUT_KEY },
148 { "security", LOG_SEC },
149 { "state-change", LOG_STATE },
150 { "packet-drop", LOG_DROP },
151 { "dump-packets", LOG_DUMP },
152 { "errors", LOG_ERROR },
153 { "peer-addrs", LOG_PEER_ADDRS },
154 { "default", LOG_SETUP_INIT|LOG_SETUP_TIMEOUT|
155 LOG_ACTIVATE_KEY|LOG_TIMEOUT_KEY|LOG_SEC|LOG_ERROR },
156 { "all", 0xffffffff },
157 { NULL, 0 }
158 };
159
160
161 /***** TRANSPORT PEERS declarations *****/
162
163 /* Details of "mobile peer" semantics:
164
165 - We use the same data structure for the different configurations,
166 but manage it with different algorithms.
167
168 - We record up to mobile_peers_max peer address/port numbers
169 ("peers") for key setup, and separately up to mobile_peers_max
170 for data transfer.
171
172 - In general, we make a new set of addrs (see below) when we start
173 a new key exchange; the key setup addrs become the data transport
174 addrs when key setup complets.
175
176 If our peer is mobile:
177
178 - We send to all recent addresses of incoming packets, plus
179 initially all configured addresses (which we also expire).
180
181 - So, we record addrs of good incoming packets, as follows:
182 1. expire any peers last seen >120s ("mobile-peer-expiry") ago
183 2. add the peer of the just received packet to the applicable list
184 (possibly evicting the oldest entries to make room)
185 NB that we do not expire peers until an incoming packet arrives.
186
187 - If the peer has a configured address or name, we record them the
188 same way, but only as a result of our own initiation of key
189 setup. (We might evict some incoming packet addrs to make room.)
190
191 - The default number of addrs to keep is 3, or 4 if we have a
192 configured name or address. That's space for two configured
193 addresses (one IPv6 and one IPv4), plus two received addresses.
194
195 - Outgoing packets are sent to every recorded address in the
196 applicable list. Any unsupported[1] addresses are deleted from
197 the list right away. (This should only happen to configured
198 addresses, of course, but there is no need to check that.)
199
200 - When we successfully complete a key setup, we merge the key setup
201 peers into the data transfer peers.
202
203 [1] An unsupported address is one for whose AF we don't have a
204 socket (perhaps because we got EAFNOSUPPORT or some such) or for
205 which sendto gives ENETUNREACH.
206
207 If neither end is mobile:
208
209 - When peer initiated the key exchange, we use the incoming packet
210 address.
211
212 - When we initiate the key exchange, we try configured addresses
213 until we get one which isn't unsupported then fixate on that.
214
215 - When we complete a key setup, we replace the data transport peers
216 with those from the key setup.
217
218 If we are mobile:
219
220 - We can't tell when local network setup changes so we can't cache
221 the unsupported addrs and completely remove the spurious calls to
222 sendto, but we can optimise things a bit by deprioritising addrs
223 which seem to be unsupported.
224
225 - Use only configured addresses. (Except, that if our peer
226 initiated a key exchange we use the incoming packet address until
227 our name resolution completes.)
228
229 - When we send a packet, try each address in turn; if addr
230 supported, put that address to the end of the list for future
231 packets, and go onto the next address.
232
233 - When we complete a key setup, we replace the data transport peers
234 with those from the key setup.
235
236 */
237
238 typedef struct {
239 struct timeval last;
240 struct comm_addr addr;
241 } transport_peer;
242
243 typedef struct {
244 /* configuration information */
245 /* runtime information */
246 int npeers;
247 transport_peer peers[MAX_PEER_ADDRS];
248 } transport_peers;
249
250 /* Basic operations on transport peer address sets */
251 static void transport_peers_clear(struct site *st, transport_peers *peers);
252 static int transport_peers_valid(transport_peers *peers);
253 static void transport_peers_copy(struct site *st, transport_peers *dst,
254 const transport_peers *src);
255
256 /* Record address of incoming setup packet; resp. data packet. */
257 static void transport_setup_msgok(struct site *st, const struct comm_addr *a);
258 static void transport_data_msgok(struct site *st, const struct comm_addr *a);
259
260 /* Initialise the setup addresses. Called before we send the first
261 * packet in a key exchange. If we are the initiator, as a result of
262 * resolve completing (or being determined not to be relevant) or an
263 * incoming PROD; if we are the responder, as a result of the MSG1. */
264 static bool_t transport_compute_setupinit_peers(struct site *st,
265 const struct comm_addr *configured_addrs /* 0 if none or not found */,
266 int n_configured_addrs /* 0 if none or not found */,
267 const struct comm_addr *incoming_packet_addr /* 0 if none */);
268
269 /* Called if we are the responder in a key setup, when the resolve
270 * completes. transport_compute_setupinit_peers will hvae been called
271 * earlier. If _complete is called, we are still doing the key setup
272 * (and we should use the new values for both the rest of the key
273 * setup and the ongoing data exchange); if _tardy is called, the key
274 * setup is done (either completed or not) and only the data peers are
275 * relevant */
276 static void transport_resolve_complete(struct site *st,
277 const struct comm_addr *addrs, int naddrs);
278 static void transport_resolve_complete_tardy(struct site *st,
279 const struct comm_addr *addrs, int naddrs);
280
281 static void transport_xmit(struct site *st, transport_peers *peers,
282 struct buffer_if *buf, bool_t candebug);
283
284 /***** END of transport peers declarations *****/
285
286
287 struct data_key {
288 struct transform_inst_if *transform;
289 uint64_t key_timeout; /* End of life of current key */
290 uint32_t remote_session_id;
291 };
292
293 struct site {
294 closure_t cl;
295 struct site_if ops;
296 /* configuration information */
297 string_t localname;
298 string_t remotename;
299 bool_t keepalive;
300 bool_t local_mobile, peer_mobile; /* Mobile client support */
301 int32_t transport_peers_max;
302 string_t tunname; /* localname<->remotename by default, used in logs */
303 cstring_t *addresses; /* DNS name or address(es) for bootstrapping, optional */
304 int remoteport; /* Port for bootstrapping, optional */
305 uint32_t mtu_target;
306 struct netlink_if *netlink;
307 struct comm_if **comms;
308 int ncomms;
309 struct resolver_if *resolver;
310 struct log_if *log;
311 struct random_if *random;
312 struct rsaprivkey_if *privkey;
313 struct rsapubkey_if *pubkey;
314 struct transform_if **transforms;
315 int ntransforms;
316 struct dh_if *dh;
317 struct hash_if *hash;
318
319 uint32_t index; /* Index of this site */
320 uint32_t local_capabilities;
321 int32_t setup_retries; /* How many times to send setup packets */
322 int32_t setup_retry_interval; /* Initial timeout for setup packets */
323 int32_t wait_timeout; /* How long to wait if setup unsuccessful */
324 int32_t mobile_peer_expiry; /* How long to remember 2ary addresses */
325 int32_t key_lifetime; /* How long a key lasts once set up */
326 int32_t key_renegotiate_time; /* If we see traffic (or a keepalive)
327 after this time, initiate a new
328 key exchange */
329
330 bool_t setup_priority; /* Do we have precedence if both sites emit
331 message 1 simultaneously? */
332 uint32_t log_events;
333
334 /* runtime information */
335 uint32_t state;
336 uint64_t now; /* Most recently seen time */
337 bool_t allow_send_prod;
338 int resolving_count;
339 int resolving_n_results_all;
340 int resolving_n_results_stored;
341 struct comm_addr resolving_results[MAX_PEER_ADDRS];
342
343 /* The currently established session */
344 struct data_key current;
345 struct data_key auxiliary_key;
346 bool_t auxiliary_is_new;
347 uint64_t renegotiate_key_time; /* When we can negotiate a new key */
348 uint64_t auxiliary_renegotiate_key_time;
349 transport_peers peers; /* Current address(es) of peer for data traffic */
350
351 /* The current key setup protocol exchange. We can only be
352 involved in one of these at a time. There's a potential for
353 denial of service here (the attacker keeps sending a setup
354 packet; we keep trying to continue the exchange, and have to
355 timeout before we can listen for another setup packet); perhaps
356 we should keep a list of 'bad' sources for setup packets. */
357 uint32_t remote_capabilities;
358 uint16_t remote_adv_mtu;
359 struct transform_if *chosen_transform;
360 uint32_t setup_session_id;
361 transport_peers setup_peers;
362 uint8_t localN[NONCELEN]; /* Nonces for key exchange */
363 uint8_t remoteN[NONCELEN];
364 struct buffer_if buffer; /* Current outgoing key exchange packet */
365 struct buffer_if scratch;
366 int32_t retries; /* Number of retries remaining */
367 uint64_t timeout; /* Timeout for current state */
368 uint8_t *dhsecret;
369 uint8_t *sharedsecret;
370 uint32_t sharedsecretlen, sharedsecretallocd;
371 struct transform_inst_if *new_transform; /* For key setup/verify */
372 };
373
374 static uint32_t event_log_priority(struct site *st, uint32_t event)
375 {
376 if (!(event&st->log_events))
377 return 0;
378 switch(event) {
379 case LOG_UNEXPECTED: return M_INFO;
380 case LOG_SETUP_INIT: return M_INFO;
381 case LOG_SETUP_TIMEOUT: return M_NOTICE;
382 case LOG_ACTIVATE_KEY: return M_INFO;
383 case LOG_TIMEOUT_KEY: return M_INFO;
384 case LOG_SEC: return M_SECURITY;
385 case LOG_STATE: return M_DEBUG;
386 case LOG_DROP: return M_DEBUG;
387 case LOG_DUMP: return M_DEBUG;
388 case LOG_ERROR: return M_ERR;
389 case LOG_PEER_ADDRS: return M_DEBUG;
390 default: return M_ERR;
391 }
392 }
393
394 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
395 FORMAT(printf,3,0);
396 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
397 {
398 uint32_t class;
399
400 class=event_log_priority(st, event);
401 if (class) {
402 slilog_part(st->log,class,"%s: ",st->tunname);
403 vslilog_part(st->log,class,msg,ap);
404 slilog_part(st->log,class,"\n");
405 }
406 }
407
408 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
409 FORMAT(printf,3,4);
410 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
411 {
412 va_list ap;
413 va_start(ap,msg);
414 vslog(st,event,msg,ap);
415 va_end(ap);
416 }
417
418 static void logtimeout(struct site *st, const char *fmt, ...)
419 FORMAT(printf,2,3);
420 static void logtimeout(struct site *st, const char *fmt, ...)
421 {
422 uint32_t class=event_log_priority(st,LOG_SETUP_TIMEOUT);
423 if (!class)
424 return;
425
426 va_list ap;
427 va_start(ap,fmt);
428
429 slilog_part(st->log,class,"%s: ",st->tunname);
430 vslilog_part(st->log,class,fmt,ap);
431
432 const char *delim;
433 int i;
434 for (i=0, delim=" (tried ";
435 i<st->setup_peers.npeers;
436 i++, delim=", ") {
437 transport_peer *peer=&st->setup_peers.peers[i];
438 const char *s=comm_addr_to_string(&peer->addr);
439 slilog_part(st->log,class,"%s%s",delim,s);
440 }
441
442 slilog_part(st->log,class,")\n");
443 va_end(ap);
444 }
445
446 static void set_link_quality(struct site *st);
447 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel);
448 static void delete_one_key(struct site *st, struct data_key *key,
449 const char *reason /* may be 0 meaning don't log*/,
450 const char *which /* ignored if !reasonn */,
451 uint32_t loglevel /* ignored if !reasonn */);
452 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
453 const struct comm_addr *prod_hint);
454 static void enter_state_run(struct site *st);
455 static bool_t enter_state_resolve(struct site *st);
456 static void decrement_resolving_count(struct site *st, int by);
457 static bool_t enter_new_state(struct site *st,uint32_t next);
458 static void enter_state_wait(struct site *st);
459 static void activate_new_key(struct site *st);
460
461 static bool_t is_transform_valid(struct transform_inst_if *transform)
462 {
463 return transform && transform->valid(transform->st);
464 }
465
466 static bool_t current_valid(struct site *st)
467 {
468 return is_transform_valid(st->current.transform);
469 }
470
471 #define DEFINE_CALL_TRANSFORM(fwdrev) \
472 static int call_transform_##fwdrev(struct site *st, \
473 struct transform_inst_if *transform, \
474 struct buffer_if *buf, \
475 const char **errmsg) \
476 { \
477 if (!is_transform_valid(transform)) { \
478 *errmsg="transform not set up"; \
479 return 1; \
480 } \
481 return transform->fwdrev(transform->st,buf,errmsg); \
482 }
483
484 DEFINE_CALL_TRANSFORM(forwards)
485 DEFINE_CALL_TRANSFORM(reverse)
486
487 static void dispose_transform(struct transform_inst_if **transform_var)
488 {
489 struct transform_inst_if *transform=*transform_var;
490 if (transform) {
491 transform->delkey(transform->st);
492 transform->destroy(transform->st);
493 }
494 *transform_var = 0;
495 }
496
497 #define CHECK_AVAIL(b,l) do { if ((b)->size<(l)) return False; } while(0)
498 #define CHECK_EMPTY(b) do { if ((b)->size!=0) return False; } while(0)
499 #define CHECK_TYPE(b,t) do { uint32_t type; \
500 CHECK_AVAIL((b),4); \
501 type=buf_unprepend_uint32((b)); \
502 if (type!=(t)) return False; } while(0)
503
504 static _Bool type_is_msg34(uint32_t type)
505 {
506 return
507 type == LABEL_MSG3 ||
508 type == LABEL_MSG3BIS ||
509 type == LABEL_MSG4;
510 }
511
512 struct parsedname {
513 int32_t len;
514 uint8_t *name;
515 struct buffer_if extrainfo;
516 };
517
518 struct msg {
519 uint8_t *hashstart;
520 uint32_t dest;
521 uint32_t source;
522 struct parsedname remote;
523 struct parsedname local;
524 uint32_t remote_capabilities;
525 uint16_t remote_mtu;
526 int capab_transformnum;
527 uint8_t *nR;
528 uint8_t *nL;
529 int32_t pklen;
530 char *pk;
531 int32_t hashlen;
532 int32_t siglen;
533 char *sig;
534 };
535
536 static void set_new_transform(struct site *st, char *pk)
537 {
538 /* Make room for the shared key */
539 st->sharedsecretlen=st->chosen_transform->keylen?:st->dh->ceil_len;
540 assert(st->sharedsecretlen);
541 if (st->sharedsecretlen > st->sharedsecretallocd) {
542 st->sharedsecretallocd=st->sharedsecretlen;
543 st->sharedsecret=safe_realloc_ary(st->sharedsecret,1,
544 st->sharedsecretallocd,
545 "site:sharedsecret");
546 }
547
548 /* Generate the shared key */
549 st->dh->makeshared(st->dh->st,st->dhsecret,st->dh->len,pk,
550 st->sharedsecret,st->sharedsecretlen);
551
552 /* Set up the transform */
553 struct transform_if *generator=st->chosen_transform;
554 struct transform_inst_if *generated=generator->create(generator->st);
555 generated->setkey(generated->st,st->sharedsecret,
556 st->sharedsecretlen,st->setup_priority);
557 dispose_transform(&st->new_transform);
558 st->new_transform=generated;
559
560 slog(st,LOG_SETUP_INIT,"key exchange negotiated transform"
561 " %d (capabilities ours=%#"PRIx32" theirs=%#"PRIx32")",
562 st->chosen_transform->capab_transformnum,
563 st->local_capabilities, st->remote_capabilities);
564 }
565
566 struct xinfoadd {
567 int32_t lenpos, afternul;
568 };
569 static void append_string_xinfo_start(struct buffer_if *buf,
570 struct xinfoadd *xia,
571 const char *str)
572 /* Helps construct one of the names with additional info as found
573 * in MSG1..4. Call this function first, then append all the
574 * desired extra info (not including the nul byte) to the buffer,
575 * then call append_string_xinfo_done. */
576 {
577 xia->lenpos = buf->size;
578 buf_append_string(buf,str);
579 buf_append_uint8(buf,0);
580 xia->afternul = buf->size;
581 }
582 static void append_string_xinfo_done(struct buffer_if *buf,
583 struct xinfoadd *xia)
584 {
585 /* we just need to adjust the string length */
586 if (buf->size == xia->afternul) {
587 /* no extra info, strip the nul too */
588 buf_unappend_uint8(buf);
589 } else {
590 put_uint16(buf->start+xia->lenpos, buf->size-(xia->lenpos+2));
591 }
592 }
593
594 /* Build any of msg1 to msg4. msg5 and msg6 are built from the inside
595 out using a transform of config data supplied by netlink */
596 static bool_t generate_msg(struct site *st, uint32_t type, cstring_t what)
597 {
598 void *hst;
599 uint8_t *hash;
600 string_t dhpub, sig;
601
602 st->retries=st->setup_retries;
603 BUF_ALLOC(&st->buffer,what);
604 buffer_init(&st->buffer,0);
605 buf_append_uint32(&st->buffer,
606 (type==LABEL_MSG1?0:st->setup_session_id));
607 buf_append_uint32(&st->buffer,st->index);
608 buf_append_uint32(&st->buffer,type);
609
610 struct xinfoadd xia;
611 append_string_xinfo_start(&st->buffer,&xia,st->localname);
612 if ((st->local_capabilities & CAPAB_EARLY) || (type != LABEL_MSG1)) {
613 buf_append_uint32(&st->buffer,st->local_capabilities);
614 }
615 if (type_is_msg34(type)) {
616 buf_append_uint16(&st->buffer,st->mtu_target);
617 }
618 append_string_xinfo_done(&st->buffer,&xia);
619
620 buf_append_string(&st->buffer,st->remotename);
621 BUF_ADD_OBJ(append,&st->buffer,st->localN);
622 if (type==LABEL_MSG1) return True;
623 BUF_ADD_OBJ(append,&st->buffer,st->remoteN);
624 if (type==LABEL_MSG2) return True;
625
626 if (hacky_par_mid_failnow()) return False;
627
628 if (type==LABEL_MSG3BIS)
629 buf_append_uint8(&st->buffer,st->chosen_transform->capab_transformnum);
630
631 dhpub=st->dh->makepublic(st->dh->st,st->dhsecret,st->dh->len);
632 buf_append_string(&st->buffer,dhpub);
633 free(dhpub);
634 hash=safe_malloc(st->hash->len, "generate_msg");
635 hst=st->hash->init();
636 st->hash->update(hst,st->buffer.start,st->buffer.size);
637 st->hash->final(hst,hash);
638 sig=st->privkey->sign(st->privkey->st,hash,st->hash->len);
639 buf_append_string(&st->buffer,sig);
640 free(sig);
641 free(hash);
642 return True;
643 }
644
645 static bool_t unpick_name(struct buffer_if *msg, struct parsedname *nm)
646 {
647 CHECK_AVAIL(msg,2);
648 nm->len=buf_unprepend_uint16(msg);
649 CHECK_AVAIL(msg,nm->len);
650 nm->name=buf_unprepend(msg,nm->len);
651 uint8_t *nul=memchr(nm->name,0,nm->len);
652 if (!nul) {
653 buffer_readonly_view(&nm->extrainfo,0,0);
654 } else {
655 buffer_readonly_view(&nm->extrainfo, nul+1, msg->start-(nul+1));
656 nm->len=nul-nm->name;
657 }
658 return True;
659 }
660
661 static bool_t unpick_msg(struct site *st, uint32_t type,
662 struct buffer_if *msg, struct msg *m)
663 {
664 m->capab_transformnum=-1;
665 m->hashstart=msg->start;
666 CHECK_AVAIL(msg,4);
667 m->dest=buf_unprepend_uint32(msg);
668 CHECK_AVAIL(msg,4);
669 m->source=buf_unprepend_uint32(msg);
670 CHECK_TYPE(msg,type);
671 if (!unpick_name(msg,&m->remote)) return False;
672 m->remote_capabilities=0;
673 m->remote_mtu=0;
674 if (m->remote.extrainfo.size) {
675 CHECK_AVAIL(&m->remote.extrainfo,4);
676 m->remote_capabilities=buf_unprepend_uint32(&m->remote.extrainfo);
677 }
678 if (type_is_msg34(type) && m->remote.extrainfo.size) {
679 CHECK_AVAIL(&m->remote.extrainfo,2);
680 m->remote_mtu=buf_unprepend_uint16(&m->remote.extrainfo);
681 }
682 if (!unpick_name(msg,&m->local)) return False;
683 if (type==LABEL_PROD) {
684 CHECK_EMPTY(msg);
685 return True;
686 }
687 CHECK_AVAIL(msg,NONCELEN);
688 m->nR=buf_unprepend(msg,NONCELEN);
689 if (type==LABEL_MSG1) {
690 CHECK_EMPTY(msg);
691 return True;
692 }
693 CHECK_AVAIL(msg,NONCELEN);
694 m->nL=buf_unprepend(msg,NONCELEN);
695 if (type==LABEL_MSG2) {
696 CHECK_EMPTY(msg);
697 return True;
698 }
699 if (type==LABEL_MSG3BIS) {
700 CHECK_AVAIL(msg,1);
701 m->capab_transformnum = buf_unprepend_uint8(msg);
702 } else {
703 m->capab_transformnum = CAPAB_TRANSFORMNUM_ANCIENT;
704 }
705 CHECK_AVAIL(msg,2);
706 m->pklen=buf_unprepend_uint16(msg);
707 CHECK_AVAIL(msg,m->pklen);
708 m->pk=buf_unprepend(msg,m->pklen);
709 m->hashlen=msg->start-m->hashstart;
710 CHECK_AVAIL(msg,2);
711 m->siglen=buf_unprepend_uint16(msg);
712 CHECK_AVAIL(msg,m->siglen);
713 m->sig=buf_unprepend(msg,m->siglen);
714 CHECK_EMPTY(msg);
715 return True;
716 }
717
718 static bool_t name_matches(const struct parsedname *nm, const char *expected)
719 {
720 int expected_len=strlen(expected);
721 return
722 nm->len == expected_len &&
723 !memcmp(nm->name, expected, expected_len);
724 }
725
726 static bool_t check_msg(struct site *st, uint32_t type, struct msg *m,
727 cstring_t *error)
728 {
729 if (type==LABEL_MSG1) return True;
730
731 /* Check that the site names and our nonce have been sent
732 back correctly, and then store our peer's nonce. */
733 if (!name_matches(&m->remote,st->remotename)) {
734 *error="wrong remote site name";
735 return False;
736 }
737 if (!name_matches(&m->local,st->localname)) {
738 *error="wrong local site name";
739 return False;
740 }
741 if (memcmp(m->nL,st->localN,NONCELEN)!=0) {
742 *error="wrong locally-generated nonce";
743 return False;
744 }
745 if (type==LABEL_MSG2) return True;
746 if (!consttime_memeq(m->nR,st->remoteN,NONCELEN)!=0) {
747 *error="wrong remotely-generated nonce";
748 return False;
749 }
750 /* MSG3 has complicated rules about capabilities, which are
751 * handled in process_msg3. */
752 if (type==LABEL_MSG3 || type==LABEL_MSG3BIS) return True;
753 if (m->remote_capabilities!=st->remote_capabilities) {
754 *error="remote capabilities changed";
755 return False;
756 }
757 if (type==LABEL_MSG4) return True;
758 *error="unknown message type";
759 return False;
760 }
761
762 static bool_t generate_msg1(struct site *st)
763 {
764 st->random->generate(st->random->st,NONCELEN,st->localN);
765 return generate_msg(st,LABEL_MSG1,"site:MSG1");
766 }
767
768 static bool_t process_msg1(struct site *st, struct buffer_if *msg1,
769 const struct comm_addr *src, struct msg *m)
770 {
771 /* We've already determined we're in an appropriate state to
772 process an incoming MSG1, and that the MSG1 has correct values
773 of A and B. */
774
775 st->setup_session_id=m->source;
776 st->remote_capabilities=m->remote_capabilities;
777 memcpy(st->remoteN,m->nR,NONCELEN);
778 return True;
779 }
780
781 static bool_t generate_msg2(struct site *st)
782 {
783 st->random->generate(st->random->st,NONCELEN,st->localN);
784 return generate_msg(st,LABEL_MSG2,"site:MSG2");
785 }
786
787 static bool_t process_msg2(struct site *st, struct buffer_if *msg2,
788 const struct comm_addr *src)
789 {
790 struct msg m;
791 cstring_t err;
792
793 if (!unpick_msg(st,LABEL_MSG2,msg2,&m)) return False;
794 if (!check_msg(st,LABEL_MSG2,&m,&err)) {
795 slog(st,LOG_SEC,"msg2: %s",err);
796 return False;
797 }
798 st->setup_session_id=m.source;
799 st->remote_capabilities=m.remote_capabilities;
800
801 /* Select the transform to use */
802
803 uint32_t remote_transforms = st->remote_capabilities & CAPAB_TRANSFORM_MASK;
804 if (!remote_transforms)
805 /* old secnets only had this one transform */
806 remote_transforms = 1UL << CAPAB_TRANSFORMNUM_ANCIENT;
807
808 struct transform_if *ti;
809 int i;
810 for (i=0; i<st->ntransforms; i++) {
811 ti=st->transforms[i];
812 if ((1UL << ti->capab_transformnum) & remote_transforms)
813 goto transform_found;
814 }
815 slog(st,LOG_ERROR,"no transforms in common"
816 " (us %#"PRIx32"; them: %#"PRIx32")",
817 st->local_capabilities & CAPAB_TRANSFORM_MASK,
818 remote_transforms);
819 return False;
820 transform_found:
821 st->chosen_transform=ti;
822
823 memcpy(st->remoteN,m.nR,NONCELEN);
824 return True;
825 }
826
827 static bool_t generate_msg3(struct site *st)
828 {
829 /* Now we have our nonce and their nonce. Think of a secret key,
830 and create message number 3. */
831 st->random->generate(st->random->st,st->dh->len,st->dhsecret);
832 return generate_msg(st,
833 (st->remote_capabilities & CAPAB_TRANSFORM_MASK
834 ? LABEL_MSG3BIS : LABEL_MSG3),
835 "site:MSG3");
836 }
837
838 static bool_t process_msg3_msg4(struct site *st, struct msg *m)
839 {
840 uint8_t *hash;
841 void *hst;
842
843 /* Check signature and store g^x mod m */
844 hash=safe_malloc(st->hash->len, "process_msg3_msg4");
845 hst=st->hash->init();
846 st->hash->update(hst,m->hashstart,m->hashlen);
847 st->hash->final(hst,hash);
848 /* Terminate signature with a '0' - cheating, but should be ok */
849 m->sig[m->siglen]=0;
850 if (!st->pubkey->check(st->pubkey->st,hash,st->hash->len,m->sig)) {
851 slog(st,LOG_SEC,"msg3/msg4 signature failed check!");
852 free(hash);
853 return False;
854 }
855 free(hash);
856
857 st->remote_adv_mtu=m->remote_mtu;
858
859 return True;
860 }
861
862 static bool_t process_msg3(struct site *st, struct buffer_if *msg3,
863 const struct comm_addr *src, uint32_t msgtype)
864 {
865 struct msg m;
866 cstring_t err;
867
868 assert(msgtype==LABEL_MSG3 || msgtype==LABEL_MSG3BIS);
869
870 if (!unpick_msg(st,msgtype,msg3,&m)) return False;
871 if (!check_msg(st,msgtype,&m,&err)) {
872 slog(st,LOG_SEC,"msg3: %s",err);
873 return False;
874 }
875 uint32_t capab_adv_late = m.remote_capabilities
876 & ~st->remote_capabilities & CAPAB_EARLY;
877 if (capab_adv_late) {
878 slog(st,LOG_SEC,"msg3 impermissibly adds early capability flag(s)"
879 " %#"PRIx32" (was %#"PRIx32", now %#"PRIx32")",
880 capab_adv_late, st->remote_capabilities, m.remote_capabilities);
881 return False;
882 }
883 st->remote_capabilities|=m.remote_capabilities;
884
885 struct transform_if *ti;
886 int i;
887 for (i=0; i<st->ntransforms; i++) {
888 ti=st->transforms[i];
889 if (ti->capab_transformnum == m.capab_transformnum)
890 goto transform_found;
891 }
892 slog(st,LOG_SEC,"peer chose unknown-to-us transform %d!",
893 m.capab_transformnum);
894 return False;
895 transform_found:
896 st->chosen_transform=ti;
897
898 if (!process_msg3_msg4(st,&m))
899 return False;
900
901 /* Terminate their DH public key with a '0' */
902 m.pk[m.pklen]=0;
903 /* Invent our DH secret key */
904 st->random->generate(st->random->st,st->dh->len,st->dhsecret);
905
906 /* Generate the shared key and set up the transform */
907 set_new_transform(st,m.pk);
908
909 return True;
910 }
911
912 static bool_t generate_msg4(struct site *st)
913 {
914 /* We have both nonces, their public key and our private key. Generate
915 our public key, sign it and send it to them. */
916 return generate_msg(st,LABEL_MSG4,"site:MSG4");
917 }
918
919 static bool_t process_msg4(struct site *st, struct buffer_if *msg4,
920 const struct comm_addr *src)
921 {
922 struct msg m;
923 cstring_t err;
924
925 if (!unpick_msg(st,LABEL_MSG4,msg4,&m)) return False;
926 if (!check_msg(st,LABEL_MSG4,&m,&err)) {
927 slog(st,LOG_SEC,"msg4: %s",err);
928 return False;
929 }
930
931 if (!process_msg3_msg4(st,&m))
932 return False;
933
934 /* Terminate their DH public key with a '0' */
935 m.pk[m.pklen]=0;
936
937 /* Generate the shared key and set up the transform */
938 set_new_transform(st,m.pk);
939
940 return True;
941 }
942
943 struct msg0 {
944 uint32_t dest;
945 uint32_t source;
946 uint32_t type;
947 };
948
949 static bool_t unpick_msg0(struct site *st, struct buffer_if *msg0,
950 struct msg0 *m)
951 {
952 CHECK_AVAIL(msg0,4);
953 m->dest=buf_unprepend_uint32(msg0);
954 CHECK_AVAIL(msg0,4);
955 m->source=buf_unprepend_uint32(msg0);
956 CHECK_AVAIL(msg0,4);
957 m->type=buf_unprepend_uint32(msg0);
958 return True;
959 /* Leaves transformed part of buffer untouched */
960 }
961
962 static bool_t generate_msg5(struct site *st)
963 {
964 cstring_t transform_err;
965
966 BUF_ALLOC(&st->buffer,"site:MSG5");
967 /* We are going to add four words to the message */
968 buffer_init(&st->buffer,calculate_max_start_pad());
969 /* Give the netlink code an opportunity to put its own stuff in the
970 message (configuration information, etc.) */
971 buf_prepend_uint32(&st->buffer,LABEL_MSG5);
972 if (call_transform_forwards(st,st->new_transform,
973 &st->buffer,&transform_err))
974 return False;
975 buf_prepend_uint32(&st->buffer,LABEL_MSG5);
976 buf_prepend_uint32(&st->buffer,st->index);
977 buf_prepend_uint32(&st->buffer,st->setup_session_id);
978
979 st->retries=st->setup_retries;
980 return True;
981 }
982
983 static bool_t process_msg5(struct site *st, struct buffer_if *msg5,
984 const struct comm_addr *src,
985 struct transform_inst_if *transform)
986 {
987 struct msg0 m;
988 cstring_t transform_err;
989
990 if (!unpick_msg0(st,msg5,&m)) return False;
991
992 if (call_transform_reverse(st,transform,msg5,&transform_err)) {
993 /* There's a problem */
994 slog(st,LOG_SEC,"process_msg5: transform: %s",transform_err);
995 return False;
996 }
997 /* Buffer should now contain untransformed PING packet data */
998 CHECK_AVAIL(msg5,4);
999 if (buf_unprepend_uint32(msg5)!=LABEL_MSG5) {
1000 slog(st,LOG_SEC,"MSG5/PING packet contained wrong label");
1001 return False;
1002 }
1003 /* Older versions of secnet used to write some config data here
1004 * which we ignore. So we don't CHECK_EMPTY */
1005 return True;
1006 }
1007
1008 static void create_msg6(struct site *st, struct transform_inst_if *transform,
1009 uint32_t session_id)
1010 {
1011 cstring_t transform_err;
1012
1013 BUF_ALLOC(&st->buffer,"site:MSG6");
1014 /* We are going to add four words to the message */
1015 buffer_init(&st->buffer,calculate_max_start_pad());
1016 /* Give the netlink code an opportunity to put its own stuff in the
1017 message (configuration information, etc.) */
1018 buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1019 int problem = call_transform_forwards(st,transform,
1020 &st->buffer,&transform_err);
1021 assert(!problem);
1022 buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1023 buf_prepend_uint32(&st->buffer,st->index);
1024 buf_prepend_uint32(&st->buffer,session_id);
1025 }
1026
1027 static bool_t generate_msg6(struct site *st)
1028 {
1029 if (!is_transform_valid(st->new_transform))
1030 return False;
1031 create_msg6(st,st->new_transform,st->setup_session_id);
1032 st->retries=1; /* Peer will retransmit MSG5 if this packet gets lost */
1033 return True;
1034 }
1035
1036 static bool_t process_msg6(struct site *st, struct buffer_if *msg6,
1037 const struct comm_addr *src)
1038 {
1039 struct msg0 m;
1040 cstring_t transform_err;
1041
1042 if (!unpick_msg0(st,msg6,&m)) return False;
1043
1044 if (call_transform_reverse(st,st->new_transform,msg6,&transform_err)) {
1045 /* There's a problem */
1046 slog(st,LOG_SEC,"process_msg6: transform: %s",transform_err);
1047 return False;
1048 }
1049 /* Buffer should now contain untransformed PING packet data */
1050 CHECK_AVAIL(msg6,4);
1051 if (buf_unprepend_uint32(msg6)!=LABEL_MSG6) {
1052 slog(st,LOG_SEC,"MSG6/PONG packet contained invalid data");
1053 return False;
1054 }
1055 /* Older versions of secnet used to write some config data here
1056 * which we ignore. So we don't CHECK_EMPTY */
1057 return True;
1058 }
1059
1060 static bool_t decrypt_msg0(struct site *st, struct buffer_if *msg0,
1061 const struct comm_addr *src)
1062 {
1063 cstring_t transform_err, auxkey_err, newkey_err="n/a";
1064 struct msg0 m;
1065 uint32_t problem;
1066
1067 if (!unpick_msg0(st,msg0,&m)) return False;
1068
1069 /* Keep a copy so we can try decrypting it with multiple keys */
1070 buffer_copy(&st->scratch, msg0);
1071
1072 problem = call_transform_reverse(st,st->current.transform,
1073 msg0,&transform_err);
1074 if (!problem) {
1075 if (!st->auxiliary_is_new)
1076 delete_one_key(st,&st->auxiliary_key,
1077 "peer has used new key","auxiliary key",LOG_SEC);
1078 return True;
1079 }
1080 if (problem==2)
1081 goto skew;
1082
1083 buffer_copy(msg0, &st->scratch);
1084 problem = call_transform_reverse(st,st->auxiliary_key.transform,
1085 msg0,&auxkey_err);
1086 if (problem==0) {
1087 slog(st,LOG_DROP,"processing packet which uses auxiliary key");
1088 if (st->auxiliary_is_new) {
1089 /* We previously timed out in state SENTMSG5 but it turns
1090 * out that our peer did in fact get our MSG5 and is
1091 * using the new key. So we should switch to it too. */
1092 /* This is a bit like activate_new_key. */
1093 struct data_key t;
1094 t=st->current;
1095 st->current=st->auxiliary_key;
1096 st->auxiliary_key=t;
1097
1098 delete_one_key(st,&st->auxiliary_key,"peer has used new key",
1099 "previous key",LOG_SEC);
1100 st->auxiliary_is_new=0;
1101 st->renegotiate_key_time=st->auxiliary_renegotiate_key_time;
1102 }
1103 return True;
1104 }
1105 if (problem==2)
1106 goto skew;
1107
1108 if (st->state==SITE_SENTMSG5) {
1109 buffer_copy(msg0, &st->scratch);
1110 problem = call_transform_reverse(st,st->new_transform,
1111 msg0,&newkey_err);
1112 if (!problem) {
1113 /* It looks like we didn't get the peer's MSG6 */
1114 /* This is like a cut-down enter_new_state(SITE_RUN) */
1115 slog(st,LOG_STATE,"will enter state RUN (MSG0 with new key)");
1116 BUF_FREE(&st->buffer);
1117 st->timeout=0;
1118 activate_new_key(st);
1119 return True; /* do process the data in this packet */
1120 }
1121 if (problem==2)
1122 goto skew;
1123 }
1124
1125 slog(st,LOG_SEC,"transform: %s (aux: %s, new: %s)",
1126 transform_err,auxkey_err,newkey_err);
1127 initiate_key_setup(st,"incoming message would not decrypt",0);
1128 send_nak(src,m.dest,m.source,m.type,msg0,"message would not decrypt");
1129 return False;
1130
1131 skew:
1132 slog(st,LOG_DROP,"transform: %s (merely skew)",transform_err);
1133 return False;
1134 }
1135
1136 static bool_t process_msg0(struct site *st, struct buffer_if *msg0,
1137 const struct comm_addr *src)
1138 {
1139 uint32_t type;
1140
1141 if (!decrypt_msg0(st,msg0,src))
1142 return False;
1143
1144 CHECK_AVAIL(msg0,4);
1145 type=buf_unprepend_uint32(msg0);
1146 switch(type) {
1147 case LABEL_MSG7:
1148 /* We must forget about the current session. */
1149 delete_keys(st,"request from peer",LOG_SEC);
1150 /* probably, the peer is shutting down, and this is going to fail,
1151 * but we need to be trying to bring the link up again */
1152 if (st->keepalive)
1153 initiate_key_setup(st,"peer requested key teardown",0);
1154 return True;
1155 case LABEL_MSG9:
1156 /* Deliver to netlink layer */
1157 st->netlink->deliver(st->netlink->st,msg0);
1158 transport_data_msgok(st,src);
1159 /* See whether we should start negotiating a new key */
1160 if (st->now > st->renegotiate_key_time)
1161 initiate_key_setup(st,"incoming packet in renegotiation window",0);
1162 return True;
1163 default:
1164 slog(st,LOG_SEC,"incoming encrypted message of type %08x "
1165 "(unknown)",type);
1166 break;
1167 }
1168 return False;
1169 }
1170
1171 static void dump_packet(struct site *st, struct buffer_if *buf,
1172 const struct comm_addr *addr, bool_t incoming,
1173 bool_t ok)
1174 {
1175 uint32_t dest=get_uint32(buf->start);
1176 uint32_t source=get_uint32(buf->start+4);
1177 uint32_t msgtype=get_uint32(buf->start+8);
1178
1179 if (st->log_events & LOG_DUMP)
1180 slilog(st->log,M_DEBUG,"%s: %s: %08x<-%08x: %08x: %s%s",
1181 st->tunname,incoming?"incoming":"outgoing",
1182 dest,source,msgtype,comm_addr_to_string(addr),
1183 ok?"":" - fail");
1184 }
1185
1186 static bool_t comm_addr_sendmsg(struct site *st,
1187 const struct comm_addr *dest,
1188 struct buffer_if *buf)
1189 {
1190 return dest->comm->sendmsg(dest->comm->st, buf, dest);
1191 }
1192
1193 static uint32_t site_status(void *st)
1194 {
1195 return 0;
1196 }
1197
1198 static bool_t send_msg(struct site *st)
1199 {
1200 if (st->retries>0) {
1201 transport_xmit(st, &st->setup_peers, &st->buffer, True);
1202 st->timeout=st->now+st->setup_retry_interval;
1203 st->retries--;
1204 return True;
1205 } else if (st->state==SITE_SENTMSG5) {
1206 logtimeout(st,"timed out sending MSG5, stashing new key");
1207 /* We stash the key we have produced, in case it turns out that
1208 * our peer did see our MSG5 after all and starts using it. */
1209 /* This is a bit like some of activate_new_key */
1210 struct transform_inst_if *t;
1211 t=st->auxiliary_key.transform;
1212 st->auxiliary_key.transform=st->new_transform;
1213 st->new_transform=t;
1214 dispose_transform(&st->new_transform);
1215
1216 st->auxiliary_is_new=1;
1217 st->auxiliary_key.key_timeout=st->now+st->key_lifetime;
1218 st->auxiliary_renegotiate_key_time=st->now+st->key_renegotiate_time;
1219 st->auxiliary_key.remote_session_id=st->setup_session_id;
1220
1221 enter_state_wait(st);
1222 return False;
1223 } else {
1224 logtimeout(st,"timed out sending key setup packet "
1225 "(in state %s)",state_name(st->state));
1226 enter_state_wait(st);
1227 return False;
1228 }
1229 }
1230
1231 static void site_resolve_callback(void *sst, const struct comm_addr *addrs,
1232 int stored_naddrs, int all_naddrs,
1233 const char *address, const char *failwhy)
1234 {
1235 struct site *st=sst;
1236
1237 if (!stored_naddrs) {
1238 slog(st,LOG_ERROR,"resolution of %s failed: %s",address,failwhy);
1239 } else {
1240 slog(st,LOG_PEER_ADDRS,"resolution of %s completed, %d addrs, eg: %s",
1241 address, all_naddrs, comm_addr_to_string(&addrs[0]));;
1242
1243 int space=st->transport_peers_max-st->resolving_n_results_stored;
1244 int n_tocopy=MIN(stored_naddrs,space);
1245 COPY_ARRAY(st->resolving_results + st->resolving_n_results_stored,
1246 addrs,
1247 n_tocopy);
1248 st->resolving_n_results_stored += n_tocopy;
1249 st->resolving_n_results_all += all_naddrs;
1250 }
1251
1252 decrement_resolving_count(st,1);
1253 }
1254
1255 static void decrement_resolving_count(struct site *st, int by)
1256 {
1257 assert(st->resolving_count>0);
1258 st->resolving_count-=by;
1259
1260 if (st->resolving_count)
1261 return;
1262
1263 /* OK, we are done with them all. Handle combined results. */
1264
1265 const struct comm_addr *addrs=st->resolving_results;
1266 int naddrs=st->resolving_n_results_stored;
1267 assert(naddrs<=st->transport_peers_max);
1268
1269 if (naddrs) {
1270 if (naddrs != st->resolving_n_results_all) {
1271 slog(st,LOG_SETUP_INIT,"resolution of supplied addresses/names"
1272 " yielded too many results (%d > %d), some ignored",
1273 st->resolving_n_results_all, naddrs);
1274 }
1275 slog(st,LOG_STATE,"resolution completed, %d addrs, eg: %s",
1276 naddrs, iaddr_to_string(&addrs[0].ia));;
1277 }
1278
1279 switch (st->state) {
1280 case SITE_RESOLVE:
1281 if (transport_compute_setupinit_peers(st,addrs,naddrs,0)) {
1282 enter_new_state(st,SITE_SENTMSG1);
1283 } else {
1284 /* Can't figure out who to try to to talk to */
1285 slog(st,LOG_SETUP_INIT,
1286 "key exchange failed: cannot find peer address");
1287 enter_state_run(st);
1288 }
1289 break;
1290 case SITE_SENTMSG1: case SITE_SENTMSG2:
1291 case SITE_SENTMSG3: case SITE_SENTMSG4:
1292 case SITE_SENTMSG5:
1293 if (naddrs) {
1294 /* We start using the address immediately for data too.
1295 * It's best to store it in st->peers now because we might
1296 * go via SENTMSG5, WAIT, and a MSG0, straight into using
1297 * the new key (without updating the data peer addrs). */
1298 transport_resolve_complete(st,addrs,naddrs);
1299 } else if (st->local_mobile) {
1300 /* We can't let this rest because we may have a peer
1301 * address which will break in the future. */
1302 slog(st,LOG_SETUP_INIT,"resolution failed: "
1303 "abandoning key exchange");
1304 enter_state_wait(st);
1305 } else {
1306 slog(st,LOG_SETUP_INIT,"resolution failed: "
1307 " continuing to use source address of peer's packets"
1308 " for key exchange and ultimately data");
1309 }
1310 break;
1311 case SITE_RUN:
1312 if (naddrs) {
1313 slog(st,LOG_SETUP_INIT,"resolution completed tardily,"
1314 " updating peer address(es)");
1315 transport_resolve_complete_tardy(st,addrs,naddrs);
1316 } else if (st->local_mobile) {
1317 /* Not very good. We should queue (another) renegotiation
1318 * so that we can update the peer address. */
1319 st->key_renegotiate_time=st->now+st->wait_timeout;
1320 } else {
1321 slog(st,LOG_SETUP_INIT,"resolution failed: "
1322 " continuing to use source address of peer's packets");
1323 }
1324 break;
1325 case SITE_WAIT:
1326 case SITE_STOP:
1327 /* oh well */
1328 break;
1329 }
1330 }
1331
1332 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
1333 const struct comm_addr *prod_hint)
1334 {
1335 /* Reentrancy hazard: can call enter_new_state/enter_state_* */
1336 if (st->state!=SITE_RUN) return False;
1337 slog(st,LOG_SETUP_INIT,"initiating key exchange (%s)",reason);
1338 if (st->addresses) {
1339 slog(st,LOG_SETUP_INIT,"resolving peer address(es)");
1340 return enter_state_resolve(st);
1341 } else if (transport_compute_setupinit_peers(st,0,0,prod_hint)) {
1342 return enter_new_state(st,SITE_SENTMSG1);
1343 }
1344 slog(st,LOG_SETUP_INIT,"key exchange failed: no address for peer");
1345 return False;
1346 }
1347
1348 static void activate_new_key(struct site *st)
1349 {
1350 struct transform_inst_if *t;
1351
1352 /* We have three transform instances, which we swap between old,
1353 active and setup */
1354 t=st->auxiliary_key.transform;
1355 st->auxiliary_key.transform=st->current.transform;
1356 st->current.transform=st->new_transform;
1357 st->new_transform=t;
1358 dispose_transform(&st->new_transform);
1359
1360 st->timeout=0;
1361 st->auxiliary_is_new=0;
1362 st->auxiliary_key.key_timeout=st->current.key_timeout;
1363 st->current.key_timeout=st->now+st->key_lifetime;
1364 st->renegotiate_key_time=st->now+st->key_renegotiate_time;
1365 transport_peers_copy(st,&st->peers,&st->setup_peers);
1366 st->current.remote_session_id=st->setup_session_id;
1367
1368 /* Compute the inter-site MTU. This is min( our_mtu, their_mtu ).
1369 * But their mtu be unspecified, in which case we just use ours. */
1370 uint32_t intersite_mtu=
1371 MIN(st->mtu_target, st->remote_adv_mtu ?: ~(uint32_t)0);
1372 st->netlink->set_mtu(st->netlink->st,intersite_mtu);
1373
1374 slog(st,LOG_ACTIVATE_KEY,"new key activated"
1375 " (mtu ours=%"PRId32" theirs=%"PRId32" intersite=%"PRId32")",
1376 st->mtu_target, st->remote_adv_mtu, intersite_mtu);
1377 enter_state_run(st);
1378 }
1379
1380 static void delete_one_key(struct site *st, struct data_key *key,
1381 cstring_t reason, cstring_t which, uint32_t loglevel)
1382 {
1383 if (!is_transform_valid(key->transform)) return;
1384 if (reason) slog(st,loglevel,"%s deleted (%s)",which,reason);
1385 dispose_transform(&key->transform);
1386 key->key_timeout=0;
1387 }
1388
1389 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel)
1390 {
1391 if (current_valid(st)) {
1392 slog(st,loglevel,"session closed (%s)",reason);
1393
1394 delete_one_key(st,&st->current,0,0,0);
1395 set_link_quality(st);
1396 }
1397 delete_one_key(st,&st->auxiliary_key,0,0,0);
1398 }
1399
1400 static void state_assert(struct site *st, bool_t ok)
1401 {
1402 if (!ok) fatal("site:state_assert");
1403 }
1404
1405 static void enter_state_stop(struct site *st)
1406 {
1407 st->state=SITE_STOP;
1408 st->timeout=0;
1409 delete_keys(st,"entering state STOP",LOG_TIMEOUT_KEY);
1410 dispose_transform(&st->new_transform);
1411 }
1412
1413 static void set_link_quality(struct site *st)
1414 {
1415 uint32_t quality;
1416 if (current_valid(st))
1417 quality=LINK_QUALITY_UP;
1418 else if (st->state==SITE_WAIT || st->state==SITE_STOP)
1419 quality=LINK_QUALITY_DOWN;
1420 else if (st->addresses)
1421 quality=LINK_QUALITY_DOWN_CURRENT_ADDRESS;
1422 else if (transport_peers_valid(&st->peers))
1423 quality=LINK_QUALITY_DOWN_STALE_ADDRESS;
1424 else
1425 quality=LINK_QUALITY_DOWN;
1426
1427 st->netlink->set_quality(st->netlink->st,quality);
1428 }
1429
1430 static void enter_state_run(struct site *st)
1431 {
1432 slog(st,LOG_STATE,"entering state RUN");
1433 st->state=SITE_RUN;
1434 st->timeout=0;
1435
1436 st->setup_session_id=0;
1437 transport_peers_clear(st,&st->setup_peers);
1438 FILLZERO(st->localN);
1439 FILLZERO(st->remoteN);
1440 dispose_transform(&st->new_transform);
1441 memset(st->dhsecret,0,st->dh->len);
1442 memset(st->sharedsecret,0,st->sharedsecretlen);
1443 set_link_quality(st);
1444
1445 if (st->keepalive && !current_valid(st))
1446 initiate_key_setup(st, "keepalive", 0);
1447 }
1448
1449 static bool_t ensure_resolving(struct site *st)
1450 {
1451 /* Reentrancy hazard: may call site_resolve_callback and hence
1452 * enter_new_state, enter_state_* and generate_msg*. */
1453 if (st->resolving_count)
1454 return True;
1455
1456 assert(st->addresses);
1457
1458 /* resolver->request might reentrantly call site_resolve_callback
1459 * which will decrement st->resolving, so we need to increment it
1460 * twice beforehand to prevent decrement from thinking we're
1461 * finished, and decrement it ourselves. Alternatively if
1462 * everything fails then there are no callbacks due and we simply
1463 * set it to 0 and return false.. */
1464 st->resolving_n_results_stored=0;
1465 st->resolving_n_results_all=0;
1466 st->resolving_count+=2;
1467 const char **addrp=st->addresses;
1468 const char *address;
1469 bool_t anyok=False;
1470 for (; (address=*addrp++); ) {
1471 bool_t ok = st->resolver->request(st->resolver->st,address,
1472 st->remoteport,st->comms[0],
1473 site_resolve_callback,st);
1474 if (ok)
1475 st->resolving_count++;
1476 anyok|=ok;
1477 }
1478 if (!anyok) {
1479 st->resolving_count=0;
1480 return False;
1481 }
1482 decrement_resolving_count(st,2);
1483 return True;
1484 }
1485
1486 static bool_t enter_state_resolve(struct site *st)
1487 {
1488 /* Reentrancy hazard! See ensure_resolving. */
1489 state_assert(st,st->state==SITE_RUN);
1490 slog(st,LOG_STATE,"entering state RESOLVE");
1491 st->state=SITE_RESOLVE;
1492 return ensure_resolving(st);
1493 }
1494
1495 static bool_t enter_new_state(struct site *st, uint32_t next)
1496 {
1497 bool_t (*gen)(struct site *st);
1498 int r;
1499
1500 slog(st,LOG_STATE,"entering state %s",state_name(next));
1501 switch(next) {
1502 case SITE_SENTMSG1:
1503 state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE);
1504 gen=generate_msg1;
1505 break;
1506 case SITE_SENTMSG2:
1507 state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1508 st->state==SITE_SENTMSG1 || st->state==SITE_WAIT);
1509 gen=generate_msg2;
1510 break;
1511 case SITE_SENTMSG3:
1512 state_assert(st,st->state==SITE_SENTMSG1);
1513 BUF_FREE(&st->buffer);
1514 gen=generate_msg3;
1515 break;
1516 case SITE_SENTMSG4:
1517 state_assert(st,st->state==SITE_SENTMSG2);
1518 BUF_FREE(&st->buffer);
1519 gen=generate_msg4;
1520 break;
1521 case SITE_SENTMSG5:
1522 state_assert(st,st->state==SITE_SENTMSG3);
1523 BUF_FREE(&st->buffer);
1524 gen=generate_msg5;
1525 break;
1526 case SITE_RUN:
1527 state_assert(st,st->state==SITE_SENTMSG4);
1528 BUF_FREE(&st->buffer);
1529 gen=generate_msg6;
1530 break;
1531 default:
1532 gen=NULL;
1533 fatal("enter_new_state(%s): invalid new state",state_name(next));
1534 break;
1535 }
1536
1537 if (hacky_par_start_failnow()) return False;
1538
1539 r= gen(st) && send_msg(st);
1540
1541 hacky_par_end(&r,
1542 st->setup_retries, st->setup_retry_interval,
1543 send_msg, st);
1544
1545 if (r) {
1546 st->state=next;
1547 if (next==SITE_RUN) {
1548 BUF_FREE(&st->buffer); /* Never reused */
1549 st->timeout=0; /* Never retransmit */
1550 activate_new_key(st);
1551 }
1552 return True;
1553 }
1554 slog(st,LOG_ERROR,"error entering state %s",state_name(next));
1555 st->buffer.free=False; /* Unconditionally use the buffer; it may be
1556 in either state, and enter_state_wait() will
1557 do a BUF_FREE() */
1558 enter_state_wait(st);
1559 return False;
1560 }
1561
1562 /* msg7 tells our peer that we're about to forget our key */
1563 static bool_t send_msg7(struct site *st, cstring_t reason)
1564 {
1565 cstring_t transform_err;
1566
1567 if (current_valid(st) && st->buffer.free
1568 && transport_peers_valid(&st->peers)) {
1569 BUF_ALLOC(&st->buffer,"site:MSG7");
1570 buffer_init(&st->buffer,calculate_max_start_pad());
1571 buf_append_uint32(&st->buffer,LABEL_MSG7);
1572 buf_append_string(&st->buffer,reason);
1573 if (call_transform_forwards(st, st->current.transform,
1574 &st->buffer, &transform_err))
1575 goto free_out;
1576 buf_prepend_uint32(&st->buffer,LABEL_MSG0);
1577 buf_prepend_uint32(&st->buffer,st->index);
1578 buf_prepend_uint32(&st->buffer,st->current.remote_session_id);
1579 transport_xmit(st,&st->peers,&st->buffer,True);
1580 BUF_FREE(&st->buffer);
1581 free_out:
1582 return True;
1583 }
1584 return False;
1585 }
1586
1587 /* We go into this state if our peer becomes uncommunicative. Similar to
1588 the "stop" state, we forget all session keys for a while, before
1589 re-entering the "run" state. */
1590 static void enter_state_wait(struct site *st)
1591 {
1592 slog(st,LOG_STATE,"entering state WAIT");
1593 st->timeout=st->now+st->wait_timeout;
1594 st->state=SITE_WAIT;
1595 set_link_quality(st);
1596 BUF_FREE(&st->buffer); /* will have had an outgoing packet in it */
1597 /* XXX Erase keys etc. */
1598 }
1599
1600 static void generate_prod(struct site *st, struct buffer_if *buf)
1601 {
1602 buffer_init(buf,0);
1603 buf_append_uint32(buf,0);
1604 buf_append_uint32(buf,0);
1605 buf_append_uint32(buf,LABEL_PROD);
1606 buf_append_string(buf,st->localname);
1607 buf_append_string(buf,st->remotename);
1608 }
1609
1610 static void generate_send_prod(struct site *st,
1611 const struct comm_addr *source)
1612 {
1613 if (!st->allow_send_prod) return; /* too soon */
1614 if (!(st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1615 st->state==SITE_WAIT)) return; /* we'd ignore peer's MSG1 */
1616
1617 slog(st,LOG_SETUP_INIT,"prodding peer for key exchange");
1618 st->allow_send_prod=0;
1619 generate_prod(st,&st->scratch);
1620 bool_t ok = comm_addr_sendmsg(st, source, &st->scratch);
1621 dump_packet(st,&st->scratch,source,False,ok);
1622 }
1623
1624 static inline void site_settimeout(uint64_t timeout, int *timeout_io)
1625 {
1626 if (timeout) {
1627 int64_t offset=timeout-*now;
1628 if (offset<0) offset=0;
1629 if (offset>INT_MAX) offset=INT_MAX;
1630 if (*timeout_io<0 || offset<*timeout_io)
1631 *timeout_io=offset;
1632 }
1633 }
1634
1635 static int site_beforepoll(void *sst, struct pollfd *fds, int *nfds_io,
1636 int *timeout_io)
1637 {
1638 struct site *st=sst;
1639
1640 BEFOREPOLL_WANT_FDS(0); /* We don't use any file descriptors */
1641 st->now=*now;
1642
1643 /* Work out when our next timeout is. The earlier of 'timeout' or
1644 'current.key_timeout'. A stored value of '0' indicates no timeout
1645 active. */
1646 site_settimeout(st->timeout, timeout_io);
1647 site_settimeout(st->current.key_timeout, timeout_io);
1648 site_settimeout(st->auxiliary_key.key_timeout, timeout_io);
1649
1650 return 0; /* success */
1651 }
1652
1653 static void check_expiry(struct site *st, struct data_key *key,
1654 const char *which)
1655 {
1656 if (key->key_timeout && *now>key->key_timeout) {
1657 delete_one_key(st,key,"maximum life exceeded",which,LOG_TIMEOUT_KEY);
1658 }
1659 }
1660
1661 /* NB site_afterpoll will be called before site_beforepoll is ever called */
1662 static void site_afterpoll(void *sst, struct pollfd *fds, int nfds)
1663 {
1664 struct site *st=sst;
1665
1666 st->now=*now;
1667 if (st->timeout && *now>st->timeout) {
1668 st->timeout=0;
1669 if (st->state>=SITE_SENTMSG1 && st->state<=SITE_SENTMSG5) {
1670 if (!hacky_par_start_failnow())
1671 send_msg(st);
1672 } else if (st->state==SITE_WAIT) {
1673 enter_state_run(st);
1674 } else {
1675 slog(st,LOG_ERROR,"site_afterpoll: unexpected timeout, state=%d",
1676 st->state);
1677 }
1678 }
1679 check_expiry(st,&st->current,"current key");
1680 check_expiry(st,&st->auxiliary_key,"auxiliary key");
1681 }
1682
1683 /* This function is called by the netlink device to deliver packets
1684 intended for the remote network. The packet is in "raw" wire
1685 format, but is guaranteed to be word-aligned. */
1686 static void site_outgoing(void *sst, struct buffer_if *buf)
1687 {
1688 struct site *st=sst;
1689 cstring_t transform_err;
1690
1691 if (st->state==SITE_STOP) {
1692 BUF_FREE(buf);
1693 return;
1694 }
1695
1696 st->allow_send_prod=1;
1697
1698 /* In all other states we consider delivering the packet if we have
1699 a valid key and a valid address to send it to. */
1700 if (current_valid(st) && transport_peers_valid(&st->peers)) {
1701 /* Transform it and send it */
1702 if (buf->size>0) {
1703 buf_prepend_uint32(buf,LABEL_MSG9);
1704 if (call_transform_forwards(st, st->current.transform,
1705 buf, &transform_err))
1706 goto free_out;
1707 buf_prepend_uint32(buf,LABEL_MSG0);
1708 buf_prepend_uint32(buf,st->index);
1709 buf_prepend_uint32(buf,st->current.remote_session_id);
1710 transport_xmit(st,&st->peers,buf,False);
1711 }
1712 free_out:
1713 BUF_FREE(buf);
1714 return;
1715 }
1716
1717 slog(st,LOG_DROP,"discarding outgoing packet of size %d",buf->size);
1718 BUF_FREE(buf);
1719 initiate_key_setup(st,"outgoing packet",0);
1720 }
1721
1722 static bool_t named_for_us(struct site *st, const struct buffer_if *buf_in,
1723 uint32_t type, struct msg *m)
1724 /* For packets which are identified by the local and remote names.
1725 * If it has our name and our peer's name in it it's for us. */
1726 {
1727 struct buffer_if buf[1];
1728 buffer_readonly_clone(buf,buf_in);
1729 return unpick_msg(st,type,buf,m)
1730 && name_matches(&m->remote,st->remotename)
1731 && name_matches(&m->local,st->localname);
1732 }
1733
1734 /* This function is called by the communication device to deliver
1735 packets from our peers.
1736 It should return True if the packet is recognised as being for
1737 this current site instance (and should therefore not be processed
1738 by other sites), even if the packet was otherwise ignored. */
1739 static bool_t site_incoming(void *sst, struct buffer_if *buf,
1740 const struct comm_addr *source)
1741 {
1742 struct site *st=sst;
1743
1744 if (buf->size < 12) return False;
1745
1746 uint32_t dest=get_uint32(buf->start);
1747 uint32_t msgtype=get_uint32(buf->start+8);
1748 struct msg named_msg;
1749
1750 if (msgtype==LABEL_MSG1) {
1751 if (!named_for_us(st,buf,msgtype,&named_msg))
1752 return False;
1753 /* It's a MSG1 addressed to us. Decide what to do about it. */
1754 dump_packet(st,buf,source,True,True);
1755 if (st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1756 st->state==SITE_WAIT) {
1757 /* We should definitely process it */
1758 transport_compute_setupinit_peers(st,0,0,source);
1759 if (process_msg1(st,buf,source,&named_msg)) {
1760 slog(st,LOG_SETUP_INIT,"key setup initiated by peer");
1761 bool_t entered=enter_new_state(st,SITE_SENTMSG2);
1762 if (entered && st->addresses && st->local_mobile)
1763 /* We must do this as the very last thing, because
1764 the resolver callback might reenter us. */
1765 ensure_resolving(st);
1766 } else {
1767 slog(st,LOG_ERROR,"failed to process incoming msg1");
1768 }
1769 BUF_FREE(buf);
1770 return True;
1771 } else if (st->state==SITE_SENTMSG1) {
1772 /* We've just sent a message 1! They may have crossed on
1773 the wire. If we have priority then we ignore the
1774 incoming one, otherwise we process it as usual. */
1775 if (st->setup_priority) {
1776 BUF_FREE(buf);
1777 slog(st,LOG_DUMP,"crossed msg1s; we are higher "
1778 "priority => ignore incoming msg1");
1779 return True;
1780 } else {
1781 slog(st,LOG_DUMP,"crossed msg1s; we are lower "
1782 "priority => use incoming msg1");
1783 if (process_msg1(st,buf,source,&named_msg)) {
1784 BUF_FREE(&st->buffer); /* Free our old message 1 */
1785 transport_setup_msgok(st,source);
1786 enter_new_state(st,SITE_SENTMSG2);
1787 } else {
1788 slog(st,LOG_ERROR,"failed to process an incoming "
1789 "crossed msg1 (we have low priority)");
1790 }
1791 BUF_FREE(buf);
1792 return True;
1793 }
1794 }
1795 /* The message 1 was received at an unexpected stage of the
1796 key setup. XXX POLICY - what do we do? */
1797 slog(st,LOG_UNEXPECTED,"unexpected incoming message 1");
1798 BUF_FREE(buf);
1799 return True;
1800 }
1801 if (msgtype==LABEL_PROD) {
1802 if (!named_for_us(st,buf,msgtype,&named_msg))
1803 return False;
1804 dump_packet(st,buf,source,True,True);
1805 if (st->state!=SITE_RUN) {
1806 slog(st,LOG_DROP,"ignoring PROD when not in state RUN");
1807 } else if (current_valid(st)) {
1808 slog(st,LOG_DROP,"ignoring PROD when we think we have a key");
1809 } else {
1810 initiate_key_setup(st,"peer sent PROD packet",source);
1811 }
1812 BUF_FREE(buf);
1813 return True;
1814 }
1815 if (dest==st->index) {
1816 /* Explicitly addressed to us */
1817 if (msgtype!=LABEL_MSG0) dump_packet(st,buf,source,True,True);
1818 switch (msgtype) {
1819 case LABEL_NAK:
1820 /* If the source is our current peer then initiate a key setup,
1821 because our peer's forgotten the key */
1822 if (get_uint32(buf->start+4)==st->current.remote_session_id) {
1823 bool_t initiated;
1824 initiated = initiate_key_setup(st,"received a NAK",source);
1825 if (!initiated) generate_send_prod(st,source);
1826 } else {
1827 slog(st,LOG_SEC,"bad incoming NAK");
1828 }
1829 break;
1830 case LABEL_MSG0:
1831 process_msg0(st,buf,source);
1832 break;
1833 case LABEL_MSG1:
1834 /* Setup packet: should not have been explicitly addressed
1835 to us */
1836 slog(st,LOG_SEC,"incoming explicitly addressed msg1");
1837 break;
1838 case LABEL_MSG2:
1839 /* Setup packet: expected only in state SENTMSG1 */
1840 if (st->state!=SITE_SENTMSG1) {
1841 slog(st,LOG_UNEXPECTED,"unexpected MSG2");
1842 } else if (process_msg2(st,buf,source)) {
1843 transport_setup_msgok(st,source);
1844 enter_new_state(st,SITE_SENTMSG3);
1845 } else {
1846 slog(st,LOG_SEC,"invalid MSG2");
1847 }
1848 break;
1849 case LABEL_MSG3:
1850 case LABEL_MSG3BIS:
1851 /* Setup packet: expected only in state SENTMSG2 */
1852 if (st->state!=SITE_SENTMSG2) {
1853 slog(st,LOG_UNEXPECTED,"unexpected MSG3");
1854 } else if (process_msg3(st,buf,source,msgtype)) {
1855 transport_setup_msgok(st,source);
1856 enter_new_state(st,SITE_SENTMSG4);
1857 } else {
1858 slog(st,LOG_SEC,"invalid MSG3");
1859 }
1860 break;
1861 case LABEL_MSG4:
1862 /* Setup packet: expected only in state SENTMSG3 */
1863 if (st->state!=SITE_SENTMSG3) {
1864 slog(st,LOG_UNEXPECTED,"unexpected MSG4");
1865 } else if (process_msg4(st,buf,source)) {
1866 transport_setup_msgok(st,source);
1867 enter_new_state(st,SITE_SENTMSG5);
1868 } else {
1869 slog(st,LOG_SEC,"invalid MSG4");
1870 }
1871 break;
1872 case LABEL_MSG5:
1873 /* Setup packet: expected only in state SENTMSG4 */
1874 /* (may turn up in state RUN if our return MSG6 was lost
1875 and the new key has already been activated. In that
1876 case we discard it. The peer will realise that we
1877 are using the new key when they see our data packets.
1878 Until then the peer's data packets to us get discarded. */
1879 if (st->state==SITE_SENTMSG4) {
1880 if (process_msg5(st,buf,source,st->new_transform)) {
1881 transport_setup_msgok(st,source);
1882 enter_new_state(st,SITE_RUN);
1883 } else {
1884 slog(st,LOG_SEC,"invalid MSG5");
1885 }
1886 } else if (st->state==SITE_RUN) {
1887 if (process_msg5(st,buf,source,st->current.transform)) {
1888 slog(st,LOG_DROP,"got MSG5, retransmitting MSG6");
1889 transport_setup_msgok(st,source);
1890 create_msg6(st,st->current.transform,
1891 st->current.remote_session_id);
1892 transport_xmit(st,&st->peers,&st->buffer,True);
1893 BUF_FREE(&st->buffer);
1894 } else {
1895 slog(st,LOG_SEC,"invalid MSG5 (in state RUN)");
1896 }
1897 } else {
1898 slog(st,LOG_UNEXPECTED,"unexpected MSG5");
1899 }
1900 break;
1901 case LABEL_MSG6:
1902 /* Setup packet: expected only in state SENTMSG5 */
1903 if (st->state!=SITE_SENTMSG5) {
1904 slog(st,LOG_UNEXPECTED,"unexpected MSG6");
1905 } else if (process_msg6(st,buf,source)) {
1906 BUF_FREE(&st->buffer); /* Free message 5 */
1907 transport_setup_msgok(st,source);
1908 activate_new_key(st);
1909 } else {
1910 slog(st,LOG_SEC,"invalid MSG6");
1911 }
1912 break;
1913 default:
1914 slog(st,LOG_SEC,"received message of unknown type 0x%08x",
1915 msgtype);
1916 break;
1917 }
1918 BUF_FREE(buf);
1919 return True;
1920 }
1921
1922 return False;
1923 }
1924
1925 static void site_control(void *vst, bool_t run)
1926 {
1927 struct site *st=vst;
1928 if (run) enter_state_run(st);
1929 else enter_state_stop(st);
1930 }
1931
1932 static void site_phase_hook(void *sst, uint32_t newphase)
1933 {
1934 struct site *st=sst;
1935
1936 /* The program is shutting down; tell our peer */
1937 send_msg7(st,"shutting down");
1938 }
1939
1940 static void site_childpersist_clearkeys(void *sst, uint32_t newphase)
1941 {
1942 struct site *st=sst;
1943 dispose_transform(&st->current.transform);
1944 dispose_transform(&st->auxiliary_key.transform);
1945 dispose_transform(&st->new_transform);
1946 /* Not much point overwiting the signing key, since we loaded it
1947 from disk, and it is only valid prospectively if at all,
1948 anyway. */
1949 /* XXX it would be best to overwrite the DH state, because that
1950 _is_ relevant to forward secrecy. However we have no
1951 convenient interface for doing that and in practice gmp has
1952 probably dribbled droppings all over the malloc arena. A good
1953 way to fix this would be to have a privsep child for asymmetric
1954 crypto operations, but that's a task for another day. */
1955 }
1956
1957 static list_t *site_apply(closure_t *self, struct cloc loc, dict_t *context,
1958 list_t *args)
1959 {
1960 static uint32_t index_sequence;
1961 struct site *st;
1962 item_t *item;
1963 dict_t *dict;
1964 int i;
1965
1966 NEW(st);
1967
1968 st->cl.description="site";
1969 st->cl.type=CL_SITE;
1970 st->cl.apply=NULL;
1971 st->cl.interface=&st->ops;
1972 st->ops.st=st;
1973 st->ops.control=site_control;
1974 st->ops.status=site_status;
1975
1976 /* First parameter must be a dict */
1977 item=list_elem(args,0);
1978 if (!item || item->type!=t_dict)
1979 cfgfatal(loc,"site","parameter must be a dictionary\n");
1980
1981 dict=item->data.dict;
1982 st->localname=dict_read_string(dict, "local-name", True, "site", loc);
1983 st->remotename=dict_read_string(dict, "name", True, "site", loc);
1984
1985 st->keepalive=dict_read_bool(dict,"keepalive",False,"site",loc,False);
1986
1987 st->peer_mobile=dict_read_bool(dict,"mobile",False,"site",loc,False);
1988 st->local_mobile=
1989 dict_read_bool(dict,"local-mobile",False,"site",loc,False);
1990
1991 /* Sanity check (which also allows the 'sites' file to include
1992 site() closures for all sites including our own): refuse to
1993 talk to ourselves */
1994 if (strcmp(st->localname,st->remotename)==0) {
1995 Message(M_DEBUG,"site %s: local-name==name -> ignoring this site\n",
1996 st->localname);
1997 if (st->peer_mobile != st->local_mobile)
1998 cfgfatal(loc,"site","site %s's peer-mobile=%d"
1999 " but our local-mobile=%d\n",
2000 st->localname, st->peer_mobile, st->local_mobile);
2001 free(st);
2002 return NULL;
2003 }
2004 if (st->peer_mobile && st->local_mobile) {
2005 Message(M_WARNING,"site %s: site is mobile but so are we"
2006 " -> ignoring this site\n", st->remotename);
2007 free(st);
2008 return NULL;
2009 }
2010
2011 assert(index_sequence < 0xffffffffUL);
2012 st->index = ++index_sequence;
2013 st->local_capabilities = 0;
2014 st->netlink=find_cl_if(dict,"link",CL_NETLINK,True,"site",loc);
2015
2016 #define GET_CLOSURE_LIST(dictkey,things,nthings,CL_TYPE) do{ \
2017 list_t *things##_cfg=dict_lookup(dict,dictkey); \
2018 if (!things##_cfg) \
2019 cfgfatal(loc,"site","closure list \"%s\" not found\n",dictkey); \
2020 st->nthings=list_length(things##_cfg); \
2021 NEW_ARY(st->things,st->nthings); \
2022 assert(st->nthings); \
2023 for (i=0; i<st->nthings; i++) { \
2024 item_t *item=list_elem(things##_cfg,i); \
2025 if (item->type!=t_closure) \
2026 cfgfatal(loc,"site","%s is not a closure\n",dictkey); \
2027 closure_t *cl=item->data.closure; \
2028 if (cl->type!=CL_TYPE) \
2029 cfgfatal(loc,"site","%s closure wrong type\n",dictkey); \
2030 st->things[i]=cl->interface; \
2031 } \
2032 }while(0)
2033
2034 GET_CLOSURE_LIST("comm",comms,ncomms,CL_COMM);
2035
2036 st->resolver=find_cl_if(dict,"resolver",CL_RESOLVER,True,"site",loc);
2037 st->log=find_cl_if(dict,"log",CL_LOG,True,"site",loc);
2038 st->random=find_cl_if(dict,"random",CL_RANDOMSRC,True,"site",loc);
2039
2040 st->privkey=find_cl_if(dict,"local-key",CL_RSAPRIVKEY,True,"site",loc);
2041 st->addresses=dict_read_string_array(dict,"address",False,"site",loc,0);
2042 if (st->addresses)
2043 st->remoteport=dict_read_number(dict,"port",True,"site",loc,0);
2044 else st->remoteport=0;
2045 st->pubkey=find_cl_if(dict,"key",CL_RSAPUBKEY,True,"site",loc);
2046
2047 GET_CLOSURE_LIST("transform",transforms,ntransforms,CL_TRANSFORM);
2048
2049 st->dh=find_cl_if(dict,"dh",CL_DH,True,"site",loc);
2050 st->hash=find_cl_if(dict,"hash",CL_HASH,True,"site",loc);
2051
2052 #define DEFAULT(D) (st->peer_mobile || st->local_mobile \
2053 ? DEFAULT_MOBILE_##D : DEFAULT_##D)
2054 #define CFG_NUMBER(k,D) dict_read_number(dict,(k),False,"site",loc,DEFAULT(D));
2055
2056 st->key_lifetime= CFG_NUMBER("key-lifetime", KEY_LIFETIME);
2057 st->setup_retries= CFG_NUMBER("setup-retries", SETUP_RETRIES);
2058 st->setup_retry_interval= CFG_NUMBER("setup-timeout", SETUP_RETRY_INTERVAL);
2059 st->wait_timeout= CFG_NUMBER("wait-time", WAIT_TIME);
2060 st->mtu_target= dict_read_number(dict,"mtu-target",False,"site",loc,0);
2061
2062 st->mobile_peer_expiry= dict_read_number(
2063 dict,"mobile-peer-expiry",False,"site",loc,DEFAULT_MOBILE_PEER_EXPIRY);
2064
2065 const char *peerskey= st->peer_mobile
2066 ? "mobile-peers-max" : "static-peers-max";
2067 st->transport_peers_max= dict_read_number(
2068 dict,peerskey,False,"site",loc, st->addresses ? 4 : 3);
2069 if (st->transport_peers_max<1 ||
2070 st->transport_peers_max>MAX_PEER_ADDRS) {
2071 cfgfatal(loc,"site", "%s must be in range 1.."
2072 STRING(MAX_PEER_ADDRS) "\n", peerskey);
2073 }
2074
2075 if (st->key_lifetime < DEFAULT(KEY_RENEGOTIATE_GAP)*2)
2076 st->key_renegotiate_time=st->key_lifetime/2;
2077 else
2078 st->key_renegotiate_time=st->key_lifetime-DEFAULT(KEY_RENEGOTIATE_GAP);
2079 st->key_renegotiate_time=dict_read_number(
2080 dict,"renegotiate-time",False,"site",loc,st->key_renegotiate_time);
2081 if (st->key_renegotiate_time > st->key_lifetime) {
2082 cfgfatal(loc,"site",
2083 "renegotiate-time must be less than key-lifetime\n");
2084 }
2085
2086 st->log_events=string_list_to_word(dict_lookup(dict,"log-events"),
2087 log_event_table,"site");
2088
2089 st->resolving_count=0;
2090 st->allow_send_prod=0;
2091
2092 st->tunname=safe_malloc(strlen(st->localname)+strlen(st->remotename)+5,
2093 "site_apply");
2094 sprintf(st->tunname,"%s<->%s",st->localname,st->remotename);
2095
2096 /* The information we expect to see in incoming messages of type 1 */
2097 /* fixme: lots of unchecked overflows here, but the results are only
2098 corrupted packets rather than undefined behaviour */
2099 st->setup_priority=(strcmp(st->localname,st->remotename)>0);
2100
2101 buffer_new(&st->buffer,SETUP_BUFFER_LEN);
2102
2103 buffer_new(&st->scratch,SETUP_BUFFER_LEN);
2104 BUF_ALLOC(&st->scratch,"site:scratch");
2105
2106 /* We are interested in poll(), but only for timeouts. We don't have
2107 any fds of our own. */
2108 register_for_poll(st, site_beforepoll, site_afterpoll, "site");
2109 st->timeout=0;
2110
2111 st->remote_capabilities=0;
2112 st->chosen_transform=0;
2113 st->current.key_timeout=0;
2114 st->auxiliary_key.key_timeout=0;
2115 transport_peers_clear(st,&st->peers);
2116 transport_peers_clear(st,&st->setup_peers);
2117 /* XXX mlock these */
2118 st->dhsecret=safe_malloc(st->dh->len,"site:dhsecret");
2119 st->sharedsecretlen=st->sharedsecretallocd=0;
2120 st->sharedsecret=0;
2121
2122 for (i=0; i<st->ntransforms; i++) {
2123 struct transform_if *ti=st->transforms[i];
2124 uint32_t capbit = 1UL << ti->capab_transformnum;
2125 if (st->local_capabilities & capbit)
2126 slog(st,LOG_ERROR,"transformnum capability bit"
2127 " %d (%#"PRIx32") reused", ti->capab_transformnum, capbit);
2128 st->local_capabilities |= capbit;
2129 }
2130
2131 /* We need to register the remote networks with the netlink device */
2132 uint32_t netlink_mtu; /* local virtual interface mtu */
2133 st->netlink->reg(st->netlink->st, site_outgoing, st, &netlink_mtu);
2134 if (!st->mtu_target)
2135 st->mtu_target=netlink_mtu;
2136
2137 for (i=0; i<st->ncomms; i++)
2138 st->comms[i]->request_notify(st->comms[i]->st, st, site_incoming);
2139
2140 st->current.transform=0;
2141 st->auxiliary_key.transform=0;
2142 st->new_transform=0;
2143 st->auxiliary_is_new=0;
2144
2145 enter_state_stop(st);
2146
2147 add_hook(PHASE_SHUTDOWN,site_phase_hook,st);
2148 add_hook(PHASE_CHILDPERSIST,site_childpersist_clearkeys,st);
2149
2150 return new_closure(&st->cl);
2151 }
2152
2153 void site_module(dict_t *dict)
2154 {
2155 add_closure(dict,"site",site_apply);
2156 }
2157
2158
2159 /***** TRANSPORT PEERS definitions *****/
2160
2161 static void transport_peers_debug(struct site *st, transport_peers *dst,
2162 const char *didwhat,
2163 int nargs, const struct comm_addr *args,
2164 size_t stride) {
2165 int i;
2166 char *argp;
2167
2168 if (!(st->log_events & LOG_PEER_ADDRS))
2169 return; /* an optimisation */
2170
2171 slog(st, LOG_PEER_ADDRS, "peers (%s) %s nargs=%d => npeers=%d",
2172 (dst==&st->peers ? "data" :
2173 dst==&st->setup_peers ? "setup" : "UNKNOWN"),
2174 didwhat, nargs, dst->npeers);
2175
2176 for (i=0, argp=(void*)args;
2177 i<nargs;
2178 i++, (argp+=stride?stride:sizeof(*args))) {
2179 const struct comm_addr *ca=(void*)argp;
2180 slog(st, LOG_PEER_ADDRS, " args: addrs[%d]=%s",
2181 i, comm_addr_to_string(ca));
2182 }
2183 for (i=0; i<dst->npeers; i++) {
2184 struct timeval diff;
2185 timersub(tv_now,&dst->peers[i].last,&diff);
2186 const struct comm_addr *ca=&dst->peers[i].addr;
2187 slog(st, LOG_PEER_ADDRS, " peers: addrs[%d]=%s T-%ld.%06ld",
2188 i, comm_addr_to_string(ca),
2189 (unsigned long)diff.tv_sec, (unsigned long)diff.tv_usec);
2190 }
2191 }
2192
2193 static void transport_peers_expire(struct site *st, transport_peers *peers) {
2194 /* peers must be sorted first */
2195 int previous_peers=peers->npeers;
2196 struct timeval oldest;
2197 oldest.tv_sec = tv_now->tv_sec - st->mobile_peer_expiry;
2198 oldest.tv_usec = tv_now->tv_usec;
2199 while (peers->npeers>1 &&
2200 timercmp(&peers->peers[peers->npeers-1].last, &oldest, <))
2201 peers->npeers--;
2202 if (peers->npeers != previous_peers)
2203 transport_peers_debug(st,peers,"expire", 0,0,0);
2204 }
2205
2206 static bool_t transport_peer_record_one(struct site *st, transport_peers *peers,
2207 const struct comm_addr *ca,
2208 const struct timeval *tv) {
2209 /* returns false if output is full */
2210 int search;
2211
2212 if (peers->npeers >= st->transport_peers_max)
2213 return 0;
2214
2215 for (search=0; search<peers->npeers; search++)
2216 if (comm_addr_equal(&peers->peers[search].addr, ca))
2217 return 1;
2218
2219 peers->peers[peers->npeers].addr = *ca;
2220 peers->peers[peers->npeers].last = *tv;
2221 peers->npeers++;
2222 return 1;
2223 }
2224
2225 static void transport_record_peers(struct site *st, transport_peers *peers,
2226 const struct comm_addr *addrs, int naddrs,
2227 const char *m) {
2228 /* We add addrs into peers. The new entries end up at the front
2229 * and displace entries towards the end (perhaps even off the
2230 * end). Any existing matching entries are moved up to the front.
2231 *
2232 * Caller must first call transport_peers_expire. */
2233
2234 if (naddrs==1 && peers->npeers>=1 &&
2235 comm_addr_equal(&addrs[0], &peers->peers[0].addr)) {
2236 /* optimisation, also avoids debug for trivial updates */
2237 peers->peers[0].last = *tv_now;
2238 return;
2239 }
2240
2241 int old_npeers=peers->npeers;
2242 transport_peer old_peers[old_npeers];
2243 COPY_ARRAY(old_peers,peers->peers,old_npeers);
2244
2245 peers->npeers=0;
2246 int i;
2247 for (i=0; i<naddrs; i++) {
2248 if (!transport_peer_record_one(st,peers, &addrs[i], tv_now))
2249 break;
2250 }
2251 for (i=0; i<old_npeers; i++) {
2252 const transport_peer *old=&old_peers[i];
2253 if (!transport_peer_record_one(st,peers, &old->addr, &old->last))
2254 break;
2255 }
2256
2257 transport_peers_debug(st,peers,m, naddrs,addrs,0);
2258 }
2259
2260 static void transport_expire_record_peers(struct site *st,
2261 transport_peers *peers,
2262 const struct comm_addr *addrs,
2263 int naddrs, const char *m) {
2264 /* Convenience function */
2265 transport_peers_expire(st,peers);
2266 transport_record_peers(st,peers,addrs,naddrs,m);
2267 }
2268
2269 static bool_t transport_compute_setupinit_peers(struct site *st,
2270 const struct comm_addr *configured_addrs /* 0 if none or not found */,
2271 int n_configured_addrs /* 0 if none or not found */,
2272 const struct comm_addr *incoming_packet_addr /* 0 if none */) {
2273 if (!n_configured_addrs && !incoming_packet_addr &&
2274 !transport_peers_valid(&st->peers))
2275 return False;
2276
2277 slog(st,LOG_SETUP_INIT,
2278 "using: %d configured addr(s);%s %d old peer addrs(es)",
2279 n_configured_addrs,
2280 incoming_packet_addr ? " incoming packet address;" : "",
2281 st->peers.npeers);
2282
2283 /* Non-mobile peers try addresses until one is plausible. The
2284 * effect is that this code always tries first the configured
2285 * address if supplied, or otherwise the address of the incoming
2286 * PROD, or finally the existing data peer if one exists; this is
2287 * as desired. */
2288
2289 transport_peers_copy(st,&st->setup_peers,&st->peers);
2290 transport_peers_expire(st,&st->setup_peers);
2291
2292 if (incoming_packet_addr)
2293 transport_record_peers(st,&st->setup_peers,
2294 incoming_packet_addr,1, "incoming");
2295
2296 if (n_configured_addrs)
2297 transport_record_peers(st,&st->setup_peers,
2298 configured_addrs,n_configured_addrs, "setupinit");
2299
2300 assert(transport_peers_valid(&st->setup_peers));
2301 return True;
2302 }
2303
2304 static void transport_setup_msgok(struct site *st, const struct comm_addr *a) {
2305 if (st->peer_mobile)
2306 transport_expire_record_peers(st,&st->setup_peers,a,1,"setupmsg");
2307 }
2308 static void transport_data_msgok(struct site *st, const struct comm_addr *a) {
2309 if (st->peer_mobile)
2310 transport_expire_record_peers(st,&st->peers,a,1,"datamsg");
2311 }
2312
2313 static int transport_peers_valid(transport_peers *peers) {
2314 return peers->npeers;
2315 }
2316 static void transport_peers_clear(struct site *st, transport_peers *peers) {
2317 peers->npeers= 0;
2318 transport_peers_debug(st,peers,"clear",0,0,0);
2319 }
2320 static void transport_peers_copy(struct site *st, transport_peers *dst,
2321 const transport_peers *src) {
2322 dst->npeers=src->npeers;
2323 COPY_ARRAY(dst->peers, src->peers, dst->npeers);
2324 transport_peers_debug(st,dst,"copy",
2325 src->npeers, &src->peers->addr, sizeof(*src->peers));
2326 }
2327
2328 static void transport_resolve_complete(struct site *st,
2329 const struct comm_addr *addrs,
2330 int naddrs) {
2331 transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2332 "resolved data");
2333 transport_expire_record_peers(st,&st->setup_peers,addrs,naddrs,
2334 "resolved setup");
2335 }
2336
2337 static void transport_resolve_complete_tardy(struct site *st,
2338 const struct comm_addr *addrs,
2339 int naddrs) {
2340 transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2341 "resolved tardily");
2342 }
2343
2344 static void transport_peers__copy_by_mask(transport_peer *out, int *nout_io,
2345 unsigned mask,
2346 const transport_peers *inp) {
2347 /* out and in->peers may be the same region, or nonoverlapping */
2348 const transport_peer *in=inp->peers;
2349 int slot;
2350 for (slot=0; slot<inp->npeers; slot++) {
2351 if (!(mask & (1U << slot)))
2352 continue;
2353 if (!(out==in && slot==*nout_io))
2354 COPY_OBJ(out[*nout_io], in[slot]);
2355 (*nout_io)++;
2356 }
2357 }
2358
2359 void transport_xmit(struct site *st, transport_peers *peers,
2360 struct buffer_if *buf, bool_t candebug) {
2361 int slot;
2362 transport_peers_expire(st, peers);
2363 unsigned failed=0; /* bitmask */
2364 assert(MAX_PEER_ADDRS < sizeof(unsigned)*CHAR_BIT);
2365
2366 int nfailed=0;
2367 for (slot=0; slot<peers->npeers; slot++) {
2368 transport_peer *peer=&peers->peers[slot];
2369 bool_t ok = comm_addr_sendmsg(st, &peer->addr, buf);
2370 if (candebug)
2371 dump_packet(st, buf, &peer->addr, False, ok);
2372 if (!ok) {
2373 failed |= 1U << slot;
2374 nfailed++;
2375 }
2376 if (ok && !st->peer_mobile)
2377 break;
2378 }
2379 /* Now we need to demote/delete failing addrs: if we are mobile we
2380 * merely demote them; otherwise we delete them. */
2381 if (st->local_mobile) {
2382 unsigned expected = ((1U << nfailed)-1) << (peers->npeers-nfailed);
2383 /* `expected' has all the failures at the end already */
2384 if (failed != expected) {
2385 int fslot=0;
2386 transport_peer failedpeers[nfailed];
2387 transport_peers__copy_by_mask(failedpeers, &fslot, failed,peers);
2388 assert(fslot == nfailed);
2389 int wslot=0;
2390 transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2391 assert(wslot+nfailed == peers->npeers);
2392 COPY_ARRAY(peers->peers+wslot, failedpeers, nfailed);
2393 transport_peers_debug(st,peers,"mobile failure reorder",0,0,0);
2394 }
2395 } else {
2396 if (failed && peers->npeers > 1) {
2397 int wslot=0;
2398 transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2399 peers->npeers=wslot;
2400 transport_peers_debug(st,peers,"non-mobile failure cleanup",0,0,0);
2401 }
2402 }
2403 }
2404
2405 /***** END of transport peers declarations *****/