site: Packet-level debugging notes errors from transmit.
[secnet] / site.c
1 /* site.c - manage communication with a remote network site */
2
3 /*
4 * This file is part of secnet.
5 * See README for full list of copyright holders.
6 *
7 * secnet is free software; you can redistribute it and/or modify it
8 * under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version d of the License, or
10 * (at your option) any later version.
11 *
12 * secnet is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * version 3 along with secnet; if not, see
19 * https://www.gnu.org/licenses/gpl.html.
20 */
21
22 /* The 'site' code doesn't know anything about the structure of the
23 packets it's transmitting. In fact, under the new netlink
24 configuration scheme it doesn't need to know anything at all about
25 IP addresses, except how to contact its peer. This means it could
26 potentially be used to tunnel other protocols too (IPv6, IPX, plain
27 old Ethernet frames) if appropriate netlink code can be written
28 (and that ought not to be too hard, eg. using the TUN/TAP device to
29 pretend to be an Ethernet interface). */
30
31 /* At some point in the future the netlink code will be asked for
32 configuration information to go in the PING/PONG packets at the end
33 of the key exchange. */
34
35 #include "secnet.h"
36 #include <stdio.h>
37 #include <string.h>
38 #include <limits.h>
39 #include <assert.h>
40 #include <sys/socket.h>
41
42 #include <sys/mman.h>
43 #include "util.h"
44 #include "unaligned.h"
45 #include "magic.h"
46
47 #define SETUP_BUFFER_LEN 2048
48
49 #define DEFAULT_KEY_LIFETIME (3600*1000) /* [ms] */
50 #define DEFAULT_KEY_RENEGOTIATE_GAP (5*60*1000) /* [ms] */
51 #define DEFAULT_SETUP_RETRIES 5
52 #define DEFAULT_SETUP_RETRY_INTERVAL (2*1000) /* [ms] */
53 #define DEFAULT_WAIT_TIME (20*1000) /* [ms] */
54
55 #define DEFAULT_MOBILE_KEY_LIFETIME (2*24*3600*1000) /* [ms] */
56 #define DEFAULT_MOBILE_KEY_RENEGOTIATE_GAP (12*3600*1000) /* [ms] */
57 #define DEFAULT_MOBILE_SETUP_RETRIES 30
58 #define DEFAULT_MOBILE_SETUP_RETRY_INTERVAL (1*1000) /* [ms] */
59 #define DEFAULT_MOBILE_WAIT_TIME (10*1000) /* [ms] */
60
61 #define DEFAULT_MOBILE_PEER_EXPIRY (2*60) /* [s] */
62
63 /* Each site can be in one of several possible states. */
64
65 /* States:
66 SITE_STOP - nothing is allowed to happen; tunnel is down;
67 all session keys have been erased
68 -> SITE_RUN upon external instruction
69 SITE_RUN - site up, maybe with valid key
70 -> SITE_RESOLVE upon outgoing packet and no valid key
71 we start name resolution for the other end of the tunnel
72 -> SITE_SENTMSG2 upon valid incoming message 1 and suitable time
73 we send an appropriate message 2
74 SITE_RESOLVE - waiting for name resolution
75 -> SITE_SENTMSG1 upon successful resolution
76 we send an appropriate message 1
77 -> SITE_SENTMSG2 upon valid incoming message 1 (then abort resolution)
78 we abort resolution and
79 -> SITE_WAIT on timeout or resolution failure
80 SITE_SENTMSG1
81 -> SITE_SENTMSG2 upon valid incoming message 1 from higher priority end
82 -> SITE_SENTMSG3 upon valid incoming message 2
83 -> SITE_WAIT on timeout
84 SITE_SENTMSG2
85 -> SITE_SENTMSG4 upon valid incoming message 3
86 -> SITE_WAIT on timeout
87 SITE_SENTMSG3
88 -> SITE_SENTMSG5 upon valid incoming message 4
89 -> SITE_WAIT on timeout
90 SITE_SENTMSG4
91 -> SITE_RUN upon valid incoming message 5
92 -> SITE_WAIT on timeout
93 SITE_SENTMSG5
94 -> SITE_RUN upon valid incoming message 6
95 -> SITE_WAIT on timeout
96 SITE_WAIT - failed to establish key; do nothing for a while
97 -> SITE_RUN on timeout
98 */
99
100 #define SITE_STOP 0
101 #define SITE_RUN 1
102 #define SITE_RESOLVE 2
103 #define SITE_SENTMSG1 3
104 #define SITE_SENTMSG2 4
105 #define SITE_SENTMSG3 5
106 #define SITE_SENTMSG4 6
107 #define SITE_SENTMSG5 7
108 #define SITE_WAIT 8
109
110 int32_t site_max_start_pad = 4*4;
111
112 static cstring_t state_name(uint32_t state)
113 {
114 switch (state) {
115 case 0: return "STOP";
116 case 1: return "RUN";
117 case 2: return "RESOLVE";
118 case 3: return "SENTMSG1";
119 case 4: return "SENTMSG2";
120 case 5: return "SENTMSG3";
121 case 6: return "SENTMSG4";
122 case 7: return "SENTMSG5";
123 case 8: return "WAIT";
124 default: return "*bad state*";
125 }
126 }
127
128 #define NONCELEN 8
129
130 #define LOG_UNEXPECTED 0x00000001
131 #define LOG_SETUP_INIT 0x00000002
132 #define LOG_SETUP_TIMEOUT 0x00000004
133 #define LOG_ACTIVATE_KEY 0x00000008
134 #define LOG_TIMEOUT_KEY 0x00000010
135 #define LOG_SEC 0x00000020
136 #define LOG_STATE 0x00000040
137 #define LOG_DROP 0x00000080
138 #define LOG_DUMP 0x00000100
139 #define LOG_ERROR 0x00000400
140 #define LOG_PEER_ADDRS 0x00000800
141
142 static struct flagstr log_event_table[]={
143 { "unexpected", LOG_UNEXPECTED },
144 { "setup-init", LOG_SETUP_INIT },
145 { "setup-timeout", LOG_SETUP_TIMEOUT },
146 { "activate-key", LOG_ACTIVATE_KEY },
147 { "timeout-key", LOG_TIMEOUT_KEY },
148 { "security", LOG_SEC },
149 { "state-change", LOG_STATE },
150 { "packet-drop", LOG_DROP },
151 { "dump-packets", LOG_DUMP },
152 { "errors", LOG_ERROR },
153 { "peer-addrs", LOG_PEER_ADDRS },
154 { "default", LOG_SETUP_INIT|LOG_SETUP_TIMEOUT|
155 LOG_ACTIVATE_KEY|LOG_TIMEOUT_KEY|LOG_SEC|LOG_ERROR },
156 { "all", 0xffffffff },
157 { NULL, 0 }
158 };
159
160
161 /***** TRANSPORT PEERS declarations *****/
162
163 /* Details of "mobile peer" semantics:
164
165 - We use the same data structure for the different configurations,
166 but manage it with different algorithms.
167
168 - We record up to mobile_peers_max peer address/port numbers
169 ("peers") for key setup, and separately up to mobile_peers_max
170 for data transfer.
171
172 - In general, we make a new set of addrs (see below) when we start
173 a new key exchange; the key setup addrs become the data transport
174 addrs when key setup complets.
175
176 If our peer is mobile:
177
178 - We send to all recent addresses of incoming packets, plus
179 initially all configured addresses (which we also expire).
180
181 - So, we record addrs of good incoming packets, as follows:
182 1. expire any peers last seen >120s ("mobile-peer-expiry") ago
183 2. add the peer of the just received packet to the applicable list
184 (possibly evicting the oldest entries to make room)
185 NB that we do not expire peers until an incoming packet arrives.
186
187 - If the peer has a configured address or name, we record them the
188 same way, but only as a result of our own initiation of key
189 setup. (We might evict some incoming packet addrs to make room.)
190
191 - The default number of addrs to keep is 3, or 4 if we have a
192 configured name or address. That's space for two configured
193 addresses (one IPv6 and one IPv4), plus two received addresses.
194
195 - Outgoing packets are sent to every recorded address in the
196 applicable list. Any unsupported[1] addresses are deleted from
197 the list right away. (This should only happen to configured
198 addresses, of course, but there is no need to check that.)
199
200 - When we successfully complete a key setup, we merge the key setup
201 peers into the data transfer peers.
202
203 [1] An unsupported address is one for whose AF we don't have a
204 socket (perhaps because we got EAFNOSUPPORT or some such) or for
205 which sendto gives ENETUNREACH.
206
207 If neither end is mobile:
208
209 - When peer initiated the key exchange, we use the incoming packet
210 address.
211
212 - When we initiate the key exchange, we try configured addresses
213 until we get one which isn't unsupported then fixate on that.
214
215 - When we complete a key setup, we replace the data transport peers
216 with those from the key setup.
217
218 If we are mobile:
219
220 - We can't tell when local network setup changes so we can't cache
221 the unsupported addrs and completely remove the spurious calls to
222 sendto, but we can optimise things a bit by deprioritising addrs
223 which seem to be unsupported.
224
225 - Use only configured addresses. (Except, that if our peer
226 initiated a key exchange we use the incoming packet address until
227 our name resolution completes.)
228
229 - When we send a packet, try each address in turn; if addr
230 supported, put that address to the end of the list for future
231 packets, and go onto the next address.
232
233 - When we complete a key setup, we replace the data transport peers
234 with those from the key setup.
235
236 */
237
238 typedef struct {
239 struct timeval last;
240 struct comm_addr addr;
241 } transport_peer;
242
243 typedef struct {
244 /* configuration information */
245 /* runtime information */
246 int npeers;
247 transport_peer peers[MAX_PEER_ADDRS];
248 } transport_peers;
249
250 /* Basic operations on transport peer address sets */
251 static void transport_peers_clear(struct site *st, transport_peers *peers);
252 static int transport_peers_valid(transport_peers *peers);
253 static void transport_peers_copy(struct site *st, transport_peers *dst,
254 const transport_peers *src);
255
256 /* Record address of incoming setup packet; resp. data packet. */
257 static void transport_setup_msgok(struct site *st, const struct comm_addr *a);
258 static void transport_data_msgok(struct site *st, const struct comm_addr *a);
259
260 /* Initialise the setup addresses. Called before we send the first
261 * packet in a key exchange. If we are the initiator, as a result of
262 * resolve completing (or being determined not to be relevant) or an
263 * incoming PROD; if we are the responder, as a result of the MSG1. */
264 static bool_t transport_compute_setupinit_peers(struct site *st,
265 const struct comm_addr *configured_addrs /* 0 if none or not found */,
266 int n_configured_addrs /* 0 if none or not found */,
267 const struct comm_addr *incoming_packet_addr /* 0 if none */);
268
269 /* Called if we are the responder in a key setup, when the resolve
270 * completes. transport_compute_setupinit_peers will hvae been called
271 * earlier. If _complete is called, we are still doing the key setup
272 * (and we should use the new values for both the rest of the key
273 * setup and the ongoing data exchange); if _tardy is called, the key
274 * setup is done (either completed or not) and only the data peers are
275 * relevant */
276 static void transport_resolve_complete(struct site *st,
277 const struct comm_addr *addrs, int naddrs);
278 static void transport_resolve_complete_tardy(struct site *st,
279 const struct comm_addr *addrs, int naddrs);
280
281 static void transport_xmit(struct site *st, transport_peers *peers,
282 struct buffer_if *buf, bool_t candebug);
283
284 /***** END of transport peers declarations *****/
285
286
287 struct data_key {
288 struct transform_inst_if *transform;
289 uint64_t key_timeout; /* End of life of current key */
290 uint32_t remote_session_id;
291 };
292
293 struct site {
294 closure_t cl;
295 struct site_if ops;
296 /* configuration information */
297 string_t localname;
298 string_t remotename;
299 bool_t local_mobile, peer_mobile; /* Mobile client support */
300 int32_t transport_peers_max;
301 string_t tunname; /* localname<->remotename by default, used in logs */
302 cstring_t *addresses; /* DNS name or address(es) for bootstrapping, optional */
303 int remoteport; /* Port for bootstrapping, optional */
304 uint32_t mtu_target;
305 struct netlink_if *netlink;
306 struct comm_if **comms;
307 int ncomms;
308 struct resolver_if *resolver;
309 struct log_if *log;
310 struct random_if *random;
311 struct rsaprivkey_if *privkey;
312 struct rsapubkey_if *pubkey;
313 struct transform_if **transforms;
314 int ntransforms;
315 struct dh_if *dh;
316 struct hash_if *hash;
317
318 uint32_t index; /* Index of this site */
319 uint32_t local_capabilities;
320 int32_t setup_retries; /* How many times to send setup packets */
321 int32_t setup_retry_interval; /* Initial timeout for setup packets */
322 int32_t wait_timeout; /* How long to wait if setup unsuccessful */
323 int32_t mobile_peer_expiry; /* How long to remember 2ary addresses */
324 int32_t key_lifetime; /* How long a key lasts once set up */
325 int32_t key_renegotiate_time; /* If we see traffic (or a keepalive)
326 after this time, initiate a new
327 key exchange */
328
329 bool_t setup_priority; /* Do we have precedence if both sites emit
330 message 1 simultaneously? */
331 uint32_t log_events;
332
333 /* runtime information */
334 uint32_t state;
335 uint64_t now; /* Most recently seen time */
336 bool_t allow_send_prod;
337 int resolving_count;
338 int resolving_n_results_all;
339 int resolving_n_results_stored;
340 struct comm_addr resolving_results[MAX_PEER_ADDRS];
341
342 /* The currently established session */
343 struct data_key current;
344 struct data_key auxiliary_key;
345 bool_t auxiliary_is_new;
346 uint64_t renegotiate_key_time; /* When we can negotiate a new key */
347 uint64_t auxiliary_renegotiate_key_time;
348 transport_peers peers; /* Current address(es) of peer for data traffic */
349
350 /* The current key setup protocol exchange. We can only be
351 involved in one of these at a time. There's a potential for
352 denial of service here (the attacker keeps sending a setup
353 packet; we keep trying to continue the exchange, and have to
354 timeout before we can listen for another setup packet); perhaps
355 we should keep a list of 'bad' sources for setup packets. */
356 uint32_t remote_capabilities;
357 uint16_t remote_adv_mtu;
358 struct transform_if *chosen_transform;
359 uint32_t setup_session_id;
360 transport_peers setup_peers;
361 uint8_t localN[NONCELEN]; /* Nonces for key exchange */
362 uint8_t remoteN[NONCELEN];
363 struct buffer_if buffer; /* Current outgoing key exchange packet */
364 struct buffer_if scratch;
365 int32_t retries; /* Number of retries remaining */
366 uint64_t timeout; /* Timeout for current state */
367 uint8_t *dhsecret;
368 uint8_t *sharedsecret;
369 uint32_t sharedsecretlen, sharedsecretallocd;
370 struct transform_inst_if *new_transform; /* For key setup/verify */
371 };
372
373 static uint32_t event_log_priority(struct site *st, uint32_t event)
374 {
375 if (!(event&st->log_events))
376 return 0;
377 switch(event) {
378 case LOG_UNEXPECTED: return M_INFO;
379 case LOG_SETUP_INIT: return M_INFO;
380 case LOG_SETUP_TIMEOUT: return M_NOTICE;
381 case LOG_ACTIVATE_KEY: return M_INFO;
382 case LOG_TIMEOUT_KEY: return M_INFO;
383 case LOG_SEC: return M_SECURITY;
384 case LOG_STATE: return M_DEBUG;
385 case LOG_DROP: return M_DEBUG;
386 case LOG_DUMP: return M_DEBUG;
387 case LOG_ERROR: return M_ERR;
388 case LOG_PEER_ADDRS: return M_DEBUG;
389 default: return M_ERR;
390 }
391 }
392
393 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
394 FORMAT(printf,3,0);
395 static void vslog(struct site *st, uint32_t event, cstring_t msg, va_list ap)
396 {
397 uint32_t class;
398
399 class=event_log_priority(st, event);
400 if (class) {
401 slilog_part(st->log,class,"%s: ",st->tunname);
402 vslilog_part(st->log,class,msg,ap);
403 slilog_part(st->log,class,"\n");
404 }
405 }
406
407 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
408 FORMAT(printf,3,4);
409 static void slog(struct site *st, uint32_t event, cstring_t msg, ...)
410 {
411 va_list ap;
412 va_start(ap,msg);
413 vslog(st,event,msg,ap);
414 va_end(ap);
415 }
416
417 static void logtimeout(struct site *st, const char *fmt, ...)
418 FORMAT(printf,2,3);
419 static void logtimeout(struct site *st, const char *fmt, ...)
420 {
421 uint32_t class=event_log_priority(st,LOG_SETUP_TIMEOUT);
422 if (!class)
423 return;
424
425 va_list ap;
426 va_start(ap,fmt);
427
428 slilog_part(st->log,class,"%s: ",st->tunname);
429 vslilog_part(st->log,class,fmt,ap);
430
431 const char *delim;
432 int i;
433 for (i=0, delim=" (tried ";
434 i<st->setup_peers.npeers;
435 i++, delim=", ") {
436 transport_peer *peer=&st->setup_peers.peers[i];
437 const char *s=comm_addr_to_string(&peer->addr);
438 slilog_part(st->log,class,"%s%s",delim,s);
439 }
440
441 slilog_part(st->log,class,")\n");
442 va_end(ap);
443 }
444
445 static void set_link_quality(struct site *st);
446 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel);
447 static void delete_one_key(struct site *st, struct data_key *key,
448 const char *reason /* may be 0 meaning don't log*/,
449 const char *which /* ignored if !reasonn */,
450 uint32_t loglevel /* ignored if !reasonn */);
451 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
452 const struct comm_addr *prod_hint);
453 static void enter_state_run(struct site *st);
454 static bool_t enter_state_resolve(struct site *st);
455 static void decrement_resolving_count(struct site *st, int by);
456 static bool_t enter_new_state(struct site *st,uint32_t next);
457 static void enter_state_wait(struct site *st);
458 static void activate_new_key(struct site *st);
459
460 static bool_t is_transform_valid(struct transform_inst_if *transform)
461 {
462 return transform && transform->valid(transform->st);
463 }
464
465 static bool_t current_valid(struct site *st)
466 {
467 return is_transform_valid(st->current.transform);
468 }
469
470 #define DEFINE_CALL_TRANSFORM(fwdrev) \
471 static int call_transform_##fwdrev(struct site *st, \
472 struct transform_inst_if *transform, \
473 struct buffer_if *buf, \
474 const char **errmsg) \
475 { \
476 if (!is_transform_valid(transform)) { \
477 *errmsg="transform not set up"; \
478 return 1; \
479 } \
480 return transform->fwdrev(transform->st,buf,errmsg); \
481 }
482
483 DEFINE_CALL_TRANSFORM(forwards)
484 DEFINE_CALL_TRANSFORM(reverse)
485
486 static void dispose_transform(struct transform_inst_if **transform_var)
487 {
488 struct transform_inst_if *transform=*transform_var;
489 if (transform) {
490 transform->delkey(transform->st);
491 transform->destroy(transform->st);
492 }
493 *transform_var = 0;
494 }
495
496 #define CHECK_AVAIL(b,l) do { if ((b)->size<(l)) return False; } while(0)
497 #define CHECK_EMPTY(b) do { if ((b)->size!=0) return False; } while(0)
498 #define CHECK_TYPE(b,t) do { uint32_t type; \
499 CHECK_AVAIL((b),4); \
500 type=buf_unprepend_uint32((b)); \
501 if (type!=(t)) return False; } while(0)
502
503 static _Bool type_is_msg34(uint32_t type)
504 {
505 return
506 type == LABEL_MSG3 ||
507 type == LABEL_MSG3BIS ||
508 type == LABEL_MSG4;
509 }
510
511 struct parsedname {
512 int32_t len;
513 uint8_t *name;
514 struct buffer_if extrainfo;
515 };
516
517 struct msg {
518 uint8_t *hashstart;
519 uint32_t dest;
520 uint32_t source;
521 struct parsedname remote;
522 struct parsedname local;
523 uint32_t remote_capabilities;
524 uint16_t remote_mtu;
525 int capab_transformnum;
526 uint8_t *nR;
527 uint8_t *nL;
528 int32_t pklen;
529 char *pk;
530 int32_t hashlen;
531 int32_t siglen;
532 char *sig;
533 };
534
535 static void set_new_transform(struct site *st, char *pk)
536 {
537 /* Make room for the shared key */
538 st->sharedsecretlen=st->chosen_transform->keylen?:st->dh->ceil_len;
539 assert(st->sharedsecretlen);
540 if (st->sharedsecretlen > st->sharedsecretallocd) {
541 st->sharedsecretallocd=st->sharedsecretlen;
542 st->sharedsecret=safe_realloc_ary(st->sharedsecret,1,
543 st->sharedsecretallocd,
544 "site:sharedsecret");
545 }
546
547 /* Generate the shared key */
548 st->dh->makeshared(st->dh->st,st->dhsecret,st->dh->len,pk,
549 st->sharedsecret,st->sharedsecretlen);
550
551 /* Set up the transform */
552 struct transform_if *generator=st->chosen_transform;
553 struct transform_inst_if *generated=generator->create(generator->st);
554 generated->setkey(generated->st,st->sharedsecret,
555 st->sharedsecretlen,st->setup_priority);
556 dispose_transform(&st->new_transform);
557 st->new_transform=generated;
558
559 slog(st,LOG_SETUP_INIT,"key exchange negotiated transform"
560 " %d (capabilities ours=%#"PRIx32" theirs=%#"PRIx32")",
561 st->chosen_transform->capab_transformnum,
562 st->local_capabilities, st->remote_capabilities);
563 }
564
565 struct xinfoadd {
566 int32_t lenpos, afternul;
567 };
568 static void append_string_xinfo_start(struct buffer_if *buf,
569 struct xinfoadd *xia,
570 const char *str)
571 /* Helps construct one of the names with additional info as found
572 * in MSG1..4. Call this function first, then append all the
573 * desired extra info (not including the nul byte) to the buffer,
574 * then call append_string_xinfo_done. */
575 {
576 xia->lenpos = buf->size;
577 buf_append_string(buf,str);
578 buf_append_uint8(buf,0);
579 xia->afternul = buf->size;
580 }
581 static void append_string_xinfo_done(struct buffer_if *buf,
582 struct xinfoadd *xia)
583 {
584 /* we just need to adjust the string length */
585 if (buf->size == xia->afternul) {
586 /* no extra info, strip the nul too */
587 buf_unappend_uint8(buf);
588 } else {
589 put_uint16(buf->start+xia->lenpos, buf->size-(xia->lenpos+2));
590 }
591 }
592
593 /* Build any of msg1 to msg4. msg5 and msg6 are built from the inside
594 out using a transform of config data supplied by netlink */
595 static bool_t generate_msg(struct site *st, uint32_t type, cstring_t what)
596 {
597 void *hst;
598 uint8_t *hash;
599 string_t dhpub, sig;
600
601 st->retries=st->setup_retries;
602 BUF_ALLOC(&st->buffer,what);
603 buffer_init(&st->buffer,0);
604 buf_append_uint32(&st->buffer,
605 (type==LABEL_MSG1?0:st->setup_session_id));
606 buf_append_uint32(&st->buffer,st->index);
607 buf_append_uint32(&st->buffer,type);
608
609 struct xinfoadd xia;
610 append_string_xinfo_start(&st->buffer,&xia,st->localname);
611 if ((st->local_capabilities & CAPAB_EARLY) || (type != LABEL_MSG1)) {
612 buf_append_uint32(&st->buffer,st->local_capabilities);
613 }
614 if (type_is_msg34(type)) {
615 buf_append_uint16(&st->buffer,st->mtu_target);
616 }
617 append_string_xinfo_done(&st->buffer,&xia);
618
619 buf_append_string(&st->buffer,st->remotename);
620 BUF_ADD_OBJ(append,&st->buffer,st->localN);
621 if (type==LABEL_MSG1) return True;
622 BUF_ADD_OBJ(append,&st->buffer,st->remoteN);
623 if (type==LABEL_MSG2) return True;
624
625 if (hacky_par_mid_failnow()) return False;
626
627 if (type==LABEL_MSG3BIS)
628 buf_append_uint8(&st->buffer,st->chosen_transform->capab_transformnum);
629
630 dhpub=st->dh->makepublic(st->dh->st,st->dhsecret,st->dh->len);
631 buf_append_string(&st->buffer,dhpub);
632 free(dhpub);
633 hash=safe_malloc(st->hash->len, "generate_msg");
634 hst=st->hash->init();
635 st->hash->update(hst,st->buffer.start,st->buffer.size);
636 st->hash->final(hst,hash);
637 sig=st->privkey->sign(st->privkey->st,hash,st->hash->len);
638 buf_append_string(&st->buffer,sig);
639 free(sig);
640 free(hash);
641 return True;
642 }
643
644 static bool_t unpick_name(struct buffer_if *msg, struct parsedname *nm)
645 {
646 CHECK_AVAIL(msg,2);
647 nm->len=buf_unprepend_uint16(msg);
648 CHECK_AVAIL(msg,nm->len);
649 nm->name=buf_unprepend(msg,nm->len);
650 uint8_t *nul=memchr(nm->name,0,nm->len);
651 if (!nul) {
652 buffer_readonly_view(&nm->extrainfo,0,0);
653 } else {
654 buffer_readonly_view(&nm->extrainfo, nul+1, msg->start-(nul+1));
655 nm->len=nul-nm->name;
656 }
657 return True;
658 }
659
660 static bool_t unpick_msg(struct site *st, uint32_t type,
661 struct buffer_if *msg, struct msg *m)
662 {
663 m->capab_transformnum=-1;
664 m->hashstart=msg->start;
665 CHECK_AVAIL(msg,4);
666 m->dest=buf_unprepend_uint32(msg);
667 CHECK_AVAIL(msg,4);
668 m->source=buf_unprepend_uint32(msg);
669 CHECK_TYPE(msg,type);
670 if (!unpick_name(msg,&m->remote)) return False;
671 m->remote_capabilities=0;
672 m->remote_mtu=0;
673 if (m->remote.extrainfo.size) {
674 CHECK_AVAIL(&m->remote.extrainfo,4);
675 m->remote_capabilities=buf_unprepend_uint32(&m->remote.extrainfo);
676 }
677 if (type_is_msg34(type) && m->remote.extrainfo.size) {
678 CHECK_AVAIL(&m->remote.extrainfo,2);
679 m->remote_mtu=buf_unprepend_uint16(&m->remote.extrainfo);
680 }
681 if (!unpick_name(msg,&m->local)) return False;
682 if (type==LABEL_PROD) {
683 CHECK_EMPTY(msg);
684 return True;
685 }
686 CHECK_AVAIL(msg,NONCELEN);
687 m->nR=buf_unprepend(msg,NONCELEN);
688 if (type==LABEL_MSG1) {
689 CHECK_EMPTY(msg);
690 return True;
691 }
692 CHECK_AVAIL(msg,NONCELEN);
693 m->nL=buf_unprepend(msg,NONCELEN);
694 if (type==LABEL_MSG2) {
695 CHECK_EMPTY(msg);
696 return True;
697 }
698 if (type==LABEL_MSG3BIS) {
699 CHECK_AVAIL(msg,1);
700 m->capab_transformnum = buf_unprepend_uint8(msg);
701 } else {
702 m->capab_transformnum = CAPAB_TRANSFORMNUM_ANCIENT;
703 }
704 CHECK_AVAIL(msg,2);
705 m->pklen=buf_unprepend_uint16(msg);
706 CHECK_AVAIL(msg,m->pklen);
707 m->pk=buf_unprepend(msg,m->pklen);
708 m->hashlen=msg->start-m->hashstart;
709 CHECK_AVAIL(msg,2);
710 m->siglen=buf_unprepend_uint16(msg);
711 CHECK_AVAIL(msg,m->siglen);
712 m->sig=buf_unprepend(msg,m->siglen);
713 CHECK_EMPTY(msg);
714 return True;
715 }
716
717 static bool_t name_matches(const struct parsedname *nm, const char *expected)
718 {
719 int expected_len=strlen(expected);
720 return
721 nm->len == expected_len &&
722 !memcmp(nm->name, expected, expected_len);
723 }
724
725 static bool_t check_msg(struct site *st, uint32_t type, struct msg *m,
726 cstring_t *error)
727 {
728 if (type==LABEL_MSG1) return True;
729
730 /* Check that the site names and our nonce have been sent
731 back correctly, and then store our peer's nonce. */
732 if (!name_matches(&m->remote,st->remotename)) {
733 *error="wrong remote site name";
734 return False;
735 }
736 if (!name_matches(&m->local,st->localname)) {
737 *error="wrong local site name";
738 return False;
739 }
740 if (memcmp(m->nL,st->localN,NONCELEN)!=0) {
741 *error="wrong locally-generated nonce";
742 return False;
743 }
744 if (type==LABEL_MSG2) return True;
745 if (!consttime_memeq(m->nR,st->remoteN,NONCELEN)!=0) {
746 *error="wrong remotely-generated nonce";
747 return False;
748 }
749 /* MSG3 has complicated rules about capabilities, which are
750 * handled in process_msg3. */
751 if (type==LABEL_MSG3 || type==LABEL_MSG3BIS) return True;
752 if (m->remote_capabilities!=st->remote_capabilities) {
753 *error="remote capabilities changed";
754 return False;
755 }
756 if (type==LABEL_MSG4) return True;
757 *error="unknown message type";
758 return False;
759 }
760
761 static bool_t generate_msg1(struct site *st)
762 {
763 st->random->generate(st->random->st,NONCELEN,st->localN);
764 return generate_msg(st,LABEL_MSG1,"site:MSG1");
765 }
766
767 static bool_t process_msg1(struct site *st, struct buffer_if *msg1,
768 const struct comm_addr *src, struct msg *m)
769 {
770 /* We've already determined we're in an appropriate state to
771 process an incoming MSG1, and that the MSG1 has correct values
772 of A and B. */
773
774 st->setup_session_id=m->source;
775 st->remote_capabilities=m->remote_capabilities;
776 memcpy(st->remoteN,m->nR,NONCELEN);
777 return True;
778 }
779
780 static bool_t generate_msg2(struct site *st)
781 {
782 st->random->generate(st->random->st,NONCELEN,st->localN);
783 return generate_msg(st,LABEL_MSG2,"site:MSG2");
784 }
785
786 static bool_t process_msg2(struct site *st, struct buffer_if *msg2,
787 const struct comm_addr *src)
788 {
789 struct msg m;
790 cstring_t err;
791
792 if (!unpick_msg(st,LABEL_MSG2,msg2,&m)) return False;
793 if (!check_msg(st,LABEL_MSG2,&m,&err)) {
794 slog(st,LOG_SEC,"msg2: %s",err);
795 return False;
796 }
797 st->setup_session_id=m.source;
798 st->remote_capabilities=m.remote_capabilities;
799
800 /* Select the transform to use */
801
802 uint32_t remote_transforms = st->remote_capabilities & CAPAB_TRANSFORM_MASK;
803 if (!remote_transforms)
804 /* old secnets only had this one transform */
805 remote_transforms = 1UL << CAPAB_TRANSFORMNUM_ANCIENT;
806
807 struct transform_if *ti;
808 int i;
809 for (i=0; i<st->ntransforms; i++) {
810 ti=st->transforms[i];
811 if ((1UL << ti->capab_transformnum) & remote_transforms)
812 goto transform_found;
813 }
814 slog(st,LOG_ERROR,"no transforms in common"
815 " (us %#"PRIx32"; them: %#"PRIx32")",
816 st->local_capabilities & CAPAB_TRANSFORM_MASK,
817 remote_transforms);
818 return False;
819 transform_found:
820 st->chosen_transform=ti;
821
822 memcpy(st->remoteN,m.nR,NONCELEN);
823 return True;
824 }
825
826 static bool_t generate_msg3(struct site *st)
827 {
828 /* Now we have our nonce and their nonce. Think of a secret key,
829 and create message number 3. */
830 st->random->generate(st->random->st,st->dh->len,st->dhsecret);
831 return generate_msg(st,
832 (st->remote_capabilities & CAPAB_TRANSFORM_MASK
833 ? LABEL_MSG3BIS : LABEL_MSG3),
834 "site:MSG3");
835 }
836
837 static bool_t process_msg3_msg4(struct site *st, struct msg *m)
838 {
839 uint8_t *hash;
840 void *hst;
841
842 /* Check signature and store g^x mod m */
843 hash=safe_malloc(st->hash->len, "process_msg3_msg4");
844 hst=st->hash->init();
845 st->hash->update(hst,m->hashstart,m->hashlen);
846 st->hash->final(hst,hash);
847 /* Terminate signature with a '0' - cheating, but should be ok */
848 m->sig[m->siglen]=0;
849 if (!st->pubkey->check(st->pubkey->st,hash,st->hash->len,m->sig)) {
850 slog(st,LOG_SEC,"msg3/msg4 signature failed check!");
851 free(hash);
852 return False;
853 }
854 free(hash);
855
856 st->remote_adv_mtu=m->remote_mtu;
857
858 return True;
859 }
860
861 static bool_t process_msg3(struct site *st, struct buffer_if *msg3,
862 const struct comm_addr *src, uint32_t msgtype)
863 {
864 struct msg m;
865 cstring_t err;
866
867 assert(msgtype==LABEL_MSG3 || msgtype==LABEL_MSG3BIS);
868
869 if (!unpick_msg(st,msgtype,msg3,&m)) return False;
870 if (!check_msg(st,msgtype,&m,&err)) {
871 slog(st,LOG_SEC,"msg3: %s",err);
872 return False;
873 }
874 uint32_t capab_adv_late = m.remote_capabilities
875 & ~st->remote_capabilities & CAPAB_EARLY;
876 if (capab_adv_late) {
877 slog(st,LOG_SEC,"msg3 impermissibly adds early capability flag(s)"
878 " %#"PRIx32" (was %#"PRIx32", now %#"PRIx32")",
879 capab_adv_late, st->remote_capabilities, m.remote_capabilities);
880 return False;
881 }
882 st->remote_capabilities|=m.remote_capabilities;
883
884 struct transform_if *ti;
885 int i;
886 for (i=0; i<st->ntransforms; i++) {
887 ti=st->transforms[i];
888 if (ti->capab_transformnum == m.capab_transformnum)
889 goto transform_found;
890 }
891 slog(st,LOG_SEC,"peer chose unknown-to-us transform %d!",
892 m.capab_transformnum);
893 return False;
894 transform_found:
895 st->chosen_transform=ti;
896
897 if (!process_msg3_msg4(st,&m))
898 return False;
899
900 /* Terminate their DH public key with a '0' */
901 m.pk[m.pklen]=0;
902 /* Invent our DH secret key */
903 st->random->generate(st->random->st,st->dh->len,st->dhsecret);
904
905 /* Generate the shared key and set up the transform */
906 set_new_transform(st,m.pk);
907
908 return True;
909 }
910
911 static bool_t generate_msg4(struct site *st)
912 {
913 /* We have both nonces, their public key and our private key. Generate
914 our public key, sign it and send it to them. */
915 return generate_msg(st,LABEL_MSG4,"site:MSG4");
916 }
917
918 static bool_t process_msg4(struct site *st, struct buffer_if *msg4,
919 const struct comm_addr *src)
920 {
921 struct msg m;
922 cstring_t err;
923
924 if (!unpick_msg(st,LABEL_MSG4,msg4,&m)) return False;
925 if (!check_msg(st,LABEL_MSG4,&m,&err)) {
926 slog(st,LOG_SEC,"msg4: %s",err);
927 return False;
928 }
929
930 if (!process_msg3_msg4(st,&m))
931 return False;
932
933 /* Terminate their DH public key with a '0' */
934 m.pk[m.pklen]=0;
935
936 /* Generate the shared key and set up the transform */
937 set_new_transform(st,m.pk);
938
939 return True;
940 }
941
942 struct msg0 {
943 uint32_t dest;
944 uint32_t source;
945 uint32_t type;
946 };
947
948 static bool_t unpick_msg0(struct site *st, struct buffer_if *msg0,
949 struct msg0 *m)
950 {
951 CHECK_AVAIL(msg0,4);
952 m->dest=buf_unprepend_uint32(msg0);
953 CHECK_AVAIL(msg0,4);
954 m->source=buf_unprepend_uint32(msg0);
955 CHECK_AVAIL(msg0,4);
956 m->type=buf_unprepend_uint32(msg0);
957 return True;
958 /* Leaves transformed part of buffer untouched */
959 }
960
961 static bool_t generate_msg5(struct site *st)
962 {
963 cstring_t transform_err;
964
965 BUF_ALLOC(&st->buffer,"site:MSG5");
966 /* We are going to add four words to the message */
967 buffer_init(&st->buffer,calculate_max_start_pad());
968 /* Give the netlink code an opportunity to put its own stuff in the
969 message (configuration information, etc.) */
970 buf_prepend_uint32(&st->buffer,LABEL_MSG5);
971 if (call_transform_forwards(st,st->new_transform,
972 &st->buffer,&transform_err))
973 return False;
974 buf_prepend_uint32(&st->buffer,LABEL_MSG5);
975 buf_prepend_uint32(&st->buffer,st->index);
976 buf_prepend_uint32(&st->buffer,st->setup_session_id);
977
978 st->retries=st->setup_retries;
979 return True;
980 }
981
982 static bool_t process_msg5(struct site *st, struct buffer_if *msg5,
983 const struct comm_addr *src,
984 struct transform_inst_if *transform)
985 {
986 struct msg0 m;
987 cstring_t transform_err;
988
989 if (!unpick_msg0(st,msg5,&m)) return False;
990
991 if (call_transform_reverse(st,transform,msg5,&transform_err)) {
992 /* There's a problem */
993 slog(st,LOG_SEC,"process_msg5: transform: %s",transform_err);
994 return False;
995 }
996 /* Buffer should now contain untransformed PING packet data */
997 CHECK_AVAIL(msg5,4);
998 if (buf_unprepend_uint32(msg5)!=LABEL_MSG5) {
999 slog(st,LOG_SEC,"MSG5/PING packet contained wrong label");
1000 return False;
1001 }
1002 /* Older versions of secnet used to write some config data here
1003 * which we ignore. So we don't CHECK_EMPTY */
1004 return True;
1005 }
1006
1007 static void create_msg6(struct site *st, struct transform_inst_if *transform,
1008 uint32_t session_id)
1009 {
1010 cstring_t transform_err;
1011
1012 BUF_ALLOC(&st->buffer,"site:MSG6");
1013 /* We are going to add four words to the message */
1014 buffer_init(&st->buffer,calculate_max_start_pad());
1015 /* Give the netlink code an opportunity to put its own stuff in the
1016 message (configuration information, etc.) */
1017 buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1018 int problem = call_transform_forwards(st,transform,
1019 &st->buffer,&transform_err);
1020 assert(!problem);
1021 buf_prepend_uint32(&st->buffer,LABEL_MSG6);
1022 buf_prepend_uint32(&st->buffer,st->index);
1023 buf_prepend_uint32(&st->buffer,session_id);
1024 }
1025
1026 static bool_t generate_msg6(struct site *st)
1027 {
1028 if (!is_transform_valid(st->new_transform))
1029 return False;
1030 create_msg6(st,st->new_transform,st->setup_session_id);
1031 st->retries=1; /* Peer will retransmit MSG5 if this packet gets lost */
1032 return True;
1033 }
1034
1035 static bool_t process_msg6(struct site *st, struct buffer_if *msg6,
1036 const struct comm_addr *src)
1037 {
1038 struct msg0 m;
1039 cstring_t transform_err;
1040
1041 if (!unpick_msg0(st,msg6,&m)) return False;
1042
1043 if (call_transform_reverse(st,st->new_transform,msg6,&transform_err)) {
1044 /* There's a problem */
1045 slog(st,LOG_SEC,"process_msg6: transform: %s",transform_err);
1046 return False;
1047 }
1048 /* Buffer should now contain untransformed PING packet data */
1049 CHECK_AVAIL(msg6,4);
1050 if (buf_unprepend_uint32(msg6)!=LABEL_MSG6) {
1051 slog(st,LOG_SEC,"MSG6/PONG packet contained invalid data");
1052 return False;
1053 }
1054 /* Older versions of secnet used to write some config data here
1055 * which we ignore. So we don't CHECK_EMPTY */
1056 return True;
1057 }
1058
1059 static bool_t decrypt_msg0(struct site *st, struct buffer_if *msg0,
1060 const struct comm_addr *src)
1061 {
1062 cstring_t transform_err, auxkey_err, newkey_err="n/a";
1063 struct msg0 m;
1064 uint32_t problem;
1065
1066 if (!unpick_msg0(st,msg0,&m)) return False;
1067
1068 /* Keep a copy so we can try decrypting it with multiple keys */
1069 buffer_copy(&st->scratch, msg0);
1070
1071 problem = call_transform_reverse(st,st->current.transform,
1072 msg0,&transform_err);
1073 if (!problem) {
1074 if (!st->auxiliary_is_new)
1075 delete_one_key(st,&st->auxiliary_key,
1076 "peer has used new key","auxiliary key",LOG_SEC);
1077 return True;
1078 }
1079 if (problem==2)
1080 goto skew;
1081
1082 buffer_copy(msg0, &st->scratch);
1083 problem = call_transform_reverse(st,st->auxiliary_key.transform,
1084 msg0,&auxkey_err);
1085 if (problem==0) {
1086 slog(st,LOG_DROP,"processing packet which uses auxiliary key");
1087 if (st->auxiliary_is_new) {
1088 /* We previously timed out in state SENTMSG5 but it turns
1089 * out that our peer did in fact get our MSG5 and is
1090 * using the new key. So we should switch to it too. */
1091 /* This is a bit like activate_new_key. */
1092 struct data_key t;
1093 t=st->current;
1094 st->current=st->auxiliary_key;
1095 st->auxiliary_key=t;
1096
1097 delete_one_key(st,&st->auxiliary_key,"peer has used new key",
1098 "previous key",LOG_SEC);
1099 st->auxiliary_is_new=0;
1100 st->renegotiate_key_time=st->auxiliary_renegotiate_key_time;
1101 }
1102 return True;
1103 }
1104 if (problem==2)
1105 goto skew;
1106
1107 if (st->state==SITE_SENTMSG5) {
1108 buffer_copy(msg0, &st->scratch);
1109 problem = call_transform_reverse(st,st->new_transform,
1110 msg0,&newkey_err);
1111 if (!problem) {
1112 /* It looks like we didn't get the peer's MSG6 */
1113 /* This is like a cut-down enter_new_state(SITE_RUN) */
1114 slog(st,LOG_STATE,"will enter state RUN (MSG0 with new key)");
1115 BUF_FREE(&st->buffer);
1116 st->timeout=0;
1117 activate_new_key(st);
1118 return True; /* do process the data in this packet */
1119 }
1120 if (problem==2)
1121 goto skew;
1122 }
1123
1124 slog(st,LOG_SEC,"transform: %s (aux: %s, new: %s)",
1125 transform_err,auxkey_err,newkey_err);
1126 initiate_key_setup(st,"incoming message would not decrypt",0);
1127 send_nak(src,m.dest,m.source,m.type,msg0,"message would not decrypt");
1128 return False;
1129
1130 skew:
1131 slog(st,LOG_DROP,"transform: %s (merely skew)",transform_err);
1132 return False;
1133 }
1134
1135 static bool_t process_msg0(struct site *st, struct buffer_if *msg0,
1136 const struct comm_addr *src)
1137 {
1138 uint32_t type;
1139
1140 if (!decrypt_msg0(st,msg0,src))
1141 return False;
1142
1143 CHECK_AVAIL(msg0,4);
1144 type=buf_unprepend_uint32(msg0);
1145 switch(type) {
1146 case LABEL_MSG7:
1147 /* We must forget about the current session. */
1148 delete_keys(st,"request from peer",LOG_SEC);
1149 return True;
1150 case LABEL_MSG9:
1151 /* Deliver to netlink layer */
1152 st->netlink->deliver(st->netlink->st,msg0);
1153 transport_data_msgok(st,src);
1154 /* See whether we should start negotiating a new key */
1155 if (st->now > st->renegotiate_key_time)
1156 initiate_key_setup(st,"incoming packet in renegotiation window",0);
1157 return True;
1158 default:
1159 slog(st,LOG_SEC,"incoming encrypted message of type %08x "
1160 "(unknown)",type);
1161 break;
1162 }
1163 return False;
1164 }
1165
1166 static void dump_packet(struct site *st, struct buffer_if *buf,
1167 const struct comm_addr *addr, bool_t incoming,
1168 bool_t ok)
1169 {
1170 uint32_t dest=get_uint32(buf->start);
1171 uint32_t source=get_uint32(buf->start+4);
1172 uint32_t msgtype=get_uint32(buf->start+8);
1173
1174 if (st->log_events & LOG_DUMP)
1175 slilog(st->log,M_DEBUG,"%s: %s: %08x<-%08x: %08x: %s%s",
1176 st->tunname,incoming?"incoming":"outgoing",
1177 dest,source,msgtype,comm_addr_to_string(addr),
1178 ok?"":" - fail");
1179 }
1180
1181 static uint32_t site_status(void *st)
1182 {
1183 return 0;
1184 }
1185
1186 static bool_t send_msg(struct site *st)
1187 {
1188 if (st->retries>0) {
1189 transport_xmit(st, &st->setup_peers, &st->buffer, True);
1190 st->timeout=st->now+st->setup_retry_interval;
1191 st->retries--;
1192 return True;
1193 } else if (st->state==SITE_SENTMSG5) {
1194 logtimeout(st,"timed out sending MSG5, stashing new key");
1195 /* We stash the key we have produced, in case it turns out that
1196 * our peer did see our MSG5 after all and starts using it. */
1197 /* This is a bit like some of activate_new_key */
1198 struct transform_inst_if *t;
1199 t=st->auxiliary_key.transform;
1200 st->auxiliary_key.transform=st->new_transform;
1201 st->new_transform=t;
1202 dispose_transform(&st->new_transform);
1203
1204 st->auxiliary_is_new=1;
1205 st->auxiliary_key.key_timeout=st->now+st->key_lifetime;
1206 st->auxiliary_renegotiate_key_time=st->now+st->key_renegotiate_time;
1207 st->auxiliary_key.remote_session_id=st->setup_session_id;
1208
1209 enter_state_wait(st);
1210 return False;
1211 } else {
1212 logtimeout(st,"timed out sending key setup packet "
1213 "(in state %s)",state_name(st->state));
1214 enter_state_wait(st);
1215 return False;
1216 }
1217 }
1218
1219 static void site_resolve_callback(void *sst, const struct comm_addr *addrs,
1220 int stored_naddrs, int all_naddrs,
1221 const char *address, const char *failwhy)
1222 {
1223 struct site *st=sst;
1224
1225 if (!stored_naddrs) {
1226 slog(st,LOG_ERROR,"resolution of %s failed: %s",address,failwhy);
1227 } else {
1228 slog(st,LOG_PEER_ADDRS,"resolution of %s completed, %d addrs, eg: %s",
1229 address, all_naddrs, comm_addr_to_string(&addrs[0]));;
1230
1231 int space=st->transport_peers_max-st->resolving_n_results_stored;
1232 int n_tocopy=MIN(stored_naddrs,space);
1233 COPY_ARRAY(st->resolving_results + st->resolving_n_results_stored,
1234 addrs,
1235 n_tocopy);
1236 st->resolving_n_results_stored += n_tocopy;
1237 st->resolving_n_results_all += all_naddrs;
1238 }
1239
1240 decrement_resolving_count(st,1);
1241 }
1242
1243 static void decrement_resolving_count(struct site *st, int by)
1244 {
1245 assert(st->resolving_count>0);
1246 st->resolving_count-=by;
1247
1248 if (st->resolving_count)
1249 return;
1250
1251 /* OK, we are done with them all. Handle combined results. */
1252
1253 const struct comm_addr *addrs=st->resolving_results;
1254 int naddrs=st->resolving_n_results_stored;
1255 assert(naddrs<=st->transport_peers_max);
1256
1257 if (naddrs) {
1258 if (naddrs != st->resolving_n_results_all) {
1259 slog(st,LOG_SETUP_INIT,"resolution of supplied addresses/names"
1260 " yielded too many results (%d > %d), some ignored",
1261 st->resolving_n_results_all, naddrs);
1262 }
1263 slog(st,LOG_STATE,"resolution completed, %d addrs, eg: %s",
1264 naddrs, iaddr_to_string(&addrs[0].ia));;
1265 }
1266
1267 switch (st->state) {
1268 case SITE_RESOLVE:
1269 if (transport_compute_setupinit_peers(st,addrs,naddrs,0)) {
1270 enter_new_state(st,SITE_SENTMSG1);
1271 } else {
1272 /* Can't figure out who to try to to talk to */
1273 slog(st,LOG_SETUP_INIT,
1274 "key exchange failed: cannot find peer address");
1275 enter_state_run(st);
1276 }
1277 break;
1278 case SITE_SENTMSG1: case SITE_SENTMSG2:
1279 case SITE_SENTMSG3: case SITE_SENTMSG4:
1280 case SITE_SENTMSG5:
1281 if (naddrs) {
1282 /* We start using the address immediately for data too.
1283 * It's best to store it in st->peers now because we might
1284 * go via SENTMSG5, WAIT, and a MSG0, straight into using
1285 * the new key (without updating the data peer addrs). */
1286 transport_resolve_complete(st,addrs,naddrs);
1287 } else if (st->local_mobile) {
1288 /* We can't let this rest because we may have a peer
1289 * address which will break in the future. */
1290 slog(st,LOG_SETUP_INIT,"resolution failed: "
1291 "abandoning key exchange");
1292 enter_state_wait(st);
1293 } else {
1294 slog(st,LOG_SETUP_INIT,"resolution failed: "
1295 " continuing to use source address of peer's packets"
1296 " for key exchange and ultimately data");
1297 }
1298 break;
1299 case SITE_RUN:
1300 if (naddrs) {
1301 slog(st,LOG_SETUP_INIT,"resolution completed tardily,"
1302 " updating peer address(es)");
1303 transport_resolve_complete_tardy(st,addrs,naddrs);
1304 } else if (st->local_mobile) {
1305 /* Not very good. We should queue (another) renegotiation
1306 * so that we can update the peer address. */
1307 st->key_renegotiate_time=st->now+st->wait_timeout;
1308 } else {
1309 slog(st,LOG_SETUP_INIT,"resolution failed: "
1310 " continuing to use source address of peer's packets");
1311 }
1312 break;
1313 case SITE_WAIT:
1314 case SITE_STOP:
1315 /* oh well */
1316 break;
1317 }
1318 }
1319
1320 static bool_t initiate_key_setup(struct site *st, cstring_t reason,
1321 const struct comm_addr *prod_hint)
1322 {
1323 /* Reentrancy hazard: can call enter_new_state/enter_state_* */
1324 if (st->state!=SITE_RUN) return False;
1325 slog(st,LOG_SETUP_INIT,"initiating key exchange (%s)",reason);
1326 if (st->addresses) {
1327 slog(st,LOG_SETUP_INIT,"resolving peer address(es)");
1328 return enter_state_resolve(st);
1329 } else if (transport_compute_setupinit_peers(st,0,0,prod_hint)) {
1330 return enter_new_state(st,SITE_SENTMSG1);
1331 }
1332 slog(st,LOG_SETUP_INIT,"key exchange failed: no address for peer");
1333 return False;
1334 }
1335
1336 static void activate_new_key(struct site *st)
1337 {
1338 struct transform_inst_if *t;
1339
1340 /* We have three transform instances, which we swap between old,
1341 active and setup */
1342 t=st->auxiliary_key.transform;
1343 st->auxiliary_key.transform=st->current.transform;
1344 st->current.transform=st->new_transform;
1345 st->new_transform=t;
1346 dispose_transform(&st->new_transform);
1347
1348 st->timeout=0;
1349 st->auxiliary_is_new=0;
1350 st->auxiliary_key.key_timeout=st->current.key_timeout;
1351 st->current.key_timeout=st->now+st->key_lifetime;
1352 st->renegotiate_key_time=st->now+st->key_renegotiate_time;
1353 transport_peers_copy(st,&st->peers,&st->setup_peers);
1354 st->current.remote_session_id=st->setup_session_id;
1355
1356 /* Compute the inter-site MTU. This is min( our_mtu, their_mtu ).
1357 * But their mtu be unspecified, in which case we just use ours. */
1358 uint32_t intersite_mtu=
1359 MIN(st->mtu_target, st->remote_adv_mtu ?: ~(uint32_t)0);
1360 st->netlink->set_mtu(st->netlink->st,intersite_mtu);
1361
1362 slog(st,LOG_ACTIVATE_KEY,"new key activated"
1363 " (mtu ours=%"PRId32" theirs=%"PRId32" intersite=%"PRId32")",
1364 st->mtu_target, st->remote_adv_mtu, intersite_mtu);
1365 enter_state_run(st);
1366 }
1367
1368 static void delete_one_key(struct site *st, struct data_key *key,
1369 cstring_t reason, cstring_t which, uint32_t loglevel)
1370 {
1371 if (!is_transform_valid(key->transform)) return;
1372 if (reason) slog(st,loglevel,"%s deleted (%s)",which,reason);
1373 dispose_transform(&key->transform);
1374 key->key_timeout=0;
1375 }
1376
1377 static void delete_keys(struct site *st, cstring_t reason, uint32_t loglevel)
1378 {
1379 if (current_valid(st)) {
1380 slog(st,loglevel,"session closed (%s)",reason);
1381
1382 delete_one_key(st,&st->current,0,0,0);
1383 set_link_quality(st);
1384 }
1385 delete_one_key(st,&st->auxiliary_key,0,0,0);
1386 }
1387
1388 static void state_assert(struct site *st, bool_t ok)
1389 {
1390 if (!ok) fatal("site:state_assert");
1391 }
1392
1393 static void enter_state_stop(struct site *st)
1394 {
1395 st->state=SITE_STOP;
1396 st->timeout=0;
1397 delete_keys(st,"entering state STOP",LOG_TIMEOUT_KEY);
1398 dispose_transform(&st->new_transform);
1399 }
1400
1401 static void set_link_quality(struct site *st)
1402 {
1403 uint32_t quality;
1404 if (current_valid(st))
1405 quality=LINK_QUALITY_UP;
1406 else if (st->state==SITE_WAIT || st->state==SITE_STOP)
1407 quality=LINK_QUALITY_DOWN;
1408 else if (st->addresses)
1409 quality=LINK_QUALITY_DOWN_CURRENT_ADDRESS;
1410 else if (transport_peers_valid(&st->peers))
1411 quality=LINK_QUALITY_DOWN_STALE_ADDRESS;
1412 else
1413 quality=LINK_QUALITY_DOWN;
1414
1415 st->netlink->set_quality(st->netlink->st,quality);
1416 }
1417
1418 static void enter_state_run(struct site *st)
1419 {
1420 slog(st,LOG_STATE,"entering state RUN");
1421 st->state=SITE_RUN;
1422 st->timeout=0;
1423
1424 st->setup_session_id=0;
1425 transport_peers_clear(st,&st->setup_peers);
1426 FILLZERO(st->localN);
1427 FILLZERO(st->remoteN);
1428 dispose_transform(&st->new_transform);
1429 memset(st->dhsecret,0,st->dh->len);
1430 memset(st->sharedsecret,0,st->sharedsecretlen);
1431 set_link_quality(st);
1432 }
1433
1434 static bool_t ensure_resolving(struct site *st)
1435 {
1436 /* Reentrancy hazard: may call site_resolve_callback and hence
1437 * enter_new_state, enter_state_* and generate_msg*. */
1438 if (st->resolving_count)
1439 return True;
1440
1441 assert(st->addresses);
1442
1443 /* resolver->request might reentrantly call site_resolve_callback
1444 * which will decrement st->resolving, so we need to increment it
1445 * twice beforehand to prevent decrement from thinking we're
1446 * finished, and decrement it ourselves. Alternatively if
1447 * everything fails then there are no callbacks due and we simply
1448 * set it to 0 and return false.. */
1449 st->resolving_n_results_stored=0;
1450 st->resolving_n_results_all=0;
1451 st->resolving_count+=2;
1452 const char **addrp=st->addresses;
1453 const char *address;
1454 bool_t anyok=False;
1455 for (; (address=*addrp++); ) {
1456 bool_t ok = st->resolver->request(st->resolver->st,address,
1457 st->remoteport,st->comms[0],
1458 site_resolve_callback,st);
1459 if (ok)
1460 st->resolving_count++;
1461 anyok|=ok;
1462 }
1463 if (!anyok) {
1464 st->resolving_count=0;
1465 return False;
1466 }
1467 decrement_resolving_count(st,2);
1468 return True;
1469 }
1470
1471 static bool_t enter_state_resolve(struct site *st)
1472 {
1473 /* Reentrancy hazard! See ensure_resolving. */
1474 state_assert(st,st->state==SITE_RUN);
1475 slog(st,LOG_STATE,"entering state RESOLVE");
1476 st->state=SITE_RESOLVE;
1477 return ensure_resolving(st);
1478 }
1479
1480 static bool_t enter_new_state(struct site *st, uint32_t next)
1481 {
1482 bool_t (*gen)(struct site *st);
1483 int r;
1484
1485 slog(st,LOG_STATE,"entering state %s",state_name(next));
1486 switch(next) {
1487 case SITE_SENTMSG1:
1488 state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE);
1489 gen=generate_msg1;
1490 break;
1491 case SITE_SENTMSG2:
1492 state_assert(st,st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1493 st->state==SITE_SENTMSG1 || st->state==SITE_WAIT);
1494 gen=generate_msg2;
1495 break;
1496 case SITE_SENTMSG3:
1497 state_assert(st,st->state==SITE_SENTMSG1);
1498 BUF_FREE(&st->buffer);
1499 gen=generate_msg3;
1500 break;
1501 case SITE_SENTMSG4:
1502 state_assert(st,st->state==SITE_SENTMSG2);
1503 BUF_FREE(&st->buffer);
1504 gen=generate_msg4;
1505 break;
1506 case SITE_SENTMSG5:
1507 state_assert(st,st->state==SITE_SENTMSG3);
1508 BUF_FREE(&st->buffer);
1509 gen=generate_msg5;
1510 break;
1511 case SITE_RUN:
1512 state_assert(st,st->state==SITE_SENTMSG4);
1513 BUF_FREE(&st->buffer);
1514 gen=generate_msg6;
1515 break;
1516 default:
1517 gen=NULL;
1518 fatal("enter_new_state(%s): invalid new state",state_name(next));
1519 break;
1520 }
1521
1522 if (hacky_par_start_failnow()) return False;
1523
1524 r= gen(st) && send_msg(st);
1525
1526 hacky_par_end(&r,
1527 st->setup_retries, st->setup_retry_interval,
1528 send_msg, st);
1529
1530 if (r) {
1531 st->state=next;
1532 if (next==SITE_RUN) {
1533 BUF_FREE(&st->buffer); /* Never reused */
1534 st->timeout=0; /* Never retransmit */
1535 activate_new_key(st);
1536 }
1537 return True;
1538 }
1539 slog(st,LOG_ERROR,"error entering state %s",state_name(next));
1540 st->buffer.free=False; /* Unconditionally use the buffer; it may be
1541 in either state, and enter_state_wait() will
1542 do a BUF_FREE() */
1543 enter_state_wait(st);
1544 return False;
1545 }
1546
1547 /* msg7 tells our peer that we're about to forget our key */
1548 static bool_t send_msg7(struct site *st, cstring_t reason)
1549 {
1550 cstring_t transform_err;
1551
1552 if (current_valid(st) && st->buffer.free
1553 && transport_peers_valid(&st->peers)) {
1554 BUF_ALLOC(&st->buffer,"site:MSG7");
1555 buffer_init(&st->buffer,calculate_max_start_pad());
1556 buf_append_uint32(&st->buffer,LABEL_MSG7);
1557 buf_append_string(&st->buffer,reason);
1558 if (call_transform_forwards(st, st->current.transform,
1559 &st->buffer, &transform_err))
1560 goto free_out;
1561 buf_prepend_uint32(&st->buffer,LABEL_MSG0);
1562 buf_prepend_uint32(&st->buffer,st->index);
1563 buf_prepend_uint32(&st->buffer,st->current.remote_session_id);
1564 transport_xmit(st,&st->peers,&st->buffer,True);
1565 BUF_FREE(&st->buffer);
1566 free_out:
1567 return True;
1568 }
1569 return False;
1570 }
1571
1572 /* We go into this state if our peer becomes uncommunicative. Similar to
1573 the "stop" state, we forget all session keys for a while, before
1574 re-entering the "run" state. */
1575 static void enter_state_wait(struct site *st)
1576 {
1577 slog(st,LOG_STATE,"entering state WAIT");
1578 st->timeout=st->now+st->wait_timeout;
1579 st->state=SITE_WAIT;
1580 set_link_quality(st);
1581 BUF_FREE(&st->buffer); /* will have had an outgoing packet in it */
1582 /* XXX Erase keys etc. */
1583 }
1584
1585 static void generate_prod(struct site *st, struct buffer_if *buf)
1586 {
1587 buffer_init(buf,0);
1588 buf_append_uint32(buf,0);
1589 buf_append_uint32(buf,0);
1590 buf_append_uint32(buf,LABEL_PROD);
1591 buf_append_string(buf,st->localname);
1592 buf_append_string(buf,st->remotename);
1593 }
1594
1595 static void generate_send_prod(struct site *st,
1596 const struct comm_addr *source)
1597 {
1598 if (!st->allow_send_prod) return; /* too soon */
1599 if (!(st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1600 st->state==SITE_WAIT)) return; /* we'd ignore peer's MSG1 */
1601
1602 slog(st,LOG_SETUP_INIT,"prodding peer for key exchange");
1603 st->allow_send_prod=0;
1604 generate_prod(st,&st->scratch);
1605 bool_t ok = source->comm->sendmsg(source->comm->st, &st->scratch, source);
1606 dump_packet(st,&st->scratch,source,False,ok);
1607 }
1608
1609 static inline void site_settimeout(uint64_t timeout, int *timeout_io)
1610 {
1611 if (timeout) {
1612 int64_t offset=timeout-*now;
1613 if (offset<0) offset=0;
1614 if (offset>INT_MAX) offset=INT_MAX;
1615 if (*timeout_io<0 || offset<*timeout_io)
1616 *timeout_io=offset;
1617 }
1618 }
1619
1620 static int site_beforepoll(void *sst, struct pollfd *fds, int *nfds_io,
1621 int *timeout_io)
1622 {
1623 struct site *st=sst;
1624
1625 BEFOREPOLL_WANT_FDS(0); /* We don't use any file descriptors */
1626 st->now=*now;
1627
1628 /* Work out when our next timeout is. The earlier of 'timeout' or
1629 'current.key_timeout'. A stored value of '0' indicates no timeout
1630 active. */
1631 site_settimeout(st->timeout, timeout_io);
1632 site_settimeout(st->current.key_timeout, timeout_io);
1633 site_settimeout(st->auxiliary_key.key_timeout, timeout_io);
1634
1635 return 0; /* success */
1636 }
1637
1638 static void check_expiry(struct site *st, struct data_key *key,
1639 const char *which)
1640 {
1641 if (key->key_timeout && *now>key->key_timeout) {
1642 delete_one_key(st,key,"maximum life exceeded",which,LOG_TIMEOUT_KEY);
1643 }
1644 }
1645
1646 /* NB site_afterpoll will be called before site_beforepoll is ever called */
1647 static void site_afterpoll(void *sst, struct pollfd *fds, int nfds)
1648 {
1649 struct site *st=sst;
1650
1651 st->now=*now;
1652 if (st->timeout && *now>st->timeout) {
1653 st->timeout=0;
1654 if (st->state>=SITE_SENTMSG1 && st->state<=SITE_SENTMSG5) {
1655 if (!hacky_par_start_failnow())
1656 send_msg(st);
1657 } else if (st->state==SITE_WAIT) {
1658 enter_state_run(st);
1659 } else {
1660 slog(st,LOG_ERROR,"site_afterpoll: unexpected timeout, state=%d",
1661 st->state);
1662 }
1663 }
1664 check_expiry(st,&st->current,"current key");
1665 check_expiry(st,&st->auxiliary_key,"auxiliary key");
1666 }
1667
1668 /* This function is called by the netlink device to deliver packets
1669 intended for the remote network. The packet is in "raw" wire
1670 format, but is guaranteed to be word-aligned. */
1671 static void site_outgoing(void *sst, struct buffer_if *buf)
1672 {
1673 struct site *st=sst;
1674 cstring_t transform_err;
1675
1676 if (st->state==SITE_STOP) {
1677 BUF_FREE(buf);
1678 return;
1679 }
1680
1681 st->allow_send_prod=1;
1682
1683 /* In all other states we consider delivering the packet if we have
1684 a valid key and a valid address to send it to. */
1685 if (current_valid(st) && transport_peers_valid(&st->peers)) {
1686 /* Transform it and send it */
1687 if (buf->size>0) {
1688 buf_prepend_uint32(buf,LABEL_MSG9);
1689 if (call_transform_forwards(st, st->current.transform,
1690 buf, &transform_err))
1691 goto free_out;
1692 buf_prepend_uint32(buf,LABEL_MSG0);
1693 buf_prepend_uint32(buf,st->index);
1694 buf_prepend_uint32(buf,st->current.remote_session_id);
1695 transport_xmit(st,&st->peers,buf,False);
1696 }
1697 free_out:
1698 BUF_FREE(buf);
1699 return;
1700 }
1701
1702 slog(st,LOG_DROP,"discarding outgoing packet of size %d",buf->size);
1703 BUF_FREE(buf);
1704 initiate_key_setup(st,"outgoing packet",0);
1705 }
1706
1707 static bool_t named_for_us(struct site *st, const struct buffer_if *buf_in,
1708 uint32_t type, struct msg *m)
1709 /* For packets which are identified by the local and remote names.
1710 * If it has our name and our peer's name in it it's for us. */
1711 {
1712 struct buffer_if buf[1];
1713 buffer_readonly_clone(buf,buf_in);
1714 return unpick_msg(st,type,buf,m)
1715 && name_matches(&m->remote,st->remotename)
1716 && name_matches(&m->local,st->localname);
1717 }
1718
1719 /* This function is called by the communication device to deliver
1720 packets from our peers.
1721 It should return True if the packet is recognised as being for
1722 this current site instance (and should therefore not be processed
1723 by other sites), even if the packet was otherwise ignored. */
1724 static bool_t site_incoming(void *sst, struct buffer_if *buf,
1725 const struct comm_addr *source)
1726 {
1727 struct site *st=sst;
1728
1729 if (buf->size < 12) return False;
1730
1731 uint32_t dest=get_uint32(buf->start);
1732 uint32_t msgtype=get_uint32(buf->start+8);
1733 struct msg named_msg;
1734
1735 if (msgtype==LABEL_MSG1) {
1736 if (!named_for_us(st,buf,msgtype,&named_msg))
1737 return False;
1738 /* It's a MSG1 addressed to us. Decide what to do about it. */
1739 dump_packet(st,buf,source,True,True);
1740 if (st->state==SITE_RUN || st->state==SITE_RESOLVE ||
1741 st->state==SITE_WAIT) {
1742 /* We should definitely process it */
1743 transport_compute_setupinit_peers(st,0,0,source);
1744 if (process_msg1(st,buf,source,&named_msg)) {
1745 slog(st,LOG_SETUP_INIT,"key setup initiated by peer");
1746 bool_t entered=enter_new_state(st,SITE_SENTMSG2);
1747 if (entered && st->addresses && st->local_mobile)
1748 /* We must do this as the very last thing, because
1749 the resolver callback might reenter us. */
1750 ensure_resolving(st);
1751 } else {
1752 slog(st,LOG_ERROR,"failed to process incoming msg1");
1753 }
1754 BUF_FREE(buf);
1755 return True;
1756 } else if (st->state==SITE_SENTMSG1) {
1757 /* We've just sent a message 1! They may have crossed on
1758 the wire. If we have priority then we ignore the
1759 incoming one, otherwise we process it as usual. */
1760 if (st->setup_priority) {
1761 BUF_FREE(buf);
1762 slog(st,LOG_DUMP,"crossed msg1s; we are higher "
1763 "priority => ignore incoming msg1");
1764 return True;
1765 } else {
1766 slog(st,LOG_DUMP,"crossed msg1s; we are lower "
1767 "priority => use incoming msg1");
1768 if (process_msg1(st,buf,source,&named_msg)) {
1769 BUF_FREE(&st->buffer); /* Free our old message 1 */
1770 transport_setup_msgok(st,source);
1771 enter_new_state(st,SITE_SENTMSG2);
1772 } else {
1773 slog(st,LOG_ERROR,"failed to process an incoming "
1774 "crossed msg1 (we have low priority)");
1775 }
1776 BUF_FREE(buf);
1777 return True;
1778 }
1779 }
1780 /* The message 1 was received at an unexpected stage of the
1781 key setup. XXX POLICY - what do we do? */
1782 slog(st,LOG_UNEXPECTED,"unexpected incoming message 1");
1783 BUF_FREE(buf);
1784 return True;
1785 }
1786 if (msgtype==LABEL_PROD) {
1787 if (!named_for_us(st,buf,msgtype,&named_msg))
1788 return False;
1789 dump_packet(st,buf,source,True,True);
1790 if (st->state!=SITE_RUN) {
1791 slog(st,LOG_DROP,"ignoring PROD when not in state RUN");
1792 } else if (current_valid(st)) {
1793 slog(st,LOG_DROP,"ignoring PROD when we think we have a key");
1794 } else {
1795 initiate_key_setup(st,"peer sent PROD packet",source);
1796 }
1797 BUF_FREE(buf);
1798 return True;
1799 }
1800 if (dest==st->index) {
1801 /* Explicitly addressed to us */
1802 if (msgtype!=LABEL_MSG0) dump_packet(st,buf,source,True,True);
1803 switch (msgtype) {
1804 case LABEL_NAK:
1805 /* If the source is our current peer then initiate a key setup,
1806 because our peer's forgotten the key */
1807 if (get_uint32(buf->start+4)==st->current.remote_session_id) {
1808 bool_t initiated;
1809 initiated = initiate_key_setup(st,"received a NAK",source);
1810 if (!initiated) generate_send_prod(st,source);
1811 } else {
1812 slog(st,LOG_SEC,"bad incoming NAK");
1813 }
1814 break;
1815 case LABEL_MSG0:
1816 process_msg0(st,buf,source);
1817 break;
1818 case LABEL_MSG1:
1819 /* Setup packet: should not have been explicitly addressed
1820 to us */
1821 slog(st,LOG_SEC,"incoming explicitly addressed msg1");
1822 break;
1823 case LABEL_MSG2:
1824 /* Setup packet: expected only in state SENTMSG1 */
1825 if (st->state!=SITE_SENTMSG1) {
1826 slog(st,LOG_UNEXPECTED,"unexpected MSG2");
1827 } else if (process_msg2(st,buf,source)) {
1828 transport_setup_msgok(st,source);
1829 enter_new_state(st,SITE_SENTMSG3);
1830 } else {
1831 slog(st,LOG_SEC,"invalid MSG2");
1832 }
1833 break;
1834 case LABEL_MSG3:
1835 case LABEL_MSG3BIS:
1836 /* Setup packet: expected only in state SENTMSG2 */
1837 if (st->state!=SITE_SENTMSG2) {
1838 slog(st,LOG_UNEXPECTED,"unexpected MSG3");
1839 } else if (process_msg3(st,buf,source,msgtype)) {
1840 transport_setup_msgok(st,source);
1841 enter_new_state(st,SITE_SENTMSG4);
1842 } else {
1843 slog(st,LOG_SEC,"invalid MSG3");
1844 }
1845 break;
1846 case LABEL_MSG4:
1847 /* Setup packet: expected only in state SENTMSG3 */
1848 if (st->state!=SITE_SENTMSG3) {
1849 slog(st,LOG_UNEXPECTED,"unexpected MSG4");
1850 } else if (process_msg4(st,buf,source)) {
1851 transport_setup_msgok(st,source);
1852 enter_new_state(st,SITE_SENTMSG5);
1853 } else {
1854 slog(st,LOG_SEC,"invalid MSG4");
1855 }
1856 break;
1857 case LABEL_MSG5:
1858 /* Setup packet: expected only in state SENTMSG4 */
1859 /* (may turn up in state RUN if our return MSG6 was lost
1860 and the new key has already been activated. In that
1861 case we discard it. The peer will realise that we
1862 are using the new key when they see our data packets.
1863 Until then the peer's data packets to us get discarded. */
1864 if (st->state==SITE_SENTMSG4) {
1865 if (process_msg5(st,buf,source,st->new_transform)) {
1866 transport_setup_msgok(st,source);
1867 enter_new_state(st,SITE_RUN);
1868 } else {
1869 slog(st,LOG_SEC,"invalid MSG5");
1870 }
1871 } else if (st->state==SITE_RUN) {
1872 if (process_msg5(st,buf,source,st->current.transform)) {
1873 slog(st,LOG_DROP,"got MSG5, retransmitting MSG6");
1874 transport_setup_msgok(st,source);
1875 create_msg6(st,st->current.transform,
1876 st->current.remote_session_id);
1877 transport_xmit(st,&st->peers,&st->buffer,True);
1878 BUF_FREE(&st->buffer);
1879 } else {
1880 slog(st,LOG_SEC,"invalid MSG5 (in state RUN)");
1881 }
1882 } else {
1883 slog(st,LOG_UNEXPECTED,"unexpected MSG5");
1884 }
1885 break;
1886 case LABEL_MSG6:
1887 /* Setup packet: expected only in state SENTMSG5 */
1888 if (st->state!=SITE_SENTMSG5) {
1889 slog(st,LOG_UNEXPECTED,"unexpected MSG6");
1890 } else if (process_msg6(st,buf,source)) {
1891 BUF_FREE(&st->buffer); /* Free message 5 */
1892 transport_setup_msgok(st,source);
1893 activate_new_key(st);
1894 } else {
1895 slog(st,LOG_SEC,"invalid MSG6");
1896 }
1897 break;
1898 default:
1899 slog(st,LOG_SEC,"received message of unknown type 0x%08x",
1900 msgtype);
1901 break;
1902 }
1903 BUF_FREE(buf);
1904 return True;
1905 }
1906
1907 return False;
1908 }
1909
1910 static void site_control(void *vst, bool_t run)
1911 {
1912 struct site *st=vst;
1913 if (run) enter_state_run(st);
1914 else enter_state_stop(st);
1915 }
1916
1917 static void site_phase_hook(void *sst, uint32_t newphase)
1918 {
1919 struct site *st=sst;
1920
1921 /* The program is shutting down; tell our peer */
1922 send_msg7(st,"shutting down");
1923 }
1924
1925 static void site_childpersist_clearkeys(void *sst, uint32_t newphase)
1926 {
1927 struct site *st=sst;
1928 dispose_transform(&st->current.transform);
1929 dispose_transform(&st->auxiliary_key.transform);
1930 dispose_transform(&st->new_transform);
1931 /* Not much point overwiting the signing key, since we loaded it
1932 from disk, and it is only valid prospectively if at all,
1933 anyway. */
1934 /* XXX it would be best to overwrite the DH state, because that
1935 _is_ relevant to forward secrecy. However we have no
1936 convenient interface for doing that and in practice gmp has
1937 probably dribbled droppings all over the malloc arena. A good
1938 way to fix this would be to have a privsep child for asymmetric
1939 crypto operations, but that's a task for another day. */
1940 }
1941
1942 static list_t *site_apply(closure_t *self, struct cloc loc, dict_t *context,
1943 list_t *args)
1944 {
1945 static uint32_t index_sequence;
1946 struct site *st;
1947 item_t *item;
1948 dict_t *dict;
1949 int i;
1950
1951 NEW(st);
1952
1953 st->cl.description="site";
1954 st->cl.type=CL_SITE;
1955 st->cl.apply=NULL;
1956 st->cl.interface=&st->ops;
1957 st->ops.st=st;
1958 st->ops.control=site_control;
1959 st->ops.status=site_status;
1960
1961 /* First parameter must be a dict */
1962 item=list_elem(args,0);
1963 if (!item || item->type!=t_dict)
1964 cfgfatal(loc,"site","parameter must be a dictionary\n");
1965
1966 dict=item->data.dict;
1967 st->localname=dict_read_string(dict, "local-name", True, "site", loc);
1968 st->remotename=dict_read_string(dict, "name", True, "site", loc);
1969
1970 st->peer_mobile=dict_read_bool(dict,"mobile",False,"site",loc,False);
1971 st->local_mobile=
1972 dict_read_bool(dict,"local-mobile",False,"site",loc,False);
1973
1974 /* Sanity check (which also allows the 'sites' file to include
1975 site() closures for all sites including our own): refuse to
1976 talk to ourselves */
1977 if (strcmp(st->localname,st->remotename)==0) {
1978 Message(M_DEBUG,"site %s: local-name==name -> ignoring this site\n",
1979 st->localname);
1980 if (st->peer_mobile != st->local_mobile)
1981 cfgfatal(loc,"site","site %s's peer-mobile=%d"
1982 " but our local-mobile=%d\n",
1983 st->localname, st->peer_mobile, st->local_mobile);
1984 free(st);
1985 return NULL;
1986 }
1987 if (st->peer_mobile && st->local_mobile) {
1988 Message(M_WARNING,"site %s: site is mobile but so are we"
1989 " -> ignoring this site\n", st->remotename);
1990 free(st);
1991 return NULL;
1992 }
1993
1994 assert(index_sequence < 0xffffffffUL);
1995 st->index = ++index_sequence;
1996 st->local_capabilities = 0;
1997 st->netlink=find_cl_if(dict,"link",CL_NETLINK,True,"site",loc);
1998
1999 #define GET_CLOSURE_LIST(dictkey,things,nthings,CL_TYPE) do{ \
2000 list_t *things##_cfg=dict_lookup(dict,dictkey); \
2001 if (!things##_cfg) \
2002 cfgfatal(loc,"site","closure list \"%s\" not found\n",dictkey); \
2003 st->nthings=list_length(things##_cfg); \
2004 NEW_ARY(st->things,st->nthings); \
2005 assert(st->nthings); \
2006 for (i=0; i<st->nthings; i++) { \
2007 item_t *item=list_elem(things##_cfg,i); \
2008 if (item->type!=t_closure) \
2009 cfgfatal(loc,"site","%s is not a closure\n",dictkey); \
2010 closure_t *cl=item->data.closure; \
2011 if (cl->type!=CL_TYPE) \
2012 cfgfatal(loc,"site","%s closure wrong type\n",dictkey); \
2013 st->things[i]=cl->interface; \
2014 } \
2015 }while(0)
2016
2017 GET_CLOSURE_LIST("comm",comms,ncomms,CL_COMM);
2018
2019 st->resolver=find_cl_if(dict,"resolver",CL_RESOLVER,True,"site",loc);
2020 st->log=find_cl_if(dict,"log",CL_LOG,True,"site",loc);
2021 st->random=find_cl_if(dict,"random",CL_RANDOMSRC,True,"site",loc);
2022
2023 st->privkey=find_cl_if(dict,"local-key",CL_RSAPRIVKEY,True,"site",loc);
2024 st->addresses=dict_read_string_array(dict,"address",False,"site",loc,0);
2025 if (st->addresses)
2026 st->remoteport=dict_read_number(dict,"port",True,"site",loc,0);
2027 else st->remoteport=0;
2028 st->pubkey=find_cl_if(dict,"key",CL_RSAPUBKEY,True,"site",loc);
2029
2030 GET_CLOSURE_LIST("transform",transforms,ntransforms,CL_TRANSFORM);
2031
2032 st->dh=find_cl_if(dict,"dh",CL_DH,True,"site",loc);
2033 st->hash=find_cl_if(dict,"hash",CL_HASH,True,"site",loc);
2034
2035 #define DEFAULT(D) (st->peer_mobile || st->local_mobile \
2036 ? DEFAULT_MOBILE_##D : DEFAULT_##D)
2037 #define CFG_NUMBER(k,D) dict_read_number(dict,(k),False,"site",loc,DEFAULT(D));
2038
2039 st->key_lifetime= CFG_NUMBER("key-lifetime", KEY_LIFETIME);
2040 st->setup_retries= CFG_NUMBER("setup-retries", SETUP_RETRIES);
2041 st->setup_retry_interval= CFG_NUMBER("setup-timeout", SETUP_RETRY_INTERVAL);
2042 st->wait_timeout= CFG_NUMBER("wait-time", WAIT_TIME);
2043 st->mtu_target= dict_read_number(dict,"mtu-target",False,"site",loc,0);
2044
2045 st->mobile_peer_expiry= dict_read_number(
2046 dict,"mobile-peer-expiry",False,"site",loc,DEFAULT_MOBILE_PEER_EXPIRY);
2047
2048 const char *peerskey= st->peer_mobile
2049 ? "mobile-peers-max" : "static-peers-max";
2050 st->transport_peers_max= dict_read_number(
2051 dict,peerskey,False,"site",loc, st->addresses ? 4 : 3);
2052 if (st->transport_peers_max<1 ||
2053 st->transport_peers_max>MAX_PEER_ADDRS) {
2054 cfgfatal(loc,"site", "%s must be in range 1.."
2055 STRING(MAX_PEER_ADDRS) "\n", peerskey);
2056 }
2057
2058 if (st->key_lifetime < DEFAULT(KEY_RENEGOTIATE_GAP)*2)
2059 st->key_renegotiate_time=st->key_lifetime/2;
2060 else
2061 st->key_renegotiate_time=st->key_lifetime-DEFAULT(KEY_RENEGOTIATE_GAP);
2062 st->key_renegotiate_time=dict_read_number(
2063 dict,"renegotiate-time",False,"site",loc,st->key_renegotiate_time);
2064 if (st->key_renegotiate_time > st->key_lifetime) {
2065 cfgfatal(loc,"site",
2066 "renegotiate-time must be less than key-lifetime\n");
2067 }
2068
2069 st->log_events=string_list_to_word(dict_lookup(dict,"log-events"),
2070 log_event_table,"site");
2071
2072 st->resolving_count=0;
2073 st->allow_send_prod=0;
2074
2075 st->tunname=safe_malloc(strlen(st->localname)+strlen(st->remotename)+5,
2076 "site_apply");
2077 sprintf(st->tunname,"%s<->%s",st->localname,st->remotename);
2078
2079 /* The information we expect to see in incoming messages of type 1 */
2080 /* fixme: lots of unchecked overflows here, but the results are only
2081 corrupted packets rather than undefined behaviour */
2082 st->setup_priority=(strcmp(st->localname,st->remotename)>0);
2083
2084 buffer_new(&st->buffer,SETUP_BUFFER_LEN);
2085
2086 buffer_new(&st->scratch,SETUP_BUFFER_LEN);
2087 BUF_ALLOC(&st->scratch,"site:scratch");
2088
2089 /* We are interested in poll(), but only for timeouts. We don't have
2090 any fds of our own. */
2091 register_for_poll(st, site_beforepoll, site_afterpoll, "site");
2092 st->timeout=0;
2093
2094 st->remote_capabilities=0;
2095 st->chosen_transform=0;
2096 st->current.key_timeout=0;
2097 st->auxiliary_key.key_timeout=0;
2098 transport_peers_clear(st,&st->peers);
2099 transport_peers_clear(st,&st->setup_peers);
2100 /* XXX mlock these */
2101 st->dhsecret=safe_malloc(st->dh->len,"site:dhsecret");
2102 st->sharedsecretlen=st->sharedsecretallocd=0;
2103 st->sharedsecret=0;
2104
2105 for (i=0; i<st->ntransforms; i++) {
2106 struct transform_if *ti=st->transforms[i];
2107 uint32_t capbit = 1UL << ti->capab_transformnum;
2108 if (st->local_capabilities & capbit)
2109 slog(st,LOG_ERROR,"transformnum capability bit"
2110 " %d (%#"PRIx32") reused", ti->capab_transformnum, capbit);
2111 st->local_capabilities |= capbit;
2112 }
2113
2114 /* We need to register the remote networks with the netlink device */
2115 uint32_t netlink_mtu; /* local virtual interface mtu */
2116 st->netlink->reg(st->netlink->st, site_outgoing, st, &netlink_mtu);
2117 if (!st->mtu_target)
2118 st->mtu_target=netlink_mtu;
2119
2120 for (i=0; i<st->ncomms; i++)
2121 st->comms[i]->request_notify(st->comms[i]->st, st, site_incoming);
2122
2123 st->current.transform=0;
2124 st->auxiliary_key.transform=0;
2125 st->new_transform=0;
2126 st->auxiliary_is_new=0;
2127
2128 enter_state_stop(st);
2129
2130 add_hook(PHASE_SHUTDOWN,site_phase_hook,st);
2131 add_hook(PHASE_CHILDPERSIST,site_childpersist_clearkeys,st);
2132
2133 return new_closure(&st->cl);
2134 }
2135
2136 void site_module(dict_t *dict)
2137 {
2138 add_closure(dict,"site",site_apply);
2139 }
2140
2141
2142 /***** TRANSPORT PEERS definitions *****/
2143
2144 static void transport_peers_debug(struct site *st, transport_peers *dst,
2145 const char *didwhat,
2146 int nargs, const struct comm_addr *args,
2147 size_t stride) {
2148 int i;
2149 char *argp;
2150
2151 if (!(st->log_events & LOG_PEER_ADDRS))
2152 return; /* an optimisation */
2153
2154 slog(st, LOG_PEER_ADDRS, "peers (%s) %s nargs=%d => npeers=%d",
2155 (dst==&st->peers ? "data" :
2156 dst==&st->setup_peers ? "setup" : "UNKNOWN"),
2157 didwhat, nargs, dst->npeers);
2158
2159 for (i=0, argp=(void*)args;
2160 i<nargs;
2161 i++, (argp+=stride?stride:sizeof(*args))) {
2162 const struct comm_addr *ca=(void*)argp;
2163 slog(st, LOG_PEER_ADDRS, " args: addrs[%d]=%s",
2164 i, comm_addr_to_string(ca));
2165 }
2166 for (i=0; i<dst->npeers; i++) {
2167 struct timeval diff;
2168 timersub(tv_now,&dst->peers[i].last,&diff);
2169 const struct comm_addr *ca=&dst->peers[i].addr;
2170 slog(st, LOG_PEER_ADDRS, " peers: addrs[%d]=%s T-%ld.%06ld",
2171 i, comm_addr_to_string(ca),
2172 (unsigned long)diff.tv_sec, (unsigned long)diff.tv_usec);
2173 }
2174 }
2175
2176 static void transport_peers_expire(struct site *st, transport_peers *peers) {
2177 /* peers must be sorted first */
2178 int previous_peers=peers->npeers;
2179 struct timeval oldest;
2180 oldest.tv_sec = tv_now->tv_sec - st->mobile_peer_expiry;
2181 oldest.tv_usec = tv_now->tv_usec;
2182 while (peers->npeers>1 &&
2183 timercmp(&peers->peers[peers->npeers-1].last, &oldest, <))
2184 peers->npeers--;
2185 if (peers->npeers != previous_peers)
2186 transport_peers_debug(st,peers,"expire", 0,0,0);
2187 }
2188
2189 static bool_t transport_peer_record_one(struct site *st, transport_peers *peers,
2190 const struct comm_addr *ca,
2191 const struct timeval *tv) {
2192 /* returns false if output is full */
2193 int search;
2194
2195 if (peers->npeers >= st->transport_peers_max)
2196 return 0;
2197
2198 for (search=0; search<peers->npeers; search++)
2199 if (comm_addr_equal(&peers->peers[search].addr, ca))
2200 return 1;
2201
2202 peers->peers[peers->npeers].addr = *ca;
2203 peers->peers[peers->npeers].last = *tv;
2204 peers->npeers++;
2205 return 1;
2206 }
2207
2208 static void transport_record_peers(struct site *st, transport_peers *peers,
2209 const struct comm_addr *addrs, int naddrs,
2210 const char *m) {
2211 /* We add addrs into peers. The new entries end up at the front
2212 * and displace entries towards the end (perhaps even off the
2213 * end). Any existing matching entries are moved up to the front.
2214 *
2215 * Caller must first call transport_peers_expire. */
2216
2217 if (naddrs==1 && peers->npeers>=1 &&
2218 comm_addr_equal(&addrs[0], &peers->peers[0].addr)) {
2219 /* optimisation, also avoids debug for trivial updates */
2220 peers->peers[0].last = *tv_now;
2221 return;
2222 }
2223
2224 int old_npeers=peers->npeers;
2225 transport_peer old_peers[old_npeers];
2226 COPY_ARRAY(old_peers,peers->peers,old_npeers);
2227
2228 peers->npeers=0;
2229 int i;
2230 for (i=0; i<naddrs; i++) {
2231 if (!transport_peer_record_one(st,peers, &addrs[i], tv_now))
2232 break;
2233 }
2234 for (i=0; i<old_npeers; i++) {
2235 const transport_peer *old=&old_peers[i];
2236 if (!transport_peer_record_one(st,peers, &old->addr, &old->last))
2237 break;
2238 }
2239
2240 transport_peers_debug(st,peers,m, naddrs,addrs,0);
2241 }
2242
2243 static void transport_expire_record_peers(struct site *st,
2244 transport_peers *peers,
2245 const struct comm_addr *addrs,
2246 int naddrs, const char *m) {
2247 /* Convenience function */
2248 transport_peers_expire(st,peers);
2249 transport_record_peers(st,peers,addrs,naddrs,m);
2250 }
2251
2252 static bool_t transport_compute_setupinit_peers(struct site *st,
2253 const struct comm_addr *configured_addrs /* 0 if none or not found */,
2254 int n_configured_addrs /* 0 if none or not found */,
2255 const struct comm_addr *incoming_packet_addr /* 0 if none */) {
2256 if (!n_configured_addrs && !incoming_packet_addr &&
2257 !transport_peers_valid(&st->peers))
2258 return False;
2259
2260 slog(st,LOG_SETUP_INIT,
2261 "using: %d configured addr(s);%s %d old peer addrs(es)",
2262 n_configured_addrs,
2263 incoming_packet_addr ? " incoming packet address;" : "",
2264 st->peers.npeers);
2265
2266 /* Non-mobile peers try addresses until one is plausible. The
2267 * effect is that this code always tries first the configured
2268 * address if supplied, or otherwise the address of the incoming
2269 * PROD, or finally the existing data peer if one exists; this is
2270 * as desired. */
2271
2272 transport_peers_copy(st,&st->setup_peers,&st->peers);
2273 transport_peers_expire(st,&st->setup_peers);
2274
2275 if (incoming_packet_addr)
2276 transport_record_peers(st,&st->setup_peers,
2277 incoming_packet_addr,1, "incoming");
2278
2279 if (n_configured_addrs)
2280 transport_record_peers(st,&st->setup_peers,
2281 configured_addrs,n_configured_addrs, "setupinit");
2282
2283 assert(transport_peers_valid(&st->setup_peers));
2284 return True;
2285 }
2286
2287 static void transport_setup_msgok(struct site *st, const struct comm_addr *a) {
2288 if (st->peer_mobile)
2289 transport_expire_record_peers(st,&st->setup_peers,a,1,"setupmsg");
2290 }
2291 static void transport_data_msgok(struct site *st, const struct comm_addr *a) {
2292 if (st->peer_mobile)
2293 transport_expire_record_peers(st,&st->peers,a,1,"datamsg");
2294 }
2295
2296 static int transport_peers_valid(transport_peers *peers) {
2297 return peers->npeers;
2298 }
2299 static void transport_peers_clear(struct site *st, transport_peers *peers) {
2300 peers->npeers= 0;
2301 transport_peers_debug(st,peers,"clear",0,0,0);
2302 }
2303 static void transport_peers_copy(struct site *st, transport_peers *dst,
2304 const transport_peers *src) {
2305 dst->npeers=src->npeers;
2306 COPY_ARRAY(dst->peers, src->peers, dst->npeers);
2307 transport_peers_debug(st,dst,"copy",
2308 src->npeers, &src->peers->addr, sizeof(*src->peers));
2309 }
2310
2311 static void transport_resolve_complete(struct site *st,
2312 const struct comm_addr *addrs,
2313 int naddrs) {
2314 transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2315 "resolved data");
2316 transport_expire_record_peers(st,&st->setup_peers,addrs,naddrs,
2317 "resolved setup");
2318 }
2319
2320 static void transport_resolve_complete_tardy(struct site *st,
2321 const struct comm_addr *addrs,
2322 int naddrs) {
2323 transport_expire_record_peers(st,&st->peers,addrs,naddrs,
2324 "resolved tardily");
2325 }
2326
2327 static void transport_peers__copy_by_mask(transport_peer *out, int *nout_io,
2328 unsigned mask,
2329 const transport_peers *inp) {
2330 /* out and in->peers may be the same region, or nonoverlapping */
2331 const transport_peer *in=inp->peers;
2332 int slot;
2333 for (slot=0; slot<inp->npeers; slot++) {
2334 if (!(mask & (1U << slot)))
2335 continue;
2336 if (!(out==in && slot==*nout_io))
2337 COPY_OBJ(out[*nout_io], in[slot]);
2338 (*nout_io)++;
2339 }
2340 }
2341
2342 void transport_xmit(struct site *st, transport_peers *peers,
2343 struct buffer_if *buf, bool_t candebug) {
2344 int slot;
2345 transport_peers_expire(st, peers);
2346 unsigned failed=0; /* bitmask */
2347 assert(MAX_PEER_ADDRS < sizeof(unsigned)*CHAR_BIT);
2348
2349 int nfailed=0;
2350 for (slot=0; slot<peers->npeers; slot++) {
2351 transport_peer *peer=&peers->peers[slot];
2352 bool_t ok =
2353 peer->addr.comm->sendmsg(peer->addr.comm->st, buf, &peer->addr);
2354 if (candebug)
2355 dump_packet(st, buf, &peer->addr, False, ok);
2356 if (!ok) {
2357 failed |= 1U << slot;
2358 nfailed++;
2359 }
2360 if (ok && !st->peer_mobile)
2361 break;
2362 }
2363 /* Now we need to demote/delete failing addrs: if we are mobile we
2364 * merely demote them; otherwise we delete them. */
2365 if (st->local_mobile) {
2366 unsigned expected = ((1U << nfailed)-1) << (peers->npeers-nfailed);
2367 /* `expected' has all the failures at the end already */
2368 if (failed != expected) {
2369 int fslot=0;
2370 transport_peer failedpeers[nfailed];
2371 transport_peers__copy_by_mask(failedpeers, &fslot, failed,peers);
2372 assert(fslot == nfailed);
2373 int wslot=0;
2374 transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2375 assert(wslot+nfailed == peers->npeers);
2376 COPY_ARRAY(peers->peers+wslot, failedpeers, nfailed);
2377 }
2378 } else {
2379 if (failed && peers->npeers > 1) {
2380 int wslot=0;
2381 transport_peers__copy_by_mask(peers->peers,&wslot,~failed,peers);
2382 peers->npeers=wslot;
2383 }
2384 }
2385 }
2386
2387 /***** END of transport peers declarations *****/