ntp_proto.c revision 282408
1/*
2 * ntp_proto.c - NTP version 4 protocol machinery
3 *
4 * ATTENTION: Get approval from Dave Mills on all changes to this file!
5 *
6 */
7#ifdef HAVE_CONFIG_H
8#include <config.h>
9#endif
10
11#include "ntpd.h"
12#include "ntp_stdlib.h"
13#include "ntp_unixtime.h"
14#include "ntp_control.h"
15#include "ntp_string.h"
16#include "ntp_leapsec.h"
17
18#include <stdio.h>
19#ifdef HAVE_LIBSCF_H
20#include <libscf.h>
21#endif
22#ifdef HAVE_UNISTD_H
23#include <unistd.h>
24#endif
25
26/*
27 * This macro defines the authentication state. If x is 1 authentication
28 * is required; othewise it is optional.
29 */
30#define	AUTH(x, y)	((x) ? (y) == AUTH_OK : (y) == AUTH_OK || \
31			    (y) == AUTH_NONE)
32
33#define	AUTH_NONE	0	/* authentication not required */
34#define	AUTH_OK		1	/* authentication OK */
35#define	AUTH_ERROR	2	/* authentication error */
36#define	AUTH_CRYPTO	3	/* crypto_NAK */
37
38/*
39 * traffic shaping parameters
40 */
41#define	NTP_IBURST	6	/* packets in iburst */
42#define	RESP_DELAY	1	/* refclock burst delay (s) */
43
44/*
45 * pool soliciting restriction duration (s)
46 */
47#define	POOL_SOLICIT_WINDOW	8
48
49/*
50 * peer_select groups statistics for a peer used by clock_select() and
51 * clock_cluster().
52 */
53typedef struct peer_select_tag {
54	struct peer *	peer;
55	double		synch;	/* sync distance */
56	double		error;	/* jitter */
57	double		seljit;	/* selection jitter */
58} peer_select;
59
60/*
61 * System variables are declared here. Unless specified otherwise, all
62 * times are in seconds.
63 */
64u_char	sys_leap;		/* system leap indicator */
65u_char	sys_stratum;		/* system stratum */
66s_char	sys_precision;		/* local clock precision (log2 s) */
67double	sys_rootdelay;		/* roundtrip delay to primary source */
68double	sys_rootdisp;		/* dispersion to primary source */
69u_int32 sys_refid;		/* reference id (network byte order) */
70l_fp	sys_reftime;		/* last update time */
71struct	peer *sys_peer;		/* current peer */
72
73/*
74 * Rate controls. Leaky buckets are used to throttle the packet
75 * transmission rates in order to protect busy servers such as at NIST
76 * and USNO. There is a counter for each association and another for KoD
77 * packets. The association counter decrements each second, but not
78 * below zero. Each time a packet is sent the counter is incremented by
79 * a configurable value representing the average interval between
80 * packets. A packet is delayed as long as the counter is greater than
81 * zero. Note this does not affect the time value computations.
82 */
83/*
84 * Nonspecified system state variables
85 */
86int	sys_bclient;		/* broadcast client enable */
87double	sys_bdelay;		/* broadcast client default delay */
88int	sys_authenticate;	/* requre authentication for config */
89l_fp	sys_authdelay;		/* authentication delay */
90double	sys_offset;	/* current local clock offset */
91double	sys_mindisp = MINDISPERSE; /* minimum distance (s) */
92double	sys_maxdist = MAXDISTANCE; /* selection threshold */
93double	sys_jitter;		/* system jitter */
94u_long	sys_epoch;		/* last clock update time */
95static	double sys_clockhop;	/* clockhop threshold */
96static int leap_vote_ins;	/* leap consensus for insert */
97static int leap_vote_del;	/* leap consensus for delete */
98keyid_t	sys_private;		/* private value for session seed */
99int	sys_manycastserver;	/* respond to manycast client pkts */
100int	ntp_mode7;		/* respond to ntpdc (mode7) */
101int	peer_ntpdate;		/* active peers in ntpdate mode */
102int	sys_survivors;		/* truest of the truechimers */
103char	*sys_ident = NULL;	/* identity scheme */
104
105/*
106 * TOS and multicast mapping stuff
107 */
108int	sys_floor = 0;		/* cluster stratum floor */
109int	sys_ceiling = STRATUM_UNSPEC - 1; /* cluster stratum ceiling */
110int	sys_minsane = 1;	/* minimum candidates */
111int	sys_minclock = NTP_MINCLOCK; /* minimum candidates */
112int	sys_maxclock = NTP_MAXCLOCK; /* maximum candidates */
113int	sys_cohort = 0;		/* cohort switch */
114int	sys_orphan = STRATUM_UNSPEC + 1; /* orphan stratum */
115int	sys_orphwait = NTP_ORPHWAIT; /* orphan wait */
116int	sys_beacon = BEACON;	/* manycast beacon interval */
117int	sys_ttlmax;		/* max ttl mapping vector index */
118u_char	sys_ttl[MAX_TTL];	/* ttl mapping vector */
119
120/*
121 * Statistics counters - first the good, then the bad
122 */
123u_long	sys_stattime;		/* elapsed time */
124u_long	sys_received;		/* packets received */
125u_long	sys_processed;		/* packets for this host */
126u_long	sys_newversion;		/* current version */
127u_long	sys_oldversion;		/* old version */
128u_long	sys_restricted;		/* access denied */
129u_long	sys_badlength;		/* bad length or format */
130u_long	sys_badauth;		/* bad authentication */
131u_long	sys_declined;		/* declined */
132u_long	sys_limitrejected;	/* rate exceeded */
133u_long	sys_kodsent;		/* KoD sent */
134
135static	double	root_distance	(struct peer *);
136static	void	clock_combine	(peer_select *, int, int);
137static	void	peer_xmit	(struct peer *);
138static	void	fast_xmit	(struct recvbuf *, int, keyid_t, int);
139static	void	pool_xmit	(struct peer *);
140static	void	clock_update	(struct peer *);
141static	void	measure_precision(void);
142static	double	measure_tick_fuzz(void);
143static	int	local_refid	(struct peer *);
144static	int	peer_unfit	(struct peer *);
145#ifdef AUTOKEY
146static	int	group_test	(char *, char *);
147#endif /* AUTOKEY */
148#ifdef WORKER
149void	pool_name_resolved	(int, int, void *, const char *,
150				 const char *, const struct addrinfo *,
151				 const struct addrinfo *);
152#endif /* WORKER */
153
154
155/*
156 * transmit - transmit procedure called by poll timeout
157 */
158void
159transmit(
160	struct peer *peer	/* peer structure pointer */
161	)
162{
163	u_char	hpoll;
164
165	/*
166	 * The polling state machine. There are two kinds of machines,
167	 * those that never expect a reply (broadcast and manycast
168	 * server modes) and those that do (all other modes). The dance
169	 * is intricate...
170	 */
171	hpoll = peer->hpoll;
172
173	/*
174	 * In broadcast mode the poll interval is never changed from
175	 * minpoll.
176	 */
177	if (peer->cast_flags & (MDF_BCAST | MDF_MCAST)) {
178		peer->outdate = current_time;
179		if (sys_leap != LEAP_NOTINSYNC)
180			peer_xmit(peer);
181		poll_update(peer, hpoll);
182		return;
183	}
184
185	/*
186	 * In manycast mode we start with unity ttl. The ttl is
187	 * increased by one for each poll until either sys_maxclock
188	 * servers have been found or the maximum ttl is reached. When
189	 * sys_maxclock servers are found we stop polling until one or
190	 * more servers have timed out or until less than sys_minclock
191	 * associations turn up. In this case additional better servers
192	 * are dragged in and preempt the existing ones.  Once every
193	 * sys_beacon seconds we are to transmit unconditionally, but
194	 * this code is not quite right -- peer->unreach counts polls
195	 * and is being compared with sys_beacon, so the beacons happen
196	 * every sys_beacon polls.
197	 */
198	if (peer->cast_flags & MDF_ACAST) {
199		peer->outdate = current_time;
200		if (peer->unreach > sys_beacon) {
201			peer->unreach = 0;
202			peer->ttl = 0;
203			peer_xmit(peer);
204		} else if (sys_survivors < sys_minclock ||
205		    peer_associations < sys_maxclock) {
206			if (peer->ttl < (u_int32)sys_ttlmax)
207				peer->ttl++;
208			peer_xmit(peer);
209		}
210		peer->unreach++;
211		poll_update(peer, hpoll);
212		return;
213	}
214
215	/*
216	 * Pool associations transmit unicast solicitations when there
217	 * are less than a hard limit of 2 * sys_maxclock associations,
218	 * and either less than sys_minclock survivors or less than
219	 * sys_maxclock associations.  The hard limit prevents unbounded
220	 * growth in associations if the system clock or network quality
221	 * result in survivor count dipping below sys_minclock often.
222	 * This was observed testing with pool, where sys_maxclock == 12
223	 * resulted in 60 associations without the hard limit.  A
224	 * similar hard limit on manycastclient ephemeral associations
225	 * may be appropriate.
226	 */
227	if (peer->cast_flags & MDF_POOL) {
228		peer->outdate = current_time;
229		if ((peer_associations <= 2 * sys_maxclock) &&
230		    (peer_associations < sys_maxclock ||
231		     sys_survivors < sys_minclock))
232			pool_xmit(peer);
233		poll_update(peer, hpoll);
234		return;
235	}
236
237	/*
238	 * In unicast modes the dance is much more intricate. It is
239	 * designed to back off whenever possible to minimize network
240	 * traffic.
241	 */
242	if (peer->burst == 0) {
243		u_char oreach;
244
245		/*
246		 * Update the reachability status. If not heard for
247		 * three consecutive polls, stuff infinity in the clock
248		 * filter.
249		 */
250		oreach = peer->reach;
251		peer->outdate = current_time;
252		peer->unreach++;
253		peer->reach <<= 1;
254		if (!peer->reach) {
255
256			/*
257			 * Here the peer is unreachable. If it was
258			 * previously reachable raise a trap. Send a
259			 * burst if enabled.
260			 */
261			clock_filter(peer, 0., 0., MAXDISPERSE);
262			if (oreach) {
263				peer_unfit(peer);
264				report_event(PEVNT_UNREACH, peer, NULL);
265			}
266			if ((peer->flags & FLAG_IBURST) &&
267			    peer->retry == 0)
268				peer->retry = NTP_RETRY;
269		} else {
270
271			/*
272			 * Here the peer is reachable. Send a burst if
273			 * enabled and the peer is fit.  Reset unreach
274			 * for persistent and ephemeral associations.
275			 * Unreach is also reset for survivors in
276			 * clock_select().
277			 */
278			hpoll = sys_poll;
279			if (!(peer->flags & FLAG_PREEMPT))
280				peer->unreach = 0;
281			if ((peer->flags & FLAG_BURST) && peer->retry ==
282			    0 && !peer_unfit(peer))
283				peer->retry = NTP_RETRY;
284		}
285
286		/*
287		 * Watch for timeout.  If ephemeral, toss the rascal;
288		 * otherwise, bump the poll interval. Note the
289		 * poll_update() routine will clamp it to maxpoll.
290		 * If preemptible and we have more peers than maxclock,
291		 * and this peer has the minimum score of preemptibles,
292		 * demobilize.
293		 */
294		if (peer->unreach >= NTP_UNREACH) {
295			hpoll++;
296			/* ephemeral: no FLAG_CONFIG nor FLAG_PREEMPT */
297			if (!(peer->flags & (FLAG_CONFIG | FLAG_PREEMPT))) {
298				report_event(PEVNT_RESTART, peer, "timeout");
299				peer_clear(peer, "TIME");
300				unpeer(peer);
301				return;
302			}
303			if ((peer->flags & FLAG_PREEMPT) &&
304			    (peer_associations > sys_maxclock) &&
305			    score_all(peer)) {
306				report_event(PEVNT_RESTART, peer, "timeout");
307				peer_clear(peer, "TIME");
308				unpeer(peer);
309				return;
310			}
311		}
312	} else {
313		peer->burst--;
314		if (peer->burst == 0) {
315
316			/*
317			 * If ntpdate mode and the clock has not been
318			 * set and all peers have completed the burst,
319			 * we declare a successful failure.
320			 */
321			if (mode_ntpdate) {
322				peer_ntpdate--;
323				if (peer_ntpdate == 0) {
324					msyslog(LOG_NOTICE,
325					    "ntpd: no servers found");
326					if (!msyslog_term)
327						printf(
328						    "ntpd: no servers found\n");
329					exit (0);
330				}
331			}
332		}
333	}
334	if (peer->retry > 0)
335		peer->retry--;
336
337	/*
338	 * Do not transmit if in broadcast client mode.
339	 */
340	if (peer->hmode != MODE_BCLIENT)
341		peer_xmit(peer);
342	poll_update(peer, hpoll);
343}
344
345
346/*
347 * receive - receive procedure called for each packet received
348 */
349void
350receive(
351	struct recvbuf *rbufp
352	)
353{
354	register struct peer *peer;	/* peer structure pointer */
355	register struct pkt *pkt;	/* receive packet pointer */
356	u_char	hisversion;		/* packet version */
357	u_char	hisleap;		/* packet leap indicator */
358	u_char	hismode;		/* packet mode */
359	u_char	hisstratum;		/* packet stratum */
360	u_short	restrict_mask;		/* restrict bits */
361	int	has_mac;		/* length of MAC field */
362	int	authlen;		/* offset of MAC field */
363	int	is_authentic = 0;	/* cryptosum ok */
364	int	retcode = AM_NOMATCH;	/* match code */
365	keyid_t	skeyid = 0;		/* key IDs */
366	u_int32	opcode = 0;		/* extension field opcode */
367	sockaddr_u *dstadr_sin; 	/* active runway */
368	struct peer *peer2;		/* aux peer structure pointer */
369	endpt *	match_ep;		/* newpeer() local address */
370	l_fp	p_org;			/* origin timestamp */
371	l_fp	p_rec;			/* receive timestamp */
372	l_fp	p_xmt;			/* transmit timestamp */
373#ifdef AUTOKEY
374	char	hostname[NTP_MAXSTRLEN + 1];
375	char	*groupname = NULL;
376	struct autokey *ap;		/* autokey structure pointer */
377	int	rval;			/* cookie snatcher */
378	keyid_t	pkeyid = 0, tkeyid = 0;	/* key IDs */
379#endif	/* AUTOKEY */
380#ifdef HAVE_NTP_SIGND
381	static unsigned char zero_key[16];
382#endif /* HAVE_NTP_SIGND */
383
384	/*
385	 * Monitor the packet and get restrictions. Note that the packet
386	 * length for control and private mode packets must be checked
387	 * by the service routines. Some restrictions have to be handled
388	 * later in order to generate a kiss-o'-death packet.
389	 */
390	/*
391	 * Bogus port check is before anything, since it probably
392	 * reveals a clogging attack.
393	 */
394	sys_received++;
395	if (0 == SRCPORT(&rbufp->recv_srcadr)) {
396		sys_badlength++;
397		return;				/* bogus port */
398	}
399	restrict_mask = restrictions(&rbufp->recv_srcadr);
400	DPRINTF(2, ("receive: at %ld %s<-%s flags %x restrict %03x\n",
401		    current_time, stoa(&rbufp->dstadr->sin),
402		    stoa(&rbufp->recv_srcadr),
403		    rbufp->dstadr->flags, restrict_mask));
404	pkt = &rbufp->recv_pkt;
405	hisversion = PKT_VERSION(pkt->li_vn_mode);
406	hisleap = PKT_LEAP(pkt->li_vn_mode);
407	hismode = (int)PKT_MODE(pkt->li_vn_mode);
408	hisstratum = PKT_TO_STRATUM(pkt->stratum);
409	if (restrict_mask & RES_IGNORE) {
410		sys_restricted++;
411		return;				/* ignore everything */
412	}
413	if (hismode == MODE_PRIVATE) {
414		if (!ntp_mode7 || (restrict_mask & RES_NOQUERY)) {
415			sys_restricted++;
416			return;			/* no query private */
417		}
418		process_private(rbufp, ((restrict_mask &
419		    RES_NOMODIFY) == 0));
420		return;
421	}
422	if (hismode == MODE_CONTROL) {
423		if (restrict_mask & RES_NOQUERY) {
424			sys_restricted++;
425			return;			/* no query control */
426		}
427		process_control(rbufp, restrict_mask);
428		return;
429	}
430	if (restrict_mask & RES_DONTSERVE) {
431		sys_restricted++;
432		return;				/* no time serve */
433	}
434
435	/*
436	 * This is for testing. If restricted drop ten percent of
437	 * surviving packets.
438	 */
439	if (restrict_mask & RES_FLAKE) {
440		if ((double)ntp_random() / 0x7fffffff < .1) {
441			sys_restricted++;
442			return;			/* no flakeway */
443		}
444	}
445
446	/*
447	 * Version check must be after the query packets, since they
448	 * intentionally use an early version.
449	 */
450	if (hisversion == NTP_VERSION) {
451		sys_newversion++;		/* new version */
452	} else if (!(restrict_mask & RES_VERSION) && hisversion >=
453	    NTP_OLDVERSION) {
454		sys_oldversion++;		/* previous version */
455	} else {
456		sys_badlength++;
457		return;				/* old version */
458	}
459
460	/*
461	 * Figure out his mode and validate the packet. This has some
462	 * legacy raunch that probably should be removed. In very early
463	 * NTP versions mode 0 was equivalent to what later versions
464	 * would interpret as client mode.
465	 */
466	if (hismode == MODE_UNSPEC) {
467		if (hisversion == NTP_OLDVERSION) {
468			hismode = MODE_CLIENT;
469		} else {
470			sys_badlength++;
471			return;                 /* invalid mode */
472		}
473	}
474
475	/*
476	 * Parse the extension field if present. We figure out whether
477	 * an extension field is present by measuring the MAC size. If
478	 * the number of words following the packet header is 0, no MAC
479	 * is present and the packet is not authenticated. If 1, the
480	 * packet is a crypto-NAK; if 3, the packet is authenticated
481	 * with DES; if 5, the packet is authenticated with MD5; if 6,
482	 * the packet is authenticated with SHA. If 2 or * 4, the packet
483	 * is a runt and discarded forthwith. If greater than 6, an
484	 * extension field is present, so we subtract the length of the
485	 * field and go around again.
486	 */
487	authlen = LEN_PKT_NOMAC;
488	has_mac = rbufp->recv_length - authlen;
489	while (has_mac > 0) {
490		u_int32	len;
491#ifdef AUTOKEY
492		u_int32	hostlen;
493		struct exten *ep;
494#endif /*AUTOKEY */
495
496		if (has_mac % 4 != 0 || has_mac < (int)MIN_MAC_LEN) {
497			sys_badlength++;
498			return;			/* bad length */
499		}
500		if (has_mac <= (int)MAX_MAC_LEN) {
501			skeyid = ntohl(((u_int32 *)pkt)[authlen / 4]);
502			break;
503
504		} else {
505			opcode = ntohl(((u_int32 *)pkt)[authlen / 4]);
506			len = opcode & 0xffff;
507			if (len % 4 != 0 || len < 4 || (int)len +
508			    authlen > rbufp->recv_length) {
509				sys_badlength++;
510				return;		/* bad length */
511			}
512#ifdef AUTOKEY
513			/*
514			 * Extract calling group name for later.  If
515			 * sys_groupname is non-NULL, there must be
516			 * a group name provided to elicit a response.
517			 */
518			if ((opcode & 0x3fff0000) == CRYPTO_ASSOC &&
519			    sys_groupname != NULL) {
520				ep = (struct exten *)&((u_int32 *)pkt)[authlen / 4];
521				hostlen = ntohl(ep->vallen);
522				if (hostlen >= sizeof(hostname) ||
523				    hostlen > len -
524				    offsetof(struct exten, pkt)) {
525					sys_badlength++;
526					return;		/* bad length */
527				}
528				memcpy(hostname, &ep->pkt, hostlen);
529				hostname[hostlen] = '\0';
530				groupname = strchr(hostname, '@');
531				if (groupname == NULL) {
532					sys_declined++;
533					return;
534				}
535				groupname++;
536			}
537#endif /* AUTOKEY */
538			authlen += len;
539			has_mac -= len;
540		}
541	}
542
543	/*
544	 * If has_mac is < 0 we had a malformed packet.
545	 */
546	if (has_mac < 0) {
547		sys_badlength++;
548		return;		/* bad length */
549	}
550
551	/*
552	 * If authentication required, a MAC must be present.
553	 */
554	if (restrict_mask & RES_DONTTRUST && has_mac == 0) {
555		sys_restricted++;
556		return;				/* access denied */
557	}
558
559	/*
560	 * Update the MRU list and finger the cloggers. It can be a
561	 * little expensive, so turn it off for production use.
562	 * RES_LIMITED and RES_KOD will be cleared in the returned
563	 * restrict_mask unless one or both actions are warranted.
564	 */
565	restrict_mask = ntp_monitor(rbufp, restrict_mask);
566	if (restrict_mask & RES_LIMITED) {
567		sys_limitrejected++;
568		if (!(restrict_mask & RES_KOD) || MODE_BROADCAST ==
569		    hismode || MODE_SERVER == hismode) {
570			if (MODE_SERVER == hismode)
571				DPRINTF(1, ("Possibly self-induced rate limiting of MODE_SERVER from %s\n",
572					stoa(&rbufp->recv_srcadr)));
573			return;			/* rate exceeded */
574		}
575		if (hismode == MODE_CLIENT)
576			fast_xmit(rbufp, MODE_SERVER, skeyid,
577			    restrict_mask);
578		else
579			fast_xmit(rbufp, MODE_ACTIVE, skeyid,
580			    restrict_mask);
581		return;				/* rate exceeded */
582	}
583	restrict_mask &= ~RES_KOD;
584
585	/*
586	 * We have tossed out as many buggy packets as possible early in
587	 * the game to reduce the exposure to a clogging attack. Now we
588	 * have to burn some cycles to find the association and
589	 * authenticate the packet if required. Note that we burn only
590	 * digest cycles, again to reduce exposure. There may be no
591	 * matching association and that's okay.
592	 *
593	 * More on the autokey mambo. Normally the local interface is
594	 * found when the association was mobilized with respect to a
595	 * designated remote address. We assume packets arriving from
596	 * the remote address arrive via this interface and the local
597	 * address used to construct the autokey is the unicast address
598	 * of the interface. However, if the sender is a broadcaster,
599	 * the interface broadcast address is used instead.
600	 * Notwithstanding this technobabble, if the sender is a
601	 * multicaster, the broadcast address is null, so we use the
602	 * unicast address anyway. Don't ask.
603	 */
604	peer = findpeer(rbufp,  hismode, &retcode);
605	dstadr_sin = &rbufp->dstadr->sin;
606	NTOHL_FP(&pkt->org, &p_org);
607	NTOHL_FP(&pkt->rec, &p_rec);
608	NTOHL_FP(&pkt->xmt, &p_xmt);
609
610	/*
611	 * Authentication is conditioned by three switches:
612	 *
613	 * NOPEER  (RES_NOPEER) do not mobilize an association unless
614	 *         authenticated
615	 * NOTRUST (RES_DONTTRUST) do not allow access unless
616	 *         authenticated (implies NOPEER)
617	 * enable  (sys_authenticate) master NOPEER switch, by default
618	 *         on
619	 *
620	 * The NOPEER and NOTRUST can be specified on a per-client basis
621	 * using the restrict command. The enable switch if on implies
622	 * NOPEER for all clients. There are four outcomes:
623	 *
624	 * NONE    The packet has no MAC.
625	 * OK      the packet has a MAC and authentication succeeds
626	 * ERROR   the packet has a MAC and authentication fails
627	 * CRYPTO  crypto-NAK. The MAC has four octets only.
628	 *
629	 * Note: The AUTH(x, y) macro is used to filter outcomes. If x
630	 * is zero, acceptable outcomes of y are NONE and OK. If x is
631	 * one, the only acceptable outcome of y is OK.
632	 */
633
634	if (has_mac == 0) {
635		restrict_mask &= ~RES_MSSNTP;
636		is_authentic = AUTH_NONE; /* not required */
637#ifdef DEBUG
638		if (debug)
639			printf(
640			    "receive: at %ld %s<-%s mode %d len %d\n",
641			    current_time, stoa(dstadr_sin),
642			    stoa(&rbufp->recv_srcadr), hismode,
643			    authlen);
644#endif
645	} else if (has_mac == 4) {
646		restrict_mask &= ~RES_MSSNTP;
647		is_authentic = AUTH_CRYPTO; /* crypto-NAK */
648#ifdef DEBUG
649		if (debug)
650			printf(
651			    "receive: at %ld %s<-%s mode %d keyid %08x len %d auth %d\n",
652			    current_time, stoa(dstadr_sin),
653			    stoa(&rbufp->recv_srcadr), hismode, skeyid,
654			    authlen + has_mac, is_authentic);
655#endif
656
657#ifdef HAVE_NTP_SIGND
658		/*
659		 * If the signature is 20 bytes long, the last 16 of
660		 * which are zero, then this is a Microsoft client
661		 * wanting AD-style authentication of the server's
662		 * reply.
663		 *
664		 * This is described in Microsoft's WSPP docs, in MS-SNTP:
665		 * http://msdn.microsoft.com/en-us/library/cc212930.aspx
666		 */
667	} else if (has_mac == MAX_MD5_LEN && (restrict_mask & RES_MSSNTP) &&
668	   (retcode == AM_FXMIT || retcode == AM_NEWPASS) &&
669	   (memcmp(zero_key, (char *)pkt + authlen + 4, MAX_MD5_LEN - 4) ==
670	   0)) {
671		is_authentic = AUTH_NONE;
672#endif /* HAVE_NTP_SIGND */
673
674	} else {
675		restrict_mask &= ~RES_MSSNTP;
676#ifdef AUTOKEY
677		/*
678		 * For autokey modes, generate the session key
679		 * and install in the key cache. Use the socket
680		 * broadcast or unicast address as appropriate.
681		 */
682		if (crypto_flags && skeyid > NTP_MAXKEY) {
683
684			/*
685			 * More on the autokey dance (AKD). A cookie is
686			 * constructed from public and private values.
687			 * For broadcast packets, the cookie is public
688			 * (zero). For packets that match no
689			 * association, the cookie is hashed from the
690			 * addresses and private value. For server
691			 * packets, the cookie was previously obtained
692			 * from the server. For symmetric modes, the
693			 * cookie was previously constructed using an
694			 * agreement protocol; however, should PKI be
695			 * unavailable, we construct a fake agreement as
696			 * the EXOR of the peer and host cookies.
697			 *
698			 * hismode	ephemeral	persistent
699			 * =======================================
700			 * active	0		cookie#
701			 * passive	0%		cookie#
702			 * client	sys cookie	0%
703			 * server	0%		sys cookie
704			 * broadcast	0		0
705			 *
706			 * # if unsync, 0
707			 * % can't happen
708			 */
709			if (has_mac < (int)MAX_MD5_LEN) {
710				sys_badauth++;
711				return;
712			}
713			if (hismode == MODE_BROADCAST) {
714
715				/*
716				 * For broadcaster, use the interface
717				 * broadcast address when available;
718				 * otherwise, use the unicast address
719				 * found when the association was
720				 * mobilized. However, if this is from
721				 * the wildcard interface, game over.
722				 */
723				if (crypto_flags && rbufp->dstadr ==
724				    ANY_INTERFACE_CHOOSE(&rbufp->recv_srcadr)) {
725					sys_restricted++;
726					return;	     /* no wildcard */
727				}
728				pkeyid = 0;
729				if (!SOCK_UNSPEC(&rbufp->dstadr->bcast))
730					dstadr_sin =
731					    &rbufp->dstadr->bcast;
732			} else if (peer == NULL) {
733				pkeyid = session_key(
734				    &rbufp->recv_srcadr, dstadr_sin, 0,
735				    sys_private, 0);
736			} else {
737				pkeyid = peer->pcookie;
738			}
739
740			/*
741			 * The session key includes both the public
742			 * values and cookie. In case of an extension
743			 * field, the cookie used for authentication
744			 * purposes is zero. Note the hash is saved for
745			 * use later in the autokey mambo.
746			 */
747			if (authlen > (int)LEN_PKT_NOMAC && pkeyid != 0) {
748				session_key(&rbufp->recv_srcadr,
749				    dstadr_sin, skeyid, 0, 2);
750				tkeyid = session_key(
751				    &rbufp->recv_srcadr, dstadr_sin,
752				    skeyid, pkeyid, 0);
753			} else {
754				tkeyid = session_key(
755				    &rbufp->recv_srcadr, dstadr_sin,
756				    skeyid, pkeyid, 2);
757			}
758
759		}
760#endif	/* AUTOKEY */
761
762		/*
763		 * Compute the cryptosum. Note a clogging attack may
764		 * succeed in bloating the key cache. If an autokey,
765		 * purge it immediately, since we won't be needing it
766		 * again. If the packet is authentic, it can mobilize an
767		 * association. Note that there is no key zero.
768		 */
769		if (!authdecrypt(skeyid, (u_int32 *)pkt, authlen,
770		    has_mac))
771			is_authentic = AUTH_ERROR;
772		else
773			is_authentic = AUTH_OK;
774#ifdef AUTOKEY
775		if (crypto_flags && skeyid > NTP_MAXKEY)
776			authtrust(skeyid, 0);
777#endif	/* AUTOKEY */
778#ifdef DEBUG
779		if (debug)
780			printf(
781			    "receive: at %ld %s<-%s mode %d keyid %08x len %d auth %d\n",
782			    current_time, stoa(dstadr_sin),
783			    stoa(&rbufp->recv_srcadr), hismode, skeyid,
784			    authlen + has_mac, is_authentic);
785#endif
786	}
787
788	/*
789	 * The association matching rules are implemented by a set of
790	 * routines and an association table. A packet matching an
791	 * association is processed by the peer process for that
792	 * association. If there are no errors, an ephemeral association
793	 * is mobilized: a broadcast packet mobilizes a broadcast client
794	 * aassociation; a manycast server packet mobilizes a manycast
795	 * client association; a symmetric active packet mobilizes a
796	 * symmetric passive association.
797	 */
798	switch (retcode) {
799
800	/*
801	 * This is a client mode packet not matching any association. If
802	 * an ordinary client, simply toss a server mode packet back
803	 * over the fence. If a manycast client, we have to work a
804	 * little harder.
805	 */
806	case AM_FXMIT:
807
808		/*
809		 * If authentication OK, send a server reply; otherwise,
810		 * send a crypto-NAK.
811		 */
812		if (!(rbufp->dstadr->flags & INT_MCASTOPEN)) {
813			if (AUTH(restrict_mask & RES_DONTTRUST,
814			   is_authentic)) {
815				fast_xmit(rbufp, MODE_SERVER, skeyid,
816				    restrict_mask);
817			} else if (is_authentic == AUTH_ERROR) {
818				fast_xmit(rbufp, MODE_SERVER, 0,
819				    restrict_mask);
820				sys_badauth++;
821			} else {
822				sys_restricted++;
823			}
824			return;			/* hooray */
825		}
826
827		/*
828		 * This must be manycast. Do not respond if not
829		 * configured as a manycast server.
830		 */
831		if (!sys_manycastserver) {
832			sys_restricted++;
833			return;			/* not enabled */
834		}
835
836#ifdef AUTOKEY
837		/*
838		 * Do not respond if not the same group.
839		 */
840		if (group_test(groupname, NULL)) {
841			sys_declined++;
842			return;
843		}
844#endif /* AUTOKEY */
845
846		/*
847		 * Do not respond if we are not synchronized or our
848		 * stratum is greater than the manycaster or the
849		 * manycaster has already synchronized to us.
850		 */
851		if (sys_leap == LEAP_NOTINSYNC || sys_stratum >=
852		    hisstratum || (!sys_cohort && sys_stratum ==
853		    hisstratum + 1) || rbufp->dstadr->addr_refid ==
854		    pkt->refid) {
855			sys_declined++;
856			return;			/* no help */
857		}
858
859		/*
860		 * Respond only if authentication succeeds. Don't do a
861		 * crypto-NAK, as that would not be useful.
862		 */
863		if (AUTH(restrict_mask & RES_DONTTRUST, is_authentic))
864			fast_xmit(rbufp, MODE_SERVER, skeyid,
865			    restrict_mask);
866		return;				/* hooray */
867
868	/*
869	 * This is a server mode packet returned in response to a client
870	 * mode packet sent to a multicast group address (for
871	 * manycastclient) or to a unicast address (for pool). The
872	 * origin timestamp is a good nonce to reliably associate the
873	 * reply with what was sent. If there is no match, that's
874	 * curious and could be an intruder attempting to clog, so we
875	 * just ignore it.
876	 *
877	 * If the packet is authentic and the manycastclient or pool
878	 * association is found, we mobilize a client association and
879	 * copy pertinent variables from the manycastclient or pool
880	 * association to the new client association. If not, just
881	 * ignore the packet.
882	 *
883	 * There is an implosion hazard at the manycast client, since
884	 * the manycast servers send the server packet immediately. If
885	 * the guy is already here, don't fire up a duplicate.
886	 */
887	case AM_MANYCAST:
888
889#ifdef AUTOKEY
890		/*
891		 * Do not respond if not the same group.
892		 */
893		if (group_test(groupname, NULL)) {
894			sys_declined++;
895			return;
896		}
897#endif /* AUTOKEY */
898		if ((peer2 = findmanycastpeer(rbufp)) == NULL) {
899			sys_restricted++;
900			return;			/* not enabled */
901		}
902		if (!AUTH((!(peer2->cast_flags & MDF_POOL) &&
903		    sys_authenticate) | (restrict_mask & (RES_NOPEER |
904		    RES_DONTTRUST)), is_authentic)) {
905			sys_restricted++;
906			return;			/* access denied */
907		}
908
909		/*
910		 * Do not respond if unsynchronized or stratum is below
911		 * the floor or at or above the ceiling.
912		 */
913		if (hisleap == LEAP_NOTINSYNC || hisstratum <
914		    sys_floor || hisstratum >= sys_ceiling) {
915			sys_declined++;
916			return;			/* no help */
917		}
918		peer = newpeer(&rbufp->recv_srcadr, NULL, rbufp->dstadr,
919			       MODE_CLIENT, hisversion, peer2->minpoll,
920			       peer2->maxpoll, FLAG_PREEMPT |
921			       (FLAG_IBURST & peer2->flags), MDF_UCAST |
922			       MDF_UCLNT, 0, skeyid, sys_ident);
923		if (NULL == peer) {
924			sys_declined++;
925			return;			/* ignore duplicate  */
926		}
927
928		/*
929		 * After each ephemeral pool association is spun,
930		 * accelerate the next poll for the pool solicitor so
931		 * the pool will fill promptly.
932		 */
933		if (peer2->cast_flags & MDF_POOL)
934			peer2->nextdate = current_time + 1;
935
936		/*
937		 * Further processing of the solicitation response would
938		 * simply detect its origin timestamp as bogus for the
939		 * brand-new association (it matches the prototype
940		 * association) and tinker with peer->nextdate delaying
941		 * first sync.
942		 */
943		return;		/* solicitation response handled */
944
945	/*
946	 * This is the first packet received from a broadcast server. If
947	 * the packet is authentic and we are enabled as broadcast
948	 * client, mobilize a broadcast client association. We don't
949	 * kiss any frogs here.
950	 */
951	case AM_NEWBCL:
952
953#ifdef AUTOKEY
954		/*
955		 * Do not respond if not the same group.
956		 */
957		if (group_test(groupname, sys_ident)) {
958			sys_declined++;
959			return;
960		}
961#endif /* AUTOKEY */
962		if (sys_bclient == 0) {
963			sys_restricted++;
964			return;			/* not enabled */
965		}
966		if (!AUTH(sys_authenticate | (restrict_mask &
967		    (RES_NOPEER | RES_DONTTRUST)), is_authentic)) {
968			sys_restricted++;
969			return;			/* access denied */
970		}
971
972		/*
973		 * Do not respond if unsynchronized or stratum is below
974		 * the floor or at or above the ceiling.
975		 */
976		if (hisleap == LEAP_NOTINSYNC || hisstratum <
977		    sys_floor || hisstratum >= sys_ceiling) {
978			sys_declined++;
979			return;			/* no help */
980		}
981
982#ifdef AUTOKEY
983		/*
984		 * Do not respond if Autokey and the opcode is not a
985		 * CRYPTO_ASSOC response with association ID.
986		 */
987		if (crypto_flags && skeyid > NTP_MAXKEY && (opcode &
988		    0xffff0000) != (CRYPTO_ASSOC | CRYPTO_RESP)) {
989			sys_declined++;
990			return;			/* protocol error */
991		}
992#endif	/* AUTOKEY */
993
994		/*
995		 * Broadcasts received via a multicast address may
996		 * arrive after a unicast volley has begun
997		 * with the same remote address.  newpeer() will not
998		 * find duplicate associations on other local endpoints
999		 * if a non-NULL endpoint is supplied.  multicastclient
1000		 * ephemeral associations are unique across all local
1001		 * endpoints.
1002		 */
1003		if (!(INT_MCASTOPEN & rbufp->dstadr->flags))
1004			match_ep = rbufp->dstadr;
1005		else
1006			match_ep = NULL;
1007
1008		/*
1009		 * Determine whether to execute the initial volley.
1010		 */
1011		if (sys_bdelay != 0) {
1012#ifdef AUTOKEY
1013			/*
1014			 * If a two-way exchange is not possible,
1015			 * neither is Autokey.
1016			 */
1017			if (crypto_flags && skeyid > NTP_MAXKEY) {
1018				sys_restricted++;
1019				return;		/* no autokey */
1020			}
1021#endif	/* AUTOKEY */
1022
1023			/*
1024			 * Do not execute the volley. Start out in
1025			 * broadcast client mode.
1026			 */
1027			peer = newpeer(&rbufp->recv_srcadr, NULL,
1028			    match_ep, MODE_BCLIENT, hisversion,
1029			    pkt->ppoll, pkt->ppoll, FLAG_PREEMPT,
1030			    MDF_BCLNT, 0, skeyid, sys_ident);
1031			if (NULL == peer) {
1032				sys_restricted++;
1033				return;		/* ignore duplicate */
1034
1035			} else {
1036				peer->delay = sys_bdelay;
1037			}
1038			break;
1039		}
1040
1041		/*
1042		 * Execute the initial volley in order to calibrate the
1043		 * propagation delay and run the Autokey protocol.
1044		 *
1045		 * Note that the minpoll is taken from the broadcast
1046		 * packet, normally 6 (64 s) and that the poll interval
1047		 * is fixed at this value.
1048		 */
1049		peer = newpeer(&rbufp->recv_srcadr, NULL, match_ep,
1050		    MODE_CLIENT, hisversion, pkt->ppoll, pkt->ppoll,
1051		    FLAG_BC_VOL | FLAG_IBURST | FLAG_PREEMPT, MDF_BCLNT,
1052		    0, skeyid, sys_ident);
1053		if (NULL == peer) {
1054			sys_restricted++;
1055			return;			/* ignore duplicate */
1056		}
1057#ifdef AUTOKEY
1058		if (skeyid > NTP_MAXKEY)
1059			crypto_recv(peer, rbufp);
1060#endif	/* AUTOKEY */
1061
1062		return;				/* hooray */
1063
1064	/*
1065	 * This is the first packet received from a symmetric active
1066	 * peer. If the packet is authentic and the first he sent,
1067	 * mobilize a passive association. If not, kiss the frog.
1068	 */
1069	case AM_NEWPASS:
1070
1071#ifdef AUTOKEY
1072		/*
1073		 * Do not respond if not the same group.
1074		 */
1075		if (group_test(groupname, sys_ident)) {
1076			sys_declined++;
1077			return;
1078		}
1079#endif /* AUTOKEY */
1080		if (!AUTH(sys_authenticate | (restrict_mask &
1081		    (RES_NOPEER | RES_DONTTRUST)), is_authentic)) {
1082
1083			/*
1084			 * If authenticated but cannot mobilize an
1085			 * association, send a symmetric passive
1086			 * response without mobilizing an association.
1087			 * This is for drat broken Windows clients. See
1088			 * Microsoft KB 875424 for preferred workaround.
1089			 */
1090			if (AUTH(restrict_mask & RES_DONTTRUST,
1091			    is_authentic)) {
1092				fast_xmit(rbufp, MODE_PASSIVE, skeyid,
1093				    restrict_mask);
1094				return;			/* hooray */
1095			}
1096			if (is_authentic == AUTH_ERROR) {
1097				fast_xmit(rbufp, MODE_ACTIVE, 0,
1098				    restrict_mask);
1099				sys_restricted++;
1100				return;
1101			}
1102		}
1103
1104		/*
1105		 * Do not respond if synchronized and if stratum is
1106		 * below the floor or at or above the ceiling. Note,
1107		 * this allows an unsynchronized peer to synchronize to
1108		 * us. It would be very strange if he did and then was
1109		 * nipped, but that could only happen if we were
1110		 * operating at the top end of the range.  It also means
1111		 * we will spin an ephemeral association in response to
1112		 * MODE_ACTIVE KoDs, which will time out eventually.
1113		 */
1114		if (hisleap != LEAP_NOTINSYNC && (hisstratum <
1115		    sys_floor || hisstratum >= sys_ceiling)) {
1116			sys_declined++;
1117			return;			/* no help */
1118		}
1119
1120		/*
1121		 * The message is correctly authenticated and allowed.
1122		 * Mobilize a symmetric passive association.
1123		 */
1124		if ((peer = newpeer(&rbufp->recv_srcadr, NULL,
1125		    rbufp->dstadr, MODE_PASSIVE, hisversion, pkt->ppoll,
1126		    NTP_MAXDPOLL, 0, MDF_UCAST, 0, skeyid,
1127		    sys_ident)) == NULL) {
1128			sys_declined++;
1129			return;			/* ignore duplicate */
1130		}
1131		break;
1132
1133
1134	/*
1135	 * Process regular packet. Nothing special.
1136	 */
1137	case AM_PROCPKT:
1138
1139#ifdef AUTOKEY
1140		/*
1141		 * Do not respond if not the same group.
1142		 */
1143		if (group_test(groupname, peer->ident)) {
1144			sys_declined++;
1145			return;
1146		}
1147#endif /* AUTOKEY */
1148		break;
1149
1150	/*
1151	 * A passive packet matches a passive association. This is
1152	 * usually the result of reconfiguring a client on the fly. As
1153	 * this association might be legitimate and this packet an
1154	 * attempt to deny service, just ignore it.
1155	 */
1156	case AM_ERR:
1157		sys_declined++;
1158		return;
1159
1160	/*
1161	 * For everything else there is the bit bucket.
1162	 */
1163	default:
1164		sys_declined++;
1165		return;
1166	}
1167
1168#ifdef AUTOKEY
1169	/*
1170	 * If the association is configured for Autokey, the packet must
1171	 * have a public key ID; if not, the packet must have a
1172	 * symmetric key ID.
1173	 */
1174	if (is_authentic != AUTH_CRYPTO && (((peer->flags &
1175	    FLAG_SKEY) && skeyid <= NTP_MAXKEY) || (!(peer->flags &
1176	    FLAG_SKEY) && skeyid > NTP_MAXKEY))) {
1177		sys_badauth++;
1178		return;
1179	}
1180#endif	/* AUTOKEY */
1181	peer->received++;
1182	peer->flash &= ~PKT_TEST_MASK;
1183	if (peer->flags & FLAG_XBOGUS) {
1184		peer->flags &= ~FLAG_XBOGUS;
1185		peer->flash |= TEST3;
1186	}
1187
1188	/*
1189	 * Next comes a rigorous schedule of timestamp checking. If the
1190	 * transmit timestamp is zero, the server has not initialized in
1191	 * interleaved modes or is horribly broken.
1192	 */
1193	if (L_ISZERO(&p_xmt)) {
1194		peer->flash |= TEST3;			/* unsynch */
1195
1196	/*
1197	 * If the transmit timestamp duplicates a previous one, the
1198	 * packet is a replay. This prevents the bad guys from replaying
1199	 * the most recent packet, authenticated or not.
1200	 */
1201	} else if (L_ISEQU(&peer->xmt, &p_xmt)) {
1202		peer->flash |= TEST1;			/* duplicate */
1203		peer->oldpkt++;
1204		return;
1205
1206	/*
1207	 * If this is a broadcast mode packet, skip further checking. If
1208	 * an initial volley, bail out now and let the client do its
1209	 * stuff. If the origin timestamp is nonzero, this is an
1210	 * interleaved broadcast. so restart the protocol.
1211	 */
1212	} else if (hismode == MODE_BROADCAST) {
1213		if (!L_ISZERO(&p_org) && !(peer->flags & FLAG_XB)) {
1214			peer->flags |= FLAG_XB;
1215			peer->aorg = p_xmt;
1216			peer->borg = rbufp->recv_time;
1217			report_event(PEVNT_XLEAVE, peer, NULL);
1218			return;
1219		}
1220
1221	/*
1222	 * Check for bogus packet in basic mode. If found, switch to
1223	 * interleaved mode and resynchronize, but only after confirming
1224	 * the packet is not bogus in symmetric interleaved mode.
1225	 */
1226	} else if (peer->flip == 0) {
1227		if (!L_ISEQU(&p_org, &peer->aorg)) {
1228			peer->bogusorg++;
1229			peer->flash |= TEST2;	/* bogus */
1230			if (!L_ISZERO(&peer->dst) && L_ISEQU(&p_org,
1231			    &peer->dst)) {
1232				peer->flip = 1;
1233				report_event(PEVNT_XLEAVE, peer, NULL);
1234			}
1235		} else {
1236			L_CLR(&peer->aorg);
1237		}
1238
1239	/*
1240	 * Check for valid nonzero timestamp fields.
1241	 */
1242	} else if (L_ISZERO(&p_org) || L_ISZERO(&p_rec) ||
1243	    L_ISZERO(&peer->dst)) {
1244		peer->flash |= TEST3;		/* unsynch */
1245
1246	/*
1247	 * Check for bogus packet in interleaved symmetric mode. This
1248	 * can happen if a packet is lost, duplicated or crossed. If
1249	 * found, flip and resynchronize.
1250	 */
1251	} else if (!L_ISZERO(&peer->dst) && !L_ISEQU(&p_org,
1252	    &peer->dst)) {
1253		peer->bogusorg++;
1254		peer->flags |= FLAG_XBOGUS;
1255		peer->flash |= TEST2;		/* bogus */
1256	}
1257
1258	/*
1259	 * If this is a crypto_NAK, the server cannot authenticate a
1260	 * client packet. The server might have just changed keys. Clear
1261	 * the association and restart the protocol.
1262	 */
1263	if (is_authentic == AUTH_CRYPTO) {
1264		report_event(PEVNT_AUTH, peer, "crypto_NAK");
1265		peer->flash |= TEST5;		/* bad auth */
1266		peer->badauth++;
1267		if (peer->flags & FLAG_PREEMPT) {
1268			unpeer(peer);
1269			return;
1270		}
1271#ifdef AUTOKEY
1272		if (peer->crypto)
1273			peer_clear(peer, "AUTH");
1274#endif	/* AUTOKEY */
1275		return;
1276
1277	/*
1278	 * If the digest fails or it's missing for authenticated
1279	 * associations, the client cannot authenticate a server
1280	 * reply to a client packet previously sent. The loopback check
1281	 * is designed to avoid a bait-and-switch attack, which was
1282	 * possible in past versions. If symmetric modes, return a
1283	 * crypto-NAK. The peer should restart the protocol.
1284	 */
1285	} else if (!AUTH(peer->keyid || has_mac ||
1286			 (restrict_mask & RES_DONTTRUST), is_authentic)) {
1287		report_event(PEVNT_AUTH, peer, "digest");
1288		peer->flash |= TEST5;		/* bad auth */
1289		peer->badauth++;
1290		if (has_mac &&
1291		    (hismode == MODE_ACTIVE || hismode == MODE_PASSIVE))
1292			fast_xmit(rbufp, MODE_ACTIVE, 0, restrict_mask);
1293		if (peer->flags & FLAG_PREEMPT) {
1294			unpeer(peer);
1295			return;
1296		}
1297#ifdef AUTOKEY
1298		if (peer->crypto)
1299			peer_clear(peer, "AUTH");
1300#endif	/* AUTOKEY */
1301		return;
1302	}
1303
1304	/*
1305	 * Update the state variables.
1306	 */
1307	if (peer->flip == 0) {
1308		if (hismode != MODE_BROADCAST)
1309			peer->rec = p_xmt;
1310		peer->dst = rbufp->recv_time;
1311	}
1312	peer->xmt = p_xmt;
1313
1314	/*
1315	 * Set the peer ppoll to the maximum of the packet ppoll and the
1316	 * peer minpoll. If a kiss-o'-death, set the peer minpoll to
1317	 * this maximum and advance the headway to give the sender some
1318	 * headroom. Very intricate.
1319	 */
1320	peer->ppoll = max(peer->minpoll, pkt->ppoll);
1321	if (hismode == MODE_SERVER && hisleap == LEAP_NOTINSYNC &&
1322	    hisstratum == STRATUM_UNSPEC && memcmp(&pkt->refid,
1323	    "RATE", 4) == 0) {
1324		peer->selbroken++;
1325		report_event(PEVNT_RATE, peer, NULL);
1326		if (pkt->ppoll > peer->minpoll)
1327			peer->minpoll = peer->ppoll;
1328		peer->burst = peer->retry = 0;
1329		peer->throttle = (NTP_SHIFT + 1) * (1 << peer->minpoll);
1330		poll_update(peer, pkt->ppoll);
1331		return;				/* kiss-o'-death */
1332	}
1333
1334	/*
1335	 * That was hard and I am sweaty, but the packet is squeaky
1336	 * clean. Get on with real work.
1337	 */
1338	peer->timereceived = current_time;
1339	if (is_authentic == AUTH_OK)
1340		peer->flags |= FLAG_AUTHENTIC;
1341	else
1342		peer->flags &= ~FLAG_AUTHENTIC;
1343
1344#ifdef AUTOKEY
1345	/*
1346	 * More autokey dance. The rules of the cha-cha are as follows:
1347	 *
1348	 * 1. If there is no key or the key is not auto, do nothing.
1349	 *
1350	 * 2. If this packet is in response to the one just previously
1351	 *    sent or from a broadcast server, do the extension fields.
1352	 *    Otherwise, assume bogosity and bail out.
1353	 *
1354	 * 3. If an extension field contains a verified signature, it is
1355	 *    self-authenticated and we sit the dance.
1356	 *
1357	 * 4. If this is a server reply, check only to see that the
1358	 *    transmitted key ID matches the received key ID.
1359	 *
1360	 * 5. Check to see that one or more hashes of the current key ID
1361	 *    matches the previous key ID or ultimate original key ID
1362	 *    obtained from the broadcaster or symmetric peer. If no
1363	 *    match, sit the dance and call for new autokey values.
1364	 *
1365	 * In case of crypto error, fire the orchestra, stop dancing and
1366	 * restart the protocol.
1367	 */
1368	if (peer->flags & FLAG_SKEY) {
1369		/*
1370		 * Decrement remaining autokey hashes. This isn't
1371		 * perfect if a packet is lost, but results in no harm.
1372		 */
1373		ap = (struct autokey *)peer->recval.ptr;
1374		if (ap != NULL) {
1375			if (ap->seq > 0)
1376				ap->seq--;
1377		}
1378		peer->flash |= TEST8;
1379		rval = crypto_recv(peer, rbufp);
1380		if (rval == XEVNT_OK) {
1381			peer->unreach = 0;
1382		} else {
1383			if (rval == XEVNT_ERR) {
1384				report_event(PEVNT_RESTART, peer,
1385				    "crypto error");
1386				peer_clear(peer, "CRYP");
1387				peer->flash |= TEST9;	/* bad crypt */
1388				if (peer->flags & FLAG_PREEMPT)
1389					unpeer(peer);
1390			}
1391			return;
1392		}
1393
1394		/*
1395		 * If server mode, verify the receive key ID matches
1396		 * the transmit key ID.
1397		 */
1398		if (hismode == MODE_SERVER) {
1399			if (skeyid == peer->keyid)
1400				peer->flash &= ~TEST8;
1401
1402		/*
1403		 * If an extension field is present, verify only that it
1404		 * has been correctly signed. We don't need a sequence
1405		 * check here, but the sequence continues.
1406		 */
1407		} else if (!(peer->flash & TEST8)) {
1408			peer->pkeyid = skeyid;
1409
1410		/*
1411		 * Now the fun part. Here, skeyid is the current ID in
1412		 * the packet, pkeyid is the ID in the last packet and
1413		 * tkeyid is the hash of skeyid. If the autokey values
1414		 * have not been received, this is an automatic error.
1415		 * If so, check that the tkeyid matches pkeyid. If not,
1416		 * hash tkeyid and try again. If the number of hashes
1417		 * exceeds the number remaining in the sequence, declare
1418		 * a successful failure and refresh the autokey values.
1419		 */
1420		} else if (ap != NULL) {
1421			int i;
1422
1423			for (i = 0; ; i++) {
1424				if (tkeyid == peer->pkeyid ||
1425				    tkeyid == ap->key) {
1426					peer->flash &= ~TEST8;
1427					peer->pkeyid = skeyid;
1428					ap->seq -= i;
1429					break;
1430				}
1431				if (i > ap->seq) {
1432					peer->crypto &=
1433					    ~CRYPTO_FLAG_AUTO;
1434					break;
1435				}
1436				tkeyid = session_key(
1437				    &rbufp->recv_srcadr, dstadr_sin,
1438				    tkeyid, pkeyid, 0);
1439			}
1440			if (peer->flash & TEST8)
1441				report_event(PEVNT_AUTH, peer, "keylist");
1442		}
1443		if (!(peer->crypto & CRYPTO_FLAG_PROV)) /* test 9 */
1444			peer->flash |= TEST8;	/* bad autokey */
1445
1446		/*
1447		 * The maximum lifetime of the protocol is about one
1448		 * week before restarting the Autokey protocol to
1449		 * refresh certificates and leapseconds values.
1450		 */
1451		if (current_time > peer->refresh) {
1452			report_event(PEVNT_RESTART, peer,
1453			    "crypto refresh");
1454			peer_clear(peer, "TIME");
1455			return;
1456		}
1457	}
1458#endif	/* AUTOKEY */
1459
1460	/*
1461	 * The dance is complete and the flash bits have been lit. Toss
1462	 * the packet over the fence for processing, which may light up
1463	 * more flashers.
1464	 */
1465	process_packet(peer, pkt, rbufp->recv_length);
1466
1467	/*
1468	 * In interleaved mode update the state variables. Also adjust the
1469	 * transmit phase to avoid crossover.
1470	 */
1471	if (peer->flip != 0) {
1472		peer->rec = p_rec;
1473		peer->dst = rbufp->recv_time;
1474		if (peer->nextdate - current_time < (1U << min(peer->ppoll,
1475		    peer->hpoll)) / 2)
1476			peer->nextdate++;
1477		else
1478			peer->nextdate--;
1479	}
1480}
1481
1482
1483/*
1484 * process_packet - Packet Procedure, a la Section 3.4.4 of the
1485 *	specification. Or almost, at least. If we're in here we have a
1486 *	reasonable expectation that we will be having a long term
1487 *	relationship with this host.
1488 */
1489void
1490process_packet(
1491	register struct peer *peer,
1492	register struct pkt *pkt,
1493	u_int	len
1494	)
1495{
1496	double	t34, t21;
1497	double	p_offset, p_del, p_disp;
1498	l_fp	p_rec, p_xmt, p_org, p_reftime, ci;
1499	u_char	pmode, pleap, pversion, pstratum;
1500	char	statstr[NTP_MAXSTRLEN];
1501#ifdef ASSYM
1502	int	itemp;
1503	double	etemp, ftemp, td;
1504#endif /* ASSYM */
1505
1506	sys_processed++;
1507	peer->processed++;
1508	p_del = FPTOD(NTOHS_FP(pkt->rootdelay));
1509	p_offset = 0;
1510	p_disp = FPTOD(NTOHS_FP(pkt->rootdisp));
1511	NTOHL_FP(&pkt->reftime, &p_reftime);
1512	NTOHL_FP(&pkt->org, &p_org);
1513	NTOHL_FP(&pkt->rec, &p_rec);
1514	NTOHL_FP(&pkt->xmt, &p_xmt);
1515	pmode = PKT_MODE(pkt->li_vn_mode);
1516	pleap = PKT_LEAP(pkt->li_vn_mode);
1517	pversion = PKT_VERSION(pkt->li_vn_mode);
1518	pstratum = PKT_TO_STRATUM(pkt->stratum);
1519
1520	/*
1521	 * Capture the header values in the client/peer association..
1522	 */
1523	record_raw_stats(&peer->srcadr, peer->dstadr ?
1524	    &peer->dstadr->sin : NULL,
1525	    &p_org, &p_rec, &p_xmt, &peer->dst,
1526	    pleap, pversion, pmode, pstratum, pkt->ppoll, pkt->precision,
1527	    p_del, p_disp, pkt->refid);
1528	peer->leap = pleap;
1529	peer->stratum = min(pstratum, STRATUM_UNSPEC);
1530	peer->pmode = pmode;
1531	peer->precision = pkt->precision;
1532	peer->rootdelay = p_del;
1533	peer->rootdisp = p_disp;
1534	peer->refid = pkt->refid;		/* network byte order */
1535	peer->reftime = p_reftime;
1536
1537	/*
1538	 * First, if either burst mode is armed, enable the burst.
1539	 * Compute the headway for the next packet and delay if
1540	 * necessary to avoid exceeding the threshold.
1541	 */
1542	if (peer->retry > 0) {
1543		peer->retry = 0;
1544		if (peer->reach)
1545			peer->burst = min(1 << (peer->hpoll -
1546			    peer->minpoll), NTP_SHIFT) - 1;
1547		else
1548			peer->burst = NTP_IBURST - 1;
1549		if (peer->burst > 0)
1550			peer->nextdate = current_time;
1551	}
1552	poll_update(peer, peer->hpoll);
1553
1554	/*
1555	 * Verify the server is synchronized; that is, the leap bits,
1556	 * stratum and root distance are valid.
1557	 */
1558	if (pleap == LEAP_NOTINSYNC ||		/* test 6 */
1559	    pstratum < sys_floor || pstratum >= sys_ceiling)
1560		peer->flash |= TEST6;		/* bad synch or strat */
1561	if (p_del / 2 + p_disp >= MAXDISPERSE)	/* test 7 */
1562		peer->flash |= TEST7;		/* bad header */
1563
1564	/*
1565	 * If any tests fail at this point, the packet is discarded.
1566	 * Note that some flashers may have already been set in the
1567	 * receive() routine.
1568	 */
1569	if (peer->flash & PKT_TEST_MASK) {
1570		peer->seldisptoolarge++;
1571#ifdef DEBUG
1572		if (debug)
1573			printf("packet: flash header %04x\n",
1574			    peer->flash);
1575#endif
1576		return;
1577	}
1578
1579	/*
1580	 * If the peer was previously unreachable, raise a trap. In any
1581	 * case, mark it reachable.
1582	 */
1583	if (!peer->reach) {
1584		report_event(PEVNT_REACH, peer, NULL);
1585		peer->timereachable = current_time;
1586	}
1587	peer->reach |= 1;
1588
1589	/*
1590	 * For a client/server association, calculate the clock offset,
1591	 * roundtrip delay and dispersion. The equations are reordered
1592	 * from the spec for more efficient use of temporaries. For a
1593	 * broadcast association, offset the last measurement by the
1594	 * computed delay during the client/server volley. Note the
1595	 * computation of dispersion includes the system precision plus
1596	 * that due to the frequency error since the origin time.
1597	 *
1598	 * It is very important to respect the hazards of overflow. The
1599	 * only permitted operation on raw timestamps is subtraction,
1600	 * where the result is a signed quantity spanning from 68 years
1601	 * in the past to 68 years in the future. To avoid loss of
1602	 * precision, these calculations are done using 64-bit integer
1603	 * arithmetic. However, the offset and delay calculations are
1604	 * sums and differences of these first-order differences, which
1605	 * if done using 64-bit integer arithmetic, would be valid over
1606	 * only half that span. Since the typical first-order
1607	 * differences are usually very small, they are converted to 64-
1608	 * bit doubles and all remaining calculations done in floating-
1609	 * double arithmetic. This preserves the accuracy while
1610	 * retaining the 68-year span.
1611	 *
1612	 * There are three interleaving schemes, basic, interleaved
1613	 * symmetric and interleaved broadcast. The timestamps are
1614	 * idioscyncratically different. See the onwire briefing/white
1615	 * paper at www.eecis.udel.edu/~mills for details.
1616	 *
1617	 * Interleaved symmetric mode
1618	 * t1 = peer->aorg/borg, t2 = peer->rec, t3 = p_xmt,
1619	 * t4 = peer->dst
1620	 */
1621	if (peer->flip != 0) {
1622		ci = p_xmt;				/* t3 - t4 */
1623		L_SUB(&ci, &peer->dst);
1624		LFPTOD(&ci, t34);
1625		ci = p_rec;				/* t2 - t1 */
1626		if (peer->flip > 0)
1627			L_SUB(&ci, &peer->borg);
1628		else
1629			L_SUB(&ci, &peer->aorg);
1630		LFPTOD(&ci, t21);
1631		p_del = t21 - t34;
1632		p_offset = (t21 + t34) / 2.;
1633		if (p_del < 0 || p_del > 1.) {
1634			snprintf(statstr, sizeof(statstr),
1635			    "t21 %.6f t34 %.6f", t21, t34);
1636			report_event(PEVNT_XERR, peer, statstr);
1637			return;
1638		}
1639
1640	/*
1641	 * Broadcast modes
1642	 */
1643	} else if (peer->pmode == MODE_BROADCAST) {
1644
1645		/*
1646		 * Interleaved broadcast mode. Use interleaved timestamps.
1647		 * t1 = peer->borg, t2 = p_org, t3 = p_org, t4 = aorg
1648		 */
1649		if (peer->flags & FLAG_XB) {
1650			ci = p_org;			/* delay */
1651			L_SUB(&ci, &peer->aorg);
1652			LFPTOD(&ci, t34);
1653			ci = p_org;			/* t2 - t1 */
1654			L_SUB(&ci, &peer->borg);
1655			LFPTOD(&ci, t21);
1656			peer->aorg = p_xmt;
1657			peer->borg = peer->dst;
1658			if (t34 < 0 || t34 > 1.) {
1659				snprintf(statstr, sizeof(statstr),
1660				    "offset %.6f delay %.6f", t21, t34);
1661				report_event(PEVNT_XERR, peer, statstr);
1662				return;
1663			}
1664			p_offset = t21;
1665			peer->xleave = t34;
1666
1667		/*
1668		 * Basic broadcast - use direct timestamps.
1669		 * t3 = p_xmt, t4 = peer->dst
1670		 */
1671		} else {
1672			ci = p_xmt;		/* t3 - t4 */
1673			L_SUB(&ci, &peer->dst);
1674			LFPTOD(&ci, t34);
1675			p_offset = t34;
1676		}
1677
1678		/*
1679		 * When calibration is complete and the clock is
1680		 * synchronized, the bias is calculated as the difference
1681		 * between the unicast timestamp and the broadcast
1682		 * timestamp. This works for both basic and interleaved
1683		 * modes.
1684		 */
1685		if (FLAG_BC_VOL & peer->flags) {
1686			peer->flags &= ~FLAG_BC_VOL;
1687			peer->delay = fabs(peer->offset - p_offset) * 2;
1688		}
1689		p_del = peer->delay;
1690		p_offset += p_del / 2;
1691
1692
1693	/*
1694	 * Basic mode, otherwise known as the old fashioned way.
1695	 *
1696	 * t1 = p_org, t2 = p_rec, t3 = p_xmt, t4 = peer->dst
1697	 */
1698	} else {
1699		ci = p_xmt;				/* t3 - t4 */
1700		L_SUB(&ci, &peer->dst);
1701		LFPTOD(&ci, t34);
1702		ci = p_rec;				/* t2 - t1 */
1703		L_SUB(&ci, &p_org);
1704		LFPTOD(&ci, t21);
1705		p_del = fabs(t21 - t34);
1706		p_offset = (t21 + t34) / 2.;
1707	}
1708	p_del = max(p_del, LOGTOD(sys_precision));
1709	p_disp = LOGTOD(sys_precision) + LOGTOD(peer->precision) +
1710	    clock_phi * p_del;
1711
1712#if ASSYM
1713	/*
1714	 * This code calculates the outbound and inbound data rates by
1715	 * measuring the differences between timestamps at different
1716	 * packet lengths. This is helpful in cases of large asymmetric
1717	 * delays commonly experienced on deep space communication
1718	 * links.
1719	 */
1720	if (peer->t21_last > 0 && peer->t34_bytes > 0) {
1721		itemp = peer->t21_bytes - peer->t21_last;
1722		if (itemp > 25) {
1723			etemp = t21 - peer->t21;
1724			if (fabs(etemp) > 1e-6) {
1725				ftemp = itemp / etemp;
1726				if (ftemp > 1000.)
1727					peer->r21 = ftemp;
1728			}
1729		}
1730		itemp = len - peer->t34_bytes;
1731		if (itemp > 25) {
1732			etemp = -t34 - peer->t34;
1733			if (fabs(etemp) > 1e-6) {
1734				ftemp = itemp / etemp;
1735				if (ftemp > 1000.)
1736					peer->r34 = ftemp;
1737			}
1738		}
1739	}
1740
1741	/*
1742	 * The following section compensates for different data rates on
1743	 * the outbound (d21) and inbound (t34) directions. To do this,
1744	 * it finds t such that r21 * t - r34 * (d - t) = 0, where d is
1745	 * the roundtrip delay. Then it calculates the correction as a
1746	 * fraction of d.
1747	 */
1748 	peer->t21 = t21;
1749	peer->t21_last = peer->t21_bytes;
1750	peer->t34 = -t34;
1751	peer->t34_bytes = len;
1752#ifdef DEBUG
1753	if (debug > 1)
1754		printf("packet: t21 %.9lf %d t34 %.9lf %d\n", peer->t21,
1755		    peer->t21_bytes, peer->t34, peer->t34_bytes);
1756#endif
1757	if (peer->r21 > 0 && peer->r34 > 0 && p_del > 0) {
1758		if (peer->pmode != MODE_BROADCAST)
1759			td = (peer->r34 / (peer->r21 + peer->r34) -
1760			    .5) * p_del;
1761		else
1762			td = 0;
1763
1764		/*
1765 		 * Unfortunately, in many cases the errors are
1766		 * unacceptable, so for the present the rates are not
1767		 * used. In future, we might find conditions where the
1768		 * calculations are useful, so this should be considered
1769		 * a work in progress.
1770		 */
1771		t21 -= td;
1772		t34 -= td;
1773#ifdef DEBUG
1774		if (debug > 1)
1775			printf("packet: del %.6lf r21 %.1lf r34 %.1lf %.6lf\n",
1776			    p_del, peer->r21 / 1e3, peer->r34 / 1e3,
1777			    td);
1778#endif
1779	}
1780#endif /* ASSYM */
1781
1782	/*
1783	 * That was awesome. Now hand off to the clock filter.
1784	 */
1785	clock_filter(peer, p_offset + peer->bias, p_del, p_disp);
1786
1787	/*
1788	 * If we are in broadcast calibrate mode, return to broadcast
1789	 * client mode when the client is fit and the autokey dance is
1790	 * complete.
1791	 */
1792	if ((FLAG_BC_VOL & peer->flags) && MODE_CLIENT == peer->hmode &&
1793	    !(TEST11 & peer_unfit(peer))) {	/* distance exceeded */
1794#ifdef AUTOKEY
1795		if (peer->flags & FLAG_SKEY) {
1796			if (!(~peer->crypto & CRYPTO_FLAG_ALL))
1797				peer->hmode = MODE_BCLIENT;
1798		} else {
1799			peer->hmode = MODE_BCLIENT;
1800		}
1801#else	/* !AUTOKEY follows */
1802		peer->hmode = MODE_BCLIENT;
1803#endif	/* !AUTOKEY */
1804	}
1805}
1806
1807
1808/*
1809 * clock_update - Called at system process update intervals.
1810 */
1811static void
1812clock_update(
1813	struct peer *peer	/* peer structure pointer */
1814	)
1815{
1816	double	dtemp;
1817	l_fp	now;
1818#ifdef HAVE_LIBSCF_H
1819	char	*fmri;
1820#endif /* HAVE_LIBSCF_H */
1821
1822	/*
1823	 * Update the system state variables. We do this very carefully,
1824	 * as the poll interval might need to be clamped differently.
1825	 */
1826	sys_peer = peer;
1827	sys_epoch = peer->epoch;
1828	if (sys_poll < peer->minpoll)
1829		sys_poll = peer->minpoll;
1830	if (sys_poll > peer->maxpoll)
1831		sys_poll = peer->maxpoll;
1832	poll_update(peer, sys_poll);
1833	sys_stratum = min(peer->stratum + 1, STRATUM_UNSPEC);
1834	if (peer->stratum == STRATUM_REFCLOCK ||
1835	    peer->stratum == STRATUM_UNSPEC)
1836		sys_refid = peer->refid;
1837	else
1838		sys_refid = addr2refid(&peer->srcadr);
1839	/*
1840	 * Root Dispersion (E) is defined (in RFC 5905) as:
1841	 *
1842	 * E = p.epsilon_r + p.epsilon + p.psi + PHI*(s.t - p.t) + |THETA|
1843	 *
1844	 * where:
1845	 *  p.epsilon_r is the PollProc's root dispersion
1846	 *  p.epsilon   is the PollProc's dispersion
1847	 *  p.psi       is the PollProc's jitter
1848	 *  THETA       is the combined offset
1849	 *
1850	 * NB: Think Hard about where these numbers come from and
1851	 * what they mean.  When did peer->update happen?  Has anything
1852	 * interesting happened since then?  What values are the most
1853	 * defensible?  Why?
1854	 *
1855	 * DLM thinks this equation is probably the best of all worse choices.
1856	 */
1857	dtemp	= peer->rootdisp
1858		+ peer->disp
1859		+ sys_jitter
1860		+ clock_phi * (current_time - peer->update)
1861		+ fabs(sys_offset);
1862
1863	if (dtemp > sys_mindisp)
1864		sys_rootdisp = dtemp;
1865	else
1866		sys_rootdisp = sys_mindisp;
1867	sys_rootdelay = peer->delay + peer->rootdelay;
1868	sys_reftime = peer->dst;
1869
1870#ifdef DEBUG
1871	if (debug)
1872		printf(
1873		    "clock_update: at %lu sample %lu associd %d\n",
1874		    current_time, peer->epoch, peer->associd);
1875#endif
1876
1877	/*
1878	 * Comes now the moment of truth. Crank the clock discipline and
1879	 * see what comes out.
1880	 */
1881	switch (local_clock(peer, sys_offset)) {
1882
1883	/*
1884	 * Clock exceeds panic threshold. Life as we know it ends.
1885	 */
1886	case -1:
1887#ifdef HAVE_LIBSCF_H
1888		/*
1889		 * For Solaris enter the maintenance mode.
1890		 */
1891		if ((fmri = getenv("SMF_FMRI")) != NULL) {
1892			if (smf_maintain_instance(fmri, 0) < 0) {
1893				printf("smf_maintain_instance: %s\n",
1894				    scf_strerror(scf_error()));
1895				exit(1);
1896			}
1897			/*
1898			 * Sleep until SMF kills us.
1899			 */
1900			for (;;)
1901				pause();
1902		}
1903#endif /* HAVE_LIBSCF_H */
1904		exit (-1);
1905		/* not reached */
1906
1907	/*
1908	 * Clock was stepped. Flush all time values of all peers.
1909	 */
1910	case 2:
1911		clear_all();
1912		sys_leap = LEAP_NOTINSYNC;
1913		sys_stratum = STRATUM_UNSPEC;
1914		memcpy(&sys_refid, "STEP", 4);
1915		sys_rootdelay = 0;
1916		sys_rootdisp = 0;
1917		L_CLR(&sys_reftime);
1918		sys_jitter = LOGTOD(sys_precision);
1919		leapsec_reset_frame();
1920		break;
1921
1922	/*
1923	 * Clock was slewed. Handle the leapsecond stuff.
1924	 */
1925	case 1:
1926
1927		/*
1928		 * If this is the first time the clock is set, reset the
1929		 * leap bits. If crypto, the timer will goose the setup
1930		 * process.
1931		 */
1932		if (sys_leap == LEAP_NOTINSYNC) {
1933			sys_leap = LEAP_NOWARNING;
1934#ifdef AUTOKEY
1935			if (crypto_flags)
1936				crypto_update();
1937#endif	/* AUTOKEY */
1938			/*
1939			 * If our parent process is waiting for the
1940			 * first clock sync, send them home satisfied.
1941			 */
1942#ifdef HAVE_WORKING_FORK
1943			if (waitsync_fd_to_close != -1) {
1944				close(waitsync_fd_to_close);
1945				waitsync_fd_to_close = -1;
1946				DPRINTF(1, ("notified parent --wait-sync is done\n"));
1947			}
1948#endif /* HAVE_WORKING_FORK */
1949
1950		}
1951
1952		/*
1953		 * If there is no leap second pending and the number of
1954		 * survivor leap bits is greater than half the number of
1955		 * survivors, try to schedule a leap for the end of the
1956		 * current month. (This only works if no leap second for
1957		 * that range is in the table, so doing this more than
1958		 * once is mostly harmless.)
1959		 */
1960		if (leapsec == LSPROX_NOWARN) {
1961			if (leap_vote_ins > leap_vote_del
1962			    && leap_vote_ins > sys_survivors / 2) {
1963				get_systime(&now);
1964				leapsec_add_dyn(TRUE, now.l_ui, NULL);
1965			}
1966			if (leap_vote_del > leap_vote_ins
1967			    && leap_vote_del > sys_survivors / 2) {
1968				get_systime(&now);
1969				leapsec_add_dyn(FALSE, now.l_ui, NULL);
1970			}
1971		}
1972		break;
1973
1974	/*
1975	 * Popcorn spike or step threshold exceeded. Pretend it never
1976	 * happened.
1977	 */
1978	default:
1979		break;
1980	}
1981}
1982
1983
1984/*
1985 * poll_update - update peer poll interval
1986 */
1987void
1988poll_update(
1989	struct peer *peer,	/* peer structure pointer */
1990	u_char	mpoll
1991	)
1992{
1993	u_long	next, utemp;
1994	u_char	hpoll;
1995
1996	/*
1997	 * This routine figures out when the next poll should be sent.
1998	 * That turns out to be wickedly complicated. One problem is
1999	 * that sometimes the time for the next poll is in the past when
2000	 * the poll interval is reduced. We watch out for races here
2001	 * between the receive process and the poll process.
2002	 *
2003	 * Clamp the poll interval between minpoll and maxpoll.
2004	 */
2005	hpoll = max(min(peer->maxpoll, mpoll), peer->minpoll);
2006
2007#ifdef AUTOKEY
2008	/*
2009	 * If during the crypto protocol the poll interval has changed,
2010	 * the lifetimes in the key list are probably bogus. Purge the
2011	 * the key list and regenerate it later.
2012	 */
2013	if ((peer->flags & FLAG_SKEY) && hpoll != peer->hpoll)
2014		key_expire(peer);
2015#endif	/* AUTOKEY */
2016	peer->hpoll = hpoll;
2017
2018	/*
2019	 * There are three variables important for poll scheduling, the
2020	 * current time (current_time), next scheduled time (nextdate)
2021	 * and the earliest time (utemp). The earliest time is 2 s
2022	 * seconds, but could be more due to rate management. When
2023	 * sending in a burst, use the earliest time. When not in a
2024	 * burst but with a reply pending, send at the earliest time
2025	 * unless the next scheduled time has not advanced. This can
2026	 * only happen if multiple replies are pending in the same
2027	 * response interval. Otherwise, send at the later of the next
2028	 * scheduled time and the earliest time.
2029	 *
2030	 * Now we figure out if there is an override. If a burst is in
2031	 * progress and we get called from the receive process, just
2032	 * slink away. If called from the poll process, delay 1 s for a
2033	 * reference clock, otherwise 2 s.
2034	 */
2035	utemp = current_time + max(peer->throttle - (NTP_SHIFT - 1) *
2036	    (1 << peer->minpoll), ntp_minpkt);
2037	if (peer->burst > 0) {
2038		if (peer->nextdate > current_time)
2039			return;
2040#ifdef REFCLOCK
2041		else if (peer->flags & FLAG_REFCLOCK)
2042			peer->nextdate = current_time + RESP_DELAY;
2043#endif /* REFCLOCK */
2044		else
2045			peer->nextdate = utemp;
2046
2047#ifdef AUTOKEY
2048	/*
2049	 * If a burst is not in progress and a crypto response message
2050	 * is pending, delay 2 s, but only if this is a new interval.
2051	 */
2052	} else if (peer->cmmd != NULL) {
2053		if (peer->nextdate > current_time) {
2054			if (peer->nextdate + ntp_minpkt != utemp)
2055				peer->nextdate = utemp;
2056		} else {
2057			peer->nextdate = utemp;
2058		}
2059#endif	/* AUTOKEY */
2060
2061	/*
2062	 * The ordinary case. If a retry, use minpoll; if unreachable,
2063	 * use host poll; otherwise, use the minimum of host and peer
2064	 * polls; In other words, oversampling is okay but
2065	 * understampling is evil. Use the maximum of this value and the
2066	 * headway. If the average headway is greater than the headway
2067	 * threshold, increase the headway by the minimum interval.
2068	 */
2069	} else {
2070		if (peer->retry > 0)
2071			hpoll = peer->minpoll;
2072		else if (!(peer->reach))
2073			hpoll = peer->hpoll;
2074		else
2075			hpoll = min(peer->ppoll, peer->hpoll);
2076#ifdef REFCLOCK
2077		if (peer->flags & FLAG_REFCLOCK)
2078			next = 1 << hpoll;
2079		else
2080#endif /* REFCLOCK */
2081			next = ((0x1000UL | (ntp_random() & 0x0ff)) <<
2082			    hpoll) >> 12;
2083		next += peer->outdate;
2084		if (next > utemp)
2085			peer->nextdate = next;
2086		else
2087			peer->nextdate = utemp;
2088		if (peer->throttle > (1 << peer->minpoll))
2089			peer->nextdate += ntp_minpkt;
2090	}
2091	DPRINTF(2, ("poll_update: at %lu %s poll %d burst %d retry %d head %d early %lu next %lu\n",
2092		    current_time, ntoa(&peer->srcadr), peer->hpoll,
2093		    peer->burst, peer->retry, peer->throttle,
2094		    utemp - current_time, peer->nextdate -
2095		    current_time));
2096}
2097
2098
2099/*
2100 * peer_clear - clear peer filter registers.  See Section 3.4.8 of the
2101 * spec.
2102 */
2103void
2104peer_clear(
2105	struct peer *peer,		/* peer structure */
2106	const char *ident		/* tally lights */
2107	)
2108{
2109	u_char	u;
2110
2111#ifdef AUTOKEY
2112	/*
2113	 * If cryptographic credentials have been acquired, toss them to
2114	 * Valhalla. Note that autokeys are ephemeral, in that they are
2115	 * tossed immediately upon use. Therefore, the keylist can be
2116	 * purged anytime without needing to preserve random keys. Note
2117	 * that, if the peer is purged, the cryptographic variables are
2118	 * purged, too. This makes it much harder to sneak in some
2119	 * unauthenticated data in the clock filter.
2120	 */
2121	key_expire(peer);
2122	if (peer->iffval != NULL)
2123		BN_free(peer->iffval);
2124	value_free(&peer->cookval);
2125	value_free(&peer->recval);
2126	value_free(&peer->encrypt);
2127	value_free(&peer->sndval);
2128	if (peer->cmmd != NULL)
2129		free(peer->cmmd);
2130	if (peer->subject != NULL)
2131		free(peer->subject);
2132	if (peer->issuer != NULL)
2133		free(peer->issuer);
2134#endif /* AUTOKEY */
2135
2136	/*
2137	 * Clear all values, including the optional crypto values above.
2138	 */
2139	memset(CLEAR_TO_ZERO(peer), 0, LEN_CLEAR_TO_ZERO(peer));
2140	peer->ppoll = peer->maxpoll;
2141	peer->hpoll = peer->minpoll;
2142	peer->disp = MAXDISPERSE;
2143	peer->flash = peer_unfit(peer);
2144	peer->jitter = LOGTOD(sys_precision);
2145
2146	/*
2147	 * If interleave mode, initialize the alternate origin switch.
2148	 */
2149	if (peer->flags & FLAG_XLEAVE)
2150		peer->flip = 1;
2151	for (u = 0; u < NTP_SHIFT; u++) {
2152		peer->filter_order[u] = u;
2153		peer->filter_disp[u] = MAXDISPERSE;
2154	}
2155#ifdef REFCLOCK
2156	if (!(peer->flags & FLAG_REFCLOCK)) {
2157#endif
2158		peer->leap = LEAP_NOTINSYNC;
2159		peer->stratum = STRATUM_UNSPEC;
2160		memcpy(&peer->refid, ident, 4);
2161#ifdef REFCLOCK
2162	}
2163#endif
2164
2165	/*
2166	 * During initialization use the association count to spread out
2167	 * the polls at one-second intervals. Passive associations'
2168	 * first poll is delayed by the "discard minimum" to avoid rate
2169	 * limiting. Other post-startup new or cleared associations
2170	 * randomize the first poll over the minimum poll interval to
2171	 * avoid implosion.
2172	 */
2173	peer->nextdate = peer->update = peer->outdate = current_time;
2174	if (initializing) {
2175		peer->nextdate += peer_associations;
2176	} else if (MODE_PASSIVE == peer->hmode) {
2177		peer->nextdate += ntp_minpkt;
2178	} else {
2179		peer->nextdate += ntp_random() % peer->minpoll;
2180	}
2181#ifdef AUTOKEY
2182	peer->refresh = current_time + (1 << NTP_REFRESH);
2183#endif	/* AUTOKEY */
2184#ifdef DEBUG
2185	if (debug)
2186		printf(
2187		    "peer_clear: at %ld next %ld associd %d refid %s\n",
2188		    current_time, peer->nextdate, peer->associd,
2189		    ident);
2190#endif
2191}
2192
2193
2194/*
2195 * clock_filter - add incoming clock sample to filter register and run
2196 *		  the filter procedure to find the best sample.
2197 */
2198void
2199clock_filter(
2200	struct peer *peer,		/* peer structure pointer */
2201	double	sample_offset,		/* clock offset */
2202	double	sample_delay,		/* roundtrip delay */
2203	double	sample_disp		/* dispersion */
2204	)
2205{
2206	double	dst[NTP_SHIFT];		/* distance vector */
2207	int	ord[NTP_SHIFT];		/* index vector */
2208	int	i, j, k, m;
2209	double	dtemp, etemp;
2210	char	tbuf[80];
2211
2212	/*
2213	 * A sample consists of the offset, delay, dispersion and epoch
2214	 * of arrival. The offset and delay are determined by the on-
2215	 * wire protocol. The dispersion grows from the last outbound
2216	 * packet to the arrival of this one increased by the sum of the
2217	 * peer precision and the system precision as required by the
2218	 * error budget. First, shift the new arrival into the shift
2219	 * register discarding the oldest one.
2220	 */
2221	j = peer->filter_nextpt;
2222	peer->filter_offset[j] = sample_offset;
2223	peer->filter_delay[j] = sample_delay;
2224	peer->filter_disp[j] = sample_disp;
2225	peer->filter_epoch[j] = current_time;
2226	j = (j + 1) % NTP_SHIFT;
2227	peer->filter_nextpt = j;
2228
2229	/*
2230	 * Update dispersions since the last update and at the same
2231	 * time initialize the distance and index lists. Since samples
2232	 * become increasingly uncorrelated beyond the Allan intercept,
2233	 * only under exceptional cases will an older sample be used.
2234	 * Therefore, the distance list uses a compound metric. If the
2235	 * dispersion is greater than the maximum dispersion, clamp the
2236	 * distance at that value. If the time since the last update is
2237	 * less than the Allan intercept use the delay; otherwise, use
2238	 * the sum of the delay and dispersion.
2239	 */
2240	dtemp = clock_phi * (current_time - peer->update);
2241	peer->update = current_time;
2242	for (i = NTP_SHIFT - 1; i >= 0; i--) {
2243		if (i != 0)
2244			peer->filter_disp[j] += dtemp;
2245		if (peer->filter_disp[j] >= MAXDISPERSE) {
2246			peer->filter_disp[j] = MAXDISPERSE;
2247			dst[i] = MAXDISPERSE;
2248		} else if (peer->update - peer->filter_epoch[j] >
2249		    (u_long)ULOGTOD(allan_xpt)) {
2250			dst[i] = peer->filter_delay[j] +
2251			    peer->filter_disp[j];
2252		} else {
2253			dst[i] = peer->filter_delay[j];
2254		}
2255		ord[i] = j;
2256		j = (j + 1) % NTP_SHIFT;
2257	}
2258
2259	/*
2260	 * If the clock has stabilized, sort the samples by distance.
2261	 */
2262	if (freq_cnt == 0) {
2263		for (i = 1; i < NTP_SHIFT; i++) {
2264			for (j = 0; j < i; j++) {
2265				if (dst[j] > dst[i]) {
2266					k = ord[j];
2267					ord[j] = ord[i];
2268					ord[i] = k;
2269					etemp = dst[j];
2270					dst[j] = dst[i];
2271					dst[i] = etemp;
2272				}
2273			}
2274		}
2275	}
2276
2277	/*
2278	 * Copy the index list to the association structure so ntpq
2279	 * can see it later. Prune the distance list to leave only
2280	 * samples less than the maximum dispersion, which disfavors
2281	 * uncorrelated samples older than the Allan intercept. To
2282	 * further improve the jitter estimate, of the remainder leave
2283	 * only samples less than the maximum distance, but keep at
2284	 * least two samples for jitter calculation.
2285	 */
2286	m = 0;
2287	for (i = 0; i < NTP_SHIFT; i++) {
2288		peer->filter_order[i] = (u_char) ord[i];
2289		if (dst[i] >= MAXDISPERSE || (m >= 2 && dst[i] >=
2290		    sys_maxdist))
2291			continue;
2292		m++;
2293	}
2294
2295	/*
2296	 * Compute the dispersion and jitter. The dispersion is weighted
2297	 * exponentially by NTP_FWEIGHT (0.5) so it is normalized close
2298	 * to 1.0. The jitter is the RMS differences relative to the
2299	 * lowest delay sample.
2300	 */
2301	peer->disp = peer->jitter = 0;
2302	k = ord[0];
2303	for (i = NTP_SHIFT - 1; i >= 0; i--) {
2304		j = ord[i];
2305		peer->disp = NTP_FWEIGHT * (peer->disp +
2306		    peer->filter_disp[j]);
2307		if (i < m)
2308			peer->jitter += DIFF(peer->filter_offset[j],
2309			    peer->filter_offset[k]);
2310	}
2311
2312	/*
2313	 * If no acceptable samples remain in the shift register,
2314	 * quietly tiptoe home leaving only the dispersion. Otherwise,
2315	 * save the offset, delay and jitter. Note the jitter must not
2316	 * be less than the precision.
2317	 */
2318	if (m == 0) {
2319		clock_select();
2320		return;
2321	}
2322	etemp = fabs(peer->offset - peer->filter_offset[k]);
2323	peer->offset = peer->filter_offset[k];
2324	peer->delay = peer->filter_delay[k];
2325	if (m > 1)
2326		peer->jitter /= m - 1;
2327	peer->jitter = max(SQRT(peer->jitter), LOGTOD(sys_precision));
2328
2329	/*
2330	 * If the the new sample and the current sample are both valid
2331	 * and the difference between their offsets exceeds CLOCK_SGATE
2332	 * (3) times the jitter and the interval between them is less
2333	 * than twice the host poll interval, consider the new sample
2334	 * a popcorn spike and ignore it.
2335	 */
2336	if (peer->disp < sys_maxdist && peer->filter_disp[k] <
2337	    sys_maxdist && etemp > CLOCK_SGATE * peer->jitter &&
2338	    peer->filter_epoch[k] - peer->epoch < 2. *
2339	    ULOGTOD(peer->hpoll)) {
2340		snprintf(tbuf, sizeof(tbuf), "%.6f s", etemp);
2341		report_event(PEVNT_POPCORN, peer, tbuf);
2342		return;
2343	}
2344
2345	/*
2346	 * A new minimum sample is useful only if it is later than the
2347	 * last one used. In this design the maximum lifetime of any
2348	 * sample is not greater than eight times the poll interval, so
2349	 * the maximum interval between minimum samples is eight
2350	 * packets.
2351	 */
2352	if (peer->filter_epoch[k] <= peer->epoch) {
2353#if DEBUG
2354	if (debug > 1)
2355		printf("clock_filter: old sample %lu\n", current_time -
2356		    peer->filter_epoch[k]);
2357#endif
2358		return;
2359	}
2360	peer->epoch = peer->filter_epoch[k];
2361
2362	/*
2363	 * The mitigated sample statistics are saved for later
2364	 * processing. If not synchronized or not in a burst, tickle the
2365	 * clock select algorithm.
2366	 */
2367	record_peer_stats(&peer->srcadr, ctlpeerstatus(peer),
2368	    peer->offset, peer->delay, peer->disp, peer->jitter);
2369#ifdef DEBUG
2370	if (debug)
2371		printf(
2372		    "clock_filter: n %d off %.6f del %.6f dsp %.6f jit %.6f\n",
2373		    m, peer->offset, peer->delay, peer->disp,
2374		    peer->jitter);
2375#endif
2376	if (peer->burst == 0 || sys_leap == LEAP_NOTINSYNC)
2377		clock_select();
2378}
2379
2380
2381/*
2382 * clock_select - find the pick-of-the-litter clock
2383 *
2384 * LOCKCLOCK: (1) If the local clock is the prefer peer, it will always
2385 * be enabled, even if declared falseticker, (2) only the prefer peer
2386 * can be selected as the system peer, (3) if the external source is
2387 * down, the system leap bits are set to 11 and the stratum set to
2388 * infinity.
2389 */
2390void
2391clock_select(void)
2392{
2393	struct peer *peer;
2394	int	i, j, k, n;
2395	int	nlist, nl2;
2396	int	allow;
2397	int	speer;
2398	double	d, e, f, g;
2399	double	high, low;
2400	double	speermet;
2401	double	orphmet = 2.0 * U_INT32_MAX; /* 2x is greater than */
2402	struct endpoint endp;
2403	struct peer *osys_peer;
2404	struct peer *sys_prefer = NULL;	/* prefer peer */
2405	struct peer *typesystem = NULL;
2406	struct peer *typeorphan = NULL;
2407#ifdef REFCLOCK
2408	struct peer *typeacts = NULL;
2409	struct peer *typelocal = NULL;
2410	struct peer *typepps = NULL;
2411#endif /* REFCLOCK */
2412	static struct endpoint *endpoint = NULL;
2413	static int *indx = NULL;
2414	static peer_select *peers = NULL;
2415	static u_int endpoint_size = 0;
2416	static u_int peers_size = 0;
2417	static u_int indx_size = 0;
2418	size_t octets;
2419
2420	/*
2421	 * Initialize and create endpoint, index and peer lists big
2422	 * enough to handle all associations.
2423	 */
2424	osys_peer = sys_peer;
2425	sys_survivors = 0;
2426#ifdef LOCKCLOCK
2427	sys_leap = LEAP_NOTINSYNC;
2428	sys_stratum = STRATUM_UNSPEC;
2429	memcpy(&sys_refid, "DOWN", 4);
2430#endif /* LOCKCLOCK */
2431
2432	/*
2433	 * Allocate dynamic space depending on the number of
2434	 * associations.
2435	 */
2436	nlist = 1;
2437	for (peer = peer_list; peer != NULL; peer = peer->p_link)
2438		nlist++;
2439	endpoint_size = ALIGNED_SIZE(nlist * 2 * sizeof(*endpoint));
2440	peers_size = ALIGNED_SIZE(nlist * sizeof(*peers));
2441	indx_size = ALIGNED_SIZE(nlist * 2 * sizeof(*indx));
2442	octets = endpoint_size + peers_size + indx_size;
2443	endpoint = erealloc(endpoint, octets);
2444	peers = INC_ALIGNED_PTR(endpoint, endpoint_size);
2445	indx = INC_ALIGNED_PTR(peers, peers_size);
2446
2447	/*
2448	 * Initially, we populate the island with all the rifraff peers
2449	 * that happen to be lying around. Those with seriously
2450	 * defective clocks are immediately booted off the island. Then,
2451	 * the falsetickers are culled and put to sea. The truechimers
2452	 * remaining are subject to repeated rounds where the most
2453	 * unpopular at each round is kicked off. When the population
2454	 * has dwindled to sys_minclock, the survivors split a million
2455	 * bucks and collectively crank the chimes.
2456	 */
2457	nlist = nl2 = 0;	/* none yet */
2458	for (peer = peer_list; peer != NULL; peer = peer->p_link) {
2459		peer->new_status = CTL_PST_SEL_REJECT;
2460
2461		/*
2462		 * Leave the island immediately if the peer is
2463		 * unfit to synchronize.
2464		 */
2465		if (peer_unfit(peer))
2466			continue;
2467
2468		/*
2469		 * If this peer is an orphan parent, elect the
2470		 * one with the lowest metric defined as the
2471		 * IPv4 address or the first 64 bits of the
2472		 * hashed IPv6 address.  To ensure convergence
2473		 * on the same selected orphan, consider as
2474		 * well that this system may have the lowest
2475		 * metric and be the orphan parent.  If this
2476		 * system wins, sys_peer will be NULL to trigger
2477		 * orphan mode in timer().
2478		 */
2479		if (peer->stratum == sys_orphan) {
2480			u_int32	localmet;
2481			u_int32 peermet;
2482
2483			if (peer->dstadr != NULL)
2484				localmet = ntohl(peer->dstadr->addr_refid);
2485			else
2486				localmet = U_INT32_MAX;
2487			peermet = ntohl(addr2refid(&peer->srcadr));
2488			if (peermet < localmet && peermet < orphmet) {
2489				typeorphan = peer;
2490				orphmet = peermet;
2491			}
2492			continue;
2493		}
2494
2495		/*
2496		 * If this peer could have the orphan parent
2497		 * as a synchronization ancestor, exclude it
2498		 * from selection to avoid forming a
2499		 * synchronization loop within the orphan mesh,
2500		 * triggering stratum climb to infinity
2501		 * instability.  Peers at stratum higher than
2502		 * the orphan stratum could have the orphan
2503		 * parent in ancestry so are excluded.
2504		 * See http://bugs.ntp.org/2050
2505		 */
2506		if (peer->stratum > sys_orphan)
2507			continue;
2508#ifdef REFCLOCK
2509		/*
2510		 * The following are special cases. We deal
2511		 * with them later.
2512		 */
2513		if (!(peer->flags & FLAG_PREFER)) {
2514			switch (peer->refclktype) {
2515			case REFCLK_LOCALCLOCK:
2516				if (current_time > orphwait &&
2517				    typelocal == NULL)
2518					typelocal = peer;
2519				continue;
2520
2521			case REFCLK_ACTS:
2522				if (current_time > orphwait &&
2523				    typeacts == NULL)
2524					typeacts = peer;
2525				continue;
2526			}
2527		}
2528#endif /* REFCLOCK */
2529
2530		/*
2531		 * If we get this far, the peer can stay on the
2532		 * island, but does not yet have the immunity
2533		 * idol.
2534		 */
2535		peer->new_status = CTL_PST_SEL_SANE;
2536		f = root_distance(peer);
2537		peers[nlist].peer = peer;
2538		peers[nlist].error = peer->jitter;
2539		peers[nlist].synch = f;
2540		nlist++;
2541
2542		/*
2543		 * Insert each interval endpoint on the unsorted
2544		 * endpoint[] list.
2545		 */
2546		e = peer->offset;
2547		endpoint[nl2].type = -1;	/* lower end */
2548		endpoint[nl2].val = e - f;
2549		nl2++;
2550		endpoint[nl2].type = 1;		/* upper end */
2551		endpoint[nl2].val = e + f;
2552		nl2++;
2553	}
2554	/*
2555	 * Construct sorted indx[] of endpoint[] indexes ordered by
2556	 * offset.
2557	 */
2558	for (i = 0; i < nl2; i++)
2559		indx[i] = i;
2560	for (i = 0; i < nl2; i++) {
2561		endp = endpoint[indx[i]];
2562		e = endp.val;
2563		k = i;
2564		for (j = i + 1; j < nl2; j++) {
2565			endp = endpoint[indx[j]];
2566			if (endp.val < e) {
2567				e = endp.val;
2568				k = j;
2569			}
2570		}
2571		if (k != i) {
2572			j = indx[k];
2573			indx[k] = indx[i];
2574			indx[i] = j;
2575		}
2576	}
2577	for (i = 0; i < nl2; i++)
2578		DPRINTF(3, ("select: endpoint %2d %.6f\n",
2579			endpoint[indx[i]].type, endpoint[indx[i]].val));
2580
2581	/*
2582	 * This is the actual algorithm that cleaves the truechimers
2583	 * from the falsetickers. The original algorithm was described
2584	 * in Keith Marzullo's dissertation, but has been modified for
2585	 * better accuracy.
2586	 *
2587	 * Briefly put, we first assume there are no falsetickers, then
2588	 * scan the candidate list first from the low end upwards and
2589	 * then from the high end downwards. The scans stop when the
2590	 * number of intersections equals the number of candidates less
2591	 * the number of falsetickers. If this doesn't happen for a
2592	 * given number of falsetickers, we bump the number of
2593	 * falsetickers and try again. If the number of falsetickers
2594	 * becomes equal to or greater than half the number of
2595	 * candidates, the Albanians have won the Byzantine wars and
2596	 * correct synchronization is not possible.
2597	 *
2598	 * Here, nlist is the number of candidates and allow is the
2599	 * number of falsetickers. Upon exit, the truechimers are the
2600	 * survivors with offsets not less than low and not greater than
2601	 * high. There may be none of them.
2602	 */
2603	low = 1e9;
2604	high = -1e9;
2605	for (allow = 0; 2 * allow < nlist; allow++) {
2606
2607		/*
2608		 * Bound the interval (low, high) as the smallest
2609		 * interval containing points from the most sources.
2610		 */
2611		n = 0;
2612		for (i = 0; i < nl2; i++) {
2613			low = endpoint[indx[i]].val;
2614			n -= endpoint[indx[i]].type;
2615			if (n >= nlist - allow)
2616				break;
2617		}
2618		n = 0;
2619		for (j = nl2 - 1; j >= 0; j--) {
2620			high = endpoint[indx[j]].val;
2621			n += endpoint[indx[j]].type;
2622			if (n >= nlist - allow)
2623				break;
2624		}
2625
2626		/*
2627		 * If an interval containing truechimers is found, stop.
2628		 * If not, increase the number of falsetickers and go
2629		 * around again.
2630		 */
2631		if (high > low)
2632			break;
2633	}
2634
2635	/*
2636	 * Clustering algorithm. Whittle candidate list of falsetickers,
2637	 * who leave the island immediately. The TRUE peer is always a
2638	 * truechimer. We must leave at least one peer to collect the
2639	 * million bucks.
2640	 *
2641	 * We assert the correct time is contained in the interval, but
2642	 * the best offset estimate for the interval might not be
2643	 * contained in the interval. For this purpose, a truechimer is
2644	 * defined as the midpoint of an interval that overlaps the
2645	 * intersection interval.
2646	 */
2647	j = 0;
2648	for (i = 0; i < nlist; i++) {
2649		double	h;
2650
2651		peer = peers[i].peer;
2652		h = peers[i].synch;
2653		if ((high <= low || peer->offset + h < low ||
2654		    peer->offset - h > high) && !(peer->flags & FLAG_TRUE))
2655			continue;
2656
2657#ifdef REFCLOCK
2658		/*
2659		 * Eligible PPS peers must survive the intersection
2660		 * algorithm. Use the first one found, but don't
2661		 * include any of them in the cluster population.
2662		 */
2663		if (peer->flags & FLAG_PPS) {
2664			if (typepps == NULL)
2665				typepps = peer;
2666			if (!(peer->flags & FLAG_TSTAMP_PPS))
2667				continue;
2668		}
2669#endif /* REFCLOCK */
2670
2671		if (j != i)
2672			peers[j] = peers[i];
2673		j++;
2674	}
2675	nlist = j;
2676
2677	/*
2678	 * If no survivors remain at this point, check if the modem
2679	 * driver, local driver or orphan parent in that order. If so,
2680	 * nominate the first one found as the only survivor.
2681	 * Otherwise, give up and leave the island to the rats.
2682	 */
2683	if (nlist == 0) {
2684		peers[0].error = 0;
2685		peers[0].synch = sys_mindisp;
2686#ifdef REFCLOCK
2687		if (typeacts != NULL) {
2688			peers[0].peer = typeacts;
2689			nlist = 1;
2690		} else if (typelocal != NULL) {
2691			peers[0].peer = typelocal;
2692			nlist = 1;
2693		} else
2694#endif /* REFCLOCK */
2695		if (typeorphan != NULL) {
2696			peers[0].peer = typeorphan;
2697			nlist = 1;
2698		}
2699	}
2700
2701	/*
2702	 * Mark the candidates at this point as truechimers.
2703	 */
2704	for (i = 0; i < nlist; i++) {
2705		peers[i].peer->new_status = CTL_PST_SEL_SELCAND;
2706		DPRINTF(2, ("select: survivor %s %f\n",
2707			stoa(&peers[i].peer->srcadr), peers[i].synch));
2708	}
2709
2710	/*
2711	 * Now, vote outlyers off the island by select jitter weighted
2712	 * by root distance. Continue voting as long as there are more
2713	 * than sys_minclock survivors and the select jitter of the peer
2714	 * with the worst metric is greater than the minimum peer
2715	 * jitter. Stop if we are about to discard a TRUE or PREFER
2716	 * peer, who of course have the immunity idol.
2717	 */
2718	while (1) {
2719		d = 1e9;
2720		e = -1e9;
2721		g = 0;
2722		k = 0;
2723		for (i = 0; i < nlist; i++) {
2724			if (peers[i].error < d)
2725				d = peers[i].error;
2726			peers[i].seljit = 0;
2727			if (nlist > 1) {
2728				f = 0;
2729				for (j = 0; j < nlist; j++)
2730					f += DIFF(peers[j].peer->offset,
2731					    peers[i].peer->offset);
2732				peers[i].seljit = SQRT(f / (nlist - 1));
2733			}
2734			if (peers[i].seljit * peers[i].synch > e) {
2735				g = peers[i].seljit;
2736				e = peers[i].seljit * peers[i].synch;
2737				k = i;
2738			}
2739		}
2740		g = max(g, LOGTOD(sys_precision));
2741		if (nlist <= max(1, sys_minclock) || g <= d ||
2742		    ((FLAG_TRUE | FLAG_PREFER) & peers[k].peer->flags))
2743			break;
2744
2745		DPRINTF(3, ("select: drop %s seljit %.6f jit %.6f\n",
2746			ntoa(&peers[k].peer->srcadr), g, d));
2747		if (nlist > sys_maxclock)
2748			peers[k].peer->new_status = CTL_PST_SEL_EXCESS;
2749		for (j = k + 1; j < nlist; j++)
2750			peers[j - 1] = peers[j];
2751		nlist--;
2752	}
2753
2754	/*
2755	 * What remains is a list usually not greater than sys_minclock
2756	 * peers. Note that unsynchronized peers cannot survive this
2757	 * far.  Count and mark these survivors.
2758	 *
2759	 * While at it, count the number of leap warning bits found.
2760	 * This will be used later to vote the system leap warning bit.
2761	 * If a leap warning bit is found on a reference clock, the vote
2762	 * is always won.
2763	 *
2764	 * Choose the system peer using a hybrid metric composed of the
2765	 * selection jitter scaled by the root distance augmented by
2766	 * stratum scaled by sys_mindisp (.001 by default). The goal of
2767	 * the small stratum factor is to avoid clockhop between a
2768	 * reference clock and a network peer which has a refclock and
2769	 * is using an older ntpd, which does not floor sys_rootdisp at
2770	 * sys_mindisp.
2771	 *
2772	 * In contrast, ntpd 4.2.6 and earlier used stratum primarily
2773	 * in selecting the system peer, using a weight of 1 second of
2774	 * additional root distance per stratum.  This heavy bias is no
2775	 * longer appropriate, as the scaled root distance provides a
2776	 * more rational metric carrying the cumulative error budget.
2777	 */
2778	e = 1e9;
2779	speer = 0;
2780	leap_vote_ins = 0;
2781	leap_vote_del = 0;
2782	for (i = 0; i < nlist; i++) {
2783		peer = peers[i].peer;
2784		peer->unreach = 0;
2785		peer->new_status = CTL_PST_SEL_SYNCCAND;
2786		sys_survivors++;
2787		if (peer->leap == LEAP_ADDSECOND) {
2788			if (peer->flags & FLAG_REFCLOCK)
2789				leap_vote_ins = nlist;
2790			else if (leap_vote_ins < nlist)
2791				leap_vote_ins++;
2792		}
2793		if (peer->leap == LEAP_DELSECOND) {
2794			if (peer->flags & FLAG_REFCLOCK)
2795				leap_vote_del = nlist;
2796			else if (leap_vote_del < nlist)
2797				leap_vote_del++;
2798		}
2799		if (peer->flags & FLAG_PREFER)
2800			sys_prefer = peer;
2801		speermet = peers[i].seljit * peers[i].synch +
2802		    peer->stratum * sys_mindisp;
2803		if (speermet < e) {
2804			e = speermet;
2805			speer = i;
2806		}
2807	}
2808
2809	/*
2810	 * Unless there are at least sys_misane survivors, leave the
2811	 * building dark. Otherwise, do a clockhop dance. Ordinarily,
2812	 * use the selected survivor speer. However, if the current
2813	 * system peer is not speer, stay with the current system peer
2814	 * as long as it doesn't get too old or too ugly.
2815	 */
2816	if (nlist > 0 && nlist >= sys_minsane) {
2817		double	x;
2818
2819		typesystem = peers[speer].peer;
2820		if (osys_peer == NULL || osys_peer == typesystem) {
2821			sys_clockhop = 0;
2822		} else if ((x = fabs(typesystem->offset -
2823		    osys_peer->offset)) < sys_mindisp) {
2824			if (sys_clockhop == 0)
2825				sys_clockhop = sys_mindisp;
2826			else
2827				sys_clockhop *= .5;
2828			DPRINTF(1, ("select: clockhop %d %.6f %.6f\n",
2829				j, x, sys_clockhop));
2830			if (fabs(x) < sys_clockhop)
2831				typesystem = osys_peer;
2832			else
2833				sys_clockhop = 0;
2834		} else {
2835			sys_clockhop = 0;
2836		}
2837	}
2838
2839	/*
2840	 * Mitigation rules of the game. We have the pick of the
2841	 * litter in typesystem if any survivors are left. If
2842	 * there is a prefer peer, use its offset and jitter.
2843	 * Otherwise, use the combined offset and jitter of all kitters.
2844	 */
2845	if (typesystem != NULL) {
2846		if (sys_prefer == NULL) {
2847			typesystem->new_status = CTL_PST_SEL_SYSPEER;
2848			clock_combine(peers, sys_survivors, speer);
2849		} else {
2850			typesystem = sys_prefer;
2851			sys_clockhop = 0;
2852			typesystem->new_status = CTL_PST_SEL_SYSPEER;
2853			sys_offset = typesystem->offset;
2854			sys_jitter = typesystem->jitter;
2855		}
2856		DPRINTF(1, ("select: combine offset %.9f jitter %.9f\n",
2857			sys_offset, sys_jitter));
2858	}
2859#ifdef REFCLOCK
2860	/*
2861	 * If a PPS driver is lit and the combined offset is less than
2862	 * 0.4 s, select the driver as the PPS peer and use its offset
2863	 * and jitter. However, if this is the atom driver, use it only
2864	 * if there is a prefer peer or there are no survivors and none
2865	 * are required.
2866	 */
2867	if (typepps != NULL && fabs(sys_offset) < 0.4 &&
2868	    (typepps->refclktype != REFCLK_ATOM_PPS ||
2869	    (typepps->refclktype == REFCLK_ATOM_PPS && (sys_prefer !=
2870	    NULL || (typesystem == NULL && sys_minsane == 0))))) {
2871		typesystem = typepps;
2872		sys_clockhop = 0;
2873		typesystem->new_status = CTL_PST_SEL_PPS;
2874 		sys_offset = typesystem->offset;
2875		sys_jitter = typesystem->jitter;
2876		DPRINTF(1, ("select: pps offset %.9f jitter %.9f\n",
2877			sys_offset, sys_jitter));
2878	}
2879#endif /* REFCLOCK */
2880
2881	/*
2882	 * If there are no survivors at this point, there is no
2883	 * system peer. If so and this is an old update, keep the
2884	 * current statistics, but do not update the clock.
2885	 */
2886	if (typesystem == NULL) {
2887		if (osys_peer != NULL) {
2888			if (sys_orphwait > 0)
2889				orphwait = current_time + sys_orphwait;
2890			report_event(EVNT_NOPEER, NULL, NULL);
2891		}
2892		sys_peer = NULL;
2893		for (peer = peer_list; peer != NULL; peer = peer->p_link)
2894			peer->status = peer->new_status;
2895		return;
2896	}
2897
2898	/*
2899	 * Do not use old data, as this may mess up the clock discipline
2900	 * stability.
2901	 */
2902	if (typesystem->epoch <= sys_epoch)
2903		return;
2904
2905	/*
2906	 * We have found the alpha male. Wind the clock.
2907	 */
2908	if (osys_peer != typesystem)
2909		report_event(PEVNT_NEWPEER, typesystem, NULL);
2910	for (peer = peer_list; peer != NULL; peer = peer->p_link)
2911		peer->status = peer->new_status;
2912	clock_update(typesystem);
2913}
2914
2915
2916static void
2917clock_combine(
2918	peer_select *	peers,	/* survivor list */
2919	int		npeers,	/* number of survivors */
2920	int		syspeer	/* index of sys.peer */
2921	)
2922{
2923	int	i;
2924	double	x, y, z, w;
2925
2926	y = z = w = 0;
2927	for (i = 0; i < npeers; i++) {
2928		x = 1. / peers[i].synch;
2929		y += x;
2930		z += x * peers[i].peer->offset;
2931		w += x * DIFF(peers[i].peer->offset,
2932		    peers[syspeer].peer->offset);
2933	}
2934	sys_offset = z / y;
2935	sys_jitter = SQRT(w / y + SQUARE(peers[syspeer].seljit));
2936}
2937
2938
2939/*
2940 * root_distance - compute synchronization distance from peer to root
2941 */
2942static double
2943root_distance(
2944	struct peer *peer	/* peer structure pointer */
2945	)
2946{
2947	double	dtemp;
2948
2949	/*
2950	 * Root Distance (LAMBDA) is defined as:
2951	 * (delta + DELTA)/2 + epsilon + EPSILON + phi
2952	 *
2953	 * where:
2954	 *  delta   is the round-trip delay
2955	 *  DELTA   is the root delay
2956	 *  epsilon is the remote server precision + local precision
2957	 *	    + (15 usec each second)
2958	 *  EPSILON is the root dispersion
2959	 *  phi     is the peer jitter statistic
2960	 *
2961	 * NB: Think hard about why we are using these values, and what
2962	 * the alternatives are, and the various pros/cons.
2963	 *
2964	 * DLM thinks these are probably the best choices from any of the
2965	 * other worse choices.
2966	 */
2967	dtemp = (peer->delay + peer->rootdelay) / 2
2968		+ LOGTOD(peer->precision)
2969		  + LOGTOD(sys_precision)
2970		  + clock_phi * (current_time - peer->update)
2971		+ peer->rootdisp
2972		+ peer->jitter;
2973	/*
2974	 * Careful squeak here. The value returned must be greater than
2975	 * the minimum root dispersion in order to avoid clockhop with
2976	 * highly precise reference clocks. Note that the root distance
2977	 * cannot exceed the sys_maxdist, as this is the cutoff by the
2978	 * selection algorithm.
2979	 */
2980	if (dtemp < sys_mindisp)
2981		dtemp = sys_mindisp;
2982	return (dtemp);
2983}
2984
2985
2986/*
2987 * peer_xmit - send packet for persistent association.
2988 */
2989static void
2990peer_xmit(
2991	struct peer *peer	/* peer structure pointer */
2992	)
2993{
2994	struct pkt xpkt;	/* transmit packet */
2995	size_t	sendlen, authlen;
2996	keyid_t	xkeyid = 0;	/* transmit key ID */
2997	l_fp	xmt_tx, xmt_ty;
2998
2999	if (!peer->dstadr)	/* drop peers without interface */
3000		return;
3001
3002	xpkt.li_vn_mode = PKT_LI_VN_MODE(sys_leap, peer->version,
3003	    peer->hmode);
3004	xpkt.stratum = STRATUM_TO_PKT(sys_stratum);
3005	xpkt.ppoll = peer->hpoll;
3006	xpkt.precision = sys_precision;
3007	xpkt.refid = sys_refid;
3008	xpkt.rootdelay = HTONS_FP(DTOFP(sys_rootdelay));
3009	xpkt.rootdisp =  HTONS_FP(DTOUFP(sys_rootdisp));
3010	HTONL_FP(&sys_reftime, &xpkt.reftime);
3011	HTONL_FP(&peer->rec, &xpkt.org);
3012	HTONL_FP(&peer->dst, &xpkt.rec);
3013
3014	/*
3015	 * If the received packet contains a MAC, the transmitted packet
3016	 * is authenticated and contains a MAC. If not, the transmitted
3017	 * packet is not authenticated.
3018	 *
3019	 * It is most important when autokey is in use that the local
3020	 * interface IP address be known before the first packet is
3021	 * sent. Otherwise, it is not possible to compute a correct MAC
3022	 * the recipient will accept. Thus, the I/O semantics have to do
3023	 * a little more work. In particular, the wildcard interface
3024	 * might not be usable.
3025	 */
3026	sendlen = LEN_PKT_NOMAC;
3027#ifdef AUTOKEY
3028	if (!(peer->flags & FLAG_SKEY) && peer->keyid == 0) {
3029#else	/* !AUTOKEY follows */
3030	if (peer->keyid == 0) {
3031#endif	/* !AUTOKEY */
3032
3033		/*
3034		 * Transmit a-priori timestamps
3035		 */
3036		get_systime(&xmt_tx);
3037		if (peer->flip == 0) {	/* basic mode */
3038			peer->aorg = xmt_tx;
3039			HTONL_FP(&xmt_tx, &xpkt.xmt);
3040		} else {		/* interleaved modes */
3041			if (peer->hmode == MODE_BROADCAST) { /* bcst */
3042				HTONL_FP(&xmt_tx, &xpkt.xmt);
3043				if (peer->flip > 0)
3044					HTONL_FP(&peer->borg,
3045					    &xpkt.org);
3046				else
3047					HTONL_FP(&peer->aorg,
3048					    &xpkt.org);
3049			} else {	/* symmetric */
3050				if (peer->flip > 0)
3051					HTONL_FP(&peer->borg,
3052					    &xpkt.xmt);
3053				else
3054					HTONL_FP(&peer->aorg,
3055					    &xpkt.xmt);
3056			}
3057		}
3058		peer->t21_bytes = sendlen;
3059		sendpkt(&peer->srcadr, peer->dstadr, sys_ttl[peer->ttl],
3060		    &xpkt, sendlen);
3061		peer->sent++;
3062		peer->throttle += (1 << peer->minpoll) - 2;
3063
3064		/*
3065		 * Capture a-posteriori timestamps
3066		 */
3067		get_systime(&xmt_ty);
3068		if (peer->flip != 0) {		/* interleaved modes */
3069			if (peer->flip > 0)
3070				peer->aorg = xmt_ty;
3071			else
3072				peer->borg = xmt_ty;
3073			peer->flip = -peer->flip;
3074		}
3075		L_SUB(&xmt_ty, &xmt_tx);
3076		LFPTOD(&xmt_ty, peer->xleave);
3077#ifdef DEBUG
3078		if (debug)
3079			printf("transmit: at %ld %s->%s mode %d len %zu\n",
3080		    	    current_time, peer->dstadr ?
3081			    stoa(&peer->dstadr->sin) : "-",
3082		            stoa(&peer->srcadr), peer->hmode, sendlen);
3083#endif
3084		return;
3085	}
3086
3087	/*
3088	 * Authentication is enabled, so the transmitted packet must be
3089	 * authenticated. If autokey is enabled, fuss with the various
3090	 * modes; otherwise, symmetric key cryptography is used.
3091	 */
3092#ifdef AUTOKEY
3093	if (peer->flags & FLAG_SKEY) {
3094		struct exten *exten;	/* extension field */
3095
3096		/*
3097		 * The Public Key Dance (PKD): Cryptographic credentials
3098		 * are contained in extension fields, each including a
3099		 * 4-octet length/code word followed by a 4-octet
3100		 * association ID and optional additional data. Optional
3101		 * data includes a 4-octet data length field followed by
3102		 * the data itself. Request messages are sent from a
3103		 * configured association; response messages can be sent
3104		 * from a configured association or can take the fast
3105		 * path without ever matching an association. Response
3106		 * messages have the same code as the request, but have
3107		 * a response bit and possibly an error bit set. In this
3108		 * implementation, a message may contain no more than
3109		 * one command and one or more responses.
3110		 *
3111		 * Cryptographic session keys include both a public and
3112		 * a private componet. Request and response messages
3113		 * using extension fields are always sent with the
3114		 * private component set to zero. Packets without
3115		 * extension fields indlude the private component when
3116		 * the session key is generated.
3117		 */
3118		while (1) {
3119
3120			/*
3121			 * Allocate and initialize a keylist if not
3122			 * already done. Then, use the list in inverse
3123			 * order, discarding keys once used. Keep the
3124			 * latest key around until the next one, so
3125			 * clients can use client/server packets to
3126			 * compute propagation delay.
3127			 *
3128			 * Note that once a key is used from the list,
3129			 * it is retained in the key cache until the
3130			 * next key is used. This is to allow a client
3131			 * to retrieve the encrypted session key
3132			 * identifier to verify authenticity.
3133			 *
3134			 * If for some reason a key is no longer in the
3135			 * key cache, a birthday has happened or the key
3136			 * has expired, so the pseudo-random sequence is
3137			 * broken. In that case, purge the keylist and
3138			 * regenerate it.
3139			 */
3140			if (peer->keynumber == 0)
3141				make_keylist(peer, peer->dstadr);
3142			else
3143				peer->keynumber--;
3144			xkeyid = peer->keylist[peer->keynumber];
3145			if (authistrusted(xkeyid))
3146				break;
3147			else
3148				key_expire(peer);
3149		}
3150		peer->keyid = xkeyid;
3151		exten = NULL;
3152		switch (peer->hmode) {
3153
3154		/*
3155		 * In broadcast server mode the autokey values are
3156		 * required by the broadcast clients. Push them when a
3157		 * new keylist is generated; otherwise, push the
3158		 * association message so the client can request them at
3159		 * other times.
3160		 */
3161		case MODE_BROADCAST:
3162			if (peer->flags & FLAG_ASSOC)
3163				exten = crypto_args(peer, CRYPTO_AUTO |
3164				    CRYPTO_RESP, peer->associd, NULL);
3165			else
3166				exten = crypto_args(peer, CRYPTO_ASSOC |
3167				    CRYPTO_RESP, peer->associd, NULL);
3168			break;
3169
3170		/*
3171		 * In symmetric modes the parameter, certificate,
3172		 * identity, cookie and autokey exchanges are
3173		 * required. The leapsecond exchange is optional. But, a
3174		 * peer will not believe the other peer until the other
3175		 * peer has synchronized, so the certificate exchange
3176		 * might loop until then. If a peer finds a broken
3177		 * autokey sequence, it uses the autokey exchange to
3178		 * retrieve the autokey values. In any case, if a new
3179		 * keylist is generated, the autokey values are pushed.
3180		 */
3181		case MODE_ACTIVE:
3182		case MODE_PASSIVE:
3183
3184			/*
3185			 * Parameter, certificate and identity.
3186			 */
3187			if (!peer->crypto)
3188				exten = crypto_args(peer, CRYPTO_ASSOC,
3189				    peer->associd, hostval.ptr);
3190			else if (!(peer->crypto & CRYPTO_FLAG_CERT))
3191				exten = crypto_args(peer, CRYPTO_CERT,
3192				    peer->associd, peer->issuer);
3193			else if (!(peer->crypto & CRYPTO_FLAG_VRFY))
3194				exten = crypto_args(peer,
3195				    crypto_ident(peer), peer->associd,
3196				    NULL);
3197
3198			/*
3199			 * Cookie and autokey. We request the cookie
3200			 * only when the this peer and the other peer
3201			 * are synchronized. But, this peer needs the
3202			 * autokey values when the cookie is zero. Any
3203			 * time we regenerate the key list, we offer the
3204			 * autokey values without being asked. If for
3205			 * some reason either peer finds a broken
3206			 * autokey sequence, the autokey exchange is
3207			 * used to retrieve the autokey values.
3208			 */
3209			else if (sys_leap != LEAP_NOTINSYNC &&
3210			    peer->leap != LEAP_NOTINSYNC &&
3211			    !(peer->crypto & CRYPTO_FLAG_COOK))
3212				exten = crypto_args(peer, CRYPTO_COOK,
3213				    peer->associd, NULL);
3214			else if (!(peer->crypto & CRYPTO_FLAG_AUTO))
3215				exten = crypto_args(peer, CRYPTO_AUTO,
3216				    peer->associd, NULL);
3217			else if (peer->flags & FLAG_ASSOC &&
3218			    peer->crypto & CRYPTO_FLAG_SIGN)
3219				exten = crypto_args(peer, CRYPTO_AUTO |
3220				    CRYPTO_RESP, peer->assoc, NULL);
3221
3222			/*
3223			 * Wait for clock sync, then sign the
3224			 * certificate and retrieve the leapsecond
3225			 * values.
3226			 */
3227			else if (sys_leap == LEAP_NOTINSYNC)
3228				break;
3229
3230			else if (!(peer->crypto & CRYPTO_FLAG_SIGN))
3231				exten = crypto_args(peer, CRYPTO_SIGN,
3232				    peer->associd, hostval.ptr);
3233			else if (!(peer->crypto & CRYPTO_FLAG_LEAP))
3234				exten = crypto_args(peer, CRYPTO_LEAP,
3235				    peer->associd, NULL);
3236			break;
3237
3238		/*
3239		 * In client mode the parameter, certificate, identity,
3240		 * cookie and sign exchanges are required. The
3241		 * leapsecond exchange is optional. If broadcast client
3242		 * mode the same exchanges are required, except that the
3243		 * autokey exchange is substitutes for the cookie
3244		 * exchange, since the cookie is always zero. If the
3245		 * broadcast client finds a broken autokey sequence, it
3246		 * uses the autokey exchange to retrieve the autokey
3247		 * values.
3248		 */
3249		case MODE_CLIENT:
3250
3251			/*
3252			 * Parameter, certificate and identity.
3253			 */
3254			if (!peer->crypto)
3255				exten = crypto_args(peer, CRYPTO_ASSOC,
3256				    peer->associd, hostval.ptr);
3257			else if (!(peer->crypto & CRYPTO_FLAG_CERT))
3258				exten = crypto_args(peer, CRYPTO_CERT,
3259				    peer->associd, peer->issuer);
3260			else if (!(peer->crypto & CRYPTO_FLAG_VRFY))
3261				exten = crypto_args(peer,
3262				    crypto_ident(peer), peer->associd,
3263				    NULL);
3264
3265			/*
3266			 * Cookie and autokey. These are requests, but
3267			 * we use the peer association ID with autokey
3268			 * rather than our own.
3269			 */
3270			else if (!(peer->crypto & CRYPTO_FLAG_COOK))
3271				exten = crypto_args(peer, CRYPTO_COOK,
3272				    peer->associd, NULL);
3273			else if (!(peer->crypto & CRYPTO_FLAG_AUTO))
3274				exten = crypto_args(peer, CRYPTO_AUTO,
3275				    peer->assoc, NULL);
3276
3277			/*
3278			 * Wait for clock sync, then sign the
3279			 * certificate and retrieve the leapsecond
3280			 * values.
3281			 */
3282			else if (sys_leap == LEAP_NOTINSYNC)
3283				break;
3284
3285			else if (!(peer->crypto & CRYPTO_FLAG_SIGN))
3286				exten = crypto_args(peer, CRYPTO_SIGN,
3287				    peer->associd, hostval.ptr);
3288			else if (!(peer->crypto & CRYPTO_FLAG_LEAP))
3289				exten = crypto_args(peer, CRYPTO_LEAP,
3290				    peer->associd, NULL);
3291			break;
3292		}
3293
3294		/*
3295		 * Add a queued extension field if present. This is
3296		 * always a request message, so the reply ID is already
3297		 * in the message. If an error occurs, the error bit is
3298		 * lit in the response.
3299		 */
3300		if (peer->cmmd != NULL) {
3301			u_int32 temp32;
3302
3303			temp32 = CRYPTO_RESP;
3304			peer->cmmd->opcode |= htonl(temp32);
3305			sendlen += crypto_xmit(peer, &xpkt, NULL,
3306			    sendlen, peer->cmmd, 0);
3307			free(peer->cmmd);
3308			peer->cmmd = NULL;
3309		}
3310
3311		/*
3312		 * Add an extension field created above. All but the
3313		 * autokey response message are request messages.
3314		 */
3315		if (exten != NULL) {
3316			if (exten->opcode != 0)
3317				sendlen += crypto_xmit(peer, &xpkt,
3318				    NULL, sendlen, exten, 0);
3319			free(exten);
3320		}
3321
3322		/*
3323		 * Calculate the next session key. Since extension
3324		 * fields are present, the cookie value is zero.
3325		 */
3326		if (sendlen > (int)LEN_PKT_NOMAC) {
3327			session_key(&peer->dstadr->sin, &peer->srcadr,
3328			    xkeyid, 0, 2);
3329		}
3330	}
3331#endif	/* AUTOKEY */
3332
3333	/*
3334	 * Transmit a-priori timestamps
3335	 */
3336	get_systime(&xmt_tx);
3337	if (peer->flip == 0) {		/* basic mode */
3338		peer->aorg = xmt_tx;
3339		HTONL_FP(&xmt_tx, &xpkt.xmt);
3340	} else {			/* interleaved modes */
3341		if (peer->hmode == MODE_BROADCAST) { /* bcst */
3342			HTONL_FP(&xmt_tx, &xpkt.xmt);
3343			if (peer->flip > 0)
3344				HTONL_FP(&peer->borg, &xpkt.org);
3345			else
3346				HTONL_FP(&peer->aorg, &xpkt.org);
3347		} else {		/* symmetric */
3348			if (peer->flip > 0)
3349				HTONL_FP(&peer->borg, &xpkt.xmt);
3350			else
3351				HTONL_FP(&peer->aorg, &xpkt.xmt);
3352		}
3353	}
3354	xkeyid = peer->keyid;
3355	authlen = authencrypt(xkeyid, (u_int32 *)&xpkt, sendlen);
3356	if (authlen == 0) {
3357		report_event(PEVNT_AUTH, peer, "no key");
3358		peer->flash |= TEST5;		/* auth error */
3359		peer->badauth++;
3360		return;
3361	}
3362	sendlen += authlen;
3363#ifdef AUTOKEY
3364	if (xkeyid > NTP_MAXKEY)
3365		authtrust(xkeyid, 0);
3366#endif	/* AUTOKEY */
3367	if (sendlen > sizeof(xpkt)) {
3368		msyslog(LOG_ERR, "proto: buffer overflow %zu", sendlen);
3369		exit (-1);
3370	}
3371	peer->t21_bytes = sendlen;
3372	sendpkt(&peer->srcadr, peer->dstadr, sys_ttl[peer->ttl], &xpkt,
3373	    sendlen);
3374	peer->sent++;
3375	peer->throttle += (1 << peer->minpoll) - 2;
3376
3377	/*
3378	 * Capture a-posteriori timestamps
3379	 */
3380	get_systime(&xmt_ty);
3381	if (peer->flip != 0) {			/* interleaved modes */
3382		if (peer->flip > 0)
3383			peer->aorg = xmt_ty;
3384		else
3385			peer->borg = xmt_ty;
3386		peer->flip = -peer->flip;
3387	}
3388	L_SUB(&xmt_ty, &xmt_tx);
3389	LFPTOD(&xmt_ty, peer->xleave);
3390#ifdef AUTOKEY
3391#ifdef DEBUG
3392	if (debug)
3393		printf("transmit: at %ld %s->%s mode %d keyid %08x len %zu index %d\n",
3394		    current_time, latoa(peer->dstadr),
3395		    ntoa(&peer->srcadr), peer->hmode, xkeyid, sendlen,
3396		    peer->keynumber);
3397#endif
3398#else	/* !AUTOKEY follows */
3399#ifdef DEBUG
3400	if (debug)
3401		printf("transmit: at %ld %s->%s mode %d keyid %08x len %d\n",
3402		    current_time, peer->dstadr ?
3403		    ntoa(&peer->dstadr->sin) : "-",
3404		    ntoa(&peer->srcadr), peer->hmode, xkeyid, sendlen);
3405#endif
3406#endif	/* !AUTOKEY */
3407}
3408
3409
3410/*
3411 * fast_xmit - Send packet for nonpersistent association. Note that
3412 * neither the source or destination can be a broadcast address.
3413 */
3414static void
3415fast_xmit(
3416	struct recvbuf *rbufp,	/* receive packet pointer */
3417	int	xmode,		/* receive mode */
3418	keyid_t	xkeyid,		/* transmit key ID */
3419	int	flags		/* restrict mask */
3420	)
3421{
3422	struct pkt xpkt;	/* transmit packet structure */
3423	struct pkt *rpkt;	/* receive packet structure */
3424	l_fp	xmt_tx, xmt_ty;
3425	int	sendlen;
3426#ifdef AUTOKEY
3427	u_int32	temp32;
3428#endif
3429
3430	/*
3431	 * Initialize transmit packet header fields from the receive
3432	 * buffer provided. We leave the fields intact as received, but
3433	 * set the peer poll at the maximum of the receive peer poll and
3434	 * the system minimum poll (ntp_minpoll). This is for KoD rate
3435	 * control and not strictly specification compliant, but doesn't
3436	 * break anything.
3437	 *
3438	 * If the gazinta was from a multicast address, the gazoutta
3439	 * must go out another way.
3440	 */
3441	rpkt = &rbufp->recv_pkt;
3442	if (rbufp->dstadr->flags & INT_MCASTOPEN)
3443		rbufp->dstadr = findinterface(&rbufp->recv_srcadr);
3444
3445	/*
3446	 * If this is a kiss-o'-death (KoD) packet, show leap
3447	 * unsynchronized, stratum zero, reference ID the four-character
3448	 * kiss code and system root delay. Note we don't reveal the
3449	 * local time, so these packets can't be used for
3450	 * synchronization.
3451	 */
3452	if (flags & RES_KOD) {
3453		sys_kodsent++;
3454		xpkt.li_vn_mode = PKT_LI_VN_MODE(LEAP_NOTINSYNC,
3455		    PKT_VERSION(rpkt->li_vn_mode), xmode);
3456		xpkt.stratum = STRATUM_PKT_UNSPEC;
3457		xpkt.ppoll = max(rpkt->ppoll, ntp_minpoll);
3458		xpkt.precision = rpkt->precision;
3459		memcpy(&xpkt.refid, "RATE", 4);
3460		xpkt.rootdelay = rpkt->rootdelay;
3461		xpkt.rootdisp = rpkt->rootdisp;
3462		xpkt.reftime = rpkt->reftime;
3463		xpkt.org = rpkt->xmt;
3464		xpkt.rec = rpkt->xmt;
3465		xpkt.xmt = rpkt->xmt;
3466
3467	/*
3468	 * This is a normal packet. Use the system variables.
3469	 */
3470	} else {
3471		xpkt.li_vn_mode = PKT_LI_VN_MODE(sys_leap,
3472		    PKT_VERSION(rpkt->li_vn_mode), xmode);
3473		xpkt.stratum = STRATUM_TO_PKT(sys_stratum);
3474		xpkt.ppoll = max(rpkt->ppoll, ntp_minpoll);
3475		xpkt.precision = sys_precision;
3476		xpkt.refid = sys_refid;
3477		xpkt.rootdelay = HTONS_FP(DTOFP(sys_rootdelay));
3478		xpkt.rootdisp = HTONS_FP(DTOUFP(sys_rootdisp));
3479		HTONL_FP(&sys_reftime, &xpkt.reftime);
3480		xpkt.org = rpkt->xmt;
3481		HTONL_FP(&rbufp->recv_time, &xpkt.rec);
3482		get_systime(&xmt_tx);
3483		HTONL_FP(&xmt_tx, &xpkt.xmt);
3484	}
3485
3486#ifdef HAVE_NTP_SIGND
3487	if (flags & RES_MSSNTP) {
3488		send_via_ntp_signd(rbufp, xmode, xkeyid, flags, &xpkt);
3489		return;
3490	}
3491#endif /* HAVE_NTP_SIGND */
3492
3493	/*
3494	 * If the received packet contains a MAC, the transmitted packet
3495	 * is authenticated and contains a MAC. If not, the transmitted
3496	 * packet is not authenticated.
3497	 */
3498	sendlen = LEN_PKT_NOMAC;
3499	if (rbufp->recv_length == sendlen) {
3500		sendpkt(&rbufp->recv_srcadr, rbufp->dstadr, 0, &xpkt,
3501		    sendlen);
3502#ifdef DEBUG
3503		if (debug)
3504			printf(
3505			    "transmit: at %ld %s->%s mode %d len %d\n",
3506			    current_time, stoa(&rbufp->dstadr->sin),
3507			    stoa(&rbufp->recv_srcadr), xmode, sendlen);
3508#endif
3509		return;
3510	}
3511
3512	/*
3513	 * The received packet contains a MAC, so the transmitted packet
3514	 * must be authenticated. For symmetric key cryptography, use
3515	 * the predefined and trusted symmetric keys to generate the
3516	 * cryptosum. For autokey cryptography, use the server private
3517	 * value to generate the cookie, which is unique for every
3518	 * source-destination-key ID combination.
3519	 */
3520#ifdef AUTOKEY
3521	if (xkeyid > NTP_MAXKEY) {
3522		keyid_t cookie;
3523
3524		/*
3525		 * The only way to get here is a reply to a legitimate
3526		 * client request message, so the mode must be
3527		 * MODE_SERVER. If an extension field is present, there
3528		 * can be only one and that must be a command. Do what
3529		 * needs, but with private value of zero so the poor
3530		 * jerk can decode it. If no extension field is present,
3531		 * use the cookie to generate the session key.
3532		 */
3533		cookie = session_key(&rbufp->recv_srcadr,
3534		    &rbufp->dstadr->sin, 0, sys_private, 0);
3535		if (rbufp->recv_length > sendlen + (int)MAX_MAC_LEN) {
3536			session_key(&rbufp->dstadr->sin,
3537			    &rbufp->recv_srcadr, xkeyid, 0, 2);
3538			temp32 = CRYPTO_RESP;
3539			rpkt->exten[0] |= htonl(temp32);
3540			sendlen += crypto_xmit(NULL, &xpkt, rbufp,
3541			    sendlen, (struct exten *)rpkt->exten,
3542			    cookie);
3543		} else {
3544			session_key(&rbufp->dstadr->sin,
3545			    &rbufp->recv_srcadr, xkeyid, cookie, 2);
3546		}
3547	}
3548#endif	/* AUTOKEY */
3549	get_systime(&xmt_tx);
3550	sendlen += authencrypt(xkeyid, (u_int32 *)&xpkt, sendlen);
3551#ifdef AUTOKEY
3552	if (xkeyid > NTP_MAXKEY)
3553		authtrust(xkeyid, 0);
3554#endif	/* AUTOKEY */
3555	sendpkt(&rbufp->recv_srcadr, rbufp->dstadr, 0, &xpkt, sendlen);
3556	get_systime(&xmt_ty);
3557	L_SUB(&xmt_ty, &xmt_tx);
3558	sys_authdelay = xmt_ty;
3559#ifdef DEBUG
3560	if (debug)
3561		printf(
3562		    "transmit: at %ld %s->%s mode %d keyid %08x len %d\n",
3563		    current_time, ntoa(&rbufp->dstadr->sin),
3564		    ntoa(&rbufp->recv_srcadr), xmode, xkeyid, sendlen);
3565#endif
3566}
3567
3568
3569/*
3570 * pool_xmit - resolve hostname or send unicast solicitation for pool.
3571 */
3572static void
3573pool_xmit(
3574	struct peer *pool	/* pool solicitor association */
3575	)
3576{
3577#ifdef WORKER
3578	struct pkt		xpkt;	/* transmit packet structure */
3579	struct addrinfo		hints;
3580	int			rc;
3581	struct interface *	lcladr;
3582	sockaddr_u *		rmtadr;
3583	int			restrict_mask;
3584	struct peer *		p;
3585	l_fp			xmt_tx;
3586
3587	if (NULL == pool->ai) {
3588		if (pool->addrs != NULL) {
3589			/* free() is used with copy_addrinfo_list() */
3590			free(pool->addrs);
3591			pool->addrs = NULL;
3592		}
3593		ZERO(hints);
3594		hints.ai_family = AF(&pool->srcadr);
3595		hints.ai_socktype = SOCK_DGRAM;
3596		hints.ai_protocol = IPPROTO_UDP;
3597		/* ignore getaddrinfo_sometime() errors, we will retry */
3598		rc = getaddrinfo_sometime(
3599			pool->hostname,
3600			"ntp",
3601			&hints,
3602			0,			/* no retry */
3603			&pool_name_resolved,
3604			(void *)(intptr_t)pool->associd);
3605		if (!rc)
3606			DPRINTF(1, ("pool DNS lookup %s started\n",
3607				pool->hostname));
3608		else
3609			msyslog(LOG_ERR,
3610				"unable to start pool DNS %s %m",
3611				pool->hostname);
3612		return;
3613	}
3614
3615	do {
3616		/* copy_addrinfo_list ai_addr points to a sockaddr_u */
3617		rmtadr = (sockaddr_u *)(void *)pool->ai->ai_addr;
3618		pool->ai = pool->ai->ai_next;
3619		p = findexistingpeer(rmtadr, NULL, NULL, MODE_CLIENT, 0);
3620	} while (p != NULL && pool->ai != NULL);
3621	if (p != NULL)
3622		return;	/* out of addresses, re-query DNS next poll */
3623	restrict_mask = restrictions(rmtadr);
3624	if (RES_FLAGS & restrict_mask)
3625		restrict_source(rmtadr, 0,
3626				current_time + POOL_SOLICIT_WINDOW + 1);
3627	lcladr = findinterface(rmtadr);
3628	memset(&xpkt, 0, sizeof(xpkt));
3629	xpkt.li_vn_mode = PKT_LI_VN_MODE(sys_leap, pool->version,
3630					 MODE_CLIENT);
3631	xpkt.stratum = STRATUM_TO_PKT(sys_stratum);
3632	xpkt.ppoll = pool->hpoll;
3633	xpkt.precision = sys_precision;
3634	xpkt.refid = sys_refid;
3635	xpkt.rootdelay = HTONS_FP(DTOFP(sys_rootdelay));
3636	xpkt.rootdisp = HTONS_FP(DTOUFP(sys_rootdisp));
3637	HTONL_FP(&sys_reftime, &xpkt.reftime);
3638	get_systime(&xmt_tx);
3639	pool->aorg = xmt_tx;
3640	HTONL_FP(&xmt_tx, &xpkt.xmt);
3641	sendpkt(rmtadr, lcladr,	sys_ttl[pool->ttl], &xpkt,
3642		LEN_PKT_NOMAC);
3643	pool->sent++;
3644	pool->throttle += (1 << pool->minpoll) - 2;
3645#ifdef DEBUG
3646	if (debug)
3647		printf("transmit: at %ld %s->%s pool\n",
3648		    current_time, latoa(lcladr), stoa(rmtadr));
3649#endif
3650	msyslog(LOG_INFO, "Soliciting pool server %s", stoa(rmtadr));
3651#endif	/* WORKER */
3652}
3653
3654
3655#ifdef AUTOKEY
3656	/*
3657	 * group_test - test if this is the same group
3658	 *
3659	 * host		assoc		return		action
3660	 * none		none		0		mobilize *
3661	 * none		group		0		mobilize *
3662	 * group	none		0		mobilize *
3663	 * group	group		1		mobilize
3664	 * group	different	1		ignore
3665	 * * ignore if notrust
3666	 */
3667int group_test(
3668	char	*grp,
3669	char	*ident
3670	)
3671{
3672	if (grp == NULL)
3673		return (0);
3674
3675	if (strcmp(grp, sys_groupname) == 0)
3676		return (0);
3677
3678	if (ident == NULL)
3679		return (1);
3680
3681	if (strcmp(grp, ident) == 0)
3682		return (0);
3683
3684	return (1);
3685}
3686#endif /* AUTOKEY */
3687
3688#ifdef WORKER
3689void
3690pool_name_resolved(
3691	int			rescode,
3692	int			gai_errno,
3693	void *			context,
3694	const char *		name,
3695	const char *		service,
3696	const struct addrinfo *	hints,
3697	const struct addrinfo *	res
3698	)
3699{
3700	struct peer *	pool;	/* pool solicitor association */
3701	associd_t	assoc;
3702
3703	if (rescode) {
3704		msyslog(LOG_ERR,
3705			"error resolving pool %s: %s (%d)",
3706			name, gai_strerror(rescode), rescode);
3707		return;
3708	}
3709
3710	assoc = (associd_t)(intptr_t)context;
3711	pool = findpeerbyassoc(assoc);
3712	if (NULL == pool) {
3713		msyslog(LOG_ERR,
3714			"Could not find assoc %u for pool DNS %s",
3715			assoc, name);
3716		return;
3717	}
3718	DPRINTF(1, ("pool DNS %s completed\n", name));
3719	pool->addrs = copy_addrinfo_list(res);
3720	pool->ai = pool->addrs;
3721	pool_xmit(pool);
3722
3723}
3724#endif	/* WORKER */
3725
3726
3727#ifdef AUTOKEY
3728/*
3729 * key_expire - purge the key list
3730 */
3731void
3732key_expire(
3733	struct peer *peer	/* peer structure pointer */
3734	)
3735{
3736	int i;
3737
3738	if (peer->keylist != NULL) {
3739		for (i = 0; i <= peer->keynumber; i++)
3740			authtrust(peer->keylist[i], 0);
3741		free(peer->keylist);
3742		peer->keylist = NULL;
3743	}
3744	value_free(&peer->sndval);
3745	peer->keynumber = 0;
3746	peer->flags &= ~FLAG_ASSOC;
3747#ifdef DEBUG
3748	if (debug)
3749		printf("key_expire: at %lu associd %d\n", current_time,
3750		    peer->associd);
3751#endif
3752}
3753#endif	/* AUTOKEY */
3754
3755
3756/*
3757 * local_refid(peer) - check peer refid to avoid selecting peers
3758 *		       currently synced to this ntpd.
3759 */
3760static int
3761local_refid(
3762	struct peer *	p
3763	)
3764{
3765	endpt *	unicast_ep;
3766
3767	if (p->dstadr != NULL && !(INT_MCASTIF & p->dstadr->flags))
3768		unicast_ep = p->dstadr;
3769	else
3770		unicast_ep = findinterface(&p->srcadr);
3771
3772	if (unicast_ep != NULL && p->refid == unicast_ep->addr_refid)
3773		return TRUE;
3774	else
3775		return FALSE;
3776}
3777
3778
3779/*
3780 * Determine if the peer is unfit for synchronization
3781 *
3782 * A peer is unfit for synchronization if
3783 * > TEST10 bad leap or stratum below floor or at or above ceiling
3784 * > TEST11 root distance exceeded for remote peer
3785 * > TEST12 a direct or indirect synchronization loop would form
3786 * > TEST13 unreachable or noselect
3787 */
3788int				/* FALSE if fit, TRUE if unfit */
3789peer_unfit(
3790	struct peer *peer	/* peer structure pointer */
3791	)
3792{
3793	int	rval = 0;
3794
3795	/*
3796	 * A stratum error occurs if (1) the server has never been
3797	 * synchronized, (2) the server stratum is below the floor or
3798	 * greater than or equal to the ceiling.
3799	 */
3800	if (peer->leap == LEAP_NOTINSYNC || peer->stratum < sys_floor ||
3801	    peer->stratum >= sys_ceiling)
3802		rval |= TEST10;		/* bad synch or stratum */
3803
3804	/*
3805	 * A distance error for a remote peer occurs if the root
3806	 * distance is greater than or equal to the distance threshold
3807	 * plus the increment due to one host poll interval.
3808	 */
3809	if (!(peer->flags & FLAG_REFCLOCK) && root_distance(peer) >=
3810	    sys_maxdist + clock_phi * ULOGTOD(peer->hpoll))
3811		rval |= TEST11;		/* distance exceeded */
3812
3813	/*
3814	 * A loop error occurs if the remote peer is synchronized to the
3815	 * local peer or if the remote peer is synchronized to the same
3816	 * server as the local peer but only if the remote peer is
3817	 * neither a reference clock nor an orphan.
3818	 */
3819	if (peer->stratum > 1 && local_refid(peer))
3820		rval |= TEST12;		/* synchronization loop */
3821
3822	/*
3823	 * An unreachable error occurs if the server is unreachable or
3824	 * the noselect bit is set.
3825	 */
3826	if (!peer->reach || (peer->flags & FLAG_NOSELECT))
3827		rval |= TEST13;		/* unreachable */
3828
3829	peer->flash &= ~PEER_TEST_MASK;
3830	peer->flash |= rval;
3831	return (rval);
3832}
3833
3834
3835/*
3836 * Find the precision of this particular machine
3837 */
3838#define MINSTEP		20e-9	/* minimum clock increment (s) */
3839#define MAXSTEP		1	/* maximum clock increment (s) */
3840#define MINCHANGES	12	/* minimum number of step samples */
3841#define MAXLOOPS	((int)(1. / MINSTEP))	/* avoid infinite loop */
3842
3843/*
3844 * This routine measures the system precision defined as the minimum of
3845 * a sequence of differences between successive readings of the system
3846 * clock. However, if a difference is less than MINSTEP, the clock has
3847 * been read more than once during a clock tick and the difference is
3848 * ignored. We set MINSTEP greater than zero in case something happens
3849 * like a cache miss, and to tolerate underlying system clocks which
3850 * ensure each reading is strictly greater than prior readings while
3851 * using an underlying stepping (not interpolated) clock.
3852 *
3853 * sys_tick and sys_precision represent the time to read the clock for
3854 * systems with high-precision clocks, and the tick interval or step
3855 * size for lower-precision stepping clocks.
3856 *
3857 * This routine also measures the time to read the clock on stepping
3858 * system clocks by counting the number of readings between changes of
3859 * the underlying clock.  With either type of clock, the minimum time
3860 * to read the clock is saved as sys_fuzz, and used to ensure the
3861 * get_systime() readings always increase and are fuzzed below sys_fuzz.
3862 */
3863void
3864measure_precision(void)
3865{
3866	/*
3867	 * With sys_fuzz set to zero, get_systime() fuzzing of low bits
3868	 * is effectively disabled.  trunc_os_clock is FALSE to disable
3869	 * get_ostime() simulation of a low-precision system clock.
3870	 */
3871	set_sys_fuzz(0.);
3872	trunc_os_clock = FALSE;
3873	measured_tick = measure_tick_fuzz();
3874	set_sys_tick_precision(measured_tick);
3875	msyslog(LOG_INFO, "proto: precision = %.3f usec (%d)",
3876		sys_tick * 1e6, sys_precision);
3877	if (sys_fuzz < sys_tick) {
3878		msyslog(LOG_NOTICE, "proto: fuzz beneath %.3f usec",
3879			sys_fuzz * 1e6);
3880	}
3881}
3882
3883
3884/*
3885 * measure_tick_fuzz()
3886 *
3887 * measures the minimum time to read the clock (stored in sys_fuzz)
3888 * and returns the tick, the larger of the minimum increment observed
3889 * between successive clock readings and the time to read the clock.
3890 */
3891double
3892measure_tick_fuzz(void)
3893{
3894	l_fp	minstep;	/* MINSTEP as l_fp */
3895	l_fp	val;		/* current seconds fraction */
3896	l_fp	last;		/* last seconds fraction */
3897	l_fp	ldiff;		/* val - last */
3898	double	tick;		/* computed tick value */
3899	double	diff;
3900	long	repeats;
3901	long	max_repeats;
3902	int	changes;
3903	int	i;		/* log2 precision */
3904
3905	tick = MAXSTEP;
3906	max_repeats = 0;
3907	repeats = 0;
3908	changes = 0;
3909	DTOLFP(MINSTEP, &minstep);
3910	get_systime(&last);
3911	for (i = 0; i < MAXLOOPS && changes < MINCHANGES; i++) {
3912		get_systime(&val);
3913		ldiff = val;
3914		L_SUB(&ldiff, &last);
3915		last = val;
3916		if (L_ISGT(&ldiff, &minstep)) {
3917			max_repeats = max(repeats, max_repeats);
3918			repeats = 0;
3919			changes++;
3920			LFPTOD(&ldiff, diff);
3921			tick = min(diff, tick);
3922		} else {
3923			repeats++;
3924		}
3925	}
3926	if (changes < MINCHANGES) {
3927		msyslog(LOG_ERR, "Fatal error: precision could not be measured (MINSTEP too large?)");
3928		exit(1);
3929	}
3930
3931	if (0 == max_repeats) {
3932		set_sys_fuzz(tick);
3933	} else {
3934		set_sys_fuzz(tick / max_repeats);
3935	}
3936
3937	return tick;
3938}
3939
3940
3941void
3942set_sys_tick_precision(
3943	double tick
3944	)
3945{
3946	int i;
3947
3948	if (tick > 1.) {
3949		msyslog(LOG_ERR,
3950			"unsupported tick %.3f > 1s ignored", tick);
3951		return;
3952	}
3953	if (tick < measured_tick) {
3954		msyslog(LOG_ERR,
3955			"proto: tick %.3f less than measured tick %.3f, ignored",
3956			tick, measured_tick);
3957		return;
3958	} else if (tick > measured_tick) {
3959		trunc_os_clock = TRUE;
3960		msyslog(LOG_NOTICE,
3961			"proto: truncating system clock to multiples of %.9f",
3962			tick);
3963	}
3964	sys_tick = tick;
3965
3966	/*
3967	 * Find the nearest power of two.
3968	 */
3969	for (i = 0; tick <= 1; i--)
3970		tick *= 2;
3971	if (tick - 1 > 1 - tick / 2)
3972		i++;
3973
3974	sys_precision = (s_char)i;
3975}
3976
3977
3978/*
3979 * init_proto - initialize the protocol module's data
3980 */
3981void
3982init_proto(void)
3983{
3984	l_fp	dummy;
3985	int	i;
3986
3987	/*
3988	 * Fill in the sys_* stuff.  Default is don't listen to
3989	 * broadcasting, require authentication.
3990	 */
3991	sys_leap = LEAP_NOTINSYNC;
3992	sys_stratum = STRATUM_UNSPEC;
3993	memcpy(&sys_refid, "INIT", 4);
3994	sys_peer = NULL;
3995	sys_rootdelay = 0;
3996	sys_rootdisp = 0;
3997	L_CLR(&sys_reftime);
3998	sys_jitter = 0;
3999	measure_precision();
4000	get_systime(&dummy);
4001	sys_survivors = 0;
4002	sys_manycastserver = 0;
4003	sys_bclient = 0;
4004	sys_bdelay = 0;
4005	sys_authenticate = 1;
4006	sys_stattime = current_time;
4007	orphwait = current_time + sys_orphwait;
4008	proto_clr_stats();
4009	for (i = 0; i < MAX_TTL; i++) {
4010		sys_ttl[i] = (u_char)((i * 256) / MAX_TTL);
4011		sys_ttlmax = i;
4012	}
4013	hardpps_enable = 0;
4014	stats_control = 1;
4015}
4016
4017
4018/*
4019 * proto_config - configure the protocol module
4020 */
4021void
4022proto_config(
4023	int	item,
4024	u_long	value,
4025	double	dvalue,
4026	sockaddr_u *svalue
4027	)
4028{
4029	/*
4030	 * Figure out what he wants to change, then do it
4031	 */
4032	DPRINTF(2, ("proto_config: code %d value %lu dvalue %lf\n",
4033		    item, value, dvalue));
4034
4035	switch (item) {
4036
4037	/*
4038	 * enable and disable commands - arguments are Boolean.
4039	 */
4040	case PROTO_AUTHENTICATE: /* authentication (auth) */
4041		sys_authenticate = value;
4042		break;
4043
4044	case PROTO_BROADCLIENT: /* broadcast client (bclient) */
4045		sys_bclient = (int)value;
4046		if (sys_bclient == 0)
4047			io_unsetbclient();
4048		else
4049			io_setbclient();
4050		break;
4051
4052#ifdef REFCLOCK
4053	case PROTO_CAL:		/* refclock calibrate (calibrate) */
4054		cal_enable = value;
4055		break;
4056#endif /* REFCLOCK */
4057
4058	case PROTO_KERNEL:	/* kernel discipline (kernel) */
4059		select_loop(value);
4060		break;
4061
4062	case PROTO_MONITOR:	/* monitoring (monitor) */
4063		if (value)
4064			mon_start(MON_ON);
4065		else
4066			mon_stop(MON_ON);
4067		break;
4068
4069	case PROTO_NTP:		/* NTP discipline (ntp) */
4070		ntp_enable = value;
4071		break;
4072
4073	case PROTO_MODE7:	/* mode7 management (ntpdc) */
4074		ntp_mode7 = value;
4075		break;
4076
4077	case PROTO_PPS:		/* PPS discipline (pps) */
4078		hardpps_enable = value;
4079		break;
4080
4081	case PROTO_FILEGEN:	/* statistics (stats) */
4082		stats_control = value;
4083		break;
4084
4085	/*
4086	 * tos command - arguments are double, sometimes cast to int
4087	 */
4088	case PROTO_BEACON:	/* manycast beacon (beacon) */
4089		sys_beacon = (int)dvalue;
4090		break;
4091
4092	case PROTO_BROADDELAY:	/* default broadcast delay (bdelay) */
4093		sys_bdelay = dvalue;
4094		break;
4095
4096	case PROTO_CEILING:	/* stratum ceiling (ceiling) */
4097		sys_ceiling = (int)dvalue;
4098		break;
4099
4100	case PROTO_COHORT:	/* cohort switch (cohort) */
4101		sys_cohort = (int)dvalue;
4102		break;
4103
4104	case PROTO_FLOOR:	/* stratum floor (floor) */
4105		sys_floor = (int)dvalue;
4106		break;
4107
4108	case PROTO_MAXCLOCK:	/* maximum candidates (maxclock) */
4109		sys_maxclock = (int)dvalue;
4110		break;
4111
4112	case PROTO_MAXDIST:	/* select threshold (maxdist) */
4113		sys_maxdist = dvalue;
4114		break;
4115
4116	case PROTO_CALLDELAY:	/* modem call delay (mdelay) */
4117		break;		/* NOT USED */
4118
4119	case PROTO_MINCLOCK:	/* minimum candidates (minclock) */
4120		sys_minclock = (int)dvalue;
4121		break;
4122
4123	case PROTO_MINDISP:	/* minimum distance (mindist) */
4124		sys_mindisp = dvalue;
4125		break;
4126
4127	case PROTO_MINSANE:	/* minimum survivors (minsane) */
4128		sys_minsane = (int)dvalue;
4129		break;
4130
4131	case PROTO_ORPHAN:	/* orphan stratum (orphan) */
4132		sys_orphan = (int)dvalue;
4133		break;
4134
4135	case PROTO_ORPHWAIT:	/* orphan wait (orphwait) */
4136		orphwait -= sys_orphwait;
4137		sys_orphwait = (int)dvalue;
4138		orphwait += sys_orphwait;
4139		break;
4140
4141	/*
4142	 * Miscellaneous commands
4143	 */
4144	case PROTO_MULTICAST_ADD: /* add group address */
4145		if (svalue != NULL)
4146			io_multicast_add(svalue);
4147		sys_bclient = 1;
4148		break;
4149
4150	case PROTO_MULTICAST_DEL: /* delete group address */
4151		if (svalue != NULL)
4152			io_multicast_del(svalue);
4153		break;
4154
4155	default:
4156		msyslog(LOG_NOTICE,
4157		    "proto: unsupported option %d", item);
4158	}
4159}
4160
4161
4162/*
4163 * proto_clr_stats - clear protocol stat counters
4164 */
4165void
4166proto_clr_stats(void)
4167{
4168	sys_stattime = current_time;
4169	sys_received = 0;
4170	sys_processed = 0;
4171	sys_newversion = 0;
4172	sys_oldversion = 0;
4173	sys_declined = 0;
4174	sys_restricted = 0;
4175	sys_badlength = 0;
4176	sys_badauth = 0;
4177	sys_limitrejected = 0;
4178	sys_kodsent = 0;
4179}
4180