ntp.c 12.2 KB
Newer Older
1 2 3 4 5 6 7
/*
 * NTP state machine interfaces and logic.
 *
 * This code was mainly moved from kernel/timer.c and kernel/time.c
 * Please see those files for relevant copyright info and historical
 * changelogs.
 */
A
Alexey Dobriyan 已提交
8
#include <linux/capability.h>
R
Roman Zippel 已提交
9
#include <linux/clocksource.h>
10
#include <linux/workqueue.h>
11 12 13 14 15 16
#include <linux/hrtimer.h>
#include <linux/jiffies.h>
#include <linux/math64.h>
#include <linux/timex.h>
#include <linux/time.h>
#include <linux/mm.h>
17

18
/*
19
 * NTP timekeeping variables:
20 21
 */

22 23 24 25 26
/* USER_HZ period (usecs): */
unsigned long			tick_usec = TICK_USEC;

/* ACTHZ period (nsecs): */
unsigned long			tick_nsec;
R
Roman Zippel 已提交
27

28 29 30 31 32
u64				tick_length;
static u64			tick_length_base;

static struct hrtimer		leap_timer;

33
#define MAX_TICKADJ		500LL		/* usecs */
34
#define MAX_TICKADJ_SCALED \
35
	(((MAX_TICKADJ * NSEC_PER_USEC) << NTP_SCALE_SHIFT) / NTP_INTERVAL_FREQ)
36 37 38 39

/*
 * phase-lock loop variables
 */
40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78

/*
 * clock synchronization status
 *
 * (TIME_ERROR prevents overwriting the CMOS clock)
 */
static int			time_state = TIME_OK;

/* clock status bits:							*/
int				time_status = STA_UNSYNC;

/* TAI offset (secs):							*/
static long			time_tai;

/* time adjustment (nsecs):						*/
static s64			time_offset;

/* pll time constant:							*/
static long			time_constant = 2;

/* maximum error (usecs):						*/
long				time_maxerror = NTP_PHASE_LIMIT;

/* estimated error (usecs):						*/
long				time_esterror = NTP_PHASE_LIMIT;

/* frequency offset (scaled nsecs/secs):				*/
static s64			time_freq;

/* time at last adjustment (secs):					*/
static long			time_reftime;

long				time_adjust;

static long			ntp_tick_adj;

/*
 * NTP methods:
 */
79

80 81 82 83
/*
 * Update (tick_length, tick_length_base, tick_nsec), based
 * on (tick_usec, ntp_tick_adj, time_freq):
 */
84 85
static void ntp_update_frequency(void)
{
86
	u64 second_length;
87
	u64 new_base;
88 89 90 91 92 93

	second_length		 = (u64)(tick_usec * NSEC_PER_USEC * USER_HZ)
						<< NTP_SCALE_SHIFT;

	second_length		+= (s64)ntp_tick_adj << NTP_SCALE_SHIFT;
	second_length		+= time_freq;
94

95
	tick_nsec		 = div_u64(second_length, HZ) >> NTP_SCALE_SHIFT;
96
	new_base		 = div_u64(second_length, NTP_INTERVAL_FREQ);
97 98 99

	/*
	 * Don't wait for the next second_overflow, apply
100
	 * the change to the tick length immediately:
101
	 */
102 103
	tick_length		+= new_base - tick_length_base;
	tick_length_base	 = new_base;
104 105
}

106
static inline s64 ntp_update_offset_fll(s64 offset64, long secs)
107 108 109 110
{
	time_status &= ~STA_MODE;

	if (secs < MINSEC)
111
		return 0;
112 113

	if (!(time_status & STA_FLL) && (secs <= MAXSEC))
114
		return 0;
115 116 117

	time_status |= STA_MODE;

118
	return div_s64(offset64 << (NTP_SCALE_SHIFT - SHIFT_FLL), secs);
119 120
}

R
Roman Zippel 已提交
121 122 123
static void ntp_update_offset(long offset)
{
	s64 freq_adj;
124 125
	s64 offset64;
	long secs;
R
Roman Zippel 已提交
126 127 128 129

	if (!(time_status & STA_PLL))
		return;

R
Roman Zippel 已提交
130
	if (!(time_status & STA_NANO))
131
		offset *= NSEC_PER_USEC;
R
Roman Zippel 已提交
132 133 134 135 136

	/*
	 * Scale the phase adjustment and
	 * clamp to the operating range.
	 */
137 138
	offset = min(offset, MAXPHASE);
	offset = max(offset, -MAXPHASE);
R
Roman Zippel 已提交
139 140 141 142 143

	/*
	 * Select how the frequency is to be controlled
	 * and in which mode (PLL or FLL).
	 */
144
	secs = xtime.tv_sec - time_reftime;
145
	if (unlikely(time_status & STA_FREQHOLD))
146 147
		secs = 0;

R
Roman Zippel 已提交
148 149
	time_reftime = xtime.tv_sec;

150 151 152 153
	offset64    = offset;
	freq_adj    = (offset64 * secs) <<
			(NTP_SCALE_SHIFT - 2 * (SHIFT_PLL + 2 + time_constant));

154
	freq_adj    += ntp_update_offset_fll(offset64, secs);
155 156 157 158 159 160

	freq_adj    = min(freq_adj + time_freq, MAXFREQ_SCALED);

	time_freq   = max(freq_adj, -MAXFREQ_SCALED);

	time_offset = div_s64(offset64 << NTP_SCALE_SHIFT, NTP_INTERVAL_FREQ);
R
Roman Zippel 已提交
161 162
}

163 164 165 166 167 168 169
/**
 * ntp_clear - Clears the NTP state variables
 *
 * Must be called while holding a write on the xtime_lock
 */
void ntp_clear(void)
{
170 171 172 173
	time_adjust	= 0;		/* stop active adjtime() */
	time_status	|= STA_UNSYNC;
	time_maxerror	= NTP_PHASE_LIMIT;
	time_esterror	= NTP_PHASE_LIMIT;
174 175 176

	ntp_update_frequency();

177 178
	tick_length	= tick_length_base;
	time_offset	= 0;
179 180
}

181
/*
R
Roman Zippel 已提交
182 183 184
 * Leap second processing. If in leap-insert state at the end of the
 * day, the system clock is set back one second; if in leap-delete
 * state, the system clock is set ahead one second.
185
 */
R
Roman Zippel 已提交
186
static enum hrtimer_restart ntp_leap_second(struct hrtimer *timer)
187
{
R
Roman Zippel 已提交
188
	enum hrtimer_restart res = HRTIMER_NORESTART;
189

190
	write_seqlock(&xtime_lock);
191 192 193 194 195

	switch (time_state) {
	case TIME_OK:
		break;
	case TIME_INS:
R
Roman Zippel 已提交
196 197 198
		xtime.tv_sec--;
		wall_to_monotonic.tv_sec++;
		time_state = TIME_OOP;
199 200
		printk(KERN_NOTICE
			"Clock: inserting leap second 23:59:60 UTC\n");
201
		hrtimer_add_expires_ns(&leap_timer, NSEC_PER_SEC);
R
Roman Zippel 已提交
202
		res = HRTIMER_RESTART;
203 204
		break;
	case TIME_DEL:
R
Roman Zippel 已提交
205 206 207 208
		xtime.tv_sec++;
		time_tai--;
		wall_to_monotonic.tv_sec--;
		time_state = TIME_WAIT;
209 210
		printk(KERN_NOTICE
			"Clock: deleting leap second 23:59:59 UTC\n");
211 212
		break;
	case TIME_OOP:
R
Roman Zippel 已提交
213
		time_tai++;
214
		time_state = TIME_WAIT;
R
Roman Zippel 已提交
215
		/* fall through */
216 217
	case TIME_WAIT:
		if (!(time_status & (STA_INS | STA_DEL)))
R
Roman Zippel 已提交
218
			time_state = TIME_OK;
R
Roman Zippel 已提交
219 220 221 222
		break;
	}
	update_vsyscall(&xtime, clock);

223
	write_sequnlock(&xtime_lock);
R
Roman Zippel 已提交
224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244

	return res;
}

/*
 * this routine handles the overflow of the microsecond field
 *
 * The tricky bits of code to handle the accurate clock support
 * were provided by Dave Mills (Mills@UDEL.EDU) of NTP fame.
 * They were originally developed for SUN and DEC kernels.
 * All the kudos should go to Dave for this stuff.
 */
void second_overflow(void)
{
	s64 time_adj;

	/* Bump the maxerror field */
	time_maxerror += MAXFREQ / NSEC_PER_USEC;
	if (time_maxerror > NTP_PHASE_LIMIT) {
		time_maxerror = NTP_PHASE_LIMIT;
		time_status |= STA_UNSYNC;
245 246 247
	}

	/*
248 249
	 * Compute the phase adjustment for the next second. The offset is
	 * reduced by a fixed factor times the time constant.
250
	 */
251 252 253 254
	tick_length	= tick_length_base;
	time_adj	= shift_right(time_offset, SHIFT_PLL + time_constant);
	time_offset	-= time_adj;
	tick_length	+= time_adj;
255

256 257 258 259 260 261 262
	if (!time_adjust)
		return;

	if (time_adjust > MAX_TICKADJ) {
		time_adjust -= MAX_TICKADJ;
		tick_length += MAX_TICKADJ_SCALED;
		return;
263
	}
264 265 266 267 268 269 270 271 272 273

	if (time_adjust < -MAX_TICKADJ) {
		time_adjust += MAX_TICKADJ;
		tick_length -= MAX_TICKADJ_SCALED;
		return;
	}

	tick_length += (s64)(time_adjust * NSEC_PER_USEC / NTP_INTERVAL_FREQ)
							 << NTP_SCALE_SHIFT;
	time_adjust = 0;
274 275
}

276
#ifdef CONFIG_GENERIC_CMOS_UPDATE
277

278 279 280
/* Disable the cmos update - used by virtualization and embedded */
int no_sync_cmos_clock  __read_mostly;

281
static void sync_cmos_clock(struct work_struct *work);
282

283
static DECLARE_DELAYED_WORK(sync_cmos_work, sync_cmos_clock);
284

285
static void sync_cmos_clock(struct work_struct *work)
286 287 288 289 290 291 292 293 294 295 296
{
	struct timespec now, next;
	int fail = 1;

	/*
	 * If we have an externally synchronized Linux clock, then update
	 * CMOS clock accordingly every ~11 minutes. Set_rtc_mmss() has to be
	 * called as close as possible to 500 ms before the new second starts.
	 * This code is run on a timer.  If the clock is set, that timer
	 * may not expire at the correct time.  Thus, we adjust...
	 */
297
	if (!ntp_synced()) {
298 299 300 301 302
		/*
		 * Not synced, exit, do not restart a timer (if one is
		 * running, let it run out).
		 */
		return;
303
	}
304 305

	getnstimeofday(&now);
306
	if (abs(now.tv_nsec - (NSEC_PER_SEC / 2)) <= tick_nsec / 2)
307 308
		fail = update_persistent_clock(now);

309
	next.tv_nsec = (NSEC_PER_SEC / 2) - now.tv_nsec - (TICK_NSEC / 2);
310 311 312 313 314 315 316 317 318 319 320 321
	if (next.tv_nsec <= 0)
		next.tv_nsec += NSEC_PER_SEC;

	if (!fail)
		next.tv_sec = 659;
	else
		next.tv_sec = 0;

	if (next.tv_nsec >= NSEC_PER_SEC) {
		next.tv_sec++;
		next.tv_nsec -= NSEC_PER_SEC;
	}
322
	schedule_delayed_work(&sync_cmos_work, timespec_to_jiffies(&next));
323 324 325
}

static void notify_cmos_timer(void)
326
{
327
	if (!no_sync_cmos_clock)
328
		schedule_delayed_work(&sync_cmos_work, 0);
329 330
}

331 332 333 334
#else
static inline void notify_cmos_timer(void) { }
#endif

335 336
/*
 * adjtimex mainly allows reading (and writing, if superuser) of
337 338 339 340
 * kernel time-keeping variables. used by xntpd.
 */
int do_adjtimex(struct timex *txc)
{
R
Roman Zippel 已提交
341
	struct timespec ts;
342 343
	int result;

344 345
	/* Validate the data before disabling interrupts */
	if (txc->modes & ADJ_ADJTIME) {
R
Roman Zippel 已提交
346
		/* singleshot must not be used with any other mode bits */
347
		if (!(txc->modes & ADJ_OFFSET_SINGLESHOT))
348
			return -EINVAL;
349 350 351 352 353 354 355 356
		if (!(txc->modes & ADJ_OFFSET_READONLY) &&
		    !capable(CAP_SYS_TIME))
			return -EPERM;
	} else {
		/* In order to modify anything, you gotta be super-user! */
		 if (txc->modes && !capable(CAP_SYS_TIME))
			return -EPERM;

357 358 359 360
		/*
		 * if the quartz is off by more than 10% then
		 * something is VERY wrong!
		 */
361 362 363 364 365 366 367
		if (txc->modes & ADJ_TICK &&
		    (txc->tick <  900000/USER_HZ ||
		     txc->tick > 1100000/USER_HZ))
				return -EINVAL;

		if (txc->modes & ADJ_STATUS && time_state != TIME_OK)
			hrtimer_cancel(&leap_timer);
J
John Stultz 已提交
368
	}
369

R
Roman Zippel 已提交
370 371
	getnstimeofday(&ts);

372 373 374
	write_seqlock_irq(&xtime_lock);

	/* If there are input parameters, then process them */
375 376 377 378 379 380 381 382 383 384 385
	if (txc->modes & ADJ_ADJTIME) {
		long save_adjust = time_adjust;

		if (!(txc->modes & ADJ_OFFSET_READONLY)) {
			/* adjtime() is independent from ntp_adjtime() */
			time_adjust = txc->offset;
			ntp_update_frequency();
		}
		txc->offset = save_adjust;
		goto adj_done;
	}
R
Roman Zippel 已提交
386
	if (txc->modes) {
387 388
		long sec;

R
Roman Zippel 已提交
389 390 391 392 393 394 395 396
		if (txc->modes & ADJ_STATUS) {
			if ((time_status & STA_PLL) &&
			    !(txc->status & STA_PLL)) {
				time_state = TIME_OK;
				time_status = STA_UNSYNC;
			}
			/* only set allowed bits */
			time_status &= STA_RONLY;
397 398 399 400 401 402 403
			/*
			 * If we turn on PLL adjustments then reset the
			 * reference time to current time.
			 */
			if (!(time_status & STA_PLL) && (txc->status & STA_PLL))
				time_reftime = xtime.tv_sec;

R
Roman Zippel 已提交
404
			time_status |= txc->status & ~STA_RONLY;
R
Roman Zippel 已提交
405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432

			switch (time_state) {
			case TIME_OK:
			start_timer:
				sec = ts.tv_sec;
				if (time_status & STA_INS) {
					time_state = TIME_INS;
					sec += 86400 - sec % 86400;
					hrtimer_start(&leap_timer, ktime_set(sec, 0), HRTIMER_MODE_ABS);
				} else if (time_status & STA_DEL) {
					time_state = TIME_DEL;
					sec += 86400 - (sec + 1) % 86400;
					hrtimer_start(&leap_timer, ktime_set(sec, 0), HRTIMER_MODE_ABS);
				}
				break;
			case TIME_INS:
			case TIME_DEL:
				time_state = TIME_OK;
				goto start_timer;
				break;
			case TIME_WAIT:
				if (!(time_status & (STA_INS | STA_DEL)))
					time_state = TIME_OK;
				break;
			case TIME_OOP:
				hrtimer_restart(&leap_timer);
				break;
			}
R
Roman Zippel 已提交
433 434 435 436 437 438
		}

		if (txc->modes & ADJ_NANO)
			time_status |= STA_NANO;
		if (txc->modes & ADJ_MICRO)
			time_status &= ~STA_NANO;
R
Roman Zippel 已提交
439 440

		if (txc->modes & ADJ_FREQUENCY) {
441 442 443
			time_freq = (s64)txc->freq * PPM_SCALE;
			time_freq = min(time_freq, MAXFREQ_SCALED);
			time_freq = max(time_freq, -MAXFREQ_SCALED);
444
		}
R
Roman Zippel 已提交
445

R
Roman Zippel 已提交
446
		if (txc->modes & ADJ_MAXERROR)
R
Roman Zippel 已提交
447
			time_maxerror = txc->maxerror;
R
Roman Zippel 已提交
448
		if (txc->modes & ADJ_ESTERROR)
R
Roman Zippel 已提交
449
			time_esterror = txc->esterror;
450

R
Roman Zippel 已提交
451
		if (txc->modes & ADJ_TIMECONST) {
R
Roman Zippel 已提交
452 453 454 455 456
			time_constant = txc->constant;
			if (!(time_status & STA_NANO))
				time_constant += 4;
			time_constant = min(time_constant, (long)MAXTC);
			time_constant = max(time_constant, 0l);
457 458
		}

R
Roman Zippel 已提交
459 460 461
		if (txc->modes & ADJ_TAI && txc->constant > 0)
			time_tai = txc->constant;

462 463
		if (txc->modes & ADJ_OFFSET)
			ntp_update_offset(txc->offset);
R
Roman Zippel 已提交
464 465 466 467 468 469
		if (txc->modes & ADJ_TICK)
			tick_usec = txc->tick;

		if (txc->modes & (ADJ_TICK|ADJ_FREQUENCY|ADJ_OFFSET))
			ntp_update_frequency();
	}
R
Roman Zippel 已提交
470

471 472 473 474 475 476
	txc->offset = shift_right(time_offset * NTP_INTERVAL_FREQ,
				  NTP_SCALE_SHIFT);
	if (!(time_status & STA_NANO))
		txc->offset /= NSEC_PER_USEC;

adj_done:
R
Roman Zippel 已提交
477
	result = time_state;	/* mostly `TIME_OK' */
R
Roman Zippel 已提交
478
	if (time_status & (STA_UNSYNC|STA_CLOCKERR))
479 480
		result = TIME_ERROR;

481 482
	txc->freq	   = shift_right((time_freq >> PPM_SCALE_INV_SHIFT) *
					 (s64)PPM_SCALE_INV, NTP_SCALE_SHIFT);
483 484 485 486
	txc->maxerror	   = time_maxerror;
	txc->esterror	   = time_esterror;
	txc->status	   = time_status;
	txc->constant	   = time_constant;
487
	txc->precision	   = 1;
488
	txc->tolerance	   = MAXFREQ_SCALED / PPM_SCALE;
489
	txc->tick	   = tick_usec;
R
Roman Zippel 已提交
490
	txc->tai	   = time_tai;
491 492 493 494 495 496 497 498 499 500 501

	/* PPS is not implemented, so these are zero */
	txc->ppsfreq	   = 0;
	txc->jitter	   = 0;
	txc->shift	   = 0;
	txc->stabil	   = 0;
	txc->jitcnt	   = 0;
	txc->calcnt	   = 0;
	txc->errcnt	   = 0;
	txc->stbcnt	   = 0;
	write_sequnlock_irq(&xtime_lock);
R
Roman Zippel 已提交
502

R
Roman Zippel 已提交
503 504 505 506
	txc->time.tv_sec = ts.tv_sec;
	txc->time.tv_usec = ts.tv_nsec;
	if (!(time_status & STA_NANO))
		txc->time.tv_usec /= NSEC_PER_USEC;
R
Roman Zippel 已提交
507

508
	notify_cmos_timer();
R
Roman Zippel 已提交
509 510

	return result;
511
}
512 513 514 515 516 517 518 519

static int __init ntp_tick_adj_setup(char *str)
{
	ntp_tick_adj = simple_strtol(str, NULL, 0);
	return 1;
}

__setup("ntp_tick_adj=", ntp_tick_adj_setup);
R
Roman Zippel 已提交
520 521 522 523 524 525 526

void __init ntp_init(void)
{
	ntp_clear();
	hrtimer_init(&leap_timer, CLOCK_REALTIME, HRTIMER_MODE_ABS);
	leap_timer.function = ntp_leap_second;
}