ntp.c 12.5 KB
Newer Older
1 2 3 4 5 6 7
/*
 * NTP state machine interfaces and logic.
 *
 * This code was mainly moved from kernel/timer.c and kernel/time.c
 * Please see those files for relevant copyright info and historical
 * changelogs.
 */
A
Alexey Dobriyan 已提交
8
#include <linux/capability.h>
R
Roman Zippel 已提交
9
#include <linux/clocksource.h>
10
#include <linux/workqueue.h>
11 12 13 14 15 16
#include <linux/hrtimer.h>
#include <linux/jiffies.h>
#include <linux/math64.h>
#include <linux/timex.h>
#include <linux/time.h>
#include <linux/mm.h>
17

18
/*
19
 * NTP timekeeping variables:
20 21
 */

22 23 24 25 26
/* USER_HZ period (usecs): */
unsigned long			tick_usec = TICK_USEC;

/* ACTHZ period (nsecs): */
unsigned long			tick_nsec;
R
Roman Zippel 已提交
27

28 29 30 31 32
u64				tick_length;
static u64			tick_length_base;

static struct hrtimer		leap_timer;

33
#define MAX_TICKADJ		500LL		/* usecs */
34
#define MAX_TICKADJ_SCALED \
35
	(((MAX_TICKADJ * NSEC_PER_USEC) << NTP_SCALE_SHIFT) / NTP_INTERVAL_FREQ)
36 37 38 39

/*
 * phase-lock loop variables
 */
40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78

/*
 * clock synchronization status
 *
 * (TIME_ERROR prevents overwriting the CMOS clock)
 */
static int			time_state = TIME_OK;

/* clock status bits:							*/
int				time_status = STA_UNSYNC;

/* TAI offset (secs):							*/
static long			time_tai;

/* time adjustment (nsecs):						*/
static s64			time_offset;

/* pll time constant:							*/
static long			time_constant = 2;

/* maximum error (usecs):						*/
long				time_maxerror = NTP_PHASE_LIMIT;

/* estimated error (usecs):						*/
long				time_esterror = NTP_PHASE_LIMIT;

/* frequency offset (scaled nsecs/secs):				*/
static s64			time_freq;

/* time at last adjustment (secs):					*/
static long			time_reftime;

long				time_adjust;

static long			ntp_tick_adj;

/*
 * NTP methods:
 */
79

80 81 82 83
/*
 * Update (tick_length, tick_length_base, tick_nsec), based
 * on (tick_usec, ntp_tick_adj, time_freq):
 */
84 85
static void ntp_update_frequency(void)
{
86
	u64 second_length;
87
	u64 new_base;
88 89 90 91 92 93

	second_length		 = (u64)(tick_usec * NSEC_PER_USEC * USER_HZ)
						<< NTP_SCALE_SHIFT;

	second_length		+= (s64)ntp_tick_adj << NTP_SCALE_SHIFT;
	second_length		+= time_freq;
94

95
	tick_nsec		 = div_u64(second_length, HZ) >> NTP_SCALE_SHIFT;
96
	new_base		 = div_u64(second_length, NTP_INTERVAL_FREQ);
97 98 99

	/*
	 * Don't wait for the next second_overflow, apply
100
	 * the change to the tick length immediately:
101
	 */
102 103
	tick_length		+= new_base - tick_length_base;
	tick_length_base	 = new_base;
104 105
}

106
static inline s64 ntp_update_offset_fll(s64 offset64, long secs)
107 108 109 110
{
	time_status &= ~STA_MODE;

	if (secs < MINSEC)
111
		return 0;
112 113

	if (!(time_status & STA_FLL) && (secs <= MAXSEC))
114
		return 0;
115 116 117

	time_status |= STA_MODE;

118
	return div_s64(offset64 << (NTP_SCALE_SHIFT - SHIFT_FLL), secs);
119 120
}

R
Roman Zippel 已提交
121 122 123
static void ntp_update_offset(long offset)
{
	s64 freq_adj;
124 125
	s64 offset64;
	long secs;
R
Roman Zippel 已提交
126 127 128 129

	if (!(time_status & STA_PLL))
		return;

R
Roman Zippel 已提交
130
	if (!(time_status & STA_NANO))
131
		offset *= NSEC_PER_USEC;
R
Roman Zippel 已提交
132 133 134 135 136

	/*
	 * Scale the phase adjustment and
	 * clamp to the operating range.
	 */
137 138
	offset = min(offset, MAXPHASE);
	offset = max(offset, -MAXPHASE);
R
Roman Zippel 已提交
139 140 141 142 143

	/*
	 * Select how the frequency is to be controlled
	 * and in which mode (PLL or FLL).
	 */
144
	secs = xtime.tv_sec - time_reftime;
145
	if (unlikely(time_status & STA_FREQHOLD))
146 147
		secs = 0;

R
Roman Zippel 已提交
148 149
	time_reftime = xtime.tv_sec;

150 151 152 153
	offset64    = offset;
	freq_adj    = (offset64 * secs) <<
			(NTP_SCALE_SHIFT - 2 * (SHIFT_PLL + 2 + time_constant));

154
	freq_adj    += ntp_update_offset_fll(offset64, secs);
155 156 157 158 159 160

	freq_adj    = min(freq_adj + time_freq, MAXFREQ_SCALED);

	time_freq   = max(freq_adj, -MAXFREQ_SCALED);

	time_offset = div_s64(offset64 << NTP_SCALE_SHIFT, NTP_INTERVAL_FREQ);
R
Roman Zippel 已提交
161 162
}

163 164 165 166 167 168 169
/**
 * ntp_clear - Clears the NTP state variables
 *
 * Must be called while holding a write on the xtime_lock
 */
void ntp_clear(void)
{
170 171 172 173
	time_adjust	= 0;		/* stop active adjtime() */
	time_status	|= STA_UNSYNC;
	time_maxerror	= NTP_PHASE_LIMIT;
	time_esterror	= NTP_PHASE_LIMIT;
174 175 176

	ntp_update_frequency();

177 178
	tick_length	= tick_length_base;
	time_offset	= 0;
179 180
}

181
/*
R
Roman Zippel 已提交
182 183 184
 * Leap second processing. If in leap-insert state at the end of the
 * day, the system clock is set back one second; if in leap-delete
 * state, the system clock is set ahead one second.
185
 */
R
Roman Zippel 已提交
186
static enum hrtimer_restart ntp_leap_second(struct hrtimer *timer)
187
{
R
Roman Zippel 已提交
188
	enum hrtimer_restart res = HRTIMER_NORESTART;
189

190
	write_seqlock(&xtime_lock);
191 192 193 194 195

	switch (time_state) {
	case TIME_OK:
		break;
	case TIME_INS:
R
Roman Zippel 已提交
196 197 198
		xtime.tv_sec--;
		wall_to_monotonic.tv_sec++;
		time_state = TIME_OOP;
199 200
		printk(KERN_NOTICE
			"Clock: inserting leap second 23:59:60 UTC\n");
201
		hrtimer_add_expires_ns(&leap_timer, NSEC_PER_SEC);
R
Roman Zippel 已提交
202
		res = HRTIMER_RESTART;
203 204
		break;
	case TIME_DEL:
R
Roman Zippel 已提交
205 206 207 208
		xtime.tv_sec++;
		time_tai--;
		wall_to_monotonic.tv_sec--;
		time_state = TIME_WAIT;
209 210
		printk(KERN_NOTICE
			"Clock: deleting leap second 23:59:59 UTC\n");
211 212
		break;
	case TIME_OOP:
R
Roman Zippel 已提交
213
		time_tai++;
214
		time_state = TIME_WAIT;
R
Roman Zippel 已提交
215
		/* fall through */
216 217
	case TIME_WAIT:
		if (!(time_status & (STA_INS | STA_DEL)))
R
Roman Zippel 已提交
218
			time_state = TIME_OK;
R
Roman Zippel 已提交
219 220 221 222
		break;
	}
	update_vsyscall(&xtime, clock);

223
	write_sequnlock(&xtime_lock);
R
Roman Zippel 已提交
224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244

	return res;
}

/*
 * this routine handles the overflow of the microsecond field
 *
 * The tricky bits of code to handle the accurate clock support
 * were provided by Dave Mills (Mills@UDEL.EDU) of NTP fame.
 * They were originally developed for SUN and DEC kernels.
 * All the kudos should go to Dave for this stuff.
 */
void second_overflow(void)
{
	s64 time_adj;

	/* Bump the maxerror field */
	time_maxerror += MAXFREQ / NSEC_PER_USEC;
	if (time_maxerror > NTP_PHASE_LIMIT) {
		time_maxerror = NTP_PHASE_LIMIT;
		time_status |= STA_UNSYNC;
245 246 247
	}

	/*
248 249
	 * Compute the phase adjustment for the next second. The offset is
	 * reduced by a fixed factor times the time constant.
250
	 */
251 252 253 254
	tick_length	= tick_length_base;
	time_adj	= shift_right(time_offset, SHIFT_PLL + time_constant);
	time_offset	-= time_adj;
	tick_length	+= time_adj;
255

256 257 258 259 260 261 262
	if (!time_adjust)
		return;

	if (time_adjust > MAX_TICKADJ) {
		time_adjust -= MAX_TICKADJ;
		tick_length += MAX_TICKADJ_SCALED;
		return;
263
	}
264 265 266 267 268 269 270 271 272 273

	if (time_adjust < -MAX_TICKADJ) {
		time_adjust += MAX_TICKADJ;
		tick_length -= MAX_TICKADJ_SCALED;
		return;
	}

	tick_length += (s64)(time_adjust * NSEC_PER_USEC / NTP_INTERVAL_FREQ)
							 << NTP_SCALE_SHIFT;
	time_adjust = 0;
274 275
}

276
#ifdef CONFIG_GENERIC_CMOS_UPDATE
277

278 279 280
/* Disable the cmos update - used by virtualization and embedded */
int no_sync_cmos_clock  __read_mostly;

281
static void sync_cmos_clock(struct work_struct *work);
282

283
static DECLARE_DELAYED_WORK(sync_cmos_work, sync_cmos_clock);
284

285
static void sync_cmos_clock(struct work_struct *work)
286 287 288 289 290 291 292 293 294 295 296
{
	struct timespec now, next;
	int fail = 1;

	/*
	 * If we have an externally synchronized Linux clock, then update
	 * CMOS clock accordingly every ~11 minutes. Set_rtc_mmss() has to be
	 * called as close as possible to 500 ms before the new second starts.
	 * This code is run on a timer.  If the clock is set, that timer
	 * may not expire at the correct time.  Thus, we adjust...
	 */
297
	if (!ntp_synced()) {
298 299 300 301 302
		/*
		 * Not synced, exit, do not restart a timer (if one is
		 * running, let it run out).
		 */
		return;
303
	}
304 305

	getnstimeofday(&now);
306
	if (abs(now.tv_nsec - (NSEC_PER_SEC / 2)) <= tick_nsec / 2)
307 308
		fail = update_persistent_clock(now);

309
	next.tv_nsec = (NSEC_PER_SEC / 2) - now.tv_nsec - (TICK_NSEC / 2);
310 311 312 313 314 315 316 317 318 319 320 321
	if (next.tv_nsec <= 0)
		next.tv_nsec += NSEC_PER_SEC;

	if (!fail)
		next.tv_sec = 659;
	else
		next.tv_sec = 0;

	if (next.tv_nsec >= NSEC_PER_SEC) {
		next.tv_sec++;
		next.tv_nsec -= NSEC_PER_SEC;
	}
322
	schedule_delayed_work(&sync_cmos_work, timespec_to_jiffies(&next));
323 324 325
}

static void notify_cmos_timer(void)
326
{
327
	if (!no_sync_cmos_clock)
328
		schedule_delayed_work(&sync_cmos_work, 0);
329 330
}

331 332 333 334
#else
static inline void notify_cmos_timer(void) { }
#endif

I
Ingo Molnar 已提交
335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430

/*
 * Propagate a new txc->status value into the NTP state:
 */
static inline void process_adj_status(struct timex *txc, struct timespec *ts)
{
	long now;

	if ((time_status & STA_PLL) && !(txc->status & STA_PLL)) {
		time_state = TIME_OK;
		time_status = STA_UNSYNC;
	}
	/* only set allowed bits */
	time_status &= STA_RONLY;

	/*
	 * If we turn on PLL adjustments then reset the
	 * reference time to current time.
	 */
	if (!(time_status & STA_PLL) && (txc->status & STA_PLL))
		time_reftime = xtime.tv_sec;

	time_status |= txc->status & ~STA_RONLY;

	switch (time_state) {
	case TIME_OK:
	start_timer:
		now = ts->tv_sec;
		if (time_status & STA_INS) {
			time_state = TIME_INS;
			now += 86400 - now % 86400;
			hrtimer_start(&leap_timer, ktime_set(now, 0), HRTIMER_MODE_ABS);
		} else if (time_status & STA_DEL) {
			time_state = TIME_DEL;
			now += 86400 - (now + 1) % 86400;
			hrtimer_start(&leap_timer, ktime_set(now, 0), HRTIMER_MODE_ABS);
		}
		break;
	case TIME_INS:
	case TIME_DEL:
		time_state = TIME_OK;
		goto start_timer;
	case TIME_WAIT:
		if (!(time_status & (STA_INS | STA_DEL)))
			time_state = TIME_OK;
		break;
	case TIME_OOP:
		hrtimer_restart(&leap_timer);
		break;
	}
}
/*
 * Called with the xtime lock held, so we can access and modify
 * all the global NTP state:
 */
static inline void process_adjtimex_modes(struct timex *txc, struct timespec *ts)
{
	if (txc->modes & ADJ_STATUS)
		process_adj_status(txc, ts);

	if (txc->modes & ADJ_NANO)
		time_status |= STA_NANO;
	if (txc->modes & ADJ_MICRO)
		time_status &= ~STA_NANO;

	if (txc->modes & ADJ_FREQUENCY) {
		time_freq = (s64)txc->freq * PPM_SCALE;
		time_freq = min(time_freq, MAXFREQ_SCALED);
		time_freq = max(time_freq, -MAXFREQ_SCALED);
	}

	if (txc->modes & ADJ_MAXERROR)
		time_maxerror = txc->maxerror;
	if (txc->modes & ADJ_ESTERROR)
		time_esterror = txc->esterror;

	if (txc->modes & ADJ_TIMECONST) {
		time_constant = txc->constant;
		if (!(time_status & STA_NANO))
			time_constant += 4;
		time_constant = min(time_constant, (long)MAXTC);
		time_constant = max(time_constant, 0l);
	}

	if (txc->modes & ADJ_TAI && txc->constant > 0)
		time_tai = txc->constant;

	if (txc->modes & ADJ_OFFSET)
		ntp_update_offset(txc->offset);
	if (txc->modes & ADJ_TICK)
		tick_usec = txc->tick;

	if (txc->modes & (ADJ_TICK|ADJ_FREQUENCY|ADJ_OFFSET))
		ntp_update_frequency();
}

431 432
/*
 * adjtimex mainly allows reading (and writing, if superuser) of
433 434 435 436
 * kernel time-keeping variables. used by xntpd.
 */
int do_adjtimex(struct timex *txc)
{
R
Roman Zippel 已提交
437
	struct timespec ts;
438 439
	int result;

440 441
	/* Validate the data before disabling interrupts */
	if (txc->modes & ADJ_ADJTIME) {
R
Roman Zippel 已提交
442
		/* singleshot must not be used with any other mode bits */
443
		if (!(txc->modes & ADJ_OFFSET_SINGLESHOT))
444
			return -EINVAL;
445 446 447 448 449 450 451 452
		if (!(txc->modes & ADJ_OFFSET_READONLY) &&
		    !capable(CAP_SYS_TIME))
			return -EPERM;
	} else {
		/* In order to modify anything, you gotta be super-user! */
		 if (txc->modes && !capable(CAP_SYS_TIME))
			return -EPERM;

453 454 455 456
		/*
		 * if the quartz is off by more than 10% then
		 * something is VERY wrong!
		 */
457 458 459 460 461 462 463
		if (txc->modes & ADJ_TICK &&
		    (txc->tick <  900000/USER_HZ ||
		     txc->tick > 1100000/USER_HZ))
				return -EINVAL;

		if (txc->modes & ADJ_STATUS && time_state != TIME_OK)
			hrtimer_cancel(&leap_timer);
J
John Stultz 已提交
464
	}
465

R
Roman Zippel 已提交
466 467
	getnstimeofday(&ts);

468 469 470
	write_seqlock_irq(&xtime_lock);

	/* If there are input parameters, then process them */
471 472 473 474 475 476 477 478 479 480 481
	if (txc->modes & ADJ_ADJTIME) {
		long save_adjust = time_adjust;

		if (!(txc->modes & ADJ_OFFSET_READONLY)) {
			/* adjtime() is independent from ntp_adjtime() */
			time_adjust = txc->offset;
			ntp_update_frequency();
		}
		txc->offset = save_adjust;
		goto adj_done;
	}
R
Roman Zippel 已提交
482

I
Ingo Molnar 已提交
483 484 485
	/* If there are input parameters, then process them: */
	if (txc->modes)
		process_adjtimex_modes(txc, &ts);
R
Roman Zippel 已提交
486

487 488 489 490 491 492
	txc->offset = shift_right(time_offset * NTP_INTERVAL_FREQ,
				  NTP_SCALE_SHIFT);
	if (!(time_status & STA_NANO))
		txc->offset /= NSEC_PER_USEC;

adj_done:
R
Roman Zippel 已提交
493
	result = time_state;	/* mostly `TIME_OK' */
R
Roman Zippel 已提交
494
	if (time_status & (STA_UNSYNC|STA_CLOCKERR))
495 496
		result = TIME_ERROR;

497 498
	txc->freq	   = shift_right((time_freq >> PPM_SCALE_INV_SHIFT) *
					 (s64)PPM_SCALE_INV, NTP_SCALE_SHIFT);
499 500 501 502
	txc->maxerror	   = time_maxerror;
	txc->esterror	   = time_esterror;
	txc->status	   = time_status;
	txc->constant	   = time_constant;
503
	txc->precision	   = 1;
504
	txc->tolerance	   = MAXFREQ_SCALED / PPM_SCALE;
505
	txc->tick	   = tick_usec;
R
Roman Zippel 已提交
506
	txc->tai	   = time_tai;
507 508 509 510 511 512 513 514 515 516 517

	/* PPS is not implemented, so these are zero */
	txc->ppsfreq	   = 0;
	txc->jitter	   = 0;
	txc->shift	   = 0;
	txc->stabil	   = 0;
	txc->jitcnt	   = 0;
	txc->calcnt	   = 0;
	txc->errcnt	   = 0;
	txc->stbcnt	   = 0;
	write_sequnlock_irq(&xtime_lock);
R
Roman Zippel 已提交
518

R
Roman Zippel 已提交
519 520 521 522
	txc->time.tv_sec = ts.tv_sec;
	txc->time.tv_usec = ts.tv_nsec;
	if (!(time_status & STA_NANO))
		txc->time.tv_usec /= NSEC_PER_USEC;
R
Roman Zippel 已提交
523

524
	notify_cmos_timer();
R
Roman Zippel 已提交
525 526

	return result;
527
}
528 529 530 531 532 533 534 535

static int __init ntp_tick_adj_setup(char *str)
{
	ntp_tick_adj = simple_strtol(str, NULL, 0);
	return 1;
}

__setup("ntp_tick_adj=", ntp_tick_adj_setup);
R
Roman Zippel 已提交
536 537 538 539 540 541 542

void __init ntp_init(void)
{
	ntp_clear();
	hrtimer_init(&leap_timer, CLOCK_REALTIME, HRTIMER_MODE_ABS);
	leap_timer.function = ntp_leap_second;
}