hpet.c 28.6 KB
Newer Older
1
#include <linux/clocksource.h>
2
#include <linux/clockchips.h>
3 4
#include <linux/interrupt.h>
#include <linux/sysdev.h>
5
#include <linux/delay.h>
6
#include <linux/errno.h>
7
#include <linux/slab.h>
8 9
#include <linux/hpet.h>
#include <linux/init.h>
10
#include <linux/cpu.h>
11 12
#include <linux/pm.h>
#include <linux/io.h>
13

14
#include <asm/fixmap.h>
15
#include <asm/i8253.h>
16
#include <asm/hpet.h>
17

18
#define HPET_MASK			CLOCKSOURCE_MASK(32)
19

P
Pavel Machek 已提交
20 21
/* FSEC = 10^-15
   NSEC = 10^-9 */
22
#define FSEC_PER_NSEC			1000000L
23

24 25 26 27 28 29 30 31
#define HPET_DEV_USED_BIT		2
#define HPET_DEV_USED			(1 << HPET_DEV_USED_BIT)
#define HPET_DEV_VALID			0x8
#define HPET_DEV_FSB_CAP		0x1000
#define HPET_DEV_PERI_CAP		0x2000

#define EVT_TO_HPET_DEV(evt) container_of(evt, struct hpet_dev, evt)

32 33 34
/*
 * HPET address is set in acpi/boot.c, when an ACPI entry exists
 */
35
unsigned long				hpet_address;
36
u8					hpet_blockid; /* OS timer block num */
37
u8					hpet_msi_disable;
38
u8					hpet_readback_cmp;
39

40
#ifdef CONFIG_PCI_MSI
H
Hannes Eder 已提交
41
static unsigned long			hpet_num_timers;
42
#endif
43
static void __iomem			*hpet_virt_address;
44

45
struct hpet_dev {
46 47 48 49 50 51
	struct clock_event_device	evt;
	unsigned int			num;
	int				cpu;
	unsigned int			irq;
	unsigned int			flags;
	char				name[10];
52 53
};

J
Jan Beulich 已提交
54
inline unsigned int hpet_readl(unsigned int a)
55 56 57 58
{
	return readl(hpet_virt_address + a);
}

J
Jan Beulich 已提交
59
static inline void hpet_writel(unsigned int d, unsigned int a)
60 61 62 63
{
	writel(d, hpet_virt_address + a);
}

64 65
#ifdef CONFIG_X86_64
#include <asm/pgtable.h>
66
#endif
67

68 69 70
static inline void hpet_set_mapping(void)
{
	hpet_virt_address = ioremap_nocache(hpet_address, HPET_MMAP_SIZE);
71 72 73
#ifdef CONFIG_X86_64
	__set_fixmap(VSYSCALL_HPET, hpet_address, PAGE_KERNEL_VSYSCALL_NOCACHE);
#endif
74 75 76 77 78 79 80 81
}

/*
 * Unmap the register block mapped into hpet_virt_address and reset the
 * pointer to NULL so later code can tell that no mapping exists.
 */
static inline void hpet_clear_mapping(void)
{
	iounmap(hpet_virt_address);
	hpet_virt_address = NULL;
}

82 83 84 85
/*
 * HPET command line enable / disable
 */
static int boot_hpet_disable;
T
Thomas Gleixner 已提交
86
int hpet_force_user;
87
static int hpet_verbose;
88

89
/*
 * Parse the "hpet=" boot parameter.
 *
 * @str is the text following "hpet=".  It may hold a single option or a
 * comma separated list (e.g. "hpet=force,verbose").  Each element is
 * matched by prefix against:
 *   disable - sets boot_hpet_disable, which makes is_hpet_capable() fail
 *   force   - sets hpet_force_user
 *   verbose - sets hpet_verbose, enabling hpet_print_config() dumps
 * Unknown elements are ignored.  The commas inside @str are overwritten
 * with NUL bytes while parsing.
 *
 * Always returns 1 (the __setup() convention for a handled option).
 */
static int __init hpet_setup(char *str)
{
	while (str) {
		char *next = strchr(str, ',');

		/* Terminate the current element and remember the next one. */
		if (next)
			*next++ = '\0';

		if (!strncmp("disable", str, 7))
			boot_hpet_disable = 1;
		if (!strncmp("force", str, 5))
			hpet_force_user = 1;
		if (!strncmp("verbose", str, 7))
			hpet_verbose = 1;

		str = next;
	}
	return 1;
}
__setup("hpet=", hpet_setup);

103 104 105 106 107 108 109
/*
 * Handler for the "nohpet" boot parameter: sets boot_hpet_disable, the
 * same flag "hpet=disable" sets.  @str is not used.  Always returns 1.
 */
static int __init disable_hpet(char *str)
{
	boot_hpet_disable = 1;
	return 1;
}
__setup("nohpet", disable_hpet);

110 111
static inline int is_hpet_capable(void)
{
112
	return !boot_hpet_disable && hpet_address;
113 114 115 116 117 118 119 120 121 122 123 124 125 126
}

/*
 * HPET timer interrupt enable / disable
 */
static int hpet_legacy_int_enabled;

/**
 * is_hpet_enabled - check whether the hpet timer interrupt is enabled
 *
 * Returns 1 when the HPET is usable (see is_hpet_capable()) and the
 * legacy interrupt has been switched on, 0 otherwise.
 */
int is_hpet_enabled(void)
{
	if (!is_hpet_capable())
		return 0;

	return hpet_legacy_int_enabled != 0;
}
127
EXPORT_SYMBOL_GPL(is_hpet_enabled);
128

129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165
/*
 * Dump the HPET register state to the kernel log.
 *
 * @function: name of the caller, printed as a tag
 * @line:     source line of the caller, printed as a tag
 *
 * Prints the ID, PERIOD, CFG, STATUS and both halves of the main
 * counter, followed by the CFG, CMP and ROUTE register pairs of every
 * timer reported by the ID register.  Normally reached through the
 * hpet_print_config() macro.
 */
static void _hpet_print_config(const char *function, int line)
{
	u32 i, timers, l, h;

	printk(KERN_INFO "hpet: %s(%d):\n", function, line);
	l = hpet_readl(HPET_ID);
	h = hpet_readl(HPET_PERIOD);
	/* The ID field holds the index of the last timer, hence the +1. */
	timers = ((l & HPET_ID_NUMBER) >> HPET_ID_NUMBER_SHIFT) + 1;
	printk(KERN_INFO "hpet: ID: 0x%x, PERIOD: 0x%x\n", l, h);
	l = hpet_readl(HPET_CFG);
	h = hpet_readl(HPET_STATUS);
	printk(KERN_INFO "hpet: CFG: 0x%x, STATUS: 0x%x\n", l, h);
	l = hpet_readl(HPET_COUNTER);
	h = hpet_readl(HPET_COUNTER+4);
	printk(KERN_INFO "hpet: COUNTER_l: 0x%x, COUNTER_h: 0x%x\n", l, h);

	for (i = 0; i < timers; i++) {
		/* i is u32, so it is printed with %u. */
		l = hpet_readl(HPET_Tn_CFG(i));
		h = hpet_readl(HPET_Tn_CFG(i)+4);
		printk(KERN_INFO "hpet: T%u: CFG_l: 0x%x, CFG_h: 0x%x\n",
		       i, l, h);
		l = hpet_readl(HPET_Tn_CMP(i));
		h = hpet_readl(HPET_Tn_CMP(i)+4);
		printk(KERN_INFO "hpet: T%u: CMP_l: 0x%x, CMP_h: 0x%x\n",
		       i, l, h);
		l = hpet_readl(HPET_Tn_ROUTE(i));
		h = hpet_readl(HPET_Tn_ROUTE(i)+4);
		printk(KERN_INFO "hpet: T%u ROUTE_l: 0x%x, ROUTE_h: 0x%x\n",
		       i, l, h);
	}
}

/*
 * Dump the HPET registers, tagged with the calling function and line,
 * but only when hpet_verbose is set ("hpet=verbose").  Uses the standard
 * __func__ identifier rather than the older __FUNCTION__ spelling.
 */
#define hpet_print_config()					\
do {								\
	if (hpet_verbose)					\
		_hpet_print_config(__func__, __LINE__);		\
} while (0)

166 167 168 169 170
/*
 * When the hpet driver (/dev/hpet) is enabled, we need to reserve
 * timer 0 and timer 1 in case of RTC emulation.
 */
#ifdef CONFIG_HPET
171

V
Venki Pallipadi 已提交
172
static void hpet_reserve_msi_timers(struct hpet_data *hd);
173

J
Jan Beulich 已提交
174
static void hpet_reserve_platform_timers(unsigned int id)
175 176
{
	struct hpet __iomem *hpet = hpet_virt_address;
177 178
	struct hpet_timer __iomem *timer = &hpet->hpet_timers[2];
	unsigned int nrtimers, i;
179 180 181 182
	struct hpet_data hd;

	nrtimers = ((id & HPET_ID_NUMBER) >> HPET_ID_NUMBER_SHIFT) + 1;

183 184 185 186
	memset(&hd, 0, sizeof(hd));
	hd.hd_phys_address	= hpet_address;
	hd.hd_address		= hpet;
	hd.hd_nirqs		= nrtimers;
187 188 189 190 191
	hpet_reserve_timer(&hd, 0);

#ifdef CONFIG_HPET_EMULATE_RTC
	hpet_reserve_timer(&hd, 1);
#endif
192

193 194 195 196 197
	/*
	 * NOTE that hd_irq[] reflects IOAPIC input pins (LEGACY_8254
	 * is wrong for i8259!) not the output IRQ.  Many BIOS writers
	 * don't bother configuring *any* comparator interrupts.
	 */
198 199 200
	hd.hd_irq[0] = HPET_LEGACY_8254;
	hd.hd_irq[1] = HPET_LEGACY_RTC;

I
Ingo Molnar 已提交
201
	for (i = 2; i < nrtimers; timer++, i++) {
202 203
		hd.hd_irq[i] = (readl(&timer->hpet_config) &
			Tn_INT_ROUTE_CNF_MASK) >> Tn_INT_ROUTE_CNF_SHIFT;
I
Ingo Molnar 已提交
204
	}
205

206
	hpet_reserve_msi_timers(&hd);
207

208
	hpet_alloc(&hd);
209

210 211
}
#else
J
Jan Beulich 已提交
212
/* Without CONFIG_HPET (the /dev/hpet driver) there is nothing to reserve. */
static void hpet_reserve_platform_timers(unsigned int id) { }
213 214 215 216 217 218 219
#endif

/*
 * Common hpet info
 */
static unsigned long hpet_period;

220
static void hpet_legacy_set_mode(enum clock_event_mode mode,
221
			  struct clock_event_device *evt);
222
static int hpet_legacy_next_event(unsigned long delta,
223 224 225 226 227 228 229 230
			   struct clock_event_device *evt);

/*
 * The hpet clock event device
 */
static struct clock_event_device hpet_clockevent = {
	.name		= "hpet",
	.features	= CLOCK_EVT_FEAT_PERIODIC | CLOCK_EVT_FEAT_ONESHOT,
231 232
	.set_mode	= hpet_legacy_set_mode,
	.set_next_event = hpet_legacy_next_event,
233 234
	.shift		= 32,
	.irq		= 0,
235
	.rating		= 50,
236 237
};

238
static void hpet_stop_counter(void)
239 240 241 242
{
	unsigned long cfg = hpet_readl(HPET_CFG);
	cfg &= ~HPET_CFG_ENABLE;
	hpet_writel(cfg, HPET_CFG);
243 244 245 246
}

/* Zero the main counter: low 32-bit half first, then the high half. */
static void hpet_reset_counter(void)
{
	unsigned int half;

	for (half = 0; half < 8; half += 4)
		hpet_writel(0, HPET_COUNTER + half);
}

static void hpet_start_counter(void)
{
J
Jan Beulich 已提交
253
	unsigned int cfg = hpet_readl(HPET_CFG);
254 255 256 257
	cfg |= HPET_CFG_ENABLE;
	hpet_writel(cfg, HPET_CFG);
}

258 259 260
/* Restart the main counter from zero: stop it, clear it, start it again. */
static void hpet_restart_counter(void)
{
	hpet_stop_counter();
	hpet_reset_counter();
	hpet_start_counter();
}

265 266
/* Resume hook for the HPET device itself; delegates to force_hpet_resume(). */
static void hpet_resume_device(void)
{
	force_hpet_resume();
}

270
/*
 * clocksource ->resume callback: bring the device back via
 * force_hpet_resume() and restart the main counter from zero.
 * @cs is not used.
 */
static void hpet_resume_counter(struct clocksource *cs)
{
	force_hpet_resume();
	hpet_restart_counter();
}

276
static void hpet_enable_legacy_int(void)
277
{
J
Jan Beulich 已提交
278
	unsigned int cfg = hpet_readl(HPET_CFG);
279 280 281 282 283 284

	cfg |= HPET_CFG_LEGACY;
	hpet_writel(cfg, HPET_CFG);
	hpet_legacy_int_enabled = 1;
}

285 286 287 288 289 290
static void hpet_legacy_clockevent_register(void)
{
	/* Start HPET legacy interrupts */
	hpet_enable_legacy_int();

	/*
291 292 293 294 295 296
	 * The mult factor is defined as (include/linux/clockchips.h)
	 *  mult/2^shift = cyc/ns (in contrast to ns/cyc in clocksource.h)
	 * hpet_period is in units of femtoseconds (per cycle), so
	 *  mult/2^shift = cyc/ns = 10^6/hpet_period
	 *  mult = (10^6 * 2^shift)/hpet_period
	 *  mult = (FSEC_PER_NSEC << hpet_clockevent.shift)/hpet_period
297
	 */
298 299
	hpet_clockevent.mult = div_sc((unsigned long) FSEC_PER_NSEC,
				      hpet_period, hpet_clockevent.shift);
300 301 302
	/* Calculate the min / max delta */
	hpet_clockevent.max_delta_ns = clockevent_delta2ns(0x7FFFFFFF,
							   &hpet_clockevent);
303 304
	/* 5 usec minimum reprogramming delta. */
	hpet_clockevent.min_delta_ns = 5000;
305 306 307 308 309

	/*
	 * Start hpet with the boot cpu mask and make it
	 * global after the IO_APIC has been initialized.
	 */
310
	hpet_clockevent.cpumask = cpumask_of(smp_processor_id());
311 312 313 314 315
	clockevents_register_device(&hpet_clockevent);
	global_clock_event = &hpet_clockevent;
	printk(KERN_DEBUG "hpet clockevent registered\n");
}

316 317
static int hpet_setup_msi_irq(unsigned int irq);

318 319
static void hpet_set_mode(enum clock_event_mode mode,
			  struct clock_event_device *evt, int timer)
320
{
J
Jan Beulich 已提交
321
	unsigned int cfg, cmp, now;
322 323
	uint64_t delta;

324
	switch (mode) {
325
	case CLOCK_EVT_MODE_PERIODIC:
326
		hpet_stop_counter();
327 328
		delta = ((uint64_t)(NSEC_PER_SEC/HZ)) * evt->mult;
		delta >>= evt->shift;
329
		now = hpet_readl(HPET_COUNTER);
J
Jan Beulich 已提交
330
		cmp = now + (unsigned int) delta;
331
		cfg = hpet_readl(HPET_Tn_CFG(timer));
332 333
		/* Make sure we use edge triggered interrupts */
		cfg &= ~HPET_TN_LEVEL;
334 335
		cfg |= HPET_TN_ENABLE | HPET_TN_PERIODIC |
		       HPET_TN_SETVAL | HPET_TN_32BIT;
336
		hpet_writel(cfg, HPET_Tn_CFG(timer));
337 338 339 340 341 342 343 344 345
		hpet_writel(cmp, HPET_Tn_CMP(timer));
		udelay(1);
		/*
		 * HPET on AMD 81xx needs a second write (with HPET_TN_SETVAL
		 * cleared) to T0_CMP to set the period. The HPET_TN_SETVAL
		 * bit is automatically cleared after the first write.
		 * (See AMD-8111 HyperTransport I/O Hub Data Sheet,
		 * Publication # 24674)
		 */
J
Jan Beulich 已提交
346
		hpet_writel((unsigned int) delta, HPET_Tn_CMP(timer));
347
		hpet_start_counter();
348
		hpet_print_config();
349 350 351
		break;

	case CLOCK_EVT_MODE_ONESHOT:
352
		cfg = hpet_readl(HPET_Tn_CFG(timer));
353 354
		cfg &= ~HPET_TN_PERIODIC;
		cfg |= HPET_TN_ENABLE | HPET_TN_32BIT;
355
		hpet_writel(cfg, HPET_Tn_CFG(timer));
356 357 358 359
		break;

	case CLOCK_EVT_MODE_UNUSED:
	case CLOCK_EVT_MODE_SHUTDOWN:
360
		cfg = hpet_readl(HPET_Tn_CFG(timer));
361
		cfg &= ~HPET_TN_ENABLE;
362
		hpet_writel(cfg, HPET_Tn_CFG(timer));
363
		break;
T
Thomas Gleixner 已提交
364 365

	case CLOCK_EVT_MODE_RESUME:
366 367 368 369 370 371
		if (timer == 0) {
			hpet_enable_legacy_int();
		} else {
			struct hpet_dev *hdev = EVT_TO_HPET_DEV(evt);
			hpet_setup_msi_irq(hdev->irq);
			disable_irq(hdev->irq);
372
			irq_set_affinity(hdev->irq, cpumask_of(hdev->cpu));
373 374
			enable_irq(hdev->irq);
		}
375
		hpet_print_config();
T
Thomas Gleixner 已提交
376
		break;
377 378 379
	}
}

380 381
static int hpet_next_event(unsigned long delta,
			   struct clock_event_device *evt, int timer)
382
{
383
	u32 cnt;
384 385

	cnt = hpet_readl(HPET_COUNTER);
386
	cnt += (u32) delta;
387
	hpet_writel(cnt, HPET_Tn_CMP(timer));
388

389
	/*
390 391 392 393 394 395 396 397
	 * We need to read back the CMP register on certain HPET
	 * implementations (ATI chipsets) which seem to delay the
	 * transfer of the compare register into the internal compare
	 * logic. With small deltas this might actually be too late as
	 * the counter could already be higher than the compare value
	 * at that point and we would wait for the next hpet interrupt
	 * forever. We found out that reading the CMP register back
	 * forces the transfer so we can rely on the comparison with
398 399 400 401 402 403 404 405 406 407
	 * the counter register below.
	 *
	 * That works fine on those ATI chipsets, but on newer Intel
	 * chipsets (ICH9...) this triggers due to an erratum: Reading
	 * the comparator immediately following a write is returning
	 * the old value.
	 *
	 * We restrict the read back to the affected ATI chipsets (set
	 * by quirks) and also run it with hpet=verbose for debugging
	 * purposes.
408
	 */
409 410 411 412 413 414
	if (hpet_readback_cmp || hpet_verbose) {
		u32 cmp = hpet_readl(HPET_Tn_CMP(timer));

		if (cmp != cnt)
			printk_once(KERN_WARNING
			    "hpet: compare register read back failed.\n");
415
	}
416

J
Jan Beulich 已提交
417
	return (s32)(hpet_readl(HPET_COUNTER) - cnt) >= 0 ? -ETIME : 0;
418 419
}

420 421 422 423 424 425 426 427 428 429 430 431
/* ->set_mode callback of hpet_clockevent: operates on HPET timer 0. */
static void hpet_legacy_set_mode(enum clock_event_mode mode,
			struct clock_event_device *evt)
{
	hpet_set_mode(mode, evt, 0);
}

/*
 * ->set_next_event callback of hpet_clockevent: programs HPET timer 0
 * and passes on the result of hpet_next_event().
 */
static int hpet_legacy_next_event(unsigned long delta,
			struct clock_event_device *evt)
{
	return hpet_next_event(delta, evt, 0);
}

432 433 434
/*
 * HPET MSI Support
 */
435
#ifdef CONFIG_PCI_MSI
V
Venki Pallipadi 已提交
436 437 438 439

static DEFINE_PER_CPU(struct hpet_dev *, cpu_hpet_dev);
static struct hpet_dev	*hpet_devs;

440 441 442
/*
 * Unmask the MSI of the HPET timer attached to @irq by setting
 * HPET_TN_FSB in that timer's configuration register.
 */
void hpet_msi_unmask(unsigned int irq)
{
	struct hpet_dev *hdev = get_irq_data(irq);
	unsigned int conf = hpet_readl(HPET_Tn_CFG(hdev->num));

	hpet_writel(conf | HPET_TN_FSB, HPET_Tn_CFG(hdev->num));
}

void hpet_msi_mask(unsigned int irq)
{
J
Jan Beulich 已提交
453
	unsigned int cfg;
454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478
	struct hpet_dev *hdev = get_irq_data(irq);

	/* mask it */
	cfg = hpet_readl(HPET_Tn_CFG(hdev->num));
	cfg &= ~HPET_TN_FSB;
	hpet_writel(cfg, HPET_Tn_CFG(hdev->num));
}

/*
 * Program the MSI message @msg into the route register pair of the HPET
 * timer attached to @irq: data first, then the low address word.
 */
void hpet_msi_write(unsigned int irq, struct msi_msg *msg)
{
	struct hpet_dev *hdev = get_irq_data(irq);
	unsigned int route = HPET_Tn_ROUTE(hdev->num);

	hpet_writel(msg->data, route);
	hpet_writel(msg->address_lo, route + 4);
}

/*
 * Read the MSI message of the HPET timer attached to @irq back from its
 * route register pair into @msg.  The high address word is reported as 0.
 */
void hpet_msi_read(unsigned int irq, struct msi_msg *msg)
{
	struct hpet_dev *hdev = get_irq_data(irq);
	unsigned int route = HPET_Tn_ROUTE(hdev->num);

	msg->data = hpet_readl(route);
	msg->address_lo = hpet_readl(route + 4);
	msg->address_hi = 0;
}

479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494
static void hpet_msi_set_mode(enum clock_event_mode mode,
				struct clock_event_device *evt)
{
	struct hpet_dev *hdev = EVT_TO_HPET_DEV(evt);
	hpet_set_mode(mode, evt, hdev->num);
}

static int hpet_msi_next_event(unsigned long delta,
				struct clock_event_device *evt)
{
	struct hpet_dev *hdev = EVT_TO_HPET_DEV(evt);
	return hpet_next_event(delta, evt, hdev->num);
}

static int hpet_setup_msi_irq(unsigned int irq)
{
495
	if (arch_setup_hpet_msi(irq, hpet_blockid)) {
496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537
		destroy_irq(irq);
		return -EINVAL;
	}
	return 0;
}

/*
 * Allocate an interrupt for @dev, attach @dev to it as irq data and set
 * it up for HPET MSI delivery.
 *
 * Returns 0 and stores the interrupt in dev->irq on success, -EINVAL
 * otherwise.
 *
 * NOTE(review): a zero result from create_irq() is treated as failure;
 * confirm that this matches create_irq()'s error convention.
 */
static int hpet_assign_irq(struct hpet_dev *dev)
{
	unsigned int irq = create_irq();

	if (!irq)
		return -EINVAL;

	set_irq_data(irq, dev);

	if (hpet_setup_msi_irq(irq) != 0)
		return -EINVAL;

	dev->irq = irq;
	return 0;
}

/*
 * Interrupt handler of a per-cpu HPET MSI timer.
 *
 * @data is the struct hpet_dev passed to request_irq().  Forwards the
 * interrupt to the clock event handler, or logs it as spurious when no
 * handler has been installed.  Always returns IRQ_HANDLED.
 */
static irqreturn_t hpet_interrupt_handler(int irq, void *data)
{
	struct hpet_dev *dev = data;
	struct clock_event_device *hevt = &dev->evt;

	if (hevt->event_handler)
		hevt->event_handler(hevt);
	else
		printk(KERN_INFO "Spurious HPET timer interrupt on HPET timer %d\n",
				dev->num);

	return IRQ_HANDLED;
}

static int hpet_setup_irq(struct hpet_dev *dev)
{

	if (request_irq(dev->irq, hpet_interrupt_handler,
538 539
			IRQF_TIMER | IRQF_DISABLED | IRQF_NOBALANCING,
			dev->name, dev))
540 541 542
		return -1;

	disable_irq(dev->irq);
543
	irq_set_affinity(dev->irq, cpumask_of(dev->cpu));
544 545
	enable_irq(dev->irq);

Y
Yinghai Lu 已提交
546 547 548
	printk(KERN_DEBUG "hpet: %s irq %d for MSI\n",
			 dev->name, dev->irq);

549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584
	return 0;
}

/* This should be called in specific @cpu */
static void init_one_hpet_msi_clockevent(struct hpet_dev *hdev, int cpu)
{
	struct clock_event_device *evt = &hdev->evt;
	uint64_t hpet_freq;

	WARN_ON(cpu != smp_processor_id());
	if (!(hdev->flags & HPET_DEV_VALID))
		return;

	if (hpet_setup_msi_irq(hdev->irq))
		return;

	hdev->cpu = cpu;
	per_cpu(cpu_hpet_dev, cpu) = hdev;
	evt->name = hdev->name;
	hpet_setup_irq(hdev);
	evt->irq = hdev->irq;

	evt->rating = 110;
	evt->features = CLOCK_EVT_FEAT_ONESHOT;
	if (hdev->flags & HPET_DEV_PERI_CAP)
		evt->features |= CLOCK_EVT_FEAT_PERIODIC;

	evt->set_mode = hpet_msi_set_mode;
	evt->set_next_event = hpet_msi_next_event;
	evt->shift = 32;

	/*
	 * The period is a femto seconds value. We need to calculate the
	 * scaled math multiplication factor for nanosecond to hpet tick
	 * conversion.
	 */
585
	hpet_freq = FSEC_PER_SEC;
586 587 588 589 590 591 592 593
	do_div(hpet_freq, hpet_period);
	evt->mult = div_sc((unsigned long) hpet_freq,
				      NSEC_PER_SEC, evt->shift);
	/* Calculate the max delta */
	evt->max_delta_ns = clockevent_delta2ns(0x7FFFFFFF, evt);
	/* 5 usec minimum reprogramming delta. */
	evt->min_delta_ns = 5000;

594
	evt->cpumask = cpumask_of(hdev->cpu);
595 596 597 598 599 600 601 602 603
	clockevents_register_device(evt);
}

#ifdef CONFIG_HPET
/* Reserve at least one timer for userspace (/dev/hpet) */
#define RESERVE_TIMERS 1
#else
#define RESERVE_TIMERS 0
#endif
V
Venki Pallipadi 已提交
604 605

static void hpet_msi_capability_lookup(unsigned int start_timer)
606 607 608 609 610 611
{
	unsigned int id;
	unsigned int num_timers;
	unsigned int num_timers_used = 0;
	int i;

612 613 614
	if (hpet_msi_disable)
		return;

615 616
	if (boot_cpu_has(X86_FEATURE_ARAT))
		return;
617 618 619 620
	id = hpet_readl(HPET_ID);

	num_timers = ((id & HPET_ID_NUMBER) >> HPET_ID_NUMBER_SHIFT);
	num_timers++; /* Value read out starts from 0 */
621
	hpet_print_config();
622 623 624 625 626 627 628 629 630

	hpet_devs = kzalloc(sizeof(struct hpet_dev) * num_timers, GFP_KERNEL);
	if (!hpet_devs)
		return;

	hpet_num_timers = num_timers;

	for (i = start_timer; i < num_timers - RESERVE_TIMERS; i++) {
		struct hpet_dev *hdev = &hpet_devs[num_timers_used];
J
Jan Beulich 已提交
631
		unsigned int cfg = hpet_readl(HPET_Tn_CFG(i));
632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656

		/* Only consider HPET timer with MSI support */
		if (!(cfg & HPET_TN_FSB_CAP))
			continue;

		hdev->flags = 0;
		if (cfg & HPET_TN_PERIODIC_CAP)
			hdev->flags |= HPET_DEV_PERI_CAP;
		hdev->num = i;

		sprintf(hdev->name, "hpet%d", i);
		if (hpet_assign_irq(hdev))
			continue;

		hdev->flags |= HPET_DEV_FSB_CAP;
		hdev->flags |= HPET_DEV_VALID;
		num_timers_used++;
		if (num_timers_used == num_possible_cpus())
			break;
	}

	printk(KERN_INFO "HPET: %d timers in total, %d timers will be used for per-cpu timer\n",
		num_timers, num_timers_used);
}

V
Venki Pallipadi 已提交
657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676
#ifdef CONFIG_HPET
/*
 * Record the interrupt of every valid MSI timer in @hd and reserve that
 * timer, so it is not handed out through @hd.  No-op when no MSI timers
 * were set up.
 */
static void hpet_reserve_msi_timers(struct hpet_data *hd)
{
	int idx;

	if (!hpet_devs)
		return;

	for (idx = 0; idx < hpet_num_timers; idx++) {
		struct hpet_dev *hdev = &hpet_devs[idx];

		if (hdev->flags & HPET_DEV_VALID) {
			hd->hd_irq[hdev->num] = hdev->irq;
			hpet_reserve_timer(hd, hdev->num);
		}
	}
}
#endif

677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 725
/*
 * Claim the first valid MSI timer that is not in use yet.
 *
 * The USED bit is taken with test_and_set_bit(), so a timer is handed
 * out only to the caller that actually set the bit.  Returns the
 * claimed device or NULL when none is available.
 */
static struct hpet_dev *hpet_get_unused_timer(void)
{
	int idx;

	if (!hpet_devs)
		return NULL;

	for (idx = 0; idx < hpet_num_timers; idx++) {
		struct hpet_dev *hdev = &hpet_devs[idx];

		if ((hdev->flags & HPET_DEV_VALID) &&
		    !test_and_set_bit(HPET_DEV_USED_BIT,
				      (unsigned long *)&hdev->flags))
			return hdev;
	}
	return NULL;
}

/*
 * Work item used by hpet_cpuhp_notify() to run hpet_work() on a given
 * cpu and to wait until it has finished.
 */
struct hpet_work_struct {
	struct delayed_work work;	/* executes hpet_work() */
	struct completion complete;	/* completed at the end of hpet_work() */
};

/*
 * Work function queued by hpet_cpuhp_notify(): claim an unused MSI timer
 * and initialise it as the clock event device of the cpu this runs on,
 * then signal completion to the waiter.
 */
static void hpet_work(struct work_struct *w)
{
	struct hpet_work_struct *item =
		container_of(w, struct hpet_work_struct, work.work);
	int cpu = smp_processor_id();
	struct hpet_dev *hdev = hpet_get_unused_timer();

	if (hdev)
		init_one_hpet_msi_clockevent(hdev, cpu);

	complete(&item->complete);
}

static int hpet_cpuhp_notify(struct notifier_block *n,
		unsigned long action, void *hcpu)
{
	unsigned long cpu = (unsigned long)hcpu;
	struct hpet_work_struct work;
	struct hpet_dev *hdev = per_cpu(cpu_hpet_dev, cpu);

	switch (action & 0xf) {
	case CPU_ONLINE:
726
		INIT_DELAYED_WORK_ON_STACK(&work.work, hpet_work);
727 728 729 730
		init_completion(&work.complete);
		/* FIXME: add schedule_work_on() */
		schedule_delayed_work_on(cpu, &work.work, 0);
		wait_for_completion(&work.complete);
731
		destroy_timer_on_stack(&work.work.timer);
732 733 734 735 736 737 738 739 740 741 742 743 744
		break;
	case CPU_DEAD:
		if (hdev) {
			free_irq(hdev->irq, hdev);
			hdev->flags &= ~HPET_DEV_USED;
			per_cpu(cpu_hpet_dev, cpu) = NULL;
		}
		break;
	}
	return NOTIFY_OK;
}
#else

745 746 747 748
/* Stub for kernels without CONFIG_PCI_MSI: nothing to set up, reports success. */
static int hpet_setup_msi_irq(unsigned int irq)
{
	return 0;
}
V
Venki Pallipadi 已提交
749 750 751 752 753 754 755
/* Stub for kernels without CONFIG_PCI_MSI: no MSI timers to look for. */
static void hpet_msi_capability_lookup(unsigned int start_timer)
{
}

#ifdef CONFIG_HPET
/* Stub for kernels without CONFIG_PCI_MSI: no MSI timers to reserve. */
static void hpet_reserve_msi_timers(struct hpet_data *hd)
{
}
V
Venki Pallipadi 已提交
759
#endif
760 761 762 763 764 765 766 767 768

/* Stub for kernels without CONFIG_PCI_MSI: ignores every hotplug event. */
static int hpet_cpuhp_notify(struct notifier_block *n,
		unsigned long action, void *hcpu)
{
	return NOTIFY_OK;
}

#endif

769 770 771
/*
 * Clock source related code
 */
772
static cycle_t read_hpet(struct clocksource *cs)
773 774 775 776
{
	return (cycle_t)hpet_readl(HPET_COUNTER);
}

777 778 779 780 781 782 783
#ifdef CONFIG_X86_64
/*
 * vsyscall variant of read_hpet(): reads through the VSYSCALL_HPET
 * fixmap slot that hpet_set_mapping() installs.
 * NOTE(review): 0xf0 is presumably the main counter offset
 * (HPET_COUNTER) - confirm against asm/hpet.h.
 */
static cycle_t __vsyscall_fn vread_hpet(void)
{
	return readl((const void __iomem *)fix_to_virt(VSYSCALL_HPET) + 0xf0);
}
#endif

784 785 786 787 788 789
static struct clocksource clocksource_hpet = {
	.name		= "hpet",
	.rating		= 250,
	.read		= read_hpet,
	.mask		= HPET_MASK,
	.flags		= CLOCK_SOURCE_IS_CONTINUOUS,
790
	.resume		= hpet_resume_counter,
791 792 793
#ifdef CONFIG_X86_64
	.vread		= vread_hpet,
#endif
794 795
};

796
static int hpet_clocksource_register(void)
797
{
798
	u64 start, now;
799
	u64 hpet_freq;
800
	cycle_t t1;
801 802

	/* Start the counter */
803
	hpet_restart_counter();
804

805
	/* Verify whether hpet counter works */
806
	t1 = hpet_readl(HPET_COUNTER);
807 808 809 810 811 812 813 814 815 816 817 818 819
	rdtscll(start);

	/*
	 * We don't know the TSC frequency yet, but waiting for
	 * 200000 TSC cycles is safe:
	 * 4 GHz == 50us
	 * 1 GHz == 200us
	 */
	do {
		rep_nop();
		rdtscll(now);
	} while ((now - start) < 200000UL);

820
	if (t1 == hpet_readl(HPET_COUNTER)) {
821 822
		printk(KERN_WARNING
		       "HPET counter not counting. HPET disabled\n");
823
		return -ENODEV;
824 825
	}

826 827 828 829 830 831 832
	/*
	 * The definition of mult is (include/linux/clocksource.h)
	 * mult/2^shift = ns/cyc and hpet_period is in units of fsec/cyc
	 * so we first need to convert hpet_period to ns/cyc units:
	 *  mult/2^shift = ns/cyc = hpet_period/10^6
	 *  mult = (hpet_period * 2^shift)/10^6
	 *  mult = (hpet_period << shift)/FSEC_PER_NSEC
833 834
	 */

835 836 837 838 839
	/* Need to convert hpet_period (fsec/cyc) to cyc/sec:
	 *
	 * cyc/sec = FSEC_PER_SEC/hpet_period(fsec/cyc)
	 * cyc/sec = (FSEC_PER_NSEC * NSEC_PER_SEC)/hpet_period
	 */
840
	hpet_freq = FSEC_PER_SEC;
841 842
	do_div(hpet_freq, hpet_period);
	clocksource_register_hz(&clocksource_hpet, (u32)hpet_freq);
843

844 845 846
	return 0;
}

P
Pavel Machek 已提交
847 848
/**
 * hpet_enable - Try to setup the HPET timer.
 *
 * Maps the HPET, validates it, registers the clocksource and, when the
 * hardware supports legacy replacement routing, the legacy clock event
 * device.
 *
 * Returns 1 when the legacy clock event device was registered and 0 in
 * every other case.  Note that 0 is also returned when only the
 * clocksource could be registered; the mapping is kept in that case.
 */
int __init hpet_enable(void)
{
	unsigned int id;
	int i;

	if (!is_hpet_capable())
		return 0;

	hpet_set_mapping();
	/* The mapping can fail; do not touch the registers through NULL. */
	if (!hpet_virt_address)
		return 0;

	/*
	 * Read the period and check for a sane value:
	 */
	hpet_period = hpet_readl(HPET_PERIOD);

	/*
	 * AMD SB700 based systems with spread spectrum enabled use a
	 * SMM based HPET emulation to provide proper frequency
	 * setting. The SMM code is initialized with the first HPET
	 * register access and takes some time to complete. During
	 * this time the config register reads 0xffffffff. We check
	 * for max. 1000 loops whether the config register reads a non
	 * 0xffffffff value to make sure that HPET is up and running
	 * before we go further. A counting loop is safe, as the HPET
	 * access takes thousands of CPU cycles. On non SB700 based
	 * machines this check is only done once and has no side
	 * effects.
	 */
	for (i = 0; hpet_readl(HPET_CFG) == 0xFFFFFFFF; i++) {
		if (i == 1000) {
			printk(KERN_WARNING
			       "HPET config register value = 0xFFFFFFFF. "
			       "Disabling HPET\n");
			goto out_nohpet;
		}
	}

	if (hpet_period < HPET_MIN_PERIOD || hpet_period > HPET_MAX_PERIOD)
		goto out_nohpet;

	/*
	 * Read the HPET ID register to retrieve the IRQ routing
	 * information and the number of channels
	 */
	id = hpet_readl(HPET_ID);
	hpet_print_config();

#ifdef CONFIG_HPET_EMULATE_RTC
	/*
	 * The legacy routing mode needs at least two channels, tick timer
	 * and the rtc emulation channel.
	 */
	if (!(id & HPET_ID_NUMBER))
		goto out_nohpet;
#endif

	if (hpet_clocksource_register())
		goto out_nohpet;

	if (id & HPET_ID_LEGSUP) {
		hpet_legacy_clockevent_register();
		return 1;
	}
	return 0;

out_nohpet:
	/* Drop the mapping and forget the address so the HPET stays off. */
	hpet_clear_mapping();
	hpet_address = 0;
	return 0;
}

921 922 923 924 925 926 927 928
/*
 * Needs to be late, as the reserve_timer code calls kalloc !
 *
 * Not a problem on i386 as hpet_enable is called from late_time_init,
 * but on x86_64 it is necessary !
 */
static __init int hpet_late_init(void)
{
929 930
	int cpu;

931
	if (boot_hpet_disable)
932 933
		return -ENODEV;

934 935 936 937 938 939 940 941
	if (!hpet_address) {
		if (!force_hpet_address)
			return -ENODEV;

		hpet_address = force_hpet_address;
		hpet_enable();
	}

942 943 944
	if (!hpet_virt_address)
		return -ENODEV;

945 946 947 948 949
	if (hpet_readl(HPET_ID) & HPET_ID_LEGSUP)
		hpet_msi_capability_lookup(2);
	else
		hpet_msi_capability_lookup(0);

950
	hpet_reserve_platform_timers(hpet_readl(HPET_ID));
951
	hpet_print_config();
952

953 954 955
	if (hpet_msi_disable)
		return 0;

956 957 958
	if (boot_cpu_has(X86_FEATURE_ARAT))
		return 0;

959 960 961 962 963 964 965
	for_each_online_cpu(cpu) {
		hpet_cpuhp_notify(NULL, CPU_ONLINE, (void *)(long)cpu);
	}

	/* This notifier should be called after workqueue is ready */
	hotcpu_notifier(hpet_cpuhp_notify, -20);

966 967 968 969
	return 0;
}
fs_initcall(hpet_late_init);

O
OGAWA Hirofumi 已提交
970 971
void hpet_disable(void)
{
972
	if (is_hpet_capable() && hpet_virt_address) {
J
Jan Beulich 已提交
973
		unsigned int cfg = hpet_readl(HPET_CFG);
O
OGAWA Hirofumi 已提交
974 975 976 977 978 979 980 981 982 983

		if (hpet_legacy_int_enabled) {
			cfg &= ~HPET_CFG_LEGACY;
			hpet_legacy_int_enabled = 0;
		}
		cfg &= ~HPET_CFG_ENABLE;
		hpet_writel(cfg, HPET_CFG);
	}
}

984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001
#ifdef CONFIG_HPET_EMULATE_RTC

/* HPET in LegacyReplacement Mode takes over the RTC interrupt line. When
 * HPET is enabled, we support RTC interrupt functionality in software.
 * RTC has 3 kinds of interrupts:
 * 1) Update Interrupt - generate an interrupt, every sec, when RTC clock
 *    is updated
 * 2) Alarm Interrupt - generate an interrupt at a specific time of day
 * 3) Periodic Interrupt - generate periodic interrupt, with frequencies
 *    2Hz-8192Hz (2Hz-64Hz for non-root user) (all freqs in powers of 2)
 * (1) and (2) above are implemented using polling at a frequency of
 * 64 Hz. The exact frequency is a tradeoff between accuracy and interrupt
 * overhead. (DEFAULT_RTC_INT_FREQ)
 * For (3), we use interrupts at 64Hz or user specified periodic
 * frequency, whichever is higher.
 */
#include <linux/mc146818rtc.h>
#include <linux/rtc.h>
1002
#include <asm/rtc.h>
1003 1004 1005 1006 1007 1008

#define DEFAULT_RTC_INT_FREQ	64
#define DEFAULT_RTC_SHIFT	6
#define RTC_NUM_INTS		1

static unsigned long hpet_rtc_flags;
D
David Brownell 已提交
1009
static int hpet_prev_update_sec;
1010 1011
static struct rtc_time hpet_alarm_time;
static unsigned long hpet_pie_count;
1012
static u32 hpet_t1_cmp;
J
Jan Beulich 已提交
1013 1014
static u32 hpet_default_delta;
static u32 hpet_pie_delta;
1015 1016
static unsigned long hpet_pie_limit;

1017 1018
static rtc_irq_handler irq_handler;

1019 1020 1021 1022 1023 1024 1025 1026
/*
 * Check that the hpet counter c1 is ahead of the c2
 *
 * The comparison uses the signed 32-bit difference, so it stays correct
 * when the counter wraps around.
 */
static inline int hpet_cnt_ahead(u32 c1, u32 c2)
{
	s32 distance = (s32)(c2 - c1);

	return distance < 0;
}

1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056
/*
 * Registers an IRQ handler.
 *
 * Returns 0 on success, -ENODEV when the HPET is not enabled and -EBUSY
 * when a handler is already registered.
 */
int hpet_register_irq_handler(rtc_irq_handler handler)
{
	int ret = 0;

	if (!is_hpet_enabled())
		ret = -ENODEV;
	else if (irq_handler)
		ret = -EBUSY;
	else
		irq_handler = handler;

	return ret;
}
EXPORT_SYMBOL_GPL(hpet_register_irq_handler);

/*
 * Deregisters the IRQ handler registered with hpet_register_irq_handler()
 * and does cleanup.
 *
 * @handler is not compared against the registered handler; whatever is
 * registered gets removed and the emulated RTC flags are cleared.
 */
void hpet_unregister_irq_handler(rtc_irq_handler handler)
{
	if (is_hpet_enabled()) {
		irq_handler = NULL;
		hpet_rtc_flags = 0;
	}
}
EXPORT_SYMBOL_GPL(hpet_unregister_irq_handler);

1057 1058 1059 1060 1061 1062 1063 1064
/*
 * Timer 1 for RTC emulation. We use one shot mode, as periodic mode
 * is not supported by all HPET implementations for timer 1.
 *
 * hpet_rtc_timer_init() is called when the rtc is initialized.
 *
 * Returns 0 when the HPET is not enabled, 1 after timer 1 was armed.
 */
int hpet_rtc_timer_init(void)
{
	unsigned int conf, target, step;
	unsigned long irqflags;

	if (!is_hpet_enabled())
		return 0;

	/* Compute the default interval (1/64 s in HPET ticks) once. */
	if (!hpet_default_delta) {
		uint64_t ticks;

		ticks = (uint64_t) hpet_clockevent.mult * NSEC_PER_SEC;
		ticks >>= hpet_clockevent.shift + DEFAULT_RTC_SHIFT;
		hpet_default_delta = ticks;
	}

	/* The fast periodic interval only applies to PIE above 64 Hz. */
	if ((hpet_rtc_flags & RTC_PIE) && !hpet_pie_limit)
		step = hpet_pie_delta;
	else
		step = hpet_default_delta;

	local_irq_save(irqflags);

	target = step + hpet_readl(HPET_COUNTER);
	hpet_writel(target, HPET_T1_CMP);
	hpet_t1_cmp = target;

	conf = hpet_readl(HPET_T1_CFG);
	conf &= ~HPET_TN_PERIODIC;
	conf |= HPET_TN_ENABLE | HPET_TN_32BIT;
	hpet_writel(conf, HPET_T1_CFG);

	local_irq_restore(irqflags);

	return 1;
}
1099
EXPORT_SYMBOL_GPL(hpet_rtc_timer_init);
1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113

/*
 * The functions below are called from rtc driver.
 * Return 0 if HPET is not being used.
 * Otherwise do the necessary changes and return 1.
 */
int hpet_mask_rtc_irq_bit(unsigned long bit_mask)
{
	if (!is_hpet_enabled())
		return 0;

	hpet_rtc_flags &= ~bit_mask;
	return 1;
}
1114
EXPORT_SYMBOL_GPL(hpet_mask_rtc_irq_bit);
1115 1116 1117 1118 1119 1120 1121 1122 1123 1124

int hpet_set_rtc_irq_bit(unsigned long bit_mask)
{
	unsigned long oldbits = hpet_rtc_flags;

	if (!is_hpet_enabled())
		return 0;

	hpet_rtc_flags |= bit_mask;

D
David Brownell 已提交
1125 1126 1127
	if ((bit_mask & RTC_UIE) && !(oldbits & RTC_UIE))
		hpet_prev_update_sec = -1;

1128 1129 1130 1131 1132
	if (!oldbits)
		hpet_rtc_timer_init();

	return 1;
}
1133
EXPORT_SYMBOL_GPL(hpet_set_rtc_irq_bit);
1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146

int hpet_set_alarm_time(unsigned char hrs, unsigned char min,
			unsigned char sec)
{
	if (!is_hpet_enabled())
		return 0;

	hpet_alarm_time.tm_hour = hrs;
	hpet_alarm_time.tm_min = min;
	hpet_alarm_time.tm_sec = sec;

	return 1;
}
1147
EXPORT_SYMBOL_GPL(hpet_set_alarm_time);
1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161

int hpet_set_periodic_freq(unsigned long freq)
{
	uint64_t clc;

	if (!is_hpet_enabled())
		return 0;

	if (freq <= DEFAULT_RTC_INT_FREQ)
		hpet_pie_limit = DEFAULT_RTC_INT_FREQ / freq;
	else {
		clc = (uint64_t) hpet_clockevent.mult * NSEC_PER_SEC;
		do_div(clc, freq);
		clc >>= hpet_clockevent.shift;
J
Jan Beulich 已提交
1162
		hpet_pie_delta = clc;
1163
		hpet_pie_limit = 0;
1164 1165 1166
	}
	return 1;
}
1167
EXPORT_SYMBOL_GPL(hpet_set_periodic_freq);
1168 1169 1170 1171 1172

/* Returns non-zero when the HPET is enabled, 0 otherwise. */
int hpet_rtc_dropped_irq(void)
{
	return is_hpet_enabled();
}
1173
EXPORT_SYMBOL_GPL(hpet_rtc_dropped_irq);
1174 1175 1176

static void hpet_rtc_timer_reinit(void)
{
J
Jan Beulich 已提交
1177
	unsigned int cfg, delta;
1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199
	int lost_ints = -1;

	if (unlikely(!hpet_rtc_flags)) {
		cfg = hpet_readl(HPET_T1_CFG);
		cfg &= ~HPET_TN_ENABLE;
		hpet_writel(cfg, HPET_T1_CFG);
		return;
	}

	if (!(hpet_rtc_flags & RTC_PIE) || hpet_pie_limit)
		delta = hpet_default_delta;
	else
		delta = hpet_pie_delta;

	/*
	 * Increment the comparator value until we are ahead of the
	 * current count.
	 */
	do {
		hpet_t1_cmp += delta;
		hpet_writel(hpet_t1_cmp, HPET_T1_CMP);
		lost_ints++;
1200
	} while (!hpet_cnt_ahead(hpet_t1_cmp, hpet_readl(HPET_COUNTER)));
1201 1202 1203 1204 1205

	if (lost_ints) {
		if (hpet_rtc_flags & RTC_PIE)
			hpet_pie_count += lost_ints;
		if (printk_ratelimit())
D
David Brownell 已提交
1206
			printk(KERN_WARNING "hpet1: lost %d rtc interrupts\n",
1207 1208 1209 1210 1211 1212 1213 1214 1215 1216
				lost_ints);
	}
}

irqreturn_t hpet_rtc_interrupt(int irq, void *dev_id)
{
	struct rtc_time curr_time;
	unsigned long rtc_int_flag = 0;

	hpet_rtc_timer_reinit();
1217
	memset(&curr_time, 0, sizeof(struct rtc_time));
1218 1219

	if (hpet_rtc_flags & (RTC_UIE | RTC_AIE))
1220
		get_rtc_time(&curr_time);
1221 1222 1223

	if (hpet_rtc_flags & RTC_UIE &&
	    curr_time.tm_sec != hpet_prev_update_sec) {
D
David Brownell 已提交
1224 1225
		if (hpet_prev_update_sec >= 0)
			rtc_int_flag = RTC_UF;
1226 1227 1228 1229 1230 1231 1232 1233 1234
		hpet_prev_update_sec = curr_time.tm_sec;
	}

	if (hpet_rtc_flags & RTC_PIE &&
	    ++hpet_pie_count >= hpet_pie_limit) {
		rtc_int_flag |= RTC_PF;
		hpet_pie_count = 0;
	}

1235
	if (hpet_rtc_flags & RTC_AIE &&
1236 1237 1238 1239 1240 1241 1242
	    (curr_time.tm_sec == hpet_alarm_time.tm_sec) &&
	    (curr_time.tm_min == hpet_alarm_time.tm_min) &&
	    (curr_time.tm_hour == hpet_alarm_time.tm_hour))
			rtc_int_flag |= RTC_AF;

	if (rtc_int_flag) {
		rtc_int_flag |= (RTC_IRQF | (RTC_NUM_INTS << 8));
1243 1244
		if (irq_handler)
			irq_handler(rtc_int_flag, dev_id);
1245 1246 1247
	}
	return IRQ_HANDLED;
}
1248
EXPORT_SYMBOL_GPL(hpet_rtc_interrupt);
1249
#endif