enlighten.c 11.4 KB
Newer Older
1
// SPDX-License-Identifier: GPL-2.0-only
S
Stefano Stabellini 已提交
2
#include <xen/xen.h>
3
#include <xen/events.h>
4 5
#include <xen/grant_table.h>
#include <xen/hvm.h>
S
Stefano Stabellini 已提交
6
#include <xen/interface/vcpu.h>
S
Stefano Stabellini 已提交
7 8
#include <xen/interface/xen.h>
#include <xen/interface/memory.h>
9
#include <xen/interface/hvm/params.h>
10
#include <xen/features.h>
S
Stefano Stabellini 已提交
11
#include <xen/platform_pci.h>
12
#include <xen/xenbus.h>
I
Ian Campbell 已提交
13
#include <xen/page.h>
14
#include <xen/interface/sched.h>
15
#include <xen/xen-ops.h>
S
Stefano Stabellini 已提交
16 17
#include <asm/xen/hypervisor.h>
#include <asm/xen/hypercall.h>
18
#include <asm/system_misc.h>
19
#include <asm/efi.h>
20 21
#include <linux/interrupt.h>
#include <linux/irqreturn.h>
S
Stefano Stabellini 已提交
22
#include <linux/module.h>
23
#include <linux/of.h>
24
#include <linux/of_fdt.h>
25 26
#include <linux/of_irq.h>
#include <linux/of_address.h>
27 28
#include <linux/cpuidle.h>
#include <linux/cpufreq.h>
29
#include <linux/cpu.h>
30
#include <linux/console.h>
31 32
#include <linux/pvclock_gtod.h>
#include <linux/time64.h>
33
#include <linux/timekeeping.h>
34
#include <linux/timekeeper_internal.h>
35
#include <linux/acpi.h>
S
Stefano Stabellini 已提交
36

37 38
#include <linux/mm.h>

J
Jason Yan 已提交
39
static struct start_info _xen_start_info;
S
Stefano Stabellini 已提交
40
struct start_info *xen_start_info = &_xen_start_info;
41
EXPORT_SYMBOL(xen_start_info);
S
Stefano Stabellini 已提交
42 43

enum xen_domain_type xen_domain_type = XEN_NATIVE;
44
EXPORT_SYMBOL(xen_domain_type);
S
Stefano Stabellini 已提交
45 46 47 48 49

struct shared_info xen_dummy_shared_info;
struct shared_info *HYPERVISOR_shared_info = (void *)&xen_dummy_shared_info;

DEFINE_PER_CPU(struct vcpu_info *, xen_vcpu);
S
Stefano Stabellini 已提交
50
static struct vcpu_info __percpu *xen_vcpu_info;
S
Stefano Stabellini 已提交
51

52
/* Linux <-> Xen vCPU id mapping */
53
DEFINE_PER_CPU(uint32_t, xen_vcpu_id);
54 55
EXPORT_PER_CPU_SYMBOL(xen_vcpu_id);

I
Ian Campbell 已提交
56 57 58 59
/* These are unused until we support booting "pre-ballooned" */
unsigned long xen_released_pages;
struct xen_memory_region xen_extra_mem[XEN_EXTRA_MEM_MAX_REGIONS] __initdata;

60
static __read_mostly unsigned int xen_events_irq;
61

62 63 64
uint32_t xen_start_flags;
EXPORT_SYMBOL(xen_start_flags);

65
/*
 * Forward an unmap request for @nr pages of @vma to
 * xen_xlate_unmap_gfn_range() and hand its result back unchanged.
 */
int xen_unmap_domain_gfn_range(struct vm_area_struct *vma,
			       int nr, struct page **pages)
{
	int rc = xen_xlate_unmap_gfn_range(vma, nr, pages);

	return rc;
}
70
EXPORT_SYMBOL_GPL(xen_unmap_domain_gfn_range);
71

72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92
/*
 * Compute the current wall-clock time from the wall clock record in the
 * Xen shared info page.
 *
 * @ts: output; receives the wall clock value read from the shared info
 *      page plus the current monotonic time.
 */
static void xen_read_wallclock(struct timespec64 *ts)
{
	u32 version;
	struct timespec64 now, ts_monotonic;
	struct shared_info *s = HYPERVISOR_shared_info;
	struct pvclock_wall_clock *wall_clock = &(s->wc);

	/*
	 * get wallclock at system boot
	 *
	 * The read is retried while the version is odd or differs from the
	 * value sampled before the fields were read (presumably an odd
	 * version marks an update in progress - confirm against the pvclock
	 * ABI).
	 */
	do {
		version = wall_clock->version;
		rmb();		/* fetch version before time */
		/* Seconds are split across two fields: high part and low part. */
		now.tv_sec  = ((uint64_t)wall_clock->sec_hi << 32) | wall_clock->sec;
		now.tv_nsec = wall_clock->nsec;
		rmb();		/* fetch time before checking version */
	} while ((wall_clock->version & 1) || (version != wall_clock->version));

	/* time since system boot */
	ktime_get_ts64(&ts_monotonic);
	*ts = timespec64_add(now, ts_monotonic);
}

93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135
static int xen_pvclock_gtod_notify(struct notifier_block *nb,
				   unsigned long was_set, void *priv)
{
	/* Protected by the calling core code serialization */
	static struct timespec64 next_sync;

	struct xen_platform_op op;
	struct timespec64 now, system_time;
	struct timekeeper *tk = priv;

	now.tv_sec = tk->xtime_sec;
	now.tv_nsec = (long)(tk->tkr_mono.xtime_nsec >> tk->tkr_mono.shift);
	system_time = timespec64_add(now, tk->wall_to_monotonic);

	/*
	 * We only take the expensive HV call when the clock was set
	 * or when the 11 minutes RTC synchronization time elapsed.
	 */
	if (!was_set && timespec64_compare(&now, &next_sync) < 0)
		return NOTIFY_OK;

	op.cmd = XENPF_settime64;
	op.u.settime64.mbz = 0;
	op.u.settime64.secs = now.tv_sec;
	op.u.settime64.nsecs = now.tv_nsec;
	op.u.settime64.system_time = timespec64_to_ns(&system_time);
	(void)HYPERVISOR_platform_op(&op);

	/*
	 * Move the next drift compensation time 11 minutes
	 * ahead. That's emulating the sync_cmos_clock() update for
	 * the hardware RTC.
	 */
	next_sync = now;
	next_sync.tv_sec += 11 * 60;

	return NOTIFY_OK;
}

/*
 * Notifier block wrapping xen_pvclock_gtod_notify(); xen_guest_init()
 * registers it with pvclock_gtod_register_notifier() when running as the
 * initial domain.
 */
static struct notifier_block xen_pvclock_gtod_notifier = {
	.notifier_call = xen_pvclock_gtod_notify,
};

136
static int xen_starting_cpu(unsigned int cpu)
S
Stefano Stabellini 已提交
137 138 139 140 141
{
	struct vcpu_register_vcpu_info info;
	struct vcpu_info *vcpup;
	int err;

142 143 144 145 146 147 148 149
	/* 
	 * VCPUOP_register_vcpu_info cannot be called twice for the same
	 * vcpu, so if vcpu_info is already registered, just get out. This
	 * can happen with cpu-hotplug.
	 */
	if (per_cpu(xen_vcpu, cpu) != NULL)
		goto after_register_vcpu_info;

S
Stefano Stabellini 已提交
150 151 152
	pr_info("Xen: initializing cpu%d\n", cpu);
	vcpup = per_cpu_ptr(xen_vcpu_info, cpu);

153 154
	info.mfn = virt_to_gfn(vcpup);
	info.offset = xen_offset_in_page(vcpup);
S
Stefano Stabellini 已提交
155

156 157
	err = HYPERVISOR_vcpu_op(VCPUOP_register_vcpu_info, xen_vcpu_nr(cpu),
				 &info);
158 159 160
	BUG_ON(err);
	per_cpu(xen_vcpu, cpu) = vcpup;

161 162
	if (!xen_kernel_unmapped_at_usr())
		xen_setup_runstate_info(cpu);
163

164
after_register_vcpu_info:
165
	enable_percpu_irq(xen_events_irq, 0);
166 167 168 169 170 171 172
	return 0;
}

/*
 * CPU hotplug teardown counterpart of xen_starting_cpu(): disables the
 * per-cpu Xen event IRQ. Always returns 0.
 */
static int xen_dying_cpu(unsigned int cpu)
{
	disable_percpu_irq(xen_events_irq);

	return 0;
}

175
void xen_reboot(int reason)
176
{
177
	struct sched_shutdown r = { .reason = reason };
178
	int rc;
179

180
	rc = HYPERVISOR_sched_op(SCHEDOP_shutdown, &r);
H
Himangi Saraogi 已提交
181
	BUG_ON(rc);
182 183
}

184 185 186 187 188 189
/*
 * Restart hook (installed as arm_pm_restart by xen_pm_init()): requests a
 * reboot from Xen. Both @reboot_mode and @cmd are ignored.
 */
static void xen_restart(enum reboot_mode reboot_mode, const char *cmd)
{
	const int reason = SHUTDOWN_reboot;

	xen_reboot(reason);
}


190 191
static void xen_power_off(void)
{
192
	xen_reboot(SHUTDOWN_poweroff);
193 194
}

195 196 197 198 199 200
/*
 * Handler for the per-cpu Xen event IRQ (requested in xen_guest_init()):
 * runs the event channel upcall. @irq and @arg are unused.
 */
static irqreturn_t xen_arm_callback(int irq, void *arg)
{
	xen_hvm_evtchn_do_upcall();

	return IRQ_HANDLED;
}

201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224
/*
 * State collected by fdt_find_hyper_node() while scanning the flat device
 * tree for the hypervisor node.
 */
static __initdata struct {
	const char *compat;	/* compatible string identifying Xen */
	const char *prefix;	/* prefix preceding the version string */
	const char *version;	/* points past the prefix once found */
	bool found;		/* set when a compatible node was seen */
} hyper_node = {
	.compat  = "xen,xen",
	.prefix  = "xen,xen-",
	.version = NULL,
	.found   = false,
};

/*
 * of_scan_flat_dt() callback that looks for the depth-1 "hypervisor" node.
 *
 * @node:  offset of the node being visited.
 * @uname: name of the node being visited.
 * @depth: depth of the node in the tree.
 * @data:  unused.
 *
 * Records in hyper_node whether the node is Xen-compatible and, if its
 * "compatible" property starts with the expected prefix, where the
 * version string begins. Always returns 0.
 */
static int __init fdt_find_hyper_node(unsigned long node, const char *uname,
				      int depth, void *data)
{
	const size_t prefix_len = strlen(hyper_node.prefix);
	const char *s;
	int len = 0;

	if (depth != 1 || strcmp(uname, "hypervisor") != 0)
		return 0;

	if (of_flat_dt_is_compatible(node, hyper_node.compat))
		hyper_node.found = true;

	/*
	 * A missing "compatible" property yields a NULL pointer and a
	 * negative length. Reject both explicitly: comparing the negative
	 * length against a size_t would convert it to a huge unsigned value
	 * and let a NULL pointer reach strncmp().
	 */
	s = of_get_flat_dt_prop(node, "compatible", &len);
	if (s && len > 0 && prefix_len + 3 < (size_t)len &&
	    !strncmp(hyper_node.prefix, s, prefix_len))
		hyper_node.version = s + prefix_len;

	/*
	 * Check if Xen supports EFI by checking whether there is the
	 * "/hypervisor/uefi" node in DT. If so, runtime services are available
	 * through proxy functions (e.g. in case of Xen dom0 EFI implementation
	 * they call special hypercall which executes relevant EFI functions)
	 * and that is why they are always enabled.
	 */
	if (IS_ENABLED(CONFIG_XEN_EFI)) {
		if ((of_get_flat_dt_subnode_by_name(node, "uefi") > 0) &&
		    !efi_runtime_disabled())
			set_bit(EFI_RUNTIME_SERVICES, &efi.flags);
	}

	return 0;
}

241 242 243 244
/*
 * See Documentation/devicetree/bindings/arm/xen.txt for a description
 * of the Xen Device Tree format.
 */
245
/*
 * Early Xen detection: scans the flat device tree for the hypervisor node
 * and, when a Xen node with a version string is present, marks the kernel
 * as running in a Xen HVM domain, sets up the feature flags and start
 * flags, and selects the "hvc" console for non-initial domains unless a
 * console was given on the command line.
 */
void __init xen_early_init(void)
{
	of_scan_flat_dt(fdt_find_hyper_node, NULL);

	if (!hyper_node.found) {
		pr_debug("No Xen support\n");
		return;
	}
	if (!hyper_node.version) {
		pr_debug("Xen version not found\n");
		return;
	}

	pr_info("Xen %s support found\n", hyper_node.version);

	xen_domain_type = XEN_HVM_DOMAIN;
	xen_setup_features();

	if (xen_feature(XENFEAT_dom0))
		xen_start_flags |= SIF_INITDOMAIN | SIF_PRIVILEGED;

	/* Only pick a default console when none was requested explicitly. */
	if (!(console_set_on_cmdline || xen_initial_domain()))
		add_preferred_console("hvc", 0, NULL);
}

271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296
/*
 * Discover the Xen event channel interrupt on ACPI systems.
 *
 * Reads HVM_PARAM_CALLBACK_IRQ from the hypervisor and decodes it as used
 * below: bits 63:56 hold the callback type (must be PPI), bits 7:0 the
 * interrupt number, bit 8 selects edge (set) vs level triggering and
 * bit 9 selects active-low (set) vs active-high polarity.
 *
 * On any failure xen_events_irq is left at 0 so that the caller's
 * "interrupt not found" check fires. Does nothing without CONFIG_ACPI.
 */
static void __init xen_acpi_guest_init(void)
{
#ifdef CONFIG_ACPI
	struct xen_hvm_param a;
	int interrupt, trigger, polarity;
	int irq;

	a.domid = DOMID_SELF;
	a.index = HVM_PARAM_CALLBACK_IRQ;

	if (HYPERVISOR_hvm_op(HVMOP_get_param, &a)
	    || (a.value >> 56) != HVM_PARAM_CALLBACK_TYPE_PPI) {
		xen_events_irq = 0;
		return;
	}

	interrupt = a.value & 0xff;
	trigger = ((a.value >> 8) & 0x1) ? ACPI_EDGE_SENSITIVE
					 : ACPI_LEVEL_SENSITIVE;
	polarity = ((a.value >> 8) & 0x2) ? ACPI_ACTIVE_LOW
					  : ACPI_ACTIVE_HIGH;

	/*
	 * acpi_register_gsi() reports failure with a negative errno. Do not
	 * store that in the unsigned xen_events_irq, where it would look
	 * like a valid (non-zero) interrupt number.
	 */
	irq = acpi_register_gsi(NULL, interrupt, trigger, polarity);
	xen_events_irq = irq > 0 ? irq : 0;
#endif
}

/*
 * Discover the Xen event channel interrupt on device tree systems by
 * mapping interrupt 0 of the "xen,xen" compatible node into
 * xen_events_irq. Logs an error and leaves xen_events_irq untouched if
 * the node cannot be found.
 */
static void __init xen_dt_guest_init(void)
{
	struct device_node *xen_node;

	xen_node = of_find_compatible_node(NULL, NULL, "xen,xen");
	if (!xen_node) {
		pr_err("Xen support was detected before, but it has disappeared\n");
		return;
	}

	xen_events_irq = irq_of_parse_and_map(xen_node, 0);

	/* Drop the reference taken by of_find_compatible_node(). */
	of_node_put(xen_node);
}

308 309 310 311
/*
 * Early initcall that brings up the Xen guest infrastructure: locates the
 * event channel interrupt, maps the shared info page, allocates the
 * per-cpu vcpu_info areas, sets up grant tables, xenbus (non-initial
 * domains), the event IRQ and time handling, and finally installs the CPU
 * hotplug callbacks.
 *
 * Returns 0 when not running on Xen, a negative errno on failure, or the
 * result of cpuhp_setup_state() otherwise.
 */
static int __init xen_guest_init(void)
{
	struct xen_add_to_physmap xatp;
	struct shared_info *shared_info_page = NULL;
	int cpu;
	int rc;

	if (!xen_domain())
		return 0;

	if (!acpi_disabled)
		xen_acpi_guest_init();
	else
		xen_dt_guest_init();

	if (!xen_events_irq) {
		pr_err("Xen event channel interrupt not found\n");
		return -ENODEV;
	}

	/*
	 * The fdt parsing codes have set EFI_RUNTIME_SERVICES if Xen EFI
	 * parameters are found. Force enable runtime services.
	 */
	if (efi_enabled(EFI_RUNTIME_SERVICES))
		xen_efi_runtime_setup();

	shared_info_page = (struct shared_info *)get_zeroed_page(GFP_KERNEL);

	if (!shared_info_page) {
		pr_err("not enough memory\n");
		return -ENOMEM;
	}
	xatp.domid = DOMID_SELF;
	xatp.idx = 0;
	xatp.space = XENMAPSPACE_shared_info;
	xatp.gpfn = virt_to_gfn(shared_info_page);
	if (HYPERVISOR_memory_op(XENMEM_add_to_physmap, &xatp))
		BUG();

	HYPERVISOR_shared_info = (struct shared_info *)shared_info_page;

	/* xen_vcpu is a pointer to the vcpu_info struct in the shared_info
	 * page, we use it in the event channel upcall and in some pvclock
	 * related functions.
	 * The shared info contains exactly 1 CPU (the boot CPU). The guest
	 * is required to use VCPUOP_register_vcpu_info to place vcpu info
	 * for secondary CPUs as they are brought up.
	 * For uniformity we use VCPUOP_register_vcpu_info even on cpu0.
	 */
	xen_vcpu_info = alloc_percpu(struct vcpu_info);
	if (xen_vcpu_info == NULL)
		return -ENOMEM;

	/* Direct vCPU id mapping for ARM guests. */
	for_each_possible_cpu(cpu)
		per_cpu(xen_vcpu_id, cpu) = cpu;

	xen_auto_xlat_grant_frames.count = gnttab_max_grant_frames();
	if (xen_xlate_map_ballooned_pages(&xen_auto_xlat_grant_frames.pfn,
					  &xen_auto_xlat_grant_frames.vaddr,
					  xen_auto_xlat_grant_frames.count)) {
		free_percpu(xen_vcpu_info);
		return -ENOMEM;
	}
	gnttab_init();
	if (!xen_initial_domain())
		xenbus_probe(NULL);

	/*
	 * Making sure board specific code will not set up ops for
	 * cpu idle and cpu freq.
	 */
	disable_cpuidle();
	disable_cpufreq();

	xen_init_IRQ();

	/*
	 * Report the real failure reason instead of a blanket -EINVAL;
	 * xen_events_irq is unsigned, hence %u.
	 */
	rc = request_percpu_irq(xen_events_irq, xen_arm_callback,
				"events", &xen_vcpu);
	if (rc) {
		pr_err("Error request IRQ %u\n", xen_events_irq);
		return rc;
	}

	if (!xen_kernel_unmapped_at_usr())
		xen_time_setup_guest();

	if (xen_initial_domain())
		pvclock_gtod_register_notifier(&xen_pvclock_gtod_notifier);

	return cpuhp_setup_state(CPUHP_AP_ARM_XEN_STARTING,
				 "arm/xen:starting", xen_starting_cpu,
				 xen_dying_cpu);
}
401
early_initcall(xen_guest_init);
402 403 404

/*
 * Late initcall that installs the Xen power-off and restart hooks and,
 * for non-initial domains, sets the system time from the Xen wall clock.
 *
 * Returns -ENODEV when not running on Xen, 0 otherwise.
 */
static int __init xen_pm_init(void)
{
	struct timespec64 wallclock;

	if (!xen_domain())
		return -ENODEV;

	pm_power_off = xen_power_off;
	arm_pm_restart = xen_restart;

	/* The initial domain does not take its time from the Xen wall clock here. */
	if (xen_initial_domain())
		return 0;

	xen_read_wallclock(&wallclock);
	do_settimeofday64(&wallclock);

	return 0;
}
418
late_initcall(xen_pm_init);
419

420 421 422 423 424 425

/* empty stubs */
/* Suspend/resume hooks: intentionally left without any work to do here. */
void xen_arch_pre_suspend(void)
{
}

void xen_arch_post_suspend(int suspend_cancelled)
{
}

void xen_timer_resume(void)
{
}

void xen_arch_resume(void)
{
}

void xen_arch_suspend(void)
{
}
427 428


429
/* In the hypercall.S file. */
430 431
EXPORT_SYMBOL_GPL(HYPERVISOR_event_channel_op);
EXPORT_SYMBOL_GPL(HYPERVISOR_grant_table_op);
432 433 434 435 436 437
EXPORT_SYMBOL_GPL(HYPERVISOR_xen_version);
EXPORT_SYMBOL_GPL(HYPERVISOR_console_io);
EXPORT_SYMBOL_GPL(HYPERVISOR_sched_op);
EXPORT_SYMBOL_GPL(HYPERVISOR_hvm_op);
EXPORT_SYMBOL_GPL(HYPERVISOR_memory_op);
EXPORT_SYMBOL_GPL(HYPERVISOR_physdev_op);
438
EXPORT_SYMBOL_GPL(HYPERVISOR_vcpu_op);
439
EXPORT_SYMBOL_GPL(HYPERVISOR_tmem_op);
440
EXPORT_SYMBOL_GPL(HYPERVISOR_platform_op_raw);
441
EXPORT_SYMBOL_GPL(HYPERVISOR_multicall);
442
EXPORT_SYMBOL_GPL(HYPERVISOR_vm_assist);
443
EXPORT_SYMBOL_GPL(HYPERVISOR_dm_op);
444
EXPORT_SYMBOL_GPL(privcmd_call);