enlighten_hvm.c 6.2 KB
Newer Older
1 2
// SPDX-License-Identifier: GPL-2.0

3
#include <linux/acpi.h>
4 5
#include <linux/cpu.h>
#include <linux/kexec.h>
6
#include <linux/memblock.h>
7 8 9 10 11 12 13 14 15 16

#include <xen/features.h>
#include <xen/events.h>
#include <xen/interface/memory.h>

#include <asm/cpu.h>
#include <asm/smp.h>
#include <asm/reboot.h>
#include <asm/setup.h>
#include <asm/hypervisor.h>
17
#include <asm/e820/api.h>
18
#include <asm/early_ioremap.h>
19 20 21

#include <asm/xen/cpuid.h>
#include <asm/xen/hypervisor.h>
22
#include <asm/xen/page.h>
23 24 25 26 27

#include "xen-ops.h"
#include "mmu.h"
#include "smp.h"

28 29
/*
 * Guest frame number selected for the shared_info page.  It is written by
 * reserve_shared_info(), passed as the gpfn of the XENMEM_add_to_physmap
 * request, and later used to derive the page's __va() address.
 */
static unsigned long shared_info_pfn;

30
void xen_hvm_init_shared_info(void)
31 32 33 34 35 36
{
	struct xen_add_to_physmap xatp;

	xatp.domid = DOMID_SELF;
	xatp.idx = 0;
	xatp.space = XENMAPSPACE_shared_info;
37
	xatp.gpfn = shared_info_pfn;
38 39 40 41
	if (HYPERVISOR_memory_op(XENMEM_add_to_physmap, &xatp))
		BUG();
}

42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59
/*
 * Choose a guest physical page for shared_info, record its frame number
 * in shared_info_pfn, reserve it in memblock and set up an early mapping
 * of it in HYPERVISOR_shared_info.
 */
static void __init reserve_shared_info(void)
{
	u64 pa = PAGE_SIZE;

	/*
	 * Walk upwards page by page, beginning at the 4kB physical address,
	 * until a page is found that is entirely RAM and not yet reserved.
	 * Low memory is preferred to avoid an EPT large page split up by
	 * the mapping.
	 * Starting below X86_RESERVE_LOW (usually 64kB) is fine as the BIOS
	 * used for HVM guests is well behaved and won't clobber memory
	 * other than the first 4kB.
	 */
	for (;;) {
		if (e820__mapped_all(pa, pa + PAGE_SIZE, E820_TYPE_RAM) &&
		    !memblock_is_reserved(pa))
			break;

		pa += PAGE_SIZE;
	}

	shared_info_pfn = PHYS_PFN(pa);

	memblock_reserve(pa, PAGE_SIZE);
	HYPERVISOR_shared_info = early_memremap(pa, PAGE_SIZE);
}

/*
 * Replace the early mapping of the shared_info page with its __va()
 * address and reset the vcpu_info pointer of VCPU 0 to match.
 */
static void __init xen_hvm_init_mem_mapping(void)
{
	phys_addr_t shinfo_pa = PFN_PHYS(shared_info_pfn);

	/* Tear down the early mapping before switching to the new address. */
	early_memunmap(HYPERVISOR_shared_info, PAGE_SIZE);
	HYPERVISOR_shared_info = __va(shinfo_pa);

	/*
	 * shared_info now lives at a different virtual address, which
	 * leaves the vcpu_info pointer for VCPU 0 stale.
	 *
	 * The prepare_boot_cpu callback re-initializes it through
	 * xen_vcpu_setup, but that callback cannot be relied upon for
	 * old Xen versions (xen_have_vector_callback == 0).
	 *
	 * A stale vcpu_info pointer is bad in any case, so reset it
	 * right away.
	 */
	xen_vcpu_info_reset(0);
}

85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137
/*
 * Read the Xen CPUID leaves to report the hypervisor version, mark the
 * domain as HVM, install the hypercall page for non-PVH guests, set up
 * the feature flags and record the vcpu id of the current CPU.
 */
static void __init init_hvm_pv_info(void)
{
	uint32_t base = xen_cpuid_base();
	uint32_t eax, ebx, ecx, edx;
	uint32_t id;
	int major, minor;

	/* Leaf base + 1: version, major in the upper and minor in the lower 16 bits. */
	eax = cpuid_eax(base + 1);
	minor = eax & 0xffff;
	major = eax >> 16;
	printk(KERN_INFO "Xen version %d.%d.\n", major, minor);

	xen_domain_type = XEN_HVM_DOMAIN;

	if (!xen_pvh_domain()) {
		uint32_t msr;
		u64 pa;

		pv_info.name = "Xen HVM";

		/*
		 * Leaf base + 2 supplies in EBX the MSR through which the
		 * physical address of the hypercall page is written.
		 */
		msr = cpuid_ebx(base + 2);
		pa = __pa(hypercall_page);
		wrmsr_safe(msr, (u32)pa, (u32)(pa >> 32));
	} else {
		/* PVH set up hypercall page in xen_prepare_pvh(). */
		pv_info.name = "Xen PVH";
	}

	xen_setup_features();

	/* Use the vcpu id from leaf base + 4 if present, else the CPU number. */
	cpuid(base + 4, &eax, &ebx, &ecx, &edx);
	if (eax & XEN_HVM_CPUID_VCPU_ID_PRESENT)
		id = ebx;
	else
		id = smp_processor_id();
	this_cpu_write(xen_vcpu_id, id);
}

#ifdef CONFIG_KEXEC_CORE
/*
 * machine_ops.shutdown hook: perform the native shutdown and, only when
 * a kexec is in progress, additionally request SHUTDOWN_soft_reset
 * through xen_reboot().
 */
static void xen_hvm_shutdown(void)
{
	native_machine_shutdown();

	if (!kexec_in_progress)
		return;

	xen_reboot(SHUTDOWN_soft_reset);
}

/*
 * machine_ops.crash_shutdown hook: run the native crash shutdown with the
 * supplied register state, then unconditionally request
 * SHUTDOWN_soft_reset through xen_reboot().
 */
static void xen_hvm_crash_shutdown(struct pt_regs *regs)
{
	native_machine_crash_shutdown(regs);
	xen_reboot(SHUTDOWN_soft_reset);
}
#endif

static int xen_cpu_up_prepare_hvm(unsigned int cpu)
{
138
	int rc = 0;
139 140 141 142 143 144 145 146 147 148 149 150 151 152

	/*
	 * This can happen if CPU was offlined earlier and
	 * offlining timed out in common_cpu_die().
	 */
	if (cpu_report_state(cpu) == CPU_DEAD_FROZEN) {
		xen_smp_intr_free(cpu);
		xen_uninit_lock_cpu(cpu);
	}

	if (cpu_acpi_id(cpu) != U32_MAX)
		per_cpu(xen_vcpu_id, cpu) = cpu_acpi_id(cpu);
	else
		per_cpu(xen_vcpu_id, cpu) = cpu;
153 154 155
	rc = xen_vcpu_setup(cpu);
	if (rc)
		return rc;
156

157
	if (xen_have_vector_callback && xen_feature(XENFEAT_hvm_safe_pvclock))
158 159 160 161 162 163 164
		xen_setup_timer(cpu);

	rc = xen_smp_intr_init(cpu);
	if (rc) {
		WARN(1, "xen_smp_intr_init() for CPU %d failed: %d\n",
		     cpu, rc);
	}
165
	return rc;
166 167 168 169 170 171
}

static int xen_cpu_dead_hvm(unsigned int cpu)
{
	xen_smp_intr_free(cpu);

172
	if (xen_have_vector_callback && xen_feature(XENFEAT_hvm_safe_pvclock))
173 174 175 176 177 178 179 180 181 182 183 184
		xen_teardown_timer(cpu);

       return 0;
}

/*
 * Platform init hook for Xen HVM guests.  Does nothing on a PV domain;
 * otherwise performs the HVM-specific early setup.  The calls below are
 * kept in their established order.
 */
static void __init xen_hvm_guest_init(void)
{
	int cpuhp_rc;

	if (xen_pv_domain())
		return;

	init_hvm_pv_info();

	/* Pick and reserve the shared_info page, then have Xen map it. */
	reserve_shared_info();
	xen_hvm_init_shared_info();

	/*
	 * xen_vcpu points at the vcpu_info struct inside the shared_info
	 * page; the event channel upcall and some pvclock related
	 * functions rely on it.
	 */
	xen_vcpu_info_reset(0);

	xen_panic_handler_init();

	if (xen_feature(XENFEAT_hvm_callback_vector)) {
		xen_have_vector_callback = 1;
	}

	xen_hvm_smp_init();

	/* Register the CPU hotplug callbacks; failure only triggers a warning. */
	cpuhp_rc = xen_cpuhp_setup(xen_cpu_up_prepare_hvm, xen_cpu_dead_hvm);
	WARN_ON(cpuhp_rc);

	xen_unplug_emulated_devices();
	x86_init.irqs.intr_init = xen_init_IRQ;
	xen_hvm_init_time_ops();
	xen_hvm_init_mmu_ops();

#ifdef CONFIG_KEXEC_CORE
	machine_ops.shutdown = xen_hvm_shutdown;
	machine_ops.crash_shutdown = xen_hvm_crash_shutdown;
#endif
}

/*
 * Handler for the deprecated "xen_nopv" early parameter.
 *
 * Prints a deprecation notice and sets nopv, but only when
 * xen_cpuid_base() returns a non-zero value.  @arg is not used.
 * Always returns 0.
 */
static __init int xen_parse_nopv(char *arg)
{
	pr_notice("\"xen_nopv\" is deprecated, please use \"nopv\" instead\n");

	if (xen_cpuid_base() != 0) {
		nopv = true;
	}

	return 0;
}
early_param("xen_nopv", xen_parse_nopv);

223
/*
 * Report whether the guest needs the local APIC.
 *
 * Returns true only for an HVM (non-PV) domain, and then only unless
 * both XENFEAT_hvm_pirqs and the vector callback are available.
 */
bool __init xen_hvm_need_lapic(void)
{
	return !xen_pv_domain() &&
	       xen_hvm_domain() &&
	       !(xen_feature(XENFEAT_hvm_pirqs) && xen_have_vector_callback);
}

/*
 * Detection hook for the "Xen HVM" hypervisor entry: returns 0 on a PV
 * domain, otherwise whatever xen_cpuid_base() reports.
 */
static uint32_t __init xen_platform_hvm(void)
{
	return xen_pv_domain() ? 0 : xen_cpuid_base();
}

242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261
/*
 * Late guest init hook.  With CONFIG_XEN_PVH enabled it checks whether
 * the guest is PVH and, if so, applies the PVH-specific adjustments;
 * without that option it does nothing.
 */
static __init void xen_hvm_guest_late_init(void)
{
#ifdef CONFIG_XEN_PVH
	/*
	 * Test for PVH domain (PVH boot path taken overrides ACPI flags):
	 * either xen_pvh is already set, or the platform reports neither
	 * a legacy RTC nor VGA.
	 */
	if (xen_pvh ||
	    (!x86_platform.legacy.rtc && x86_platform.legacy.no_vga)) {
		/* PVH detected. */
		xen_pvh = true;

		/* Make sure we don't fall back to (default) ACPI_IRQ_MODEL_PIC. */
		if (!nr_ioapics && acpi_irq_model == ACPI_IRQ_MODEL_PIC)
			acpi_irq_model = ACPI_IRQ_MODEL_PLATFORM;

		machine_ops.emergency_restart = xen_emergency_restart;
		pv_info.name = "Xen PVH";
	}
#endif
}

262
/*
 * Hypervisor descriptor for Xen HVM guests: ties the detection routine
 * and the init/runtime callbacks of this file to the "Xen HVM" entry.
 */
struct hypervisor_x86 x86_hyper_xen_hvm __initdata = {
	.name	= "Xen HVM",
	.detect	= xen_platform_hvm,
	.type	= X86_HYPER_XEN_HVM,
	.init	= {
		.init_platform		= xen_hvm_guest_init,
		.x2apic_available	= xen_x2apic_para_available,
		.init_mem_mapping	= xen_hvm_init_mem_mapping,
		.guest_late_init	= xen_hvm_guest_late_init,
	},
	.runtime = {
		.pin_vcpu		= xen_pin_vcpu,
	},
};