lg.h 7.5 KB
Newer Older
R
Rusty Russell 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
#ifndef _LGUEST_H
#define _LGUEST_H

#ifndef __ASSEMBLY__
#include <linux/types.h>
#include <linux/init.h>
#include <linux/stringify.h>
#include <linux/lguest.h>
#include <linux/lguest_launcher.h>
#include <linux/wait.h>
#include <linux/err.h>
#include <asm/semaphore.h>

14
#include <asm/lguest.h>
R
Rusty Russell 已提交
15 16 17 18 19 20

void free_pagetables(void);
int init_pagetables(struct page **switcher_page, unsigned int pages);

struct pgdir
{
21
	unsigned long gpgdir;
22
	pgd_t *pgdir;
R
Rusty Russell 已提交
23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40
};

/*
 * The pair of pages we share with guests; there is one pair per cpu.
 * The whole structure is aligned to PAGE_SIZE.
 */
struct lguest_pages {
	/*
	 * First page: the stack page, mapped rw in guest.  The padding is
	 * sized so that the register block ends exactly at the page end.
	 */
	char spare[PAGE_SIZE - sizeof(struct lguest_regs)];
	struct lguest_regs regs;

	/* Second page: host state & guest descriptor page, ro in guest. */
	struct lguest_ro_state state;
} __attribute__((aligned(PAGE_SIZE)));

/*
 * Flag bits for the "changed" bitmap in struct lguest.  CHANGED_ALL does not
 * include CHANGED_GDT_TLS because the TLS entries are already covered by
 * CHANGED_GDT.
 */
#define CHANGED_IDT		(1 << 0)
#define CHANGED_GDT		(1 << 1)
#define CHANGED_GDT_TLS		(1 << 2) /* Actually a subset of CHANGED_GDT */
#define CHANGED_ALL		(CHANGED_IDT | CHANGED_GDT)

41 42 43 44 45
struct lguest;

struct lg_cpu {
	unsigned int id;
	struct lguest *lg;
46 47
	struct task_struct *tsk;
	struct mm_struct *mm; 	/* == tsk->mm, but that becomes NULL on exit */
48

49 50 51 52
	/* At end of a page shared mapped over lguest_pages in guest.  */
	unsigned long regs_page;
	struct lguest_regs *regs;

53 54 55
	/* If a hypercall was asked for, this points to the arguments. */
	struct hcall_args *hcall;
	u32 next_hcall;
56 57 58

	/* Virtual clock device */
	struct hrtimer hrt;
59

60 61 62 63 64
	/* Do we need to stop what we're doing and return to userspace? */
	int break_out;
	wait_queue_head_t break_wq;
	int halted;

65 66
	/* Pending virtual interrupts */
	DECLARE_BITMAP(irqs_pending, LGUEST_IRQS);
67 68

	struct lg_cpu_arch arch;
69 70
};

R
Rusty Russell 已提交
71 72 73 74
/* The private info the thread maintains about the guest. */
struct lguest {
	struct lguest_data __user *lguest_data;
	/* Per-cpu state; NOTE(review): presumably nr_cpus entries are in use. */
	struct lg_cpu cpus[NR_CPUS];
	unsigned int nr_cpus;

	u32 pfn_limit;
	/* This provides the offset to the base of guest-physical
	 * memory in the Launcher. */
	void __user *mem_base;
	unsigned long kernel_address;
	u32 cr2;
	int ts;
	u32 esp1;
	u8 ss1;

	/* Bitmap of what has changed: see CHANGED_* above. */
	int changed;
	struct lguest_pages *last_pages;

	/* We keep a small number of these. */
	u32 pgdidx;
	struct pgdir pgdirs[4];

	unsigned long noirq_start, noirq_end;
	unsigned long pending_notify; /* pfn from LHCALL_NOTIFY */

	unsigned int stack_pages;
	u32 tsc_khz;

	/* Dead?  Set once by kill_guest(): either the formatted reason or an
	 * ERR_PTR(-ENOMEM) if the reason could not be allocated. */
	const char *dead;
};

extern struct mutex lguest_lock;

/* core.c: */
int lguest_address_ok(const struct lguest *lg,
		      unsigned long addr, unsigned long len);
/*
 * Raw copy routines behind the lgread()/lgwrite() macros: "b" is the host
 * buffer, "addr" the guest address and "bytes" the number of bytes to copy.
 */
void __lgread(struct lguest *lg, void *b, unsigned long addr, unsigned bytes);
void __lgwrite(struct lguest *lg, unsigned long addr, const void *b,
	       unsigned bytes);

R
Rusty Russell 已提交
114
/*H:035 Using memory-copy operations like that is usually inconvenient, so we
 * have the following helper macros which read and write a specific type (often
 * an unsigned long).
 *
 * This reads into a variable of the given type then returns that. */
/*
 * lgread(lg, addr, type): copy sizeof(type) bytes from "addr" via __lgread()
 * into a temporary of that type and yield the temporary as the value of the
 * expression.
 *
 * The temporary has a macro-specific name so that an argument which happens
 * to mention a caller variable called "_v" is not silently captured by it.
 */
#define lgread(lg, addr, type)						\
	({								\
		type _lgread_val;					\
		__lgread((lg), &_lgread_val, (addr),			\
			 sizeof(_lgread_val));				\
		_lgread_val;						\
	})

/*
 * lgwrite(lg, addr, type, val): verify with typecheck() that "val" really has
 * type "type", then hand its address and size to __lgwrite().  Because the
 * address of "val" is taken, "val" has to be an lvalue.
 */
#define lgwrite(lg, addr, type, val)					\
do {									\
	typecheck(type, val);						\
	__lgwrite((lg), (addr), &(val), sizeof(val));			\
} while (0)
/* (end of memory access helper routines) :*/

130
int run_guest(struct lg_cpu *cpu, unsigned long __user *user);
R
Rusty Russell 已提交
131

132 133 134 135 136 137
/* Helper macros to obtain the first 12 or the last 20 bits, this is only the
 * first step in the migration to the kernel types.  pte_pfn is already defined
 * in the kernel.
 *
 * pgd_flags()/pte_flags() keep only the bits of the entry value that lie
 * outside PAGE_MASK; pgd_pfn() shifts the entry value right by PAGE_SHIFT. */
#define pgd_flags(x)	(pgd_val(x) & ~PAGE_MASK)
#define pte_flags(x)	(pte_val(x) & ~PAGE_MASK)
#define pgd_pfn(x)	(pgd_val(x) >> PAGE_SHIFT)
R
Rusty Russell 已提交
138 139

/* interrupts_and_traps.c: */
140 141
void maybe_do_interrupt(struct lg_cpu *cpu);
int deliver_trap(struct lg_cpu *cpu, unsigned int num);
142 143
void load_guest_idt_entry(struct lg_cpu *cpu, unsigned int i,
			  u32 low, u32 hi);
R
Rusty Russell 已提交
144 145 146 147
void guest_set_stack(struct lguest *lg, u32 seg, u32 esp, unsigned int pages);
void pin_stack_pages(struct lguest *lg);
void setup_default_idt_entries(struct lguest_ro_state *state,
			       const unsigned long *def);
148
void copy_traps(const struct lg_cpu *cpu, struct desc_struct *idt,
R
Rusty Russell 已提交
149
		const unsigned long *def);
150 151
void guest_set_clockevent(struct lg_cpu *cpu, unsigned long delta);
void init_clockdev(struct lg_cpu *cpu);
152 153 154
bool check_syscall_vector(struct lguest *lg);
int init_interrupts(void);
void free_interrupts(void);
R
Rusty Russell 已提交
155 156 157

/* segments.c: */
void setup_default_gdt_entries(struct lguest_ro_state *state);
void setup_guest_gdt(struct lg_cpu *cpu);
void load_guest_gdt(struct lg_cpu *cpu, unsigned long table, u32 num);
void guest_load_tls(struct lg_cpu *cpu, unsigned long tls_array);
void copy_gdt(const struct lg_cpu *cpu, struct desc_struct *gdt);
void copy_gdt_tls(const struct lg_cpu *cpu, struct desc_struct *gdt);
R
Rusty Russell 已提交
163 164 165 166 167

/* page_tables.c: */
int init_guest_pagetable(struct lguest *lg, unsigned long pgtable);
void free_guest_pagetable(struct lguest *lg);
void guest_new_pagetable(struct lguest *lg, unsigned long pgtable);
168
void guest_set_pmd(struct lguest *lg, unsigned long gpgdir, u32 i);
R
Rusty Russell 已提交
169 170
void guest_pagetable_clear_all(struct lguest *lg);
void guest_pagetable_flush_user(struct lguest *lg);
171
void guest_set_pte(struct lguest *lg, unsigned long gpgdir,
172
		   unsigned long vaddr, pte_t val);
173
void map_switcher_in_guest(struct lg_cpu *cpu, struct lguest_pages *pages);
R
Rusty Russell 已提交
174 175
int demand_page(struct lguest *info, unsigned long cr2, int errcode);
void pin_page(struct lguest *lg, unsigned long vaddr);
176 177
unsigned long guest_pa(struct lguest *lg, unsigned long vaddr);
void page_table_guest_data_init(struct lguest *lg);
R
Rusty Russell 已提交
178

179 180 181
/* <arch>/core.c: */
void lguest_arch_host_init(void);
void lguest_arch_host_fini(void);
void lguest_arch_run_guest(struct lg_cpu *cpu);
void lguest_arch_handle_trap(struct lg_cpu *cpu);
int lguest_arch_init_hypercalls(struct lg_cpu *cpu);
int lguest_arch_do_hcall(struct lg_cpu *cpu, struct hcall_args *args);
void lguest_arch_setup_regs(struct lg_cpu *cpu, unsigned long start);
187 188 189 190

/* <arch>/switcher.S: */
extern char start_switcher_text[], end_switcher_text[], switch_to_guest[];

/* lguest_user.c: */
int lguest_device_init(void);
void lguest_device_remove(void);

/* hypercalls.c: */
void do_hypercalls(struct lg_cpu *cpu);
void write_timestamp(struct lguest *lg);
R
Rusty Russell 已提交
198

199 200 201 202
/*L:035
 * Let's step aside for the moment, to study one important routine that's used
 * widely in the Host code.
 *
 * There are many cases where the Guest can do something invalid, like pass crap
 * to a hypercall.  Since only the Guest kernel can make hypercalls, it's quite
 * acceptable to simply terminate the Guest and give the Launcher a nicely
 * formatted reason.  It's also simpler for the Guest itself, which doesn't
 * need to check most hypercalls for "success"; if you're still running, it
 * succeeded.
 *
 * Once this is called, the Guest will never run again, so most Host code can
 * call this then continue as if nothing had happened.  This means many
 * functions don't have to explicitly return an error code, which keeps the
 * code simple.
 *
 * It also means that this can be called more than once: only the first one is
 * remembered.  The only trick is that we still need to kill the Guest even if
 * we can't allocate memory to store the reason.  Linux has a neat way of
 * packing error codes into invalid pointers, so we use that here.
 *
 * Like any macro which uses an "if", it is safely wrapped in a run-once "do {
 * } while(0)".
 */
R
Rusty Russell 已提交
223 224 225 226 227 228 229 230
/*
 * kill_guest(lg, fmt...): record why the guest died, first caller wins.
 *
 * If a reason is already stored, nothing happens.  Otherwise the
 * printf-style arguments are formatted with kasprintf(GFP_ATOMIC, ...); if
 * that yields no string, ERR_PTR(-ENOMEM) is stored instead so that ->dead
 * is non-NULL either way.
 */
#define kill_guest(lg, fmt...)						\
do {									\
	if ((lg)->dead)							\
		break;							\
	(lg)->dead = kasprintf(GFP_ATOMIC, fmt);			\
	if (!(lg)->dead)						\
		(lg)->dead = ERR_PTR(-ENOMEM);				\
} while (0)
231
/* (End of aside) :*/
R
Rusty Russell 已提交
232 233 234

#endif	/* __ASSEMBLY__ */
#endif	/* _LGUEST_H */