// SPDX-License-Identifier: GPL-2.0
/*
 * handling diagnose instructions
 *
 * Copyright IBM Corp. 2008, 2020
 *
 *    Author(s): Carsten Otte <cotte@de.ibm.com>
 *               Christian Borntraeger <borntraeger@de.ibm.com>
 */

#include <linux/kvm.h>
#include <linux/kvm_host.h>
#include <asm/gmap.h>
#include <asm/virtio-ccw.h>
#include "kvm-s390.h"
#include "trace.h"
#include "trace-s390.h"
#include "gaccess.h"

20 21 22
static int diag_release_pages(struct kvm_vcpu *vcpu)
{
	unsigned long start, end;
23
	unsigned long prefix  = kvm_s390_get_prefix(vcpu);
24

25
	start = vcpu->run->s.regs.gprs[(vcpu->arch.sie_block->ipa & 0xf0) >> 4];
26
	end = vcpu->run->s.regs.gprs[vcpu->arch.sie_block->ipa & 0xf] + PAGE_SIZE;
27
	vcpu->stat.diagnose_10++;
28

29
	if (start & ~PAGE_MASK || end & ~PAGE_MASK || start >= end
30 31 32 33 34
	    || start < 2 * PAGE_SIZE)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	VCPU_EVENT(vcpu, 5, "diag release pages %lX %lX", start, end);

35 36 37 38 39
	/*
	 * We checked for start >= end above, so lets check for the
	 * fast path (no prefix swap page involved)
	 */
	if (end <= prefix || start >= prefix + 2 * PAGE_SIZE) {
40
		gmap_discard(vcpu->arch.gmap, start, end);
41
	} else {
42 43 44 45 46 47 48 49
		/*
		 * This is slow path.  gmap_discard will check for start
		 * so lets split this into before prefix, prefix, after
		 * prefix and let gmap_discard make some of these calls
		 * NOPs.
		 */
		gmap_discard(vcpu->arch.gmap, start, prefix);
		if (start <= prefix)
50 51 52
			gmap_discard(vcpu->arch.gmap, 0, PAGE_SIZE);
		if (end > prefix + PAGE_SIZE)
			gmap_discard(vcpu->arch.gmap, PAGE_SIZE, 2 * PAGE_SIZE);
53
		gmap_discard(vcpu->arch.gmap, prefix + 2 * PAGE_SIZE, end);
54 55 56 57
	}
	return 0;
}

58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74
static int __diag_page_ref_service(struct kvm_vcpu *vcpu)
{
	struct prs_parm {
		u16 code;
		u16 subcode;
		u16 parm_len;
		u16 parm_version;
		u64 token_addr;
		u64 select_mask;
		u64 compare_mask;
		u64 zarch;
	};
	struct prs_parm parm;
	int rc;
	u16 rx = (vcpu->arch.sie_block->ipa & 0xf0) >> 4;
	u16 ry = (vcpu->arch.sie_block->ipa & 0x0f);

75 76
	VCPU_EVENT(vcpu, 3, "diag page reference parameter block at 0x%llx",
		   vcpu->run->s.regs.gprs[rx]);
77
	vcpu->stat.diagnose_258++;
78 79
	if (vcpu->run->s.regs.gprs[rx] & 7)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);
80
	rc = read_guest(vcpu, vcpu->run->s.regs.gprs[rx], rx, &parm, sizeof(parm));
H
Heiko Carstens 已提交
81 82
	if (rc)
		return kvm_s390_inject_prog_cond(vcpu, rc);
83 84 85 86 87
	if (parm.parm_version != 2 || parm.parm_len < 5 || parm.code != 0x258)
		return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

	switch (parm.subcode) {
	case 0: /* TOKEN */
88 89 90
		VCPU_EVENT(vcpu, 3, "pageref token addr 0x%llx "
			   "select mask 0x%llx compare mask 0x%llx",
			   parm.token_addr, parm.select_mask, parm.compare_mask);
91 92 93 94 95 96 97 98 99 100 101 102 103 104
		if (vcpu->arch.pfault_token != KVM_S390_PFAULT_TOKEN_INVALID) {
			/*
			 * If the pagefault handshake is already activated,
			 * the token must not be changed.  We have to return
			 * decimal 8 instead, as mandated in SC24-6084.
			 */
			vcpu->run->s.regs.gprs[ry] = 8;
			return 0;
		}

		if ((parm.compare_mask & parm.select_mask) != parm.compare_mask ||
		    parm.token_addr & 7 || parm.zarch != 0x8000000000000000ULL)
			return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

H
Heiko Carstens 已提交
105
		if (kvm_is_error_gpa(vcpu->kvm, parm.token_addr))
106 107 108 109 110 111 112 113 114 115 116 117 118 119
			return kvm_s390_inject_program_int(vcpu, PGM_ADDRESSING);

		vcpu->arch.pfault_token = parm.token_addr;
		vcpu->arch.pfault_select = parm.select_mask;
		vcpu->arch.pfault_compare = parm.compare_mask;
		vcpu->run->s.regs.gprs[ry] = 0;
		rc = 0;
		break;
	case 1: /*
		 * CANCEL
		 * Specification allows to let already pending tokens survive
		 * the cancel, therefore to reduce code complexity, we assume
		 * all outstanding tokens are already pending.
		 */
120
		VCPU_EVENT(vcpu, 3, "pageref cancel addr 0x%llx", parm.token_addr);
121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144
		if (parm.token_addr || parm.select_mask ||
		    parm.compare_mask || parm.zarch)
			return kvm_s390_inject_program_int(vcpu, PGM_SPECIFICATION);

		vcpu->run->s.regs.gprs[ry] = 0;
		/*
		 * If the pfault handling was not established or is already
		 * canceled SC24-6084 requests to return decimal 4.
		 */
		if (vcpu->arch.pfault_token == KVM_S390_PFAULT_TOKEN_INVALID)
			vcpu->run->s.regs.gprs[ry] = 4;
		else
			vcpu->arch.pfault_token = KVM_S390_PFAULT_TOKEN_INVALID;

		rc = 0;
		break;
	default:
		rc = -EOPNOTSUPP;
		break;
	}

	return rc;
}

145 146 147 148
static int __diag_time_slice_end(struct kvm_vcpu *vcpu)
{
	VCPU_EVENT(vcpu, 5, "%s", "diag time slice end");
	vcpu->stat.diagnose_44++;
149
	kvm_vcpu_on_spin(vcpu, true);
150 151 152
	return 0;
}

/*
 * Budget for forwarded diag 0x9c yields.  forward_cnt is the number of
 * forwards still allowed in the slice that started at jiffy cur_slice.
 * NOTE(review): both are file-scope statics updated without any locking
 * visible here - presumably an approximate limit is acceptable; confirm.
 */
static int forward_cnt;
static unsigned long cur_slice;

/*
 * Consume one unit of the forwarding budget.
 *
 * When jiffies has advanced past cur_slice the budget is refilled with
 * diag9c_forwarding_hz / HZ before it is consumed.
 *
 * Returns 1 if the budget was already used up (forward_cnt <= 0 before the
 * decrement), 0 otherwise.
 */
static int diag9c_forwarding_overrun(void)
{
	/* Reset the count on a new slice */
	if (time_after(jiffies, cur_slice)) {
		cur_slice = jiffies;
		forward_cnt = diag9c_forwarding_hz / HZ;
	}
	return forward_cnt-- <= 0 ? 1 : 0;
}

166 167 168 169 170 171 172 173
static int __diag_time_slice_end_directed(struct kvm_vcpu *vcpu)
{
	struct kvm_vcpu *tcpu;
	int tid;

	tid = vcpu->run->s.regs.gprs[(vcpu->arch.sie_block->ipa & 0xf0) >> 4];
	vcpu->stat.diagnose_9c++;

174
	/* yield to self */
175
	if (tid == vcpu->vcpu_id)
176
		goto no_yield;
177

178
	/* yield to invalid */
179
	tcpu = kvm_get_vcpu_by_id(vcpu->kvm, tid);
180 181 182
	if (!tcpu)
		goto no_yield;

183 184 185 186 187 188 189 190 191 192 193 194 195 196 197
	/* target guest VCPU already running */
	if (READ_ONCE(tcpu->cpu) >= 0) {
		if (!diag9c_forwarding_hz || diag9c_forwarding_overrun())
			goto no_yield;

		/* target host CPU already running */
		if (!vcpu_is_preempted(tcpu->cpu))
			goto no_yield;
		smp_yield_cpu(tcpu->cpu);
		VCPU_EVENT(vcpu, 5,
			   "diag time slice end directed to %d: yield forwarded",
			   tid);
		vcpu->stat.diagnose_9c_forward++;
		return 0;
	}
198

199 200 201 202 203 204 205 206
	if (kvm_vcpu_yield_to(tcpu) <= 0)
		goto no_yield;

	VCPU_EVENT(vcpu, 5, "diag time slice end directed to %d: done", tid);
	return 0;
no_yield:
	VCPU_EVENT(vcpu, 5, "diag time slice end directed to %d: ignored", tid);
	vcpu->stat.diagnose_9c_ignored++;
207 208 209
	return 0;
}

210 211 212
static int __diag_ipl_functions(struct kvm_vcpu *vcpu)
{
	unsigned int reg = vcpu->arch.sie_block->ipa & 0xf;
213
	unsigned long subcode = vcpu->run->s.regs.gprs[reg] & 0xffff;
214

215
	VCPU_EVENT(vcpu, 3, "diag ipl functions, subcode %lx", subcode);
216
	vcpu->stat.diagnose_308++;
217 218 219 220 221 222 223 224
	switch (subcode) {
	case 3:
		vcpu->run->s390_reset_flags = KVM_S390_RESET_CLEAR;
		break;
	case 4:
		vcpu->run->s390_reset_flags = 0;
		break;
	default:
225
		return -EOPNOTSUPP;
226 227
	}

228 229 230 231
	/*
	 * no need to check the return value of vcpu_stop as it can only have
	 * an error for protvirt, but protvirt means user cpu state
	 */
232 233
	if (!kvm_s390_user_cpu_state_ctrl(vcpu->kvm))
		kvm_s390_vcpu_stop(vcpu);
234 235 236 237
	vcpu->run->s390_reset_flags |= KVM_S390_RESET_SUBSYSTEM;
	vcpu->run->s390_reset_flags |= KVM_S390_RESET_IPL;
	vcpu->run->s390_reset_flags |= KVM_S390_RESET_CPU_INIT;
	vcpu->run->exit_reason = KVM_EXIT_S390_RESET;
238
	VCPU_EVENT(vcpu, 3, "requesting userspace resets %llx",
239
	  vcpu->run->s390_reset_flags);
240
	trace_kvm_s390_request_resets(vcpu->run->s390_reset_flags);
241 242 243
	return -EREMOTE;
}

C
Cornelia Huck 已提交
244 245
static int __diag_virtio_hypercall(struct kvm_vcpu *vcpu)
{
246
	int ret;
C
Cornelia Huck 已提交
247

248
	vcpu->stat.diagnose_500++;
C
Cornelia Huck 已提交
249 250 251 252 253
	/* No virtio-ccw notification? Get out quickly. */
	if (!vcpu->kvm->arch.css_support ||
	    (vcpu->run->s.regs.gprs[1] != KVM_S390_VIRTIO_CCW_NOTIFY))
		return -EOPNOTSUPP;

254 255 256 257 258
	VCPU_EVENT(vcpu, 4, "diag 0x500 schid 0x%8.8x queue 0x%x cookie 0x%llx",
			    (u32) vcpu->run->s.regs.gprs[2],
			    (u32) vcpu->run->s.regs.gprs[3],
			    vcpu->run->s.regs.gprs[4]);

C
Cornelia Huck 已提交
259 260 261 262
	/*
	 * The layout is as follows:
	 * - gpr 2 contains the subchannel id (passed as addr)
	 * - gpr 3 contains the virtqueue index (passed as datamatch)
263
	 * - gpr 4 contains the index on the bus (optionally)
C
Cornelia Huck 已提交
264
	 */
265
	ret = kvm_io_bus_write_cookie(vcpu, KVM_VIRTIO_CCW_NOTIFY_BUS,
266
				      vcpu->run->s.regs.gprs[2] & 0xffffffff,
267 268 269 270 271 272 273 274 275 276
				      8, &vcpu->run->s.regs.gprs[3],
				      vcpu->run->s.regs.gprs[4]);

	/*
	 * Return cookie in gpr 2, but don't overwrite the register if the
	 * diagnose will be handled by userspace.
	 */
	if (ret != -EOPNOTSUPP)
		vcpu->run->s.regs.gprs[2] = ret;
	/* kvm_io_bus_write_cookie returns -EOPNOTSUPP if it found no match. */
C
Cornelia Huck 已提交
277 278 279
	return ret < 0 ? ret : 0;
}

280 281
int kvm_s390_handle_diag(struct kvm_vcpu *vcpu)
{
282
	int code = kvm_s390_get_base_disp_rs(vcpu, NULL) & 0xffff;
283

284 285 286
	if (vcpu->arch.sie_block->gpsw.mask & PSW_MASK_PSTATE)
		return kvm_s390_inject_program_int(vcpu, PGM_PRIVILEGED_OP);

287
	trace_kvm_s390_handle_diag(vcpu, code);
288
	switch (code) {
289 290
	case 0x10:
		return diag_release_pages(vcpu);
291 292
	case 0x44:
		return __diag_time_slice_end(vcpu);
293 294
	case 0x9c:
		return __diag_time_slice_end_directed(vcpu);
295 296
	case 0x258:
		return __diag_page_ref_service(vcpu);
297 298
	case 0x308:
		return __diag_ipl_functions(vcpu);
C
Cornelia Huck 已提交
299 300
	case 0x500:
		return __diag_virtio_hypercall(vcpu);
301
	default:
302
		vcpu->stat.diagnose_other++;
303
		return -EOPNOTSUPP;
304 305
	}
}