kvm.c 26.0 KB
Newer Older
A
Alexander Graf 已提交
1 2 3 4
/*
 * QEMU S390x KVM implementation
 *
 * Copyright (c) 2009 Alexander Graf <agraf@suse.de>
 * Copyright IBM Corp. 2012
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * Contributions after 2012-10-29 are licensed under the terms of the
 * GNU GPL, version 2 or (at your option) any later version.
 *
 * You should have received a copy of the GNU (Lesser) General Public
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 */

#include <sys/types.h>
#include <sys/ioctl.h>
#include <sys/mman.h>

#include <linux/kvm.h>
#include <asm/ptrace.h>

#include "qemu-common.h"
32
#include "qemu/timer.h"
33 34
#include "sysemu/sysemu.h"
#include "sysemu/kvm.h"
A
Alexander Graf 已提交
35
#include "cpu.h"
36
#include "sysemu/device_tree.h"
37 38
#include "qapi/qmp/qjson.h"
#include "monitor/monitor.h"
39
#include "trace.h"
A
Alexander Graf 已提交
40 41 42 43

/* #define DEBUG_KVM */

#ifdef DEBUG_KVM
44
#define DPRINTF(fmt, ...) \
A
Alexander Graf 已提交
45 46
    do { fprintf(stderr, fmt, ## __VA_ARGS__); } while (0)
#else
47
#define DPRINTF(fmt, ...) \
A
Alexander Graf 已提交
48 49 50 51 52
    do { } while (0)
#endif

#define IPA0_DIAG                       0x8300
#define IPA0_SIGP                       0xae00
53 54 55
#define IPA0_B2                         0xb200
#define IPA0_B9                         0xb900
#define IPA0_EB                         0xeb00
A
Alexander Graf 已提交
56

57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78
#define PRIV_B2_SCLP_CALL               0x20
#define PRIV_B2_CSCH                    0x30
#define PRIV_B2_HSCH                    0x31
#define PRIV_B2_MSCH                    0x32
#define PRIV_B2_SSCH                    0x33
#define PRIV_B2_STSCH                   0x34
#define PRIV_B2_TSCH                    0x35
#define PRIV_B2_TPI                     0x36
#define PRIV_B2_SAL                     0x37
#define PRIV_B2_RSCH                    0x38
#define PRIV_B2_STCRW                   0x39
#define PRIV_B2_STCPS                   0x3a
#define PRIV_B2_RCHP                    0x3b
#define PRIV_B2_SCHM                    0x3c
#define PRIV_B2_CHSC                    0x5f
#define PRIV_B2_SIGA                    0x74
#define PRIV_B2_XSCH                    0x76

#define PRIV_EB_SQBS                    0x8a

#define PRIV_B9_EQBS                    0x9c

79
#define DIAG_IPL                        0x308
A
Alexander Graf 已提交
80 81 82 83 84 85 86 87 88
#define DIAG_KVM_HYPERCALL              0x500
#define DIAG_KVM_BREAKPOINT             0x501

#define ICPT_INSTRUCTION                0x04
#define ICPT_WAITPSW                    0x1c
#define ICPT_SOFT_INTERCEPT             0x24
#define ICPT_CPU_STOP                   0x28
#define ICPT_IO                         0x40

89 90 91 92
/*
 * Table of required KVM capabilities.  It holds only the
 * KVM_CAP_LAST_INFO entry, i.e. no capability is listed for s390x here.
 */
const KVMCapabilityInfo kvm_arch_required_capabilities[] = {
    KVM_CAP_LAST_INFO
};

93
static int cap_sync_regs;
94
static int cap_async_pf;
95

96
static void *legacy_s390_alloc(size_t size);
97

98
/*
 * Architecture specific KVM initialisation.
 *
 * Caches the SYNC_REGS and ASYNC_PF capability probes in the file-level
 * flags and, unless both the GMAP and COW capabilities are present,
 * installs legacy_s390_alloc() as the guest memory allocator.
 *
 * Always returns 0.
 */
int kvm_arch_init(KVMState *s)
{
    cap_sync_regs = kvm_check_extension(s, KVM_CAP_SYNC_REGS);
    cap_async_pf = kvm_check_extension(s, KVM_CAP_ASYNC_PF);

    if (kvm_check_extension(s, KVM_CAP_S390_GMAP)
        && kvm_check_extension(s, KVM_CAP_S390_COW)) {
        /* Both capabilities present: keep the default allocator. */
        return 0;
    }

    phys_mem_set_alloc(legacy_s390_alloc);
    return 0;
}

109 110 111 112 113
/* Return the vcpu id for @cpu, which is simply its cpu_index. */
unsigned long kvm_arch_vcpu_id(CPUState *cpu)
{
    unsigned long id = cpu->cpu_index;

    return id;
}

A
Andreas Färber 已提交
114
/* Per-vcpu initialisation hook; there is nothing to do yet. Returns 0. */
int kvm_arch_init_vcpu(CPUState *cpu)
{
    return 0;
}

120
/*
 * Reset the in-kernel state of a vcpu.
 *
 * The initial reset call is needed here to reset in-kernel vcpu data
 * that we can't access directly from QEMU (i.e. with older kernels
 * which don't support sync_regs/ONE_REG).  Before this ioctl
 * cpu_synchronize_state() is called in common kvm code (kvm-all).
 *
 * A failing ioctl is reported on stderr; it is not treated as fatal.
 */
void kvm_s390_reset_vcpu(S390CPU *cpu)
{
    CPUState *cs = CPU(cpu);

    if (kvm_vcpu_ioctl(cs, KVM_S390_INITIAL_RESET, NULL)) {
        /*
         * perror() appends ": <reason>" and a newline on its own, so the
         * prefix must not end in '\n' or the message gets split in two.
         */
        perror("Can't reset vcpu");
    }
}

A
Andreas Färber 已提交
134
/*
 * Copy QEMU's view of the CPU state (env) into KVM.
 *
 * The PSW and the general purpose registers are always written.  When
 * @level is KVM_PUT_RUNTIME_STATE nothing else is transferred; otherwise
 * the timer related ONE_REGs, the pfault registers (if cap_async_pf),
 * the access/control registers and the prefix follow.
 *
 * Registers go through the shared kvm_run area when sync regs are
 * available and the kernel flags them as valid, and through the
 * KVM_SET_REGS / KVM_SET_SREGS ioctls otherwise.
 *
 * Returns 0 on success or the negative value returned by a failing call.
 */
int kvm_arch_put_registers(CPUState *cs, int level)
{
    S390CPU *cpu = S390_CPU(cs);
    CPUS390XState *env = &cpu->env;
    struct kvm_run *run = cs->kvm_run;
    int ret;
    int n;

    /* The PSW always lives in kvm_run. */
    run->psw_addr = env->psw.addr;
    run->psw_mask = env->psw.mask;

    /* General purpose registers */
    if (cap_sync_regs && (run->kvm_valid_regs & KVM_SYNC_GPRS)) {
        for (n = 0; n < 16; n++) {
            run->s.regs.gprs[n] = env->regs[n];
        }
        run->kvm_dirty_regs |= KVM_SYNC_GPRS;
    } else {
        struct kvm_regs regs;

        for (n = 0; n < 16; n++) {
            regs.gprs[n] = env->regs[n];
        }
        ret = kvm_vcpu_ioctl(cs, KVM_SET_REGS, &regs);
        if (ret < 0) {
            return ret;
        }
    }

    /* Runtime state needs nothing beyond PSW and GPRs. */
    if (level == KVM_PUT_RUNTIME_STATE) {
        return 0;
    }

    /*
     * These ONE_REGs are not protected by a capability.  They are only
     * necessary for migration, so a failure here is deliberately not
     * turned into an error return.
     */
    kvm_set_one_reg(cs, KVM_REG_S390_CPU_TIMER, &env->cputm);
    kvm_set_one_reg(cs, KVM_REG_S390_CLOCK_COMP, &env->ckc);
    kvm_set_one_reg(cs, KVM_REG_S390_TODPR, &env->todpr);
    kvm_set_one_reg(cs, KVM_REG_S390_GBEA, &env->gbea);
    kvm_set_one_reg(cs, KVM_REG_S390_PP, &env->pp);

    /* The pfault registers stop at the first failure. */
    if (cap_async_pf) {
        ret = kvm_set_one_reg(cs, KVM_REG_S390_PFTOKEN, &env->pfault_token);
        if (ret >= 0) {
            ret = kvm_set_one_reg(cs, KVM_REG_S390_PFCOMPARE,
                                  &env->pfault_compare);
        }
        if (ret >= 0) {
            ret = kvm_set_one_reg(cs, KVM_REG_S390_PFSELECT,
                                  &env->pfault_select);
        }
        if (ret < 0) {
            return ret;
        }
    }

    /* Access and control registers */
    if (cap_sync_regs &&
        (run->kvm_valid_regs & KVM_SYNC_ACRS) &&
        (run->kvm_valid_regs & KVM_SYNC_CRS)) {
        for (n = 0; n < 16; n++) {
            run->s.regs.acrs[n] = env->aregs[n];
            run->s.regs.crs[n] = env->cregs[n];
        }
        run->kvm_dirty_regs |= KVM_SYNC_ACRS;
        run->kvm_dirty_regs |= KVM_SYNC_CRS;
    } else {
        struct kvm_sregs sregs;

        for (n = 0; n < 16; n++) {
            sregs.acrs[n] = env->aregs[n];
            sregs.crs[n] = env->cregs[n];
        }
        ret = kvm_vcpu_ioctl(cs, KVM_SET_SREGS, &sregs);
        if (ret < 0) {
            return ret;
        }
    }

    /* Finally the prefix, which is only supported via sync regs. */
    if (cap_sync_regs && (run->kvm_valid_regs & KVM_SYNC_PREFIX)) {
        run->s.regs.prefix = env->psa;
        run->kvm_dirty_regs |= KVM_SYNC_PREFIX;
    }

    return 0;
}

A
Andreas Färber 已提交
223
/*
 * Copy the CPU state held by KVM into QEMU's env.
 *
 * Reads the PSW, the general purpose registers, the access/control
 * registers, the prefix (sync regs only), the timer related ONE_REGs
 * and, if cap_async_pf is set, the pfault registers.
 *
 * Registers come from the shared kvm_run area when sync regs are
 * available and flagged valid, and from the KVM_GET_REGS /
 * KVM_GET_SREGS ioctls otherwise.
 *
 * Returns 0 on success or the negative value returned by a failing call.
 */
int kvm_arch_get_registers(CPUState *cs)
{
    S390CPU *cpu = S390_CPU(cs);
    CPUS390XState *env = &cpu->env;
    struct kvm_run *run = cs->kvm_run;
    int ret;
    int n;

    /* The PSW always lives in kvm_run. */
    env->psw.addr = run->psw_addr;
    env->psw.mask = run->psw_mask;

    /* General purpose registers */
    if (cap_sync_regs && (run->kvm_valid_regs & KVM_SYNC_GPRS)) {
        for (n = 0; n < 16; n++) {
            env->regs[n] = run->s.regs.gprs[n];
        }
    } else {
        struct kvm_regs regs;

        ret = kvm_vcpu_ioctl(cs, KVM_GET_REGS, &regs);
        if (ret < 0) {
            return ret;
        }
        for (n = 0; n < 16; n++) {
            env->regs[n] = regs.gprs[n];
        }
    }

    /* Access and control registers */
    if (cap_sync_regs &&
        (run->kvm_valid_regs & KVM_SYNC_ACRS) &&
        (run->kvm_valid_regs & KVM_SYNC_CRS)) {
        for (n = 0; n < 16; n++) {
            env->aregs[n] = run->s.regs.acrs[n];
            env->cregs[n] = run->s.regs.crs[n];
        }
    } else {
        struct kvm_sregs sregs;

        ret = kvm_vcpu_ioctl(cs, KVM_GET_SREGS, &sregs);
        if (ret < 0) {
            return ret;
        }
        for (n = 0; n < 16; n++) {
            env->aregs[n] = sregs.acrs[n];
            env->cregs[n] = sregs.crs[n];
        }
    }

    /* The prefix is only available through sync regs. */
    if (cap_sync_regs && (run->kvm_valid_regs & KVM_SYNC_PREFIX)) {
        env->psa = run->s.regs.prefix;
    }

    /*
     * These ONE_REGs are not protected by a capability.  They are only
     * necessary for migration, so a failure here is deliberately not
     * turned into an error return.
     */
    kvm_get_one_reg(cs, KVM_REG_S390_CPU_TIMER, &env->cputm);
    kvm_get_one_reg(cs, KVM_REG_S390_CLOCK_COMP, &env->ckc);
    kvm_get_one_reg(cs, KVM_REG_S390_TODPR, &env->todpr);
    kvm_get_one_reg(cs, KVM_REG_S390_GBEA, &env->gbea);
    kvm_get_one_reg(cs, KVM_REG_S390_PP, &env->pp);

    /* The pfault registers stop at the first failure. */
    if (cap_async_pf) {
        ret = kvm_get_one_reg(cs, KVM_REG_S390_PFTOKEN, &env->pfault_token);
        if (ret >= 0) {
            ret = kvm_get_one_reg(cs, KVM_REG_S390_PFCOMPARE,
                                  &env->pfault_compare);
        }
        if (ret >= 0) {
            ret = kvm_get_one_reg(cs, KVM_REG_S390_PFSELECT,
                                  &env->pfault_select);
        }
        if (ret < 0) {
            return ret;
        }
    }

    return 0;
}

303 304 305 306 307 308 309 310 311 312
/*
 * Legacy layout for s390:
 * Older S390 KVM requires the topmost vma of the RAM to be
 * smaller than an system defined value, which is at least 256GB.
 * Larger systems have larger values. We put the guest between
 * the end of data segment (system break) and this value. We
 * use 32GB as a base to have enough room for the system break
 * to grow. We also have to use MAP parameters that avoid
 * read-only mapping of guest pages.
 */
313
static void *legacy_s390_alloc(size_t size)
314 315 316 317 318 319
{
    void *mem;

    mem = mmap((void *) 0x800000000ULL, size,
               PROT_EXEC|PROT_READ|PROT_WRITE,
               MAP_SHARED | MAP_ANONYMOUS | MAP_FIXED, -1, 0);
320
    return mem == MAP_FAILED ? NULL : mem;
321 322
}

323 324 325
/* DIAG 501 is used for sw breakpoints */
static const uint8_t diag_501[] = {0x83, 0x24, 0x05, 0x01};

A
Andreas Färber 已提交
326
/*
 * Install a software breakpoint at bp->pc.
 *
 * First saves sizeof(diag_501) bytes of guest memory at bp->pc into
 * bp->saved_insn, then overwrites them with the diag_501 pattern.
 *
 * Returns 0 on success, -EINVAL if either memory access fails.
 */
int kvm_arch_insert_sw_breakpoint(CPUState *cs, struct kvm_sw_breakpoint *bp)
{
    /* Remember what is currently at the breakpoint address. */
    if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&bp->saved_insn,
                            sizeof(diag_501), 0)) {
        return -EINVAL;
    }

    /* Patch in the breakpoint instruction. */
    if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)diag_501,
                            sizeof(diag_501), 1)) {
        return -EINVAL;
    }

    return 0;
}

A
Andreas Färber 已提交
338
/*
 * Remove the software breakpoint at bp->pc.
 *
 * The bytes at bp->pc are read back and must still match diag_501;
 * only then is the content of bp->saved_insn written back.
 *
 * Returns 0 on success, -EINVAL if a memory access fails or the
 * breakpoint pattern is no longer in place.
 */
int kvm_arch_remove_sw_breakpoint(CPUState *cs, struct kvm_sw_breakpoint *bp)
{
    uint8_t current[sizeof(diag_501)];

    if (cpu_memory_rw_debug(cs, bp->pc, current, sizeof(diag_501), 0)) {
        return -EINVAL;
    }

    /* Somebody else changed the instruction: refuse to restore. */
    if (memcmp(current, diag_501, sizeof(diag_501)) != 0) {
        return -EINVAL;
    }

    if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&bp->saved_insn,
                            sizeof(diag_501), 1)) {
        return -EINVAL;
    }

    return 0;
}

354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373
/* Hardware breakpoints are not implemented; always returns -ENOSYS. */
int kvm_arch_insert_hw_breakpoint(target_ulong addr,
                                  target_ulong len, int type)
{
    int unsupported = -ENOSYS;

    return unsupported;
}

/* Hardware breakpoints are not implemented; always returns -ENOSYS. */
int kvm_arch_remove_hw_breakpoint(target_ulong addr,
                                  target_ulong len, int type)
{
    int unsupported = -ENOSYS;

    return unsupported;
}

/* Nothing to remove: this file never installs hardware breakpoints. */
void kvm_arch_remove_all_hw_breakpoints(void)
{
    return;
}

/* Guest debug update hook; intentionally empty, @dbg is left untouched. */
void kvm_arch_update_guest_debug(CPUState *cpu, struct kvm_guest_debug *dbg)
{
    return;
}

A
Andreas Färber 已提交
374
/* Pre-run hook; intentionally empty. */
void kvm_arch_pre_run(CPUState *cpu, struct kvm_run *run)
{
    return;
}

A
Andreas Färber 已提交
378
/* Post-run hook; intentionally empty. */
void kvm_arch_post_run(CPUState *cpu, struct kvm_run *run)
{
    return;
}

A
Andreas Färber 已提交
382
/* Report the halted state of @cs; there are no async events to process. */
int kvm_arch_process_async_events(CPUState *cs)
{
    int halted = cs->halted;

    return halted;
}

387
/*
 * Inject an interrupt through the KVM_S390_INTERRUPT ioctl.
 *
 * @type, @parm and @parm64 are passed on unchanged.  A non-zero @vm
 * issues the ioctl on the VM, otherwise on the vcpu of @cpu.
 *
 * Does nothing if the CPU has no kvm_state.  A failing ioctl prints a
 * message to stderr and terminates the process with exit(1).
 */
void kvm_s390_interrupt_internal(S390CPU *cpu, int type, uint32_t parm,
                                 uint64_t parm64, int vm)
{
    CPUState *cs = CPU(cpu);
    struct kvm_s390_interrupt kvmint = {
        .type = type,
        .parm = parm,
        .parm64 = parm64,
    };
    int ret;

    if (!cs->kvm_state) {
        return;
    }

    ret = vm ? kvm_vm_ioctl(cs->kvm_state, KVM_S390_INTERRUPT, &kvmint)
             : kvm_vcpu_ioctl(cs, KVM_S390_INTERRUPT, &kvmint);
    if (ret >= 0) {
        return;
    }

    fprintf(stderr, "KVM failed to inject interrupt\n");
    exit(1);
}

414
/*
 * Inject a KVM_S390_INT_VIRTIO interrupt on the VM, with @config_change
 * as the 32-bit parameter and @token as the 64-bit parameter.
 */
void kvm_s390_virtio_irq(S390CPU *cpu, int config_change, uint64_t token)
{
    const int on_vm = 1;

    kvm_s390_interrupt_internal(cpu, KVM_S390_INT_VIRTIO, config_change,
                                token, on_vm);
}

420
/*
 * Inject an interrupt of @type on the vcpu of @cpu, with @code as the
 * 32-bit parameter and a zero 64-bit parameter.
 */
void kvm_s390_interrupt(S390CPU *cpu, int type, uint32_t code)
{
    const uint64_t no_parm64 = 0;
    const int on_vm = 0;

    kvm_s390_interrupt_internal(cpu, type, code, no_parm64, on_vm);
}

425
/* Inject a program interrupt with the given @code on the vcpu of @cpu. */
static void enter_pgmcheck(S390CPU *cpu, uint16_t code)
{
    uint32_t pgm_code = code;

    kvm_s390_interrupt(cpu, KVM_S390_PROGRAM_INT, pgm_code);
}

430
/*
 * Handle an intercepted SCLP service call.
 *
 * @ipbh0 is the upper halfword of the intercepted ipb: its low nibble
 * selects the register holding the SCCB value, the next nibble the
 * register holding the command code.
 *
 * A negative result of sclp_service_call() is injected as a program
 * interrupt with the negated value as code; any other result becomes
 * the condition code.  Always returns 0.
 */
static int kvm_sclp_service_call(S390CPU *cpu, struct kvm_run *run,
                                 uint16_t ipbh0)
{
    CPUS390XState *env = &cpu->env;
    unsigned int sccb_reg = ipbh0 & 0xf;
    unsigned int code_reg = (ipbh0 & 0xf0) >> 4;
    uint64_t sccb;
    uint32_t code;
    int rc;

    cpu_synchronize_state(CPU(cpu));
    sccb = env->regs[sccb_reg];
    code = env->regs[code_reg];

    rc = sclp_service_call(env, sccb, code);
    if (rc >= 0) {
        setcc(cpu, rc);
    } else {
        enter_pgmcheck(cpu, -rc);
    }

    return 0;
}

452
/*
 * Dispatch an intercepted 0xb2xx instruction.
 *
 * @ipa1 is the second opcode byte.  Channel I/O instructions are passed
 * to the matching ioinst_handle_*() helper, the SCLP service call to
 * kvm_sclp_service_call().
 *
 * Returns 0 for handled (or deliberately ignored) instructions, the
 * result of kvm_sclp_service_call() for SCLP calls, and -1 for an
 * opcode that is not handled here.
 */
static int handle_b2(S390CPU *cpu, struct kvm_run *run, uint8_t ipa1)
{
    CPUS390XState *env = &cpu->env;
    uint16_t ipbh0 = (run->s390_sieic.ipb & 0xffff0000) >> 16;
    uint64_t reg1, reg2;
    int ret = 0;

    cpu_synchronize_state(CPU(cpu));

    /* Register operands used by the I/O instructions below. */
    reg1 = env->regs[1];
    reg2 = env->regs[2];

    switch (ipa1) {
    case PRIV_B2_SCLP_CALL:
        ret = kvm_sclp_service_call(cpu, run, ipbh0);
        break;
    case PRIV_B2_CSCH:
        ioinst_handle_csch(cpu, reg1);
        break;
    case PRIV_B2_HSCH:
        ioinst_handle_hsch(cpu, reg1);
        break;
    case PRIV_B2_MSCH:
        ioinst_handle_msch(cpu, reg1, run->s390_sieic.ipb);
        break;
    case PRIV_B2_SSCH:
        ioinst_handle_ssch(cpu, reg1, run->s390_sieic.ipb);
        break;
    case PRIV_B2_STSCH:
        ioinst_handle_stsch(cpu, reg1, run->s390_sieic.ipb);
        break;
    case PRIV_B2_TSCH:
        /* We should only get tsch via KVM_EXIT_S390_TSCH. */
        fprintf(stderr, "Spurious tsch intercept\n");
        break;
    case PRIV_B2_TPI:
        /* This should have been handled by kvm already. */
        fprintf(stderr, "Spurious tpi intercept\n");
        break;
    case PRIV_B2_SAL:
        ioinst_handle_sal(cpu, reg1);
        break;
    case PRIV_B2_RSCH:
        ioinst_handle_rsch(cpu, reg1);
        break;
    case PRIV_B2_STCRW:
        ioinst_handle_stcrw(cpu, run->s390_sieic.ipb);
        break;
    case PRIV_B2_STCPS:
        /* We do not provide this instruction, it is suppressed. */
        break;
    case PRIV_B2_RCHP:
        ioinst_handle_rchp(cpu, reg1);
        break;
    case PRIV_B2_SCHM:
        ioinst_handle_schm(cpu, reg1, reg2, run->s390_sieic.ipb);
        break;
    case PRIV_B2_CHSC:
        ioinst_handle_chsc(cpu, run->s390_sieic.ipb);
        break;
    case PRIV_B2_SIGA:
        /* Not provided, set CC = 3 for subchannel not operational */
        setcc(cpu, 3);
        break;
    case PRIV_B2_XSCH:
        ioinst_handle_xsch(cpu, reg1);
        break;
    default:
        ret = -1;
        DPRINTF("KVM: unhandled PRIV: 0xb2%x\n", ipa1);
        break;
    }

    return ret;
}

525
/*
 * Handle an intercepted 0xb9xx instruction.
 *
 * Nothing is emulated here: EQBS and every other opcode return -1, so
 * the caller injects an exception.  Unknown opcodes are additionally
 * logged through DPRINTF.
 */
static int handle_b9(S390CPU *cpu, struct kvm_run *run, uint8_t ipa1)
{
    if (ipa1 != PRIV_B9_EQBS) {
        DPRINTF("KVM: unhandled PRIV: 0xb9%x\n", ipa1);
    }

    /* just inject exception */
    return -1;
}

/*
 * Handle an intercepted 0xebxx instruction.
 *
 * Nothing is emulated here: SQBS and every other opcode return -1, so
 * the caller injects an exception.  Unknown opcodes are additionally
 * logged through DPRINTF.
 */
static int handle_eb(S390CPU *cpu, struct kvm_run *run, uint8_t ipa1)
{
    if (ipa1 != PRIV_EB_SQBS) {
        DPRINTF("KVM: unhandled PRIV: 0xeb%x\n", ipa1);
    }

    /* just inject exception */
    return -1;
}

561
/*
 * Handle the KVM hypercall diagnose by forwarding it to
 * s390_virtio_hypercall().
 *
 * An -EINVAL result is turned into a specification program interrupt
 * and reported as handled (0); any other result is returned as is.
 */
static int handle_hypercall(S390CPU *cpu, struct kvm_run *run)
{
    int rc;

    cpu_synchronize_state(CPU(cpu));

    rc = s390_virtio_hypercall(&cpu->env);
    if (rc != -EINVAL) {
        return rc;
    }

    enter_pgmcheck(cpu, PGM_SPECIFICATION);
    return 0;
}

576 577 578 579 580 581 582 583 584 585
/*
 * Handle the DIAG_IPL (0x308) diagnose.
 *
 * The two register numbers are decoded from the low byte of the
 * intercepted ipa: r1 is its high nibble (bits 4-7), r3 its low nibble.
 * Both are handed to handle_diag_308() together with the CPU state.
 */
static void kvm_handle_diag_308(S390CPU *cpu, struct kvm_run *run)
{
    uint64_t r1, r3;

    cpu_synchronize_state(CPU(cpu));
    /*
     * The 0x00f0 mask keeps bits 4-7, so the field has to be shifted
     * down by 4.  A shift by 8 would discard it and always yield 0.
     */
    r1 = (run->s390_sieic.ipa & 0x00f0) >> 4;
    r3 = run->s390_sieic.ipa & 0x000f;
    handle_diag_308(&cpu->env, r1, r3);
}

586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601
/*
 * Handle the breakpoint diagnose.
 *
 * The candidate breakpoint address is the PSW address minus 4.  If a
 * software breakpoint is registered there, the PSW address is rewound
 * to it and EXCP_DEBUG is returned; otherwise -ENOENT.
 */
static int handle_sw_breakpoint(S390CPU *cpu, struct kvm_run *run)
{
    CPUS390XState *env = &cpu->env;
    unsigned long bp_addr;

    cpu_synchronize_state(CPU(cpu));

    bp_addr = env->psw.addr - 4;
    if (!kvm_find_sw_breakpoint(CPU(cpu), bp_addr)) {
        return -ENOENT;
    }

    env->psw.addr = bp_addr;
    return EXCP_DEBUG;
}

C
Cornelia Huck 已提交
602 603 604
#define DIAG_KVM_CODE_MASK 0x000000000000ffff

/*
 * Dispatch an intercepted DIAGNOSE instruction.
 *
 * For any diagnose call we support, bits 48-63 of the address decoded
 * from @ipb specify the function code; the remainder is ignored.
 *
 * Returns the handler's result (0 for DIAG_IPL), or -1 for an unknown
 * function code.
 */
static int handle_diag(S390CPU *cpu, struct kvm_run *run, uint32_t ipb)
{
    uint16_t func_code =
        decode_basedisp_rs(&cpu->env, ipb) & DIAG_KVM_CODE_MASK;

    switch (func_code) {
    case DIAG_IPL:
        kvm_handle_diag_308(cpu, run);
        return 0;
    case DIAG_KVM_HYPERCALL:
        return handle_hypercall(cpu, run);
    case DIAG_KVM_BREAKPOINT:
        return handle_sw_breakpoint(cpu, run);
    default:
        DPRINTF("KVM: unknown DIAG: 0x%x\n", func_code);
        return -1;
    }
}

T
Thomas Huth 已提交
633 634 635 636 637 638 639 640
/*
 * Start @cpu: add it to the set of running CPUs and kick it.
 * Always returns 0.
 */
static int kvm_s390_cpu_start(S390CPU *cpu)
{
    CPUState *cs = CPU(cpu);

    s390_add_running_cpu(cpu);
    qemu_cpu_kick(cs);
    DPRINTF("DONE: KVM cpu start: %p\n", &cpu->env);

    return 0;
}

641
/*
 * Restart @cpu: inject a KVM_S390_RESTART interrupt, add the CPU to
 * the set of running CPUs and kick it.  Always returns 0.
 */
int kvm_s390_cpu_restart(S390CPU *cpu)
{
    CPUState *cs;

    kvm_s390_interrupt(cpu, KVM_S390_RESTART, 0);
    s390_add_running_cpu(cpu);

    cs = CPU(cpu);
    qemu_cpu_kick(cs);
    DPRINTF("DONE: KVM cpu restart: %p\n", &cpu->env);

    return 0;
}

650
static void sigp_initial_cpu_reset(void *arg)
A
Alexander Graf 已提交
651
{
652 653
    CPUState *cpu = arg;
    S390CPUClass *scc = S390_CPU_GET_CLASS(cpu);
654

655 656
    cpu_synchronize_state(cpu);
    scc->initial_cpu_reset(cpu);
A
Alexander Graf 已提交
657 658
}

659 660 661 662 663 664 665 666 667
/*
 * run_on_cpu() callback for SIGP CPU RESET.
 *
 * @arg is the CPUState to reset; its state is synchronized first and
 * then the class' cpu_reset hook is invoked.
 */
static void sigp_cpu_reset(void *arg)
{
    CPUState *cs = arg;
    S390CPUClass *klass = S390_CPU_GET_CLASS(cs);

    cpu_synchronize_state(cs);
    klass->cpu_reset(cs);
}

668 669
#define SIGP_ORDER_MASK 0x000000ff

A
Andreas Färber 已提交
670
/*
 * Handle an intercepted SIGNAL PROCESSOR instruction.
 *
 * @ipa1 holds two register numbers: the high nibble names the status
 * register, the low nibble the register holding the target CPU address.
 * The order code is the low byte of the address decoded from the ipb.
 *
 * The resulting condition code is set on the issuing CPU:
 *   3 if the target CPU does not exist,
 *   1 if a status was stored (SET ARCH and unknown orders),
 *   otherwise the result of the order (0 for the reset orders).
 *
 * Always returns 0.
 */
static int handle_sigp(S390CPU *cpu, struct kvm_run *run, uint8_t ipa1)
{
    CPUS390XState *env = &cpu->env;
    uint64_t *status = &env->regs[ipa1 >> 4];
    S390CPU *dst;
    uint16_t dst_addr;
    uint8_t order;
    int cc;

    cpu_synchronize_state(CPU(cpu));

    /* get order code */
    order = decode_basedisp_rs(env, run->s390_sieic.ipb) & SIGP_ORDER_MASK;

    dst_addr = env->regs[ipa1 & 0x0f];
    dst = s390_cpu_addr2state(dst_addr);

    if (dst == NULL) {
        cc = 3;    /* not operational */
    } else {
        switch (order) {
        case SIGP_START:
            cc = kvm_s390_cpu_start(dst);
            break;
        case SIGP_RESTART:
            cc = kvm_s390_cpu_restart(dst);
            break;
        case SIGP_SET_ARCH:
            *status &= 0xffffffff00000000UL;
            *status |= SIGP_STAT_INVALID_PARAMETER;
            cc = 1;   /* status stored */
            break;
        case SIGP_INITIAL_CPU_RESET:
            run_on_cpu(CPU(dst), sigp_initial_cpu_reset, CPU(dst));
            cc = 0;
            break;
        case SIGP_CPU_RESET:
            run_on_cpu(CPU(dst), sigp_cpu_reset, CPU(dst));
            cc = 0;
            break;
        default:
            DPRINTF("KVM: unknown SIGP: 0x%x\n", order);
            *status &= 0xffffffff00000000UL;
            *status |= SIGP_STAT_INVALID_ORDER;
            cc = 1;   /* status stored */
            break;
        }
    }

    setcc(cpu, cc);
    return 0;
}

724
/*
 * Dispatch an instruction intercept on the first opcode byte of the
 * intercepted ipa.
 *
 * If no handler exists for the opcode, or the handler returns a
 * negative value, a program interrupt with code 0x0001 is injected and
 * 0 is returned.  Otherwise the handler's result is returned.
 */
static int handle_instruction(S390CPU *cpu, struct kvm_run *run)
{
    unsigned int ipa0 = (run->s390_sieic.ipa & 0xff00);
    uint8_t ipa1 = run->s390_sieic.ipa & 0x00ff;
    int rc;

    DPRINTF("handle_instruction 0x%x 0x%x\n",
            run->s390_sieic.ipa, run->s390_sieic.ipb);

    switch (ipa0) {
    case IPA0_DIAG:
        rc = handle_diag(cpu, run, run->s390_sieic.ipb);
        break;
    case IPA0_SIGP:
        rc = handle_sigp(cpu, run, ipa1);
        break;
    case IPA0_B2:
        rc = handle_b2(cpu, run, ipa1);
        break;
    case IPA0_B9:
        rc = handle_b9(cpu, run, ipa1);
        break;
    case IPA0_EB:
        rc = handle_eb(cpu, run, ipa1);
        break;
    default:
        /* No handler for this opcode. */
        rc = -1;
        break;
    }

    if (rc >= 0) {
        return rc;
    }

    enter_pgmcheck(cpu, 0x0001);
    return 0;
}

A
Andreas Färber 已提交
758
/*
 * Tell whether the current PSW address is the special value 0xfff,
 * which is used to signal quiesce.
 */
static bool is_special_wait_psw(CPUState *cs)
{
    const unsigned long quiesce_addr = 0xfffUL;

    return cs->kvm_run->psw_addr == quiesce_addr;
}

764
/*
 * Handle a SIE intercept (KVM_EXIT_S390_SIEIC).
 *
 * Instruction intercepts go to handle_instruction().  A wait PSW or
 * CPU stop intercept removes the CPU from the running set and returns
 * EXCP_HALTED; when s390_del_running_cpu() returns 0 this additionally
 * requests a shutdown, or, for a wait PSW that is not the special
 * quiesce one, raises a guest-panicked event and stops the VM.
 *
 * Soft, I/O and unknown intercepts are not implemented: they print a
 * message to stderr and terminate the process with exit(1).
 */
static int handle_intercept(S390CPU *cpu)
{
    CPUState *cs = CPU(cpu);
    struct kvm_run *run = cs->kvm_run;
    int icpt_code = run->s390_sieic.icptcode;

    DPRINTF("intercept: 0x%x (at 0x%lx)\n", icpt_code,
            (long)cs->kvm_run->psw_addr);

    switch (icpt_code) {
    case ICPT_INSTRUCTION:
        return handle_instruction(cpu, run);

    case ICPT_WAITPSW:
        /* disabled wait, since enabled wait is handled in kernel */
        if (s390_del_running_cpu(cpu) != 0) {
            return EXCP_HALTED;
        }
        if (is_special_wait_psw(cs)) {
            qemu_system_shutdown_request();
        } else {
            QObject *data;

            data = qobject_from_jsonf("{ 'action': %s }", "pause");
            monitor_protocol_event(QEVENT_GUEST_PANICKED, data);
            qobject_decref(data);
            vm_stop(RUN_STATE_GUEST_PANICKED);
        }
        return EXCP_HALTED;

    case ICPT_CPU_STOP:
        if (s390_del_running_cpu(cpu) == 0) {
            qemu_system_shutdown_request();
        }
        return EXCP_HALTED;

    case ICPT_SOFT_INTERCEPT:
        fprintf(stderr, "KVM unimplemented icpt SOFT\n");
        exit(1);

    case ICPT_IO:
        fprintf(stderr, "KVM unimplemented icpt IO\n");
        exit(1);

    default:
        fprintf(stderr, "Unknown intercept code: %d\n", icpt_code);
        exit(1);
    }

    return 0;
}

816 817 818 819 820 821 822
/*
 * Handle a KVM_EXIT_S390_TSCH exit.
 *
 * A non-negative result of ioinst_handle_tsch() is the condition code
 * and is set on the CPU.  A result below -1 is a failure: if the kernel
 * had dequeued an I/O interrupt it is reinjected.  Both cases return 0.
 * A result of exactly -1 is passed through to the caller unchanged.
 */
static int handle_tsch(S390CPU *cpu)
{
    CPUS390XState *env = &cpu->env;
    CPUState *cs = CPU(cpu);
    struct kvm_run *run = cs->kvm_run;
    int rc;

    cpu_synchronize_state(cs);

    rc = ioinst_handle_tsch(env, env->regs[1], run->s390_tsch.ipb);
    if (rc >= 0) {
        /* Success; set condition code. */
        setcc(cpu, rc);
        return 0;
    }
    if (rc == -1) {
        return rc;
    }

    /*
     * Failure.
     * If an I/O interrupt had been dequeued, we have to reinject it.
     */
    if (run->s390_tsch.dequeued) {
        uint16_t subchannel_id = run->s390_tsch.subchannel_id;
        uint16_t subchannel_nr = run->s390_tsch.subchannel_nr;
        uint32_t io_int_parm = run->s390_tsch.io_int_parm;
        uint32_t io_int_word = run->s390_tsch.io_int_word;
        /*
         * NOTE(review): subchannel_id is promoted to int here, so with a
         * 32-bit int the (… & 0xff00) << 24 term shifts past bit 31 --
         * confirm the intended layout against KVM_S390_INT_IO().
         */
        uint32_t type = ((subchannel_id & 0xff00) << 24) |
            ((subchannel_id & 0x00060) << 22) | (subchannel_nr << 16);
        uint32_t parm = ((uint32_t)subchannel_id << 16) | subchannel_nr;
        uint64_t parm64 = ((uint64_t)io_int_parm << 32) | io_int_word;

        kvm_s390_interrupt_internal(cpu, type, parm, parm64, 1);
    }

    return 0;
}

854 855 856 857 858
/* Debug exits are not implemented; always returns -ENOSYS. */
static int kvm_arch_handle_debug_exit(S390CPU *cpu)
{
    int unsupported = -ENOSYS;

    return unsupported;
}

A
Andreas Färber 已提交
859
/*
 * Handle an s390 specific KVM exit.
 *
 * Dispatches on run->exit_reason.  An unknown reason is only reported
 * on stderr.  A handler result of 0 is mapped to EXCP_INTERRUPT; any
 * other result is returned unchanged.
 */
int kvm_arch_handle_exit(CPUState *cs, struct kvm_run *run)
{
    S390CPU *cpu = S390_CPU(cs);
    int rc = 0;

    switch (run->exit_reason) {
    case KVM_EXIT_S390_SIEIC:
        rc = handle_intercept(cpu);
        break;
    case KVM_EXIT_S390_RESET:
        qemu_system_reset_request();
        break;
    case KVM_EXIT_S390_TSCH:
        rc = handle_tsch(cpu);
        break;
    case KVM_EXIT_DEBUG:
        rc = kvm_arch_handle_debug_exit(cpu);
        break;
    default:
        fprintf(stderr, "Unknown KVM exit: %d\n", run->exit_reason);
        break;
    }

    return rc == 0 ? EXCP_INTERRUPT : rc;
}
887

A
Andreas Färber 已提交
888
/* Always returns true, regardless of @cpu. */
bool kvm_arch_stop_on_emulation_error(CPUState *cpu)
{
    const bool stop = true;

    return stop;
}
892

A
Andreas Färber 已提交
893
/* Per-vcpu SIGBUS hook; nothing is handled here, always returns 1. */
int kvm_arch_on_sigbus_vcpu(CPUState *cpu, int code, void *addr)
{
    const int result = 1;

    return result;
}

/* SIGBUS hook; nothing is handled here, always returns 1. */
int kvm_arch_on_sigbus(int code, void *addr)
{
    const int result = 1;

    return result;
}
902 903 904 905 906 907 908

/*
 * Inject an I/O interrupt on the VM.
 *
 * If IO_INT_WORD_AI is set in @io_int_word the interrupt type is
 * KVM_S390_INT_IO(1, 0, 0, 0); otherwise it is built from
 * @subchannel_id and @subchannel_nr.  The 32-bit parameter carries the
 * subchannel id/number pair, the 64-bit parameter @io_int_parm in the
 * upper and @io_int_word in the lower half.
 */
void kvm_s390_io_interrupt(S390CPU *cpu, uint16_t subchannel_id,
                           uint16_t subchannel_nr, uint32_t io_int_parm,
                           uint32_t io_int_word)
{
    uint32_t parm = ((uint32_t)subchannel_id << 16) | subchannel_nr;
    uint64_t parm64 = ((uint64_t)io_int_parm << 32) | io_int_word;
    uint32_t type;

    if (!(io_int_word & IO_INT_WORD_AI)) {
        type = ((subchannel_id & 0xff00) << 24) |
            ((subchannel_id & 0x00060) << 22) | (subchannel_nr << 16);
    } else {
        type = KVM_S390_INT_IO(1, 0, 0, 0);
    }

    kvm_s390_interrupt_internal(cpu, type, parm, parm64, 1);
}

/*
 * Inject a KVM_S390_MCHK interrupt on the VM with the fixed parameters
 * 1 << 28 (32 bit) and 0x00400f1d40330000 (64 bit).
 */
void kvm_s390_crw_mchk(S390CPU *cpu)
{
    const uint32_t parm = 1 << 28;
    const uint64_t parm64 = 0x00400f1d40330000;

    kvm_s390_interrupt_internal(cpu, KVM_S390_MCHK, parm, parm64, 1);
}

/*
 * Activate host kernel channel subsystem support by enabling
 * KVM_CAP_S390_CSS_SUPPORT on the vcpu of @cpu.  The result is checked
 * with assert().
 */
void kvm_s390_enable_css_support(S390CPU *cpu)
{
    CPUState *cs = CPU(cpu);
    int rc = kvm_vcpu_enable_cap(cs, KVM_CAP_S390_CSS_SUPPORT, 0);

    assert(rc == 0);
}
934 935 936

/*
 * Set up the irq routing related globals.
 *
 * Note that while irqchip capabilities generally imply that cpustates
 * are handled in-kernel, it is not true for s390 (yet); therefore, we
 * have to override the common code kvm_halt_in_kernel_allowed setting.
 */
void kvm_arch_init_irq_routing(KVMState *s)
{
    if (!kvm_check_extension(s, KVM_CAP_IRQ_ROUTING)) {
        return;
    }

    kvm_irqfds_allowed = true;
    kvm_gsi_routing_allowed = true;
    kvm_halt_in_kernel_allowed = false;
}
C
Cornelia Huck 已提交
948

949 950
/*
 * Assign or deassign an ioeventfd for a virtio-ccw notification.
 *
 * The eventfd of @notifier is registered with @sch as address and @vq
 * as data match; @assign false adds the DEASSIGN flag.
 *
 * Returns -ENOSYS if KVM_CAP_IOEVENTFD is not available, otherwise the
 * result of the KVM_IOEVENTFD ioctl.
 */
int kvm_s390_assign_subch_ioeventfd(EventNotifier *notifier, uint32_t sch,
                                    int vq, bool assign)
{
    struct kvm_ioeventfd kick = {
        .datamatch = vq,
        .addr = sch,
        .len = 8,
        .fd = event_notifier_get_fd(notifier),
        .flags = KVM_IOEVENTFD_FLAG_VIRTIO_CCW_NOTIFY |
        KVM_IOEVENTFD_FLAG_DATAMATCH,
    };

    if (!kvm_check_extension(kvm_state, KVM_CAP_IOEVENTFD)) {
        return -ENOSYS;
    }

    if (assign) {
        return kvm_vm_ioctl(kvm_state, KVM_IOEVENTFD, &kick);
    }

    kick.flags |= KVM_IOEVENTFD_FLAG_DEASSIGN;
    return kvm_vm_ioctl(kvm_state, KVM_IOEVENTFD, &kick);
}