/*
 * QEMU S390x KVM implementation
 *
 * Copyright (c) 2009 Alexander Graf <agraf@suse.de>
 * Copyright IBM Corp. 2012
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * Contributions after 2012-10-29 are licensed under the terms of the
 * GNU GPL, version 2 or (at your option) any later version.
 *
 * You should have received a copy of the GNU (Lesser) General Public
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 */

#include <sys/types.h>
#include <sys/ioctl.h>
#include <sys/mman.h>

#include <linux/kvm.h>
#include <asm/ptrace.h>

#include "qemu-common.h"
32
#include "qemu/timer.h"
33 34
#include "sysemu/sysemu.h"
#include "sysemu/kvm.h"
A
Alexander Graf 已提交
35
#include "cpu.h"
36
#include "sysemu/device_tree.h"
37 38
#include "qapi/qmp/qjson.h"
#include "monitor/monitor.h"
39
#include "trace.h"
A
Alexander Graf 已提交
40 41 42 43

/* #define DEBUG_KVM */

/*
 * Debug tracing helper: DPRINTF() forwards its arguments to
 * fprintf(stderr, ...) when DEBUG_KVM is defined and expands to an empty
 * statement otherwise.
 */
#ifdef DEBUG_KVM
#define DPRINTF(fmt, ...) \
    do { fprintf(stderr, fmt, ## __VA_ARGS__); } while (0)
#else
#define DPRINTF(fmt, ...) \
    do { } while (0)
#endif

/* Values matched against (ipa & 0xff00) of an intercepted instruction. */
#define IPA0_DIAG                       0x8300
#define IPA0_SIGP                       0xae00
#define IPA0_B2                         0xb200
#define IPA0_B9                         0xb900
#define IPA0_EB                         0xeb00

/* Values matched against the low ipa byte for IPA0_B2 instructions. */
#define PRIV_B2_SCLP_CALL               0x20
#define PRIV_B2_CSCH                    0x30
#define PRIV_B2_HSCH                    0x31
#define PRIV_B2_MSCH                    0x32
#define PRIV_B2_SSCH                    0x33
#define PRIV_B2_STSCH                   0x34
#define PRIV_B2_TSCH                    0x35
#define PRIV_B2_TPI                     0x36
#define PRIV_B2_SAL                     0x37
#define PRIV_B2_RSCH                    0x38
#define PRIV_B2_STCRW                   0x39
#define PRIV_B2_STCPS                   0x3a
#define PRIV_B2_RCHP                    0x3b
#define PRIV_B2_SCHM                    0x3c
#define PRIV_B2_CHSC                    0x5f
#define PRIV_B2_SIGA                    0x74
#define PRIV_B2_XSCH                    0x76

/* Value matched against the low ipa byte for IPA0_EB instructions. */
#define PRIV_EB_SQBS                    0x8a

/* Value matched against the low ipa byte for IPA0_B9 instructions. */
#define PRIV_B9_EQBS                    0x9c

/* DIAGNOSE function codes. */
#define DIAG_IPL                        0x308
#define DIAG_KVM_HYPERCALL              0x500
#define DIAG_KVM_BREAKPOINT             0x501

/* Intercept codes matched against kvm_run->s390_sieic.icptcode. */
#define ICPT_INSTRUCTION                0x04
#define ICPT_WAITPSW                    0x1c
#define ICPT_SOFT_INTERCEPT             0x24
#define ICPT_CPU_STOP                   0x28
#define ICPT_IO                         0x40

89 90 91 92
/* Required-capability table; it holds only the terminating sentinel. */
const KVMCapabilityInfo kvm_arch_required_capabilities[] = {
    KVM_CAP_LAST_INFO
};

/* Results of the kvm_check_extension() probes done in kvm_arch_init(). */
static int cap_sync_regs;
static int cap_async_pf;

static void *legacy_s390_alloc(size_t size);
97

98
/*
 * Architecture-specific KVM initialisation.
 *
 * Caches whether KVM_CAP_SYNC_REGS and KVM_CAP_ASYNC_PF are available and,
 * when either KVM_CAP_S390_GMAP or KVM_CAP_S390_COW is missing, installs
 * legacy_s390_alloc() as the guest memory allocator.
 *
 * Always returns 0.
 */
int kvm_arch_init(KVMState *s)
{
    cap_sync_regs = kvm_check_extension(s, KVM_CAP_SYNC_REGS);
    cap_async_pf = kvm_check_extension(s, KVM_CAP_ASYNC_PF);
    if (!kvm_check_extension(s, KVM_CAP_S390_GMAP)
        || !kvm_check_extension(s, KVM_CAP_S390_COW)) {
        phys_mem_set_alloc(legacy_s390_alloc);
    }
    return 0;
}

109 110 111 112 113
/* Return the vcpu identifier for @cpu, which is simply its cpu_index. */
unsigned long kvm_arch_vcpu_id(CPUState *cpu)
{
    unsigned long vcpu_id = cpu->cpu_index;

    return vcpu_id;
}

A
Andreas Färber 已提交
114
/* Per-vcpu initialisation hook; nothing is required yet, so it returns 0. */
int kvm_arch_init_vcpu(CPUState *cpu)
{
    /* nothing todo yet */
    return 0;
}

120
/*
 * Issue KVM_S390_INITIAL_RESET for @cpu.
 *
 * A failing ioctl is reported with perror() and otherwise ignored.
 */
void kvm_s390_reset_vcpu(S390CPU *cpu)
{
    CPUState *cs = CPU(cpu);

    /* The initial reset call is needed here to reset in-kernel
     * vcpu data that we can't access directly from QEMU
     * (i.e. with older kernels which don't support sync_regs/ONE_REG).
     * Before this ioctl cpu_synchronize_state() is called in common kvm
     * code (kvm-all) */
    if (kvm_vcpu_ioctl(cs, KVM_S390_INITIAL_RESET, NULL)) {
        /*
         * perror() appends ": <error text>\n" itself, so the prefix must
         * not end in a newline.
         */
        perror("Can't reset vcpu");
    }
}

A
Andreas Färber 已提交
134
/*
 * Copy register state from QEMU's CPU environment into KVM.
 *
 * The PSW and general purpose registers are always written.  When @level is
 * KVM_PUT_RUNTIME_STATE nothing else is transferred.  Otherwise the timer
 * related ONE_REGs, the pfault registers (if cap_async_pf), the access and
 * control registers and the prefix are written as well.
 *
 * Where the sync-regs area reports a register set as valid it is used and
 * the set is flagged in kvm_dirty_regs; otherwise the corresponding
 * KVM_SET_REGS / KVM_SET_SREGS ioctl is issued.
 *
 * Returns 0 on success or the negative value returned by a failing ioctl /
 * pfault ONE_REG access.
 */
int kvm_arch_put_registers(CPUState *cs, int level)
{
    S390CPU *cpu = S390_CPU(cs);
    CPUS390XState *env = &cpu->env;
    struct kvm_sregs sregs;
    struct kvm_regs regs;
    int r;
    int i;

    /* always save the PSW and the GPRS */
    cs->kvm_run->psw_addr = env->psw.addr;
    cs->kvm_run->psw_mask = env->psw.mask;

    if (cap_sync_regs && (cs->kvm_run->kvm_valid_regs & KVM_SYNC_GPRS)) {
        for (i = 0; i < 16; i++) {
            cs->kvm_run->s.regs.gprs[i] = env->regs[i];
        }
        /* Flag the set once, after all registers have been copied. */
        cs->kvm_run->kvm_dirty_regs |= KVM_SYNC_GPRS;
    } else {
        for (i = 0; i < 16; i++) {
            regs.gprs[i] = env->regs[i];
        }
        r = kvm_vcpu_ioctl(cs, KVM_SET_REGS, &regs);
        if (r < 0) {
            return r;
        }
    }

    /* Do we need to save more than that? */
    if (level == KVM_PUT_RUNTIME_STATE) {
        return 0;
    }

    /*
     * These ONE_REGS are not protected by a capability. As they are only
     * necessary for migration, a failure is not treated as fatal: the
     * return values are deliberately ignored here.
     */
    kvm_set_one_reg(cs, KVM_REG_S390_CPU_TIMER, &env->cputm);
    kvm_set_one_reg(cs, KVM_REG_S390_CLOCK_COMP, &env->ckc);
    kvm_set_one_reg(cs, KVM_REG_S390_TODPR, &env->todpr);
    kvm_set_one_reg(cs, KVM_REG_S390_GBEA, &env->gbea);
    kvm_set_one_reg(cs, KVM_REG_S390_PP, &env->pp);

    if (cap_async_pf) {
        r = kvm_set_one_reg(cs, KVM_REG_S390_PFTOKEN, &env->pfault_token);
        if (r < 0) {
            return r;
        }
        r = kvm_set_one_reg(cs, KVM_REG_S390_PFCOMPARE, &env->pfault_compare);
        if (r < 0) {
            return r;
        }
        r = kvm_set_one_reg(cs, KVM_REG_S390_PFSELECT, &env->pfault_select);
        if (r < 0) {
            return r;
        }
    }

    /* Access and control registers travel together. */
    if (cap_sync_regs &&
        (cs->kvm_run->kvm_valid_regs & KVM_SYNC_ACRS) &&
        (cs->kvm_run->kvm_valid_regs & KVM_SYNC_CRS)) {
        for (i = 0; i < 16; i++) {
            cs->kvm_run->s.regs.acrs[i] = env->aregs[i];
            cs->kvm_run->s.regs.crs[i] = env->cregs[i];
        }
        cs->kvm_run->kvm_dirty_regs |= KVM_SYNC_ACRS;
        cs->kvm_run->kvm_dirty_regs |= KVM_SYNC_CRS;
    } else {
        for (i = 0; i < 16; i++) {
            sregs.acrs[i] = env->aregs[i];
            sregs.crs[i] = env->cregs[i];
        }
        r = kvm_vcpu_ioctl(cs, KVM_SET_SREGS, &sregs);
        if (r < 0) {
            return r;
        }
    }

    /* Finally the prefix */
    if (cap_sync_regs && (cs->kvm_run->kvm_valid_regs & KVM_SYNC_PREFIX)) {
        cs->kvm_run->s.regs.prefix = env->psa;
        cs->kvm_run->kvm_dirty_regs |= KVM_SYNC_PREFIX;
    } else {
        /* prefix is only supported via sync regs */
    }
    return 0;
}

A
Andreas Färber 已提交
223
/*
 * Copy register state from KVM into QEMU's CPU environment.
 *
 * Reads the PSW, general purpose, access and control registers, the prefix
 * (only available through sync regs), the timer related ONE_REGs and, if
 * cap_async_pf is set, the pfault registers.
 *
 * Register sets reported valid in the sync-regs area are taken from there;
 * otherwise KVM_GET_REGS / KVM_GET_SREGS is used.
 *
 * Returns 0 on success or the negative value returned by a failing ioctl /
 * pfault ONE_REG access.
 */
int kvm_arch_get_registers(CPUState *cs)
{
    S390CPU *cpu = S390_CPU(cs);
    CPUS390XState *env = &cpu->env;
    struct kvm_sregs sregs;
    struct kvm_regs regs;
    int i, r;

    /* get the PSW */
    env->psw.addr = cs->kvm_run->psw_addr;
    env->psw.mask = cs->kvm_run->psw_mask;

    /* the GPRS */
    if (cap_sync_regs && (cs->kvm_run->kvm_valid_regs & KVM_SYNC_GPRS)) {
        for (i = 0; i < 16; i++) {
            env->regs[i] = cs->kvm_run->s.regs.gprs[i];
        }
    } else {
        r = kvm_vcpu_ioctl(cs, KVM_GET_REGS, &regs);
        if (r < 0) {
            return r;
        }
        for (i = 0; i < 16; i++) {
            env->regs[i] = regs.gprs[i];
        }
    }

    /* The ACRS and CRS */
    if (cap_sync_regs &&
        (cs->kvm_run->kvm_valid_regs & KVM_SYNC_ACRS) &&
        (cs->kvm_run->kvm_valid_regs & KVM_SYNC_CRS)) {
        for (i = 0; i < 16; i++) {
            env->aregs[i] = cs->kvm_run->s.regs.acrs[i];
            env->cregs[i] = cs->kvm_run->s.regs.crs[i];
        }
    } else {
        r = kvm_vcpu_ioctl(cs, KVM_GET_SREGS, &sregs);
        if (r < 0) {
            return r;
        }
        for (i = 0; i < 16; i++) {
            env->aregs[i] = sregs.acrs[i];
            env->cregs[i] = sregs.crs[i];
        }
    }

    /* The prefix */
    if (cap_sync_regs && (cs->kvm_run->kvm_valid_regs & KVM_SYNC_PREFIX)) {
        env->psa = cs->kvm_run->s.regs.prefix;
    }

    /*
     * These ONE_REGS are not protected by a capability. As they are only
     * necessary for migration, a failure is not treated as fatal: the
     * return values are deliberately ignored here.
     */
    kvm_get_one_reg(cs, KVM_REG_S390_CPU_TIMER, &env->cputm);
    kvm_get_one_reg(cs, KVM_REG_S390_CLOCK_COMP, &env->ckc);
    kvm_get_one_reg(cs, KVM_REG_S390_TODPR, &env->todpr);
    kvm_get_one_reg(cs, KVM_REG_S390_GBEA, &env->gbea);
    kvm_get_one_reg(cs, KVM_REG_S390_PP, &env->pp);

    if (cap_async_pf) {
        r = kvm_get_one_reg(cs, KVM_REG_S390_PFTOKEN, &env->pfault_token);
        if (r < 0) {
            return r;
        }
        r = kvm_get_one_reg(cs, KVM_REG_S390_PFCOMPARE, &env->pfault_compare);
        if (r < 0) {
            return r;
        }
        r = kvm_get_one_reg(cs, KVM_REG_S390_PFSELECT, &env->pfault_select);
        if (r < 0) {
            return r;
        }
    }

    return 0;
}

303 304 305 306 307 308 309 310 311 312
/*
 * Legacy layout for s390:
 * Older S390 KVM requires the topmost vma of the RAM to be
 * smaller than an system defined value, which is at least 256GB.
 * Larger systems have larger values. We put the guest between
 * the end of data segment (system break) and this value. We
 * use 32GB as a base to have enough room for the system break
 * to grow. We also have to use MAP parameters that avoid
 * read-only mapping of guest pages.
 */
313
static void *legacy_s390_alloc(size_t size)
314 315 316 317 318 319
{
    void *mem;

    mem = mmap((void *) 0x800000000ULL, size,
               PROT_EXEC|PROT_READ|PROT_WRITE,
               MAP_SHARED | MAP_ANONYMOUS | MAP_FIXED, -1, 0);
320
    return mem == MAP_FAILED ? NULL : mem;
321 322
}

323 324 325
/*
 * DIAG 501 is used for sw breakpoints.
 * These four bytes are written over the guest instruction at a breakpoint
 * address: the first byte (0x83) matches the IPA0_DIAG opcode and the
 * trailing 0x501 matches DIAG_KVM_BREAKPOINT.
 */
static const uint8_t diag_501[] = {0x83, 0x24, 0x05, 0x01};

A
Andreas Färber 已提交
326
/*
 * Insert a software breakpoint at bp->pc.
 *
 * The sizeof(diag_501) bytes currently at bp->pc are saved into
 * bp->saved_insn and then overwritten with the diag_501 sequence.
 *
 * Returns 0 on success, -EINVAL if either guest memory access fails.
 */
int kvm_arch_insert_sw_breakpoint(CPUState *cs, struct kvm_sw_breakpoint *bp)
{
    /* First access (last argument 0) reads, second (1) writes. */
    if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&bp->saved_insn,
                            sizeof(diag_501), 0) ||
        cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)diag_501,
                            sizeof(diag_501), 1)) {
        return -EINVAL;
    }
    return 0;
}

A
Andreas Färber 已提交
338
/*
 * Remove the software breakpoint at bp->pc.
 *
 * The guest memory at bp->pc must still contain the diag_501 sequence;
 * if so it is replaced by the bytes saved in bp->saved_insn.
 *
 * Returns 0 on success, -EINVAL if a memory access fails or the memory no
 * longer holds the breakpoint instruction.
 */
int kvm_arch_remove_sw_breakpoint(CPUState *cs, struct kvm_sw_breakpoint *bp)
{
    uint8_t t[sizeof(diag_501)];

    if (cpu_memory_rw_debug(cs, bp->pc, t, sizeof(diag_501), 0)) {
        return -EINVAL;
    } else if (memcmp(t, diag_501, sizeof(diag_501))) {
        /* Something else overwrote the breakpoint; do not restore. */
        return -EINVAL;
    } else if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&bp->saved_insn,
                                   sizeof(diag_501), 1)) {
        return -EINVAL;
    }

    return 0;
}

354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373
/* Hardware breakpoints are not implemented: always returns -ENOSYS. */
int kvm_arch_insert_hw_breakpoint(target_ulong addr,
                                  target_ulong len, int type)
{
    const int not_implemented = -ENOSYS;

    return not_implemented;
}

/* Hardware breakpoints are not implemented: always returns -ENOSYS. */
int kvm_arch_remove_hw_breakpoint(target_ulong addr,
                                  target_ulong len, int type)
{
    const int not_implemented = -ENOSYS;

    return not_implemented;
}

/* Intentionally empty: this file keeps no hardware breakpoint state. */
void kvm_arch_remove_all_hw_breakpoints(void)
{
}

/* Intentionally empty: @dbg is left untouched. */
void kvm_arch_update_guest_debug(CPUState *cpu, struct kvm_guest_debug *dbg)
{
}

A
Andreas Färber 已提交
374
/* Hook with an intentionally empty body: nothing is done with @cpu or @run. */
void kvm_arch_pre_run(CPUState *cpu, struct kvm_run *run)
{
}

A
Andreas Färber 已提交
378
/* Hook with an intentionally empty body: nothing is done with @cpu or @run. */
void kvm_arch_post_run(CPUState *cpu, struct kvm_run *run)
{
}

A
Andreas Färber 已提交
382
/* No asynchronous events are processed here; returns the vcpu's halted flag. */
int kvm_arch_process_async_events(CPUState *cs)
{
    return cs->halted;
}

387
/*
 * Inject an interrupt through the KVM_S390_INTERRUPT ioctl.
 *
 * @type, @parm, @parm64: copied verbatim into struct kvm_s390_interrupt.
 * @vm: non-zero issues the ioctl on the VM, zero on the vcpu of @cpu.
 *
 * Does nothing when the CPU has no kvm_state.  A failing ioctl is fatal:
 * a message is printed and the process exits with status 1.
 */
void kvm_s390_interrupt_internal(S390CPU *cpu, int type, uint32_t parm,
                                 uint64_t parm64, int vm)
{
    CPUState *cs = CPU(cpu);
    struct kvm_s390_interrupt kvmint;
    int r;

    if (!cs->kvm_state) {
        return;
    }

    kvmint.type = type;
    kvmint.parm = parm;
    kvmint.parm64 = parm64;

    if (vm) {
        r = kvm_vm_ioctl(cs->kvm_state, KVM_S390_INTERRUPT, &kvmint);
    } else {
        r = kvm_vcpu_ioctl(cs, KVM_S390_INTERRUPT, &kvmint);
    }

    if (r < 0) {
        fprintf(stderr, "KVM failed to inject interrupt\n");
        exit(1);
    }
}

414
/*
 * Inject a VM-wide KVM_S390_INT_VIRTIO interrupt with @config_change as the
 * 32-bit parameter and @token as the 64-bit parameter.
 */
void kvm_s390_virtio_irq(S390CPU *cpu, int config_change, uint64_t token)
{
    kvm_s390_interrupt_internal(cpu, KVM_S390_INT_VIRTIO, config_change,
                                token, 1);
}

420
/*
 * Inject an interrupt of @type into the vcpu of @cpu, passing @code as the
 * 32-bit parameter and 0 as the 64-bit parameter.
 */
void kvm_s390_interrupt(S390CPU *cpu, int type, uint32_t code)
{
    kvm_s390_interrupt_internal(cpu, type, code, 0, 0);
}

425
/* Inject a program interrupt (KVM_S390_PROGRAM_INT) with @code into @cpu. */
static void enter_pgmcheck(S390CPU *cpu, uint16_t code)
{
    kvm_s390_interrupt(cpu, KVM_S390_PROGRAM_INT, code);
}

430
/*
 * Handle an intercepted SCLP service call.
 *
 * @ipbh0 is the upper halfword of the intercepted ipb: its low nibble
 * selects the register holding the SCCB address, the next nibble the
 * register holding the command code.
 *
 * A negative result from sclp_service_call() is turned into a program
 * interrupt with code -r; any other result becomes the condition code.
 * Always returns 0.
 */
static int kvm_sclp_service_call(S390CPU *cpu, struct kvm_run *run,
                                 uint16_t ipbh0)
{
    CPUS390XState *env = &cpu->env;
    uint64_t sccb;
    uint32_t code;
    int r = 0;

    cpu_synchronize_state(CPU(cpu));
    sccb = env->regs[ipbh0 & 0xf];
    code = env->regs[(ipbh0 & 0xf0) >> 4];

    r = sclp_service_call(env, sccb, code);
    if (r < 0) {
        enter_pgmcheck(cpu, -r);
    } else {
        setcc(cpu, r);
    }

    return 0;
}

452
/*
 * Dispatch an intercepted 0xb2xx instruction; @ipa1 is the low opcode byte.
 *
 * Channel I/O instructions are forwarded to the ioinst_handle_*() helpers,
 * the SCLP call to kvm_sclp_service_call().
 *
 * Returns 0 when the instruction was recognised (the SCLP result is passed
 * through) and -1 for an unknown opcode.
 */
static int handle_b2(S390CPU *cpu, struct kvm_run *run, uint8_t ipa1)
{
    CPUS390XState *env = &cpu->env;
    int rc = 0;
    /* Upper halfword of the ipb. */
    uint16_t ipbh0 = (run->s390_sieic.ipb & 0xffff0000) >> 16;

    cpu_synchronize_state(CPU(cpu));

    switch (ipa1) {
    case PRIV_B2_XSCH:
        ioinst_handle_xsch(cpu, env->regs[1]);
        break;
    case PRIV_B2_CSCH:
        ioinst_handle_csch(cpu, env->regs[1]);
        break;
    case PRIV_B2_HSCH:
        ioinst_handle_hsch(cpu, env->regs[1]);
        break;
    case PRIV_B2_MSCH:
        ioinst_handle_msch(cpu, env->regs[1], run->s390_sieic.ipb);
        break;
    case PRIV_B2_SSCH:
        ioinst_handle_ssch(cpu, env->regs[1], run->s390_sieic.ipb);
        break;
    case PRIV_B2_STCRW:
        ioinst_handle_stcrw(cpu, run->s390_sieic.ipb);
        break;
    case PRIV_B2_STSCH:
        ioinst_handle_stsch(cpu, env->regs[1], run->s390_sieic.ipb);
        break;
    case PRIV_B2_TSCH:
        /* We should only get tsch via KVM_EXIT_S390_TSCH. */
        fprintf(stderr, "Spurious tsch intercept\n");
        break;
    case PRIV_B2_CHSC:
        ioinst_handle_chsc(cpu, run->s390_sieic.ipb);
        break;
    case PRIV_B2_TPI:
        /* This should have been handled by kvm already. */
        fprintf(stderr, "Spurious tpi intercept\n");
        break;
    case PRIV_B2_SCHM:
        ioinst_handle_schm(cpu, env->regs[1], env->regs[2],
                           run->s390_sieic.ipb);
        break;
    case PRIV_B2_RSCH:
        ioinst_handle_rsch(cpu, env->regs[1]);
        break;
    case PRIV_B2_RCHP:
        ioinst_handle_rchp(cpu, env->regs[1]);
        break;
    case PRIV_B2_STCPS:
        /* We do not provide this instruction, it is suppressed. */
        break;
    case PRIV_B2_SAL:
        ioinst_handle_sal(cpu, env->regs[1]);
        break;
    case PRIV_B2_SIGA:
        /* Not provided, set CC = 3 for subchannel not operational */
        setcc(cpu, 3);
        break;
    case PRIV_B2_SCLP_CALL:
        rc = kvm_sclp_service_call(cpu, run, ipbh0);
        break;
    default:
        rc = -1;
        DPRINTF("KVM: unhandled PRIV: 0xb2%x\n", ipa1);
        break;
    }

    return rc;
}

525
/*
 * Handle an intercepted 0xb9xx instruction; @ipa1 is the low opcode byte.
 *
 * No instruction of this group is emulated: the function always returns -1,
 * for PRIV_B9_EQBS as well as for unknown opcodes (which are additionally
 * traced via DPRINTF).
 */
static int handle_b9(S390CPU *cpu, struct kvm_run *run, uint8_t ipa1)
{
    int r = 0;

    switch (ipa1) {
    case PRIV_B9_EQBS:
        /* just inject exception */
        r = -1;
        break;
    default:
        r = -1;
        DPRINTF("KVM: unhandled PRIV: 0xb9%x\n", ipa1);
        break;
    }

    return r;
}

/*
 * Handle an intercepted 0xebxx instruction; @ipa1 is the low opcode byte.
 *
 * No instruction of this group is emulated: the function always returns -1,
 * for PRIV_EB_SQBS as well as for unknown opcodes (which are additionally
 * traced via DPRINTF).
 */
static int handle_eb(S390CPU *cpu, struct kvm_run *run, uint8_t ipa1)
{
    int r = 0;

    switch (ipa1) {
    case PRIV_EB_SQBS:
        /* just inject exception */
        r = -1;
        break;
    default:
        r = -1;
        DPRINTF("KVM: unhandled PRIV: 0xeb%x\n", ipa1);
        break;
    }

    return r;
}

561
/*
 * Handle the KVM hypercall DIAG.
 *
 * Forwards to s390_virtio_hypercall().  A result of -EINVAL is converted
 * into a PGM_SPECIFICATION program interrupt and reported as handled (0);
 * any other result is returned unchanged.
 */
static int handle_hypercall(S390CPU *cpu, struct kvm_run *run)
{
    CPUS390XState *env = &cpu->env;
    int ret;

    cpu_synchronize_state(CPU(cpu));
    ret = s390_virtio_hypercall(env);
    if (ret == -EINVAL) {
        enter_pgmcheck(cpu, PGM_SPECIFICATION);
        return 0;
    }

    return ret;
}

576 577 578 579 580 581 582 583 584 585
/*
 * Handle DIAG 308: extract the r1 and r3 register numbers from the low
 * byte of the intercepted ipa and pass them to handle_diag_308().
 */
static void kvm_handle_diag_308(S390CPU *cpu, struct kvm_run *run)
{
    uint64_t r1, r3;

    cpu_synchronize_state(CPU(cpu));
    /*
     * r1 lives in bits 4-7, r3 in bits 0-3 of the ipa.  The mask 0x00f0
     * must therefore be shifted by 4; shifting by 8 always yielded 0.
     */
    r1 = (run->s390_sieic.ipa & 0x00f0) >> 4;
    r3 = run->s390_sieic.ipa & 0x000f;
    handle_diag_308(&cpu->env, r1, r3);
}

C
Cornelia Huck 已提交
586 587 588
#define DIAG_KVM_CODE_MASK 0x000000000000ffff

/*
 * Dispatch an intercepted DIAGNOSE instruction.
 *
 * The function code is the low 16 bits of the address decoded from @ipb.
 * Returns the handler's result, or -1 for an unknown function code.
 */
static int handle_diag(S390CPU *cpu, struct kvm_run *run, uint32_t ipb)
{
    int r = 0;
    uint16_t func_code;

    /*
     * For any diagnose call we support, bits 48-63 of the resulting
     * address specify the function code; the remainder is ignored.
     */
    func_code = decode_basedisp_rs(&cpu->env, ipb) & DIAG_KVM_CODE_MASK;
    switch (func_code) {
    case DIAG_IPL:
        kvm_handle_diag_308(cpu, run);
        break;
    case DIAG_KVM_HYPERCALL:
        r = handle_hypercall(cpu, run);
        break;
    case DIAG_KVM_BREAKPOINT:
        /*
         * NOTE(review): the breakpoint DIAG merely sleeps for 10 seconds;
         * this looks like a placeholder -- confirm intended behaviour.
         */
        sleep(10);
        break;
    default:
        DPRINTF("KVM: unknown DIAG: 0x%x\n", func_code);
        r = -1;
        break;
    }

    return r;
}

T
Thomas Huth 已提交
617 618 619 620 621 622 623 624
/*
 * Mark @cpu as running and kick it.  Always returns 0, which the SIGP
 * handler uses as the condition code.
 */
static int kvm_s390_cpu_start(S390CPU *cpu)
{
    const int cc = 0;

    s390_add_running_cpu(cpu);
    qemu_cpu_kick(CPU(cpu));
    DPRINTF("DONE: KVM cpu start: %p\n", &cpu->env);

    return cc;
}

625
/*
 * Restart @cpu: inject a KVM_S390_RESTART interrupt, mark the CPU as
 * running and kick it.  Always returns 0.
 */
int kvm_s390_cpu_restart(S390CPU *cpu)
{
    kvm_s390_interrupt(cpu, KVM_S390_RESTART, 0);
    s390_add_running_cpu(cpu);
    qemu_cpu_kick(CPU(cpu));
    DPRINTF("DONE: KVM cpu restart: %p\n", &cpu->env);
    return 0;
}

634
static void sigp_initial_cpu_reset(void *arg)
A
Alexander Graf 已提交
635
{
636 637
    CPUState *cpu = arg;
    S390CPUClass *scc = S390_CPU_GET_CLASS(cpu);
638

639 640
    cpu_synchronize_state(cpu);
    scc->initial_cpu_reset(cpu);
A
Alexander Graf 已提交
641 642
}

643 644 645 646 647 648 649 650 651
/*
 * run_on_cpu() callback: synchronise the state of the CPU passed in @arg
 * (a CPUState pointer) and invoke its class's cpu_reset handler.
 */
static void sigp_cpu_reset(void *arg)
{
    CPUState *cs = arg;
    S390CPUClass *klass = S390_CPU_GET_CLASS(cs);

    cpu_synchronize_state(cs);
    klass->cpu_reset(cs);
}

652 653
#define SIGP_ORDER_MASK 0x000000ff

A
Andreas Färber 已提交
654
static int handle_sigp(S390CPU *cpu, struct kvm_run *run, uint8_t ipa1)
A
Alexander Graf 已提交
655
{
A
Andreas Färber 已提交
656
    CPUS390XState *env = &cpu->env;
A
Alexander Graf 已提交
657 658
    uint8_t order_code;
    uint16_t cpu_addr;
659
    S390CPU *target_cpu;
660 661
    uint64_t *statusreg = &env->regs[ipa1 >> 4];
    int cc;
A
Alexander Graf 已提交
662

663
    cpu_synchronize_state(CPU(cpu));
A
Alexander Graf 已提交
664 665

    /* get order code */
666
    order_code = decode_basedisp_rs(env, run->s390_sieic.ipb) & SIGP_ORDER_MASK;
A
Alexander Graf 已提交
667 668

    cpu_addr = env->regs[ipa1 & 0x0f];
669 670
    target_cpu = s390_cpu_addr2state(cpu_addr);
    if (target_cpu == NULL) {
671
        cc = 3;    /* not operational */
A
Alexander Graf 已提交
672 673 674 675
        goto out;
    }

    switch (order_code) {
T
Thomas Huth 已提交
676
    case SIGP_START:
677
        cc = kvm_s390_cpu_start(target_cpu);
T
Thomas Huth 已提交
678
        break;
679
    case SIGP_RESTART:
680
        cc = kvm_s390_cpu_restart(target_cpu);
681 682
        break;
    case SIGP_SET_ARCH:
683 684 685 686
        *statusreg &= 0xffffffff00000000UL;
        *statusreg |= SIGP_STAT_INVALID_PARAMETER;
        cc = 1;   /* status stored */
        break;
687
    case SIGP_INITIAL_CPU_RESET:
688 689
        run_on_cpu(CPU(target_cpu), sigp_initial_cpu_reset, CPU(target_cpu));
        cc = 0;
690
        break;
691 692 693 694
    case SIGP_CPU_RESET:
        run_on_cpu(CPU(target_cpu), sigp_cpu_reset, CPU(target_cpu));
        cc = 0;
        break;
695
    default:
696 697 698 699
        DPRINTF("KVM: unknown SIGP: 0x%x\n", order_code);
        *statusreg &= 0xffffffff00000000UL;
        *statusreg |= SIGP_STAT_INVALID_ORDER;
        cc = 1;   /* status stored */
700
        break;
A
Alexander Graf 已提交
701 702 703
    }

out:
704
    setcc(cpu, cc);
A
Alexander Graf 已提交
705 706 707
    return 0;
}

708
/*
 * Dispatch an instruction intercept by the high byte of the ipa.
 *
 * If the opcode group is unknown, or its handler returns a negative value,
 * a program interrupt with code 0x0001 is injected into the guest.
 */
static void handle_instruction(S390CPU *cpu, struct kvm_run *run)
{
    unsigned int ipa0 = (run->s390_sieic.ipa & 0xff00);
    uint8_t ipa1 = run->s390_sieic.ipa & 0x00ff;
    int r = -1;     /* stays negative when no case below matches */

    DPRINTF("handle_instruction 0x%x 0x%x\n",
            run->s390_sieic.ipa, run->s390_sieic.ipb);
    switch (ipa0) {
    case IPA0_B2:
        r = handle_b2(cpu, run, ipa1);
        break;
    case IPA0_B9:
        r = handle_b9(cpu, run, ipa1);
        break;
    case IPA0_EB:
        r = handle_eb(cpu, run, ipa1);
        break;
    case IPA0_DIAG:
        r = handle_diag(cpu, run, run->s390_sieic.ipb);
        break;
    case IPA0_SIGP:
        r = handle_sigp(cpu, run, ipa1);
        break;
    }

    if (r < 0) {
        enter_pgmcheck(cpu, 0x0001);
    }
}

A
Andreas Färber 已提交
739
/* Return true if the vcpu's PSW address is 0xfff, the "signal quiesce" value. */
static bool is_special_wait_psw(CPUState *cs)
{
    /* signal quiesce */
    return cs->kvm_run->psw_addr == 0xfffUL;
}

745
/*
 * Handle a KVM_EXIT_S390_SIEIC exit according to its intercept code.
 *
 * Returns 0 after an instruction intercept and EXCP_HALTED after a wait-PSW
 * or CPU-stop intercept.  Soft, I/O and unknown intercepts are fatal and
 * terminate the process with exit(1).
 */
static int handle_intercept(S390CPU *cpu)
{
    CPUState *cs = CPU(cpu);
    struct kvm_run *run = cs->kvm_run;
    int icpt_code = run->s390_sieic.icptcode;
    int r = 0;

    DPRINTF("intercept: 0x%x (at 0x%lx)\n", icpt_code,
            (long)cs->kvm_run->psw_addr);
    switch (icpt_code) {
        case ICPT_INSTRUCTION:
            handle_instruction(cpu, run);
            break;
        case ICPT_WAITPSW:
            /* disabled wait, since enabled wait is handled in kernel */
            if (s390_del_running_cpu(cpu) == 0) {
                /* s390_del_running_cpu() returned 0: act on the whole VM. */
                if (is_special_wait_psw(cs)) {
                    qemu_system_shutdown_request();
                } else {
                    QObject *data;

                    data = qobject_from_jsonf("{ 'action': %s }", "pause");
                    monitor_protocol_event(QEVENT_GUEST_PANICKED, data);
                    qobject_decref(data);
                    vm_stop(RUN_STATE_GUEST_PANICKED);
                }
            }
            r = EXCP_HALTED;
            break;
        case ICPT_CPU_STOP:
            if (s390_del_running_cpu(cpu) == 0) {
                qemu_system_shutdown_request();
            }
            r = EXCP_HALTED;
            break;
        case ICPT_SOFT_INTERCEPT:
            fprintf(stderr, "KVM unimplemented icpt SOFT\n");
            exit(1);
            break;
        case ICPT_IO:
            fprintf(stderr, "KVM unimplemented icpt IO\n");
            exit(1);
            break;
        default:
            fprintf(stderr, "Unknown intercept code: %d\n", icpt_code);
            exit(1);
            break;
    }

    return r;
}

797 798 799 800 801 802 803
/*
 * Handle a KVM_EXIT_S390_TSCH exit.
 *
 * The result of ioinst_handle_tsch() is interpreted as follows:
 *   >= 0 : success; the value becomes the condition code, 0 is returned.
 *   < -1 : failure; a dequeued I/O interrupt is reinjected, 0 is returned.
 *   -1   : returned to the caller unchanged.
 */
static int handle_tsch(S390CPU *cpu)
{
    CPUS390XState *env = &cpu->env;
    CPUState *cs = CPU(cpu);
    struct kvm_run *run = cs->kvm_run;
    int ret;

    cpu_synchronize_state(cs);

    ret = ioinst_handle_tsch(env, env->regs[1], run->s390_tsch.ipb);
    if (ret >= 0) {
        /* Success; set condition code. */
        setcc(cpu, ret);
        ret = 0;
    } else if (ret < -1) {
        /*
         * Failure.
         * If an I/O interrupt had been dequeued, we have to reinject it.
         */
        if (run->s390_tsch.dequeued) {
            uint16_t subchannel_id = run->s390_tsch.subchannel_id;
            uint16_t subchannel_nr = run->s390_tsch.subchannel_nr;
            uint32_t io_int_parm = run->s390_tsch.io_int_parm;
            uint32_t io_int_word = run->s390_tsch.io_int_word;
            /*
             * Shift in uint32_t: the uint16_t operands would otherwise be
             * promoted to int, and shifting into or past the sign bit is
             * undefined behaviour.
             * NOTE(review): in 32 bits the first term is shifted out
             * entirely and contributes 0; compare this encoding with the
             * KVM_S390_INT_IO() layout -- confirm it is intended.
             */
            uint32_t type = ((uint32_t)(subchannel_id & 0xff00) << 24) |
                ((uint32_t)(subchannel_id & 0x00060) << 22) |
                ((uint32_t)subchannel_nr << 16);

            kvm_s390_interrupt_internal(cpu, type,
                                        ((uint32_t)subchannel_id << 16)
                                        | subchannel_nr,
                                        ((uint64_t)io_int_parm << 32)
                                        | io_int_word, 1);
        }
        ret = 0;
    }
    return ret;
}

835 836 837 838 839
/* Debug exits are not implemented: always returns -ENOSYS. */
static int kvm_arch_handle_debug_exit(S390CPU *cpu)
{
    const int not_implemented = -ENOSYS;

    return not_implemented;
}

A
Andreas Färber 已提交
840
/*
 * Architecture-specific handling of a KVM exit described by @run.
 *
 * Dispatches on run->exit_reason.  An unknown exit reason is only reported
 * on stderr.  A handler result of 0 is converted to EXCP_INTERRUPT; any
 * other result is returned unchanged.
 */
int kvm_arch_handle_exit(CPUState *cs, struct kvm_run *run)
{
    S390CPU *cpu = S390_CPU(cs);
    int ret = 0;

    switch (run->exit_reason) {
        case KVM_EXIT_S390_SIEIC:
            ret = handle_intercept(cpu);
            break;
        case KVM_EXIT_S390_RESET:
            qemu_system_reset_request();
            break;
        case KVM_EXIT_S390_TSCH:
            ret = handle_tsch(cpu);
            break;
        case KVM_EXIT_DEBUG:
            ret = kvm_arch_handle_debug_exit(cpu);
            break;
        default:
            fprintf(stderr, "Unknown KVM exit: %d\n", run->exit_reason);
            break;
    }

    if (ret == 0) {
        ret = EXCP_INTERRUPT;
    }
    return ret;
}
868

A
Andreas Färber 已提交
869
/* Always returns true, regardless of @cpu. */
bool kvm_arch_stop_on_emulation_error(CPUState *cpu)
{
    return true;
}
873

A
Andreas Färber 已提交
874
/*
 * SIGBUS hook for a vcpu: nothing is done with @code or @addr and 1 is
 * always returned (presumably "not handled" -- verify against the caller).
 */
int kvm_arch_on_sigbus_vcpu(CPUState *cpu, int code, void *addr)
{
    return 1;
}

/*
 * SIGBUS hook: nothing is done with @code or @addr and 1 is always
 * returned (presumably "not handled" -- verify against the caller).
 */
int kvm_arch_on_sigbus(int code, void *addr)
{
    (void)code;
    (void)addr;

    return 1;
}
883 884 885 886 887 888 889

/*
 * Inject a VM-wide I/O interrupt.
 *
 * When IO_INT_WORD_AI is set in @io_int_word the interrupt type is
 * KVM_S390_INT_IO(1, 0, 0, 0); otherwise it is derived from
 * @subchannel_id and @subchannel_nr.  The 32-bit parameter carries
 * subchannel id/nr, the 64-bit parameter @io_int_parm/@io_int_word.
 */
void kvm_s390_io_interrupt(S390CPU *cpu, uint16_t subchannel_id,
                           uint16_t subchannel_nr, uint32_t io_int_parm,
                           uint32_t io_int_word)
{
    uint32_t type;

    if (io_int_word & IO_INT_WORD_AI) {
        type = KVM_S390_INT_IO(1, 0, 0, 0);
    } else {
        /*
         * Shift in uint32_t: the uint16_t operands would otherwise be
         * promoted to int, and shifting into or past the sign bit is
         * undefined behaviour.
         * NOTE(review): in 32 bits the first term is shifted out entirely
         * and contributes 0; compare this encoding with the
         * KVM_S390_INT_IO() layout -- confirm it is intended.
         */
        type = ((uint32_t)(subchannel_id & 0xff00) << 24) |
            ((uint32_t)(subchannel_id & 0x00060) << 22) |
            ((uint32_t)subchannel_nr << 16);
    }
    kvm_s390_interrupt_internal(cpu, type,
                                ((uint32_t)subchannel_id << 16) | subchannel_nr,
                                ((uint64_t)io_int_parm << 32) | io_int_word, 1);
}

/*
 * Inject a VM-wide KVM_S390_MCHK interrupt with the fixed parameters
 * 1 << 28 (32-bit) and 0x00400f1d40330000 (64-bit).
 */
void kvm_s390_crw_mchk(S390CPU *cpu)
{
    const uint32_t mchk_parm = 1 << 28;
    const uint64_t mchk_parm64 = 0x00400f1d40330000;

    kvm_s390_interrupt_internal(cpu, KVM_S390_MCHK, mchk_parm,
                                mchk_parm64, 1);
}

/*
 * Enable KVM_CAP_S390_CSS_SUPPORT on the vcpu of @cpu.
 * Failure is not tolerated: the result is checked with assert().
 */
void kvm_s390_enable_css_support(S390CPU *cpu)
{
    int r;

    /* Activate host kernel channel subsystem support. */
    r = kvm_vcpu_enable_cap(CPU(cpu), KVM_CAP_S390_CSS_SUPPORT, 0);
    assert(r == 0);
}
915 916 917

/*
 * Configure the irq routing related globals when the host offers
 * KVM_CAP_IRQ_ROUTING: irqfds and GSI routing are allowed, in-kernel halt
 * handling is not.
 */
void kvm_arch_init_irq_routing(KVMState *s)
{
    /*
     * Note that while irqchip capabilities generally imply that cpustates
     * are handled in-kernel, it is not true for s390 (yet); therefore, we
     * have to override the common code kvm_halt_in_kernel_allowed setting.
     */
    if (kvm_check_extension(s, KVM_CAP_IRQ_ROUTING)) {
        kvm_irqfds_allowed = true;
        kvm_gsi_routing_allowed = true;
        kvm_halt_in_kernel_allowed = false;
    }
}
C
Cornelia Huck 已提交
929

930 931
/*
 * Assign or deassign an ioeventfd for a virtio-ccw subchannel notification.
 *
 * @notifier: event notifier whose file descriptor is registered.
 * @sch:      value placed in the ioeventfd's addr field.
 * @vq:       value placed in the ioeventfd's datamatch field.
 * @assign:   true to assign; false adds KVM_IOEVENTFD_FLAG_DEASSIGN.
 *
 * Returns -ENOSYS when KVM_CAP_IOEVENTFD is unavailable, otherwise the
 * result of the KVM_IOEVENTFD ioctl.
 */
int kvm_s390_assign_subch_ioeventfd(EventNotifier *notifier, uint32_t sch,
                                    int vq, bool assign)
{
    struct kvm_ioeventfd kick = {
        .flags = KVM_IOEVENTFD_FLAG_VIRTIO_CCW_NOTIFY |
        KVM_IOEVENTFD_FLAG_DATAMATCH,
        .fd = event_notifier_get_fd(notifier),
        .datamatch = vq,
        .addr = sch,
        .len = 8,
    };
    if (!kvm_check_extension(kvm_state, KVM_CAP_IOEVENTFD)) {
        return -ENOSYS;
    }
    if (!assign) {
        kick.flags |= KVM_IOEVENTFD_FLAG_DEASSIGN;
    }
    return kvm_vm_ioctl(kvm_state, KVM_IOEVENTFD, &kick);
}