/*
 * QEMU S390x KVM implementation
 *
 * Copyright (c) 2009 Alexander Graf <agraf@suse.de>
 * Copyright IBM Corp. 2012
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * Contributions after 2012-10-29 are licensed under the terms of the
 * GNU GPL, version 2 or (at your option) any later version.
 *
 * You should have received a copy of the GNU (Lesser) General Public
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 */

#include <sys/types.h>
#include <sys/ioctl.h>
#include <sys/mman.h>

#include <linux/kvm.h>
#include <asm/ptrace.h>

#include "qemu-common.h"
32
#include "qemu/timer.h"
33 34
#include "sysemu/sysemu.h"
#include "sysemu/kvm.h"
A
Alexander Graf 已提交
35
#include "cpu.h"
36
#include "sysemu/device_tree.h"
37 38
#include "qapi/qmp/qjson.h"
#include "monitor/monitor.h"
39
#include "exec/gdbstub.h"
40
#include "trace.h"
A
Alexander Graf 已提交
41 42 43 44

/* #define DEBUG_KVM */

#ifdef DEBUG_KVM
45
#define DPRINTF(fmt, ...) \
A
Alexander Graf 已提交
46 47
    do { fprintf(stderr, fmt, ## __VA_ARGS__); } while (0)
#else
48
#define DPRINTF(fmt, ...) \
A
Alexander Graf 已提交
49 50 51 52 53
    do { } while (0)
#endif

#define IPA0_DIAG                       0x8300
#define IPA0_SIGP                       0xae00
54 55 56
#define IPA0_B2                         0xb200
#define IPA0_B9                         0xb900
#define IPA0_EB                         0xeb00
A
Alexander Graf 已提交
57

58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79
#define PRIV_B2_SCLP_CALL               0x20
#define PRIV_B2_CSCH                    0x30
#define PRIV_B2_HSCH                    0x31
#define PRIV_B2_MSCH                    0x32
#define PRIV_B2_SSCH                    0x33
#define PRIV_B2_STSCH                   0x34
#define PRIV_B2_TSCH                    0x35
#define PRIV_B2_TPI                     0x36
#define PRIV_B2_SAL                     0x37
#define PRIV_B2_RSCH                    0x38
#define PRIV_B2_STCRW                   0x39
#define PRIV_B2_STCPS                   0x3a
#define PRIV_B2_RCHP                    0x3b
#define PRIV_B2_SCHM                    0x3c
#define PRIV_B2_CHSC                    0x5f
#define PRIV_B2_SIGA                    0x74
#define PRIV_B2_XSCH                    0x76

#define PRIV_EB_SQBS                    0x8a

#define PRIV_B9_EQBS                    0x9c

80
#define DIAG_IPL                        0x308
A
Alexander Graf 已提交
81 82 83 84 85 86 87 88 89
#define DIAG_KVM_HYPERCALL              0x500
#define DIAG_KVM_BREAKPOINT             0x501

#define ICPT_INSTRUCTION                0x04
#define ICPT_WAITPSW                    0x1c
#define ICPT_SOFT_INTERCEPT             0x24
#define ICPT_CPU_STOP                   0x28
#define ICPT_IO                         0x40

90 91 92 93 94 95 96 97
static CPUWatchpoint hw_watchpoint;
/*
 * We don't use a list because this structure is also used to transmit the
 * hardware breakpoints to the kernel.
 */
static struct kvm_hw_breakpoint *hw_breakpoints;
static int nb_hw_breakpoints;

98 99 100 101
const KVMCapabilityInfo kvm_arch_required_capabilities[] = {
    KVM_CAP_LAST_INFO
};

102
static int cap_sync_regs;
103
static int cap_async_pf;
104

105
static void *legacy_s390_alloc(size_t size);
106

107
/*
 * Architecture-specific KVM setup.
 *
 * Caches whether the SYNC_REGS and ASYNC_PF capabilities are available and
 * installs the legacy RAM allocator when the kernel lacks either the GMAP or
 * the COW capability. Always returns 0.
 */
int kvm_arch_init(KVMState *s)
{
    bool need_legacy_alloc;

    cap_sync_regs = kvm_check_extension(s, KVM_CAP_SYNC_REGS);
    cap_async_pf = kvm_check_extension(s, KVM_CAP_ASYNC_PF);

    /* Both capabilities are required to use the default allocator. */
    need_legacy_alloc = !(kvm_check_extension(s, KVM_CAP_S390_GMAP)
                          && kvm_check_extension(s, KVM_CAP_S390_COW));
    if (need_legacy_alloc) {
        phys_mem_set_alloc(legacy_s390_alloc);
    }

    return 0;
}

118 119 120 121 122
/* Return the vcpu id for @cpu, which is its cpu_index. */
unsigned long kvm_arch_vcpu_id(CPUState *cpu)
{
    unsigned long id = cpu->cpu_index;

    return id;
}

A
Andreas Färber 已提交
123
/*
 * Per-vcpu initialization hook. There is currently nothing to set up,
 * so this always returns 0.
 */
int kvm_arch_init_vcpu(CPUState *cpu)
{
    return 0;
}

129
/*
 * Ask the kernel to perform an initial reset of the vcpu.
 *
 * The initial reset call is needed here to reset in-kernel vcpu data that
 * we can't access directly from QEMU (i.e. with older kernels which don't
 * support sync_regs/ONE_REG). Before this ioctl cpu_synchronize_state() is
 * called in common kvm code (kvm-all).
 *
 * A failure is only reported on stderr; the function has no return value.
 */
void kvm_s390_reset_vcpu(S390CPU *cpu)
{
    CPUState *cs = CPU(cpu);

    if (kvm_vcpu_ioctl(cs, KVM_S390_INITIAL_RESET, NULL)) {
        /*
         * perror() appends ": <error text>\n" itself, so the prefix must
         * not end in a newline.
         */
        perror("Can't reset vcpu");
    }
}

A
Andreas Färber 已提交
143
/*
 * Copy QEMU's view of the CPU state into KVM.
 *
 * The PSW and the general purpose registers are always written. Unless
 * @level is KVM_PUT_RUNTIME_STATE, the ONE_REG state (CPU timer, clock
 * comparator, TOD programmable register, GBEA, PP), the pfault registers
 * (only if async page faults are available), the access and control
 * registers and the prefix are written as well.
 *
 * Registers are passed through the shared kvm_run area when the kernel
 * marks them as valid there; otherwise the classic ioctls are used.
 *
 * Returns 0 on success or the negative value of a failing call.
 */
int kvm_arch_put_registers(CPUState *cs, int level)
{
    S390CPU *cpu = S390_CPU(cs);
    CPUS390XState *env = &cpu->env;
    struct kvm_run *run = cs->kvm_run;
    struct kvm_sregs sregs;
    struct kvm_regs regs;
    int ret;
    int i;

    /* The PSW and the GPRs are always saved. */
    run->psw_addr = env->psw.addr;
    run->psw_mask = env->psw.mask;

    if (cap_sync_regs && (run->kvm_valid_regs & KVM_SYNC_GPRS)) {
        for (i = 0; i < 16; i++) {
            run->s.regs.gprs[i] = env->regs[i];
        }
        run->kvm_dirty_regs |= KVM_SYNC_GPRS;
    } else {
        for (i = 0; i < 16; i++) {
            regs.gprs[i] = env->regs[i];
        }
        ret = kvm_vcpu_ioctl(cs, KVM_SET_REGS, &regs);
        if (ret < 0) {
            return ret;
        }
    }

    /* Runtime state needs nothing beyond PSW and GPRs. */
    if (level == KVM_PUT_RUNTIME_STATE) {
        return 0;
    }

    /*
     * These ONE_REGS are not protected by a capability. As they are only
     * necessary for migration we just trace a possible error, but don't
     * return with an error return code.
     */
    kvm_set_one_reg(cs, KVM_REG_S390_CPU_TIMER, &env->cputm);
    kvm_set_one_reg(cs, KVM_REG_S390_CLOCK_COMP, &env->ckc);
    kvm_set_one_reg(cs, KVM_REG_S390_TODPR, &env->todpr);
    kvm_set_one_reg(cs, KVM_REG_S390_GBEA, &env->gbea);
    kvm_set_one_reg(cs, KVM_REG_S390_PP, &env->pp);

    /* The pfault registers exist only with async page fault support. */
    if (cap_async_pf) {
        ret = kvm_set_one_reg(cs, KVM_REG_S390_PFTOKEN, &env->pfault_token);
        if (ret < 0) {
            return ret;
        }
        ret = kvm_set_one_reg(cs, KVM_REG_S390_PFCOMPARE,
                              &env->pfault_compare);
        if (ret < 0) {
            return ret;
        }
        ret = kvm_set_one_reg(cs, KVM_REG_S390_PFSELECT, &env->pfault_select);
        if (ret < 0) {
            return ret;
        }
    }

    /* Access and control registers */
    if (cap_sync_regs &&
        (run->kvm_valid_regs & KVM_SYNC_ACRS) &&
        (run->kvm_valid_regs & KVM_SYNC_CRS)) {
        for (i = 0; i < 16; i++) {
            run->s.regs.acrs[i] = env->aregs[i];
            run->s.regs.crs[i] = env->cregs[i];
        }
        run->kvm_dirty_regs |= KVM_SYNC_ACRS;
        run->kvm_dirty_regs |= KVM_SYNC_CRS;
    } else {
        for (i = 0; i < 16; i++) {
            sregs.acrs[i] = env->aregs[i];
            sregs.crs[i] = env->cregs[i];
        }
        ret = kvm_vcpu_ioctl(cs, KVM_SET_SREGS, &sregs);
        if (ret < 0) {
            return ret;
        }
    }

    /* Finally the prefix, which is only supported via sync regs. */
    if (cap_sync_regs && (run->kvm_valid_regs & KVM_SYNC_PREFIX)) {
        run->s.regs.prefix = env->psa;
        run->kvm_dirty_regs |= KVM_SYNC_PREFIX;
    }

    return 0;
}

A
Andreas Färber 已提交
232
/*
 * Fetch the CPU state from KVM into QEMU's CPUS390XState.
 *
 * Reads the PSW, the general purpose registers, the access and control
 * registers, the prefix (only available through sync regs), the ONE_REG
 * state and, if async page faults are available, the pfault registers.
 *
 * Registers are taken from the shared kvm_run area when the kernel marks
 * them as valid there; otherwise the classic ioctls are used.
 *
 * Returns 0 on success or the negative value of a failing call.
 */
int kvm_arch_get_registers(CPUState *cs)
{
    S390CPU *cpu = S390_CPU(cs);
    CPUS390XState *env = &cpu->env;
    struct kvm_run *run = cs->kvm_run;
    struct kvm_sregs sregs;
    struct kvm_regs regs;
    int ret;
    int i;

    /* PSW */
    env->psw.addr = run->psw_addr;
    env->psw.mask = run->psw_mask;

    /* General purpose registers */
    if (cap_sync_regs && (run->kvm_valid_regs & KVM_SYNC_GPRS)) {
        for (i = 0; i < 16; i++) {
            env->regs[i] = run->s.regs.gprs[i];
        }
    } else {
        ret = kvm_vcpu_ioctl(cs, KVM_GET_REGS, &regs);
        if (ret < 0) {
            return ret;
        }
        for (i = 0; i < 16; i++) {
            env->regs[i] = regs.gprs[i];
        }
    }

    /* Access and control registers */
    if (cap_sync_regs &&
        (run->kvm_valid_regs & KVM_SYNC_ACRS) &&
        (run->kvm_valid_regs & KVM_SYNC_CRS)) {
        for (i = 0; i < 16; i++) {
            env->aregs[i] = run->s.regs.acrs[i];
            env->cregs[i] = run->s.regs.crs[i];
        }
    } else {
        ret = kvm_vcpu_ioctl(cs, KVM_GET_SREGS, &sregs);
        if (ret < 0) {
            return ret;
        }
        for (i = 0; i < 16; i++) {
            env->aregs[i] = sregs.acrs[i];
            env->cregs[i] = sregs.crs[i];
        }
    }

    /* Prefix */
    if (cap_sync_regs && (run->kvm_valid_regs & KVM_SYNC_PREFIX)) {
        env->psa = run->s.regs.prefix;
    }

    /*
     * These ONE_REGS are not protected by a capability. As they are only
     * necessary for migration we just trace a possible error, but don't
     * return with an error return code.
     */
    kvm_get_one_reg(cs, KVM_REG_S390_CPU_TIMER, &env->cputm);
    kvm_get_one_reg(cs, KVM_REG_S390_CLOCK_COMP, &env->ckc);
    kvm_get_one_reg(cs, KVM_REG_S390_TODPR, &env->todpr);
    kvm_get_one_reg(cs, KVM_REG_S390_GBEA, &env->gbea);
    kvm_get_one_reg(cs, KVM_REG_S390_PP, &env->pp);

    /* The pfault registers exist only with async page fault support. */
    if (cap_async_pf) {
        ret = kvm_get_one_reg(cs, KVM_REG_S390_PFTOKEN, &env->pfault_token);
        if (ret < 0) {
            return ret;
        }
        ret = kvm_get_one_reg(cs, KVM_REG_S390_PFCOMPARE,
                              &env->pfault_compare);
        if (ret < 0) {
            return ret;
        }
        ret = kvm_get_one_reg(cs, KVM_REG_S390_PFSELECT, &env->pfault_select);
        if (ret < 0) {
            return ret;
        }
    }

    return 0;
}

312 313 314 315 316 317 318 319 320 321
/*
 * Legacy layout for s390:
 * Older S390 KVM requires the topmost vma of the RAM to be
 * smaller than a system-defined value, which is at least 256GB.
 * Larger systems have larger values. We put the guest between
 * the end of the data segment (system break) and this value. We
 * use 32GB as a base to have enough room for the system break
 * to grow. We also have to use MAP parameters that avoid
 * read-only mapping of guest pages.
 */
322
static void *legacy_s390_alloc(size_t size)
323 324 325 326 327 328
{
    void *mem;

    mem = mmap((void *) 0x800000000ULL, size,
               PROT_EXEC|PROT_READ|PROT_WRITE,
               MAP_SHARED | MAP_ANONYMOUS | MAP_FIXED, -1, 0);
329
    return mem == MAP_FAILED ? NULL : mem;
330 331
}

332 333 334
/* DIAG 501 is used for sw breakpoints */
static const uint8_t diag_501[] = {0x83, 0x24, 0x05, 0x01};

A
Andreas Färber 已提交
335
/*
 * Install a software breakpoint at bp->pc.
 *
 * The bytes currently at bp->pc are saved into bp->saved_insn and then
 * overwritten with the DIAG 501 instruction.
 *
 * Returns 0 on success, -EINVAL if guest memory cannot be read or written.
 */
int kvm_arch_insert_sw_breakpoint(CPUState *cs, struct kvm_sw_breakpoint *bp)
{
    /* Save the original instruction bytes first ... */
    if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&bp->saved_insn,
                            sizeof(diag_501), 0)) {
        return -EINVAL;
    }

    /* ... then patch in the breakpoint instruction. */
    if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)diag_501,
                            sizeof(diag_501), 1)) {
        return -EINVAL;
    }

    return 0;
}

A
Andreas Färber 已提交
347
/*
 * Remove a software breakpoint from bp->pc.
 *
 * The saved instruction is only restored if the guest memory at bp->pc
 * still holds the DIAG 501 instruction.
 *
 * Returns 0 on success, -EINVAL if guest memory cannot be accessed or does
 * not contain the breakpoint instruction.
 */
int kvm_arch_remove_sw_breakpoint(CPUState *cs, struct kvm_sw_breakpoint *bp)
{
    uint8_t current[sizeof(diag_501)];

    if (cpu_memory_rw_debug(cs, bp->pc, current, sizeof(diag_501), 0)) {
        return -EINVAL;
    }

    /* Refuse to touch memory that no longer holds our breakpoint. */
    if (memcmp(current, diag_501, sizeof(diag_501)) != 0) {
        return -EINVAL;
    }

    if (cpu_memory_rw_debug(cs, bp->pc, (uint8_t *)&bp->saved_insn,
                            sizeof(diag_501), 1)) {
        return -EINVAL;
    }

    return 0;
}

363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409
/*
 * Look up a registered hardware breakpoint by address and type.
 *
 * A @len of -1 matches an entry of any length; otherwise the length has to
 * match as well. Returns a pointer into hw_breakpoints, or NULL if no entry
 * matches.
 */
static struct kvm_hw_breakpoint *find_hw_breakpoint(target_ulong addr,
                                                    int len, int type)
{
    struct kvm_hw_breakpoint *bp;
    int i;

    for (i = 0; i < nb_hw_breakpoints; i++) {
        bp = &hw_breakpoints[i];
        if (bp->addr != addr || bp->type != type) {
            continue;
        }
        if (bp->len == len || len == -1) {
            return bp;
        }
    }

    return NULL;
}

/*
 * Append a hardware breakpoint to the hw_breakpoints array.
 *
 * @addr: guest address of the breakpoint
 * @len:  length of the watched area
 * @type: KVM breakpoint type stored in the new entry
 *
 * Returns 0 on success, -EEXIST if an identical entry is already registered
 * and -ENOMEM if the array cannot be grown. On -ENOMEM the existing array
 * and its element count are left untouched.
 */
static int insert_hw_breakpoint(target_ulong addr, int len, int type)
{
    struct kvm_hw_breakpoint *grown;
    int size;

    if (find_hw_breakpoint(addr, len, type)) {
        return -EEXIST;
    }

    if (!hw_breakpoints) {
        /* No array yet, so there cannot be any valid entries either. */
        nb_hw_breakpoints = 0;
    }

    size = (nb_hw_breakpoints + 1) * sizeof(struct kvm_hw_breakpoint);

    /*
     * Keep the result in a temporary: on failure the old block is still
     * allocated, and overwriting hw_breakpoints would leak it and drop
     * every breakpoint registered so far.
     */
    if (!hw_breakpoints) {
        grown = g_try_malloc(size);
    } else {
        grown = g_try_realloc(hw_breakpoints, size);
    }

    if (!grown) {
        return -ENOMEM;
    }
    hw_breakpoints = grown;

    hw_breakpoints[nb_hw_breakpoints].addr = addr;
    hw_breakpoints[nb_hw_breakpoints].len = len;
    hw_breakpoints[nb_hw_breakpoints].type = type;

    nb_hw_breakpoints++;

    return 0;
}

410 411 412
/*
 * Register a hardware breakpoint or write watchpoint requested by gdb.
 *
 * The gdb type is translated to the corresponding KVM type before the
 * entry is stored. Returns the result of insert_hw_breakpoint(), -EINVAL
 * for a write watchpoint with a length below 1, or -ENOSYS for any other
 * gdb type.
 */
int kvm_arch_insert_hw_breakpoint(target_ulong addr,
                                  target_ulong len, int type)
{
    int kvm_type;

    if (type == GDB_BREAKPOINT_HW) {
        kvm_type = KVM_HW_BP;
    } else if (type == GDB_WATCHPOINT_WRITE) {
        if (len < 1) {
            return -EINVAL;
        }
        kvm_type = KVM_HW_WP_WRITE;
    } else {
        return -ENOSYS;
    }

    return insert_hw_breakpoint(addr, len, kvm_type);
}

/*
 * Unregister the hardware breakpoint matching @addr, @len and @type.
 *
 * The array is kept dense: the last element is moved into the freed slot
 * and the allocation is shrunk by one entry, or released entirely when the
 * last breakpoint goes away.
 *
 * Returns 0 on success or -ENOENT if no matching entry exists.
 */
int kvm_arch_remove_hw_breakpoint(target_ulong addr,
                                  target_ulong len, int type)
{
    struct kvm_hw_breakpoint *victim = find_hw_breakpoint(addr, len, type);
    struct kvm_hw_breakpoint *last;
    int size;

    if (victim == NULL) {
        return -ENOENT;
    }

    nb_hw_breakpoints--;
    if (nb_hw_breakpoints <= 0) {
        /* That was the only entry; drop the whole array. */
        g_free(hw_breakpoints);
        hw_breakpoints = NULL;
        return 0;
    }

    /* Fill the hole with the last element, unless it is the hole itself. */
    last = &hw_breakpoints[nb_hw_breakpoints];
    if (victim != last) {
        *victim = *last;
    }

    size = nb_hw_breakpoints * sizeof(struct kvm_hw_breakpoint);
    hw_breakpoints = (struct kvm_hw_breakpoint *)g_realloc(hw_breakpoints,
                                                           size);

    return 0;
}

void kvm_arch_remove_all_hw_breakpoints(void)
{
461 462 463
    nb_hw_breakpoints = 0;
    g_free(hw_breakpoints);
    hw_breakpoints = NULL;
464 465 466 467
}

/*
 * Fill the architecture part of @dbg with the registered hardware
 * breakpoints.
 *
 * With at least one breakpoint, the array is handed over as is, the
 * phys_addr of each entry is refreshed from its address and the
 * ENABLE/USE_HW_BP control flags are set. Without breakpoints the arch
 * fields are cleared and the control flags are left alone.
 */
void kvm_arch_update_guest_debug(CPUState *cpu, struct kvm_guest_debug *dbg)
{
    int idx;

    if (nb_hw_breakpoints <= 0) {
        dbg->arch.nr_hw_bp = 0;
        dbg->arch.hw_bp = NULL;
        return;
    }

    dbg->arch.nr_hw_bp = nb_hw_breakpoints;
    dbg->arch.hw_bp = hw_breakpoints;

    for (idx = 0; idx < nb_hw_breakpoints; ++idx) {
        struct kvm_hw_breakpoint *bp = &hw_breakpoints[idx];

        bp->phys_addr = s390_cpu_get_phys_addr_debug(cpu, bp->addr);
    }

    dbg->control |= KVM_GUESTDBG_ENABLE | KVM_GUESTDBG_USE_HW_BP;
}

A
Andreas Färber 已提交
485
/* Hook invoked before entering the guest; intentionally does nothing. */
void kvm_arch_pre_run(CPUState *cpu, struct kvm_run *run)
{
}

A
Andreas Färber 已提交
489
/* Hook invoked after leaving the guest; intentionally does nothing. */
void kvm_arch_post_run(CPUState *cpu, struct kvm_run *run)
{
}

A
Andreas Färber 已提交
493
/* Report the halted state of @cs; no other events are processed here. */
int kvm_arch_process_async_events(CPUState *cs)
{
    int halted = cs->halted;

    return halted;
}

498
/*
 * Inject an interrupt through the KVM_S390_INTERRUPT ioctl.
 *
 * @type, @parm and @parm64 are passed to the kernel unchanged. A non-zero
 * @vm issues the ioctl on the VM, otherwise on the vcpu of @cpu.
 *
 * Does nothing if the CPU has no KVM state. If the kernel rejects the
 * interrupt, an error is printed and QEMU exits.
 */
void kvm_s390_interrupt_internal(S390CPU *cpu, int type, uint32_t parm,
                                 uint64_t parm64, int vm)
{
    CPUState *cs = CPU(cpu);
    struct kvm_s390_interrupt kvmint = {
        .type = type,
        .parm = parm,
        .parm64 = parm64,
    };
    int ret;

    if (!cs->kvm_state) {
        return;
    }

    if (!vm) {
        ret = kvm_vcpu_ioctl(cs, KVM_S390_INTERRUPT, &kvmint);
    } else {
        ret = kvm_vm_ioctl(cs->kvm_state, KVM_S390_INTERRUPT, &kvmint);
    }

    if (ret < 0) {
        fprintf(stderr, "KVM failed to inject interrupt\n");
        exit(1);
    }
}

525
/*
 * Inject a virtio interrupt on the VM, with @config_change as the 32-bit
 * parameter and @token as the 64-bit parameter.
 */
void kvm_s390_virtio_irq(S390CPU *cpu, int config_change, uint64_t token)
{
    const int vm_wide = 1;

    kvm_s390_interrupt_internal(cpu, KVM_S390_INT_VIRTIO, config_change,
                                token, vm_wide);
}

531
/*
 * Inject an interrupt of @type on the vcpu of @cpu, with @code as the
 * 32-bit parameter and a 64-bit parameter of 0.
 */
void kvm_s390_interrupt(S390CPU *cpu, int type, uint32_t code)
{
    const uint64_t no_parm64 = 0;
    const int vm_wide = 0;

    kvm_s390_interrupt_internal(cpu, type, code, no_parm64, vm_wide);
}

536
/* Inject a program interrupt with interruption code @code into @cpu. */
static void enter_pgmcheck(S390CPU *cpu, uint16_t code)
{
    uint32_t pgm_code = code;

    kvm_s390_interrupt(cpu, KVM_S390_PROGRAM_INT, pgm_code);
}

541
/*
 * Handle an intercepted SCLP service call.
 *
 * The low nibble of @ipbh0 selects the register holding the SCCB address,
 * the next nibble the register holding the command code. A negative result
 * from sclp_service_call() is turned into a program interrupt with the
 * negated value as code; any other result becomes the condition code.
 *
 * Always returns 0.
 */
static int kvm_sclp_service_call(S390CPU *cpu, struct kvm_run *run,
                                 uint16_t ipbh0)
{
    CPUS390XState *env = &cpu->env;
    uint64_t sccb;
    uint32_t code;
    int rc;

    cpu_synchronize_state(CPU(cpu));
    sccb = env->regs[ipbh0 & 0xf];
    code = env->regs[(ipbh0 >> 4) & 0xf];

    rc = sclp_service_call(env, sccb, code);
    if (rc >= 0) {
        setcc(cpu, rc);
    } else {
        enter_pgmcheck(cpu, -rc);
    }

    return 0;
}

563
/*
 * Dispatch an intercepted instruction with major opcode 0xb2.
 *
 * @ipa1 is the second opcode byte. The channel I/O instructions are
 * forwarded to the ioinst handlers, the SCLP service call is handled
 * locally.
 *
 * Returns the result of the SCLP handler for PRIV_B2_SCLP_CALL, -1 for an
 * unknown opcode and 0 otherwise.
 */
static int handle_b2(S390CPU *cpu, struct kvm_run *run, uint8_t ipa1)
{
    CPUS390XState *env = &cpu->env;
    uint16_t ipbh0 = (run->s390_sieic.ipb & 0xffff0000) >> 16;
    int rc = 0;

    cpu_synchronize_state(CPU(cpu));

    /* Cases are listed in ascending opcode order. */
    switch (ipa1) {
    case PRIV_B2_SCLP_CALL:
        rc = kvm_sclp_service_call(cpu, run, ipbh0);
        break;
    case PRIV_B2_CSCH:
        ioinst_handle_csch(cpu, env->regs[1]);
        break;
    case PRIV_B2_HSCH:
        ioinst_handle_hsch(cpu, env->regs[1]);
        break;
    case PRIV_B2_MSCH:
        ioinst_handle_msch(cpu, env->regs[1], run->s390_sieic.ipb);
        break;
    case PRIV_B2_SSCH:
        ioinst_handle_ssch(cpu, env->regs[1], run->s390_sieic.ipb);
        break;
    case PRIV_B2_STSCH:
        ioinst_handle_stsch(cpu, env->regs[1], run->s390_sieic.ipb);
        break;
    case PRIV_B2_TSCH:
        /* We should only get tsch via KVM_EXIT_S390_TSCH. */
        fprintf(stderr, "Spurious tsch intercept\n");
        break;
    case PRIV_B2_TPI:
        /* This should have been handled by kvm already. */
        fprintf(stderr, "Spurious tpi intercept\n");
        break;
    case PRIV_B2_SAL:
        ioinst_handle_sal(cpu, env->regs[1]);
        break;
    case PRIV_B2_RSCH:
        ioinst_handle_rsch(cpu, env->regs[1]);
        break;
    case PRIV_B2_STCRW:
        ioinst_handle_stcrw(cpu, run->s390_sieic.ipb);
        break;
    case PRIV_B2_STCPS:
        /* We do not provide this instruction, it is suppressed. */
        break;
    case PRIV_B2_RCHP:
        ioinst_handle_rchp(cpu, env->regs[1]);
        break;
    case PRIV_B2_SCHM:
        ioinst_handle_schm(cpu, env->regs[1], env->regs[2],
                           run->s390_sieic.ipb);
        break;
    case PRIV_B2_CHSC:
        ioinst_handle_chsc(cpu, run->s390_sieic.ipb);
        break;
    case PRIV_B2_SIGA:
        /* Not provided, set CC = 3 for subchannel not operational */
        setcc(cpu, 3);
        break;
    case PRIV_B2_XSCH:
        ioinst_handle_xsch(cpu, env->regs[1]);
        break;
    default:
        rc = -1;
        DPRINTF("KVM: unhandled PRIV: 0xb2%x\n", ipa1);
        break;
    }

    return rc;
}

636
/*
 * Handle an intercepted instruction with major opcode 0xb9.
 *
 * No 0xb9 instruction is emulated: EQBS just gets an exception injected by
 * the caller, anything else is additionally logged as unhandled. Always
 * returns -1.
 */
static int handle_b9(S390CPU *cpu, struct kvm_run *run, uint8_t ipa1)
{
    if (ipa1 != PRIV_B9_EQBS) {
        DPRINTF("KVM: unhandled PRIV: 0xb9%x\n", ipa1);
    }

    return -1;
}

/*
 * Handle an intercepted instruction with major opcode 0xeb.
 *
 * No 0xeb instruction is emulated: SQBS just gets an exception injected by
 * the caller, anything else is additionally logged as unhandled. Always
 * returns -1.
 */
static int handle_eb(S390CPU *cpu, struct kvm_run *run, uint8_t ipa1)
{
    if (ipa1 != PRIV_EB_SQBS) {
        DPRINTF("KVM: unhandled PRIV: 0xeb%x\n", ipa1);
    }

    return -1;
}

672
/*
 * Handle the KVM virtio hypercall (DIAG 0x500).
 *
 * An -EINVAL result from s390_virtio_hypercall() is converted into a
 * specification program interrupt and reported as handled (0); every other
 * result is returned to the caller unchanged.
 */
static int handle_hypercall(S390CPU *cpu, struct kvm_run *run)
{
    CPUS390XState *env = &cpu->env;
    int rc;

    cpu_synchronize_state(CPU(cpu));

    rc = s390_virtio_hypercall(env);
    if (rc != -EINVAL) {
        return rc;
    }

    enter_pgmcheck(cpu, PGM_SPECIFICATION);
    return 0;
}

687 688 689 690 691 692 693 694 695 696
/*
 * Handle DIAG 0x308 (IPL functions).
 *
 * Decodes the two register numbers from the low byte of the intercepted
 * instruction's first halfword (r1 in the upper nibble, r3 in the lower
 * nibble) and forwards them to handle_diag_308().
 */
static void kvm_handle_diag_308(S390CPU *cpu, struct kvm_run *run)
{
    uint64_t r1, r3;

    cpu_synchronize_state(CPU(cpu));
    /*
     * The r1 field is bits 4-7 of the halfword, so it has to be shifted
     * down by 4. Shifting the masked value by 8 would always yield 0.
     */
    r1 = (run->s390_sieic.ipa & 0x00f0) >> 4;
    r3 = run->s390_sieic.ipa & 0x000f;
    handle_diag_308(&cpu->env, r1, r3);
}

697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712
/*
 * Handle DIAG 0x501, the software breakpoint instruction.
 *
 * The PSW address is 4 bytes past the breakpoint instruction. If a
 * breakpoint is registered at that earlier address, the PSW is rewound to
 * it and EXCP_DEBUG is returned; otherwise -ENOENT is returned.
 */
static int handle_sw_breakpoint(S390CPU *cpu, struct kvm_run *run)
{
    CPUS390XState *env = &cpu->env;
    unsigned long bp_addr;

    cpu_synchronize_state(CPU(cpu));

    bp_addr = env->psw.addr - 4;
    if (!kvm_find_sw_breakpoint(CPU(cpu), bp_addr)) {
        return -ENOENT;
    }

    env->psw.addr = bp_addr;
    return EXCP_DEBUG;
}

C
Cornelia Huck 已提交
713 714 715
#define DIAG_KVM_CODE_MASK 0x000000000000ffff

/*
 * Dispatch an intercepted DIAGNOSE instruction.
 *
 * For any diagnose call we support, bits 48-63 of the resulting address
 * specify the function code; the remainder is ignored.
 *
 * Returns the result of the selected handler, 0 for DIAG_IPL, or -1 for an
 * unknown function code.
 */
static int handle_diag(S390CPU *cpu, struct kvm_run *run, uint32_t ipb)
{
    uint16_t func_code;

    func_code = decode_basedisp_rs(&cpu->env, ipb) & DIAG_KVM_CODE_MASK;

    switch (func_code) {
    case DIAG_IPL:
        kvm_handle_diag_308(cpu, run);
        return 0;
    case DIAG_KVM_HYPERCALL:
        return handle_hypercall(cpu, run);
    case DIAG_KVM_BREAKPOINT:
        return handle_sw_breakpoint(cpu, run);
    default:
        DPRINTF("KVM: unknown DIAG: 0x%x\n", func_code);
        return -1;
    }
}

T
Thomas Huth 已提交
744 745 746 747 748 749 750 751
/*
 * Start @cpu: add it to the set of running CPUs and kick it.
 * Always returns 0.
 */
static int kvm_s390_cpu_start(S390CPU *cpu)
{
    CPUState *cs = CPU(cpu);

    s390_add_running_cpu(cpu);
    qemu_cpu_kick(cs);
    DPRINTF("DONE: KVM cpu start: %p\n", &cpu->env);

    return 0;
}

752
/*
 * Restart @cpu: inject a restart interrupt, add the CPU to the set of
 * running CPUs and kick it. Always returns 0.
 */
int kvm_s390_cpu_restart(S390CPU *cpu)
{
    CPUState *cs = CPU(cpu);

    kvm_s390_interrupt(cpu, KVM_S390_RESTART, 0);
    s390_add_running_cpu(cpu);
    qemu_cpu_kick(cs);
    DPRINTF("DONE: KVM cpu restart: %p\n", &cpu->env);

    return 0;
}

761
static void sigp_initial_cpu_reset(void *arg)
A
Alexander Graf 已提交
762
{
763 764
    CPUState *cpu = arg;
    S390CPUClass *scc = S390_CPU_GET_CLASS(cpu);
765

766 767
    cpu_synchronize_state(cpu);
    scc->initial_cpu_reset(cpu);
A
Alexander Graf 已提交
768 769
}

770 771 772 773 774 775 776 777 778
/*
 * run_on_cpu() callback for SIGP CPU RESET.
 *
 * @arg is the CPUState of the target CPU. Its state is synchronized before
 * the class's cpu_reset handler is invoked.
 */
static void sigp_cpu_reset(void *arg)
{
    CPUState *target = arg;
    S390CPUClass *klass = S390_CPU_GET_CLASS(target);

    cpu_synchronize_state(target);
    klass->cpu_reset(target);
}

779 780
#define SIGP_ORDER_MASK 0x000000ff

A
Andreas Färber 已提交
781
/*
 * Handle an intercepted SIGNAL PROCESSOR instruction.
 *
 * The upper nibble of @ipa1 selects the status register, the lower nibble
 * the register holding the target CPU address. The order code is taken
 * from the low byte of the decoded base/displacement address.
 *
 * The result is delivered through the condition code: 3 if the target CPU
 * does not exist, 1 with a status stored for SET ARCHITECTURE and unknown
 * orders, otherwise the result of the order. Always returns 0.
 */
static int handle_sigp(S390CPU *cpu, struct kvm_run *run, uint8_t ipa1)
{
    CPUS390XState *env = &cpu->env;
    uint64_t *statusreg = &env->regs[ipa1 >> 4];
    S390CPU *target_cpu;
    uint16_t cpu_addr;
    uint8_t order_code;
    int cc;

    cpu_synchronize_state(CPU(cpu));

    order_code = decode_basedisp_rs(env, run->s390_sieic.ipb) & SIGP_ORDER_MASK;
    cpu_addr = env->regs[ipa1 & 0x0f];

    target_cpu = s390_cpu_addr2state(cpu_addr);
    if (target_cpu == NULL) {
        /* not operational */
        cc = 3;
    } else {
        switch (order_code) {
        case SIGP_START:
            cc = kvm_s390_cpu_start(target_cpu);
            break;
        case SIGP_RESTART:
            cc = kvm_s390_cpu_restart(target_cpu);
            break;
        case SIGP_SET_ARCH:
            *statusreg &= 0xffffffff00000000UL;
            *statusreg |= SIGP_STAT_INVALID_PARAMETER;
            cc = 1;   /* status stored */
            break;
        case SIGP_INITIAL_CPU_RESET:
            run_on_cpu(CPU(target_cpu), sigp_initial_cpu_reset,
                       CPU(target_cpu));
            cc = 0;
            break;
        case SIGP_CPU_RESET:
            run_on_cpu(CPU(target_cpu), sigp_cpu_reset, CPU(target_cpu));
            cc = 0;
            break;
        default:
            DPRINTF("KVM: unknown SIGP: 0x%x\n", order_code);
            *statusreg &= 0xffffffff00000000UL;
            *statusreg |= SIGP_STAT_INVALID_ORDER;
            cc = 1;   /* status stored */
            break;
        }
    }

    setcc(cpu, cc);
    return 0;
}

835
/*
 * Dispatch an instruction intercept by the first opcode byte.
 *
 * If no handler exists for the opcode, or the handler returns a negative
 * value, a program interrupt with code 0x0001 is injected and 0 is
 * returned. Otherwise the handler's result is returned.
 */
static int handle_instruction(S390CPU *cpu, struct kvm_run *run)
{
    unsigned int ipa0 = (run->s390_sieic.ipa & 0xff00);
    uint8_t ipa1 = run->s390_sieic.ipa & 0x00ff;
    int rc;

    DPRINTF("handle_instruction 0x%x 0x%x\n",
            run->s390_sieic.ipa, run->s390_sieic.ipb);

    switch (ipa0) {
    case IPA0_DIAG:
        rc = handle_diag(cpu, run, run->s390_sieic.ipb);
        break;
    case IPA0_SIGP:
        rc = handle_sigp(cpu, run, ipa1);
        break;
    case IPA0_B2:
        rc = handle_b2(cpu, run, ipa1);
        break;
    case IPA0_B9:
        rc = handle_b9(cpu, run, ipa1);
        break;
    case IPA0_EB:
        rc = handle_eb(cpu, run, ipa1);
        break;
    default:
        rc = -1;
        break;
    }

    if (rc < 0) {
        enter_pgmcheck(cpu, 0x0001);
        return 0;
    }

    return rc;
}

A
Andreas Färber 已提交
869
/*
 * Tell whether the PSW address of @cs is 0xfff, the value used to
 * signal quiesce.
 */
static bool is_special_wait_psw(CPUState *cs)
{
    struct kvm_run *run = cs->kvm_run;

    return run->psw_addr == 0xfffUL;
}

875
/*
 * Handle a SIE intercept according to its intercept code.
 *
 * Instruction intercepts return the result of handle_instruction(). Wait
 * PSW and CPU stop intercepts remove the CPU from the set of running CPUs
 * and return EXCP_HALTED; when the result of s390_del_running_cpu() is 0
 * this additionally triggers a shutdown request or, for a wait PSW that is
 * not the quiesce one, a guest-panicked event followed by a VM stop. All
 * other intercept codes are fatal: an error is printed and QEMU exits.
 */
static int handle_intercept(S390CPU *cpu)
{
    CPUState *cs = CPU(cpu);
    struct kvm_run *run = cs->kvm_run;
    int icpt_code = run->s390_sieic.icptcode;

    DPRINTF("intercept: 0x%x (at 0x%lx)\n", icpt_code,
            (long)cs->kvm_run->psw_addr);

    switch (icpt_code) {
    case ICPT_INSTRUCTION:
        return handle_instruction(cpu, run);

    case ICPT_WAITPSW:
        /* disabled wait, since enabled wait is handled in kernel */
        if (s390_del_running_cpu(cpu) == 0) {
            if (!is_special_wait_psw(cs)) {
                QObject *data;

                data = qobject_from_jsonf("{ 'action': %s }", "pause");
                monitor_protocol_event(QEVENT_GUEST_PANICKED, data);
                qobject_decref(data);
                vm_stop(RUN_STATE_GUEST_PANICKED);
            } else {
                qemu_system_shutdown_request();
            }
        }
        return EXCP_HALTED;

    case ICPT_CPU_STOP:
        if (s390_del_running_cpu(cpu) == 0) {
            qemu_system_shutdown_request();
        }
        return EXCP_HALTED;

    case ICPT_SOFT_INTERCEPT:
        fprintf(stderr, "KVM unimplemented icpt SOFT\n");
        exit(1);
        break;

    case ICPT_IO:
        fprintf(stderr, "KVM unimplemented icpt IO\n");
        exit(1);
        break;

    default:
        fprintf(stderr, "Unknown intercept code: %d\n", icpt_code);
        exit(1);
        break;
    }

    return 0;
}

927 928 929 930 931 932 933
/*
 * Handle a KVM_EXIT_S390_TSCH exit for @cpu.
 *
 * Synchronizes the register state, then calls ioinst_handle_tsch() with
 * general register 1 and the ipb from the kvm_run area.
 *
 * Return value, based on the result of ioinst_handle_tsch():
 *   >= 0  the value is set as condition code via setcc(); returns 0
 *   <  -1 a dequeued I/O interrupt (if any) is injected again; returns 0
 *   == -1 returned to the caller unchanged
 */
static int handle_tsch(S390CPU *cpu)
{
    CPUS390XState *env = &cpu->env;
    CPUState *cs = CPU(cpu);
    struct kvm_run *run = cs->kvm_run;
    int ret;

    cpu_synchronize_state(cs);

    ret = ioinst_handle_tsch(env, env->regs[1], run->s390_tsch.ipb);
    if (ret >= 0) {
        /* Success; set condition code. */
        setcc(cpu, ret);
        ret = 0;
    } else if (ret < -1) {
        /*
         * Failure.
         * If an I/O interrupt had been dequeued, we have to reinject it.
         */
        if (run->s390_tsch.dequeued) {
            uint16_t subchannel_id = run->s390_tsch.subchannel_id;
            uint16_t subchannel_nr = run->s390_tsch.subchannel_nr;
            uint32_t io_int_parm = run->s390_tsch.io_int_parm;
            uint32_t io_int_word = run->s390_tsch.io_int_word;
            /*
             * The uint16_t operands would be promoted to (signed) int, and
             * shifting them by 24 or 16 bits can overflow that type, which
             * is undefined behaviour.  Do the shifts in uint32_t instead;
             * the resulting value is unchanged.
             *
             * NOTE(review): the bits selected by 0xff00 are shifted past
             * bit 31 and so never contribute to the result - verify the
             * shift amounts against the KVM_S390_INT_IO() layout.
             */
            uint32_t type = ((uint32_t)(subchannel_id & 0xff00) << 24) |
                ((uint32_t)(subchannel_id & 0x00060) << 22) |
                ((uint32_t)subchannel_nr << 16);

            kvm_s390_interrupt_internal(cpu, type,
                                        ((uint32_t)subchannel_id << 16)
                                        | subchannel_nr,
                                        ((uint64_t)io_int_parm << 32)
                                        | io_int_word, 1);
        }
        ret = 0;
    }
    return ret;
}

965 966
/*
 * Evaluate the debug exit information stored in the vcpu's kvm_run area.
 *
 * Returns EXCP_DEBUG when the event matches a registered hardware
 * breakpoint/watchpoint or when single-stepping is enabled, 0 when the
 * event is of a known type but does not match, and -ENOSYS for an
 * unknown debug exit type.
 */
static int kvm_arch_handle_debug_exit(S390CPU *cpu)
{
    CPUState *cs = CPU(cpu);
    struct kvm_debug_exit_arch *dbg = &cs->kvm_run->debug.arch;

    switch (dbg->type) {
    case KVM_HW_WP_WRITE:
        if (!find_hw_breakpoint(dbg->addr, -1, dbg->type)) {
            return 0;
        }
        /* Record which address was written so the hit can be reported. */
        cs->watchpoint_hit = &hw_watchpoint;
        hw_watchpoint.vaddr = dbg->addr;
        hw_watchpoint.flags = BP_MEM_WRITE;
        return EXCP_DEBUG;

    case KVM_HW_BP:
        return find_hw_breakpoint(dbg->addr, -1, dbg->type) ? EXCP_DEBUG : 0;

    case KVM_SINGLESTEP:
        return cs->singlestep_enabled ? EXCP_DEBUG : 0;

    default:
        return -ENOSYS;
    }
}

A
Andreas Färber 已提交
999
/*
 * Architecture hook for KVM exits: dispatch on run->exit_reason.
 *
 * An unknown exit reason is only reported on stderr.  A handler result of
 * 0 (including the reset and unknown-exit cases) is turned into
 * EXCP_INTERRUPT; any other handler result is returned unchanged.
 */
int kvm_arch_handle_exit(CPUState *cs, struct kvm_run *run)
{
    S390CPU *cpu = S390_CPU(cs);
    int result = 0;

    switch (run->exit_reason) {
    case KVM_EXIT_S390_SIEIC:
        result = handle_intercept(cpu);
        break;
    case KVM_EXIT_S390_RESET:
        qemu_system_reset_request();
        break;
    case KVM_EXIT_S390_TSCH:
        result = handle_tsch(cpu);
        break;
    case KVM_EXIT_DEBUG:
        result = kvm_arch_handle_debug_exit(cpu);
        break;
    default:
        fprintf(stderr, "Unknown KVM exit: %d\n", run->exit_reason);
        break;
    }

    return result == 0 ? EXCP_INTERRUPT : result;
}
1027

A
Andreas Färber 已提交
1028
/* Always answers true; @cpu is not inspected. */
bool kvm_arch_stop_on_emulation_error(CPUState *cpu)
{
    (void)cpu;

    return true;
}
1032

A
Andreas Färber 已提交
1033
/* Always returns 1; none of the arguments is inspected. */
int kvm_arch_on_sigbus_vcpu(CPUState *cpu, int code, void *addr)
{
    (void)cpu;
    (void)code;
    (void)addr;

    return 1;
}

/* Always returns 1; neither argument is inspected. */
int kvm_arch_on_sigbus(int code, void *addr)
{
    (void)code;
    (void)addr;

    return 1;
}
1042 1043 1044 1045 1046 1047 1048

/*
 * Inject an I/O interrupt through kvm_s390_interrupt_internal().
 *
 * @cpu:           vcpu handed on to kvm_s390_interrupt_internal()
 * @subchannel_id: placed in the upper 16 bits of the 32-bit parameter
 * @subchannel_nr: placed in the lower 16 bits of the 32-bit parameter
 * @io_int_parm:   placed in the upper 32 bits of the 64-bit parameter
 * @io_int_word:   placed in the lower 32 bits of the 64-bit parameter
 *
 * If IO_INT_WORD_AI is set in @io_int_word the interrupt type is
 * KVM_S390_INT_IO(1, 0, 0, 0); otherwise it is derived from the
 * subchannel id and number.
 */
void kvm_s390_io_interrupt(S390CPU *cpu, uint16_t subchannel_id,
                           uint16_t subchannel_nr, uint32_t io_int_parm,
                           uint32_t io_int_word)
{
    uint32_t type;

    if (io_int_word & IO_INT_WORD_AI) {
        type = KVM_S390_INT_IO(1, 0, 0, 0);
    } else {
        /*
         * The uint16_t operands would be promoted to (signed) int, and
         * shifting them by 24 or 16 bits can overflow that type, which is
         * undefined behaviour.  Do the shifts in uint32_t instead; the
         * resulting value is unchanged.
         *
         * NOTE(review): the bits selected by 0xff00 are shifted past
         * bit 31 and so never contribute to the result - verify the shift
         * amounts against the KVM_S390_INT_IO() layout.
         */
        type = ((uint32_t)(subchannel_id & 0xff00) << 24) |
            ((uint32_t)(subchannel_id & 0x00060) << 22) |
            ((uint32_t)subchannel_nr << 16);
    }
    kvm_s390_interrupt_internal(cpu, type,
                                ((uint32_t)subchannel_id << 16) | subchannel_nr,
                                ((uint64_t)io_int_parm << 32) | io_int_word, 1);
}

/*
 * Inject a KVM_S390_MCHK interrupt with fixed parameter values through
 * kvm_s390_interrupt_internal().
 * NOTE(review): going by the function name the constants describe a
 * channel-report-pending machine check - confirm against the architecture
 * documentation.
 */
void kvm_s390_crw_mchk(S390CPU *cpu)
{
    const uint32_t mchk_parm = 1 << 28;
    const uint64_t mchk_parm64 = 0x00400f1d40330000;

    kvm_s390_interrupt_internal(cpu, KVM_S390_MCHK, mchk_parm, mchk_parm64, 1);
}

/*
 * Enable KVM_CAP_S390_CSS_SUPPORT (host kernel channel subsystem support)
 * on the given vcpu.  Enabling the capability is asserted to succeed.
 */
void kvm_s390_enable_css_support(S390CPU *cpu)
{
    CPUState *cs = CPU(cpu);
    int rc = kvm_vcpu_enable_cap(cs, KVM_CAP_S390_CSS_SUPPORT, 0);

    assert(rc == 0);
}
1074 1075 1076

/*
 * Set the irqfd/GSI routing flags when the kernel offers
 * KVM_CAP_IRQ_ROUTING; does nothing otherwise.
 */
void kvm_arch_init_irq_routing(KVMState *s)
{
    if (!kvm_check_extension(s, KVM_CAP_IRQ_ROUTING)) {
        return;
    }

    kvm_irqfds_allowed = true;
    kvm_gsi_routing_allowed = true;
    /*
     * irqchip capabilities normally imply that cpu states are handled
     * in-kernel as well.  That is not (yet) true for s390, so the
     * kvm_halt_in_kernel_allowed setting made by common code has to be
     * overridden here.
     */
    kvm_halt_in_kernel_allowed = false;
}
C
Cornelia Huck 已提交
1088

1089 1090
/*
 * Assign or deassign a virtio-ccw notify ioeventfd.
 *
 * @notifier: event notifier whose file descriptor is registered
 * @sch:      value stored in the ioeventfd's addr field
 * @vq:       value stored in the ioeventfd's datamatch field
 * @assign:   true to assign, false to deassign
 *
 * Returns -ENOSYS when KVM_CAP_IOEVENTFD is not available, otherwise the
 * result of the KVM_IOEVENTFD vm ioctl.
 */
int kvm_s390_assign_subch_ioeventfd(EventNotifier *notifier, uint32_t sch,
                                    int vq, bool assign)
{
    struct kvm_ioeventfd request = {
        .datamatch = vq,
        .addr = sch,
        .len = 8,
        .fd = event_notifier_get_fd(notifier),
        .flags = KVM_IOEVENTFD_FLAG_VIRTIO_CCW_NOTIFY |
                 KVM_IOEVENTFD_FLAG_DATAMATCH,
    };

    if (!kvm_check_extension(kvm_state, KVM_CAP_IOEVENTFD)) {
        return -ENOSYS;
    }

    if (assign == false) {
        request.flags |= KVM_IOEVENTFD_FLAG_DEASSIGN;
    }

    return kvm_vm_ioctl(kvm_state, KVM_IOEVENTFD, &request);
}