pc.c 29.1 KB
Newer Older
B
bellard 已提交
1 2
/*
 * QEMU PC System Emulator
3
 *
B
bellard 已提交
4
 * Copyright (c) 2003-2004 Fabrice Bellard
5
 *
B
bellard 已提交
6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
P
pbrook 已提交
24 25
#include "hw.h"
#include "pc.h"
26
#include "apic.h"
P
pbrook 已提交
27
#include "fdc.h"
28
#include "ide.h"
P
pbrook 已提交
29
#include "pci.h"
30
#include "vmware_vga.h"
A
aliguori 已提交
31
#include "monitor.h"
32
#include "fw_cfg.h"
A
aliguori 已提交
33
#include "hpet_emul.h"
34
#include "smbios.h"
B
Blue Swirl 已提交
35 36
#include "loader.h"
#include "elf.h"
37
#include "multiboot.h"
38
#include "mc146818rtc.h"
B
Blue Swirl 已提交
39
#include "msix.h"
J
Jan Kiszka 已提交
40
#include "sysbus.h"
41
#include "sysemu.h"
B
bellard 已提交
42

B
bellard 已提交
43 44 45
/* output Bochs bios info messages */
//#define DEBUG_BIOS

B
Blue Swirl 已提交
46 47 48 49 50 51 52 53 54 55
/* debug PC/ISA interrupts */
//#define DEBUG_IRQ

#ifdef DEBUG_IRQ
/* Trace helper: prints the message prefixed with "CPUIRQ: ". */
#define DPRINTF(fmt, ...)                                       \
    do { printf("CPUIRQ: " fmt , ## __VA_ARGS__); } while (0)
#else
/*
 * Tracing disabled: still expand to a single (empty) statement so that
 * "if (x) DPRINTF(...); else ..." parses the same way in both builds.
 */
#define DPRINTF(fmt, ...)                                       \
    do { } while (0)
#endif

B
bellard 已提交
56 57
#define BIOS_FILENAME "bios.bin"

58 59
#define PC_MAX_BIOS_SIZE (4 * 1024 * 1024)

60 61
/* Leave a chunk of memory at the top of RAM for the BIOS ACPI tables.  */
#define ACPI_DATA_SIZE       0x10000
62
#define BIOS_CFG_IOPORT 0x510
63
#define FW_CFG_ACPI_TABLES (FW_CFG_ARCH_LOCAL + 0)
64
#define FW_CFG_SMBIOS_ENTRIES (FW_CFG_ARCH_LOCAL + 1)
J
Jes Sorensen 已提交
65
#define FW_CFG_IRQ0_OVERRIDE (FW_CFG_ARCH_LOCAL + 2)
J
Jes Sorensen 已提交
66
#define FW_CFG_E820_TABLE (FW_CFG_ARCH_LOCAL + 3)
67
#define FW_CFG_HPET (FW_CFG_ARCH_LOCAL + 4)
B
bellard 已提交
68

B
Blue Swirl 已提交
69 70
#define MSI_ADDR_BASE 0xfee00000

J
Jes Sorensen 已提交
71 72 73 74 75 76 77 78 79 80 81 82 83 84 85
#define E820_NR_ENTRIES		16

/* One e820 entry: the address, length and type given to e820_add_entry(). */
struct e820_entry {
    uint64_t address;
    uint64_t length;
    uint32_t type;
};

/* Fixed-capacity list of e820 entries; count is the number of slots in use. */
struct e820_table {
    uint32_t count;
    struct e820_entry entry[E820_NR_ENTRIES];
};

/*
 * The single table instance.  It is filled by e820_add_entry() and handed
 * to fw_cfg as raw bytes (sizeof(struct e820_table)) in bochs_bios_init().
 * NOTE(review): because the bytes are exported as-is, compiler-inserted
 * padding becomes part of the exported data - confirm the consumer expects
 * this exact layout.
 */
static struct e820_table e820_table;

86
void isa_irq_handler(void *opaque, int n, int level)
87 88 89
{
    IsaIrqState *isa = (IsaIrqState *)opaque;

B
Blue Swirl 已提交
90
    DPRINTF("isa_irqs: %s irq %d\n", level? "raise" : "lower", n);
A
Avi Kivity 已提交
91 92 93
    if (n < 16) {
        qemu_set_irq(isa->i8259[n], level);
    }
G
Gerd Hoffmann 已提交
94 95
    if (isa->ioapic)
        qemu_set_irq(isa->ioapic[n], level);
A
Avi Kivity 已提交
96
};
97

B
bellard 已提交
98
/*
 * I/O write handler that deliberately does nothing: the written value is
 * discarded.  (Named for port 0x80; the registration is not in this part
 * of the file.)
 */
static void ioport80_write(void *opaque, uint32_t addr, uint32_t data)
{
}

102
/* MSDOS compatibility mode FPU exception support */
P
pbrook 已提交
103
static qemu_irq ferr_irq;
104 105 106 107 108 109

/*
 * Remember irq as the line used for FPU error reporting: cpu_set_ferr()
 * raises it and ioportF0_write() lowers it.
 */
void pc_register_ferr_irq(qemu_irq irq)
{
    ferr_irq = irq;
}

110 111 112
/* XXX: add IGNNE support */
/*
 * Raise the interrupt line registered with pc_register_ferr_irq().
 * The CPU state argument s is not used.
 */
void cpu_set_ferr(CPUX86State *s)
{
    qemu_irq_raise(ferr_irq);
}

static void ioportF0_write(void *opaque, uint32_t addr, uint32_t data)
{
P
pbrook 已提交
118
    qemu_irq_lower(ferr_irq);
119 120
}

B
bellard 已提交
121 122 123
/* TSC handling */
/*
 * Return the time stamp counter value.  The value comes straight from
 * cpu_get_ticks(); env is not consulted.
 */
uint64_t cpu_get_tsc(CPUX86State *env)
{
    return cpu_get_ticks();
}

B
bellard 已提交
127
/* SMM support */
128 129 130 131 132 133 134 135 136 137 138 139

/* Callback and its argument, invoked by cpu_smm_update(). */
static cpu_set_smm_t smm_set;
static void *smm_arg;

/*
 * Install the SMM state-change callback and the argument passed to it.
 * Only one registration is allowed: both slots must still be NULL,
 * otherwise the asserts fire.
 */
void cpu_smm_register(cpu_set_smm_t callback, void *arg)
{
    assert(smm_set == NULL);
    assert(smm_arg == NULL);
    smm_set = callback;
    smm_arg = arg;
}

B
bellard 已提交
140 141
/*
 * Report the SMM state of env to the registered callback.
 *
 * The callback is invoked only when both a callback and a non-NULL
 * argument have been registered and env is first_cpu.  It receives 1 when
 * HF_SMM_MASK is set in env->hflags and 0 otherwise.
 */
void cpu_smm_update(CPUState *env)
{
    if (smm_set && smm_arg && env == first_cpu) {
        smm_set(!!(env->hflags & HF_SMM_MASK), smm_arg);
    }
}


B
bellard 已提交
147 148 149 150 151
/* IRQ handling */
/*
 * Fetch the next interrupt number for env.
 *
 * The APIC is asked first.  If it reports an interrupt (>= 0) that number
 * is returned after pic_update_irq() has been called on the ISA PIC.
 * Otherwise the PIC is read, but only if the APIC accepts PIC interrupts;
 * if it does not, -1 is returned.
 */
int cpu_get_pic_interrupt(CPUState *env)
{
    int intno;

    intno = apic_get_interrupt(env->apic_state);
    if (intno >= 0) {
        /* set irq request if a PIC irq is still pending */
        /* XXX: improve that */
        pic_update_irq(isa_pic);
        return intno;
    }
    /* read the irq from the PIC */
    if (!apic_accept_pic_intr(env->apic_state)) {
        return -1;
    }

    intno = pic_read_irq(isa_pic);
    return intno;
}

P
pbrook 已提交
168
static void pic_irq_request(void *opaque, int irq, int level)
B
bellard 已提交
169
{
170 171
    CPUState *env = first_cpu;

B
Blue Swirl 已提交
172
    DPRINTF("pic_irqs: %s irq %d\n", level? "raise" : "lower", irq);
A
aurel32 已提交
173 174
    if (env->apic_state) {
        while (env) {
175 176 177
            if (apic_accept_pic_intr(env->apic_state)) {
                apic_deliver_pic_intr(env->apic_state, level);
            }
A
aurel32 已提交
178 179 180
            env = env->next_cpu;
        }
    } else {
A
aurel32 已提交
181 182 183 184
        if (level)
            cpu_interrupt(env, CPU_INTERRUPT_HARD);
        else
            cpu_reset_interrupt(env, CPU_INTERRUPT_HARD);
185
    }
B
bellard 已提交
186 187
}

B
bellard 已提交
188 189
/* PC cmos mappings */

B
bellard 已提交
190 191
#define REG_EQUIPMENT_BYTE          0x14

192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215
/*
 * Translate a floppy drive type code into the nibble stored in CMOS.
 *
 *   0 (1.44 MB 3.5" drive)  -> 4
 *   1 (2.88 MB 3.5" drive)  -> 5
 *   2 (1.2 MB 5.25" drive)  -> 2
 *   anything else           -> 0
 */
static int cmos_get_fd_drive_type(int fd0)
{
    static const int cmos_code[] = { 4, 5, 2 };

    if (fd0 < 0 || fd0 > 2) {
        return 0;
    }
    return cmos_code[fd0];
}

216
static void cmos_init_hd(int type_ofs, int info_ofs, BlockDriverState *hd,
217
                         ISADevice *s)
B
bellard 已提交
218 219 220 221 222 223 224 225 226 227 228 229 230 231 232
{
    int cylinders, heads, sectors;
    bdrv_get_geometry_hint(hd, &cylinders, &heads, &sectors);
    rtc_set_memory(s, type_ofs, 47);
    rtc_set_memory(s, info_ofs, cylinders);
    rtc_set_memory(s, info_ofs + 1, cylinders >> 8);
    rtc_set_memory(s, info_ofs + 2, heads);
    rtc_set_memory(s, info_ofs + 3, 0xff);
    rtc_set_memory(s, info_ofs + 4, 0xff);
    rtc_set_memory(s, info_ofs + 5, 0xc0 | ((heads > 8) << 3));
    rtc_set_memory(s, info_ofs + 6, cylinders);
    rtc_set_memory(s, info_ofs + 7, cylinders >> 8);
    rtc_set_memory(s, info_ofs + 8, sectors);
}

233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249
/* convert boot_device letter to something recognizable by the bios */
/*
 * Map a boot device letter to the 4-bit code understood by the BIOS.
 * Returns 0 for a letter that is not a known boot device.
 */
static int boot_device2nibble(char boot_device)
{
    int nibble;

    switch (boot_device) {
    case 'a':
    case 'b':
        nibble = 0x01; /* floppy boot */
        break;
    case 'c':
        nibble = 0x02; /* hard drive boot */
        break;
    case 'd':
        nibble = 0x03; /* CD-ROM boot */
        break;
    case 'n':
        nibble = 0x04; /* Network boot */
        break;
    default:
        nibble = 0;
        break;
    }
    return nibble;
}

250
/*
 * Store the boot device order in CMOS.
 *
 * s:           RTC device holding the CMOS memory
 * boot_device: string of boot device letters (see boot_device2nibble()),
 *              at most PC_MAX_BOOT_DEVICES characters
 * fd_bootchk:  when zero, bit 0 of CMOS byte 0x38 is set
 *
 * Returns 0 on success, 1 (after reporting the error) when the string is
 * too long or contains an unknown letter.  Nothing is written to CMOS in
 * the error case.
 */
static int set_boot_dev(ISADevice *s, const char *boot_device, int fd_bootchk)
{
#define PC_MAX_BOOT_DEVICES 3
    int bds[PC_MAX_BOOT_DEVICES] = { 0, };
    size_t nbds, i;

    /* keep the length as size_t so a very long string cannot wrap */
    nbds = strlen(boot_device);
    if (nbds > PC_MAX_BOOT_DEVICES) {
        error_report("Too many boot devices for PC");
        return(1);
    }
    for (i = 0; i < nbds; i++) {
        bds[i] = boot_device2nibble(boot_device[i]);
        if (bds[i] == 0) {
            error_report("Invalid boot device for PC: '%c'",
                         boot_device[i]);
            return(1);
        }
    }
    /* first and second device share byte 0x3d, the third goes to 0x38 */
    rtc_set_memory(s, 0x3d, (bds[1] << 4) | bds[0]);
    rtc_set_memory(s, 0x38, (bds[2] << 4) | (fd_bootchk ? 0x0 : 0x1));
    return(0);
}

274 275 276 277 278
static int pc_boot_set(void *opaque, const char *boot_device)
{
    return set_boot_dev(opaque, boot_device, 0);
}

279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329
/* Arguments handed from pc_cmos_init() to pc_cmos_init_late(). */
typedef struct pc_cmos_init_late_arg {
    ISADevice *rtc_state;
    BusState *idebus0, *idebus1;
} pc_cmos_init_late_arg;

/*
 * Reset handler that fills in the hard disk related CMOS bytes.
 *
 * The drives of both IDE buses are looked up, the first two get their
 * type/geometry written via cmos_init_hd(), and a 2-bit translation code
 * per drive is packed into CMOS byte 0x39.  The handler unregisters
 * itself at the end, so it runs once.
 */
static void pc_cmos_init_late(void *opaque)
{
    pc_cmos_init_late_arg *late = opaque;
    ISADevice *rtc = late->rtc_state;
    BlockDriverState *drives[4];
    int xlat_bits = 0;
    int idx;

    ide_get_bs(drives, late->idebus0);
    ide_get_bs(drives + 2, late->idebus1);

    rtc_set_memory(rtc, 0x12,
                   (drives[0] ? 0xf0 : 0) | (drives[1] ? 0x0f : 0));
    if (drives[0]) {
        cmos_init_hd(0x19, 0x1b, drives[0], rtc);
    }
    if (drives[1]) {
        cmos_init_hd(0x1a, 0x24, drives[1], rtc);
    }

    for (idx = 0; idx < 4; idx++) {
        int cyls, heads, secs, xlat;

        if (!drives[idx]) {
            continue;
        }
        /* NOTE: bdrv_get_geometry_hint() returns the physical
           geometry.  It is always such that: 1 <= sects <= 63, 1
           <= heads <= 16, 1 <= cylinders <= 16383. The BIOS
           geometry can be different if a translation is done. */
        xlat = bdrv_get_translation_hint(drives[idx]);
        if (xlat != BIOS_ATA_TRANSLATION_AUTO) {
            /* explicit hint: stored value is the hint minus one */
            xlat--;
        } else {
            bdrv_get_geometry_hint(drives[idx], &cyls, &heads, &secs);
            /* 0 = no translation, 1 = LBA translation */
            xlat = (cyls <= 1024 && heads <= 16 && secs <= 63) ? 0 : 1;
        }
        xlat_bits |= xlat << (idx * 2);
    }
    rtc_set_memory(rtc, 0x39, xlat_bits);

    qemu_unregister_reset(pc_cmos_init_late, opaque);
}

330
void pc_cmos_init(ram_addr_t ram_size, ram_addr_t above_4g_mem_size,
331 332
                  const char *boot_device,
                  BusState *idebus0, BusState *idebus1,
333
                  FDCtrl *floppy_controller, ISADevice *s)
B
bellard 已提交
334 335
{
    int val;
B
bellard 已提交
336
    int fd0, fd1, nb;
337
    static pc_cmos_init_late_arg arg;
B
bellard 已提交
338 339

    /* various important CMOS locations needed by PC/Bochs bios */
B
bellard 已提交
340 341

    /* memory size */
B
bellard 已提交
342 343 344 345
    val = 640; /* base memory in K */
    rtc_set_memory(s, 0x15, val);
    rtc_set_memory(s, 0x16, val >> 8);

B
bellard 已提交
346 347 348
    val = (ram_size / 1024) - 1024;
    if (val > 65535)
        val = 65535;
B
bellard 已提交
349 350 351 352
    rtc_set_memory(s, 0x17, val);
    rtc_set_memory(s, 0x18, val >> 8);
    rtc_set_memory(s, 0x30, val);
    rtc_set_memory(s, 0x31, val >> 8);
B
bellard 已提交
353

354 355 356 357 358 359
    if (above_4g_mem_size) {
        rtc_set_memory(s, 0x5b, (unsigned int)above_4g_mem_size >> 16);
        rtc_set_memory(s, 0x5c, (unsigned int)above_4g_mem_size >> 24);
        rtc_set_memory(s, 0x5d, (uint64_t)above_4g_mem_size >> 32);
    }

B
bellard 已提交
360 361 362 363
    if (ram_size > (16 * 1024 * 1024))
        val = (ram_size / 65536) - ((16 * 1024 * 1024) / 65536);
    else
        val = 0;
B
bellard 已提交
364 365
    if (val > 65535)
        val = 65535;
B
bellard 已提交
366 367
    rtc_set_memory(s, 0x34, val);
    rtc_set_memory(s, 0x35, val >> 8);
368

A
aurel32 已提交
369 370 371
    /* set the number of CPU */
    rtc_set_memory(s, 0x5f, smp_cpus - 1);

372
    /* set boot devices, and disable floppy signature check if requested */
373
    if (set_boot_dev(s, boot_device, fd_bootchk)) {
374 375
        exit(1);
    }
B
bellard 已提交
376

B
bellard 已提交
377 378
    /* floppy type */

379 380
    fd0 = fdctrl_get_drive_type(floppy_controller, 0);
    fd1 = fdctrl_get_drive_type(floppy_controller, 1);
B
bellard 已提交
381

382
    val = (cmos_get_fd_drive_type(fd0) << 4) | cmos_get_fd_drive_type(fd1);
B
bellard 已提交
383
    rtc_set_memory(s, 0x10, val);
384

B
bellard 已提交
385
    val = 0;
B
bellard 已提交
386
    nb = 0;
B
bellard 已提交
387 388 389 390 391 392 393 394
    if (fd0 < 3)
        nb++;
    if (fd1 < 3)
        nb++;
    switch (nb) {
    case 0:
        break;
    case 1:
B
bellard 已提交
395
        val |= 0x01; /* 1 drive, ready for boot */
B
bellard 已提交
396 397
        break;
    case 2:
B
bellard 已提交
398
        val |= 0x41; /* 2 drives, ready for boot */
B
bellard 已提交
399 400
        break;
    }
B
bellard 已提交
401 402 403 404
    val |= 0x02; /* FPU is there */
    val |= 0x04; /* PS/2 mouse installed */
    rtc_set_memory(s, REG_EQUIPMENT_BYTE, val);

B
bellard 已提交
405
    /* hard drives */
406 407 408 409
    arg.rtc_state = s;
    arg.idebus0 = idebus0;
    arg.idebus1 = idebus1;
    qemu_register_reset(pc_cmos_init_late, &arg);
B
bellard 已提交
410 411
}

B
Blue Swirl 已提交
412
static void handle_a20_line_change(void *opaque, int irq, int level)
413
{
B
Blue Swirl 已提交
414
    CPUState *cpu = opaque;
B
bellard 已提交
415

B
Blue Swirl 已提交
416 417
    /* XXX: send to all CPUs ? */
    cpu_x86_set_a20(cpu, level);
B
bellard 已提交
418 419
}

B
bellard 已提交
420 421 422
/***********************************************************/
/* Bochs BIOS debug ports */

423
/*
 * Write handler for the Bochs BIOS / VGA BIOS debug ports.
 *
 * 0x400, 0x401: BIOS panic - print the line number and exit(1)
 * 0x402, 0x403: BIOS message character (printed only with DEBUG_BIOS)
 * 0x8900:       power off once the bytes "Shutdown" arrive in sequence
 * 0x501, 0x502: VGA BIOS panic - print the line number and exit(1)
 * 0x500, 0x503: VGA BIOS message character (printed only with DEBUG_BIOS)
 *
 * Writes to any other address are ignored.
 */
static void bochs_bios_write(void *opaque, uint32_t addr, uint32_t val)
{
    /* exactly 8 characters, intentionally without a terminating NUL */
    static const char shutdown_str[8] = "Shutdown";
    /* number of characters of shutdown_str matched so far */
    static int shutdown_index = 0;

    switch(addr) {
        /* Bochs BIOS messages */
    case 0x400:
    case 0x401:
        fprintf(stderr, "BIOS panic at rombios.c, line %d\n", val);
        exit(1);
    case 0x402:
    case 0x403:
#ifdef DEBUG_BIOS
        fprintf(stderr, "%c", val);
#endif
        break;
    case 0x8900:
        /* same as Bochs power off */
        if (val == shutdown_str[shutdown_index]) {
            shutdown_index++;
            if (shutdown_index == 8) {
                shutdown_index = 0;
                qemu_system_shutdown_request();
            }
        } else {
            /* mismatch: start matching from the beginning again */
            shutdown_index = 0;
        }
        break;

        /* LGPL'ed VGA BIOS messages */
    case 0x501:
    case 0x502:
        fprintf(stderr, "VGA BIOS panic, line %d\n", val);
        exit(1);
    case 0x500:
    case 0x503:
#ifdef DEBUG_BIOS
        fprintf(stderr, "%c", val);
#endif
        break;
    }
}

J
Jes Sorensen 已提交
467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483
/*
 * Append one entry to the file-wide e820 table.
 *
 * Returns the number of entries in the table after the addition, or
 * -EBUSY when all E820_NR_ENTRIES slots are already in use (the table is
 * left untouched in that case).
 */
int e820_add_entry(uint64_t address, uint64_t length, uint32_t type)
{
    int slot = e820_table.count;
    struct e820_entry *e;

    if (slot >= E820_NR_ENTRIES) {
        return -EBUSY;
    }

    e = &e820_table.entry[slot];
    e->address = address;
    e->length = length;
    e->type = type;

    return ++e820_table.count;
}

A
Alexander Graf 已提交
484
static void *bochs_bios_init(void)
B
bellard 已提交
485
{
486
    void *fw_cfg;
487 488
    uint8_t *smbios_table;
    size_t smbios_len;
489 490
    uint64_t *numa_fw_cfg;
    int i, j;
491

B
bellard 已提交
492 493 494 495
    register_ioport_write(0x400, 1, 2, bochs_bios_write, NULL);
    register_ioport_write(0x401, 1, 2, bochs_bios_write, NULL);
    register_ioport_write(0x402, 1, 1, bochs_bios_write, NULL);
    register_ioport_write(0x403, 1, 1, bochs_bios_write, NULL);
B
bellard 已提交
496
    register_ioport_write(0x8900, 1, 1, bochs_bios_write, NULL);
B
bellard 已提交
497 498 499 500 501

    register_ioport_write(0x501, 1, 2, bochs_bios_write, NULL);
    register_ioport_write(0x502, 1, 2, bochs_bios_write, NULL);
    register_ioport_write(0x500, 1, 1, bochs_bios_write, NULL);
    register_ioport_write(0x503, 1, 1, bochs_bios_write, NULL);
502 503

    fw_cfg = fw_cfg_init(BIOS_CFG_IOPORT, BIOS_CFG_IOPORT + 1, 0, 0);
A
Alexander Graf 已提交
504

505
    fw_cfg_add_i32(fw_cfg, FW_CFG_ID, 1);
506
    fw_cfg_add_i64(fw_cfg, FW_CFG_RAM_SIZE, (uint64_t)ram_size);
507 508
    fw_cfg_add_bytes(fw_cfg, FW_CFG_ACPI_TABLES, (uint8_t *)acpi_tables,
                     acpi_tables_len);
J
Jes Sorensen 已提交
509
    fw_cfg_add_bytes(fw_cfg, FW_CFG_IRQ0_OVERRIDE, &irq0override, 1);
510 511 512 513 514

    smbios_table = smbios_get_table(&smbios_len);
    if (smbios_table)
        fw_cfg_add_bytes(fw_cfg, FW_CFG_SMBIOS_ENTRIES,
                         smbios_table, smbios_len);
J
Jes Sorensen 已提交
515 516
    fw_cfg_add_bytes(fw_cfg, FW_CFG_E820_TABLE, (uint8_t *)&e820_table,
                     sizeof(struct e820_table));
517

518 519
    fw_cfg_add_bytes(fw_cfg, FW_CFG_HPET, (uint8_t *)&hpet_cfg,
                     sizeof(struct hpet_fw_config));
520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538
    /* allocate memory for the NUMA channel: one (64bit) word for the number
     * of nodes, one word for each VCPU->node and one word for each node to
     * hold the amount of memory.
     */
    numa_fw_cfg = qemu_mallocz((1 + smp_cpus + nb_numa_nodes) * 8);
    numa_fw_cfg[0] = cpu_to_le64(nb_numa_nodes);
    for (i = 0; i < smp_cpus; i++) {
        for (j = 0; j < nb_numa_nodes; j++) {
            if (node_cpumask[j] & (1 << i)) {
                numa_fw_cfg[i + 1] = cpu_to_le64(j);
                break;
            }
        }
    }
    for (i = 0; i < nb_numa_nodes; i++) {
        numa_fw_cfg[smp_cpus + 1 + i] = cpu_to_le64(node_mem[i]);
    }
    fw_cfg_add_bytes(fw_cfg, FW_CFG_NUMA, (uint8_t *)numa_fw_cfg,
                     (1 + smp_cpus + nb_numa_nodes) * 8);
A
Alexander Graf 已提交
539 540

    return fw_cfg;
B
bellard 已提交
541 542
}

T
ths 已提交
543 544 545 546 547 548 549 550 551 552 553 554 555 556
/*
 * Return the size of the open file f as reported by ftell() at its end.
 * The current file position is saved first and restored afterwards.
 */
static long get_file_size(FILE *f)
{
    /* XXX: on Unix systems, using fstat() probably makes more sense */
    const long saved_pos = ftell(f);
    long end_pos;

    fseek(f, 0, SEEK_END);
    end_pos = ftell(f);
    fseek(f, saved_pos, SEEK_SET);

    return end_pos;
}

A
Alexander Graf 已提交
557
static void load_linux(void *fw_cfg,
558
                       const char *kernel_filename,
T
ths 已提交
559
		       const char *initrd_filename,
G
Glauber Costa 已提交
560
		       const char *kernel_cmdline,
561
                       target_phys_addr_t max_ram_size)
T
ths 已提交
562 563
{
    uint16_t protocol;
P
Paul Brook 已提交
564
    int setup_size, kernel_size, initrd_size = 0, cmdline_size;
T
ths 已提交
565
    uint32_t initrd_max;
566
    uint8_t header[8192], *setup, *kernel, *initrd_data;
A
Anthony Liguori 已提交
567
    target_phys_addr_t real_addr, prot_addr, cmdline_addr, initrd_addr = 0;
568
    FILE *f;
P
Pascal Terjan 已提交
569
    char *vmode;
T
ths 已提交
570 571 572 573 574 575 576

    /* Align to 16 bytes as a paranoia measure */
    cmdline_size = (strlen(kernel_cmdline)+16) & ~15;

    /* load the kernel header */
    f = fopen(kernel_filename, "rb");
    if (!f || !(kernel_size = get_file_size(f)) ||
A
Alexander Graf 已提交
577 578
	fread(header, 1, MIN(ARRAY_SIZE(header), kernel_size), f) !=
	MIN(ARRAY_SIZE(header), kernel_size)) {
579 580
	fprintf(stderr, "qemu: could not load kernel '%s': %s\n",
		kernel_filename, strerror(errno));
T
ths 已提交
581 582 583 584
	exit(1);
    }

    /* kernel protocol version */
B
bellard 已提交
585
#if 0
T
ths 已提交
586
    fprintf(stderr, "header magic: %#x\n", ldl_p(header+0x202));
B
bellard 已提交
587
#endif
T
ths 已提交
588 589
    if (ldl_p(header+0x202) == 0x53726448)
	protocol = lduw_p(header+0x206);
A
Alexander Graf 已提交
590 591 592
    else {
	/* This looks like a multiboot kernel. If it is, let's stop
	   treating it like a Linux kernel. */
593 594
        if (load_multiboot(fw_cfg, f, kernel_filename, initrd_filename,
                           kernel_cmdline, kernel_size, header))
B
Blue Swirl 已提交
595
            return;
T
ths 已提交
596
	protocol = 0;
A
Alexander Graf 已提交
597
    }
T
ths 已提交
598 599 600

    if (protocol < 0x200 || !(header[0x211] & 0x01)) {
	/* Low kernel */
601 602 603
	real_addr    = 0x90000;
	cmdline_addr = 0x9a000 - cmdline_size;
	prot_addr    = 0x10000;
T
ths 已提交
604 605
    } else if (protocol < 0x202) {
	/* High but ancient kernel */
606 607 608
	real_addr    = 0x90000;
	cmdline_addr = 0x9a000 - cmdline_size;
	prot_addr    = 0x100000;
T
ths 已提交
609 610
    } else {
	/* High and recent kernel */
611 612 613
	real_addr    = 0x10000;
	cmdline_addr = 0x20000;
	prot_addr    = 0x100000;
T
ths 已提交
614 615
    }

B
bellard 已提交
616
#if 0
T
ths 已提交
617
    fprintf(stderr,
618 619 620
	    "qemu: real_addr     = 0x" TARGET_FMT_plx "\n"
	    "qemu: cmdline_addr  = 0x" TARGET_FMT_plx "\n"
	    "qemu: prot_addr     = 0x" TARGET_FMT_plx "\n",
621 622 623
	    real_addr,
	    cmdline_addr,
	    prot_addr);
B
bellard 已提交
624
#endif
T
ths 已提交
625 626 627 628 629 630 631

    /* highest address for loading the initrd */
    if (protocol >= 0x203)
	initrd_max = ldl_p(header+0x22c);
    else
	initrd_max = 0x37ffffff;

G
Glauber Costa 已提交
632 633
    if (initrd_max >= max_ram_size-ACPI_DATA_SIZE)
    	initrd_max = max_ram_size-ACPI_DATA_SIZE-1;
T
ths 已提交
634

635 636 637 638 639
    fw_cfg_add_i32(fw_cfg, FW_CFG_CMDLINE_ADDR, cmdline_addr);
    fw_cfg_add_i32(fw_cfg, FW_CFG_CMDLINE_SIZE, strlen(kernel_cmdline)+1);
    fw_cfg_add_bytes(fw_cfg, FW_CFG_CMDLINE_DATA,
                     (uint8_t*)strdup(kernel_cmdline),
                     strlen(kernel_cmdline)+1);
T
ths 已提交
640 641

    if (protocol >= 0x202) {
642
	stl_p(header+0x228, cmdline_addr);
T
ths 已提交
643 644 645 646 647
    } else {
	stw_p(header+0x20, 0xA33F);
	stw_p(header+0x22, cmdline_addr-real_addr);
    }

P
Pascal Terjan 已提交
648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665
    /* handle vga= parameter */
    vmode = strstr(kernel_cmdline, "vga=");
    if (vmode) {
        unsigned int video_mode;
        /* skip "vga=" */
        vmode += 4;
        if (!strncmp(vmode, "normal", 6)) {
            video_mode = 0xffff;
        } else if (!strncmp(vmode, "ext", 3)) {
            video_mode = 0xfffe;
        } else if (!strncmp(vmode, "ask", 3)) {
            video_mode = 0xfffd;
        } else {
            video_mode = strtol(vmode, NULL, 0);
        }
        stw_p(header+0x1fa, video_mode);
    }

T
ths 已提交
666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685
    /* loader type */
    /* High nybble = B reserved for Qemu; low nybble is revision number.
       If this code is substantially changed, you may want to consider
       incrementing the revision. */
    if (protocol >= 0x200)
	header[0x210] = 0xB0;

    /* heap */
    if (protocol >= 0x201) {
	header[0x211] |= 0x80;	/* CAN_USE_HEAP */
	stw_p(header+0x224, cmdline_addr-real_addr-0x200);
    }

    /* load initrd */
    if (initrd_filename) {
	if (protocol < 0x200) {
	    fprintf(stderr, "qemu: linux kernel too old to load a ram disk\n");
	    exit(1);
	}

686
	initrd_size = get_image_size(initrd_filename);
M
M. Mohan Kumar 已提交
687 688 689 690 691 692
        if (initrd_size < 0) {
            fprintf(stderr, "qemu: error reading initrd %s\n",
                    initrd_filename);
            exit(1);
        }

693
        initrd_addr = (initrd_max-initrd_size) & ~4095;
694 695 696 697 698 699 700

        initrd_data = qemu_malloc(initrd_size);
        load_image(initrd_filename, initrd_data);

        fw_cfg_add_i32(fw_cfg, FW_CFG_INITRD_ADDR, initrd_addr);
        fw_cfg_add_i32(fw_cfg, FW_CFG_INITRD_SIZE, initrd_size);
        fw_cfg_add_bytes(fw_cfg, FW_CFG_INITRD_DATA, initrd_data, initrd_size);
T
ths 已提交
701

702
	stl_p(header+0x218, initrd_addr);
T
ths 已提交
703 704 705
	stl_p(header+0x21c, initrd_size);
    }

706
    /* load kernel and setup */
T
ths 已提交
707 708 709 710
    setup_size = header[0x1f1];
    if (setup_size == 0)
	setup_size = 4;
    setup_size = (setup_size+1)*512;
711
    kernel_size -= setup_size;
T
ths 已提交
712

713 714 715
    setup  = qemu_malloc(setup_size);
    kernel = qemu_malloc(kernel_size);
    fseek(f, 0, SEEK_SET);
716 717 718 719 720 721 722 723
    if (fread(setup, 1, setup_size, f) != setup_size) {
        fprintf(stderr, "fread() failed\n");
        exit(1);
    }
    if (fread(kernel, 1, kernel_size, f) != kernel_size) {
        fprintf(stderr, "fread() failed\n");
        exit(1);
    }
T
ths 已提交
724
    fclose(f);
725
    memcpy(setup, header, MIN(sizeof(header), setup_size));
726 727 728 729 730 731 732 733 734 735 736

    fw_cfg_add_i32(fw_cfg, FW_CFG_KERNEL_ADDR, prot_addr);
    fw_cfg_add_i32(fw_cfg, FW_CFG_KERNEL_SIZE, kernel_size);
    fw_cfg_add_bytes(fw_cfg, FW_CFG_KERNEL_DATA, kernel, kernel_size);

    fw_cfg_add_i32(fw_cfg, FW_CFG_SETUP_ADDR, real_addr);
    fw_cfg_add_i32(fw_cfg, FW_CFG_SETUP_SIZE, setup_size);
    fw_cfg_add_bytes(fw_cfg, FW_CFG_SETUP_DATA, setup, setup_size);

    option_rom[nb_option_roms] = "linuxboot.bin";
    nb_option_roms++;
T
ths 已提交
737 738
}

B
bellard 已提交
739 740
#define NE2000_NB_MAX 6

B
Blue Swirl 已提交
741 742 743
/*
 * I/O base and IRQ for each ISA NE2000 card; pc_init_ne2k_isa() uses the
 * entries in order, one pair per card.
 */
static const int ne2000_io[NE2000_NB_MAX] = { 0x300, 0x320, 0x340, 0x360,
                                              0x280, 0x380 };
static const int ne2000_irq[NE2000_NB_MAX] = { 9, 10, 11, 3, 4, 5 };
B
bellard 已提交
744

B
Blue Swirl 已提交
745 746
/* I/O base and IRQ per parallel port index (all ports use IRQ 7). */
static const int parallel_io[MAX_PARALLEL_PORTS] = { 0x378, 0x278, 0x3bc };
static const int parallel_irq[MAX_PARALLEL_PORTS] = { 7, 7, 7 };
747

748
/*
 * Initialize every enabled sound device from the soundhw table.
 *
 * pci_bus: PCI bus for PCI sound devices; when NULL, PCI devices are
 *          silently skipped
 * pic:     interrupt lines handed to ISA sound devices
 *
 * The table is walked until the entry whose name is NULL.
 */
void pc_audio_init (PCIBus *pci_bus, qemu_irq *pic)
{
    struct soundhw *c;

    for (c = soundhw; c->name; ++c) {
        if (c->enabled) {
            if (c->isa) {
                c->init.init_isa(pic);
            } else {
                if (pci_bus) {
                    c->init.init_pci(pci_bus);
                }
            }
        }
    }
}

765
/*
 * Create the next ISA NE2000 card for nd, using the next free I/O base
 * and IRQ pair from ne2000_io[] / ne2000_irq[].  Once NE2000_NB_MAX cards
 * exist, further calls do nothing.
 */
void pc_init_ne2k_isa(NICInfo *nd)
{
    /* number of cards created so far */
    static int nb_ne2k = 0;

    if (nb_ne2k == NE2000_NB_MAX) {
        return;
    }
    isa_ne2000_init(ne2000_io[nb_ne2k],
                    ne2000_irq[nb_ne2k], nd);
    nb_ne2k++;
}

G
Gleb Natapov 已提交
776 777
/* Return non-zero when env is the bootstrap processor (BSP). */
int cpu_is_bsp(CPUState *env)
{
    /* We hard-wire the BSP to the first CPU. */
    return env->cpu_index == 0;
}

B
Blue Swirl 已提交
782
DeviceState *cpu_get_current_apic(void)
783 784 785 786 787 788 789 790
{
    if (cpu_single_env) {
        return cpu_single_env->apic_state;
    } else {
        return NULL;
    }
}

B
Blue Swirl 已提交
791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816
/*
 * Create and initialize an "apic" device for one CPU.
 *
 * env:     CPU state, stored in the device's "cpu_env" property
 * apic_id: value for the device's "id" property
 *
 * Only the first APIC created gets its MMIO region mapped (at
 * MSI_ADDR_BASE).  msix_supported is set to 1 on every call.
 * Returns the new device.
 */
static DeviceState *apic_init(void *env, uint8_t apic_id)
{
    static int apic_mapped;
    DeviceState *apic_dev = qdev_create(NULL, "apic");
    SysBusDevice *sbd;

    qdev_prop_set_uint8(apic_dev, "id", apic_id);
    qdev_prop_set_ptr(apic_dev, "cpu_env", env);
    qdev_init_nofail(apic_dev);
    sbd = sysbus_from_qdev(apic_dev);

    /* XXX: mapping more APICs at the same memory location */
    if (!apic_mapped) {
        /* NOTE: the APIC is directly connected to the CPU - it is not
           on the global memory bus. */
        /* XXX: what if the base changes? */
        sysbus_mmio_map(sbd, 0, MSI_ADDR_BASE);
        apic_mapped = 1;
    }

    msix_supported = 1;

    return apic_dev;
}

B
Blue Swirl 已提交
817 818
/* set CMOS shutdown status register (index 0xF) as S3_resume(0xFE)
   BIOS will read it and start S3 resume at POST Entry */
819
void pc_cmos_set_s3_resume(void *opaque, int irq, int level)
B
Blue Swirl 已提交
820
{
821
    ISADevice *s = opaque;
B
Blue Swirl 已提交
822 823 824 825 826 827

    if (level) {
        rtc_set_memory(s, 0xF, 0xFE);
    }
}

828
void pc_acpi_smi_interrupt(void *opaque, int irq, int level)
B
Blue Swirl 已提交
829 830 831 832 833 834 835 836
{
    CPUState *s = opaque;

    if (level) {
        cpu_interrupt(s, CPU_INTERRUPT_SMI);
    }
}

J
Jan Kiszka 已提交
837
static void pc_cpu_reset(void *opaque)
838 839 840 841
{
    CPUState *env = opaque;

    cpu_reset(env);
J
Jan Kiszka 已提交
842
    env->halted = !cpu_is_bsp(env);
843 844
}

J
Jan Kiszka 已提交
845 846 847 848 849 850 851 852 853 854 855
static CPUState *pc_new_cpu(const char *cpu_model)
{
    CPUState *env;

    env = cpu_init(cpu_model);
    if (!env) {
        fprintf(stderr, "Unable to find x86 CPU definition\n");
        exit(1);
    }
    if ((env->cpuid_features & CPUID_APIC) || smp_cpus > 1) {
        env->cpuid_apic_id = env->cpu_index;
856 857
        env->apic_state = apic_init(env, env->cpuid_apic_id);
    }
J
Jan Kiszka 已提交
858 859
    qemu_register_reset(pc_cpu_reset, env);
    pc_cpu_reset(env);
J
Jan Kiszka 已提交
860 861 862
    return env;
}

863
void pc_cpus_init(const char *cpu_model)
864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880
{
    int i;

    /* init CPUs */
    if (cpu_model == NULL) {
#ifdef TARGET_X86_64
        cpu_model = "qemu64";
#else
        cpu_model = "qemu32";
#endif
    }

    for(i = 0; i < smp_cpus; i++) {
        pc_new_cpu(cpu_model);
    }
}

881 882 883 884 885 886
/*
 * Allocate and map guest RAM, load the PC BIOS, set up the option ROM
 * area and the firmware configuration device, and optionally prepare a
 * direct Linux kernel boot.
 *
 * ram_size:            total amount of guest RAM requested.
 * kernel_filename:     kernel image for direct boot, or NULL for none.
 * kernel_cmdline:      passed through to load_linux().
 * initrd_filename:     passed through to load_linux().
 * below_4g_mem_size_p: out; receives the part of ram_size that is mapped
 *                      starting at guest physical address 0.
 * above_4g_mem_size_p: out; receives the part of ram_size that is mapped
 *                      starting at 0x100000000 (0 if there is none).
 *
 * If the BIOS image cannot be found, has a size that is not a positive
 * multiple of 64 KiB, or cannot be added as a ROM, an error is printed to
 * stderr and the process exits with status 1.
 */
void pc_memory_init(ram_addr_t ram_size,
                    const char *kernel_filename,
                    const char *kernel_cmdline,
                    const char *initrd_filename,
                    ram_addr_t *below_4g_mem_size_p,
                    ram_addr_t *above_4g_mem_size_p)
{
    char *filename;
    int ret, linux_boot, i;
    ram_addr_t ram_addr, bios_offset, option_rom_offset;
    ram_addr_t below_4g_mem_size, above_4g_mem_size = 0;
    int bios_size, isa_bios_size;
    void *fw_cfg;

    /*
     * RAM from 0xe0000000 upwards is not mapped below 4 GiB; the excess is
     * accounted as "above 4G" memory instead.
     */
    if (ram_size >= 0xe0000000) {
        above_4g_mem_size = ram_size - 0xe0000000;
        below_4g_mem_size = 0xe0000000;
    } else {
        below_4g_mem_size = ram_size;
    }
    *above_4g_mem_size_p = above_4g_mem_size;
    *below_4g_mem_size_p = below_4g_mem_size;

#if TARGET_PHYS_ADDR_BITS == 32
    if (above_4g_mem_size > 0) {
        hw_error("Too much RAM for 32-bit physical address");
    }
#endif
    linux_boot = (kernel_filename != NULL);

    /* allocate RAM */
    ram_addr = qemu_ram_alloc(below_4g_mem_size + above_4g_mem_size);
    /* [0, 0xa0000) and [0x100000, below_4g_mem_size) are backed by RAM */
    cpu_register_physical_memory(0, 0xa0000, ram_addr);
    /*
     * NOTE(review): the size below assumes below_4g_mem_size >= 0x100000;
     * confirm that callers never pass a smaller ram_size.
     */
    cpu_register_physical_memory(0x100000,
                 below_4g_mem_size - 0x100000,
                 ram_addr + 0x100000);
#if TARGET_PHYS_ADDR_BITS > 32
    cpu_register_physical_memory(0x100000000ULL, above_4g_mem_size,
                                 ram_addr + below_4g_mem_size);
#endif

    /* BIOS load */
    if (bios_name == NULL)
        bios_name = BIOS_FILENAME;
    filename = qemu_find_file(QEMU_FILE_TYPE_BIOS, bios_name);
    if (filename) {
        bios_size = get_image_size(filename);
    } else {
        bios_size = -1;
    }
    /* the image must exist and be a whole number of 64 KiB units */
    if (bios_size <= 0 ||
        (bios_size % 65536) != 0) {
        goto bios_error;
    }
    bios_offset = qemu_ram_alloc(bios_size);
    /* (uint32_t)(-bios_size) places the image so it ends at the 4 GiB mark */
    ret = rom_add_file_fixed(bios_name, (uint32_t)(-bios_size));
    if (ret != 0) {
    bios_error:
        fprintf(stderr, "qemu: could not load PC BIOS '%s'\n", bios_name);
        exit(1);
    }
    if (filename) {
        qemu_free(filename);
    }
    /* map the last 128KB of the BIOS in ISA space */
    isa_bios_size = bios_size;
    if (isa_bios_size > (128 * 1024))
        isa_bios_size = 128 * 1024;
    cpu_register_physical_memory(0x100000 - isa_bios_size,
                                 isa_bios_size,
                                 (bios_offset + bios_size - isa_bios_size) | IO_MEM_ROM);

    /* backing storage for the option ROM window starting at PC_ROM_MIN_VGA */
    option_rom_offset = qemu_ram_alloc(PC_ROM_SIZE);
    cpu_register_physical_memory(PC_ROM_MIN_VGA, PC_ROM_SIZE, option_rom_offset);

    /* map all the bios at the top of memory */
    cpu_register_physical_memory((uint32_t)(-bios_size),
                                 bios_size, bios_offset | IO_MEM_ROM);

    fw_cfg = bochs_bios_init();
    rom_set_fw(fw_cfg);

    if (linux_boot) {
        load_linux(fw_cfg, kernel_filename, initrd_filename, kernel_cmdline, below_4g_mem_size);
    }

    for (i = 0; i < nb_option_roms; i++) {
        rom_add_option(option_rom[i]);
    }
}

972 973 974 975 976 977
/*
 * Allocate a single qemu_irq whose handler is pic_irq_request, with a NULL
 * opaque pointer, and return the array produced by qemu_allocate_irqs().
 */
qemu_irq *pc_allocate_cpu_irq(void)
{
    qemu_irq *cpu_irq;

    cpu_irq = qemu_allocate_irqs(pic_irq_request, NULL, 1);
    return cpu_irq;
}

/*
 * Instantiate the display adapter selected by the global
 * cirrus_vga_enabled / vmsvga_enabled / std_vga_enabled flags, which are
 * checked in that order; at most one adapter is created.
 *
 * pci_bus: PCI bus to attach the adapter to, or NULL.  With a NULL bus the
 *          ISA variant is created for Cirrus and standard VGA; for the
 *          VMware adapter only a message is printed to stderr and no
 *          device is created.
 *
 * If none of the flags is set, nothing is done.
 */
void pc_vga_init(PCIBus *pci_bus)
{
    if (cirrus_vga_enabled) {
        if (pci_bus) {
            pci_cirrus_vga_init(pci_bus);
        } else {
            isa_cirrus_vga_init();
        }
    } else if (vmsvga_enabled) {
        if (pci_bus) {
            pci_vmsvga_init(pci_bus);
        } else {
            /* no ISA fallback is attempted for this adapter */
            fprintf(stderr, "%s: vmware_vga: no PCI bus\n", __func__);
        }
    } else if (std_vga_enabled) {
        if (pci_bus) {
            pci_vga_init(pci_bus, 0, 0);
        } else {
            isa_vga_init();
        }
    }
}

B
Blue Swirl 已提交
999 1000 1001 1002 1003 1004 1005 1006 1007
/*
 * IRQ handler: when the line is raised (level != 0) and cpu_single_env is
 * non-NULL, call cpu_exit() on that CPU.  The opaque and irq arguments are
 * not used.
 */
static void cpu_request_exit(void *opaque, int irq, int level)
{
    CPUState *current = cpu_single_env;

    if (!level || current == NULL) {
        return;
    }

    cpu_exit(current);
}

1008 1009
void pc_basic_device_init(qemu_irq *isa_irq,
                          FDCtrl **floppy_controller,
1010
                          ISADevice **rtc_state)
1011 1012 1013 1014
{
    int i;
    DriveInfo *fd[MAX_FD];
    PITState *pit;
1015
    qemu_irq rtc_irq = NULL;
B
Blue Swirl 已提交
1016 1017
    qemu_irq *a20_line;
    ISADevice *i8042;
B
Blue Swirl 已提交
1018
    qemu_irq *cpu_exit_irq;
1019 1020 1021 1022 1023 1024

    register_ioport_write(0x80, 1, 1, ioport80_write, NULL);

    register_ioport_write(0xf0, 1, 1, ioportF0_write, NULL);

    if (!no_hpet) {
J
Jan Kiszka 已提交
1025 1026 1027 1028 1029
        DeviceState *hpet = sysbus_create_simple("hpet", HPET_BASE, NULL);

        for (i = 0; i < 24; i++) {
            sysbus_connect_irq(sysbus_from_qdev(hpet), i, isa_irq[i]);
        }
1030
        rtc_irq = qdev_get_gpio_in(hpet, 0);
1031
    }
1032 1033 1034 1035 1036 1037
    *rtc_state = rtc_init(2000, rtc_irq);

    qemu_register_boot_set(pc_boot_set, *rtc_state);

    pit = pit_init(0x40, isa_reserve_irq(0));
    pcspk_init(pit);
1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050

    for(i = 0; i < MAX_SERIAL_PORTS; i++) {
        if (serial_hds[i]) {
            serial_isa_init(i, serial_hds[i]);
        }
    }

    for(i = 0; i < MAX_PARALLEL_PORTS; i++) {
        if (parallel_hds[i]) {
            parallel_init(i, parallel_hds[i]);
        }
    }

B
Blue Swirl 已提交
1051 1052 1053 1054 1055
    a20_line = qemu_allocate_irqs(handle_a20_line_change, first_cpu, 1);
    i8042 = isa_create_simple("i8042");
    i8042_setup_a20_line(i8042, a20_line);
    vmmouse_init(i8042);

B
Blue Swirl 已提交
1056 1057
    cpu_exit_irq = qemu_allocate_irqs(cpu_request_exit, NULL, 1);
    DMA_init(0, cpu_exit_irq);
1058 1059 1060 1061 1062 1063 1064

    for(i = 0; i < MAX_FD; i++) {
        fd[i] = drive_get(IF_FLOPPY, 0, i);
    }
    *floppy_controller = fdctrl_init_isa(fd);
}

1065
/*
 * Create one "lsi53c895a" PCI device for every SCSI bus index from 0 up to
 * and including the value returned by drive_get_max_bus(IF_SCSI).
 *
 * pci_bus: PCI bus the devices are created on.
 *
 * If drive_get_max_bus() returns a negative value the loop body never
 * runs and no device is created.
 */
void pc_pci_device_init(PCIBus *pci_bus)
{
    int max_bus;
    int bus;

    max_bus = drive_get_max_bus(IF_SCSI);
    for (bus = 0; bus <= max_bus; bus++) {
        /* NOTE(review): devfn -1 presumably requests automatic slot
         * assignment -- confirm against pci_create_simple() */
        pci_create_simple(pci_bus, -1, "lsi53c895a");
    }
}