pci.c 69.4 KB
Newer Older
B
bellard 已提交
1 2 3 4
/*
 * QEMU PCI bus manager
 *
 * Copyright (c) 2004 Fabrice Bellard
5
 *
B
bellard 已提交
6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
24 25 26
#include "hw/hw.h"
#include "hw/pci/pci.h"
#include "hw/pci/pci_bridge.h"
27
#include "hw/pci/pci_bus.h"
28
#include "hw/pci/pci_host.h"
29
#include "monitor/monitor.h"
P
Paolo Bonzini 已提交
30
#include "net/net.h"
31
#include "sysemu/sysemu.h"
32
#include "hw/loader.h"
33
#include "qemu/range.h"
L
Luiz Capitulino 已提交
34
#include "qmp-commands.h"
35 36
#include "hw/pci/msi.h"
#include "hw/pci/msix.h"
37
#include "exec/address-spaces.h"
B
bellard 已提交
38 39

//#define DEBUG_PCI
40
#ifdef DEBUG_PCI
41
# define PCI_DPRINTF(format, ...)       printf(format, ## __VA_ARGS__)
42 43 44
#else
# define PCI_DPRINTF(format, ...)       do { } while (0)
#endif
B
bellard 已提交
45

46
static void pcibus_dev_print(Monitor *mon, DeviceState *dev, int indent);
47
static char *pcibus_get_dev_path(DeviceState *dev);
48
static char *pcibus_get_fw_dev_path(DeviceState *dev);
49
static int pcibus_reset(BusState *qbus);
50
static void pci_bus_finalize(Object *obj);
51

52 53 54 55 56 57 58 59 60 61 62
static Property pci_props[] = {
    DEFINE_PROP_PCI_DEVFN("addr", PCIDevice, devfn, -1),
    DEFINE_PROP_STRING("romfile", PCIDevice, romfile),
    DEFINE_PROP_UINT32("rombar",  PCIDevice, rom_bar, 1),
    DEFINE_PROP_BIT("multifunction", PCIDevice, cap_present,
                    QEMU_PCI_CAP_MULTIFUNCTION_BITNR, false),
    DEFINE_PROP_BIT("command_serr_enable", PCIDevice, cap_present,
                    QEMU_PCI_CAP_SERR_BITNR, true),
    DEFINE_PROP_END_OF_LIST()
};

63 64 65 66 67 68 69 70 71 72 73 74 75 76
static void pci_bus_class_init(ObjectClass *klass, void *data)
{
    BusClass *k = BUS_CLASS(klass);

    k->print_dev = pcibus_dev_print;
    k->get_dev_path = pcibus_get_dev_path;
    k->get_fw_dev_path = pcibus_get_fw_dev_path;
    k->reset = pcibus_reset;
}

static const TypeInfo pci_bus_info = {
    .name = TYPE_PCI_BUS,
    .parent = TYPE_BUS,
    .instance_size = sizeof(PCIBus),
77
    .instance_finalize = pci_bus_finalize,
78
    .class_init = pci_bus_class_init,
79
};
B
bellard 已提交
80

81 82 83 84 85
static const TypeInfo pcie_bus_info = {
    .name = TYPE_PCIE_BUS,
    .parent = TYPE_PCI_BUS,
};

86
static PCIBus *pci_find_bus_nr(PCIBus *bus, int bus_num);
B
bellard 已提交
87
static void pci_update_mappings(PCIDevice *d);
88
static void pci_irq_handler(void *opaque, int irq_num, int level);
89
static int pci_add_option_rom(PCIDevice *pdev, bool is_default_rom);
90
static void pci_del_option_rom(PCIDevice *pdev);
B
bellard 已提交
91

92 93
static uint16_t pci_default_sub_vendor_id = PCI_SUBVENDOR_ID_REDHAT_QUMRANET;
static uint16_t pci_default_sub_device_id = PCI_SUBDEVICE_ID_QEMU;
94

95
static QLIST_HEAD(, PCIHostState) pci_host_bridges;
96

J
Juan Quintela 已提交
97 98 99 100 101 102 103
static const VMStateDescription vmstate_pcibus = {
    .name = "PCIBUS",
    .version_id = 1,
    .minimum_version_id = 1,
    .minimum_version_id_old = 1,
    .fields      = (VMStateField []) {
        VMSTATE_INT32_EQUAL(nirq, PCIBus),
104
        VMSTATE_VARRAY_INT32(irq_count, PCIBus, nirq, 0, vmstate_info_int32, int32_t),
J
Juan Quintela 已提交
105
        VMSTATE_END_OF_LIST()
106
    }
J
Juan Quintela 已提交
107
};
108
static int pci_bar(PCIDevice *d, int reg)
109
{
110 111 112 113 114 115 116
    uint8_t type;

    if (reg != PCI_ROM_SLOT)
        return PCI_BASE_ADDRESS_0 + reg * 4;

    type = d->config[PCI_HEADER_TYPE] & ~PCI_HEADER_TYPE_MULTI_FUNCTION;
    return type == PCI_HEADER_TYPE_BRIDGE ? PCI_ROM_ADDRESS1 : PCI_ROM_ADDRESS;
117 118
}

119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143
static inline int pci_irq_state(PCIDevice *d, int irq_num)
{
	return (d->irq_state >> irq_num) & 0x1;
}

static inline void pci_set_irq_state(PCIDevice *d, int irq_num, int level)
{
	d->irq_state &= ~(0x1 << irq_num);
	d->irq_state |= level << irq_num;
}

static void pci_change_irq_level(PCIDevice *pci_dev, int irq_num, int change)
{
    PCIBus *bus;
    for (;;) {
        bus = pci_dev->bus;
        irq_num = bus->map_irq(pci_dev, irq_num);
        if (bus->set_irq)
            break;
        pci_dev = bus->parent_dev;
    }
    bus->irq_count[irq_num] += change;
    bus->set_irq(bus->irq_opaque, irq_num, bus->irq_count[irq_num] != 0);
}

144 145 146 147 148 149 150
int pci_bus_get_irq_level(PCIBus *bus, int irq_num)
{
    assert(irq_num >= 0);
    assert(irq_num < bus->nirq);
    return !!bus->irq_count[irq_num];
}

151 152 153 154 155 156 157 158 159 160 161
/* Update interrupt status bit in config space on interrupt
 * state change. */
static void pci_update_irq_status(PCIDevice *dev)
{
    if (dev->irq_state) {
        dev->config[PCI_STATUS] |= PCI_STATUS_INTERRUPT;
    } else {
        dev->config[PCI_STATUS] &= ~PCI_STATUS_INTERRUPT;
    }
}

I
Isaku Yamahata 已提交
162 163 164 165
void pci_device_deassert_intx(PCIDevice *dev)
{
    int i;
    for (i = 0; i < PCI_NUM_PINS; ++i) {
166
        pci_irq_handler(dev, i, 0);
I
Isaku Yamahata 已提交
167 168 169
    }
}

I
Isaku Yamahata 已提交
170 171 172 173 174
/*
 * This function is called on #RST and FLR.
 * FLR if PCI_EXP_DEVCTL_BCR_FLR is set
 */
void pci_device_reset(PCIDevice *dev)
175
{
176
    int r;
177 178

    qdev_reset_all(&dev->qdev);
179

180
    dev->irq_state = 0;
181
    pci_update_irq_status(dev);
I
Isaku Yamahata 已提交
182
    pci_device_deassert_intx(dev);
S
Stefan Weil 已提交
183
    /* Clear all writable bits */
184
    pci_word_test_and_clear_mask(dev->config + PCI_COMMAND,
185 186
                                 pci_get_word(dev->wmask + PCI_COMMAND) |
                                 pci_get_word(dev->w1cmask + PCI_COMMAND));
187 188 189
    pci_word_test_and_clear_mask(dev->config + PCI_STATUS,
                                 pci_get_word(dev->wmask + PCI_STATUS) |
                                 pci_get_word(dev->w1cmask + PCI_STATUS));
190 191 192
    dev->config[PCI_CACHE_LINE_SIZE] = 0x0;
    dev->config[PCI_INTERRUPT_LINE] = 0x0;
    for (r = 0; r < PCI_NUM_REGIONS; ++r) {
I
Isaku Yamahata 已提交
193 194
        PCIIORegion *region = &dev->io_regions[r];
        if (!region->size) {
195 196
            continue;
        }
I
Isaku Yamahata 已提交
197 198 199 200 201 202 203

        if (!(region->type & PCI_BASE_ADDRESS_SPACE_IO) &&
            region->type & PCI_BASE_ADDRESS_MEM_TYPE_64) {
            pci_set_quad(dev->config + pci_bar(dev, r), region->type);
        } else {
            pci_set_long(dev->config + pci_bar(dev, r), region->type);
        }
204 205
    }
    pci_update_mappings(dev);
206 207 208

    msi_reset(dev);
    msix_reset(dev);
209 210
}

211 212 213 214
/*
 * Trigger pci bus reset under a given bus.
 * To be called on RST# assert.
 */
P
Paolo Bonzini 已提交
215
static int pcibus_reset(BusState *qbus)
G
Gleb Natapov 已提交
216
{
P
Paolo Bonzini 已提交
217
    PCIBus *bus = DO_UPCAST(PCIBus, qbus, qbus);
G
Gleb Natapov 已提交
218 219
    int i;

220 221 222 223
    for (i = 0; i < ARRAY_SIZE(bus->devices); ++i) {
        if (bus->devices[i]) {
            pci_device_reset(bus->devices[i]);
        }
G
Gleb Natapov 已提交
224
    }
225

P
Paolo Bonzini 已提交
226 227 228 229
    for (i = 0; i < bus->nirq; i++) {
        assert(bus->irq_count[i] == 0);
    }

230 231 232 233 234
    /* topology traverse is done by pci_bus_reset().
       Tell qbus/qdev walker not to traverse the tree */
    return 1;
}

235
static void pci_host_bus_register(PCIBus *bus, DeviceState *parent)
236
{
237 238 239
    PCIHostState *host_bridge = PCI_HOST_BRIDGE(parent);

    QLIST_INSERT_HEAD(&pci_host_bridges, host_bridge, next);
240 241
}

D
David Gibson 已提交
242
PCIBus *pci_find_primary_bus(void)
243
{
244
    PCIBus *primary_bus = NULL;
245
    PCIHostState *host;
246

247
    QLIST_FOREACH(host, &pci_host_bridges, next) {
248 249 250
        if (primary_bus) {
            /* We have multiple root buses, refuse to select a primary */
            return NULL;
251
        }
252
        primary_bus = host->bus;
253 254
    }

255
    return primary_bus;
256 257
}

258
PCIBus *pci_device_root_bus(const PCIDevice *d)
259
{
260
    PCIBus *bus = d->bus;
261 262 263 264 265

    while ((d = bus->parent_dev) != NULL) {
        bus = d->bus;
    }

266 267 268
    return bus;
}

269
const char *pci_root_bus_path(PCIDevice *dev)
270
{
271 272 273
    PCIBus *rootbus = pci_device_root_bus(dev);
    PCIHostState *host_bridge = PCI_HOST_BRIDGE(rootbus->qbus.parent);
    PCIHostBridgeClass *hc = PCI_HOST_BRIDGE_GET_CLASS(host_bridge);
274

275 276 277 278 279
    assert(!rootbus->parent_dev);
    assert(host_bridge->bus == rootbus);

    if (hc->root_bus_path) {
        return (*hc->root_bus_path)(host_bridge, rootbus);
280 281
    }

282
    return rootbus->qbus.name;
283 284
}

285
static void pci_bus_init(PCIBus *bus, DeviceState *parent,
286
                         const char *name,
287 288
                         MemoryRegion *address_space_mem,
                         MemoryRegion *address_space_io,
289
                         uint8_t devfn_min)
290
{
291
    assert(PCI_FUNC(devfn_min) == 0);
P
pbrook 已提交
292
    bus->devfn_min = devfn_min;
293 294
    bus->address_space_mem = address_space_mem;
    bus->address_space_io = address_space_io;
295 296 297

    /* host bridge */
    QLIST_INIT(&bus->child);
298

299
    pci_host_bus_register(bus, parent);
300

A
Alex Williamson 已提交
301
    vmstate_register(NULL, -1, &vmstate_pcibus, bus);
302 303
}

304 305 306 307 308
bool pci_bus_is_express(PCIBus *bus)
{
    return object_dynamic_cast(OBJECT(bus), TYPE_PCIE_BUS);
}

309 310 311 312 313
bool pci_bus_is_root(PCIBus *bus)
{
    return !bus->parent_dev;
}

314
void pci_bus_new_inplace(PCIBus *bus, size_t bus_size, DeviceState *parent,
315 316 317
                         const char *name,
                         MemoryRegion *address_space_mem,
                         MemoryRegion *address_space_io,
318
                         uint8_t devfn_min, const char *typename)
319
{
320
    qbus_create_inplace(bus, bus_size, typename, parent, name);
321 322 323 324
    pci_bus_init(bus, parent, name, address_space_mem,
                 address_space_io, devfn_min);
}

325
PCIBus *pci_bus_new(DeviceState *parent, const char *name,
326 327
                    MemoryRegion *address_space_mem,
                    MemoryRegion *address_space_io,
328
                    uint8_t devfn_min, const char *typename)
329 330 331
{
    PCIBus *bus;

332
    bus = PCI_BUS(qbus_create(typename, parent, name));
333 334
    pci_bus_init(bus, parent, name, address_space_mem,
                 address_space_io, devfn_min);
335 336 337 338 339 340 341 342 343 344
    return bus;
}

void pci_bus_irqs(PCIBus *bus, pci_set_irq_fn set_irq, pci_map_irq_fn map_irq,
                  void *irq_opaque, int nirq)
{
    bus->set_irq = set_irq;
    bus->map_irq = map_irq;
    bus->irq_opaque = irq_opaque;
    bus->nirq = nirq;
345
    bus->irq_count = g_malloc0(nirq * sizeof(bus->irq_count[0]));
346 347
}

348
void pci_bus_hotplug(PCIBus *bus, pci_hotplug_fn hotplug, DeviceState *qdev)
G
Gerd Hoffmann 已提交
349 350 351
{
    bus->qbus.allow_hotplug = 1;
    bus->hotplug = hotplug;
352
    bus->hotplug_qdev = qdev;
G
Gerd Hoffmann 已提交
353 354
}

355 356
PCIBus *pci_register_bus(DeviceState *parent, const char *name,
                         pci_set_irq_fn set_irq, pci_map_irq_fn map_irq,
357
                         void *irq_opaque,
358 359
                         MemoryRegion *address_space_mem,
                         MemoryRegion *address_space_io,
360
                         uint8_t devfn_min, int nirq, const char *typename)
361 362 363
{
    PCIBus *bus;

364
    bus = pci_bus_new(parent, name, address_space_mem,
365
                      address_space_io, devfn_min, typename);
366
    pci_bus_irqs(bus, set_irq, map_irq, irq_opaque, nirq);
367 368
    return bus;
}
B
bellard 已提交
369

P
pbrook 已提交
370 371
int pci_bus_num(PCIBus *s)
{
372
    if (pci_bus_is_root(s))
373 374
        return 0;       /* pci host bridge */
    return s->parent_dev->config[PCI_SECONDARY_BUS];
P
pbrook 已提交
375 376
}

377 378 379 380 381 382
static void pci_bus_finalize(Object *obj)
{
    PCIBus *bus = PCI_BUS(obj);
    vmstate_unregister(NULL, &vmstate_pcibus, bus);
}

J
Juan Quintela 已提交
383
static int get_pci_config_device(QEMUFile *f, void *pv, size_t size)
384
{
J
Juan Quintela 已提交
385
    PCIDevice *s = container_of(pv, PCIDevice, config);
386
    PCIDeviceClass *pc = PCI_DEVICE_GET_CLASS(s);
I
Isaku Yamahata 已提交
387
    uint8_t *config;
388 389
    int i;

I
Isaku Yamahata 已提交
390
    assert(size == pci_config_size(s));
391
    config = g_malloc(size);
I
Isaku Yamahata 已提交
392 393 394

    qemu_get_buffer(f, config, size);
    for (i = 0; i < size; ++i) {
395 396
        if ((config[i] ^ s->config[i]) &
            s->cmask[i] & ~s->wmask[i] & ~s->w1cmask[i]) {
397
            g_free(config);
398
            return -EINVAL;
I
Isaku Yamahata 已提交
399 400 401
        }
    }
    memcpy(s->config, config, size);
402

B
bellard 已提交
403
    pci_update_mappings(s);
404
    if (pc->is_bridge) {
405
        PCIBridge *b = PCI_BRIDGE(s);
406 407
        pci_bridge_update_mappings(b);
    }
408

G
Gerd Hoffmann 已提交
409 410 411 412
    memory_region_set_enabled(&s->bus_master_enable_region,
                              pci_get_word(s->config + PCI_COMMAND)
                              & PCI_COMMAND_MASTER);

413
    g_free(config);
414 415 416
    return 0;
}

J
Juan Quintela 已提交
417
/* just put buffer */
418
static void put_pci_config_device(QEMUFile *f, void *pv, size_t size)
J
Juan Quintela 已提交
419
{
420
    const uint8_t **v = pv;
I
Isaku Yamahata 已提交
421
    assert(size == pci_config_size(container_of(pv, PCIDevice, config)));
422
    qemu_put_buffer(f, *v, size);
J
Juan Quintela 已提交
423 424 425 426 427 428 429 430
}

static VMStateInfo vmstate_info_pci_config = {
    .name = "pci config",
    .get  = get_pci_config_device,
    .put  = put_pci_config_device,
};

431 432
static int get_pci_irq_state(QEMUFile *f, void *pv, size_t size)
{
433
    PCIDevice *s = container_of(pv, PCIDevice, irq_state);
434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454
    uint32_t irq_state[PCI_NUM_PINS];
    int i;
    for (i = 0; i < PCI_NUM_PINS; ++i) {
        irq_state[i] = qemu_get_be32(f);
        if (irq_state[i] != 0x1 && irq_state[i] != 0) {
            fprintf(stderr, "irq state %d: must be 0 or 1.\n",
                    irq_state[i]);
            return -EINVAL;
        }
    }

    for (i = 0; i < PCI_NUM_PINS; ++i) {
        pci_set_irq_state(s, i, irq_state[i]);
    }

    return 0;
}

static void put_pci_irq_state(QEMUFile *f, void *pv, size_t size)
{
    int i;
455
    PCIDevice *s = container_of(pv, PCIDevice, irq_state);
456 457 458 459 460 461 462 463 464 465 466 467

    for (i = 0; i < PCI_NUM_PINS; ++i) {
        qemu_put_be32(f, pci_irq_state(s, i));
    }
}

static VMStateInfo vmstate_info_pci_irq_state = {
    .name = "pci irq state",
    .get  = get_pci_irq_state,
    .put  = put_pci_irq_state,
};

J
Juan Quintela 已提交
468 469 470 471 472 473 474
const VMStateDescription vmstate_pci_device = {
    .name = "PCIDevice",
    .version_id = 2,
    .minimum_version_id = 1,
    .minimum_version_id_old = 1,
    .fields      = (VMStateField []) {
        VMSTATE_INT32_LE(version_id, PCIDevice),
I
Isaku Yamahata 已提交
475 476 477
        VMSTATE_BUFFER_UNSAFE_INFO(config, PCIDevice, 0,
                                   vmstate_info_pci_config,
                                   PCI_CONFIG_SPACE_SIZE),
478 479 480
        VMSTATE_BUFFER_UNSAFE_INFO(irq_state, PCIDevice, 2,
				   vmstate_info_pci_irq_state,
				   PCI_NUM_PINS * sizeof(int32_t)),
I
Isaku Yamahata 已提交
481 482 483 484 485
        VMSTATE_END_OF_LIST()
    }
};

const VMStateDescription vmstate_pcie_device = {
486
    .name = "PCIEDevice",
I
Isaku Yamahata 已提交
487 488 489 490 491 492 493 494
    .version_id = 2,
    .minimum_version_id = 1,
    .minimum_version_id_old = 1,
    .fields      = (VMStateField []) {
        VMSTATE_INT32_LE(version_id, PCIDevice),
        VMSTATE_BUFFER_UNSAFE_INFO(config, PCIDevice, 0,
                                   vmstate_info_pci_config,
                                   PCIE_CONFIG_SPACE_SIZE),
495 496 497
        VMSTATE_BUFFER_UNSAFE_INFO(irq_state, PCIDevice, 2,
				   vmstate_info_pci_irq_state,
				   PCI_NUM_PINS * sizeof(int32_t)),
J
Juan Quintela 已提交
498 499 500 501
        VMSTATE_END_OF_LIST()
    }
};

I
Isaku Yamahata 已提交
502 503 504 505 506
static inline const VMStateDescription *pci_get_vmstate(PCIDevice *s)
{
    return pci_is_express(s) ? &vmstate_pcie_device : &vmstate_pci_device;
}

J
Juan Quintela 已提交
507 508
void pci_device_save(PCIDevice *s, QEMUFile *f)
{
509 510 511 512 513
    /* Clear interrupt status bit: it is implicit
     * in irq_state which we are saving.
     * This makes us compatible with old devices
     * which never set or clear this bit. */
    s->config[PCI_STATUS] &= ~PCI_STATUS_INTERRUPT;
I
Isaku Yamahata 已提交
514
    vmstate_save_state(f, pci_get_vmstate(s), s);
515 516
    /* Restore the interrupt status bit. */
    pci_update_irq_status(s);
J
Juan Quintela 已提交
517 518 519 520
}

int pci_device_load(PCIDevice *s, QEMUFile *f)
{
521 522 523 524 525
    int ret;
    ret = vmstate_load_state(f, pci_get_vmstate(s), s, s->version_id);
    /* Restore the interrupt status bit. */
    pci_update_irq_status(s);
    return ret;
J
Juan Quintela 已提交
526 527
}

528
static void pci_set_default_subsystem_id(PCIDevice *pci_dev)
529
{
530 531 532 533
    pci_set_word(pci_dev->config + PCI_SUBSYSTEM_VENDOR_ID,
                 pci_default_sub_vendor_id);
    pci_set_word(pci_dev->config + PCI_SUBSYSTEM_ID,
                 pci_default_sub_device_id);
534 535
}

536
/*
537 538
 * Parse [[<domain>:]<bus>:]<slot>, return -1 on error if funcp == NULL
 *       [[<domain>:]<bus>:]<slot>.<func>, return -1 on error
539
 */
540
int pci_parse_devaddr(const char *addr, int *domp, int *busp,
541
                      unsigned int *slotp, unsigned int *funcp)
542 543 544 545 546
{
    const char *p;
    char *e;
    unsigned long val;
    unsigned long dom = 0, bus = 0;
547 548
    unsigned int slot = 0;
    unsigned int func = 0;
549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571

    p = addr;
    val = strtoul(p, &e, 16);
    if (e == p)
	return -1;
    if (*e == ':') {
	bus = val;
	p = e + 1;
	val = strtoul(p, &e, 16);
	if (e == p)
	    return -1;
	if (*e == ':') {
	    dom = bus;
	    bus = val;
	    p = e + 1;
	    val = strtoul(p, &e, 16);
	    if (e == p)
		return -1;
	}
    }

    slot = val;

572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587
    if (funcp != NULL) {
        if (*e != '.')
            return -1;

        p = e + 1;
        val = strtoul(p, &e, 16);
        if (e == p)
            return -1;

        func = val;
    }

    /* if funcp == NULL func is 0 */
    if (dom > 0xffff || bus > 0xff || slot > 0x1f || func > 7)
	return -1;

588 589 590 591 592 593
    if (*e)
	return -1;

    *domp = dom;
    *busp = bus;
    *slotp = slot;
594 595
    if (funcp != NULL)
        *funcp = func;
596 597 598
    return 0;
}

599
PCIBus *pci_get_bus_devfn(int *devfnp, PCIBus *root, const char *devaddr)
600 601 602 603
{
    int dom, bus;
    unsigned slot;

604 605
    assert(!root->parent_dev);

D
David Gibson 已提交
606 607 608 609 610
    if (!root) {
        fprintf(stderr, "No primary PCI bus\n");
        return NULL;
    }

611 612
    if (!devaddr) {
        *devfnp = -1;
D
David Gibson 已提交
613
        return pci_find_bus_nr(root, 0);
614 615
    }

616
    if (pci_parse_devaddr(devaddr, &dom, &bus, &slot, NULL) < 0) {
617 618 619
        return NULL;
    }

D
David Gibson 已提交
620 621 622 623 624
    if (dom != 0) {
        fprintf(stderr, "No support for non-zero PCI domains\n");
        return NULL;
    }

625
    *devfnp = PCI_DEVFN(slot, 0);
D
David Gibson 已提交
626
    return pci_find_bus_nr(root, bus);
627 628
}

629 630 631 632 633 634 635 636 637 638 639 640
static void pci_init_cmask(PCIDevice *dev)
{
    pci_set_word(dev->cmask + PCI_VENDOR_ID, 0xffff);
    pci_set_word(dev->cmask + PCI_DEVICE_ID, 0xffff);
    dev->cmask[PCI_STATUS] = PCI_STATUS_CAP_LIST;
    dev->cmask[PCI_REVISION_ID] = 0xff;
    dev->cmask[PCI_CLASS_PROG] = 0xff;
    pci_set_word(dev->cmask + PCI_CLASS_DEVICE, 0xffff);
    dev->cmask[PCI_HEADER_TYPE] = 0xff;
    dev->cmask[PCI_CAPABILITY_LIST] = 0xff;
}

641 642
static void pci_init_wmask(PCIDevice *dev)
{
I
Isaku Yamahata 已提交
643 644
    int config_size = pci_config_size(dev);

645 646
    dev->wmask[PCI_CACHE_LINE_SIZE] = 0xff;
    dev->wmask[PCI_INTERRUPT_LINE] = 0xff;
I
Isaku Yamahata 已提交
647
    pci_set_word(dev->wmask + PCI_COMMAND,
648 649
                 PCI_COMMAND_IO | PCI_COMMAND_MEMORY | PCI_COMMAND_MASTER |
                 PCI_COMMAND_INTX_DISABLE);
650 651 652
    if (dev->cap_present & QEMU_PCI_CAP_SERR) {
        pci_word_test_and_set_mask(dev->wmask + PCI_COMMAND, PCI_COMMAND_SERR);
    }
653 654 655

    memset(dev->wmask + PCI_CONFIG_HEADER_SIZE, 0xff,
           config_size - PCI_CONFIG_HEADER_SIZE);
656 657
}

658 659 660
static void pci_init_w1cmask(PCIDevice *dev)
{
    /*
661
     * Note: It's okay to set w1cmask even for readonly bits as
662 663 664 665 666 667 668 669
     * long as their value is hardwired to 0.
     */
    pci_set_word(dev->w1cmask + PCI_STATUS,
                 PCI_STATUS_PARITY | PCI_STATUS_SIG_TARGET_ABORT |
                 PCI_STATUS_REC_TARGET_ABORT | PCI_STATUS_REC_MASTER_ABORT |
                 PCI_STATUS_SIG_SYSTEM_ERROR | PCI_STATUS_DETECTED_PARITY);
}

670
static void pci_init_mask_bridge(PCIDevice *d)
671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690
{
    /* PCI_PRIMARY_BUS, PCI_SECONDARY_BUS, PCI_SUBORDINATE_BUS and
       PCI_SEC_LETENCY_TIMER */
    memset(d->wmask + PCI_PRIMARY_BUS, 0xff, 4);

    /* base and limit */
    d->wmask[PCI_IO_BASE] = PCI_IO_RANGE_MASK & 0xff;
    d->wmask[PCI_IO_LIMIT] = PCI_IO_RANGE_MASK & 0xff;
    pci_set_word(d->wmask + PCI_MEMORY_BASE,
                 PCI_MEMORY_RANGE_MASK & 0xffff);
    pci_set_word(d->wmask + PCI_MEMORY_LIMIT,
                 PCI_MEMORY_RANGE_MASK & 0xffff);
    pci_set_word(d->wmask + PCI_PREF_MEMORY_BASE,
                 PCI_PREF_RANGE_MASK & 0xffff);
    pci_set_word(d->wmask + PCI_PREF_MEMORY_LIMIT,
                 PCI_PREF_RANGE_MASK & 0xffff);

    /* PCI_PREF_BASE_UPPER32 and PCI_PREF_LIMIT_UPPER32 */
    memset(d->wmask + PCI_PREF_BASE_UPPER32, 0xff, 8);

691
    /* Supported memory and i/o types */
M
Michael S. Tsirkin 已提交
692 693
    d->config[PCI_IO_BASE] |= PCI_IO_RANGE_TYPE_16;
    d->config[PCI_IO_LIMIT] |= PCI_IO_RANGE_TYPE_16;
694 695 696 697 698
    pci_word_test_and_set_mask(d->config + PCI_PREF_MEMORY_BASE,
                               PCI_PREF_RANGE_TYPE_64);
    pci_word_test_and_set_mask(d->config + PCI_PREF_MEMORY_LIMIT,
                               PCI_PREF_RANGE_TYPE_64);

699 700 701 702
    /*
     * TODO: Bridges default to 10-bit VGA decoding but we currently only
     * implement 16-bit decoding (no alias support).
     */
703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718
    pci_set_word(d->wmask + PCI_BRIDGE_CONTROL,
                 PCI_BRIDGE_CTL_PARITY |
                 PCI_BRIDGE_CTL_SERR |
                 PCI_BRIDGE_CTL_ISA |
                 PCI_BRIDGE_CTL_VGA |
                 PCI_BRIDGE_CTL_VGA_16BIT |
                 PCI_BRIDGE_CTL_MASTER_ABORT |
                 PCI_BRIDGE_CTL_BUS_RESET |
                 PCI_BRIDGE_CTL_FAST_BACK |
                 PCI_BRIDGE_CTL_DISCARD |
                 PCI_BRIDGE_CTL_SEC_DISCARD |
                 PCI_BRIDGE_CTL_DISCARD_SERR);
    /* Below does not do anything as we never set this bit, put here for
     * completeness. */
    pci_set_word(d->w1cmask + PCI_BRIDGE_CONTROL,
                 PCI_BRIDGE_CTL_DISCARD_STATUS);
719
    d->cmask[PCI_IO_BASE] |= PCI_IO_RANGE_TYPE_MASK;
720
    d->cmask[PCI_IO_LIMIT] |= PCI_IO_RANGE_TYPE_MASK;
721 722
    pci_word_test_and_set_mask(d->cmask + PCI_PREF_MEMORY_BASE,
                               PCI_PREF_RANGE_TYPE_MASK);
723 724
    pci_word_test_and_set_mask(d->cmask + PCI_PREF_MEMORY_LIMIT,
                               PCI_PREF_RANGE_TYPE_MASK);
725 726
}

727 728 729 730 731 732 733 734 735 736
static int pci_init_multifunction(PCIBus *bus, PCIDevice *dev)
{
    uint8_t slot = PCI_SLOT(dev->devfn);
    uint8_t func;

    if (dev->cap_present & QEMU_PCI_CAP_MULTIFUNCTION) {
        dev->config[PCI_HEADER_TYPE] |= PCI_HEADER_TYPE_MULTI_FUNCTION;
    }

    /*
S
Stefan Weil 已提交
737
     * multifunction bit is interpreted in two ways as follows.
738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774
     *   - all functions must set the bit to 1.
     *     Example: Intel X53
     *   - function 0 must set the bit, but the rest function (> 0)
     *     is allowed to leave the bit to 0.
     *     Example: PIIX3(also in qemu), PIIX4(also in qemu), ICH10,
     *
     * So OS (at least Linux) checks the bit of only function 0,
     * and doesn't see the bit of function > 0.
     *
     * The below check allows both interpretation.
     */
    if (PCI_FUNC(dev->devfn)) {
        PCIDevice *f0 = bus->devices[PCI_DEVFN(slot, 0)];
        if (f0 && !(f0->cap_present & QEMU_PCI_CAP_MULTIFUNCTION)) {
            /* function 0 should set multifunction bit */
            error_report("PCI: single function device can't be populated "
                         "in function %x.%x", slot, PCI_FUNC(dev->devfn));
            return -1;
        }
        return 0;
    }

    if (dev->cap_present & QEMU_PCI_CAP_MULTIFUNCTION) {
        return 0;
    }
    /* function 0 indicates single function, so function > 0 must be NULL */
    for (func = 1; func < PCI_FUNC_MAX; ++func) {
        if (bus->devices[PCI_DEVFN(slot, func)]) {
            error_report("PCI: %x.0 indicates single function, "
                         "but %x.%x is already populated.",
                         slot, slot, func);
            return -1;
        }
    }
    return 0;
}

I
Isaku Yamahata 已提交
775 776 777 778
static void pci_config_alloc(PCIDevice *pci_dev)
{
    int config_size = pci_config_size(pci_dev);

779 780 781 782 783
    pci_dev->config = g_malloc0(config_size);
    pci_dev->cmask = g_malloc0(config_size);
    pci_dev->wmask = g_malloc0(config_size);
    pci_dev->w1cmask = g_malloc0(config_size);
    pci_dev->used = g_malloc0(config_size);
I
Isaku Yamahata 已提交
784 785 786 787
}

static void pci_config_free(PCIDevice *pci_dev)
{
788 789 790 791 792
    g_free(pci_dev->config);
    g_free(pci_dev->cmask);
    g_free(pci_dev->wmask);
    g_free(pci_dev->w1cmask);
    g_free(pci_dev->used);
I
Isaku Yamahata 已提交
793 794
}

B
bellard 已提交
795
/* -1 for devfn means auto assign */
P
Paul Brook 已提交
796
static PCIDevice *do_pci_register_device(PCIDevice *pci_dev, PCIBus *bus,
797
                                         const char *name, int devfn)
B
bellard 已提交
798
{
799 800 801
    PCIDeviceClass *pc = PCI_DEVICE_GET_CLASS(pci_dev);
    PCIConfigReadFunc *config_read = pc->config_read;
    PCIConfigWriteFunc *config_write = pc->config_write;
802
    AddressSpace *dma_as;
803

B
bellard 已提交
804
    if (devfn < 0) {
805
        for(devfn = bus->devfn_min ; devfn < ARRAY_SIZE(bus->devices);
806
            devfn += PCI_FUNC_MAX) {
807
            if (!bus->devices[devfn])
B
bellard 已提交
808 809
                goto found;
        }
810
        error_report("PCI: no slot/function available for %s, all in use", name);
811
        return NULL;
B
bellard 已提交
812
    found: ;
813
    } else if (bus->devices[devfn]) {
814 815
        error_report("PCI: slot %d function %d not available for %s, in use by %s",
                     PCI_SLOT(devfn), PCI_FUNC(devfn), name, bus->devices[devfn]->name);
816
        return NULL;
B
bellard 已提交
817
    }
818

819
    pci_dev->bus = bus;
820
    dma_as = pci_device_iommu_address_space(pci_dev);
821

822 823
    memory_region_init_alias(&pci_dev->bus_master_enable_region,
                             OBJECT(pci_dev), "bus master",
824 825
                             dma_as->root, 0, memory_region_size(dma_as->root));
    memory_region_set_enabled(&pci_dev->bus_master_enable_region, false);
826 827
    address_space_init(&pci_dev->bus_master_as, &pci_dev->bus_master_enable_region,
                       name);
828

B
bellard 已提交
829 830
    pci_dev->devfn = devfn;
    pstrcpy(pci_dev->name, sizeof(pci_dev->name), name);
831
    pci_dev->irq_state = 0;
I
Isaku Yamahata 已提交
832
    pci_config_alloc(pci_dev);
833

834 835 836 837
    pci_config_set_vendor_id(pci_dev->config, pc->vendor_id);
    pci_config_set_device_id(pci_dev->config, pc->device_id);
    pci_config_set_revision(pci_dev->config, pc->revision);
    pci_config_set_class(pci_dev->config, pc->class_id);
838

839 840
    if (!pc->is_bridge) {
        if (pc->subsystem_vendor_id || pc->subsystem_id) {
841
            pci_set_word(pci_dev->config + PCI_SUBSYSTEM_VENDOR_ID,
842
                         pc->subsystem_vendor_id);
843
            pci_set_word(pci_dev->config + PCI_SUBSYSTEM_ID,
844
                         pc->subsystem_id);
845 846 847 848 849
        } else {
            pci_set_default_subsystem_id(pci_dev);
        }
    } else {
        /* subsystem_vendor_id/subsystem_id are only for header type 0 */
850 851
        assert(!pc->subsystem_vendor_id);
        assert(!pc->subsystem_id);
852
    }
853
    pci_init_cmask(pci_dev);
854
    pci_init_wmask(pci_dev);
855
    pci_init_w1cmask(pci_dev);
856
    if (pc->is_bridge) {
857
        pci_init_mask_bridge(pci_dev);
858
    }
859 860 861 862
    if (pci_init_multifunction(bus, pci_dev)) {
        pci_config_free(pci_dev);
        return NULL;
    }
863 864 865 866 867

    if (!config_read)
        config_read = pci_default_read_config;
    if (!config_write)
        config_write = pci_default_write_config;
B
bellard 已提交
868 869
    pci_dev->config_read = config_read;
    pci_dev->config_write = config_write;
870
    bus->devices[devfn] = pci_dev;
J
Juan Quintela 已提交
871
    pci_dev->version_id = 2; /* Current pci device vmstate version */
B
bellard 已提交
872 873 874
    return pci_dev;
}

875 876 877 878
static void do_pci_unregister_device(PCIDevice *pci_dev)
{
    pci_dev->bus->devices[pci_dev->devfn] = NULL;
    pci_config_free(pci_dev);
879

880 881
    address_space_destroy(&pci_dev->bus_master_as);
    memory_region_destroy(&pci_dev->bus_master_enable_region);
882 883
}

884 885 886 887 888 889 890
static void pci_unregister_io_regions(PCIDevice *pci_dev)
{
    PCIIORegion *r;
    int i;

    for(i = 0; i < PCI_NUM_REGIONS; i++) {
        r = &pci_dev->io_regions[i];
891
        if (!r->size || r->addr == PCI_BAR_UNMAPPED)
892
            continue;
893
        memory_region_del_subregion(r->address_space, r->memory);
894
    }
A
Alex Williamson 已提交
895 896

    pci_unregister_vga(pci_dev);
897 898
}

899
static int pci_unregister_device(DeviceState *dev)
900
{
901 902
    PCIDevice *pci_dev = PCI_DEVICE(dev);
    PCIDeviceClass *pc = PCI_DEVICE_GET_CLASS(pci_dev);
903 904

    pci_unregister_io_regions(pci_dev);
905
    pci_del_option_rom(pci_dev);
906

907 908 909
    if (pc->exit) {
        pc->exit(pci_dev);
    }
910

911
    do_pci_unregister_device(pci_dev);
912 913 914
    return 0;
}

915 916
void pci_register_bar(PCIDevice *pci_dev, int region_num,
                      uint8_t type, MemoryRegion *memory)
B
bellard 已提交
917 918
{
    PCIIORegion *r;
P
pbrook 已提交
919
    uint32_t addr;
920
    uint64_t wmask;
A
Avi Kivity 已提交
921
    pcibus_t size = memory_region_size(memory);
922

923 924
    assert(region_num >= 0);
    assert(region_num < PCI_NUM_REGIONS);
925 926
    if (size & (size-1)) {
        fprintf(stderr, "ERROR: PCI region size must be pow2 "
927
                    "type=0x%x, size=0x%"FMT_PCIBUS"\n", type, size);
928 929 930
        exit(1);
    }

B
bellard 已提交
931
    r = &pci_dev->io_regions[region_num];
932
    r->addr = PCI_BAR_UNMAPPED;
B
bellard 已提交
933 934
    r->size = size;
    r->type = type;
935
    r->memory = NULL;
936 937

    wmask = ~(size - 1);
938
    addr = pci_bar(pci_dev, region_num);
P
pbrook 已提交
939
    if (region_num == PCI_ROM_SLOT) {
S
Stefan Weil 已提交
940
        /* ROM enable bit is writable */
941
        wmask |= PCI_ROM_ADDRESS_ENABLE;
P
pbrook 已提交
942
    }
943
    pci_set_long(pci_dev->config + addr, type);
I
Isaku Yamahata 已提交
944 945 946 947 948 949 950 951
    if (!(r->type & PCI_BASE_ADDRESS_SPACE_IO) &&
        r->type & PCI_BASE_ADDRESS_MEM_TYPE_64) {
        pci_set_quad(pci_dev->wmask + addr, wmask);
        pci_set_quad(pci_dev->cmask + addr, ~0ULL);
    } else {
        pci_set_long(pci_dev->wmask + addr, wmask & 0xffffffff);
        pci_set_long(pci_dev->cmask + addr, 0xffffffff);
    }
952
    pci_dev->io_regions[region_num].memory = memory;
953
    pci_dev->io_regions[region_num].address_space
A
Avi Kivity 已提交
954
        = type & PCI_BASE_ADDRESS_SPACE_IO
955 956
        ? pci_dev->bus->address_space_io
        : pci_dev->bus->address_space_mem;
957 958
}

A
Alex Williamson 已提交
959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015
static void pci_update_vga(PCIDevice *pci_dev)
{
    uint16_t cmd;

    if (!pci_dev->has_vga) {
        return;
    }

    cmd = pci_get_word(pci_dev->config + PCI_COMMAND);

    memory_region_set_enabled(pci_dev->vga_regions[QEMU_PCI_VGA_MEM],
                              cmd & PCI_COMMAND_MEMORY);
    memory_region_set_enabled(pci_dev->vga_regions[QEMU_PCI_VGA_IO_LO],
                              cmd & PCI_COMMAND_IO);
    memory_region_set_enabled(pci_dev->vga_regions[QEMU_PCI_VGA_IO_HI],
                              cmd & PCI_COMMAND_IO);
}

void pci_register_vga(PCIDevice *pci_dev, MemoryRegion *mem,
                      MemoryRegion *io_lo, MemoryRegion *io_hi)
{
    assert(!pci_dev->has_vga);

    assert(memory_region_size(mem) == QEMU_PCI_VGA_MEM_SIZE);
    pci_dev->vga_regions[QEMU_PCI_VGA_MEM] = mem;
    memory_region_add_subregion_overlap(pci_dev->bus->address_space_mem,
                                        QEMU_PCI_VGA_MEM_BASE, mem, 1);

    assert(memory_region_size(io_lo) == QEMU_PCI_VGA_IO_LO_SIZE);
    pci_dev->vga_regions[QEMU_PCI_VGA_IO_LO] = io_lo;
    memory_region_add_subregion_overlap(pci_dev->bus->address_space_io,
                                        QEMU_PCI_VGA_IO_LO_BASE, io_lo, 1);

    assert(memory_region_size(io_hi) == QEMU_PCI_VGA_IO_HI_SIZE);
    pci_dev->vga_regions[QEMU_PCI_VGA_IO_HI] = io_hi;
    memory_region_add_subregion_overlap(pci_dev->bus->address_space_io,
                                        QEMU_PCI_VGA_IO_HI_BASE, io_hi, 1);
    pci_dev->has_vga = true;

    pci_update_vga(pci_dev);
}

void pci_unregister_vga(PCIDevice *pci_dev)
{
    if (!pci_dev->has_vga) {
        return;
    }

    memory_region_del_subregion(pci_dev->bus->address_space_mem,
                                pci_dev->vga_regions[QEMU_PCI_VGA_MEM]);
    memory_region_del_subregion(pci_dev->bus->address_space_io,
                                pci_dev->vga_regions[QEMU_PCI_VGA_IO_LO]);
    memory_region_del_subregion(pci_dev->bus->address_space_io,
                                pci_dev->vga_regions[QEMU_PCI_VGA_IO_HI]);
    pci_dev->has_vga = false;
}

1016 1017 1018 1019 1020
pcibus_t pci_get_bar_addr(PCIDevice *pci_dev, int region_num)
{
    return pci_dev->io_regions[region_num].addr;
}

1021 1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033
static pcibus_t pci_bar_address(PCIDevice *d,
				int reg, uint8_t type, pcibus_t size)
{
    pcibus_t new_addr, last_addr;
    int bar = pci_bar(d, reg);
    uint16_t cmd = pci_get_word(d->config + PCI_COMMAND);

    if (type & PCI_BASE_ADDRESS_SPACE_IO) {
        if (!(cmd & PCI_COMMAND_IO)) {
            return PCI_BAR_UNMAPPED;
        }
        new_addr = pci_get_long(d->config + bar) & ~(size - 1);
        last_addr = new_addr + size - 1;
1034 1035 1036 1037
        /* Check if 32 bit BAR wraps around explicitly.
         * TODO: make priorities correct and remove this work around.
         */
        if (last_addr <= new_addr || new_addr == 0 || last_addr >= UINT32_MAX) {
1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080
            return PCI_BAR_UNMAPPED;
        }
        return new_addr;
    }

    if (!(cmd & PCI_COMMAND_MEMORY)) {
        return PCI_BAR_UNMAPPED;
    }
    if (type & PCI_BASE_ADDRESS_MEM_TYPE_64) {
        new_addr = pci_get_quad(d->config + bar);
    } else {
        new_addr = pci_get_long(d->config + bar);
    }
    /* the ROM slot has a specific enable bit */
    if (reg == PCI_ROM_SLOT && !(new_addr & PCI_ROM_ADDRESS_ENABLE)) {
        return PCI_BAR_UNMAPPED;
    }
    new_addr &= ~(size - 1);
    last_addr = new_addr + size - 1;
    /* NOTE: we do not support wrapping */
    /* XXX: as we cannot support really dynamic
       mappings, we handle specific values as invalid
       mappings. */
    if (last_addr <= new_addr || new_addr == 0 ||
        last_addr == PCI_BAR_UNMAPPED) {
        return PCI_BAR_UNMAPPED;
    }

    /* Now pcibus_t is 64bit.
     * Check if 32 bit BAR wraps around explicitly.
     * Without this, PC ide doesn't work well.
     * TODO: remove this work around.
     */
    if  (!(type & PCI_BASE_ADDRESS_MEM_TYPE_64) && last_addr >= UINT32_MAX) {
        return PCI_BAR_UNMAPPED;
    }

    /*
     * OS is allowed to set BAR beyond its addressable
     * bits. For example, 32 bit OS can set 64bit bar
     * to >4G. Check it. TODO: we might need to support
     * it in the future for e.g. PAE.
     */
A
Avi Kivity 已提交
1081
    if (last_addr >= HWADDR_MAX) {
1082 1083 1084 1085 1086 1087
        return PCI_BAR_UNMAPPED;
    }

    return new_addr;
}

1088 1089 1090
static void pci_update_mappings(PCIDevice *d)
{
    PCIIORegion *r;
1091
    int i;
1092
    pcibus_t new_addr;
1093

1094
    for(i = 0; i < PCI_NUM_REGIONS; i++) {
1095
        r = &d->io_regions[i];
1096 1097

        /* this region isn't registered */
1098
        if (!r->size)
1099 1100
            continue;

1101
        new_addr = pci_bar_address(d, i, r->type, r->size);
1102 1103

        /* This bar isn't changed */
1104
        if (new_addr == r->addr)
1105 1106 1107 1108
            continue;

        /* now do the real mapping */
        if (r->addr != PCI_BAR_UNMAPPED) {
1109
            memory_region_del_subregion(r->address_space, r->memory);
1110
        }
1111 1112
        r->addr = new_addr;
        if (r->addr != PCI_BAR_UNMAPPED) {
1113 1114
            memory_region_add_subregion_overlap(r->address_space,
                                                r->addr, r->memory, 1);
1115
        }
1116
    }
A
Alex Williamson 已提交
1117 1118

    pci_update_vga(d);
1119 1120
}

1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139
static inline int pci_irq_disabled(PCIDevice *d)
{
    return pci_get_word(d->config + PCI_COMMAND) & PCI_COMMAND_INTX_DISABLE;
}

/* Called after interrupt disabled field update in config space,
 * assert/deassert interrupts if necessary.
 * Gets original interrupt disable bit value (before update). */
static void pci_update_irq_disabled(PCIDevice *d, int was_irq_disabled)
{
    int i, disabled = pci_irq_disabled(d);
    if (disabled == was_irq_disabled)
        return;
    for (i = 0; i < PCI_NUM_PINS; ++i) {
        int state = pci_irq_state(d, i);
        pci_change_irq_level(d, i, disabled ? -state : state);
    }
}

1140
uint32_t pci_default_read_config(PCIDevice *d,
1141
                                 uint32_t address, int len)
B
bellard 已提交
1142
{
1143
    uint32_t val = 0;
J
Jan Kiszka 已提交
1144

1145 1146
    memcpy(&val, d->config + address, len);
    return le32_to_cpu(val);
1147 1148
}

1149
void pci_default_write_config(PCIDevice *d, uint32_t addr, uint32_t val, int l)
1150
{
1151
    int i, was_irq_disabled = pci_irq_disabled(d);
1152

J
Jan Kiszka 已提交
1153
    for (i = 0; i < l; val >>= 8, ++i) {
1154
        uint8_t wmask = d->wmask[addr + i];
1155 1156
        uint8_t w1cmask = d->w1cmask[addr + i];
        assert(!(wmask & w1cmask));
1157
        d->config[addr + i] = (d->config[addr + i] & ~wmask) | (val & wmask);
1158
        d->config[addr + i] &= ~(val & w1cmask); /* W1C: Write 1 to Clear */
1159
    }
I
Isaku Yamahata 已提交
1160
    if (ranges_overlap(addr, l, PCI_BASE_ADDRESS_0, 24) ||
1161 1162
        ranges_overlap(addr, l, PCI_ROM_ADDRESS, 4) ||
        ranges_overlap(addr, l, PCI_ROM_ADDRESS1, 4) ||
I
Isaku Yamahata 已提交
1163
        range_covers_byte(addr, l, PCI_COMMAND))
1164
        pci_update_mappings(d);
1165

A
Avi Kivity 已提交
1166
    if (range_covers_byte(addr, l, PCI_COMMAND)) {
1167
        pci_update_irq_disabled(d, was_irq_disabled);
A
Avi Kivity 已提交
1168 1169 1170 1171
        memory_region_set_enabled(&d->bus_master_enable_region,
                                  pci_get_word(d->config + PCI_COMMAND)
                                    & PCI_COMMAND_MASTER);
    }
1172 1173 1174

    msi_write_config(d, addr, val, l);
    msix_write_config(d, addr, val, l);
B
bellard 已提交
1175 1176
}

P
pbrook 已提交
1177 1178
/***********************************************************/
/* generic PCI irq support */
1179

P
pbrook 已提交
1180
/* 0 <= irq_num <= 3. level must be 0 or 1 */
1181
static void pci_irq_handler(void *opaque, int irq_num, int level)
B
bellard 已提交
1182
{
1183
    PCIDevice *pci_dev = opaque;
P
pbrook 已提交
1184
    int change;
1185

1186
    change = level - pci_irq_state(pci_dev, irq_num);
P
pbrook 已提交
1187 1188
    if (!change)
        return;
1189

1190
    pci_set_irq_state(pci_dev, irq_num, level);
1191
    pci_update_irq_status(pci_dev);
1192 1193
    if (pci_irq_disabled(pci_dev))
        return;
1194
    pci_change_irq_level(pci_dev, irq_num, change);
B
bellard 已提交
1195 1196
}

1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214
static inline int pci_intx(PCIDevice *pci_dev)
{
    return pci_get_byte(pci_dev->config + PCI_INTERRUPT_PIN) - 1;
}

qemu_irq pci_allocate_irq(PCIDevice *pci_dev)
{
    int intx = pci_intx(pci_dev);

    return qemu_allocate_irq(pci_irq_handler, pci_dev, intx);
}

void pci_set_irq(PCIDevice *pci_dev, int level)
{
    int intx = pci_intx(pci_dev);
    pci_irq_handler(pci_dev, intx, level);
}

1215 1216 1217
/* Special hooks used by device assignment */
void pci_bus_set_route_irq_fn(PCIBus *bus, pci_route_irq_fn route_intx_to_irq)
{
1218
    assert(pci_bus_is_root(bus));
1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230
    bus->route_intx_to_irq = route_intx_to_irq;
}

PCIINTxRoute pci_device_route_intx_to_irq(PCIDevice *dev, int pin)
{
    PCIBus *bus;

    do {
         bus = dev->bus;
         pin = bus->map_irq(dev, pin);
         dev = bus->parent_dev;
    } while (dev);
1231 1232

    if (!bus->route_intx_to_irq) {
1233
        error_report("PCI: Bug - unimplemented PCI INTx routing (%s)",
1234 1235 1236 1237
                     object_get_typename(OBJECT(bus->qbus.parent)));
        return (PCIINTxRoute) { PCI_INTX_DISABLED, -1 };
    }

1238
    return bus->route_intx_to_irq(bus->irq_opaque, pin);
J
Jan Kiszka 已提交
1239 1240
}

1241 1242 1243 1244 1245
bool pci_intx_route_changed(PCIINTxRoute *old, PCIINTxRoute *new)
{
    return old->mode != new->mode || old->irq != new->irq;
}

J
Jan Kiszka 已提交
1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256
void pci_bus_fire_intx_routing_notifier(PCIBus *bus)
{
    PCIDevice *dev;
    PCIBus *sec;
    int i;

    for (i = 0; i < ARRAY_SIZE(bus->devices); ++i) {
        dev = bus->devices[i];
        if (dev && dev->intx_routing_notifier) {
            dev->intx_routing_notifier(dev);
        }
1257 1258 1259 1260
    }

    QLIST_FOREACH(sec, &bus->child, sibling) {
        pci_bus_fire_intx_routing_notifier(sec);
J
Jan Kiszka 已提交
1261 1262 1263 1264 1265 1266 1267
    }
}

void pci_device_set_intx_routing_notifier(PCIDevice *dev,
                                          PCIINTxRoutingNotifier notifier)
{
    dev->intx_routing_notifier = notifier;
B
bellard 已提交
1268 1269
}

1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287
/*
 * PCI-to-PCI bridge specification
 * 9.1: Interrupt routing. Table 9-1
 *
 * the PCI Express Base Specification, Revision 2.1
 * 2.2.8.1: INTx interrutp signaling - Rules
 *          the Implementation Note
 *          Table 2-20
 */
/*
 * 0 <= pin <= 3 0 = INTA, 1 = INTB, 2 = INTC, 3 = INTD
 * 0-origin unlike PCI interrupt pin register.
 */
int pci_swizzle_map_irq_fn(PCIDevice *pci_dev, int pin)
{
    return (pin + PCI_SLOT(pci_dev->devfn)) % PCI_NUM_PINS;
}

P
pbrook 已提交
1288 1289
/***********************************************************/
/* monitor info on PCI */
1290

1291 1292 1293
typedef struct {
    uint16_t class;
    const char *desc;
1294 1295
    const char *fw_name;
    uint16_t fw_ign_bits;
1296 1297
} pci_class_desc;

1298
static const pci_class_desc pci_class_descriptions[] =
1299
{
1300 1301 1302 1303 1304 1305
    { 0x0001, "VGA controller", "display"},
    { 0x0100, "SCSI controller", "scsi"},
    { 0x0101, "IDE controller", "ide"},
    { 0x0102, "Floppy controller", "fdc"},
    { 0x0103, "IPI controller", "ipi"},
    { 0x0104, "RAID controller", "raid"},
T
ths 已提交
1306 1307 1308
    { 0x0106, "SATA controller"},
    { 0x0107, "SAS controller"},
    { 0x0180, "Storage controller"},
1309 1310 1311 1312
    { 0x0200, "Ethernet controller", "ethernet"},
    { 0x0201, "Token Ring controller", "token-ring"},
    { 0x0202, "FDDI controller", "fddi"},
    { 0x0203, "ATM controller", "atm"},
T
ths 已提交
1313
    { 0x0280, "Network controller"},
1314
    { 0x0300, "VGA controller", "display", 0x00ff},
T
ths 已提交
1315 1316 1317
    { 0x0301, "XGA controller"},
    { 0x0302, "3D controller"},
    { 0x0380, "Display controller"},
1318 1319
    { 0x0400, "Video controller", "video"},
    { 0x0401, "Audio controller", "sound"},
T
ths 已提交
1320
    { 0x0402, "Phone"},
1321
    { 0x0403, "Audio controller", "sound"},
T
ths 已提交
1322
    { 0x0480, "Multimedia controller"},
1323 1324
    { 0x0500, "RAM controller", "memory"},
    { 0x0501, "Flash controller", "flash"},
T
ths 已提交
1325
    { 0x0580, "Memory controller"},
1326 1327 1328 1329
    { 0x0600, "Host bridge", "host"},
    { 0x0601, "ISA bridge", "isa"},
    { 0x0602, "EISA bridge", "eisa"},
    { 0x0603, "MC bridge", "mca"},
G
Gerd Hoffmann 已提交
1330
    { 0x0604, "PCI bridge", "pci-bridge"},
1331 1332 1333
    { 0x0605, "PCMCIA bridge", "pcmcia"},
    { 0x0606, "NUBUS bridge", "nubus"},
    { 0x0607, "CARDBUS bridge", "cardbus"},
T
ths 已提交
1334 1335
    { 0x0608, "RACEWAY bridge"},
    { 0x0680, "Bridge"},
1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350 1351
    { 0x0700, "Serial port", "serial"},
    { 0x0701, "Parallel port", "parallel"},
    { 0x0800, "Interrupt controller", "interrupt-controller"},
    { 0x0801, "DMA controller", "dma-controller"},
    { 0x0802, "Timer", "timer"},
    { 0x0803, "RTC", "rtc"},
    { 0x0900, "Keyboard", "keyboard"},
    { 0x0901, "Pen", "pen"},
    { 0x0902, "Mouse", "mouse"},
    { 0x0A00, "Dock station", "dock", 0x00ff},
    { 0x0B00, "i386 cpu", "cpu", 0x00ff},
    { 0x0c00, "Fireware contorller", "fireware"},
    { 0x0c01, "Access bus controller", "access-bus"},
    { 0x0c02, "SSA controller", "ssa"},
    { 0x0c03, "USB controller", "usb"},
    { 0x0c04, "Fibre channel controller", "fibre-channel"},
J
Jan Kiszka 已提交
1352
    { 0x0c05, "SMBus"},
1353 1354 1355
    { 0, NULL}
};

1356
static void pci_for_each_device_under_bus(PCIBus *bus,
1357 1358 1359
                                          void (*fn)(PCIBus *b, PCIDevice *d,
                                                     void *opaque),
                                          void *opaque)
1360
{
1361 1362
    PCIDevice *d;
    int devfn;
1363

1364 1365 1366
    for(devfn = 0; devfn < ARRAY_SIZE(bus->devices); devfn++) {
        d = bus->devices[devfn];
        if (d) {
1367
            fn(bus, d, opaque);
1368 1369 1370 1371 1372
        }
    }
}

void pci_for_each_device(PCIBus *bus, int bus_num,
1373 1374
                         void (*fn)(PCIBus *b, PCIDevice *d, void *opaque),
                         void *opaque)
1375
{
1376
    bus = pci_find_bus_nr(bus, bus_num);
1377 1378

    if (bus) {
1379
        pci_for_each_device_under_bus(bus, fn, opaque);
1380 1381 1382
    }
}

L
Luiz Capitulino 已提交
1383
static const pci_class_desc *get_class_desc(int class)
1384
{
L
Luiz Capitulino 已提交
1385
    const pci_class_desc *desc;
1386

L
Luiz Capitulino 已提交
1387 1388 1389
    desc = pci_class_descriptions;
    while (desc->desc && class != desc->class) {
        desc++;
1390
    }
1391

L
Luiz Capitulino 已提交
1392 1393
    return desc;
}
I
Isaku Yamahata 已提交
1394

L
Luiz Capitulino 已提交
1395
static PciDeviceInfoList *qmp_query_pci_devices(PCIBus *bus, int bus_num);
1396

L
Luiz Capitulino 已提交
1397 1398 1399 1400
static PciMemoryRegionList *qmp_query_pci_regions(const PCIDevice *dev)
{
    PciMemoryRegionList *head = NULL, *cur_item = NULL;
    int i;
1401

L
Luiz Capitulino 已提交
1402 1403 1404 1405 1406 1407
    for (i = 0; i < PCI_NUM_REGIONS; i++) {
        const PCIIORegion *r = &dev->io_regions[i];
        PciMemoryRegionList *region;

        if (!r->size) {
            continue;
P
pbrook 已提交
1408
        }
1409

L
Luiz Capitulino 已提交
1410 1411
        region = g_malloc0(sizeof(*region));
        region->value = g_malloc0(sizeof(*region->value));
1412

L
Luiz Capitulino 已提交
1413 1414 1415 1416 1417 1418 1419 1420
        if (r->type & PCI_BASE_ADDRESS_SPACE_IO) {
            region->value->type = g_strdup("io");
        } else {
            region->value->type = g_strdup("memory");
            region->value->has_prefetch = true;
            region->value->prefetch = !!(r->type & PCI_BASE_ADDRESS_MEM_PREFETCH);
            region->value->has_mem_type_64 = true;
            region->value->mem_type_64 = !!(r->type & PCI_BASE_ADDRESS_MEM_TYPE_64);
1421
        }
1422

L
Luiz Capitulino 已提交
1423 1424 1425
        region->value->bar = i;
        region->value->address = r->addr;
        region->value->size = r->size;
1426

L
Luiz Capitulino 已提交
1427 1428 1429 1430 1431 1432
        /* XXX: waiting for the qapi to support GSList */
        if (!cur_item) {
            head = cur_item = region;
        } else {
            cur_item->next = region;
            cur_item = region;
1433
        }
P
pbrook 已提交
1434
    }
1435

L
Luiz Capitulino 已提交
1436
    return head;
1437 1438
}

L
Luiz Capitulino 已提交
1439 1440
static PciBridgeInfo *qmp_query_pci_bridge(PCIDevice *dev, PCIBus *bus,
                                           int bus_num)
1441
{
L
Luiz Capitulino 已提交
1442
    PciBridgeInfo *info;
1443

L
Luiz Capitulino 已提交
1444
    info = g_malloc0(sizeof(*info));
1445

L
Luiz Capitulino 已提交
1446 1447 1448
    info->bus.number = dev->config[PCI_PRIMARY_BUS];
    info->bus.secondary = dev->config[PCI_SECONDARY_BUS];
    info->bus.subordinate = dev->config[PCI_SUBORDINATE_BUS];
1449

L
Luiz Capitulino 已提交
1450 1451 1452
    info->bus.io_range = g_malloc0(sizeof(*info->bus.io_range));
    info->bus.io_range->base = pci_bridge_get_base(dev, PCI_BASE_ADDRESS_SPACE_IO);
    info->bus.io_range->limit = pci_bridge_get_limit(dev, PCI_BASE_ADDRESS_SPACE_IO);
1453

L
Luiz Capitulino 已提交
1454 1455 1456
    info->bus.memory_range = g_malloc0(sizeof(*info->bus.memory_range));
    info->bus.memory_range->base = pci_bridge_get_base(dev, PCI_BASE_ADDRESS_SPACE_MEMORY);
    info->bus.memory_range->limit = pci_bridge_get_limit(dev, PCI_BASE_ADDRESS_SPACE_MEMORY);
1457

L
Luiz Capitulino 已提交
1458 1459 1460
    info->bus.prefetchable_range = g_malloc0(sizeof(*info->bus.prefetchable_range));
    info->bus.prefetchable_range->base = pci_bridge_get_base(dev, PCI_BASE_ADDRESS_MEM_PREFETCH);
    info->bus.prefetchable_range->limit = pci_bridge_get_limit(dev, PCI_BASE_ADDRESS_MEM_PREFETCH);
1461

L
Luiz Capitulino 已提交
1462
    if (dev->config[PCI_SECONDARY_BUS] != 0) {
1463
        PCIBus *child_bus = pci_find_bus_nr(bus, dev->config[PCI_SECONDARY_BUS]);
L
Luiz Capitulino 已提交
1464 1465 1466 1467
        if (child_bus) {
            info->has_devices = true;
            info->devices = qmp_query_pci_devices(child_bus, dev->config[PCI_SECONDARY_BUS]);
        }
1468 1469
    }

L
Luiz Capitulino 已提交
1470
    return info;
1471 1472
}

L
Luiz Capitulino 已提交
1473 1474
static PciDeviceInfo *qmp_query_pci_device(PCIDevice *dev, PCIBus *bus,
                                           int bus_num)
1475
{
L
Luiz Capitulino 已提交
1476 1477
    const pci_class_desc *desc;
    PciDeviceInfo *info;
1478
    uint8_t type;
L
Luiz Capitulino 已提交
1479
    int class;
1480

L
Luiz Capitulino 已提交
1481 1482 1483 1484 1485 1486
    info = g_malloc0(sizeof(*info));
    info->bus = bus_num;
    info->slot = PCI_SLOT(dev->devfn);
    info->function = PCI_FUNC(dev->devfn);

    class = pci_get_word(dev->config + PCI_CLASS_DEVICE);
1487
    info->class_info.q_class = class;
L
Luiz Capitulino 已提交
1488 1489 1490 1491 1492 1493 1494 1495 1496 1497
    desc = get_class_desc(class);
    if (desc->desc) {
        info->class_info.has_desc = true;
        info->class_info.desc = g_strdup(desc->desc);
    }

    info->id.vendor = pci_get_word(dev->config + PCI_VENDOR_ID);
    info->id.device = pci_get_word(dev->config + PCI_DEVICE_ID);
    info->regions = qmp_query_pci_regions(dev);
    info->qdev_id = g_strdup(dev->qdev.id ? dev->qdev.id : "");
1498 1499

    if (dev->config[PCI_INTERRUPT_PIN] != 0) {
L
Luiz Capitulino 已提交
1500 1501
        info->has_irq = true;
        info->irq = dev->config[PCI_INTERRUPT_LINE];
1502 1503
    }

1504 1505
    type = dev->config[PCI_HEADER_TYPE] & ~PCI_HEADER_TYPE_MULTI_FUNCTION;
    if (type == PCI_HEADER_TYPE_BRIDGE) {
L
Luiz Capitulino 已提交
1506 1507
        info->has_pci_bridge = true;
        info->pci_bridge = qmp_query_pci_bridge(dev, bus, bus_num);
1508 1509
    }

L
Luiz Capitulino 已提交
1510
    return info;
1511 1512
}

L
Luiz Capitulino 已提交
1513
static PciDeviceInfoList *qmp_query_pci_devices(PCIBus *bus, int bus_num)
1514
{
L
Luiz Capitulino 已提交
1515
    PciDeviceInfoList *info, *head = NULL, *cur_item = NULL;
1516
    PCIDevice *dev;
L
Luiz Capitulino 已提交
1517
    int devfn;
1518 1519 1520 1521

    for (devfn = 0; devfn < ARRAY_SIZE(bus->devices); devfn++) {
        dev = bus->devices[devfn];
        if (dev) {
L
Luiz Capitulino 已提交
1522 1523 1524 1525 1526 1527 1528 1529 1530 1531
            info = g_malloc0(sizeof(*info));
            info->value = qmp_query_pci_device(dev, bus, bus_num);

            /* XXX: waiting for the qapi to support GSList */
            if (!cur_item) {
                head = cur_item = info;
            } else {
                cur_item->next = info;
                cur_item = info;
            }
1532
        }
1533
    }
1534

L
Luiz Capitulino 已提交
1535
    return head;
1536 1537
}

L
Luiz Capitulino 已提交
1538
static PciInfo *qmp_query_pci_bus(PCIBus *bus, int bus_num)
1539
{
L
Luiz Capitulino 已提交
1540 1541
    PciInfo *info = NULL;

1542
    bus = pci_find_bus_nr(bus, bus_num);
P
pbrook 已提交
1543
    if (bus) {
L
Luiz Capitulino 已提交
1544 1545 1546
        info = g_malloc0(sizeof(*info));
        info->bus = bus_num;
        info->devices = qmp_query_pci_devices(bus, bus_num);
B
bellard 已提交
1547
    }
1548

L
Luiz Capitulino 已提交
1549
    return info;
B
bellard 已提交
1550 1551
}

L
Luiz Capitulino 已提交
1552
PciInfoList *qmp_query_pci(Error **errp)
B
bellard 已提交
1553
{
L
Luiz Capitulino 已提交
1554
    PciInfoList *info, *head = NULL, *cur_item = NULL;
1555
    PCIHostState *host_bridge;
1556

1557
    QLIST_FOREACH(host_bridge, &pci_host_bridges, next) {
L
Luiz Capitulino 已提交
1558
        info = g_malloc0(sizeof(*info));
1559
        info->value = qmp_query_pci_bus(host_bridge->bus, 0);
L
Luiz Capitulino 已提交
1560 1561 1562 1563 1564 1565 1566

        /* XXX: waiting for the qapi to support GSList */
        if (!cur_item) {
            head = cur_item = info;
        } else {
            cur_item->next = info;
            cur_item = info;
1567
        }
1568
    }
1569

L
Luiz Capitulino 已提交
1570
    return head;
B
bellard 已提交
1571
}
1572

1573 1574 1575 1576 1577 1578 1579 1580 1581 1582 1583 1584
static const char * const pci_nic_models[] = {
    "ne2k_pci",
    "i82551",
    "i82557b",
    "i82559er",
    "rtl8139",
    "e1000",
    "pcnet",
    "virtio",
    NULL
};

P
Paul Brook 已提交
1585 1586 1587 1588 1589 1590 1591 1592
static const char * const pci_nic_names[] = {
    "ne2k_pci",
    "i82551",
    "i82557b",
    "i82559er",
    "rtl8139",
    "e1000",
    "pcnet",
P
Paul Brook 已提交
1593
    "virtio-net-pci",
1594 1595 1596
    NULL
};

1597
/* Initialize a PCI NIC.  */
1598
/* FIXME callers should check for failure, but don't */
1599 1600
PCIDevice *pci_nic_init(NICInfo *nd, PCIBus *rootbus,
                        const char *default_model,
1601
                        const char *default_devaddr)
1602
{
1603
    const char *devaddr = nd->devaddr ? nd->devaddr : default_devaddr;
1604 1605
    PCIBus *bus;
    int devfn;
1606
    PCIDevice *pci_dev;
P
Paul Brook 已提交
1607
    DeviceState *dev;
1608 1609
    int i;

1610 1611 1612 1613
    i = qemu_find_nic_model(nd, pci_nic_models, default_model);
    if (i < 0)
        return NULL;

1614
    bus = pci_get_bus_devfn(&devfn, rootbus, devaddr);
1615
    if (!bus) {
1616 1617
        error_report("Invalid PCI device address %s for device %s",
                     devaddr, pci_nic_names[i]);
1618 1619 1620
        return NULL;
    }

1621
    pci_dev = pci_create(bus, devfn, pci_nic_names[i]);
1622
    dev = &pci_dev->qdev;
G
Gerd Hoffmann 已提交
1623
    qdev_set_nic_properties(dev, nd);
1624 1625
    if (qdev_init(dev) < 0)
        return NULL;
1626
    return pci_dev;
1627 1628
}

1629 1630
PCIDevice *pci_nic_init_nofail(NICInfo *nd, PCIBus *rootbus,
                               const char *default_model,
1631 1632 1633 1634 1635 1636 1637
                               const char *default_devaddr)
{
    PCIDevice *res;

    if (qemu_show_nic_models(nd->model, pci_nic_models))
        exit(0);

1638
    res = pci_nic_init(nd, rootbus, default_model, default_devaddr);
1639 1640 1641 1642 1643
    if (!res)
        exit(1);
    return res;
}

1644 1645 1646 1647 1648 1649 1650 1651 1652 1653 1654 1655 1656 1657 1658 1659 1660 1661
PCIDevice *pci_vga_init(PCIBus *bus)
{
    switch (vga_interface_type) {
    case VGA_CIRRUS:
        return pci_create_simple(bus, -1, "cirrus-vga");
    case VGA_QXL:
        return pci_create_simple(bus, -1, "qxl-vga");
    case VGA_STD:
        return pci_create_simple(bus, -1, "VGA");
    case VGA_VMWARE:
        return pci_create_simple(bus, -1, "vmware-svga");
    case VGA_NONE:
    default: /* Other non-PCI types. Checking for unsupported types is already
                done in vl.c. */
        return NULL;
    }
}

1662 1663 1664 1665 1666 1667 1668 1669 1670 1671
/* Whether a given bus number is in range of the secondary
 * bus of the given bridge device. */
static bool pci_secondary_bus_in_range(PCIDevice *dev, int bus_num)
{
    return !(pci_get_word(dev->config + PCI_BRIDGE_CONTROL) &
             PCI_BRIDGE_CTL_BUS_RESET) /* Don't walk the bus if it's reset. */ &&
        dev->config[PCI_SECONDARY_BUS] < bus_num &&
        bus_num <= dev->config[PCI_SUBORDINATE_BUS];
}

1672
static PCIBus *pci_find_bus_nr(PCIBus *bus, int bus_num)
1673
{
I
Isaku Yamahata 已提交
1674
    PCIBus *sec;
1675

I
Isaku Yamahata 已提交
1676
    if (!bus) {
1677
        return NULL;
I
Isaku Yamahata 已提交
1678
    }
1679

1680 1681 1682 1683
    if (pci_bus_num(bus) == bus_num) {
        return bus;
    }

1684
    /* Consider all bus numbers in range for the host pci bridge. */
1685
    if (!pci_bus_is_root(bus) &&
1686 1687 1688 1689
        !pci_secondary_bus_in_range(bus->parent_dev, bus_num)) {
        return NULL;
    }

1690
    /* try child bus */
1691 1692
    for (; bus; bus = sec) {
        QLIST_FOREACH(sec, &bus->child, sibling) {
1693
            assert(!pci_bus_is_root(sec));
1694 1695 1696 1697 1698
            if (sec->parent_dev->config[PCI_SECONDARY_BUS] == bus_num) {
                return sec;
            }
            if (pci_secondary_bus_in_range(sec->parent_dev, bus_num)) {
                break;
B
Blue Swirl 已提交
1699
            }
1700 1701 1702 1703
        }
    }

    return NULL;
1704 1705
}

1706
PCIDevice *pci_find_device(PCIBus *bus, int bus_num, uint8_t devfn)
1707
{
1708
    bus = pci_find_bus_nr(bus, bus_num);
1709 1710 1711 1712

    if (!bus)
        return NULL;

1713
    return bus->devices[devfn];
1714 1715
}

A
Anthony Liguori 已提交
1716
static int pci_qdev_init(DeviceState *qdev)
P
Paul Brook 已提交
1717 1718
{
    PCIDevice *pci_dev = (PCIDevice *)qdev;
1719
    PCIDeviceClass *pc = PCI_DEVICE_GET_CLASS(pci_dev);
P
Paul Brook 已提交
1720
    PCIBus *bus;
1721
    int rc;
1722
    bool is_default_rom;
P
Paul Brook 已提交
1723

I
Isaku Yamahata 已提交
1724
    /* initialize cap_present for pci_is_express() and pci_config_size() */
1725
    if (pc->is_express) {
I
Isaku Yamahata 已提交
1726 1727 1728
        pci_dev->cap_present |= QEMU_PCI_CAP_EXPRESS;
    }

A
Andreas Färber 已提交
1729
    bus = PCI_BUS(qdev_get_parent_bus(qdev));
A
Anthony Liguori 已提交
1730 1731 1732
    pci_dev = do_pci_register_device(pci_dev, bus,
                                     object_get_typename(OBJECT(qdev)),
                                     pci_dev->devfn);
1733 1734
    if (pci_dev == NULL)
        return -1;
1735
    if (qdev->hotplugged && pc->no_hotplug) {
1736
        qerror_report(QERR_DEVICE_NO_HOTPLUG, object_get_typename(OBJECT(pci_dev)));
1737 1738 1739
        do_pci_unregister_device(pci_dev);
        return -1;
    }
1740 1741
    if (pc->init) {
        rc = pc->init(pci_dev);
1742 1743 1744 1745
        if (rc != 0) {
            do_pci_unregister_device(pci_dev);
            return rc;
        }
1746
    }
1747 1748

    /* rom loading */
1749
    is_default_rom = false;
1750 1751
    if (pci_dev->romfile == NULL && pc->romfile != NULL) {
        pci_dev->romfile = g_strdup(pc->romfile);
1752 1753 1754
        is_default_rom = true;
    }
    pci_add_option_rom(pci_dev, is_default_rom);
1755

1756
    if (bus->hotplug) {
1757 1758 1759 1760 1761
        /* Let buses differentiate between hotplug and when device is
         * enabled during qemu machine creation. */
        rc = bus->hotplug(bus->hotplug_qdev, pci_dev,
                          qdev->hotplugged ? PCI_HOTPLUG_ENABLED:
                          PCI_COLDPLUG_ENABLED);
1762 1763 1764 1765 1766 1767
        if (rc != 0) {
            int r = pci_unregister_device(&pci_dev->qdev);
            assert(!r);
            return rc;
        }
    }
G
Gerd Hoffmann 已提交
1768 1769 1770 1771 1772
    return 0;
}

static int pci_unplug_device(DeviceState *qdev)
{
1773 1774
    PCIDevice *dev = PCI_DEVICE(qdev);
    PCIDeviceClass *pc = PCI_DEVICE_GET_CLASS(dev);
G
Gerd Hoffmann 已提交
1775

1776
    if (pc->no_hotplug) {
1777
        qerror_report(QERR_DEVICE_NO_HOTPLUG, object_get_typename(OBJECT(dev)));
1778 1779
        return -1;
    }
1780 1781
    return dev->bus->hotplug(dev->bus->hotplug_qdev, dev,
                             PCI_HOTPLUG_DISABLED);
P
Paul Brook 已提交
1782 1783
}

1784 1785
PCIDevice *pci_create_multifunction(PCIBus *bus, int devfn, bool multifunction,
                                    const char *name)
P
Paul Brook 已提交
1786 1787 1788
{
    DeviceState *dev;

P
Paul Brook 已提交
1789
    dev = qdev_create(&bus->qbus, name);
1790
    qdev_prop_set_int32(dev, "addr", devfn);
1791
    qdev_prop_set_bit(dev, "multifunction", multifunction);
1792
    return PCI_DEVICE(dev);
1793
}
P
Paul Brook 已提交
1794

1795 1796 1797
PCIDevice *pci_create_simple_multifunction(PCIBus *bus, int devfn,
                                           bool multifunction,
                                           const char *name)
1798
{
1799
    PCIDevice *dev = pci_create_multifunction(bus, devfn, multifunction, name);
M
Markus Armbruster 已提交
1800
    qdev_init_nofail(&dev->qdev);
1801
    return dev;
P
Paul Brook 已提交
1802
}
1803

1804 1805 1806 1807 1808 1809 1810 1811 1812 1813
PCIDevice *pci_create(PCIBus *bus, int devfn, const char *name)
{
    return pci_create_multifunction(bus, devfn, false, name);
}

PCIDevice *pci_create_simple(PCIBus *bus, int devfn, const char *name)
{
    return pci_create_simple_multifunction(bus, devfn, false, name);
}

1814
static uint8_t pci_find_space(PCIDevice *pdev, uint8_t size)
1815 1816 1817
{
    int offset = PCI_CONFIG_HEADER_SIZE;
    int i;
1818
    for (i = PCI_CONFIG_HEADER_SIZE; i < PCI_CONFIG_SPACE_SIZE; ++i) {
1819 1820 1821 1822
        if (pdev->used[i])
            offset = i + 1;
        else if (i - offset + 1 == size)
            return offset;
1823
    }
1824 1825 1826 1827 1828 1829 1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840 1841 1842 1843 1844
    return 0;
}

static uint8_t pci_find_capability_list(PCIDevice *pdev, uint8_t cap_id,
                                        uint8_t *prev_p)
{
    uint8_t next, prev;

    if (!(pdev->config[PCI_STATUS] & PCI_STATUS_CAP_LIST))
        return 0;

    for (prev = PCI_CAPABILITY_LIST; (next = pdev->config[prev]);
         prev = next + PCI_CAP_LIST_NEXT)
        if (pdev->config[next + PCI_CAP_LIST_ID] == cap_id)
            break;

    if (prev_p)
        *prev_p = prev;
    return next;
}

1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863
static uint8_t pci_find_capability_at_offset(PCIDevice *pdev, uint8_t offset)
{
    uint8_t next, prev, found = 0;

    if (!(pdev->used[offset])) {
        return 0;
    }

    assert(pdev->config[PCI_STATUS] & PCI_STATUS_CAP_LIST);

    for (prev = PCI_CAPABILITY_LIST; (next = pdev->config[prev]);
         prev = next + PCI_CAP_LIST_NEXT) {
        if (next <= offset && next > found) {
            found = next;
        }
    }
    return found;
}

1864 1865 1866 1867 1868 1869 1870 1871 1872 1873 1874 1875 1876 1877 1878 1879 1880 1881 1882 1883 1884 1885 1886 1887 1888 1889 1890 1891 1892 1893 1894 1895 1896 1897 1898 1899 1900 1901 1902 1903 1904 1905 1906 1907 1908 1909 1910 1911 1912 1913 1914 1915 1916 1917 1918 1919
/* Patch the PCI vendor and device ids in a PCI rom image if necessary.
   This is needed for an option rom which is used for more than one device. */
static void pci_patch_ids(PCIDevice *pdev, uint8_t *ptr, int size)
{
    uint16_t vendor_id;
    uint16_t device_id;
    uint16_t rom_vendor_id;
    uint16_t rom_device_id;
    uint16_t rom_magic;
    uint16_t pcir_offset;
    uint8_t checksum;

    /* Words in rom data are little endian (like in PCI configuration),
       so they can be read / written with pci_get_word / pci_set_word. */

    /* Only a valid rom will be patched. */
    rom_magic = pci_get_word(ptr);
    if (rom_magic != 0xaa55) {
        PCI_DPRINTF("Bad ROM magic %04x\n", rom_magic);
        return;
    }
    pcir_offset = pci_get_word(ptr + 0x18);
    if (pcir_offset + 8 >= size || memcmp(ptr + pcir_offset, "PCIR", 4)) {
        PCI_DPRINTF("Bad PCIR offset 0x%x or signature\n", pcir_offset);
        return;
    }

    vendor_id = pci_get_word(pdev->config + PCI_VENDOR_ID);
    device_id = pci_get_word(pdev->config + PCI_DEVICE_ID);
    rom_vendor_id = pci_get_word(ptr + pcir_offset + 4);
    rom_device_id = pci_get_word(ptr + pcir_offset + 6);

    PCI_DPRINTF("%s: ROM id %04x%04x / PCI id %04x%04x\n", pdev->romfile,
                vendor_id, device_id, rom_vendor_id, rom_device_id);

    checksum = ptr[6];

    if (vendor_id != rom_vendor_id) {
        /* Patch vendor id and checksum (at offset 6 for etherboot roms). */
        checksum += (uint8_t)rom_vendor_id + (uint8_t)(rom_vendor_id >> 8);
        checksum -= (uint8_t)vendor_id + (uint8_t)(vendor_id >> 8);
        PCI_DPRINTF("ROM checksum %02x / %02x\n", ptr[6], checksum);
        ptr[6] = checksum;
        pci_set_word(ptr + pcir_offset + 4, vendor_id);
    }

    if (device_id != rom_device_id) {
        /* Patch device id and checksum (at offset 6 for etherboot roms). */
        checksum += (uint8_t)rom_device_id + (uint8_t)(rom_device_id >> 8);
        checksum -= (uint8_t)device_id + (uint8_t)(device_id >> 8);
        PCI_DPRINTF("ROM checksum %02x / %02x\n", ptr[6], checksum);
        ptr[6] = checksum;
        pci_set_word(ptr + pcir_offset + 6, device_id);
    }
}

1920
/* Add an option rom for the device */
1921
static int pci_add_option_rom(PCIDevice *pdev, bool is_default_rom)
1922 1923 1924 1925
{
    int size;
    char *path;
    void *ptr;
1926
    char name[32];
A
Anthony Liguori 已提交
1927
    const VMStateDescription *vmsd;
1928

1929 1930 1931 1932 1933
    if (!pdev->romfile)
        return 0;
    if (strlen(pdev->romfile) == 0)
        return 0;

1934 1935 1936 1937 1938 1939 1940 1941 1942
    if (!pdev->rom_bar) {
        /*
         * Load rom via fw_cfg instead of creating a rom bar,
         * for 0.11 compatibility.
         */
        int class = pci_get_word(pdev->config + PCI_CLASS_DEVICE);
        if (class == 0x0300) {
            rom_add_vga(pdev->romfile);
        } else {
G
Gleb Natapov 已提交
1943
            rom_add_option(pdev->romfile, -1);
1944 1945 1946 1947
        }
        return 0;
    }

1948
    path = qemu_find_file(QEMU_FILE_TYPE_BIOS, pdev->romfile);
1949
    if (path == NULL) {
1950
        path = g_strdup(pdev->romfile);
1951 1952 1953
    }

    size = get_image_size(path);
1954
    if (size < 0) {
1955
        error_report("%s: failed to find romfile \"%s\"",
S
Stefan Hajnoczi 已提交
1956 1957 1958 1959 1960 1961
                     __func__, pdev->romfile);
        g_free(path);
        return -1;
    } else if (size == 0) {
        error_report("%s: ignoring empty romfile \"%s\"",
                     __func__, pdev->romfile);
1962
        g_free(path);
1963 1964
        return -1;
    }
1965 1966 1967 1968
    if (size & (size - 1)) {
        size = 1 << qemu_fls(size);
    }

A
Anthony Liguori 已提交
1969 1970 1971 1972 1973
    vmsd = qdev_get_vmsd(DEVICE(pdev));

    if (vmsd) {
        snprintf(name, sizeof(name), "%s.rom", vmsd->name);
    } else {
1974
        snprintf(name, sizeof(name), "%s.rom", object_get_typename(OBJECT(pdev)));
A
Anthony Liguori 已提交
1975
    }
A
Avi Kivity 已提交
1976
    pdev->has_rom = true;
1977
    memory_region_init_ram(&pdev->rom, OBJECT(pdev), name, size);
1978
    vmstate_register_ram(&pdev->rom, &pdev->qdev);
A
Avi Kivity 已提交
1979
    ptr = memory_region_get_ram_ptr(&pdev->rom);
1980
    load_image(path, ptr);
1981
    g_free(path);
1982

1983 1984 1985 1986 1987
    if (is_default_rom) {
        /* Only the default rom images will be patched (if needed). */
        pci_patch_ids(pdev, ptr, size);
    }

1988
    pci_register_bar(pdev, PCI_ROM_SLOT, 0, &pdev->rom);
1989 1990 1991 1992

    return 0;
}

1993 1994
static void pci_del_option_rom(PCIDevice *pdev)
{
A
Avi Kivity 已提交
1995
    if (!pdev->has_rom)
1996 1997
        return;

1998
    vmstate_unregister_ram(&pdev->rom, &pdev->qdev);
A
Avi Kivity 已提交
1999 2000
    memory_region_destroy(&pdev->rom);
    pdev->has_rom = false;
2001 2002
}

2003 2004 2005 2006 2007 2008 2009 2010 2011
/*
 * if !offset
 * Reserve space and add capability to the linked list in pci config space
 *
 * if offset = 0,
 * Find and reserve space and add capability to the linked list
 * in pci config space */
int pci_add_capability(PCIDevice *pdev, uint8_t cap_id,
                       uint8_t offset, uint8_t size)
2012
{
2013
    uint8_t *config;
2014 2015
    int i, overlapping_cap;

2016 2017 2018 2019 2020
    if (!offset) {
        offset = pci_find_space(pdev, size);
        if (!offset) {
            return -ENOSPC;
        }
2021 2022 2023 2024 2025 2026 2027 2028
    } else {
        /* Verify that capabilities don't overlap.  Note: device assignment
         * depends on this check to verify that the device is not broken.
         * Should never trigger for emulated devices, but it's helpful
         * for debugging these. */
        for (i = offset; i < offset + size; i++) {
            overlapping_cap = pci_find_capability_at_offset(pdev, i);
            if (overlapping_cap) {
2029
                fprintf(stderr, "ERROR: %s:%02x:%02x.%x "
2030 2031
                        "Attempt to add PCI capability %x at offset "
                        "%x overlaps existing capability %x at offset %x\n",
2032
                        pci_root_bus_path(pdev), pci_bus_num(pdev->bus),
2033 2034 2035 2036 2037
                        PCI_SLOT(pdev->devfn), PCI_FUNC(pdev->devfn),
                        cap_id, offset, overlapping_cap, i);
                return -EINVAL;
            }
        }
2038 2039 2040
    }

    config = pdev->config + offset;
2041 2042 2043 2044
    config[PCI_CAP_LIST_ID] = cap_id;
    config[PCI_CAP_LIST_NEXT] = pdev->config[PCI_CAPABILITY_LIST];
    pdev->config[PCI_CAPABILITY_LIST] = offset;
    pdev->config[PCI_STATUS] |= PCI_STATUS_CAP_LIST;
2045
    memset(pdev->used + offset, 0xFF, QEMU_ALIGN_UP(size, 4));
2046 2047
    /* Make capability read-only by default */
    memset(pdev->wmask + offset, 0, size);
2048 2049
    /* Check capability by default */
    memset(pdev->cmask + offset, 0xFF, size);
2050 2051 2052 2053 2054 2055 2056 2057 2058 2059
    return offset;
}

/* Unlink capability from the pci config space. */
void pci_del_capability(PCIDevice *pdev, uint8_t cap_id, uint8_t size)
{
    uint8_t prev, offset = pci_find_capability_list(pdev, cap_id, &prev);
    if (!offset)
        return;
    pdev->config[prev] = pdev->config[offset + PCI_CAP_LIST_NEXT];
S
Stefan Weil 已提交
2060
    /* Make capability writable again */
2061
    memset(pdev->wmask + offset, 0xff, size);
2062
    memset(pdev->w1cmask + offset, 0, size);
2063 2064
    /* Clear cmask as device-specific registers can't be checked */
    memset(pdev->cmask + offset, 0, size);
2065
    memset(pdev->used + offset, 0, QEMU_ALIGN_UP(size, 4));
2066 2067 2068 2069 2070 2071 2072 2073 2074

    if (!pdev->config[PCI_CAPABILITY_LIST])
        pdev->config[PCI_STATUS] &= ~PCI_STATUS_CAP_LIST;
}

uint8_t pci_find_capability(PCIDevice *pdev, uint8_t cap_id)
{
    return pci_find_capability_list(pdev, cap_id, NULL);
}
2075 2076 2077 2078 2079 2080 2081 2082 2083

static void pcibus_dev_print(Monitor *mon, DeviceState *dev, int indent)
{
    PCIDevice *d = (PCIDevice *)dev;
    const pci_class_desc *desc;
    char ctxt[64];
    PCIIORegion *r;
    int i, class;

2084
    class = pci_get_word(d->config + PCI_CLASS_DEVICE);
2085 2086 2087 2088 2089 2090 2091 2092 2093 2094 2095
    desc = pci_class_descriptions;
    while (desc->desc && class != desc->class)
        desc++;
    if (desc->desc) {
        snprintf(ctxt, sizeof(ctxt), "%s", desc->desc);
    } else {
        snprintf(ctxt, sizeof(ctxt), "Class %04x", class);
    }

    monitor_printf(mon, "%*sclass %s, addr %02x:%02x.%x, "
                   "pci id %04x:%04x (sub %04x:%04x)\n",
2096
                   indent, "", ctxt, pci_bus_num(d->bus),
2097
                   PCI_SLOT(d->devfn), PCI_FUNC(d->devfn),
2098 2099 2100 2101
                   pci_get_word(d->config + PCI_VENDOR_ID),
                   pci_get_word(d->config + PCI_DEVICE_ID),
                   pci_get_word(d->config + PCI_SUBSYSTEM_VENDOR_ID),
                   pci_get_word(d->config + PCI_SUBSYSTEM_ID));
2102 2103 2104 2105
    for (i = 0; i < PCI_NUM_REGIONS; i++) {
        r = &d->io_regions[i];
        if (!r->size)
            continue;
2106 2107 2108
        monitor_printf(mon, "%*sbar %d: %s at 0x%"FMT_PCIBUS
                       " [0x%"FMT_PCIBUS"]\n",
                       indent, "",
2109
                       i, r->type & PCI_BASE_ADDRESS_SPACE_IO ? "i/o" : "mem",
2110 2111 2112
                       r->addr, r->addr + r->size - 1);
    }
}
G
Gerd Hoffmann 已提交
2113

2114 2115 2116 2117 2118 2119 2120 2121 2122 2123 2124 2125 2126 2127 2128 2129 2130 2131 2132 2133 2134 2135 2136 2137 2138 2139 2140 2141 2142 2143 2144 2145 2146 2147 2148 2149 2150 2151 2152
static char *pci_dev_fw_name(DeviceState *dev, char *buf, int len)
{
    PCIDevice *d = (PCIDevice *)dev;
    const char *name = NULL;
    const pci_class_desc *desc =  pci_class_descriptions;
    int class = pci_get_word(d->config + PCI_CLASS_DEVICE);

    while (desc->desc &&
          (class & ~desc->fw_ign_bits) !=
          (desc->class & ~desc->fw_ign_bits)) {
        desc++;
    }

    if (desc->desc) {
        name = desc->fw_name;
    }

    if (name) {
        pstrcpy(buf, len, name);
    } else {
        snprintf(buf, len, "pci%04x,%04x",
                 pci_get_word(d->config + PCI_VENDOR_ID),
                 pci_get_word(d->config + PCI_DEVICE_ID));
    }

    return buf;
}

static char *pcibus_get_fw_dev_path(DeviceState *dev)
{
    PCIDevice *d = (PCIDevice *)dev;
    char path[50], name[33];
    int off;

    off = snprintf(path, sizeof(path), "%s@%x",
                   pci_dev_fw_name(dev, name, sizeof name),
                   PCI_SLOT(d->devfn));
    if (PCI_FUNC(d->devfn))
        snprintf(path + off, sizeof(path) + off, ",%x", PCI_FUNC(d->devfn));
2153
    return g_strdup(path);
2154 2155
}

2156 2157
static char *pcibus_get_dev_path(DeviceState *dev)
{
2158 2159 2160 2161 2162 2163 2164 2165
    PCIDevice *d = container_of(dev, PCIDevice, qdev);
    PCIDevice *t;
    int slot_depth;
    /* Path format: Domain:00:Slot.Function:Slot.Function....:Slot.Function.
     * 00 is added here to make this format compatible with
     * domain:Bus:Slot.Func for systems without nested PCI bridges.
     * Slot.Function list specifies the slot and function numbers for all
     * devices on the path from root to the specific device. */
2166 2167
    const char *root_bus_path;
    int root_bus_len;
M
Michael S. Tsirkin 已提交
2168 2169
    char slot[] = ":SS.F";
    int slot_len = sizeof slot - 1 /* For '\0' */;
2170 2171
    int path_len;
    char *path, *p;
M
Michael S. Tsirkin 已提交
2172
    int s;
2173

2174 2175 2176
    root_bus_path = pci_root_bus_path(d);
    root_bus_len = strlen(root_bus_path);

2177 2178 2179 2180 2181 2182
    /* Calculate # of slots on path between device and root. */;
    slot_depth = 0;
    for (t = d; t; t = t->bus->parent_dev) {
        ++slot_depth;
    }

2183
    path_len = root_bus_len + slot_len * slot_depth;
2184 2185

    /* Allocate memory, fill in the terminating null byte. */
2186
    path = g_malloc(path_len + 1 /* For '\0' */);
2187 2188
    path[path_len] = '\0';

2189
    memcpy(path, root_bus_path, root_bus_len);
2190 2191 2192 2193 2194 2195

    /* Fill in slot numbers. We walk up from device to root, so need to print
     * them in the reverse order, last to first. */
    p = path + path_len;
    for (t = d; t; t = t->bus->parent_dev) {
        p -= slot_len;
M
Michael S. Tsirkin 已提交
2196
        s = snprintf(slot, sizeof slot, ":%02x.%x",
2197
                     PCI_SLOT(t->devfn), PCI_FUNC(t->devfn));
M
Michael S. Tsirkin 已提交
2198 2199
        assert(s == slot_len);
        memcpy(p, slot, slot_len);
2200 2201 2202
    }

    return path;
2203 2204
}

2205 2206 2207 2208 2209 2210 2211 2212 2213
static int pci_qdev_find_recursive(PCIBus *bus,
                                   const char *id, PCIDevice **pdev)
{
    DeviceState *qdev = qdev_find_recursive(&bus->qbus, id);
    if (!qdev) {
        return -ENODEV;
    }

    /* roughly check if given qdev is pci device */
A
Anthony Liguori 已提交
2214
    if (object_dynamic_cast(OBJECT(qdev), TYPE_PCI_DEVICE)) {
2215
        *pdev = PCI_DEVICE(qdev);
2216 2217 2218 2219 2220 2221 2222
        return 0;
    }
    return -EINVAL;
}

int pci_qdev_find_device(const char *id, PCIDevice **pdev)
{
2223
    PCIHostState *host_bridge;
2224 2225
    int rc = -ENODEV;

2226 2227
    QLIST_FOREACH(host_bridge, &pci_host_bridges, next) {
        int tmp = pci_qdev_find_recursive(host_bridge->bus, id, pdev);
2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238
        if (!tmp) {
            rc = 0;
            break;
        }
        if (tmp != -ENODEV) {
            rc = tmp;
        }
    }

    return rc;
}
A
Avi Kivity 已提交
2239 2240 2241 2242 2243

MemoryRegion *pci_address_space(PCIDevice *dev)
{
    return dev->bus->address_space_mem;
}
2244 2245 2246 2247 2248

MemoryRegion *pci_address_space_io(PCIDevice *dev)
{
    return dev->bus->address_space_io;
}
2249

2250 2251 2252 2253 2254 2255
static void pci_device_class_init(ObjectClass *klass, void *data)
{
    DeviceClass *k = DEVICE_CLASS(klass);
    k->init = pci_qdev_init;
    k->unplug = pci_unplug_device;
    k->exit = pci_unregister_device;
2256
    k->bus_type = TYPE_PCI_BUS;
2257
    k->props = pci_props;
2258 2259
}

2260 2261 2262 2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273 2274 2275 2276
AddressSpace *pci_device_iommu_address_space(PCIDevice *dev)
{
    PCIBus *bus = PCI_BUS(dev->bus);

    if (bus->iommu_fn) {
        return bus->iommu_fn(bus, bus->iommu_opaque, dev->devfn);
    }

    if (bus->parent_dev) {
        /** We are ignoring the bus master DMA bit of the bridge
         *  as it would complicate things such as VFIO for no good reason */
        return pci_device_iommu_address_space(bus->parent_dev);
    }

    return &address_space_memory;
}

2277
void pci_setup_iommu(PCIBus *bus, PCIIOMMUFunc fn, void *opaque)
2278
{
2279 2280
    bus->iommu_fn = fn;
    bus->iommu_opaque = opaque;
2281 2282
}

2283 2284 2285 2286 2287
static void pci_dev_get_w64(PCIBus *b, PCIDevice *dev, void *opaque)
{
    Range *range = opaque;
    PCIDeviceClass *pc = PCI_DEVICE_GET_CLASS(dev);
    uint16_t cmd = pci_get_word(dev->config + PCI_COMMAND);
2288
    int i;
2289 2290 2291 2292 2293 2294 2295 2296 2297 2298 2299 2300 2301 2302 2303 2304 2305 2306

    if (!(cmd & PCI_COMMAND_MEMORY)) {
        return;
    }

    if (pc->is_bridge) {
        pcibus_t base = pci_bridge_get_base(dev, PCI_BASE_ADDRESS_MEM_PREFETCH);
        pcibus_t limit = pci_bridge_get_limit(dev, PCI_BASE_ADDRESS_MEM_PREFETCH);

        base = MAX(base, 0x1ULL << 32);

        if (limit >= base) {
            Range pref_range;
            pref_range.begin = base;
            pref_range.end = limit + 1;
            range_extend(range, &pref_range);
        }
    }
2307 2308
    for (i = 0; i < PCI_NUM_REGIONS; ++i) {
        PCIIORegion *r = &dev->io_regions[i];
2309 2310
        Range region_range;

2311 2312 2313 2314 2315 2316 2317 2318 2319
        if (!r->size ||
            (r->type & PCI_BASE_ADDRESS_SPACE_IO) ||
            !(r->type & PCI_BASE_ADDRESS_MEM_TYPE_64)) {
            continue;
        }
        region_range.begin = pci_bar_address(dev, i, r->type, r->size);
        region_range.end = region_range.begin + r->size;

        if (region_range.begin == PCI_BAR_UNMAPPED) {
2320 2321 2322 2323 2324 2325 2326 2327 2328 2329 2330 2331 2332 2333 2334 2335 2336
            continue;
        }

        region_range.begin = MAX(region_range.begin, 0x1ULL << 32);

        if (region_range.end - 1 >= region_range.begin) {
            range_extend(range, &region_range);
        }
    }
}

void pci_bus_get_w64_range(PCIBus *bus, Range *range)
{
    range->begin = range->end = 0;
    pci_for_each_device_under_bus(bus, pci_dev_get_w64, range);
}

2337
static const TypeInfo pci_device_type_info = {
2338 2339 2340 2341 2342
    .name = TYPE_PCI_DEVICE,
    .parent = TYPE_DEVICE,
    .instance_size = sizeof(PCIDevice),
    .abstract = true,
    .class_size = sizeof(PCIDeviceClass),
2343
    .class_init = pci_device_class_init,
2344 2345
};

A
Andreas Färber 已提交
2346
static void pci_register_types(void)
2347
{
2348
    type_register_static(&pci_bus_info);
2349
    type_register_static(&pcie_bus_info);
2350 2351 2352
    type_register_static(&pci_device_type_info);
}

A
Andreas Färber 已提交
2353
type_init(pci_register_types)