/*
 * Physical memory management
 *
 * Copyright 2011 Red Hat, Inc. and/or its affiliates
 *
 * Authors:
 *  Avi Kivity <avi@redhat.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 * Contributions after 2012-01-13 are licensed under the terms of the
 * GNU GPL, version 2 or (at your option) any later version.
 */

16 17 18
#include "exec/memory.h"
#include "exec/address-spaces.h"
#include "exec/ioport.h"
19
#include "qapi/visitor.h"
20
#include "qemu/bitops.h"
21
#include "qom/object.h"
22
#include "trace.h"
A
Avi Kivity 已提交
23 24
#include <assert.h>

25
#include "exec/memory-internal.h"
26
#include "exec/ram_addr.h"
27
#include "sysemu/sysemu.h"
28

29 30
//#define DEBUG_UNASSIGNED

31 32
static unsigned memory_region_transaction_depth;
static bool memory_region_update_pending;
33
static bool ioeventfd_update_pending;
34 35
static bool global_dirty_log = false;

36 37
static QTAILQ_HEAD(memory_listeners, MemoryListener) memory_listeners
    = QTAILQ_HEAD_INITIALIZER(memory_listeners);
A
Avi Kivity 已提交
38

39 40 41
static QTAILQ_HEAD(, AddressSpace) address_spaces
    = QTAILQ_HEAD_INITIALIZER(address_spaces);

A
Avi Kivity 已提交
42 43
typedef struct AddrRange AddrRange;

A
Avi Kivity 已提交
44
/*
45
 * Note that signed integers are needed for negative offsetting in aliases
A
Avi Kivity 已提交
46 47
 * (large MemoryRegion::alias_offset).
 */
A
Avi Kivity 已提交
48
struct AddrRange {
49 50
    Int128 start;
    Int128 size;
A
Avi Kivity 已提交
51 52
};

53
/* Build an AddrRange that begins at @start and has length @size. */
static AddrRange addrrange_make(Int128 start, Int128 size)
{
    /* Designated initializers keep this correct if the fields are reordered. */
    return (AddrRange) { .start = start, .size = size };
}

/* Return true when @r1 and @r2 have the same start and the same size. */
static bool addrrange_equal(AddrRange r1, AddrRange r2)
{
    return int128_eq(r1.start, r2.start) && int128_eq(r1.size, r2.size);
}

63
/* Return the exclusive end of @r, i.e. r.start + r.size. */
static Int128 addrrange_end(AddrRange r)
{
    return int128_add(r.start, r.size);
}

68
/* Return a copy of @range whose start is moved by @delta; the size is
 * unchanged.  @range is received by value, so the caller's object is not
 * modified.
 */
static AddrRange addrrange_shift(AddrRange range, Int128 delta)
{
    int128_addto(&range.start, delta);
    return range;
}

74 75 76 77 78 79
/* Return true when @addr falls inside the half-open interval
 * [range.start, addrrange_end(range)).
 */
static bool addrrange_contains(AddrRange range, Int128 addr)
{
    /* Below the start: cannot be inside. */
    if (!int128_ge(addr, range.start)) {
        return false;
    }
    /* At or above the start: inside only if strictly below the end. */
    return int128_lt(addr, addrrange_end(range));
}

A
Avi Kivity 已提交
80 81
/* Return true when @r1 and @r2 overlap.  Implemented by checking whether
 * either range contains the start of the other.
 */
static bool addrrange_intersects(AddrRange r1, AddrRange r2)
{
    return addrrange_contains(r1, r2.start)
        || addrrange_contains(r2, r1.start);
}

/* Return the range common to @r1 and @r2: it starts at the larger of the
 * two starts and ends at the smaller of the two ends.  No check is made
 * here that the ranges actually overlap; render_memory_region() tests
 * addrrange_intersects() before calling this.
 */
static AddrRange addrrange_intersection(AddrRange r1, AddrRange r2)
{
    Int128 start = int128_max(r1.start, r2.start);
    Int128 end = int128_min(addrrange_end(r1), addrrange_end(r2));
    return addrrange_make(start, int128_sub(end, start));
}

93 94
/* Traversal order for the MEMORY_LISTENER_CALL* macros: Forward walks the
 * listener list with QTAILQ_FOREACH, Reverse with QTAILQ_FOREACH_REVERSE.
 */
enum ListenerDirection {
    Forward,
    Reverse
};

95 96 97 98 99 100 101 102
/* Decide whether @listener should be told about @section: a listener
 * without an address_space_filter matches everything, otherwise the filter
 * must be the section's address space.
 */
static bool memory_listener_match(MemoryListener *listener,
                                  MemoryRegionSection *section)
{
    if (!listener->address_space_filter) {
        return true;
    }
    return listener->address_space_filter == section->address_space;
}

/* Invoke @_callback on every registered listener that provides it, passing
 * the listener itself followed by @_args.  @_direction selects the
 * traversal (Forward: QTAILQ_FOREACH, Reverse: QTAILQ_FOREACH_REVERSE);
 * any other value aborts.
 */
#define MEMORY_LISTENER_CALL_GLOBAL(_callback, _direction, _args...)    \
    do {                                                                \
        MemoryListener *_listener;                                      \
                                                                        \
        switch (_direction) {                                           \
        case Forward:                                                   \
            QTAILQ_FOREACH(_listener, &memory_listeners, link) {        \
                if (_listener->_callback) {                             \
                    _listener->_callback(_listener, ##_args);           \
                }                                                       \
            }                                                           \
            break;                                                      \
        case Reverse:                                                   \
            QTAILQ_FOREACH_REVERSE(_listener, &memory_listeners,        \
                                   memory_listeners, link) {            \
                if (_listener->_callback) {                             \
                    _listener->_callback(_listener, ##_args);           \
                }                                                       \
            }                                                           \
            break;                                                      \
        default:                                                        \
            abort();                                                    \
        }                                                               \
    } while (0)

127 128 129 130 131 132 133
/* Like MEMORY_LISTENER_CALL_GLOBAL, but scoped to a section: @_callback is
 * invoked only on listeners that provide it AND for which
 * memory_listener_match(listener, @_section) holds.  The callback receives
 * the listener, @_section and then @_args.  An unknown @_direction aborts.
 */
#define MEMORY_LISTENER_CALL(_callback, _direction, _section, _args...) \
    do {                                                                \
        MemoryListener *_listener;                                      \
                                                                        \
        switch (_direction) {                                           \
        case Forward:                                                   \
            QTAILQ_FOREACH(_listener, &memory_listeners, link) {        \
                if (_listener->_callback                                \
                    && memory_listener_match(_listener, _section)) {    \
                    _listener->_callback(_listener, _section, ##_args); \
                }                                                       \
            }                                                           \
            break;                                                      \
        case Reverse:                                                   \
            QTAILQ_FOREACH_REVERSE(_listener, &memory_listeners,        \
                                   memory_listeners, link) {            \
                if (_listener->_callback                                \
                    && memory_listener_match(_listener, _section)) {    \
                    _listener->_callback(_listener, _section, ##_args); \
                }                                                       \
            }                                                           \
            break;                                                      \
        default:                                                        \
            abort();                                                    \
        }                                                               \
    } while (0)

P
Paolo Bonzini 已提交
154
/* Call @callback through MEMORY_LISTENER_CALL with a temporary
 * MemoryRegionSection built from FlatRange @fr and address space @as.
 *
 * No need to ref/unref .mr, the FlatRange keeps it alive.
 */
#define MEMORY_LISTENER_UPDATE_REGION(fr, as, dir, callback)            \
    MEMORY_LISTENER_CALL(callback, dir, (&(MemoryRegionSection) {       \
        .mr = (fr)->mr,                                                 \
        .address_space = (as),                                          \
        .offset_within_region = (fr)->offset_in_region,                 \
        .size = (fr)->addr.size,                                        \
        .offset_within_address_space = int128_get64((fr)->addr.start),  \
        .readonly = (fr)->readonly,                                     \
              }))
164

A
Avi Kivity 已提交
165 166 167 168 169
/* One address range that can be chained on a tail queue through @link.
 * NOTE(review): presumably describes a range with coalesced MMIO enabled;
 * the users are outside this part of the file -- confirm.
 */
struct CoalescedMemoryRange {
    /* The range itself. */
    AddrRange addr;
    /* Tail-queue linkage. */
    QTAILQ_ENTRY(CoalescedMemoryRange) link;
};

A
Avi Kivity 已提交
170 171 172 173
struct MemoryRegionIoeventfd {
    AddrRange addr;
    bool match_data;
    uint64_t data;
174
    EventNotifier *e;
A
Avi Kivity 已提交
175 176 177 178 179
};

/* Strict ordering of ioeventfd descriptions: return true when @a sorts
 * before @b.  Keys are compared in this order: range start, range size,
 * match_data, data (only when match_data is set), and finally the notifier
 * pointer.  Returns false when the two are equal on every key.
 */
static bool memory_region_ioeventfd_before(MemoryRegionIoeventfd a,
                                           MemoryRegionIoeventfd b)
{
    if (int128_lt(a.addr.start, b.addr.start)) {
        return true;
    } else if (int128_gt(a.addr.start, b.addr.start)) {
        return false;
    } else if (int128_lt(a.addr.size, b.addr.size)) {
        return true;
    } else if (int128_gt(a.addr.size, b.addr.size)) {
        return false;
    } else if (a.match_data < b.match_data) {
        return true;
    } else if (a.match_data > b.match_data) {
        return false;
    } else if (a.match_data) {
        /* Both match on data: the data value is the next key. */
        if (a.data < b.data) {
            return true;
        } else if (a.data > b.data) {
            return false;
        }
    }
    /* Last key: the notifier pointer.  Equal pointers mean "not before". */
    return a.e < b.e;
}

/* Two ioeventfd descriptions are equal when neither one sorts before the
 * other according to memory_region_ioeventfd_before().
 */
static bool memory_region_ioeventfd_equal(MemoryRegionIoeventfd a,
                                          MemoryRegionIoeventfd b)
{
    if (memory_region_ioeventfd_before(a, b)) {
        return false;
    }
    return !memory_region_ioeventfd_before(b, a);
}

A
Avi Kivity 已提交
214 215 216 217 218 219
typedef struct FlatRange FlatRange;
typedef struct FlatView FlatView;

/* Range of memory in the global map.  Addresses are absolute. */
struct FlatRange {
    MemoryRegion *mr;
A
Avi Kivity 已提交
220
    hwaddr offset_in_region;
A
Avi Kivity 已提交
221
    AddrRange addr;
A
Avi Kivity 已提交
222
    uint8_t dirty_log_mask;
223
    bool romd_mode;
224
    bool readonly;
A
Avi Kivity 已提交
225 226 227 228 229 230
};

/* Flattened global view of current active memory hierarchy.  Kept in sorted
 * order.
 */
struct FlatView {
231
    struct rcu_head rcu;
232
    unsigned ref;
A
Avi Kivity 已提交
233 234 235 236 237
    FlatRange *ranges;
    unsigned nr;
    unsigned nr_allocated;
};

238 239
/* Forward declaration only; the structure is not defined in this part of
 * the file.
 */
typedef struct AddressSpaceOps AddressSpaceOps;

A
Avi Kivity 已提交
240 241 242 243 244 245 246
/* Loop header that steps pointer @var over view->ranges[0 .. view->nr - 1]
 * in index order.  @view is evaluated on every iteration.
 */
#define FOR_EACH_FLAT_RANGE(var, view)                                  \
    for (var = (view)->ranges;                                          \
         var < (view)->ranges + (view)->nr;                             \
         ++var)

/* Return true when @a and @b describe the same mapping: same region, same
 * address range, same offset into the region and same romd/readonly
 * attributes.  dirty_log_mask is deliberately not part of the comparison;
 * address_space_update_topology_pass() handles logging changes separately.
 */
static bool flatrange_equal(FlatRange *a, FlatRange *b)
{
    return a->mr == b->mr
        && addrrange_equal(a->addr, b->addr)
        && a->offset_in_region == b->offset_in_region
        && a->romd_mode == b->romd_mode
        && a->readonly == b->readonly;
}

/* Initialise @view as an empty view holding a single reference (owned by
 * the caller).
 */
static void flatview_init(FlatView *view)
{
    view->ref = 1;
    view->ranges = NULL;
    view->nr = 0;
    view->nr_allocated = 0;
}

/* Insert a range into a given position.  Caller is responsible for maintaining
 * sorting order.
 *
 * *@range is copied into the view and a reference is taken on range->mr.
 * The backing array is grown (doubling, with a minimum of 10 entries) when
 * it is full.
 */
static void flatview_insert(FlatView *view, unsigned pos, FlatRange *range)
{
    if (view->nr == view->nr_allocated) {
        view->nr_allocated = MAX(2 * view->nr, 10);
        view->ranges = g_realloc(view->ranges,
                                 view->nr_allocated * sizeof(*view->ranges));
    }
    /* Open a one-element hole at @pos. */
    memmove(view->ranges + pos + 1, view->ranges + pos,
            (view->nr - pos) * sizeof(*view->ranges));
    view->ranges[pos] = *range;
    memory_region_ref(range->mr);
    ++view->nr;
}

/* Release everything owned by @view: the reference each range holds on its
 * MemoryRegion, the range array, and the view object itself.
 */
static void flatview_destroy(FlatView *view)
{
    unsigned i;     /* same type as view->nr: no signed/unsigned compare */

    for (i = 0; i < view->nr; i++) {
        memory_region_unref(view->ranges[i].mr);
    }
    g_free(view->ranges);
    g_free(view);
}

288 289 290 291 292 293 294 295 296 297 298 299
/* Take one more reference on @view (atomic increment of view->ref). */
static void flatview_ref(FlatView *view)
{
    unsigned *refcount = &view->ref;

    atomic_inc(refcount);
}

/* Drop one reference on @view; whoever drops the last one (the counter was
 * 1 before the decrement) destroys the view.
 */
static void flatview_unref(FlatView *view)
{
    if (atomic_fetch_dec(&view->ref) != 1) {
        /* Other references remain. */
        return;
    }
    flatview_destroy(view);
}

300 301
/* Return true when @r2 can be folded into @r1: @r2 starts exactly where @r1
 * ends, both map the same region at contiguous region offsets, and they
 * share dirty_log_mask, romd_mode and readonly.
 */
static bool can_merge(FlatRange *r1, FlatRange *r2)
{
    return int128_eq(addrrange_end(r1->addr), r2->addr.start)
        && r1->mr == r2->mr
        && int128_eq(int128_add(int128_make64(r1->offset_in_region),
                                r1->addr.size),
                     int128_make64(r2->offset_in_region))
        && r1->dirty_log_mask == r2->dirty_log_mask
        && r1->romd_mode == r2->romd_mode
        && r1->readonly == r2->readonly;
}

P
Peter Crosthwaite 已提交
312
/* Attempt to simplify a view by merging adjacent ranges */
313 314 315 316 317 318 319 320 321
static void flatview_simplify(FlatView *view)
{
    unsigned i, j;

    i = 0;
    while (i < view->nr) {
        j = i + 1;
        while (j < view->nr
               && can_merge(&view->ranges[j-1], &view->ranges[j])) {
322
            int128_addto(&view->ranges[i].addr.size, view->ranges[j].addr.size);
323 324 325 326 327 328 329 330 331
            ++j;
        }
        ++i;
        memmove(&view->ranges[i], &view->ranges[j],
                (view->nr - j) * sizeof(view->ranges[j]));
        view->nr -= j - i;
    }
}

332 333 334 335 336 337 338 339 340
/* Return true when accesses to @mr are to be treated as big-endian.  On a
 * TARGET_WORDS_BIGENDIAN build that is every endianness except
 * DEVICE_LITTLE_ENDIAN; otherwise only DEVICE_BIG_ENDIAN.
 */
static bool memory_region_big_endian(MemoryRegion *mr)
{
    bool big;

#ifdef TARGET_WORDS_BIGENDIAN
    big = (mr->ops->endianness != DEVICE_LITTLE_ENDIAN);
#else
    big = (mr->ops->endianness == DEVICE_BIG_ENDIAN);
#endif
    return big;
}

P
Paolo Bonzini 已提交
341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370
/* Return true when @mr explicitly declares the endianness opposite to the
 * build's: DEVICE_LITTLE_ENDIAN on a TARGET_WORDS_BIGENDIAN build,
 * DEVICE_BIG_ENDIAN otherwise.
 */
static bool memory_region_wrong_endianness(MemoryRegion *mr)
{
    bool mismatch;

#ifdef TARGET_WORDS_BIGENDIAN
    mismatch = (mr->ops->endianness == DEVICE_LITTLE_ENDIAN);
#else
    mismatch = (mr->ops->endianness == DEVICE_BIG_ENDIAN);
#endif
    return mismatch;
}

/* Byte-swap *@data in place when @mr has the "wrong" endianness (see
 * memory_region_wrong_endianness()).  @size is the access width in bytes
 * and must be 1, 2, 4 or 8; any other value aborts.  Nothing is checked or
 * changed when no swap is needed.
 */
static void adjust_endianness(MemoryRegion *mr, uint64_t *data, unsigned size)
{
    if (!memory_region_wrong_endianness(mr)) {
        return;
    }

    if (size == 1) {
        /* A single byte has no byte order. */
    } else if (size == 2) {
        *data = bswap16(*data);
    } else if (size == 4) {
        *data = bswap32(*data);
    } else if (size == 8) {
        *data = bswap64(*data);
    } else {
        abort();
    }
}

371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387
/* Read accessor for regions that use the old_mmio callback table.  The
 * handler is selected by ctz32(@size); the value it returns is traced,
 * masked with @mask, shifted left by @shift and OR-ed into *@value.
 * @attrs is not used.  Always returns MEMTX_OK.
 */
static MemTxResult memory_region_oldmmio_read_accessor(MemoryRegion *mr,
                                                       hwaddr addr,
                                                       uint64_t *value,
                                                       unsigned size,
                                                       unsigned shift,
                                                       uint64_t mask,
                                                       MemTxAttrs attrs)
{
    uint64_t raw = mr->ops->old_mmio.read[ctz32(size)](mr->opaque, addr);

    trace_memory_region_ops_read(mr, addr, raw, size);
    *value |= (raw & mask) << shift;
    return MEMTX_OK;
}

static MemTxResult  memory_region_read_accessor(MemoryRegion *mr,
388 389 390 391
                                                hwaddr addr,
                                                uint64_t *value,
                                                unsigned size,
                                                unsigned shift,
392 393
                                                uint64_t mask,
                                                MemTxAttrs attrs)
394 395 396
{
    uint64_t tmp;

397 398 399 400
    if (mr->flush_coalesced_mmio) {
        qemu_flush_coalesced_mmio_buffer();
    }
    tmp = mr->ops->read(mr->opaque, addr, size);
401
    trace_memory_region_ops_read(mr, addr, tmp, size);
402
    *value |= (tmp & mask) << shift;
403
    return MEMTX_OK;
404 405
}

406 407 408 409 410 411 412
/* Read accessor for regions that implement ops->read_with_attrs.  Same
 * merging of the result into *@value as memory_region_read_accessor(), but
 * @attrs is forwarded to the handler and the handler's MemTxResult is
 * returned.  The temporary starts at 0, so that is what gets merged if the
 * handler does not store a value.
 */
static MemTxResult memory_region_read_with_attrs_accessor(MemoryRegion *mr,
                                                          hwaddr addr,
                                                          uint64_t *value,
                                                          unsigned size,
                                                          unsigned shift,
                                                          uint64_t mask,
                                                          MemTxAttrs attrs)
{
    uint64_t tmp = 0;
    MemTxResult r;

    if (mr->flush_coalesced_mmio) {
        qemu_flush_coalesced_mmio_buffer();
    }
    r = mr->ops->read_with_attrs(mr->opaque, addr, &tmp, size, attrs);
    trace_memory_region_ops_read(mr, addr, tmp, size);
    *value |= (tmp & mask) << shift;
    return r;
}

426 427 428 429 430 431 432
/* Write accessor for regions that use the old_mmio callback table.
 * Extracts the piece to write from *@value (shift right by @shift, then
 * mask with @mask), traces it and passes it to the handler selected by
 * ctz32(@size).  @attrs is not used.  Always returns MEMTX_OK.
 */
static MemTxResult memory_region_oldmmio_write_accessor(MemoryRegion *mr,
                                                        hwaddr addr,
                                                        uint64_t *value,
                                                        unsigned size,
                                                        unsigned shift,
                                                        uint64_t mask,
                                                        MemTxAttrs attrs)
{
    uint64_t tmp;

    tmp = (*value >> shift) & mask;
    trace_memory_region_ops_write(mr, addr, tmp, size);
    mr->ops->old_mmio.write[ctz32(size)](mr->opaque, addr, tmp);
    return MEMTX_OK;
}

442 443 444 445 446 447 448
/* Write accessor for regions that implement ops->write.  Flushes the
 * coalesced MMIO buffer first when the region asks for it, extracts the
 * piece to write from *@value (shift right by @shift, then mask with
 * @mask), traces it and hands it to the handler.  @attrs is not used.
 * Always returns MEMTX_OK.
 */
static MemTxResult memory_region_write_accessor(MemoryRegion *mr,
                                                hwaddr addr,
                                                uint64_t *value,
                                                unsigned size,
                                                unsigned shift,
                                                uint64_t mask,
                                                MemTxAttrs attrs)
{
    uint64_t tmp;

    if (mr->flush_coalesced_mmio) {
        qemu_flush_coalesced_mmio_buffer();
    }
    tmp = (*value >> shift) & mask;
    trace_memory_region_ops_write(mr, addr, tmp, size);
    mr->ops->write(mr->opaque, addr, tmp, size);
    return MEMTX_OK;
}

461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479
/* Write accessor for regions that implement ops->write_with_attrs.  After
 * an optional coalesced-MMIO flush, the piece to write is taken from
 * *@value (shift right by @shift, mask with @mask), traced, and passed to
 * the handler together with @attrs.  Returns the handler's result.
 */
static MemTxResult memory_region_write_with_attrs_accessor(MemoryRegion *mr,
                                                           hwaddr addr,
                                                           uint64_t *value,
                                                           unsigned size,
                                                           unsigned shift,
                                                           uint64_t mask,
                                                           MemTxAttrs attrs)
{
    uint64_t piece;
    MemTxResult result;

    if (mr->flush_coalesced_mmio) {
        qemu_flush_coalesced_mmio_buffer();
    }

    piece = (*value >> shift) & mask;
    trace_memory_region_ops_write(mr, addr, piece, size);

    result = mr->ops->write_with_attrs(mr->opaque, addr, piece, size, attrs);
    return result;
}

/* Perform an access of @size bytes at @addr as a sequence of smaller (or
 * larger) accesses that fit the device's limits.
 *
 * The per-call width is @size clamped to
 * [@access_size_min, @access_size_max]; a limit given as 0 defaults to 1
 * (minimum) or 4 (maximum).  @access is called once per piece with the
 * piece's address, the bit shift of that piece inside *@value and a mask
 * of the piece's width.  For big-endian regions (see
 * memory_region_big_endian()) the first piece is the most significant one;
 * otherwise it is the least significant one.
 *
 * Returns the bitwise OR of the results of all @access calls.
 */
static MemTxResult access_with_adjusted_size(hwaddr addr,
                                      uint64_t *value,
                                      unsigned size,
                                      unsigned access_size_min,
                                      unsigned access_size_max,
                                      MemTxResult (*access)(MemoryRegion *mr,
                                                            hwaddr addr,
                                                            uint64_t *value,
                                                            unsigned size,
                                                            unsigned shift,
                                                            uint64_t mask,
                                                            MemTxAttrs attrs),
                                      MemoryRegion *mr,
                                      MemTxAttrs attrs)
{
    uint64_t access_mask;
    unsigned access_size;
    unsigned i;
    MemTxResult r = MEMTX_OK;

    if (!access_size_min) {
        access_size_min = 1;
    }
    if (!access_size_max) {
        access_size_max = 4;
    }

    /* FIXME: support unaligned access? */
    access_size = MAX(MIN(size, access_size_max), access_size_min);
    /* All-ones mask that is access_size bytes wide. */
    access_mask = -1ULL >> (64 - access_size * 8);
    if (memory_region_big_endian(mr)) {
        for (i = 0; i < size; i += access_size) {
            r |= access(mr, addr + i, value, access_size,
                        (size - access_size - i) * 8, access_mask, attrs);
        }
    } else {
        for (i = 0; i < size; i += access_size) {
            r |= access(mr, addr + i, value, access_size, i * 8,
                        access_mask, attrs);
        }
    }
    return r;
}

523 524
/* Find the address space whose root is the top-level container of @mr.
 * Walks up the ->container chain, then searches the global address_spaces
 * list.  Returns NULL when no address space has that region as its root.
 */
static AddressSpace *memory_region_to_address_space(MemoryRegion *mr)
{
    AddressSpace *as;

    while (mr->container) {
        mr = mr->container;
    }
    QTAILQ_FOREACH(as, &address_spaces, address_spaces_link) {
        if (mr == as->root) {
            return as;
        }
    }
    return NULL;
}

A
Avi Kivity 已提交
538 539 540 541 542
/* Render a memory region into the global view.  Ranges in @view obscure
 * ranges in @mr.
 */
static void render_memory_region(FlatView *view,
                                 MemoryRegion *mr,
543
                                 Int128 base,
544 545
                                 AddrRange clip,
                                 bool readonly)
A
Avi Kivity 已提交
546 547 548
{
    MemoryRegion *subregion;
    unsigned i;
A
Avi Kivity 已提交
549
    hwaddr offset_in_region;
550 551
    Int128 remain;
    Int128 now;
A
Avi Kivity 已提交
552 553 554
    FlatRange fr;
    AddrRange tmp;

555 556 557 558
    if (!mr->enabled) {
        return;
    }

559
    int128_addto(&base, int128_make64(mr->addr));
560
    readonly |= mr->readonly;
A
Avi Kivity 已提交
561 562 563 564 565 566 567 568 569 570

    tmp = addrrange_make(base, mr->size);

    if (!addrrange_intersects(tmp, clip)) {
        return;
    }

    clip = addrrange_intersection(tmp, clip);

    if (mr->alias) {
571 572
        int128_subfrom(&base, int128_make64(mr->alias->addr));
        int128_subfrom(&base, int128_make64(mr->alias_offset));
573
        render_memory_region(view, mr->alias, base, clip, readonly);
A
Avi Kivity 已提交
574 575 576 577 578
        return;
    }

    /* Render subregions in priority order. */
    QTAILQ_FOREACH(subregion, &mr->subregions, subregions_link) {
579
        render_memory_region(view, subregion, base, clip, readonly);
A
Avi Kivity 已提交
580 581
    }

582
    if (!mr->terminates) {
A
Avi Kivity 已提交
583 584 585
        return;
    }

586
    offset_in_region = int128_get64(int128_sub(clip.start, base));
A
Avi Kivity 已提交
587 588 589
    base = clip.start;
    remain = clip.size;

590 591 592 593 594
    fr.mr = mr;
    fr.dirty_log_mask = mr->dirty_log_mask;
    fr.romd_mode = mr->romd_mode;
    fr.readonly = readonly;

A
Avi Kivity 已提交
595
    /* Render the region itself into any gaps left by the current view. */
596 597
    for (i = 0; i < view->nr && int128_nz(remain); ++i) {
        if (int128_ge(base, addrrange_end(view->ranges[i].addr))) {
A
Avi Kivity 已提交
598 599
            continue;
        }
600 601 602
        if (int128_lt(base, view->ranges[i].addr.start)) {
            now = int128_min(remain,
                             int128_sub(view->ranges[i].addr.start, base));
A
Avi Kivity 已提交
603 604 605 606
            fr.offset_in_region = offset_in_region;
            fr.addr = addrrange_make(base, now);
            flatview_insert(view, i, &fr);
            ++i;
607 608 609
            int128_addto(&base, now);
            offset_in_region += int128_get64(now);
            int128_subfrom(&remain, now);
A
Avi Kivity 已提交
610
        }
611 612 613 614 615 616
        now = int128_sub(int128_min(int128_add(base, remain),
                                    addrrange_end(view->ranges[i].addr)),
                         base);
        int128_addto(&base, now);
        offset_in_region += int128_get64(now);
        int128_subfrom(&remain, now);
A
Avi Kivity 已提交
617
    }
618
    if (int128_nz(remain)) {
A
Avi Kivity 已提交
619 620 621 622 623 624 625
        fr.offset_in_region = offset_in_region;
        fr.addr = addrrange_make(base, remain);
        flatview_insert(view, i, &fr);
    }
}

/* Render a memory topology into a list of disjoint absolute ranges. */
626
static FlatView *generate_memory_topology(MemoryRegion *mr)
A
Avi Kivity 已提交
627
{
628
    FlatView *view;
A
Avi Kivity 已提交
629

630 631
    view = g_new(FlatView, 1);
    flatview_init(view);
A
Avi Kivity 已提交
632

A
Avi Kivity 已提交
633
    if (mr) {
634
        render_memory_region(view, mr, int128_zero(),
A
Avi Kivity 已提交
635 636
                             addrrange_make(int128_zero(), int128_2_64()), false);
    }
637
    flatview_simplify(view);
A
Avi Kivity 已提交
638 639 640 641

    return view;
}

A
Avi Kivity 已提交
642 643 644 645 646 647 648
/* Notify listeners about the difference between two ioeventfd arrays of
 * address space @as.  The walk is a merge of the two arrays using
 * memory_region_ioeventfd_before(), so both are expected to be ordered
 * accordingly.  Entries only in @fds_old trigger eventfd_del (Forward
 * order), entries only in @fds_new trigger eventfd_add (Reverse order),
 * and entries present in both are skipped.
 */
static void address_space_add_del_ioeventfds(AddressSpace *as,
                                             MemoryRegionIoeventfd *fds_new,
                                             unsigned fds_new_nb,
                                             MemoryRegionIoeventfd *fds_old,
                                             unsigned fds_old_nb)
{
    unsigned iold, inew;
    MemoryRegionIoeventfd *fd;
    MemoryRegionSection section;

    /* Generate a symmetric difference of the old and new fd sets, adding
     * and deleting as necessary.
     */

    iold = inew = 0;
    while (iold < fds_old_nb || inew < fds_new_nb) {
        if (iold < fds_old_nb
            && (inew == fds_new_nb
                || memory_region_ioeventfd_before(fds_old[iold],
                                                  fds_new[inew]))) {
            fd = &fds_old[iold];
            section = (MemoryRegionSection) {
                .address_space = as,
                .offset_within_address_space = int128_get64(fd->addr.start),
                .size = fd->addr.size,
            };
            MEMORY_LISTENER_CALL(eventfd_del, Forward, &section,
                                 fd->match_data, fd->data, fd->e);
            ++iold;
        } else if (inew < fds_new_nb
                   && (iold == fds_old_nb
                       || memory_region_ioeventfd_before(fds_new[inew],
                                                         fds_old[iold]))) {
            fd = &fds_new[inew];
            section = (MemoryRegionSection) {
                .address_space = as,
                .offset_within_address_space = int128_get64(fd->addr.start),
                .size = fd->addr.size,
            };
            MEMORY_LISTENER_CALL(eventfd_add, Reverse, &section,
                                 fd->match_data, fd->data, fd->e);
            ++inew;
        } else {
            /* Present in both sets: nothing to report. */
            ++iold;
            ++inew;
        }
    }
}

691 692 693 694
/* Return the current FlatView of @as with an extra reference taken on it.
 * The pointer is read and referenced inside an RCU read-side critical
 * section.  The caller must drop the reference with flatview_unref().
 */
static FlatView *address_space_get_flatview(AddressSpace *as)
{
    FlatView *view;

    rcu_read_lock();
    view = atomic_rcu_read(&as->current_map);
    flatview_ref(view);
    rcu_read_unlock();
    return view;
}

A
Avi Kivity 已提交
702 703
/* Recompute the ioeventfd list of @as from its current FlatView.
 *
 * For every flat range, each ioeventfd of the backing region is translated
 * to an absolute address (shifted by addr.start - offset_in_region) and
 * kept if it overlaps the flat range.  Listeners are then told about the
 * difference with the previous list, which is freed and replaced.
 */
static void address_space_update_ioeventfds(AddressSpace *as)
{
    FlatView *view;
    FlatRange *fr;
    unsigned ioeventfd_nb = 0;
    MemoryRegionIoeventfd *ioeventfds = NULL;
    AddrRange tmp;
    unsigned i;

    view = address_space_get_flatview(as);
    FOR_EACH_FLAT_RANGE(fr, view) {
        for (i = 0; i < fr->mr->ioeventfd_nb; ++i) {
            tmp = addrrange_shift(fr->mr->ioeventfds[i].addr,
                                  int128_sub(fr->addr.start,
                                             int128_make64(fr->offset_in_region)));
            if (addrrange_intersects(fr->addr, tmp)) {
                ++ioeventfd_nb;
                ioeventfds = g_realloc(ioeventfds,
                                       ioeventfd_nb * sizeof(*ioeventfds));
                ioeventfds[ioeventfd_nb-1] = fr->mr->ioeventfds[i];
                ioeventfds[ioeventfd_nb-1].addr = tmp;
            }
        }
    }

    address_space_add_del_ioeventfds(as, ioeventfds, ioeventfd_nb,
                                     as->ioeventfds, as->ioeventfd_nb);

    g_free(as->ioeventfds);
    as->ioeventfds = ioeventfds;
    as->ioeventfd_nb = ioeventfd_nb;
    flatview_unref(view);
}

736
/* One pass over the difference between @old_view and @new_view of @as.
 *
 * With @adding false only removals are reported (region_del, Reverse
 * order).  With @adding true, unchanged ranges get region_nop plus
 * log_start/log_stop when their dirty_log_mask went from zero to non-zero
 * or back, and new ranges get region_add.  The caller runs the removal
 * pass before the addition pass.
 */
static void address_space_update_topology_pass(AddressSpace *as,
                                               const FlatView *old_view,
                                               const FlatView *new_view,
                                               bool adding)
{
    unsigned iold, inew;
    FlatRange *frold, *frnew;

    /* Generate a symmetric difference of the old and new memory maps.
     * Kill ranges in the old map, and instantiate ranges in the new map.
     */
    iold = inew = 0;
    while (iold < old_view->nr || inew < new_view->nr) {
        if (iold < old_view->nr) {
            frold = &old_view->ranges[iold];
        } else {
            frold = NULL;
        }
        if (inew < new_view->nr) {
            frnew = &new_view->ranges[inew];
        } else {
            frnew = NULL;
        }

        if (frold
            && (!frnew
                || int128_lt(frold->addr.start, frnew->addr.start)
                || (int128_eq(frold->addr.start, frnew->addr.start)
                    && !flatrange_equal(frold, frnew)))) {
            /* In old but not in new, or in both but attributes changed. */

            if (!adding) {
                MEMORY_LISTENER_UPDATE_REGION(frold, as, Reverse, region_del);
            }

            ++iold;
        } else if (frold && frnew && flatrange_equal(frold, frnew)) {
            /* In both and unchanged (except logging may have changed) */

            if (adding) {
                MEMORY_LISTENER_UPDATE_REGION(frnew, as, Forward, region_nop);
                if (frold->dirty_log_mask && !frnew->dirty_log_mask) {
                    MEMORY_LISTENER_UPDATE_REGION(frnew, as, Reverse, log_stop);
                } else if (frnew->dirty_log_mask && !frold->dirty_log_mask) {
                    MEMORY_LISTENER_UPDATE_REGION(frnew, as, Forward, log_start);
                }
            }

            ++iold;
            ++inew;
        } else {
            /* In new */

            if (adding) {
                MEMORY_LISTENER_UPDATE_REGION(frnew, as, Forward, region_add);
            }

            ++inew;
        }
    }
}


/*
 * Regenerate the flat view of @as from as->root and make it current.
 *
 * The old and new views are walked twice: once with adding == false and
 * once with adding == true, so listeners are told about the differences
 * before the new view is stored in as->current_map.
 */
static void address_space_update_topology(AddressSpace *as)
{
    FlatView *prev = address_space_get_flatview(as);
    FlatView *next = generate_memory_topology(as->root);

    address_space_update_topology_pass(as, prev, next, false);
    address_space_update_topology_pass(as, prev, next, true);

    /* Writes are protected by the BQL.  */
    atomic_rcu_set(&as->current_map, next);
    call_rcu(prev, flatview_unref, rcu);

    /* Note that all the old MemoryRegions are still alive up to this
     * point.  This relieves most MemoryListeners from the need to
     * ref/unref the MemoryRegions they get---unless they use them
     * outside the iothread mutex, in which case precise reference
     * counting is necessary.
     */
    flatview_unref(prev);

    address_space_update_ioeventfds(as);
}

A
Avi Kivity 已提交
822 823
void memory_region_transaction_begin(void)
{
824
    qemu_flush_coalesced_mmio_buffer();
A
Avi Kivity 已提交
825 826 827
    ++memory_region_transaction_depth;
}

828 829 830 831 832 833
/* Reset both "update pending" flags once a transaction has been applied. */
static void memory_region_clear_pending(void)
{
    ioeventfd_update_pending = false;
    memory_region_update_pending = false;
}

A
Avi Kivity 已提交
834 835
void memory_region_transaction_commit(void)
{
836 837
    AddressSpace *as;

A
Avi Kivity 已提交
838 839
    assert(memory_region_transaction_depth);
    --memory_region_transaction_depth;
840 841 842
    if (!memory_region_transaction_depth) {
        if (memory_region_update_pending) {
            MEMORY_LISTENER_CALL_GLOBAL(begin, Forward);
843

844 845 846
            QTAILQ_FOREACH(as, &address_spaces, address_spaces_link) {
                address_space_update_topology(as);
            }
847

848 849 850 851 852 853 854 855
            MEMORY_LISTENER_CALL_GLOBAL(commit, Forward);
        } else if (ioeventfd_update_pending) {
            QTAILQ_FOREACH(as, &address_spaces, address_spaces_link) {
                address_space_update_ioeventfds(as);
            }
        }
        memory_region_clear_pending();
   }
A
Avi Kivity 已提交
856 857
}

858 859 860 861 862 863 864 865 866
/* Default destructor: the region owns no backing resource, so do nothing. */
static void memory_region_destructor_none(MemoryRegion *mr)
{
    /* Intentionally empty. */
}

/* Destructor for RAM regions: hand mr->ram_addr back via qemu_ram_free(). */
static void memory_region_destructor_ram(MemoryRegion *mr)
{
    qemu_ram_free(mr->ram_addr);
}

P
Paolo Bonzini 已提交
867 868 869 870 871
/*
 * Destructor for alias regions: drop the reference on the aliased region
 * that memory_region_init_alias() took.
 */
static void memory_region_destructor_alias(MemoryRegion *mr)
{
    memory_region_unref(mr->alias);
}

872 873 874 875 876
/*
 * Destructor for RAM regions created from a caller-supplied pointer:
 * releases mr->ram_addr via qemu_ram_free_from_ptr().
 */
static void memory_region_destructor_ram_from_ptr(MemoryRegion *mr)
{
    qemu_ram_free_from_ptr(mr->ram_addr);
}

877 878 879 880 881
/*
 * Destructor for ROM device regions: frees the RAM block, masking
 * mr->ram_addr with TARGET_PAGE_MASK before passing it to qemu_ram_free().
 */
static void memory_region_destructor_rom_device(MemoryRegion *mr)
{
    qemu_ram_free(mr->ram_addr & TARGET_PAGE_MASK);
}

P
Peter Crosthwaite 已提交
882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915
/*
 * Return true if @c must be escaped in a memory region property name,
 * i.e. if it is one of '/', '[', '\\' or ']'.
 */
static bool memory_region_need_escape(char c)
{
    switch (c) {
    case '/':
    case '[':
    case '\\':
    case ']':
        return true;
    default:
        return false;
    }
}

/*
 * Return a newly allocated copy of @name in which every character flagged
 * by memory_region_need_escape() is replaced by "\xHH" (two lowercase hex
 * digits).  When nothing needs escaping the result is a plain copy.
 * The caller releases the result with g_free().
 */
static char *memory_region_escape_name(const char *name)
{
    static const char hex_digits[] = "0123456789abcdef";
    const char *src;
    char *result, *dst;
    size_t out_len = 0;

    /* First pass: size of the escaped string, excluding the terminator. */
    for (src = name; *src; src++) {
        out_len += memory_region_need_escape(*src) ? 4 : 1;
    }
    if (out_len == src - name) {
        /* Same length as the input, so no character needs escaping. */
        return g_memdup(name, out_len + 1);
    }

    /* Second pass: emit the escaped string. */
    result = g_malloc(out_len + 1);
    dst = result;
    for (src = name; *src; src++) {
        uint8_t ch = *src;

        if (unlikely(memory_region_need_escape(ch))) {
            *dst++ = '\\';
            *dst++ = 'x';
            *dst++ = hex_digits[ch >> 4];
            *dst++ = hex_digits[ch & 15];
        } else {
            *dst++ = ch;
        }
    }
    *dst = 0;
    return result;
}

A
Avi Kivity 已提交
916
void memory_region_init(MemoryRegion *mr,
917
                        Object *owner,
A
Avi Kivity 已提交
918 919 920
                        const char *name,
                        uint64_t size)
{
921
    if (!owner) {
922
        owner = container_get(qdev_get_machine(), "/unattached");
923
    }
P
Peter Crosthwaite 已提交
924

925
    object_initialize(mr, sizeof(*mr), TYPE_MEMORY_REGION);
926 927 928 929
    mr->size = int128_make64(size);
    if (size == UINT64_MAX) {
        mr->size = int128_2_64();
    }
930
    mr->name = g_strdup(name);
P
Peter Crosthwaite 已提交
931 932

    if (name) {
933 934 935
        char *escaped_name = memory_region_escape_name(name);
        char *name_array = g_strdup_printf("%s[*]", escaped_name);
        object_property_add_child(owner, name_array, OBJECT(mr), &error_abort);
P
Peter Crosthwaite 已提交
936
        object_unref(OBJECT(mr));
937 938
        g_free(name_array);
        g_free(escaped_name);
P
Peter Crosthwaite 已提交
939 940 941
    }
}

942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973
/* QOM getter for the "addr" property: visits mr->addr as a uint64. */
static void memory_region_get_addr(Object *obj, Visitor *v, void *opaque,
                                   const char *name, Error **errp)
{
    MemoryRegion *region = MEMORY_REGION(obj);
    uint64_t addr = region->addr;

    visit_type_uint64(v, &addr, name, errp);
}

/*
 * QOM getter for the "container" property: visits the canonical path of
 * mr->container, or the empty string when the region has no container.
 */
static void memory_region_get_container(Object *obj, Visitor *v, void *opaque,
                                        const char *name, Error **errp)
{
    MemoryRegion *mr = MEMORY_REGION(obj);
    bool has_container = mr->container != NULL;
    gchar *path;

    if (has_container) {
        path = object_get_canonical_path(OBJECT(mr->container));
    } else {
        path = (gchar *)"";
    }

    visit_type_str(v, &path, name, errp);

    /* Only the canonical path is heap-allocated; the literal is not. */
    if (has_container) {
        g_free(path);
    }
}

/*
 * Resolve callback installed on the "container" property: returns the
 * region's container as an Object.  @opaque and @part are unused.
 */
static Object *memory_region_resolve_container(Object *obj, void *opaque,
                                               const char *part)
{
    MemoryRegion *region = MEMORY_REGION(obj);

    return OBJECT(region->container);
}

974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989
/* QOM getter for the "priority" property: visits mr->priority as an int32. */
static void memory_region_get_priority(Object *obj, Visitor *v, void *opaque,
                                       const char *name, Error **errp)
{
    MemoryRegion *region = MEMORY_REGION(obj);
    int32_t priority = region->priority;

    visit_type_int32(v, &priority, name, errp);
}

/* QOM getter for the "may-overlap" bool property. */
static bool memory_region_get_may_overlap(Object *obj, Error **errp)
{
    return MEMORY_REGION(obj)->may_overlap;
}

990 991 992 993 994 995 996 997 998
/*
 * QOM getter for the "size" property: visits the value returned by
 * memory_region_size() as a uint64.
 */
static void memory_region_get_size(Object *obj, Visitor *v, void *opaque,
                                   const char *name, Error **errp)
{
    MemoryRegion *region = MEMORY_REGION(obj);
    uint64_t size = memory_region_size(region);

    visit_type_uint64(v, &size, name, errp);
}

P
Peter Crosthwaite 已提交
999 1000 1001
/*
 * Instance initializer for TYPE_MEMORY_REGION.
 *
 * Sets the defaults (unassigned ops, enabled, ROMD mode, no-op destructor,
 * empty subregion and coalesced lists) and registers the read-only QOM
 * properties "container", "addr", "priority", "may-overlap" and "size".
 * All properties are getter-only; the setter slots are NULL.
 */
static void memory_region_initfn(Object *obj)
{
    MemoryRegion *mr = MEMORY_REGION(obj);
    ObjectProperty *op;

    mr->ops = &unassigned_mem_ops;
    mr->enabled = true;
    mr->romd_mode = true;
    mr->destructor = memory_region_destructor_none;
    QTAILQ_INIT(&mr->subregions);
    QTAILQ_INIT(&mr->coalesced);

    op = object_property_add(OBJECT(mr), "container",
                             "link<" TYPE_MEMORY_REGION ">",
                             memory_region_get_container,
                             NULL, /* memory_region_set_container */
                             NULL, NULL, &error_abort);
    op->resolve = memory_region_resolve_container;

    object_property_add(OBJECT(mr), "addr", "uint64",
                        memory_region_get_addr,
                        NULL, /* memory_region_set_addr */
                        NULL, NULL, &error_abort);
    /*
     * The getter reads the priority into an int32_t and uses
     * visit_type_int32(), so advertise the property as signed to match.
     */
    object_property_add(OBJECT(mr), "priority", "int32",
                        memory_region_get_priority,
                        NULL, /* memory_region_set_priority */
                        NULL, NULL, &error_abort);
    object_property_add_bool(OBJECT(mr), "may-overlap",
                             memory_region_get_may_overlap,
                             NULL, /* memory_region_set_may_overlap */
                             &error_abort);
    object_property_add(OBJECT(mr), "size", "uint64",
                        memory_region_get_size,
                        NULL, /* memory_region_set_size, */
                        NULL, NULL, &error_abort);
}

1036 1037 1038 1039 1040 1041
/*
 * Read handler for accesses that hit no valid region.
 *
 * Reports the access to the current CPU (if there is one) through
 * cpu_unassigned_access() and always returns 0.
 */
static uint64_t unassigned_mem_read(void *opaque, hwaddr addr,
                                    unsigned size)
{
#ifdef DEBUG_UNASSIGNED
    printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
#endif
    if (current_cpu) {
        cpu_unassigned_access(current_cpu, addr, false, false, 0, size);
    }
    return 0;
}

/*
 * Write handler for accesses that hit no valid region.
 *
 * The value is discarded; the access is reported to the current CPU (if
 * there is one) through cpu_unassigned_access().
 */
static void unassigned_mem_write(void *opaque, hwaddr addr,
                                 uint64_t val, unsigned size)
{
#ifdef DEBUG_UNASSIGNED
    printf("Unassigned mem write " TARGET_FMT_plx " = 0x%"PRIx64"\n", addr, val);
#endif
    if (current_cpu) {
        cpu_unassigned_access(current_cpu, addr, true, false, 0, size);
    }
}

1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069
/* valid.accepts callback for unassigned memory: rejects every access. */
static bool unassigned_mem_accepts(void *opaque, hwaddr addr,
                                   unsigned size, bool is_write)
{
    /* No address, size or direction is ever acceptable. */
    return false;
}

/*
 * Ops installed on regions that have no handlers of their own: it sets no
 * read/write callbacks, and its accepts hook rejects every access.
 */
const MemoryRegionOps unassigned_mem_ops = {
    .endianness = DEVICE_NATIVE_ENDIAN,
    .valid.accepts = unassigned_mem_accepts,
};

1070 1071 1072 1073
/*
 * Decide whether an access of @size bytes at @addr is valid for @mr.
 *
 * An access whose address has any of the low (size - 1) bits set is
 * rejected unless ops->valid.unaligned is set.  Without a valid.accepts
 * callback every remaining access is valid.  Otherwise the access is
 * split into pieces clamped to [valid.min_access_size,
 * valid.max_access_size] (defaulting to 1 and 4 when zero) and each piece
 * must be accepted by the callback.
 */
bool memory_region_access_valid(MemoryRegion *mr,
                                hwaddr addr,
                                unsigned size,
                                bool is_write)
{
    const MemoryRegionOps *ops = mr->ops;
    int access_size_min, access_size_max;
    int access_size, i;

    if (!ops->valid.unaligned && (addr & (size - 1))) {
        return false;
    }

    if (!ops->valid.accepts) {
        return true;
    }

    /* A zero bound means "not specified": fall back to the defaults. */
    access_size_min = ops->valid.min_access_size
                      ? ops->valid.min_access_size : 1;
    access_size_max = ops->valid.max_access_size
                      ? ops->valid.max_access_size : 4;

    access_size = MAX(MIN(size, access_size_max), access_size_min);
    for (i = 0; i < size; i += access_size) {
        bool accepted = ops->valid.accepts(mr->opaque, addr + i, access_size,
                                           is_write);

        if (!accepted) {
            return false;
        }
    }

    return true;
}

1107 1108 1109 1110 1111
/*
 * Perform a read on @mr, picking the accessor by which callback the ops
 * provide: ->read, then ->read_with_attrs, else the old_mmio accessor
 * with access sizes fixed to 1..4.  *@pval is zeroed before the access.
 */
static MemTxResult memory_region_dispatch_read1(MemoryRegion *mr,
                                                hwaddr addr,
                                                uint64_t *pval,
                                                unsigned size,
                                                MemTxAttrs attrs)
{
    const MemoryRegionOps *ops = mr->ops;

    *pval = 0;

    if (ops->read) {
        return access_with_adjusted_size(addr, pval, size,
                                         ops->impl.min_access_size,
                                         ops->impl.max_access_size,
                                         memory_region_read_accessor,
                                         mr, attrs);
    }

    if (ops->read_with_attrs) {
        return access_with_adjusted_size(addr, pval, size,
                                         ops->impl.min_access_size,
                                         ops->impl.max_access_size,
                                         memory_region_read_with_attrs_accessor,
                                         mr, attrs);
    }

    return access_with_adjusted_size(addr, pval, size, 1, 4,
                                     memory_region_oldmmio_read_accessor,
                                     mr, attrs);
}

1134 1135 1136 1137 1138
/*
 * Read @size bytes at @addr from @mr into *@pval.
 *
 * An access rejected by memory_region_access_valid() is routed to
 * unassigned_mem_read() and reported as MEMTX_DECODE_ERROR.  Otherwise
 * the read is dispatched, the result passes through adjust_endianness(),
 * and the dispatch status is returned.
 */
MemTxResult memory_region_dispatch_read(MemoryRegion *mr,
                                        hwaddr addr,
                                        uint64_t *pval,
                                        unsigned size,
                                        MemTxAttrs attrs)
{
    MemTxResult r;

    if (memory_region_access_valid(mr, addr, size, false)) {
        r = memory_region_dispatch_read1(mr, addr, pval, size, attrs);
        adjust_endianness(mr, pval, size);
        return r;
    }

    *pval = unassigned_mem_read(mr, addr, size);
    return MEMTX_DECODE_ERROR;
}
A
Avi Kivity 已提交
1151

1152 1153 1154 1155 1156
/*
 * Write @size bytes of @data at @addr to @mr.
 *
 * An access rejected by memory_region_access_valid() is routed to
 * unassigned_mem_write() and reported as MEMTX_DECODE_ERROR.  Otherwise
 * @data passes through adjust_endianness() and the write goes to the
 * first available of ->write, ->write_with_attrs, or the old_mmio
 * accessor (access sizes fixed to 1..4).
 */
MemTxResult memory_region_dispatch_write(MemoryRegion *mr,
                                         hwaddr addr,
                                         uint64_t data,
                                         unsigned size,
                                         MemTxAttrs attrs)
{
    const MemoryRegionOps *ops;

    if (!memory_region_access_valid(mr, addr, size, true)) {
        unassigned_mem_write(mr, addr, data, size);
        return MEMTX_DECODE_ERROR;
    }

    adjust_endianness(mr, &data, size);

    ops = mr->ops;
    if (ops->write) {
        return access_with_adjusted_size(addr, &data, size,
                                         ops->impl.min_access_size,
                                         ops->impl.max_access_size,
                                         memory_region_write_accessor, mr,
                                         attrs);
    }

    if (ops->write_with_attrs) {
        return access_with_adjusted_size(addr, &data, size,
                                         ops->impl.min_access_size,
                                         ops->impl.max_access_size,
                                         memory_region_write_with_attrs_accessor,
                                         mr, attrs);
    }

    return access_with_adjusted_size(addr, &data, size, 1, 4,
                                     memory_region_oldmmio_write_accessor,
                                     mr, attrs);
}

void memory_region_init_io(MemoryRegion *mr,
1186
                           Object *owner,
A
Avi Kivity 已提交
1187 1188 1189 1190 1191
                           const MemoryRegionOps *ops,
                           void *opaque,
                           const char *name,
                           uint64_t size)
{
1192
    memory_region_init(mr, owner, name, size);
A
Avi Kivity 已提交
1193 1194
    mr->ops = ops;
    mr->opaque = opaque;
1195
    mr->terminates = true;
1196
    mr->ram_addr = ~(ram_addr_t)0;
A
Avi Kivity 已提交
1197 1198 1199
}

void memory_region_init_ram(MemoryRegion *mr,
1200
                            Object *owner,
A
Avi Kivity 已提交
1201
                            const char *name,
1202 1203
                            uint64_t size,
                            Error **errp)
A
Avi Kivity 已提交
1204
{
1205
    memory_region_init(mr, owner, name, size);
A
Avi Kivity 已提交
1206
    mr->ram = true;
1207
    mr->terminates = true;
1208
    mr->destructor = memory_region_destructor_ram;
1209
    mr->ram_addr = qemu_ram_alloc(size, mr, errp);
1210 1211
}

1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228
/*
 * Initialize @mr as a RAM region whose backing store is allocated with
 * qemu_ram_alloc_resizeable(), passing through @size, @max_size and the
 * @resized callback.  Allocation errors are reported via @errp.
 */
void memory_region_init_resizeable_ram(MemoryRegion *mr,
                                       Object *owner,
                                       const char *name,
                                       uint64_t size,
                                       uint64_t max_size,
                                       void (*resized)(const char*,
                                                       uint64_t length,
                                                       void *host),
                                       Error **errp)
{
    memory_region_init(mr, owner, name, size);
    mr->terminates = true;
    mr->ram = true;
    mr->destructor = memory_region_destructor_ram;
    /* Allocate last, once the region is otherwise fully described. */
    mr->ram_addr = qemu_ram_alloc_resizeable(size, max_size, resized, mr, errp);
}

1229 1230 1231 1232 1233
#ifdef __linux__
/*
 * Initialize @mr as a RAM region whose backing store is allocated with
 * qemu_ram_alloc_from_file() from @path; @share is forwarded unchanged.
 * Only built on Linux.  Allocation errors are reported via @errp.
 */
void memory_region_init_ram_from_file(MemoryRegion *mr,
                                      struct Object *owner,
                                      const char *name,
                                      uint64_t size,
                                      bool share,
                                      const char *path,
                                      Error **errp)
{
    memory_region_init(mr, owner, name, size);
    mr->terminates = true;
    mr->ram = true;
    mr->destructor = memory_region_destructor_ram;
    /* Allocate last, once the region is otherwise fully described. */
    mr->ram_addr = qemu_ram_alloc_from_file(size, mr, share, path, errp);
}
#endif
A
Avi Kivity 已提交
1245 1246

void memory_region_init_ram_ptr(MemoryRegion *mr,
1247
                                Object *owner,
A
Avi Kivity 已提交
1248 1249 1250 1251
                                const char *name,
                                uint64_t size,
                                void *ptr)
{
1252
    memory_region_init(mr, owner, name, size);
A
Avi Kivity 已提交
1253
    mr->ram = true;
1254
    mr->terminates = true;
1255
    mr->destructor = memory_region_destructor_ram_from_ptr;
1256 1257 1258 1259

    /* qemu_ram_alloc_from_ptr cannot fail with ptr != NULL.  */
    assert(ptr != NULL);
    mr->ram_addr = qemu_ram_alloc_from_ptr(size, ptr, mr, &error_abort);
A
Avi Kivity 已提交
1260 1261
}

1262 1263 1264 1265 1266
/* Set the skip_dump flag on @mr (queried by memory_region_is_skip_dump()). */
void memory_region_set_skip_dump(MemoryRegion *mr)
{
    mr->skip_dump = true;
}

A
Avi Kivity 已提交
1267
void memory_region_init_alias(MemoryRegion *mr,
1268
                              Object *owner,
A
Avi Kivity 已提交
1269 1270
                              const char *name,
                              MemoryRegion *orig,
A
Avi Kivity 已提交
1271
                              hwaddr offset,
A
Avi Kivity 已提交
1272 1273
                              uint64_t size)
{
1274
    memory_region_init(mr, owner, name, size);
P
Paolo Bonzini 已提交
1275 1276
    memory_region_ref(orig);
    mr->destructor = memory_region_destructor_alias;
A
Avi Kivity 已提交
1277 1278 1279 1280
    mr->alias = orig;
    mr->alias_offset = offset;
}

1281
void memory_region_init_rom_device(MemoryRegion *mr,
1282
                                   Object *owner,
1283
                                   const MemoryRegionOps *ops,
1284
                                   void *opaque,
1285
                                   const char *name,
1286 1287
                                   uint64_t size,
                                   Error **errp)
1288
{
1289
    memory_region_init(mr, owner, name, size);
1290
    mr->ops = ops;
1291
    mr->opaque = opaque;
1292
    mr->terminates = true;
A
Avi Kivity 已提交
1293
    mr->rom_device = true;
1294
    mr->destructor = memory_region_destructor_rom_device;
1295
    mr->ram_addr = qemu_ram_alloc(size, mr, errp);
1296 1297
}

A
Avi Kivity 已提交
1298
void memory_region_init_iommu(MemoryRegion *mr,
1299
                              Object *owner,
A
Avi Kivity 已提交
1300 1301 1302 1303
                              const MemoryRegionIOMMUOps *ops,
                              const char *name,
                              uint64_t size)
{
1304
    memory_region_init(mr, owner, name, size);
A
Avi Kivity 已提交
1305 1306
    mr->iommu_ops = ops,
    mr->terminates = true;  /* then re-forwards */
1307
    notifier_list_init(&mr->iommu_notify);
A
Avi Kivity 已提交
1308 1309
}

1310
void memory_region_init_reservation(MemoryRegion *mr,
1311
                                    Object *owner,
1312 1313 1314
                                    const char *name,
                                    uint64_t size)
{
1315
    memory_region_init_io(mr, owner, &unassigned_mem_ops, mr, name, size);
1316 1317
}

P
Peter Crosthwaite 已提交
1318
/*
 * Finalizer for TYPE_MEMORY_REGION.
 *
 * The region must have no subregions left.  Runs the type-specific
 * destructor, removes any coalescing ranges, then frees the name and the
 * ioeventfd array.
 */
static void memory_region_finalize(Object *obj)
{
    MemoryRegion *region = MEMORY_REGION(obj);

    assert(QTAILQ_EMPTY(&region->subregions));

    region->destructor(region);
    memory_region_clear_coalescing(region);

    g_free((char *)region->name);
    g_free(region->ioeventfds);
}

P
Paolo Bonzini 已提交
1329 1330
/* Return the owner of @mr, i.e. the QOM parent of the region object. */
Object *memory_region_owner(MemoryRegion *mr)
{
    return OBJECT(mr)->parent;
}

P
Paolo Bonzini 已提交
1335 1336
/*
 * Take a reference that keeps @mr usable: on its owner (QOM parent) when
 * it has one, otherwise on the region object itself.
 */
void memory_region_ref(MemoryRegion *mr)
{
    /* MMIO callbacks most likely will access data that belongs
     * to the owner, hence the need to ref/unref the owner whenever
     * the memory region is in use.
     *
     * The memory region is a child of its owner.  As long as the
     * owner doesn't call unparent itself on the memory region,
     * ref-ing the owner will also keep the memory region alive.
     * Memory regions without an owner are supposed to never go away,
     * but we still ref/unref them for debugging purposes.
     */
    Object *obj = OBJECT(mr);
    Object *target = (obj && obj->parent) ? obj->parent : obj;

    object_ref(target);
}

/*
 * Drop a reference taken by memory_region_ref(): on the owner (QOM
 * parent) when @mr has one, otherwise on the region object itself.
 */
void memory_region_unref(MemoryRegion *mr)
{
    Object *obj = OBJECT(mr);
    Object *target = (obj && obj->parent) ? obj->parent : obj;

    object_unref(target);
}

A
Avi Kivity 已提交
1365 1366
/*
 * Return the size of @mr as a 64-bit value.  A stored size of 2^64 does
 * not fit and is reported as UINT64_MAX.
 */
uint64_t memory_region_size(MemoryRegion *mr)
{
    return int128_eq(mr->size, int128_2_64()) ? UINT64_MAX
                                              : int128_get64(mr->size);
}

1373
const char *memory_region_name(const MemoryRegion *mr)
1374
{
1375 1376 1377 1378
    if (!mr->name) {
        ((MemoryRegion *)mr)->name =
            object_get_canonical_path_component(OBJECT(mr));
    }
1379
    return mr->name;
1380 1381
}

A
Avi Kivity 已提交
1382 1383 1384 1385 1386
/* Return the ram flag of @mr. */
bool memory_region_is_ram(MemoryRegion *mr)
{
    bool is_ram = mr->ram;

    return is_ram;
}

1387 1388 1389 1390 1391
/* Return the skip_dump flag of @mr (set by memory_region_set_skip_dump()). */
bool memory_region_is_skip_dump(MemoryRegion *mr)
{
    bool skip = mr->skip_dump;

    return skip;
}

1392 1393 1394 1395 1396
/* Return true if any bit is set in the dirty log mask of @mr. */
bool memory_region_is_logging(MemoryRegion *mr)
{
    return mr->dirty_log_mask != 0;
}

A
Avi Kivity 已提交
1397 1398 1399 1400 1401
/* Return true if @mr is RAM-backed and marked read-only. */
bool memory_region_is_rom(MemoryRegion *mr)
{
    if (!mr->ram) {
        return false;
    }
    return mr->readonly;
}

A
Avi Kivity 已提交
1402 1403 1404 1405 1406
/* Return true if @mr has IOMMU ops installed. */
bool memory_region_is_iommu(MemoryRegion *mr)
{
    return mr->iommu_ops != NULL;
}

1407 1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423
/* Add notifier @n to the IOMMU notifier list of @mr. */
void memory_region_register_iommu_notifier(MemoryRegion *mr, Notifier *n)
{
    NotifierList *list = &mr->iommu_notify;

    notifier_list_add(list, n);
}

/* Remove notifier @n from whichever notifier list it is currently on. */
void memory_region_unregister_iommu_notifier(Notifier *n)
{
    notifier_remove(n);
}

/*
 * Notify every IOMMU notifier registered on @mr, passing a pointer to
 * @entry.  @mr must be an IOMMU region.
 */
void memory_region_notify_iommu(MemoryRegion *mr,
                                IOMMUTLBEntry entry)
{
    assert(memory_region_is_iommu(mr));

    /* @entry is a by-value copy; notifiers receive a pointer to it. */
    notifier_list_notify(&mr->iommu_notify, &entry);
}

A
Avi Kivity 已提交
1424 1425
/*
 * Enable (@log true) or disable (@log false) dirty logging for @client on
 * @mr.  Only DIRTY_MEMORY_VGA is accepted as @client.
 *
 * The mask update happens inside a transaction, and a topology update is
 * requested only if the region is enabled.
 */
void memory_region_set_log(MemoryRegion *mr, bool log, unsigned client)
{
    uint8_t mask;

    /* Validate @client before using it as a shift count. */
    assert(client == DIRTY_MEMORY_VGA);
    mask = 1 << client;

    memory_region_transaction_begin();
    mr->dirty_log_mask = (mr->dirty_log_mask & ~mask) | (log * mask);
    memory_region_update_pending |= mr->enabled;
    memory_region_transaction_commit();
}

A
Avi Kivity 已提交
1435 1436
/*
 * Return the dirty state for @client of the range [@addr, @addr + @size)
 * within @mr, as reported by cpu_physical_memory_get_dirty().
 * @mr must be a terminating region.
 */
bool memory_region_get_dirty(MemoryRegion *mr, hwaddr addr,
                             hwaddr size, unsigned client)
{
    bool dirty;

    assert(mr->terminates);
    dirty = cpu_physical_memory_get_dirty(mr->ram_addr + addr, size, client);
    return dirty;
}

A
Avi Kivity 已提交
1442 1443
/*
 * Mark the range [@addr, @addr + @size) within @mr as dirty.
 * @mr must be a terminating region.
 */
void memory_region_set_dirty(MemoryRegion *mr, hwaddr addr,
                             hwaddr size)
{
    assert(mr->terminates);

    /* @addr is region-relative; ram_addr rebases it for the dirty API. */
    cpu_physical_memory_set_dirty_range(mr->ram_addr + addr, size);
}

1449 1450 1451 1452 1453
/*
 * Query the dirty state for @client of the range [@addr, @addr + @size)
 * within @mr and, if it was dirty, reset it.  Returns the state found.
 * @mr must be a terminating region.
 */
bool memory_region_test_and_clear_dirty(MemoryRegion *mr, hwaddr addr,
                                        hwaddr size, unsigned client)
{
    assert(mr->terminates);

    if (!cpu_physical_memory_get_dirty(mr->ram_addr + addr, size, client)) {
        return false;
    }

    cpu_physical_memory_reset_dirty(mr->ram_addr + addr, size, client);
    return true;
}


A
Avi Kivity 已提交
1462 1463
/*
 * Invoke the log_sync listener callback for every flat range, in every
 * address space, that belongs to @mr.
 */
void memory_region_sync_dirty_bitmap(MemoryRegion *mr)
{
    AddressSpace *as;

    QTAILQ_FOREACH(as, &address_spaces, address_spaces_link) {
        FlatView *view = address_space_get_flatview(as);
        FlatRange *range;

        FOR_EACH_FLAT_RANGE(range, view) {
            if (range->mr == mr) {
                MEMORY_LISTENER_UPDATE_REGION(range, as, Forward, log_sync);
            }
        }

        /* Pairs with address_space_get_flatview() above. */
        flatview_unref(view);
    }
}

/*
 * Set the read-only flag of @mr.  Nothing happens when the flag already
 * has the requested value; otherwise the change is made inside a
 * transaction and a topology update is requested if the region is enabled.
 */
void memory_region_set_readonly(MemoryRegion *mr, bool readonly)
{
    if (mr->readonly == readonly) {
        return;
    }

    memory_region_transaction_begin();
    mr->readonly = readonly;
    memory_region_update_pending |= mr->enabled;
    memory_region_transaction_commit();
}

1488
/*
 * Set the ROMD mode flag of @mr.  Nothing happens when the flag already
 * has the requested value; otherwise the change is made inside a
 * transaction and a topology update is requested if the region is enabled.
 */
void memory_region_rom_device_set_romd(MemoryRegion *mr, bool romd_mode)
{
    if (mr->romd_mode == romd_mode) {
        return;
    }

    memory_region_transaction_begin();
    mr->romd_mode = romd_mode;
    memory_region_update_pending |= mr->enabled;
    memory_region_transaction_commit();
}

A
Avi Kivity 已提交
1498 1499
/*
 * Reset the dirty state for @client of the range [@addr, @addr + @size)
 * within @mr.  @mr must be a terminating region.
 */
void memory_region_reset_dirty(MemoryRegion *mr, hwaddr addr,
                               hwaddr size, unsigned client)
{
    assert(mr->terminates);

    /* @addr is region-relative; ram_addr rebases it for the dirty API. */
    cpu_physical_memory_reset_dirty(mr->ram_addr + addr, size, client);
}

1505 1506 1507 1508 1509 1510 1511 1512 1513 1514 1515
/*
 * Return the value of qemu_get_ram_fd() for the RAM block of @mr.
 * Aliases are followed to the region they alias; the region finally
 * reached must be a terminating one.
 */
int memory_region_get_fd(MemoryRegion *mr)
{
    MemoryRegion *target = mr->alias;

    if (target) {
        return memory_region_get_fd(target);
    }

    assert(mr->terminates);

    return qemu_get_ram_fd(mr->ram_addr & TARGET_PAGE_MASK);
}

A
Avi Kivity 已提交
1516 1517 1518 1519 1520 1521
/*
 * Return the pointer that qemu_get_ram_ptr() yields for the RAM block of
 * @mr.  For an alias, the aliased region's pointer is returned advanced
 * by alias_offset.  A non-alias region must be a terminating one.
 */
void *memory_region_get_ram_ptr(MemoryRegion *mr)
{
    MemoryRegion *target = mr->alias;

    if (target) {
        return memory_region_get_ram_ptr(target) + mr->alias_offset;
    }

    assert(mr->terminates);

    return qemu_get_ram_ptr(mr->ram_addr & TARGET_PAGE_MASK);
}

1527 1528 1529 1530 1531 1532 1533
/*
 * Resize the RAM block of @mr to @newsize through qemu_ram_resize();
 * errors are reported via @errp.  @mr must be a terminating region.
 */
void memory_region_ram_resize(MemoryRegion *mr, ram_addr_t newsize, Error **errp)
{
    assert(mr->terminates);

    /* Validation and error reporting are left to qemu_ram_resize(). */
    qemu_ram_resize(mr->ram_addr, newsize, errp);
}

1534
/*
 * Re-announce the coalesced MMIO ranges of @mr within address space @as.
 *
 * For every flat range of @as that belongs to @mr, listeners first get a
 * coalesced_mmio_del for the whole flat range.  Then each coalesced range
 * of @mr is translated into address-space coordinates, clipped to the
 * flat range, and announced with coalesced_mmio_add when the two overlap.
 */
static void memory_region_update_coalesced_range_as(MemoryRegion *mr, AddressSpace *as)
{
    FlatView *view = address_space_get_flatview(as);
    FlatRange *fr;
    CoalescedMemoryRange *cmr;
    MemoryRegionSection section;

    FOR_EACH_FLAT_RANGE(fr, view) {
        if (fr->mr == mr) {
            /* Offset converting region-relative to address-space addresses. */
            Int128 shift = int128_sub(fr->addr.start,
                                      int128_make64(fr->offset_in_region));

            section = (MemoryRegionSection) {
                .address_space = as,
                .offset_within_address_space = int128_get64(fr->addr.start),
                .size = fr->addr.size,
            };

            MEMORY_LISTENER_CALL(coalesced_mmio_del, Reverse, &section,
                                 int128_get64(fr->addr.start),
                                 int128_get64(fr->addr.size));
            QTAILQ_FOREACH(cmr, &mr->coalesced, link) {
                AddrRange shifted = addrrange_shift(cmr->addr, shift);

                if (addrrange_intersects(shifted, fr->addr)) {
                    AddrRange clipped = addrrange_intersection(shifted,
                                                               fr->addr);

                    MEMORY_LISTENER_CALL(coalesced_mmio_add, Forward, &section,
                                         int128_get64(clipped.start),
                                         int128_get64(clipped.size));
                }
            }
        }
    }
    flatview_unref(view);
}

1571 1572 1573 1574 1575 1576 1577 1578 1579
/* Re-announce the coalesced MMIO ranges of @mr in every address space. */
static void memory_region_update_coalesced_range(MemoryRegion *mr)
{
    AddressSpace *space;

    QTAILQ_FOREACH(space, &address_spaces, address_spaces_link) {
        memory_region_update_coalesced_range_as(mr, space);
    }
}

A
Avi Kivity 已提交
1580 1581 1582
/*
 * Make the whole of @mr a single coalesced MMIO range: existing ranges
 * are dropped and one range covering [0, size) is added.
 */
void memory_region_set_coalescing(MemoryRegion *mr)
{
    uint64_t whole;

    memory_region_clear_coalescing(mr);
    whole = int128_get64(mr->size);
    memory_region_add_coalescing(mr, 0, whole);
}

void memory_region_add_coalescing(MemoryRegion *mr,
A
Avi Kivity 已提交
1587
                                  hwaddr offset,
A
Avi Kivity 已提交
1588 1589
                                  uint64_t size)
{
1590
    CoalescedMemoryRange *cmr = g_malloc(sizeof(*cmr));
A
Avi Kivity 已提交
1591

1592
    cmr->addr = addrrange_make(int128_make64(offset), int128_make64(size));
A
Avi Kivity 已提交
1593 1594
    QTAILQ_INSERT_TAIL(&mr->coalesced, cmr, link);
    memory_region_update_coalesced_range(mr);
1595
    memory_region_set_flush_coalesced(mr);
A
Avi Kivity 已提交
1596 1597 1598 1599 1600
}

/*
 * Remove every coalesced MMIO range from @mr.
 *
 * The coalesced MMIO buffer is flushed and the flush_coalesced_mmio flag
 * cleared first.  Listeners are only re-notified when at least one range
 * was actually removed.
 */
void memory_region_clear_coalescing(MemoryRegion *mr)
{
    CoalescedMemoryRange *range;
    bool removed_any = false;

    qemu_flush_coalesced_mmio_buffer();
    mr->flush_coalesced_mmio = false;

    for (;;) {
        if (QTAILQ_EMPTY(&mr->coalesced)) {
            break;
        }
        range = QTAILQ_FIRST(&mr->coalesced);
        QTAILQ_REMOVE(&mr->coalesced, range, link);
        g_free(range);
        removed_any = true;
    }

    if (removed_any) {
        memory_region_update_coalesced_range(mr);
    }
}

1618 1619 1620 1621 1622 1623 1624 1625 1626 1627 1628 1629 1630
/* Set the flush_coalesced_mmio flag of @mr. */
void memory_region_set_flush_coalesced(MemoryRegion *mr)
{
    /* Cleared again by the clear_coalescing/clear_flush_coalesced helpers. */
    mr->flush_coalesced_mmio = true;
}

/*
 * Flush the coalesced MMIO buffer, then clear the flush_coalesced_mmio
 * flag of @mr unless the region still has coalesced ranges of its own.
 */
void memory_region_clear_flush_coalesced(MemoryRegion *mr)
{
    qemu_flush_coalesced_mmio_buffer();

    if (!QTAILQ_EMPTY(&mr->coalesced)) {
        /* Coalesced ranges remain, so the flag has to stay set. */
        return;
    }
    mr->flush_coalesced_mmio = false;
}

A
Avi Kivity 已提交
1631
void memory_region_add_eventfd(MemoryRegion *mr,
A
Avi Kivity 已提交
1632
                               hwaddr addr,
A
Avi Kivity 已提交
1633 1634 1635
                               unsigned size,
                               bool match_data,
                               uint64_t data,
1636
                               EventNotifier *e)
A
Avi Kivity 已提交
1637 1638
{
    MemoryRegionIoeventfd mrfd = {
1639 1640
        .addr.start = int128_make64(addr),
        .addr.size = int128_make64(size),
A
Avi Kivity 已提交
1641 1642
        .match_data = match_data,
        .data = data,
1643
        .e = e,
A
Avi Kivity 已提交
1644 1645 1646
    };
    unsigned i;

1647
    adjust_endianness(mr, &mrfd.data, size);
1648
    memory_region_transaction_begin();
A
Avi Kivity 已提交
1649 1650 1651 1652 1653 1654
    for (i = 0; i < mr->ioeventfd_nb; ++i) {
        if (memory_region_ioeventfd_before(mrfd, mr->ioeventfds[i])) {
            break;
        }
    }
    ++mr->ioeventfd_nb;
1655
    mr->ioeventfds = g_realloc(mr->ioeventfds,
A
Avi Kivity 已提交
1656 1657 1658 1659
                                  sizeof(*mr->ioeventfds) * mr->ioeventfd_nb);
    memmove(&mr->ioeventfds[i+1], &mr->ioeventfds[i],
            sizeof(*mr->ioeventfds) * (mr->ioeventfd_nb-1 - i));
    mr->ioeventfds[i] = mrfd;
1660
    ioeventfd_update_pending |= mr->enabled;
1661
    memory_region_transaction_commit();
A
Avi Kivity 已提交
1662 1663 1664
}

void memory_region_del_eventfd(MemoryRegion *mr,
A
Avi Kivity 已提交
1665
                               hwaddr addr,
A
Avi Kivity 已提交
1666 1667 1668
                               unsigned size,
                               bool match_data,
                               uint64_t data,
1669
                               EventNotifier *e)
A
Avi Kivity 已提交
1670 1671
{
    MemoryRegionIoeventfd mrfd = {
1672 1673
        .addr.start = int128_make64(addr),
        .addr.size = int128_make64(size),
A
Avi Kivity 已提交
1674 1675
        .match_data = match_data,
        .data = data,
1676
        .e = e,
A
Avi Kivity 已提交
1677 1678 1679
    };
    unsigned i;

1680
    adjust_endianness(mr, &mrfd.data, size);
1681
    memory_region_transaction_begin();
A
Avi Kivity 已提交
1682 1683 1684 1685 1686 1687 1688 1689 1690
    for (i = 0; i < mr->ioeventfd_nb; ++i) {
        if (memory_region_ioeventfd_equal(mrfd, mr->ioeventfds[i])) {
            break;
        }
    }
    assert(i != mr->ioeventfd_nb);
    memmove(&mr->ioeventfds[i], &mr->ioeventfds[i+1],
            sizeof(*mr->ioeventfds) * (mr->ioeventfd_nb - (i+1)));
    --mr->ioeventfd_nb;
1691
    mr->ioeventfds = g_realloc(mr->ioeventfds,
A
Avi Kivity 已提交
1692
                                  sizeof(*mr->ioeventfds)*mr->ioeventfd_nb + 1);
1693
    ioeventfd_update_pending |= mr->enabled;
1694
    memory_region_transaction_commit();
A
Avi Kivity 已提交
1695 1696
}

1697
/*
 * Link @subregion into the subregion list of subregion->container.
 *
 * A reference is taken on @subregion, and it is inserted in front of
 * the first sibling whose priority is not greater than its own (or at
 * the tail if there is none).  The first loop only detects overlaps
 * with siblings; its diagnostic is compiled out.
 */
static void memory_region_update_container_subregions(MemoryRegion *subregion)
{
    hwaddr offset = subregion->addr;
    MemoryRegion *mr = subregion->container;
    MemoryRegion *other;

    memory_region_transaction_begin();

    memory_region_ref(subregion);

    /* Collision check between regions that did not opt in to overlap. */
    QTAILQ_FOREACH(other, &mr->subregions, subregions_link) {
        if (subregion->may_overlap || other->may_overlap) {
            continue;
        }
        if (int128_ge(int128_make64(offset),
                      int128_add(int128_make64(other->addr), other->size))
            || int128_le(int128_add(int128_make64(offset), subregion->size),
                         int128_make64(other->addr))) {
            /* Entirely above or entirely below: no collision. */
            continue;
        }
#if 0
        printf("warning: subregion collision %llx/%llx (%s) "
               "vs %llx/%llx (%s)\n",
               (unsigned long long)offset,
               (unsigned long long)int128_get64(subregion->size),
               subregion->name,
               (unsigned long long)other->addr,
               (unsigned long long)int128_get64(other->size),
               other->name);
#endif
    }

    /* Find the insertion point; 'other' ends up NULL if there is none. */
    QTAILQ_FOREACH(other, &mr->subregions, subregions_link) {
        if (subregion->priority >= other->priority) {
            break;
        }
    }
    if (other) {
        QTAILQ_INSERT_BEFORE(other, subregion, subregions_link);
    } else {
        QTAILQ_INSERT_TAIL(&mr->subregions, subregion, subregions_link);
    }

    memory_region_update_pending |= mr->enabled && subregion->enabled;
    memory_region_transaction_commit();
}

1739 1740 1741 1742
/*
 * Shared tail of the add_subregion variants: record @mr as the container
 * of @subregion at @offset and link it into the container's list.
 * @subregion must not already have a container.
 */
static void memory_region_add_subregion_common(MemoryRegion *mr,
                                               hwaddr offset,
                                               MemoryRegion *subregion)
{
    assert(!subregion->container);

    subregion->container = mr;
    subregion->addr = offset;

    memory_region_update_container_subregions(subregion);
}
A
Avi Kivity 已提交
1748 1749

void memory_region_add_subregion(MemoryRegion *mr,
A
Avi Kivity 已提交
1750
                                 hwaddr offset,
A
Avi Kivity 已提交
1751 1752 1753 1754 1755 1756 1757 1758
                                 MemoryRegion *subregion)
{
    subregion->may_overlap = false;
    subregion->priority = 0;
    memory_region_add_subregion_common(mr, offset, subregion);
}

void memory_region_add_subregion_overlap(MemoryRegion *mr,
A
Avi Kivity 已提交
1759
                                         hwaddr offset,
A
Avi Kivity 已提交
1760
                                         MemoryRegion *subregion,
1761
                                         int priority)
A
Avi Kivity 已提交
1762 1763 1764 1765 1766 1767 1768 1769 1770
{
    subregion->may_overlap = true;
    subregion->priority = priority;
    memory_region_add_subregion_common(mr, offset, subregion);
}

/*
 * Unlink @subregion from its container @mr and drop the reference on
 * it.  Asserts that @mr really is the container of @subregion.
 */
void memory_region_del_subregion(MemoryRegion *mr,
                                 MemoryRegion *subregion)
{
    memory_region_transaction_begin();

    assert(subregion->container == mr);
    subregion->container = NULL;
    QTAILQ_REMOVE(&mr->subregions, subregion, subregions_link);

    memory_region_unref(subregion);
    /*
     * NOTE(review): subregion->enabled is read after the unref above;
     * this appears to rely on the caller still holding a reference --
     * confirm.
     */
    memory_region_update_pending |= mr->enabled && subregion->enabled;

    memory_region_transaction_commit();
}

/*
 * Change the enabled state of @mr.  Nothing happens when the state is
 * already @enabled; otherwise the change is made inside a transaction
 * and a memory-region update is flagged as pending.
 */
void memory_region_set_enabled(MemoryRegion *mr, bool enabled)
{
    if (mr->enabled != enabled) {
        memory_region_transaction_begin();
        mr->enabled = enabled;
        memory_region_update_pending = true;
        memory_region_transaction_commit();
    }
}
A
Avi Kivity 已提交
1790

1791 1792 1793 1794 1795 1796 1797 1798 1799 1800 1801 1802 1803 1804 1805 1806
/*
 * Resize @mr to @size bytes.  UINT64_MAX is treated specially and
 * stored as int128_2_64().  A no-op when the size does not change.
 */
void memory_region_set_size(MemoryRegion *mr, uint64_t size)
{
    Int128 new_size = (size == UINT64_MAX) ? int128_2_64()
                                           : int128_make64(size);

    if (!int128_eq(new_size, mr->size)) {
        memory_region_transaction_begin();
        mr->size = new_size;
        memory_region_update_pending = true;
        memory_region_transaction_commit();
    }
}

1807
/*
 * Remove @mr from its container and insert it again, all within one
 * transaction.  Does nothing if @mr has no container.
 */
static void memory_region_readd_subregion(MemoryRegion *mr)
{
    MemoryRegion *parent = mr->container;

    if (!parent) {
        return;
    }

    memory_region_transaction_begin();
    /* Hold a reference across the del/re-add pair. */
    memory_region_ref(mr);

    memory_region_del_subregion(parent, mr);
    mr->container = parent;
    memory_region_update_container_subregions(mr);

    memory_region_unref(mr);
    memory_region_transaction_commit();
}
1821

1822 1823 1824 1825 1826 1827
/*
 * Move @mr to @addr.  When the address actually changes, the region is
 * re-added to its container (if it has one).
 */
void memory_region_set_address(MemoryRegion *mr, hwaddr addr)
{
    if (addr == mr->addr) {
        return;
    }

    mr->addr = addr;
    memory_region_readd_subregion(mr);
}

A
Avi Kivity 已提交
1830
/*
 * Change the alias offset of @mr, which must be an alias region
 * (mr->alias is asserted).  A no-op when @offset is already current.
 */
void memory_region_set_alias_offset(MemoryRegion *mr, hwaddr offset)
{
    assert(mr->alias);

    if (offset != mr->alias_offset) {
        memory_region_transaction_begin();
        mr->alias_offset = offset;
        memory_region_update_pending |= mr->enabled;
        memory_region_transaction_commit();
    }
}

1844 1845 1846 1847 1848
/* Return the ram_addr field of @mr. */
ram_addr_t memory_region_get_ram_addr(MemoryRegion *mr)
{
    return mr->ram_addr;
}

1849 1850 1851 1852 1853
/* Return the align field of @mr. */
uint64_t memory_region_get_alignment(const MemoryRegion *mr)
{
    return mr->align;
}

1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866
/*
 * bsearch() comparator: @addr_ is the AddrRange key, @fr_ a FlatRange
 * element.  Returns -1 when the key ends at or before the element's
 * start, 1 when it starts at or after the element's end, and 0 when
 * neither holds.
 */
static int cmp_flatrange_addr(const void *addr_, const void *fr_)
{
    const AddrRange *key = addr_;
    const FlatRange *elem = fr_;

    if (int128_le(addrrange_end(*key), elem->addr.start)) {
        return -1;
    }
    if (int128_ge(key->start, addrrange_end(elem->addr))) {
        return 1;
    }
    return 0;
}

1867
/*
 * Binary-search the ranges of @view with cmp_flatrange_addr() for an
 * entry matching @addr.  Returns the entry found by bsearch(), or NULL
 * if there is none.
 */
static FlatRange *flatview_lookup(FlatView *view, AddrRange addr)
{
    FlatRange *hit;

    hit = bsearch(&addr, view->ranges, view->nr,
                  sizeof(FlatRange), cmp_flatrange_addr);
    return hit;
}

1873
/*
 * Report whether something other than @container itself is found at
 * @addr (relative to @container).
 *
 * Returns true when memory_region_find() yields a region that is not
 * @container, false when it yields nothing or @container itself.
 *
 * memory_region_find() takes a reference on the region it returns, so
 * that reference is dropped on every path where a region came back --
 * including the case where the region found is @container.
 */
bool memory_region_present(MemoryRegion *container, hwaddr addr)
{
    MemoryRegion *mr = memory_region_find(container, addr, 1).mr;
    bool present;

    if (!mr) {
        return false;
    }

    present = (mr != container);
    memory_region_unref(mr);
    return present;
}

1883 1884 1885 1886 1887
/* Return true when @mr has a container, false otherwise. */
bool memory_region_is_mapped(MemoryRegion *mr)
{
    return mr->container != NULL;
}

1888
MemoryRegionSection memory_region_find(MemoryRegion *mr,
A
Avi Kivity 已提交
1889
                                       hwaddr addr, uint64_t size)
1890
{
1891
    MemoryRegionSection ret = { .mr = NULL };
1892 1893 1894
    MemoryRegion *root;
    AddressSpace *as;
    AddrRange range;
1895
    FlatView *view;
1896 1897 1898
    FlatRange *fr;

    addr += mr->addr;
1899 1900
    for (root = mr; root->container; ) {
        root = root->container;
1901 1902
        addr += root->addr;
    }
1903

1904
    as = memory_region_to_address_space(root);
1905 1906 1907
    if (!as) {
        return ret;
    }
1908
    range = addrrange_make(int128_make64(addr), int128_make64(size));
1909

1910 1911
    rcu_read_lock();
    view = atomic_rcu_read(&as->current_map);
1912
    fr = flatview_lookup(view, range);
1913
    if (!fr) {
1914
        goto out;
1915 1916
    }

1917
    while (fr > view->ranges && addrrange_intersects(fr[-1].addr, range)) {
1918 1919 1920 1921
        --fr;
    }

    ret.mr = fr->mr;
1922
    ret.address_space = as;
1923 1924 1925 1926
    range = addrrange_intersection(range, fr->addr);
    ret.offset_within_region = fr->offset_in_region;
    ret.offset_within_region += int128_get64(int128_sub(range.start,
                                                        fr->addr.start));
1927
    ret.size = range.size;
1928
    ret.offset_within_address_space = int128_get64(range.start);
1929
    ret.readonly = fr->readonly;
P
Paolo Bonzini 已提交
1930
    memory_region_ref(ret.mr);
1931 1932
out:
    rcu_read_unlock();
1933 1934 1935
    return ret;
}

1936
/*
 * Invoke the listeners' log_sync hook (in Forward order) for every flat
 * range of @as's flat view.
 */
void address_space_sync_dirty_bitmap(AddressSpace *as)
{
    FlatView *view = address_space_get_flatview(as);
    FlatRange *fr;

    FOR_EACH_FLAT_RANGE(fr, view) {
        MEMORY_LISTENER_UPDATE_REGION(fr, as, Forward, log_sync);
    }

    /* Balance the flat view obtained above. */
    flatview_unref(view);
}

void memory_global_dirty_log_start(void)
{
    global_dirty_log = true;
1951
    MEMORY_LISTENER_CALL_GLOBAL(log_global_start, Forward);
1952 1953 1954 1955 1956
}

void memory_global_dirty_log_stop(void)
{
    global_dirty_log = false;
1957
    MEMORY_LISTENER_CALL_GLOBAL(log_global_stop, Reverse);
1958 1959 1960 1961 1962
}

/*
 * Bring @listener up to date with @as.
 *
 * Skipped entirely when the listener has an address-space filter that
 * is not @as.  Otherwise log_global_start is called if global dirty
 * logging is currently on, followed by region_add for every flat range
 * of @as's flat view (each hook only if the listener provides it).
 */
static void listener_add_address_space(MemoryListener *listener,
                                       AddressSpace *as)
{
    AddressSpace *wanted = listener->address_space_filter;
    FlatView *view;
    FlatRange *fr;

    if (wanted && wanted != as) {
        return;
    }

    if (global_dirty_log && listener->log_global_start) {
        listener->log_global_start(listener);
    }

    view = address_space_get_flatview(as);
    FOR_EACH_FLAT_RANGE(fr, view) {
        MemoryRegionSection section = {
            .mr = fr->mr,
            .address_space = as,
            .offset_within_region = fr->offset_in_region,
            .size = fr->addr.size,
            .offset_within_address_space = int128_get64(fr->addr.start),
            .readonly = fr->readonly,
        };

        if (listener->region_add) {
            listener->region_add(listener, &section);
        }
    }
    flatview_unref(view);
}

1994
/*
 * Register @listener, restricted to @filter (stored as its
 * address_space_filter).
 *
 * The global listener list is kept ordered by ascending priority: the
 * listener goes to the tail when the list is empty or its priority is
 * at least that of the last entry, and otherwise in front of the first
 * entry with a strictly greater priority.  It is then brought up to
 * date with every existing address space.
 */
void memory_listener_register(MemoryListener *listener, AddressSpace *filter)
{
    MemoryListener *other = NULL;
    AddressSpace *as;

    listener->address_space_filter = filter;

    if (!QTAILQ_EMPTY(&memory_listeners)
        && listener->priority < QTAILQ_LAST(&memory_listeners,
                                            memory_listeners)->priority) {
        /* Some entry outranks us, so this scan always stops early. */
        QTAILQ_FOREACH(other, &memory_listeners, link) {
            if (listener->priority < other->priority) {
                break;
            }
        }
        QTAILQ_INSERT_BEFORE(other, listener, link);
    } else {
        QTAILQ_INSERT_TAIL(&memory_listeners, listener, link);
    }

    QTAILQ_FOREACH(as, &address_spaces, address_spaces_link) {
        listener_add_address_space(listener, as);
    }
}

/* Remove @listener from the global memory_listeners list. */
void memory_listener_unregister(MemoryListener *listener)
{
    QTAILQ_REMOVE(&memory_listeners, listener, link);
}
2022

2023
/*
 * Initialise @as with @root as its root region.
 *
 * Takes a reference on @root, gives the address space a freshly
 * initialised flat view and an empty ioeventfd array, appends it to the
 * global address_spaces list and sets up its dispatch.  @name is copied;
 * a NULL name is replaced by "anonymous".
 */
void address_space_init(AddressSpace *as, MemoryRegion *root, const char *name)
{
    memory_region_ref(root);
    memory_region_transaction_begin();

    as->root = root;

    as->current_map = g_new(FlatView, 1);
    flatview_init(as->current_map);

    as->ioeventfd_nb = 0;
    as->ioeventfds = NULL;

    QTAILQ_INSERT_TAIL(&address_spaces, as, address_spaces_link);
    as->name = g_strdup(name ? name : "anonymous");
    address_space_init_dispatch(as);

    memory_region_update_pending |= root->enabled;
    memory_region_transaction_commit();
}
A
Avi Kivity 已提交
2038

2039
/*
 * Deferred half of address_space_destroy(), passed to call_rcu() there.
 *
 * Tears down the dispatch, asserts that no registered listener still
 * filters on @as, then releases the flat view, the name, the ioeventfd
 * array and the reference on the root region.
 */
static void do_address_space_destroy(AddressSpace *as)
{
    MemoryListener *l;

    address_space_destroy_dispatch(as);

    QTAILQ_FOREACH(l, &memory_listeners, link) {
        assert(l->address_space_filter != as);
    }

    flatview_unref(as->current_map);
    g_free(as->name);
    g_free(as->ioeventfds);
    memory_region_unref(as->root);
}

2055 2056
/*
 * Tear down @as.
 *
 * The root is temporarily cleared inside a transaction, the address
 * space is removed from the global list and unregistered, and the rest
 * of the cleanup is deferred to do_address_space_destroy() via
 * call_rcu().
 */
void address_space_destroy(AddressSpace *as)
{
    MemoryRegion *saved_root = as->root;

    /* Flush out anything from MemoryListeners listening in on this */
    memory_region_transaction_begin();
    as->root = NULL;
    memory_region_transaction_commit();

    QTAILQ_REMOVE(&address_spaces, as, address_spaces_link);
    address_space_unregister(as);

    /* At this point, as->dispatch and as->current_map are dummy
     * entries that the guest should never use.  Wait for the old
     * values to expire before freeing the data.
     */
    as->root = saved_root;   /* restored so the deferred destroy can unref it */
    call_rcu(as, do_address_space_destroy, rcu);
}

B
Blue Swirl 已提交
2074 2075 2076 2077 2078 2079 2080 2081 2082 2083 2084
/* Queue node used by the mtree printing code below. */
typedef struct MemoryRegionList MemoryRegionList;

struct MemoryRegionList {
    const MemoryRegion *mr;               /* region this node refers to */
    QTAILQ_ENTRY(MemoryRegionList) queue; /* linkage within the queue */
};

/* Head of a tail queue of MemoryRegionList nodes. */
typedef QTAILQ_HEAD(queue, MemoryRegionList) MemoryRegionListHead;

static void mtree_print_mr(fprintf_function mon_printf, void *f,
                           const MemoryRegion *mr, unsigned int level,
A
Avi Kivity 已提交
2085
                           hwaddr base,
2086
                           MemoryRegionListHead *alias_print_queue)
B
Blue Swirl 已提交
2087
{
2088 2089
    MemoryRegionList *new_ml, *ml, *next_ml;
    MemoryRegionListHead submr_print_queue;
B
Blue Swirl 已提交
2090 2091 2092
    const MemoryRegion *submr;
    unsigned int i;

2093
    if (!mr) {
B
Blue Swirl 已提交
2094 2095 2096 2097 2098 2099 2100 2101 2102 2103 2104 2105
        return;
    }

    for (i = 0; i < level; i++) {
        mon_printf(f, "  ");
    }

    if (mr->alias) {
        MemoryRegionList *ml;
        bool found = false;

        /* check if the alias is already in the queue */
2106
        QTAILQ_FOREACH(ml, alias_print_queue, queue) {
P
Paolo Bonzini 已提交
2107
            if (ml->mr == mr->alias) {
B
Blue Swirl 已提交
2108 2109 2110 2111 2112 2113 2114
                found = true;
            }
        }

        if (!found) {
            ml = g_new(MemoryRegionList, 1);
            ml->mr = mr->alias;
2115
            QTAILQ_INSERT_TAIL(alias_print_queue, ml, queue);
B
Blue Swirl 已提交
2116
        }
2117 2118
        mon_printf(f, TARGET_FMT_plx "-" TARGET_FMT_plx
                   " (prio %d, %c%c): alias %s @%s " TARGET_FMT_plx
2119
                   "-" TARGET_FMT_plx "%s\n",
B
Blue Swirl 已提交
2120
                   base + mr->addr,
2121
                   base + mr->addr
2122 2123 2124
                   + (int128_nz(mr->size) ?
                      (hwaddr)int128_get64(int128_sub(mr->size,
                                                      int128_one())) : 0),
J
Jan Kiszka 已提交
2125
                   mr->priority,
2126 2127 2128
                   mr->romd_mode ? 'R' : '-',
                   !mr->readonly && !(mr->rom_device && mr->romd_mode) ? 'W'
                                                                       : '-',
2129 2130
                   memory_region_name(mr),
                   memory_region_name(mr->alias),
B
Blue Swirl 已提交
2131
                   mr->alias_offset,
2132
                   mr->alias_offset
2133 2134
                   + (int128_nz(mr->size) ?
                      (hwaddr)int128_get64(int128_sub(mr->size,
2135 2136
                                                      int128_one())) : 0),
                   mr->enabled ? "" : " [disabled]");
B
Blue Swirl 已提交
2137
    } else {
2138
        mon_printf(f,
2139
                   TARGET_FMT_plx "-" TARGET_FMT_plx " (prio %d, %c%c): %s%s\n",
B
Blue Swirl 已提交
2140
                   base + mr->addr,
2141
                   base + mr->addr
2142 2143 2144
                   + (int128_nz(mr->size) ?
                      (hwaddr)int128_get64(int128_sub(mr->size,
                                                      int128_one())) : 0),
J
Jan Kiszka 已提交
2145
                   mr->priority,
2146 2147 2148
                   mr->romd_mode ? 'R' : '-',
                   !mr->readonly && !(mr->rom_device && mr->romd_mode) ? 'W'
                                                                       : '-',
2149 2150
                   memory_region_name(mr),
                   mr->enabled ? "" : " [disabled]");
B
Blue Swirl 已提交
2151
    }
2152 2153 2154

    QTAILQ_INIT(&submr_print_queue);

B
Blue Swirl 已提交
2155
    QTAILQ_FOREACH(submr, &mr->subregions, subregions_link) {
2156 2157 2158 2159 2160 2161 2162 2163 2164 2165 2166 2167 2168 2169 2170 2171 2172 2173 2174 2175 2176
        new_ml = g_new(MemoryRegionList, 1);
        new_ml->mr = submr;
        QTAILQ_FOREACH(ml, &submr_print_queue, queue) {
            if (new_ml->mr->addr < ml->mr->addr ||
                (new_ml->mr->addr == ml->mr->addr &&
                 new_ml->mr->priority > ml->mr->priority)) {
                QTAILQ_INSERT_BEFORE(ml, new_ml, queue);
                new_ml = NULL;
                break;
            }
        }
        if (new_ml) {
            QTAILQ_INSERT_TAIL(&submr_print_queue, new_ml, queue);
        }
    }

    QTAILQ_FOREACH(ml, &submr_print_queue, queue) {
        mtree_print_mr(mon_printf, f, ml->mr, level + 1, base + mr->addr,
                       alias_print_queue);
    }

A
Avi Kivity 已提交
2177
    QTAILQ_FOREACH_SAFE(ml, &submr_print_queue, queue, next_ml) {
2178
        g_free(ml);
B
Blue Swirl 已提交
2179 2180 2181 2182 2183 2184 2185
    }
}

/*
 * Print the region tree of every address space through @mon_printf,
 * then the tree of every alias target collected while doing so.
 *
 * Printing an alias target may append further targets to the queue;
 * they are picked up by the same loop because new entries are added at
 * the tail.  All queue nodes are freed before returning.
 */
void mtree_info(fprintf_function mon_printf, void *f)
{
    MemoryRegionListHead aliases;
    MemoryRegionList *entry, *next;
    AddressSpace *as;

    QTAILQ_INIT(&aliases);

    QTAILQ_FOREACH(as, &address_spaces, address_spaces_link) {
        mon_printf(f, "address-space: %s\n", as->name);
        mtree_print_mr(mon_printf, f, as->root, 1, 0, &aliases);
        mon_printf(f, "\n");
    }

    /* print aliased regions */
    QTAILQ_FOREACH(entry, &aliases, queue) {
        mon_printf(f, "memory-region: %s\n", memory_region_name(entry->mr));
        mtree_print_mr(mon_printf, f, entry->mr, 1, 0, &aliases);
        mon_printf(f, "\n");
    }

    QTAILQ_FOREACH_SAFE(entry, &aliases, queue, next) {
        g_free(entry);
    }
}
P
Peter Crosthwaite 已提交
2207 2208 2209 2210 2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221

/*
 * Type description for TYPE_MEMORY_REGION: a child of TYPE_OBJECT whose
 * instances are MemoryRegion-sized, set up by memory_region_initfn()
 * and finalized by memory_region_finalize().
 */
static const TypeInfo memory_region_info = {
    .parent             = TYPE_OBJECT,
    .name               = TYPE_MEMORY_REGION,
    .instance_size      = sizeof(MemoryRegion),
    .instance_init      = memory_region_initfn,
    .instance_finalize  = memory_region_finalize,
};

/* Register memory_region_info via type_register_static(). */
static void memory_register_types(void)
{
    type_register_static(&memory_region_info);
}

/* NOTE(review): presumably arranges for the function to run at startup -- confirm. */
type_init(memory_register_types)