]> git.ipfire.org Git - thirdparty/qemu.git/blame - exec.c
memory: s/dirty/clean/ in cpu_physical_memory_is_dirty()
[thirdparty/qemu.git] / exec.c
CommitLineData
54936004 1/*
5b6dd868 2 * Virtual page mapping
5fafdf24 3 *
54936004
FB
4 * Copyright (c) 2003 Fabrice Bellard
5 *
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
10 *
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
8167ee88 17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
54936004 18 */
67b915a5 19#include "config.h"
d5a8f07c
FB
20#ifdef _WIN32
21#include <windows.h>
22#else
a98d49b1 23#include <sys/types.h>
d5a8f07c
FB
24#include <sys/mman.h>
25#endif
54936004 26
055403b2 27#include "qemu-common.h"
6180a181 28#include "cpu.h"
b67d9a52 29#include "tcg.h"
b3c7724c 30#include "hw/hw.h"
cc9e98cb 31#include "hw/qdev.h"
1de7afc9 32#include "qemu/osdep.h"
9c17d615 33#include "sysemu/kvm.h"
2ff3de68 34#include "sysemu/sysemu.h"
0d09e41a 35#include "hw/xen/xen.h"
1de7afc9
PB
36#include "qemu/timer.h"
37#include "qemu/config-file.h"
022c62cb 38#include "exec/memory.h"
9c17d615 39#include "sysemu/dma.h"
022c62cb 40#include "exec/address-spaces.h"
53a5960a
PB
41#if defined(CONFIG_USER_ONLY)
42#include <qemu.h>
432d268c 43#else /* !CONFIG_USER_ONLY */
9c17d615 44#include "sysemu/xen-mapcache.h"
6506e4f9 45#include "trace.h"
53a5960a 46#endif
0d6d3c87 47#include "exec/cpu-all.h"
54936004 48
022c62cb 49#include "exec/cputlb.h"
5b6dd868 50#include "translate-all.h"
0cac1b66 51
022c62cb 52#include "exec/memory-internal.h"
582b55a9 53#include "qemu/cache-utils.h"
67d95c15 54
b35ba30f
MT
55#include "qemu/range.h"
56
db7b5426 57//#define DEBUG_SUBPAGE
1196be37 58
e2eef170 59#if !defined(CONFIG_USER_ONLY)
74576198 60static int in_migration;
94a6b54f 61
a3161038 62RAMList ram_list = { .blocks = QTAILQ_HEAD_INITIALIZER(ram_list.blocks) };
62152b8a
AK
63
64static MemoryRegion *system_memory;
309cb471 65static MemoryRegion *system_io;
62152b8a 66
f6790af6
AK
67AddressSpace address_space_io;
68AddressSpace address_space_memory;
2673a5da 69
0844e007 70MemoryRegion io_mem_rom, io_mem_notdirty;
acc9d80b 71static MemoryRegion io_mem_unassigned;
0e0df1e2 72
e2eef170 73#endif
9fa3e853 74
bdc44640 75struct CPUTailQ cpus = QTAILQ_HEAD_INITIALIZER(cpus);
6a00d601
FB
76/* current CPU in the current thread. It is only valid inside
77 cpu_exec() */
4917cf44 78DEFINE_TLS(CPUState *, current_cpu);
2e70f6ef 79/* 0 = Do not count executed instructions.
bf20dc07 80 1 = Precise instruction counting.
2e70f6ef 81 2 = Adaptive rate instruction counting. */
5708fc66 82int use_icount;
6a00d601 83
e2eef170 84#if !defined(CONFIG_USER_ONLY)
4346ae3e 85
1db8abb1
PB
86typedef struct PhysPageEntry PhysPageEntry;
87
88struct PhysPageEntry {
9736e55b 89 /* How many bits skip to next level (in units of L2_SIZE). 0 for a leaf. */
8b795765 90 uint32_t skip : 6;
9736e55b 91 /* index into phys_sections (!skip) or phys_map_nodes (skip) */
8b795765 92 uint32_t ptr : 26;
1db8abb1
PB
93};
94
8b795765
MT
95#define PHYS_MAP_NODE_NIL (((uint32_t)~0) >> 6)
96
03f49957 97/* Size of the L2 (and L3, etc) page tables. */
57271d63 98#define ADDR_SPACE_BITS 64
03f49957 99
026736ce 100#define P_L2_BITS 9
03f49957
PB
101#define P_L2_SIZE (1 << P_L2_BITS)
102
103#define P_L2_LEVELS (((ADDR_SPACE_BITS - TARGET_PAGE_BITS - 1) / P_L2_BITS) + 1)
104
105typedef PhysPageEntry Node[P_L2_SIZE];
0475d94f 106
53cb28cb
MA
107typedef struct PhysPageMap {
108 unsigned sections_nb;
109 unsigned sections_nb_alloc;
110 unsigned nodes_nb;
111 unsigned nodes_nb_alloc;
112 Node *nodes;
113 MemoryRegionSection *sections;
114} PhysPageMap;
115
1db8abb1
PB
116struct AddressSpaceDispatch {
117 /* This is a multi-level map on the physical address space.
118 * The bottom level has pointers to MemoryRegionSections.
119 */
120 PhysPageEntry phys_map;
53cb28cb 121 PhysPageMap map;
acc9d80b 122 AddressSpace *as;
1db8abb1
PB
123};
124
90260c6c
JK
125#define SUBPAGE_IDX(addr) ((addr) & ~TARGET_PAGE_MASK)
126typedef struct subpage_t {
127 MemoryRegion iomem;
acc9d80b 128 AddressSpace *as;
90260c6c
JK
129 hwaddr base;
130 uint16_t sub_section[TARGET_PAGE_SIZE];
131} subpage_t;
132
b41aac4f
LPF
133#define PHYS_SECTION_UNASSIGNED 0
134#define PHYS_SECTION_NOTDIRTY 1
135#define PHYS_SECTION_ROM 2
136#define PHYS_SECTION_WATCH 3
5312bd8b 137
e2eef170 138static void io_mem_init(void);
62152b8a 139static void memory_map_init(void);
e2eef170 140
1ec9b909 141static MemoryRegion io_mem_watch;
6658ffb8 142#endif
fd6ce8f6 143
6d9a1304 144#if !defined(CONFIG_USER_ONLY)
d6f2ea22 145
53cb28cb 146static void phys_map_node_reserve(PhysPageMap *map, unsigned nodes)
d6f2ea22 147{
53cb28cb
MA
148 if (map->nodes_nb + nodes > map->nodes_nb_alloc) {
149 map->nodes_nb_alloc = MAX(map->nodes_nb_alloc * 2, 16);
150 map->nodes_nb_alloc = MAX(map->nodes_nb_alloc, map->nodes_nb + nodes);
151 map->nodes = g_renew(Node, map->nodes, map->nodes_nb_alloc);
d6f2ea22 152 }
f7bf5461
AK
153}
154
53cb28cb 155static uint32_t phys_map_node_alloc(PhysPageMap *map)
f7bf5461
AK
156{
157 unsigned i;
8b795765 158 uint32_t ret;
f7bf5461 159
53cb28cb 160 ret = map->nodes_nb++;
f7bf5461 161 assert(ret != PHYS_MAP_NODE_NIL);
53cb28cb 162 assert(ret != map->nodes_nb_alloc);
03f49957 163 for (i = 0; i < P_L2_SIZE; ++i) {
53cb28cb
MA
164 map->nodes[ret][i].skip = 1;
165 map->nodes[ret][i].ptr = PHYS_MAP_NODE_NIL;
d6f2ea22 166 }
f7bf5461 167 return ret;
d6f2ea22
AK
168}
169
53cb28cb
MA
170static void phys_page_set_level(PhysPageMap *map, PhysPageEntry *lp,
171 hwaddr *index, hwaddr *nb, uint16_t leaf,
2999097b 172 int level)
f7bf5461
AK
173{
174 PhysPageEntry *p;
175 int i;
03f49957 176 hwaddr step = (hwaddr)1 << (level * P_L2_BITS);
108c49b8 177
9736e55b 178 if (lp->skip && lp->ptr == PHYS_MAP_NODE_NIL) {
53cb28cb
MA
179 lp->ptr = phys_map_node_alloc(map);
180 p = map->nodes[lp->ptr];
f7bf5461 181 if (level == 0) {
03f49957 182 for (i = 0; i < P_L2_SIZE; i++) {
9736e55b 183 p[i].skip = 0;
b41aac4f 184 p[i].ptr = PHYS_SECTION_UNASSIGNED;
4346ae3e 185 }
67c4d23c 186 }
f7bf5461 187 } else {
53cb28cb 188 p = map->nodes[lp->ptr];
92e873b9 189 }
03f49957 190 lp = &p[(*index >> (level * P_L2_BITS)) & (P_L2_SIZE - 1)];
f7bf5461 191
03f49957 192 while (*nb && lp < &p[P_L2_SIZE]) {
07f07b31 193 if ((*index & (step - 1)) == 0 && *nb >= step) {
9736e55b 194 lp->skip = 0;
c19e8800 195 lp->ptr = leaf;
07f07b31
AK
196 *index += step;
197 *nb -= step;
2999097b 198 } else {
53cb28cb 199 phys_page_set_level(map, lp, index, nb, leaf, level - 1);
2999097b
AK
200 }
201 ++lp;
f7bf5461
AK
202 }
203}
204
ac1970fb 205static void phys_page_set(AddressSpaceDispatch *d,
a8170e5e 206 hwaddr index, hwaddr nb,
2999097b 207 uint16_t leaf)
f7bf5461 208{
2999097b 209 /* Wildly overreserve - it doesn't matter much. */
53cb28cb 210 phys_map_node_reserve(&d->map, 3 * P_L2_LEVELS);
5cd2c5b6 211
53cb28cb 212 phys_page_set_level(&d->map, &d->phys_map, &index, &nb, leaf, P_L2_LEVELS - 1);
92e873b9
FB
213}
214
b35ba30f
MT
215/* Compact a non leaf page entry. Simply detect that the entry has a single child,
216 * and update our entry so we can skip it and go directly to the destination.
217 */
218static void phys_page_compact(PhysPageEntry *lp, Node *nodes, unsigned long *compacted)
219{
220 unsigned valid_ptr = P_L2_SIZE;
221 int valid = 0;
222 PhysPageEntry *p;
223 int i;
224
225 if (lp->ptr == PHYS_MAP_NODE_NIL) {
226 return;
227 }
228
229 p = nodes[lp->ptr];
230 for (i = 0; i < P_L2_SIZE; i++) {
231 if (p[i].ptr == PHYS_MAP_NODE_NIL) {
232 continue;
233 }
234
235 valid_ptr = i;
236 valid++;
237 if (p[i].skip) {
238 phys_page_compact(&p[i], nodes, compacted);
239 }
240 }
241
242 /* We can only compress if there's only one child. */
243 if (valid != 1) {
244 return;
245 }
246
247 assert(valid_ptr < P_L2_SIZE);
248
249 /* Don't compress if it won't fit in the # of bits we have. */
250 if (lp->skip + p[valid_ptr].skip >= (1 << 3)) {
251 return;
252 }
253
254 lp->ptr = p[valid_ptr].ptr;
255 if (!p[valid_ptr].skip) {
256 /* If our only child is a leaf, make this a leaf. */
257 /* By design, we should have made this node a leaf to begin with so we
258 * should never reach here.
259 * But since it's so simple to handle this, let's do it just in case we
260 * change this rule.
261 */
262 lp->skip = 0;
263 } else {
264 lp->skip += p[valid_ptr].skip;
265 }
266}
267
268static void phys_page_compact_all(AddressSpaceDispatch *d, int nodes_nb)
269{
270 DECLARE_BITMAP(compacted, nodes_nb);
271
272 if (d->phys_map.skip) {
53cb28cb 273 phys_page_compact(&d->phys_map, d->map.nodes, compacted);
b35ba30f
MT
274 }
275}
276
97115a8d 277static MemoryRegionSection *phys_page_find(PhysPageEntry lp, hwaddr addr,
9affd6fc 278 Node *nodes, MemoryRegionSection *sections)
92e873b9 279{
31ab2b4a 280 PhysPageEntry *p;
97115a8d 281 hwaddr index = addr >> TARGET_PAGE_BITS;
31ab2b4a 282 int i;
f1f6e3b8 283
9736e55b 284 for (i = P_L2_LEVELS; lp.skip && (i -= lp.skip) >= 0;) {
c19e8800 285 if (lp.ptr == PHYS_MAP_NODE_NIL) {
9affd6fc 286 return &sections[PHYS_SECTION_UNASSIGNED];
31ab2b4a 287 }
9affd6fc 288 p = nodes[lp.ptr];
03f49957 289 lp = p[(index >> (i * P_L2_BITS)) & (P_L2_SIZE - 1)];
5312bd8b 290 }
b35ba30f
MT
291
292 if (sections[lp.ptr].size.hi ||
293 range_covers_byte(sections[lp.ptr].offset_within_address_space,
294 sections[lp.ptr].size.lo, addr)) {
295 return &sections[lp.ptr];
296 } else {
297 return &sections[PHYS_SECTION_UNASSIGNED];
298 }
f3705d53
AK
299}
300
e5548617
BS
301bool memory_region_is_unassigned(MemoryRegion *mr)
302{
2a8e7499 303 return mr != &io_mem_rom && mr != &io_mem_notdirty && !mr->rom_device
5b6dd868 304 && mr != &io_mem_watch;
fd6ce8f6 305}
149f54b5 306
c7086b4a 307static MemoryRegionSection *address_space_lookup_region(AddressSpaceDispatch *d,
90260c6c
JK
308 hwaddr addr,
309 bool resolve_subpage)
9f029603 310{
90260c6c
JK
311 MemoryRegionSection *section;
312 subpage_t *subpage;
313
53cb28cb 314 section = phys_page_find(d->phys_map, addr, d->map.nodes, d->map.sections);
90260c6c
JK
315 if (resolve_subpage && section->mr->subpage) {
316 subpage = container_of(section->mr, subpage_t, iomem);
53cb28cb 317 section = &d->map.sections[subpage->sub_section[SUBPAGE_IDX(addr)]];
90260c6c
JK
318 }
319 return section;
9f029603
JK
320}
321
90260c6c 322static MemoryRegionSection *
c7086b4a 323address_space_translate_internal(AddressSpaceDispatch *d, hwaddr addr, hwaddr *xlat,
90260c6c 324 hwaddr *plen, bool resolve_subpage)
149f54b5
PB
325{
326 MemoryRegionSection *section;
327 Int128 diff;
328
c7086b4a 329 section = address_space_lookup_region(d, addr, resolve_subpage);
149f54b5
PB
330 /* Compute offset within MemoryRegionSection */
331 addr -= section->offset_within_address_space;
332
333 /* Compute offset within MemoryRegion */
334 *xlat = addr + section->offset_within_region;
335
336 diff = int128_sub(section->mr->size, int128_make64(addr));
3752a036 337 *plen = int128_get64(int128_min(diff, int128_make64(*plen)));
149f54b5
PB
338 return section;
339}
90260c6c 340
5c8a00ce
PB
341MemoryRegion *address_space_translate(AddressSpace *as, hwaddr addr,
342 hwaddr *xlat, hwaddr *plen,
343 bool is_write)
90260c6c 344{
30951157
AK
345 IOMMUTLBEntry iotlb;
346 MemoryRegionSection *section;
347 MemoryRegion *mr;
348 hwaddr len = *plen;
349
350 for (;;) {
c7086b4a 351 section = address_space_translate_internal(as->dispatch, addr, &addr, plen, true);
30951157
AK
352 mr = section->mr;
353
354 if (!mr->iommu_ops) {
355 break;
356 }
357
358 iotlb = mr->iommu_ops->translate(mr, addr);
359 addr = ((iotlb.translated_addr & ~iotlb.addr_mask)
360 | (addr & iotlb.addr_mask));
361 len = MIN(len, (addr | iotlb.addr_mask) - addr + 1);
362 if (!(iotlb.perm & (1 << is_write))) {
363 mr = &io_mem_unassigned;
364 break;
365 }
366
367 as = iotlb.target_as;
368 }
369
370 *plen = len;
371 *xlat = addr;
372 return mr;
90260c6c
JK
373}
374
375MemoryRegionSection *
376address_space_translate_for_iotlb(AddressSpace *as, hwaddr addr, hwaddr *xlat,
377 hwaddr *plen)
378{
30951157 379 MemoryRegionSection *section;
c7086b4a 380 section = address_space_translate_internal(as->dispatch, addr, xlat, plen, false);
30951157
AK
381
382 assert(!section->mr->iommu_ops);
383 return section;
90260c6c 384}
5b6dd868 385#endif
fd6ce8f6 386
5b6dd868 387void cpu_exec_init_all(void)
fdbb84d1 388{
5b6dd868 389#if !defined(CONFIG_USER_ONLY)
b2a8658e 390 qemu_mutex_init(&ram_list.mutex);
5b6dd868
BS
391 memory_map_init();
392 io_mem_init();
fdbb84d1 393#endif
5b6dd868 394}
fdbb84d1 395
b170fce3 396#if !defined(CONFIG_USER_ONLY)
5b6dd868
BS
397
398static int cpu_common_post_load(void *opaque, int version_id)
fd6ce8f6 399{
259186a7 400 CPUState *cpu = opaque;
a513fe19 401
5b6dd868
BS
402 /* 0x01 was CPU_INTERRUPT_EXIT. This line can be removed when the
403 version_id is increased. */
259186a7
AF
404 cpu->interrupt_request &= ~0x01;
405 tlb_flush(cpu->env_ptr, 1);
5b6dd868
BS
406
407 return 0;
a513fe19 408}
7501267e 409
1a1562f5 410const VMStateDescription vmstate_cpu_common = {
5b6dd868
BS
411 .name = "cpu_common",
412 .version_id = 1,
413 .minimum_version_id = 1,
414 .minimum_version_id_old = 1,
415 .post_load = cpu_common_post_load,
416 .fields = (VMStateField []) {
259186a7
AF
417 VMSTATE_UINT32(halted, CPUState),
418 VMSTATE_UINT32(interrupt_request, CPUState),
5b6dd868
BS
419 VMSTATE_END_OF_LIST()
420 }
421};
1a1562f5 422
5b6dd868 423#endif
ea041c0e 424
38d8f5c8 425CPUState *qemu_get_cpu(int index)
ea041c0e 426{
bdc44640 427 CPUState *cpu;
ea041c0e 428
bdc44640 429 CPU_FOREACH(cpu) {
55e5c285 430 if (cpu->cpu_index == index) {
bdc44640 431 return cpu;
55e5c285 432 }
ea041c0e 433 }
5b6dd868 434
bdc44640 435 return NULL;
ea041c0e
FB
436}
437
5b6dd868 438void cpu_exec_init(CPUArchState *env)
ea041c0e 439{
5b6dd868 440 CPUState *cpu = ENV_GET_CPU(env);
b170fce3 441 CPUClass *cc = CPU_GET_CLASS(cpu);
bdc44640 442 CPUState *some_cpu;
5b6dd868
BS
443 int cpu_index;
444
445#if defined(CONFIG_USER_ONLY)
446 cpu_list_lock();
447#endif
5b6dd868 448 cpu_index = 0;
bdc44640 449 CPU_FOREACH(some_cpu) {
5b6dd868
BS
450 cpu_index++;
451 }
55e5c285 452 cpu->cpu_index = cpu_index;
1b1ed8dc 453 cpu->numa_node = 0;
5b6dd868
BS
454 QTAILQ_INIT(&env->breakpoints);
455 QTAILQ_INIT(&env->watchpoints);
456#ifndef CONFIG_USER_ONLY
457 cpu->thread_id = qemu_get_thread_id();
458#endif
bdc44640 459 QTAILQ_INSERT_TAIL(&cpus, cpu, node);
5b6dd868
BS
460#if defined(CONFIG_USER_ONLY)
461 cpu_list_unlock();
462#endif
e0d47944
AF
463 if (qdev_get_vmsd(DEVICE(cpu)) == NULL) {
464 vmstate_register(NULL, cpu_index, &vmstate_cpu_common, cpu);
465 }
5b6dd868 466#if defined(CPU_SAVE_VERSION) && !defined(CONFIG_USER_ONLY)
5b6dd868
BS
467 register_savevm(NULL, "cpu", cpu_index, CPU_SAVE_VERSION,
468 cpu_save, cpu_load, env);
b170fce3 469 assert(cc->vmsd == NULL);
e0d47944 470 assert(qdev_get_vmsd(DEVICE(cpu)) == NULL);
5b6dd868 471#endif
b170fce3
AF
472 if (cc->vmsd != NULL) {
473 vmstate_register(NULL, cpu_index, cc->vmsd, cpu);
474 }
ea041c0e
FB
475}
476
1fddef4b 477#if defined(TARGET_HAS_ICE)
94df27fd 478#if defined(CONFIG_USER_ONLY)
00b941e5 479static void breakpoint_invalidate(CPUState *cpu, target_ulong pc)
94df27fd
PB
480{
481 tb_invalidate_phys_page_range(pc, pc + 1, 0);
482}
483#else
00b941e5 484static void breakpoint_invalidate(CPUState *cpu, target_ulong pc)
1e7855a5 485{
e8262a1b
MF
486 hwaddr phys = cpu_get_phys_page_debug(cpu, pc);
487 if (phys != -1) {
488 tb_invalidate_phys_addr(phys | (pc & ~TARGET_PAGE_MASK));
489 }
1e7855a5 490}
c27004ec 491#endif
94df27fd 492#endif /* TARGET_HAS_ICE */
d720b93d 493
c527ee8f 494#if defined(CONFIG_USER_ONLY)
9349b4f9 495void cpu_watchpoint_remove_all(CPUArchState *env, int mask)
c527ee8f
PB
496
497{
498}
499
9349b4f9 500int cpu_watchpoint_insert(CPUArchState *env, target_ulong addr, target_ulong len,
c527ee8f
PB
501 int flags, CPUWatchpoint **watchpoint)
502{
503 return -ENOSYS;
504}
505#else
6658ffb8 506/* Add a watchpoint. */
9349b4f9 507int cpu_watchpoint_insert(CPUArchState *env, target_ulong addr, target_ulong len,
a1d1bb31 508 int flags, CPUWatchpoint **watchpoint)
6658ffb8 509{
b4051334 510 target_ulong len_mask = ~(len - 1);
c0ce998e 511 CPUWatchpoint *wp;
6658ffb8 512
b4051334 513 /* sanity checks: allow power-of-2 lengths, deny unaligned watchpoints */
0dc23828
MF
514 if ((len & (len - 1)) || (addr & ~len_mask) ||
515 len == 0 || len > TARGET_PAGE_SIZE) {
b4051334
AL
516 fprintf(stderr, "qemu: tried to set invalid watchpoint at "
517 TARGET_FMT_lx ", len=" TARGET_FMT_lu "\n", addr, len);
518 return -EINVAL;
519 }
7267c094 520 wp = g_malloc(sizeof(*wp));
a1d1bb31
AL
521
522 wp->vaddr = addr;
b4051334 523 wp->len_mask = len_mask;
a1d1bb31
AL
524 wp->flags = flags;
525
2dc9f411 526 /* keep all GDB-injected watchpoints in front */
c0ce998e 527 if (flags & BP_GDB)
72cf2d4f 528 QTAILQ_INSERT_HEAD(&env->watchpoints, wp, entry);
c0ce998e 529 else
72cf2d4f 530 QTAILQ_INSERT_TAIL(&env->watchpoints, wp, entry);
6658ffb8 531
6658ffb8 532 tlb_flush_page(env, addr);
a1d1bb31
AL
533
534 if (watchpoint)
535 *watchpoint = wp;
536 return 0;
6658ffb8
PB
537}
538
a1d1bb31 539/* Remove a specific watchpoint. */
9349b4f9 540int cpu_watchpoint_remove(CPUArchState *env, target_ulong addr, target_ulong len,
a1d1bb31 541 int flags)
6658ffb8 542{
b4051334 543 target_ulong len_mask = ~(len - 1);
a1d1bb31 544 CPUWatchpoint *wp;
6658ffb8 545
72cf2d4f 546 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
b4051334 547 if (addr == wp->vaddr && len_mask == wp->len_mask
6e140f28 548 && flags == (wp->flags & ~BP_WATCHPOINT_HIT)) {
a1d1bb31 549 cpu_watchpoint_remove_by_ref(env, wp);
6658ffb8
PB
550 return 0;
551 }
552 }
a1d1bb31 553 return -ENOENT;
6658ffb8
PB
554}
555
a1d1bb31 556/* Remove a specific watchpoint by reference. */
9349b4f9 557void cpu_watchpoint_remove_by_ref(CPUArchState *env, CPUWatchpoint *watchpoint)
a1d1bb31 558{
72cf2d4f 559 QTAILQ_REMOVE(&env->watchpoints, watchpoint, entry);
7d03f82f 560
a1d1bb31
AL
561 tlb_flush_page(env, watchpoint->vaddr);
562
7267c094 563 g_free(watchpoint);
a1d1bb31
AL
564}
565
566/* Remove all matching watchpoints. */
9349b4f9 567void cpu_watchpoint_remove_all(CPUArchState *env, int mask)
a1d1bb31 568{
c0ce998e 569 CPUWatchpoint *wp, *next;
a1d1bb31 570
72cf2d4f 571 QTAILQ_FOREACH_SAFE(wp, &env->watchpoints, entry, next) {
a1d1bb31
AL
572 if (wp->flags & mask)
573 cpu_watchpoint_remove_by_ref(env, wp);
c0ce998e 574 }
7d03f82f 575}
c527ee8f 576#endif
7d03f82f 577
a1d1bb31 578/* Add a breakpoint. */
9349b4f9 579int cpu_breakpoint_insert(CPUArchState *env, target_ulong pc, int flags,
a1d1bb31 580 CPUBreakpoint **breakpoint)
4c3a88a2 581{
1fddef4b 582#if defined(TARGET_HAS_ICE)
c0ce998e 583 CPUBreakpoint *bp;
3b46e624 584
7267c094 585 bp = g_malloc(sizeof(*bp));
4c3a88a2 586
a1d1bb31
AL
587 bp->pc = pc;
588 bp->flags = flags;
589
2dc9f411 590 /* keep all GDB-injected breakpoints in front */
00b941e5 591 if (flags & BP_GDB) {
72cf2d4f 592 QTAILQ_INSERT_HEAD(&env->breakpoints, bp, entry);
00b941e5 593 } else {
72cf2d4f 594 QTAILQ_INSERT_TAIL(&env->breakpoints, bp, entry);
00b941e5 595 }
3b46e624 596
00b941e5 597 breakpoint_invalidate(ENV_GET_CPU(env), pc);
a1d1bb31 598
00b941e5 599 if (breakpoint) {
a1d1bb31 600 *breakpoint = bp;
00b941e5 601 }
4c3a88a2
FB
602 return 0;
603#else
a1d1bb31 604 return -ENOSYS;
4c3a88a2
FB
605#endif
606}
607
a1d1bb31 608/* Remove a specific breakpoint. */
9349b4f9 609int cpu_breakpoint_remove(CPUArchState *env, target_ulong pc, int flags)
a1d1bb31 610{
7d03f82f 611#if defined(TARGET_HAS_ICE)
a1d1bb31
AL
612 CPUBreakpoint *bp;
613
72cf2d4f 614 QTAILQ_FOREACH(bp, &env->breakpoints, entry) {
a1d1bb31
AL
615 if (bp->pc == pc && bp->flags == flags) {
616 cpu_breakpoint_remove_by_ref(env, bp);
617 return 0;
618 }
7d03f82f 619 }
a1d1bb31
AL
620 return -ENOENT;
621#else
622 return -ENOSYS;
7d03f82f
EI
623#endif
624}
625
a1d1bb31 626/* Remove a specific breakpoint by reference. */
9349b4f9 627void cpu_breakpoint_remove_by_ref(CPUArchState *env, CPUBreakpoint *breakpoint)
4c3a88a2 628{
1fddef4b 629#if defined(TARGET_HAS_ICE)
72cf2d4f 630 QTAILQ_REMOVE(&env->breakpoints, breakpoint, entry);
d720b93d 631
00b941e5 632 breakpoint_invalidate(ENV_GET_CPU(env), breakpoint->pc);
a1d1bb31 633
7267c094 634 g_free(breakpoint);
a1d1bb31
AL
635#endif
636}
637
638/* Remove all matching breakpoints. */
9349b4f9 639void cpu_breakpoint_remove_all(CPUArchState *env, int mask)
a1d1bb31
AL
640{
641#if defined(TARGET_HAS_ICE)
c0ce998e 642 CPUBreakpoint *bp, *next;
a1d1bb31 643
72cf2d4f 644 QTAILQ_FOREACH_SAFE(bp, &env->breakpoints, entry, next) {
a1d1bb31
AL
645 if (bp->flags & mask)
646 cpu_breakpoint_remove_by_ref(env, bp);
c0ce998e 647 }
4c3a88a2
FB
648#endif
649}
650
c33a346e
FB
651/* enable or disable single step mode. EXCP_DEBUG is returned by the
652 CPU loop after each instruction */
3825b28f 653void cpu_single_step(CPUState *cpu, int enabled)
c33a346e 654{
1fddef4b 655#if defined(TARGET_HAS_ICE)
ed2803da
AF
656 if (cpu->singlestep_enabled != enabled) {
657 cpu->singlestep_enabled = enabled;
658 if (kvm_enabled()) {
38e478ec 659 kvm_update_guest_debug(cpu, 0);
ed2803da 660 } else {
ccbb4d44 661 /* must flush all the translated code to avoid inconsistencies */
e22a25c9 662 /* XXX: only flush what is necessary */
38e478ec 663 CPUArchState *env = cpu->env_ptr;
e22a25c9
AL
664 tb_flush(env);
665 }
c33a346e
FB
666 }
667#endif
668}
669
9349b4f9 670void cpu_abort(CPUArchState *env, const char *fmt, ...)
7501267e 671{
878096ee 672 CPUState *cpu = ENV_GET_CPU(env);
7501267e 673 va_list ap;
493ae1f0 674 va_list ap2;
7501267e
FB
675
676 va_start(ap, fmt);
493ae1f0 677 va_copy(ap2, ap);
7501267e
FB
678 fprintf(stderr, "qemu: fatal: ");
679 vfprintf(stderr, fmt, ap);
680 fprintf(stderr, "\n");
878096ee 681 cpu_dump_state(cpu, stderr, fprintf, CPU_DUMP_FPU | CPU_DUMP_CCOP);
93fcfe39
AL
682 if (qemu_log_enabled()) {
683 qemu_log("qemu: fatal: ");
684 qemu_log_vprintf(fmt, ap2);
685 qemu_log("\n");
a0762859 686 log_cpu_state(cpu, CPU_DUMP_FPU | CPU_DUMP_CCOP);
31b1a7b4 687 qemu_log_flush();
93fcfe39 688 qemu_log_close();
924edcae 689 }
493ae1f0 690 va_end(ap2);
f9373291 691 va_end(ap);
fd052bf6
RV
692#if defined(CONFIG_USER_ONLY)
693 {
694 struct sigaction act;
695 sigfillset(&act.sa_mask);
696 act.sa_handler = SIG_DFL;
697 sigaction(SIGABRT, &act, NULL);
698 }
699#endif
7501267e
FB
700 abort();
701}
702
0124311e 703#if !defined(CONFIG_USER_ONLY)
041603fe
PB
704static RAMBlock *qemu_get_ram_block(ram_addr_t addr)
705{
706 RAMBlock *block;
707
708 /* The list is protected by the iothread lock here. */
709 block = ram_list.mru_block;
710 if (block && addr - block->offset < block->length) {
711 goto found;
712 }
713 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
714 if (addr - block->offset < block->length) {
715 goto found;
716 }
717 }
718
719 fprintf(stderr, "Bad ram offset %" PRIx64 "\n", (uint64_t)addr);
720 abort();
721
722found:
723 ram_list.mru_block = block;
724 return block;
725}
726
d24981d3
JQ
727static void tlb_reset_dirty_range_all(ram_addr_t start, ram_addr_t end,
728 uintptr_t length)
729{
041603fe
PB
730 RAMBlock *block;
731 ram_addr_t start1;
d24981d3 732
041603fe
PB
733 block = qemu_get_ram_block(start);
734 assert(block == qemu_get_ram_block(end - 1));
735 start1 = (uintptr_t)block->host + (start - block->offset);
736 cpu_tlb_reset_dirty_all(start1, length);
d24981d3
JQ
737}
738
5579c7f3 739/* Note: start and end must be within the same ram block. */
c227f099 740void cpu_physical_memory_reset_dirty(ram_addr_t start, ram_addr_t end,
52159192 741 unsigned client)
1ccde1cb 742{
d24981d3 743 uintptr_t length;
1ccde1cb
FB
744
745 start &= TARGET_PAGE_MASK;
746 end = TARGET_PAGE_ALIGN(end);
747
748 length = end - start;
749 if (length == 0)
750 return;
ace694cc 751 cpu_physical_memory_clear_dirty_range(start, length, client);
f23db169 752
d24981d3
JQ
753 if (tcg_enabled()) {
754 tlb_reset_dirty_range_all(start, end, length);
5579c7f3 755 }
1ccde1cb
FB
756}
757
8b9c99d9 758static int cpu_physical_memory_set_dirty_tracking(int enable)
74576198 759{
f6f3fbca 760 int ret = 0;
74576198 761 in_migration = enable;
f6f3fbca 762 return ret;
74576198
AL
763}
764
a8170e5e 765hwaddr memory_region_section_get_iotlb(CPUArchState *env,
149f54b5
PB
766 MemoryRegionSection *section,
767 target_ulong vaddr,
768 hwaddr paddr, hwaddr xlat,
769 int prot,
770 target_ulong *address)
e5548617 771{
a8170e5e 772 hwaddr iotlb;
e5548617
BS
773 CPUWatchpoint *wp;
774
cc5bea60 775 if (memory_region_is_ram(section->mr)) {
e5548617
BS
776 /* Normal RAM. */
777 iotlb = (memory_region_get_ram_addr(section->mr) & TARGET_PAGE_MASK)
149f54b5 778 + xlat;
e5548617 779 if (!section->readonly) {
b41aac4f 780 iotlb |= PHYS_SECTION_NOTDIRTY;
e5548617 781 } else {
b41aac4f 782 iotlb |= PHYS_SECTION_ROM;
e5548617
BS
783 }
784 } else {
53cb28cb 785 iotlb = section - address_space_memory.dispatch->map.sections;
149f54b5 786 iotlb += xlat;
e5548617
BS
787 }
788
789 /* Make accesses to pages with watchpoints go via the
790 watchpoint trap routines. */
791 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
792 if (vaddr == (wp->vaddr & TARGET_PAGE_MASK)) {
793 /* Avoid trapping reads of pages with a write breakpoint. */
794 if ((prot & PAGE_WRITE) || (wp->flags & BP_MEM_READ)) {
b41aac4f 795 iotlb = PHYS_SECTION_WATCH + paddr;
e5548617
BS
796 *address |= TLB_MMIO;
797 break;
798 }
799 }
800 }
801
802 return iotlb;
803}
9fa3e853
FB
804#endif /* defined(CONFIG_USER_ONLY) */
805
e2eef170 806#if !defined(CONFIG_USER_ONLY)
8da3ff18 807
c227f099 808static int subpage_register (subpage_t *mmio, uint32_t start, uint32_t end,
5312bd8b 809 uint16_t section);
acc9d80b 810static subpage_t *subpage_init(AddressSpace *as, hwaddr base);
54688b1e 811
575ddeb4 812static void *(*phys_mem_alloc)(size_t size) = qemu_anon_ram_alloc;
91138037
MA
813
814/*
815 * Set a custom physical guest memory alloator.
816 * Accelerators with unusual needs may need this. Hopefully, we can
817 * get rid of it eventually.
818 */
575ddeb4 819void phys_mem_set_alloc(void *(*alloc)(size_t))
91138037
MA
820{
821 phys_mem_alloc = alloc;
822}
823
53cb28cb
MA
824static uint16_t phys_section_add(PhysPageMap *map,
825 MemoryRegionSection *section)
5312bd8b 826{
68f3f65b
PB
827 /* The physical section number is ORed with a page-aligned
828 * pointer to produce the iotlb entries. Thus it should
829 * never overflow into the page-aligned value.
830 */
53cb28cb 831 assert(map->sections_nb < TARGET_PAGE_SIZE);
68f3f65b 832
53cb28cb
MA
833 if (map->sections_nb == map->sections_nb_alloc) {
834 map->sections_nb_alloc = MAX(map->sections_nb_alloc * 2, 16);
835 map->sections = g_renew(MemoryRegionSection, map->sections,
836 map->sections_nb_alloc);
5312bd8b 837 }
53cb28cb 838 map->sections[map->sections_nb] = *section;
dfde4e6e 839 memory_region_ref(section->mr);
53cb28cb 840 return map->sections_nb++;
5312bd8b
AK
841}
842
058bc4b5
PB
843static void phys_section_destroy(MemoryRegion *mr)
844{
dfde4e6e
PB
845 memory_region_unref(mr);
846
058bc4b5
PB
847 if (mr->subpage) {
848 subpage_t *subpage = container_of(mr, subpage_t, iomem);
849 memory_region_destroy(&subpage->iomem);
850 g_free(subpage);
851 }
852}
853
6092666e 854static void phys_sections_free(PhysPageMap *map)
5312bd8b 855{
9affd6fc
PB
856 while (map->sections_nb > 0) {
857 MemoryRegionSection *section = &map->sections[--map->sections_nb];
058bc4b5
PB
858 phys_section_destroy(section->mr);
859 }
9affd6fc
PB
860 g_free(map->sections);
861 g_free(map->nodes);
5312bd8b
AK
862}
863
ac1970fb 864static void register_subpage(AddressSpaceDispatch *d, MemoryRegionSection *section)
0f0cb164
AK
865{
866 subpage_t *subpage;
a8170e5e 867 hwaddr base = section->offset_within_address_space
0f0cb164 868 & TARGET_PAGE_MASK;
97115a8d 869 MemoryRegionSection *existing = phys_page_find(d->phys_map, base,
53cb28cb 870 d->map.nodes, d->map.sections);
0f0cb164
AK
871 MemoryRegionSection subsection = {
872 .offset_within_address_space = base,
052e87b0 873 .size = int128_make64(TARGET_PAGE_SIZE),
0f0cb164 874 };
a8170e5e 875 hwaddr start, end;
0f0cb164 876
f3705d53 877 assert(existing->mr->subpage || existing->mr == &io_mem_unassigned);
0f0cb164 878
f3705d53 879 if (!(existing->mr->subpage)) {
acc9d80b 880 subpage = subpage_init(d->as, base);
0f0cb164 881 subsection.mr = &subpage->iomem;
ac1970fb 882 phys_page_set(d, base >> TARGET_PAGE_BITS, 1,
53cb28cb 883 phys_section_add(&d->map, &subsection));
0f0cb164 884 } else {
f3705d53 885 subpage = container_of(existing->mr, subpage_t, iomem);
0f0cb164
AK
886 }
887 start = section->offset_within_address_space & ~TARGET_PAGE_MASK;
052e87b0 888 end = start + int128_get64(section->size) - 1;
53cb28cb
MA
889 subpage_register(subpage, start, end,
890 phys_section_add(&d->map, section));
0f0cb164
AK
891}
892
893
052e87b0
PB
894static void register_multipage(AddressSpaceDispatch *d,
895 MemoryRegionSection *section)
33417e70 896{
a8170e5e 897 hwaddr start_addr = section->offset_within_address_space;
53cb28cb 898 uint16_t section_index = phys_section_add(&d->map, section);
052e87b0
PB
899 uint64_t num_pages = int128_get64(int128_rshift(section->size,
900 TARGET_PAGE_BITS));
dd81124b 901
733d5ef5
PB
902 assert(num_pages);
903 phys_page_set(d, start_addr >> TARGET_PAGE_BITS, num_pages, section_index);
33417e70
FB
904}
905
ac1970fb 906static void mem_add(MemoryListener *listener, MemoryRegionSection *section)
0f0cb164 907{
89ae337a 908 AddressSpace *as = container_of(listener, AddressSpace, dispatch_listener);
00752703 909 AddressSpaceDispatch *d = as->next_dispatch;
99b9cc06 910 MemoryRegionSection now = *section, remain = *section;
052e87b0 911 Int128 page_size = int128_make64(TARGET_PAGE_SIZE);
0f0cb164 912
733d5ef5
PB
913 if (now.offset_within_address_space & ~TARGET_PAGE_MASK) {
914 uint64_t left = TARGET_PAGE_ALIGN(now.offset_within_address_space)
915 - now.offset_within_address_space;
916
052e87b0 917 now.size = int128_min(int128_make64(left), now.size);
ac1970fb 918 register_subpage(d, &now);
733d5ef5 919 } else {
052e87b0 920 now.size = int128_zero();
733d5ef5 921 }
052e87b0
PB
922 while (int128_ne(remain.size, now.size)) {
923 remain.size = int128_sub(remain.size, now.size);
924 remain.offset_within_address_space += int128_get64(now.size);
925 remain.offset_within_region += int128_get64(now.size);
69b67646 926 now = remain;
052e87b0 927 if (int128_lt(remain.size, page_size)) {
733d5ef5 928 register_subpage(d, &now);
88266249 929 } else if (remain.offset_within_address_space & ~TARGET_PAGE_MASK) {
052e87b0 930 now.size = page_size;
ac1970fb 931 register_subpage(d, &now);
69b67646 932 } else {
052e87b0 933 now.size = int128_and(now.size, int128_neg(page_size));
ac1970fb 934 register_multipage(d, &now);
69b67646 935 }
0f0cb164
AK
936 }
937}
938
62a2744c
SY
939void qemu_flush_coalesced_mmio_buffer(void)
940{
941 if (kvm_enabled())
942 kvm_flush_coalesced_mmio_buffer();
943}
944
b2a8658e
UD
945void qemu_mutex_lock_ramlist(void)
946{
947 qemu_mutex_lock(&ram_list.mutex);
948}
949
950void qemu_mutex_unlock_ramlist(void)
951{
952 qemu_mutex_unlock(&ram_list.mutex);
953}
954
e1e84ba0 955#ifdef __linux__
c902760f
MT
956
957#include <sys/vfs.h>
958
959#define HUGETLBFS_MAGIC 0x958458f6
960
961static long gethugepagesize(const char *path)
962{
963 struct statfs fs;
964 int ret;
965
966 do {
9742bf26 967 ret = statfs(path, &fs);
c902760f
MT
968 } while (ret != 0 && errno == EINTR);
969
970 if (ret != 0) {
9742bf26
YT
971 perror(path);
972 return 0;
c902760f
MT
973 }
974
975 if (fs.f_type != HUGETLBFS_MAGIC)
9742bf26 976 fprintf(stderr, "Warning: path not on HugeTLBFS: %s\n", path);
c902760f
MT
977
978 return fs.f_bsize;
979}
980
ef36fa14
MT
981static sigjmp_buf sigjump;
982
983static void sigbus_handler(int signal)
984{
985 siglongjmp(sigjump, 1);
986}
987
04b16653
AW
988static void *file_ram_alloc(RAMBlock *block,
989 ram_addr_t memory,
990 const char *path)
c902760f
MT
991{
992 char *filename;
8ca761f6
PF
993 char *sanitized_name;
994 char *c;
c902760f
MT
995 void *area;
996 int fd;
c902760f
MT
997 unsigned long hpagesize;
998
999 hpagesize = gethugepagesize(path);
1000 if (!hpagesize) {
9742bf26 1001 return NULL;
c902760f
MT
1002 }
1003
1004 if (memory < hpagesize) {
1005 return NULL;
1006 }
1007
1008 if (kvm_enabled() && !kvm_has_sync_mmu()) {
1009 fprintf(stderr, "host lacks kvm mmu notifiers, -mem-path unsupported\n");
1010 return NULL;
1011 }
1012
8ca761f6
PF
1013 /* Make name safe to use with mkstemp by replacing '/' with '_'. */
1014 sanitized_name = g_strdup(block->mr->name);
1015 for (c = sanitized_name; *c != '\0'; c++) {
1016 if (*c == '/')
1017 *c = '_';
1018 }
1019
1020 filename = g_strdup_printf("%s/qemu_back_mem.%s.XXXXXX", path,
1021 sanitized_name);
1022 g_free(sanitized_name);
c902760f
MT
1023
1024 fd = mkstemp(filename);
1025 if (fd < 0) {
9742bf26 1026 perror("unable to create backing store for hugepages");
e4ada482 1027 g_free(filename);
9742bf26 1028 return NULL;
c902760f
MT
1029 }
1030 unlink(filename);
e4ada482 1031 g_free(filename);
c902760f
MT
1032
1033 memory = (memory+hpagesize-1) & ~(hpagesize-1);
1034
1035 /*
1036 * ftruncate is not supported by hugetlbfs in older
1037 * hosts, so don't bother bailing out on errors.
1038 * If anything goes wrong with it under other filesystems,
1039 * mmap will fail.
1040 */
1041 if (ftruncate(fd, memory))
9742bf26 1042 perror("ftruncate");
c902760f 1043
c902760f 1044 area = mmap(0, memory, PROT_READ | PROT_WRITE, MAP_PRIVATE, fd, 0);
c902760f 1045 if (area == MAP_FAILED) {
9742bf26
YT
1046 perror("file_ram_alloc: can't mmap RAM pages");
1047 close(fd);
1048 return (NULL);
c902760f 1049 }
ef36fa14
MT
1050
1051 if (mem_prealloc) {
1052 int ret, i;
1053 struct sigaction act, oldact;
1054 sigset_t set, oldset;
1055
1056 memset(&act, 0, sizeof(act));
1057 act.sa_handler = &sigbus_handler;
1058 act.sa_flags = 0;
1059
1060 ret = sigaction(SIGBUS, &act, &oldact);
1061 if (ret) {
1062 perror("file_ram_alloc: failed to install signal handler");
1063 exit(1);
1064 }
1065
1066 /* unblock SIGBUS */
1067 sigemptyset(&set);
1068 sigaddset(&set, SIGBUS);
1069 pthread_sigmask(SIG_UNBLOCK, &set, &oldset);
1070
1071 if (sigsetjmp(sigjump, 1)) {
1072 fprintf(stderr, "file_ram_alloc: failed to preallocate pages\n");
1073 exit(1);
1074 }
1075
1076 /* MAP_POPULATE silently ignores failures */
1077 for (i = 0; i < (memory/hpagesize)-1; i++) {
1078 memset(area + (hpagesize*i), 0, 1);
1079 }
1080
1081 ret = sigaction(SIGBUS, &oldact, NULL);
1082 if (ret) {
1083 perror("file_ram_alloc: failed to reinstall signal handler");
1084 exit(1);
1085 }
1086
1087 pthread_sigmask(SIG_SETMASK, &oldset, NULL);
1088 }
1089
04b16653 1090 block->fd = fd;
c902760f
MT
1091 return area;
1092}
e1e84ba0
MA
1093#else
1094static void *file_ram_alloc(RAMBlock *block,
1095 ram_addr_t memory,
1096 const char *path)
1097{
1098 fprintf(stderr, "-mem-path not supported on this host\n");
1099 exit(1);
1100}
c902760f
MT
1101#endif
1102
d17b5288 1103static ram_addr_t find_ram_offset(ram_addr_t size)
04b16653
AW
1104{
1105 RAMBlock *block, *next_block;
3e837b2c 1106 ram_addr_t offset = RAM_ADDR_MAX, mingap = RAM_ADDR_MAX;
04b16653 1107
49cd9ac6
SH
1108 assert(size != 0); /* it would hand out same offset multiple times */
1109
a3161038 1110 if (QTAILQ_EMPTY(&ram_list.blocks))
04b16653
AW
1111 return 0;
1112
a3161038 1113 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
f15fbc4b 1114 ram_addr_t end, next = RAM_ADDR_MAX;
04b16653
AW
1115
1116 end = block->offset + block->length;
1117
a3161038 1118 QTAILQ_FOREACH(next_block, &ram_list.blocks, next) {
04b16653
AW
1119 if (next_block->offset >= end) {
1120 next = MIN(next, next_block->offset);
1121 }
1122 }
1123 if (next - end >= size && next - end < mingap) {
3e837b2c 1124 offset = end;
04b16653
AW
1125 mingap = next - end;
1126 }
1127 }
3e837b2c
AW
1128
1129 if (offset == RAM_ADDR_MAX) {
1130 fprintf(stderr, "Failed to find gap of requested size: %" PRIu64 "\n",
1131 (uint64_t)size);
1132 abort();
1133 }
1134
04b16653
AW
1135 return offset;
1136}
1137
652d7ec2 1138ram_addr_t last_ram_offset(void)
d17b5288
AW
1139{
1140 RAMBlock *block;
1141 ram_addr_t last = 0;
1142
a3161038 1143 QTAILQ_FOREACH(block, &ram_list.blocks, next)
d17b5288
AW
1144 last = MAX(last, block->offset + block->length);
1145
1146 return last;
1147}
1148
ddb97f1d
JB
1149static void qemu_ram_setup_dump(void *addr, ram_addr_t size)
1150{
1151 int ret;
ddb97f1d
JB
1152
1153 /* Use MADV_DONTDUMP, if user doesn't want the guest memory in the core */
2ff3de68
MA
1154 if (!qemu_opt_get_bool(qemu_get_machine_opts(),
1155 "dump-guest-core", true)) {
ddb97f1d
JB
1156 ret = qemu_madvise(addr, size, QEMU_MADV_DONTDUMP);
1157 if (ret) {
1158 perror("qemu_madvise");
1159 fprintf(stderr, "madvise doesn't support MADV_DONTDUMP, "
1160 "but dump_guest_core=off specified\n");
1161 }
1162 }
1163}
1164
c5705a77 1165void qemu_ram_set_idstr(ram_addr_t addr, const char *name, DeviceState *dev)
84b89d78
CM
1166{
1167 RAMBlock *new_block, *block;
1168
c5705a77 1169 new_block = NULL;
a3161038 1170 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
c5705a77
AK
1171 if (block->offset == addr) {
1172 new_block = block;
1173 break;
1174 }
1175 }
1176 assert(new_block);
1177 assert(!new_block->idstr[0]);
84b89d78 1178
09e5ab63
AL
1179 if (dev) {
1180 char *id = qdev_get_dev_path(dev);
84b89d78
CM
1181 if (id) {
1182 snprintf(new_block->idstr, sizeof(new_block->idstr), "%s/", id);
7267c094 1183 g_free(id);
84b89d78
CM
1184 }
1185 }
1186 pstrcat(new_block->idstr, sizeof(new_block->idstr), name);
1187
b2a8658e
UD
1188 /* This assumes the iothread lock is taken here too. */
1189 qemu_mutex_lock_ramlist();
a3161038 1190 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
c5705a77 1191 if (block != new_block && !strcmp(block->idstr, new_block->idstr)) {
84b89d78
CM
1192 fprintf(stderr, "RAMBlock \"%s\" already registered, abort!\n",
1193 new_block->idstr);
1194 abort();
1195 }
1196 }
b2a8658e 1197 qemu_mutex_unlock_ramlist();
c5705a77
AK
1198}
1199
8490fc78
LC
1200static int memory_try_enable_merging(void *addr, size_t len)
1201{
2ff3de68 1202 if (!qemu_opt_get_bool(qemu_get_machine_opts(), "mem-merge", true)) {
8490fc78
LC
1203 /* disabled by the user */
1204 return 0;
1205 }
1206
1207 return qemu_madvise(addr, len, QEMU_MADV_MERGEABLE);
1208}
1209
c5705a77
AK
1210ram_addr_t qemu_ram_alloc_from_ptr(ram_addr_t size, void *host,
1211 MemoryRegion *mr)
1212{
abb26d63 1213 RAMBlock *block, *new_block;
2152f5ca
JQ
1214 ram_addr_t old_ram_size, new_ram_size;
1215
1216 old_ram_size = last_ram_offset() >> TARGET_PAGE_BITS;
c5705a77
AK
1217
1218 size = TARGET_PAGE_ALIGN(size);
1219 new_block = g_malloc0(sizeof(*new_block));
3435f395 1220 new_block->fd = -1;
84b89d78 1221
b2a8658e
UD
1222 /* This assumes the iothread lock is taken here too. */
1223 qemu_mutex_lock_ramlist();
7c637366 1224 new_block->mr = mr;
432d268c 1225 new_block->offset = find_ram_offset(size);
6977dfe6
YT
1226 if (host) {
1227 new_block->host = host;
cd19cfa2 1228 new_block->flags |= RAM_PREALLOC_MASK;
dfeaf2ab
MA
1229 } else if (xen_enabled()) {
1230 if (mem_path) {
1231 fprintf(stderr, "-mem-path not supported with Xen\n");
1232 exit(1);
1233 }
1234 xen_ram_alloc(new_block->offset, size, mr);
6977dfe6
YT
1235 } else {
1236 if (mem_path) {
e1e84ba0
MA
1237 if (phys_mem_alloc != qemu_anon_ram_alloc) {
1238 /*
1239 * file_ram_alloc() needs to allocate just like
1240 * phys_mem_alloc, but we haven't bothered to provide
1241 * a hook there.
1242 */
1243 fprintf(stderr,
1244 "-mem-path not supported with this accelerator\n");
1245 exit(1);
1246 }
6977dfe6 1247 new_block->host = file_ram_alloc(new_block, size, mem_path);
0628c182
MA
1248 }
1249 if (!new_block->host) {
91138037 1250 new_block->host = phys_mem_alloc(size);
39228250
MA
1251 if (!new_block->host) {
1252 fprintf(stderr, "Cannot set up guest memory '%s': %s\n",
1253 new_block->mr->name, strerror(errno));
1254 exit(1);
1255 }
8490fc78 1256 memory_try_enable_merging(new_block->host, size);
6977dfe6 1257 }
c902760f 1258 }
94a6b54f
PB
1259 new_block->length = size;
1260
abb26d63
PB
1261 /* Keep the list sorted from biggest to smallest block. */
1262 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
1263 if (block->length < new_block->length) {
1264 break;
1265 }
1266 }
1267 if (block) {
1268 QTAILQ_INSERT_BEFORE(block, new_block, next);
1269 } else {
1270 QTAILQ_INSERT_TAIL(&ram_list.blocks, new_block, next);
1271 }
0d6d3c87 1272 ram_list.mru_block = NULL;
94a6b54f 1273
f798b07f 1274 ram_list.version++;
b2a8658e 1275 qemu_mutex_unlock_ramlist();
f798b07f 1276
2152f5ca
JQ
1277 new_ram_size = last_ram_offset() >> TARGET_PAGE_BITS;
1278
1279 if (new_ram_size > old_ram_size) {
1ab4c8ce
JQ
1280 int i;
1281 for (i = 0; i < DIRTY_MEMORY_NUM; i++) {
1282 ram_list.dirty_memory[i] =
1283 bitmap_zero_extend(ram_list.dirty_memory[i],
1284 old_ram_size, new_ram_size);
1285 }
2152f5ca 1286 }
75218e7f 1287 cpu_physical_memory_set_dirty_range(new_block->offset, size);
94a6b54f 1288
ddb97f1d 1289 qemu_ram_setup_dump(new_block->host, size);
ad0b5321 1290 qemu_madvise(new_block->host, size, QEMU_MADV_HUGEPAGE);
3e469dbf 1291 qemu_madvise(new_block->host, size, QEMU_MADV_DONTFORK);
ddb97f1d 1292
6f0437e8
JK
1293 if (kvm_enabled())
1294 kvm_setup_guest_memory(new_block->host, size);
1295
94a6b54f
PB
1296 return new_block->offset;
1297}
e9a1ab19 1298
c5705a77 1299ram_addr_t qemu_ram_alloc(ram_addr_t size, MemoryRegion *mr)
6977dfe6 1300{
c5705a77 1301 return qemu_ram_alloc_from_ptr(size, NULL, mr);
6977dfe6
YT
1302}
1303
1f2e98b6
AW
1304void qemu_ram_free_from_ptr(ram_addr_t addr)
1305{
1306 RAMBlock *block;
1307
b2a8658e
UD
1308 /* This assumes the iothread lock is taken here too. */
1309 qemu_mutex_lock_ramlist();
a3161038 1310 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
1f2e98b6 1311 if (addr == block->offset) {
a3161038 1312 QTAILQ_REMOVE(&ram_list.blocks, block, next);
0d6d3c87 1313 ram_list.mru_block = NULL;
f798b07f 1314 ram_list.version++;
7267c094 1315 g_free(block);
b2a8658e 1316 break;
1f2e98b6
AW
1317 }
1318 }
b2a8658e 1319 qemu_mutex_unlock_ramlist();
1f2e98b6
AW
1320}
1321
c227f099 1322void qemu_ram_free(ram_addr_t addr)
e9a1ab19 1323{
04b16653
AW
1324 RAMBlock *block;
1325
b2a8658e
UD
1326 /* This assumes the iothread lock is taken here too. */
1327 qemu_mutex_lock_ramlist();
a3161038 1328 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
04b16653 1329 if (addr == block->offset) {
a3161038 1330 QTAILQ_REMOVE(&ram_list.blocks, block, next);
0d6d3c87 1331 ram_list.mru_block = NULL;
f798b07f 1332 ram_list.version++;
cd19cfa2
HY
1333 if (block->flags & RAM_PREALLOC_MASK) {
1334 ;
dfeaf2ab
MA
1335 } else if (xen_enabled()) {
1336 xen_invalidate_map_cache_entry(block->host);
089f3f76 1337#ifndef _WIN32
3435f395
MA
1338 } else if (block->fd >= 0) {
1339 munmap(block->host, block->length);
1340 close(block->fd);
089f3f76 1341#endif
04b16653 1342 } else {
dfeaf2ab 1343 qemu_anon_ram_free(block->host, block->length);
04b16653 1344 }
7267c094 1345 g_free(block);
b2a8658e 1346 break;
04b16653
AW
1347 }
1348 }
b2a8658e 1349 qemu_mutex_unlock_ramlist();
04b16653 1350
e9a1ab19
FB
1351}
1352
cd19cfa2
HY
1353#ifndef _WIN32
1354void qemu_ram_remap(ram_addr_t addr, ram_addr_t length)
1355{
1356 RAMBlock *block;
1357 ram_addr_t offset;
1358 int flags;
1359 void *area, *vaddr;
1360
a3161038 1361 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
cd19cfa2
HY
1362 offset = addr - block->offset;
1363 if (offset < block->length) {
1364 vaddr = block->host + offset;
1365 if (block->flags & RAM_PREALLOC_MASK) {
1366 ;
dfeaf2ab
MA
1367 } else if (xen_enabled()) {
1368 abort();
cd19cfa2
HY
1369 } else {
1370 flags = MAP_FIXED;
1371 munmap(vaddr, length);
3435f395 1372 if (block->fd >= 0) {
cd19cfa2 1373#ifdef MAP_POPULATE
3435f395
MA
1374 flags |= mem_prealloc ? MAP_POPULATE | MAP_SHARED :
1375 MAP_PRIVATE;
fd28aa13 1376#else
3435f395 1377 flags |= MAP_PRIVATE;
cd19cfa2 1378#endif
3435f395
MA
1379 area = mmap(vaddr, length, PROT_READ | PROT_WRITE,
1380 flags, block->fd, offset);
cd19cfa2 1381 } else {
2eb9fbaa
MA
1382 /*
1383 * Remap needs to match alloc. Accelerators that
1384 * set phys_mem_alloc never remap. If they did,
1385 * we'd need a remap hook here.
1386 */
1387 assert(phys_mem_alloc == qemu_anon_ram_alloc);
1388
cd19cfa2
HY
1389 flags |= MAP_PRIVATE | MAP_ANONYMOUS;
1390 area = mmap(vaddr, length, PROT_READ | PROT_WRITE,
1391 flags, -1, 0);
cd19cfa2
HY
1392 }
1393 if (area != vaddr) {
f15fbc4b
AP
1394 fprintf(stderr, "Could not remap addr: "
1395 RAM_ADDR_FMT "@" RAM_ADDR_FMT "\n",
cd19cfa2
HY
1396 length, addr);
1397 exit(1);
1398 }
8490fc78 1399 memory_try_enable_merging(vaddr, length);
ddb97f1d 1400 qemu_ram_setup_dump(vaddr, length);
cd19cfa2
HY
1401 }
1402 return;
1403 }
1404 }
1405}
1406#endif /* !_WIN32 */
1407
1b5ec234
PB
1408/* Return a host pointer to ram allocated with qemu_ram_alloc.
1409 With the exception of the softmmu code in this file, this should
1410 only be used for local memory (e.g. video ram) that the device owns,
1411 and knows it isn't going to access beyond the end of the block.
1412
1413 It should not be used for general purpose DMA.
1414 Use cpu_physical_memory_map/cpu_physical_memory_rw instead.
1415 */
1416void *qemu_get_ram_ptr(ram_addr_t addr)
1417{
1418 RAMBlock *block = qemu_get_ram_block(addr);
1419
0d6d3c87
PB
1420 if (xen_enabled()) {
1421 /* We need to check if the requested address is in the RAM
1422 * because we don't want to map the entire memory in QEMU.
1423 * In that case just map until the end of the page.
1424 */
1425 if (block->offset == 0) {
1426 return xen_map_cache(addr, 0, 0);
1427 } else if (block->host == NULL) {
1428 block->host =
1429 xen_map_cache(block->offset, block->length, 1);
1430 }
1431 }
1432 return block->host + (addr - block->offset);
dc828ca1
PB
1433}
1434
38bee5dc
SS
1435/* Return a host pointer to guest's ram. Similar to qemu_get_ram_ptr
1436 * but takes a size argument */
cb85f7ab 1437static void *qemu_ram_ptr_length(ram_addr_t addr, hwaddr *size)
38bee5dc 1438{
8ab934f9
SS
1439 if (*size == 0) {
1440 return NULL;
1441 }
868bb33f 1442 if (xen_enabled()) {
e41d7c69 1443 return xen_map_cache(addr, *size, 1);
868bb33f 1444 } else {
38bee5dc
SS
1445 RAMBlock *block;
1446
a3161038 1447 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
38bee5dc
SS
1448 if (addr - block->offset < block->length) {
1449 if (addr - block->offset + *size > block->length)
1450 *size = block->length - addr + block->offset;
1451 return block->host + (addr - block->offset);
1452 }
1453 }
1454
1455 fprintf(stderr, "Bad ram offset %" PRIx64 "\n", (uint64_t)addr);
1456 abort();
38bee5dc
SS
1457 }
1458}
1459
7443b437
PB
1460/* Some of the softmmu routines need to translate from a host pointer
1461 (typically a TLB entry) back to a ram offset. */
1b5ec234 1462MemoryRegion *qemu_ram_addr_from_host(void *ptr, ram_addr_t *ram_addr)
5579c7f3 1463{
94a6b54f
PB
1464 RAMBlock *block;
1465 uint8_t *host = ptr;
1466
868bb33f 1467 if (xen_enabled()) {
e41d7c69 1468 *ram_addr = xen_ram_addr_from_mapcache(ptr);
1b5ec234 1469 return qemu_get_ram_block(*ram_addr)->mr;
712c2b41
SS
1470 }
1471
23887b79
PB
1472 block = ram_list.mru_block;
1473 if (block && block->host && host - block->host < block->length) {
1474 goto found;
1475 }
1476
a3161038 1477 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
432d268c
JN
1478 /* This case append when the block is not mapped. */
1479 if (block->host == NULL) {
1480 continue;
1481 }
f471a17e 1482 if (host - block->host < block->length) {
23887b79 1483 goto found;
f471a17e 1484 }
94a6b54f 1485 }
432d268c 1486
1b5ec234 1487 return NULL;
23887b79
PB
1488
1489found:
1490 *ram_addr = block->offset + (host - block->host);
1b5ec234 1491 return block->mr;
e890261f 1492}
f471a17e 1493
a8170e5e 1494static void notdirty_mem_write(void *opaque, hwaddr ram_addr,
0e0df1e2 1495 uint64_t val, unsigned size)
9fa3e853 1496{
52159192 1497 if (!cpu_physical_memory_get_dirty_flag(ram_addr, DIRTY_MEMORY_CODE)) {
0e0df1e2 1498 tb_invalidate_phys_page_fast(ram_addr, size);
3a7d929e 1499 }
0e0df1e2
AK
1500 switch (size) {
1501 case 1:
1502 stb_p(qemu_get_ram_ptr(ram_addr), val);
1503 break;
1504 case 2:
1505 stw_p(qemu_get_ram_ptr(ram_addr), val);
1506 break;
1507 case 4:
1508 stl_p(qemu_get_ram_ptr(ram_addr), val);
1509 break;
1510 default:
1511 abort();
3a7d929e 1512 }
52159192
JQ
1513 cpu_physical_memory_set_dirty_flag(ram_addr, DIRTY_MEMORY_MIGRATION);
1514 cpu_physical_memory_set_dirty_flag(ram_addr, DIRTY_MEMORY_VGA);
f23db169
FB
1515 /* we remove the notdirty callback only if the code has been
1516 flushed */
a2cd8c85 1517 if (!cpu_physical_memory_is_clean(ram_addr)) {
4917cf44
AF
1518 CPUArchState *env = current_cpu->env_ptr;
1519 tlb_set_dirty(env, env->mem_io_vaddr);
1520 }
9fa3e853
FB
1521}
1522
b018ddf6
PB
1523static bool notdirty_mem_accepts(void *opaque, hwaddr addr,
1524 unsigned size, bool is_write)
1525{
1526 return is_write;
1527}
1528
0e0df1e2 1529static const MemoryRegionOps notdirty_mem_ops = {
0e0df1e2 1530 .write = notdirty_mem_write,
b018ddf6 1531 .valid.accepts = notdirty_mem_accepts,
0e0df1e2 1532 .endianness = DEVICE_NATIVE_ENDIAN,
1ccde1cb
FB
1533};
1534
0f459d16 1535/* Generate a debug exception if a watchpoint has been hit. */
b4051334 1536static void check_watchpoint(int offset, int len_mask, int flags)
0f459d16 1537{
4917cf44 1538 CPUArchState *env = current_cpu->env_ptr;
06d55cc1 1539 target_ulong pc, cs_base;
0f459d16 1540 target_ulong vaddr;
a1d1bb31 1541 CPUWatchpoint *wp;
06d55cc1 1542 int cpu_flags;
0f459d16 1543
06d55cc1
AL
1544 if (env->watchpoint_hit) {
1545 /* We re-entered the check after replacing the TB. Now raise
1546 * the debug interrupt so that is will trigger after the
1547 * current instruction. */
c3affe56 1548 cpu_interrupt(ENV_GET_CPU(env), CPU_INTERRUPT_DEBUG);
06d55cc1
AL
1549 return;
1550 }
2e70f6ef 1551 vaddr = (env->mem_io_vaddr & TARGET_PAGE_MASK) + offset;
72cf2d4f 1552 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
b4051334
AL
1553 if ((vaddr == (wp->vaddr & len_mask) ||
1554 (vaddr & wp->len_mask) == wp->vaddr) && (wp->flags & flags)) {
6e140f28
AL
1555 wp->flags |= BP_WATCHPOINT_HIT;
1556 if (!env->watchpoint_hit) {
1557 env->watchpoint_hit = wp;
5a316526 1558 tb_check_watchpoint(env);
6e140f28
AL
1559 if (wp->flags & BP_STOP_BEFORE_ACCESS) {
1560 env->exception_index = EXCP_DEBUG;
488d6577 1561 cpu_loop_exit(env);
6e140f28
AL
1562 } else {
1563 cpu_get_tb_cpu_state(env, &pc, &cs_base, &cpu_flags);
1564 tb_gen_code(env, pc, cs_base, cpu_flags, 1);
488d6577 1565 cpu_resume_from_signal(env, NULL);
6e140f28 1566 }
06d55cc1 1567 }
6e140f28
AL
1568 } else {
1569 wp->flags &= ~BP_WATCHPOINT_HIT;
0f459d16
PB
1570 }
1571 }
1572}
1573
6658ffb8
PB
1574/* Watchpoint access routines. Watchpoints are inserted using TLB tricks,
1575 so these check for a hit then pass through to the normal out-of-line
1576 phys routines. */
a8170e5e 1577static uint64_t watch_mem_read(void *opaque, hwaddr addr,
1ec9b909 1578 unsigned size)
6658ffb8 1579{
1ec9b909
AK
1580 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~(size - 1), BP_MEM_READ);
1581 switch (size) {
1582 case 1: return ldub_phys(addr);
1583 case 2: return lduw_phys(addr);
1584 case 4: return ldl_phys(addr);
1585 default: abort();
1586 }
6658ffb8
PB
1587}
1588
a8170e5e 1589static void watch_mem_write(void *opaque, hwaddr addr,
1ec9b909 1590 uint64_t val, unsigned size)
6658ffb8 1591{
1ec9b909
AK
1592 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~(size - 1), BP_MEM_WRITE);
1593 switch (size) {
67364150
MF
1594 case 1:
1595 stb_phys(addr, val);
1596 break;
1597 case 2:
1598 stw_phys(addr, val);
1599 break;
1600 case 4:
1601 stl_phys(addr, val);
1602 break;
1ec9b909
AK
1603 default: abort();
1604 }
6658ffb8
PB
1605}
1606
1ec9b909
AK
1607static const MemoryRegionOps watch_mem_ops = {
1608 .read = watch_mem_read,
1609 .write = watch_mem_write,
1610 .endianness = DEVICE_NATIVE_ENDIAN,
6658ffb8 1611};
6658ffb8 1612
a8170e5e 1613static uint64_t subpage_read(void *opaque, hwaddr addr,
70c68e44 1614 unsigned len)
db7b5426 1615{
acc9d80b
JK
1616 subpage_t *subpage = opaque;
1617 uint8_t buf[4];
791af8c8 1618
db7b5426 1619#if defined(DEBUG_SUBPAGE)
016e9d62 1620 printf("%s: subpage %p len %u addr " TARGET_FMT_plx "\n", __func__,
acc9d80b 1621 subpage, len, addr);
db7b5426 1622#endif
acc9d80b
JK
1623 address_space_read(subpage->as, addr + subpage->base, buf, len);
1624 switch (len) {
1625 case 1:
1626 return ldub_p(buf);
1627 case 2:
1628 return lduw_p(buf);
1629 case 4:
1630 return ldl_p(buf);
1631 default:
1632 abort();
1633 }
db7b5426
BS
1634}
1635
a8170e5e 1636static void subpage_write(void *opaque, hwaddr addr,
70c68e44 1637 uint64_t value, unsigned len)
db7b5426 1638{
acc9d80b
JK
1639 subpage_t *subpage = opaque;
1640 uint8_t buf[4];
1641
db7b5426 1642#if defined(DEBUG_SUBPAGE)
016e9d62 1643 printf("%s: subpage %p len %u addr " TARGET_FMT_plx
acc9d80b
JK
1644 " value %"PRIx64"\n",
1645 __func__, subpage, len, addr, value);
db7b5426 1646#endif
acc9d80b
JK
1647 switch (len) {
1648 case 1:
1649 stb_p(buf, value);
1650 break;
1651 case 2:
1652 stw_p(buf, value);
1653 break;
1654 case 4:
1655 stl_p(buf, value);
1656 break;
1657 default:
1658 abort();
1659 }
1660 address_space_write(subpage->as, addr + subpage->base, buf, len);
db7b5426
BS
1661}
1662
c353e4cc 1663static bool subpage_accepts(void *opaque, hwaddr addr,
016e9d62 1664 unsigned len, bool is_write)
c353e4cc 1665{
acc9d80b 1666 subpage_t *subpage = opaque;
c353e4cc 1667#if defined(DEBUG_SUBPAGE)
016e9d62 1668 printf("%s: subpage %p %c len %u addr " TARGET_FMT_plx "\n",
acc9d80b 1669 __func__, subpage, is_write ? 'w' : 'r', len, addr);
c353e4cc
PB
1670#endif
1671
acc9d80b 1672 return address_space_access_valid(subpage->as, addr + subpage->base,
016e9d62 1673 len, is_write);
c353e4cc
PB
1674}
1675
70c68e44
AK
1676static const MemoryRegionOps subpage_ops = {
1677 .read = subpage_read,
1678 .write = subpage_write,
c353e4cc 1679 .valid.accepts = subpage_accepts,
70c68e44 1680 .endianness = DEVICE_NATIVE_ENDIAN,
db7b5426
BS
1681};
1682
c227f099 1683static int subpage_register (subpage_t *mmio, uint32_t start, uint32_t end,
5312bd8b 1684 uint16_t section)
db7b5426
BS
1685{
1686 int idx, eidx;
1687
1688 if (start >= TARGET_PAGE_SIZE || end >= TARGET_PAGE_SIZE)
1689 return -1;
1690 idx = SUBPAGE_IDX(start);
1691 eidx = SUBPAGE_IDX(end);
1692#if defined(DEBUG_SUBPAGE)
016e9d62
AK
1693 printf("%s: %p start %08x end %08x idx %08x eidx %08x section %d\n",
1694 __func__, mmio, start, end, idx, eidx, section);
db7b5426 1695#endif
db7b5426 1696 for (; idx <= eidx; idx++) {
5312bd8b 1697 mmio->sub_section[idx] = section;
db7b5426
BS
1698 }
1699
1700 return 0;
1701}
1702
acc9d80b 1703static subpage_t *subpage_init(AddressSpace *as, hwaddr base)
db7b5426 1704{
c227f099 1705 subpage_t *mmio;
db7b5426 1706
7267c094 1707 mmio = g_malloc0(sizeof(subpage_t));
1eec614b 1708
acc9d80b 1709 mmio->as = as;
1eec614b 1710 mmio->base = base;
2c9b15ca 1711 memory_region_init_io(&mmio->iomem, NULL, &subpage_ops, mmio,
70c68e44 1712 "subpage", TARGET_PAGE_SIZE);
b3b00c78 1713 mmio->iomem.subpage = true;
db7b5426 1714#if defined(DEBUG_SUBPAGE)
016e9d62
AK
1715 printf("%s: %p base " TARGET_FMT_plx " len %08x\n", __func__,
1716 mmio, base, TARGET_PAGE_SIZE);
db7b5426 1717#endif
b41aac4f 1718 subpage_register(mmio, 0, TARGET_PAGE_SIZE-1, PHYS_SECTION_UNASSIGNED);
db7b5426
BS
1719
1720 return mmio;
1721}
1722
53cb28cb 1723static uint16_t dummy_section(PhysPageMap *map, MemoryRegion *mr)
5312bd8b
AK
1724{
1725 MemoryRegionSection section = {
1726 .mr = mr,
1727 .offset_within_address_space = 0,
1728 .offset_within_region = 0,
052e87b0 1729 .size = int128_2_64(),
5312bd8b
AK
1730 };
1731
53cb28cb 1732 return phys_section_add(map, &section);
5312bd8b
AK
1733}
1734
a8170e5e 1735MemoryRegion *iotlb_to_region(hwaddr index)
aa102231 1736{
53cb28cb
MA
1737 return address_space_memory.dispatch->map.sections[
1738 index & ~TARGET_PAGE_MASK].mr;
aa102231
AK
1739}
1740
e9179ce1
AK
1741static void io_mem_init(void)
1742{
2c9b15ca
PB
1743 memory_region_init_io(&io_mem_rom, NULL, &unassigned_mem_ops, NULL, "rom", UINT64_MAX);
1744 memory_region_init_io(&io_mem_unassigned, NULL, &unassigned_mem_ops, NULL,
0e0df1e2 1745 "unassigned", UINT64_MAX);
2c9b15ca 1746 memory_region_init_io(&io_mem_notdirty, NULL, &notdirty_mem_ops, NULL,
0e0df1e2 1747 "notdirty", UINT64_MAX);
2c9b15ca 1748 memory_region_init_io(&io_mem_watch, NULL, &watch_mem_ops, NULL,
1ec9b909 1749 "watch", UINT64_MAX);
e9179ce1
AK
1750}
1751
ac1970fb 1752static void mem_begin(MemoryListener *listener)
00752703
PB
1753{
1754 AddressSpace *as = container_of(listener, AddressSpace, dispatch_listener);
53cb28cb
MA
1755 AddressSpaceDispatch *d = g_new0(AddressSpaceDispatch, 1);
1756 uint16_t n;
1757
1758 n = dummy_section(&d->map, &io_mem_unassigned);
1759 assert(n == PHYS_SECTION_UNASSIGNED);
1760 n = dummy_section(&d->map, &io_mem_notdirty);
1761 assert(n == PHYS_SECTION_NOTDIRTY);
1762 n = dummy_section(&d->map, &io_mem_rom);
1763 assert(n == PHYS_SECTION_ROM);
1764 n = dummy_section(&d->map, &io_mem_watch);
1765 assert(n == PHYS_SECTION_WATCH);
00752703 1766
9736e55b 1767 d->phys_map = (PhysPageEntry) { .ptr = PHYS_MAP_NODE_NIL, .skip = 1 };
00752703
PB
1768 d->as = as;
1769 as->next_dispatch = d;
1770}
1771
1772static void mem_commit(MemoryListener *listener)
ac1970fb 1773{
89ae337a 1774 AddressSpace *as = container_of(listener, AddressSpace, dispatch_listener);
0475d94f
PB
1775 AddressSpaceDispatch *cur = as->dispatch;
1776 AddressSpaceDispatch *next = as->next_dispatch;
1777
53cb28cb 1778 phys_page_compact_all(next, next->map.nodes_nb);
b35ba30f 1779
0475d94f 1780 as->dispatch = next;
b41aac4f 1781
53cb28cb
MA
1782 if (cur) {
1783 phys_sections_free(&cur->map);
1784 g_free(cur);
1785 }
9affd6fc
PB
1786}
1787
1d71148e 1788static void tcg_commit(MemoryListener *listener)
50c1e149 1789{
182735ef 1790 CPUState *cpu;
117712c3
AK
1791
1792 /* since each CPU stores ram addresses in its TLB cache, we must
1793 reset the modified entries */
1794 /* XXX: slow ! */
bdc44640 1795 CPU_FOREACH(cpu) {
182735ef
AF
1796 CPUArchState *env = cpu->env_ptr;
1797
117712c3
AK
1798 tlb_flush(env, 1);
1799 }
50c1e149
AK
1800}
1801
93632747
AK
1802static void core_log_global_start(MemoryListener *listener)
1803{
1804 cpu_physical_memory_set_dirty_tracking(1);
1805}
1806
1807static void core_log_global_stop(MemoryListener *listener)
1808{
1809 cpu_physical_memory_set_dirty_tracking(0);
1810}
1811
93632747 1812static MemoryListener core_memory_listener = {
93632747
AK
1813 .log_global_start = core_log_global_start,
1814 .log_global_stop = core_log_global_stop,
ac1970fb 1815 .priority = 1,
93632747
AK
1816};
1817
1d71148e
AK
1818static MemoryListener tcg_memory_listener = {
1819 .commit = tcg_commit,
1820};
1821
ac1970fb
AK
1822void address_space_init_dispatch(AddressSpace *as)
1823{
00752703 1824 as->dispatch = NULL;
89ae337a 1825 as->dispatch_listener = (MemoryListener) {
ac1970fb 1826 .begin = mem_begin,
00752703 1827 .commit = mem_commit,
ac1970fb
AK
1828 .region_add = mem_add,
1829 .region_nop = mem_add,
1830 .priority = 0,
1831 };
89ae337a 1832 memory_listener_register(&as->dispatch_listener, as);
ac1970fb
AK
1833}
1834
83f3c251
AK
1835void address_space_destroy_dispatch(AddressSpace *as)
1836{
1837 AddressSpaceDispatch *d = as->dispatch;
1838
89ae337a 1839 memory_listener_unregister(&as->dispatch_listener);
83f3c251
AK
1840 g_free(d);
1841 as->dispatch = NULL;
1842}
1843
62152b8a
AK
1844static void memory_map_init(void)
1845{
7267c094 1846 system_memory = g_malloc(sizeof(*system_memory));
03f49957 1847
57271d63 1848 memory_region_init(system_memory, NULL, "system", UINT64_MAX);
7dca8043 1849 address_space_init(&address_space_memory, system_memory, "memory");
309cb471 1850
7267c094 1851 system_io = g_malloc(sizeof(*system_io));
3bb28b72
JK
1852 memory_region_init_io(system_io, NULL, &unassigned_io_ops, NULL, "io",
1853 65536);
7dca8043 1854 address_space_init(&address_space_io, system_io, "I/O");
93632747 1855
f6790af6 1856 memory_listener_register(&core_memory_listener, &address_space_memory);
2641689a
LG
1857 if (tcg_enabled()) {
1858 memory_listener_register(&tcg_memory_listener, &address_space_memory);
1859 }
62152b8a
AK
1860}
1861
1862MemoryRegion *get_system_memory(void)
1863{
1864 return system_memory;
1865}
1866
309cb471
AK
1867MemoryRegion *get_system_io(void)
1868{
1869 return system_io;
1870}
1871
e2eef170
PB
1872#endif /* !defined(CONFIG_USER_ONLY) */
1873
13eb76e0
FB
1874/* physical memory access (slow version, mainly for debug) */
1875#if defined(CONFIG_USER_ONLY)
f17ec444 1876int cpu_memory_rw_debug(CPUState *cpu, target_ulong addr,
a68fe89c 1877 uint8_t *buf, int len, int is_write)
13eb76e0
FB
1878{
1879 int l, flags;
1880 target_ulong page;
53a5960a 1881 void * p;
13eb76e0
FB
1882
1883 while (len > 0) {
1884 page = addr & TARGET_PAGE_MASK;
1885 l = (page + TARGET_PAGE_SIZE) - addr;
1886 if (l > len)
1887 l = len;
1888 flags = page_get_flags(page);
1889 if (!(flags & PAGE_VALID))
a68fe89c 1890 return -1;
13eb76e0
FB
1891 if (is_write) {
1892 if (!(flags & PAGE_WRITE))
a68fe89c 1893 return -1;
579a97f7 1894 /* XXX: this code should not depend on lock_user */
72fb7daa 1895 if (!(p = lock_user(VERIFY_WRITE, addr, l, 0)))
a68fe89c 1896 return -1;
72fb7daa
AJ
1897 memcpy(p, buf, l);
1898 unlock_user(p, addr, l);
13eb76e0
FB
1899 } else {
1900 if (!(flags & PAGE_READ))
a68fe89c 1901 return -1;
579a97f7 1902 /* XXX: this code should not depend on lock_user */
72fb7daa 1903 if (!(p = lock_user(VERIFY_READ, addr, l, 1)))
a68fe89c 1904 return -1;
72fb7daa 1905 memcpy(buf, p, l);
5b257578 1906 unlock_user(p, addr, 0);
13eb76e0
FB
1907 }
1908 len -= l;
1909 buf += l;
1910 addr += l;
1911 }
a68fe89c 1912 return 0;
13eb76e0 1913}
8df1cd07 1914
13eb76e0 1915#else
51d7a9eb 1916
a8170e5e
AK
1917static void invalidate_and_set_dirty(hwaddr addr,
1918 hwaddr length)
51d7a9eb 1919{
a2cd8c85 1920 if (cpu_physical_memory_is_clean(addr)) {
51d7a9eb
AP
1921 /* invalidate code */
1922 tb_invalidate_phys_page_range(addr, addr + length, 0);
1923 /* set dirty bit */
52159192
JQ
1924 cpu_physical_memory_set_dirty_flag(addr, DIRTY_MEMORY_VGA);
1925 cpu_physical_memory_set_dirty_flag(addr, DIRTY_MEMORY_MIGRATION);
51d7a9eb 1926 }
e226939d 1927 xen_modified_memory(addr, length);
51d7a9eb
AP
1928}
1929
2bbfa05d
PB
1930static inline bool memory_access_is_direct(MemoryRegion *mr, bool is_write)
1931{
1932 if (memory_region_is_ram(mr)) {
1933 return !(is_write && mr->readonly);
1934 }
1935 if (memory_region_is_romd(mr)) {
1936 return !is_write;
1937 }
1938
1939 return false;
1940}
1941
23326164 1942static int memory_access_size(MemoryRegion *mr, unsigned l, hwaddr addr)
82f2563f 1943{
e1622f4b 1944 unsigned access_size_max = mr->ops->valid.max_access_size;
23326164
RH
1945
1946 /* Regions are assumed to support 1-4 byte accesses unless
1947 otherwise specified. */
23326164
RH
1948 if (access_size_max == 0) {
1949 access_size_max = 4;
1950 }
1951
1952 /* Bound the maximum access by the alignment of the address. */
1953 if (!mr->ops->impl.unaligned) {
1954 unsigned align_size_max = addr & -addr;
1955 if (align_size_max != 0 && align_size_max < access_size_max) {
1956 access_size_max = align_size_max;
1957 }
82f2563f 1958 }
23326164
RH
1959
1960 /* Don't attempt accesses larger than the maximum. */
1961 if (l > access_size_max) {
1962 l = access_size_max;
82f2563f 1963 }
098178f2
PB
1964 if (l & (l - 1)) {
1965 l = 1 << (qemu_fls(l) - 1);
1966 }
23326164
RH
1967
1968 return l;
82f2563f
PB
1969}
1970
fd8aaa76 1971bool address_space_rw(AddressSpace *as, hwaddr addr, uint8_t *buf,
ac1970fb 1972 int len, bool is_write)
13eb76e0 1973{
149f54b5 1974 hwaddr l;
13eb76e0 1975 uint8_t *ptr;
791af8c8 1976 uint64_t val;
149f54b5 1977 hwaddr addr1;
5c8a00ce 1978 MemoryRegion *mr;
fd8aaa76 1979 bool error = false;
3b46e624 1980
13eb76e0 1981 while (len > 0) {
149f54b5 1982 l = len;
5c8a00ce 1983 mr = address_space_translate(as, addr, &addr1, &l, is_write);
3b46e624 1984
13eb76e0 1985 if (is_write) {
5c8a00ce
PB
1986 if (!memory_access_is_direct(mr, is_write)) {
1987 l = memory_access_size(mr, l, addr1);
4917cf44 1988 /* XXX: could force current_cpu to NULL to avoid
6a00d601 1989 potential bugs */
23326164
RH
1990 switch (l) {
1991 case 8:
1992 /* 64 bit write access */
1993 val = ldq_p(buf);
1994 error |= io_mem_write(mr, addr1, val, 8);
1995 break;
1996 case 4:
1c213d19 1997 /* 32 bit write access */
c27004ec 1998 val = ldl_p(buf);
5c8a00ce 1999 error |= io_mem_write(mr, addr1, val, 4);
23326164
RH
2000 break;
2001 case 2:
1c213d19 2002 /* 16 bit write access */
c27004ec 2003 val = lduw_p(buf);
5c8a00ce 2004 error |= io_mem_write(mr, addr1, val, 2);
23326164
RH
2005 break;
2006 case 1:
1c213d19 2007 /* 8 bit write access */
c27004ec 2008 val = ldub_p(buf);
5c8a00ce 2009 error |= io_mem_write(mr, addr1, val, 1);
23326164
RH
2010 break;
2011 default:
2012 abort();
13eb76e0 2013 }
2bbfa05d 2014 } else {
5c8a00ce 2015 addr1 += memory_region_get_ram_addr(mr);
13eb76e0 2016 /* RAM case */
5579c7f3 2017 ptr = qemu_get_ram_ptr(addr1);
13eb76e0 2018 memcpy(ptr, buf, l);
51d7a9eb 2019 invalidate_and_set_dirty(addr1, l);
13eb76e0
FB
2020 }
2021 } else {
5c8a00ce 2022 if (!memory_access_is_direct(mr, is_write)) {
13eb76e0 2023 /* I/O case */
5c8a00ce 2024 l = memory_access_size(mr, l, addr1);
23326164
RH
2025 switch (l) {
2026 case 8:
2027 /* 64 bit read access */
2028 error |= io_mem_read(mr, addr1, &val, 8);
2029 stq_p(buf, val);
2030 break;
2031 case 4:
13eb76e0 2032 /* 32 bit read access */
5c8a00ce 2033 error |= io_mem_read(mr, addr1, &val, 4);
c27004ec 2034 stl_p(buf, val);
23326164
RH
2035 break;
2036 case 2:
13eb76e0 2037 /* 16 bit read access */
5c8a00ce 2038 error |= io_mem_read(mr, addr1, &val, 2);
c27004ec 2039 stw_p(buf, val);
23326164
RH
2040 break;
2041 case 1:
1c213d19 2042 /* 8 bit read access */
5c8a00ce 2043 error |= io_mem_read(mr, addr1, &val, 1);
c27004ec 2044 stb_p(buf, val);
23326164
RH
2045 break;
2046 default:
2047 abort();
13eb76e0
FB
2048 }
2049 } else {
2050 /* RAM case */
5c8a00ce 2051 ptr = qemu_get_ram_ptr(mr->ram_addr + addr1);
f3705d53 2052 memcpy(buf, ptr, l);
13eb76e0
FB
2053 }
2054 }
2055 len -= l;
2056 buf += l;
2057 addr += l;
2058 }
fd8aaa76
PB
2059
2060 return error;
13eb76e0 2061}
8df1cd07 2062
fd8aaa76 2063bool address_space_write(AddressSpace *as, hwaddr addr,
ac1970fb
AK
2064 const uint8_t *buf, int len)
2065{
fd8aaa76 2066 return address_space_rw(as, addr, (uint8_t *)buf, len, true);
ac1970fb
AK
2067}
2068
fd8aaa76 2069bool address_space_read(AddressSpace *as, hwaddr addr, uint8_t *buf, int len)
ac1970fb 2070{
fd8aaa76 2071 return address_space_rw(as, addr, buf, len, false);
ac1970fb
AK
2072}
2073
2074
a8170e5e 2075void cpu_physical_memory_rw(hwaddr addr, uint8_t *buf,
ac1970fb
AK
2076 int len, int is_write)
2077{
fd8aaa76 2078 address_space_rw(&address_space_memory, addr, buf, len, is_write);
ac1970fb
AK
2079}
2080
582b55a9
AG
2081enum write_rom_type {
2082 WRITE_DATA,
2083 FLUSH_CACHE,
2084};
2085
2086static inline void cpu_physical_memory_write_rom_internal(
2087 hwaddr addr, const uint8_t *buf, int len, enum write_rom_type type)
d0ecd2aa 2088{
149f54b5 2089 hwaddr l;
d0ecd2aa 2090 uint8_t *ptr;
149f54b5 2091 hwaddr addr1;
5c8a00ce 2092 MemoryRegion *mr;
3b46e624 2093
d0ecd2aa 2094 while (len > 0) {
149f54b5 2095 l = len;
5c8a00ce
PB
2096 mr = address_space_translate(&address_space_memory,
2097 addr, &addr1, &l, true);
3b46e624 2098
5c8a00ce
PB
2099 if (!(memory_region_is_ram(mr) ||
2100 memory_region_is_romd(mr))) {
d0ecd2aa
FB
2101 /* do nothing */
2102 } else {
5c8a00ce 2103 addr1 += memory_region_get_ram_addr(mr);
d0ecd2aa 2104 /* ROM/RAM case */
5579c7f3 2105 ptr = qemu_get_ram_ptr(addr1);
582b55a9
AG
2106 switch (type) {
2107 case WRITE_DATA:
2108 memcpy(ptr, buf, l);
2109 invalidate_and_set_dirty(addr1, l);
2110 break;
2111 case FLUSH_CACHE:
2112 flush_icache_range((uintptr_t)ptr, (uintptr_t)ptr + l);
2113 break;
2114 }
d0ecd2aa
FB
2115 }
2116 len -= l;
2117 buf += l;
2118 addr += l;
2119 }
2120}
2121
582b55a9
AG
2122/* used for ROM loading : can write in RAM and ROM */
2123void cpu_physical_memory_write_rom(hwaddr addr,
2124 const uint8_t *buf, int len)
2125{
2126 cpu_physical_memory_write_rom_internal(addr, buf, len, WRITE_DATA);
2127}
2128
2129void cpu_flush_icache_range(hwaddr start, int len)
2130{
2131 /*
2132 * This function should do the same thing as an icache flush that was
2133 * triggered from within the guest. For TCG we are always cache coherent,
2134 * so there is no need to flush anything. For KVM / Xen we need to flush
2135 * the host's instruction cache at least.
2136 */
2137 if (tcg_enabled()) {
2138 return;
2139 }
2140
2141 cpu_physical_memory_write_rom_internal(start, NULL, len, FLUSH_CACHE);
2142}
2143
6d16c2f8 2144typedef struct {
d3e71559 2145 MemoryRegion *mr;
6d16c2f8 2146 void *buffer;
a8170e5e
AK
2147 hwaddr addr;
2148 hwaddr len;
6d16c2f8
AL
2149} BounceBuffer;
2150
2151static BounceBuffer bounce;
2152
ba223c29
AL
2153typedef struct MapClient {
2154 void *opaque;
2155 void (*callback)(void *opaque);
72cf2d4f 2156 QLIST_ENTRY(MapClient) link;
ba223c29
AL
2157} MapClient;
2158
72cf2d4f
BS
2159static QLIST_HEAD(map_client_list, MapClient) map_client_list
2160 = QLIST_HEAD_INITIALIZER(map_client_list);
ba223c29
AL
2161
2162void *cpu_register_map_client(void *opaque, void (*callback)(void *opaque))
2163{
7267c094 2164 MapClient *client = g_malloc(sizeof(*client));
ba223c29
AL
2165
2166 client->opaque = opaque;
2167 client->callback = callback;
72cf2d4f 2168 QLIST_INSERT_HEAD(&map_client_list, client, link);
ba223c29
AL
2169 return client;
2170}
2171
8b9c99d9 2172static void cpu_unregister_map_client(void *_client)
ba223c29
AL
2173{
2174 MapClient *client = (MapClient *)_client;
2175
72cf2d4f 2176 QLIST_REMOVE(client, link);
7267c094 2177 g_free(client);
ba223c29
AL
2178}
2179
2180static void cpu_notify_map_clients(void)
2181{
2182 MapClient *client;
2183
72cf2d4f
BS
2184 while (!QLIST_EMPTY(&map_client_list)) {
2185 client = QLIST_FIRST(&map_client_list);
ba223c29 2186 client->callback(client->opaque);
34d5e948 2187 cpu_unregister_map_client(client);
ba223c29
AL
2188 }
2189}
2190
51644ab7
PB
2191bool address_space_access_valid(AddressSpace *as, hwaddr addr, int len, bool is_write)
2192{
5c8a00ce 2193 MemoryRegion *mr;
51644ab7
PB
2194 hwaddr l, xlat;
2195
2196 while (len > 0) {
2197 l = len;
5c8a00ce
PB
2198 mr = address_space_translate(as, addr, &xlat, &l, is_write);
2199 if (!memory_access_is_direct(mr, is_write)) {
2200 l = memory_access_size(mr, l, addr);
2201 if (!memory_region_access_valid(mr, xlat, l, is_write)) {
51644ab7
PB
2202 return false;
2203 }
2204 }
2205
2206 len -= l;
2207 addr += l;
2208 }
2209 return true;
2210}
2211
6d16c2f8
AL
2212/* Map a physical memory region into a host virtual address.
2213 * May map a subset of the requested range, given by and returned in *plen.
2214 * May return NULL if resources needed to perform the mapping are exhausted.
2215 * Use only for reads OR writes - not for read-modify-write operations.
ba223c29
AL
2216 * Use cpu_register_map_client() to know when retrying the map operation is
2217 * likely to succeed.
6d16c2f8 2218 */
ac1970fb 2219void *address_space_map(AddressSpace *as,
a8170e5e
AK
2220 hwaddr addr,
2221 hwaddr *plen,
ac1970fb 2222 bool is_write)
6d16c2f8 2223{
a8170e5e 2224 hwaddr len = *plen;
e3127ae0
PB
2225 hwaddr done = 0;
2226 hwaddr l, xlat, base;
2227 MemoryRegion *mr, *this_mr;
2228 ram_addr_t raddr;
6d16c2f8 2229
e3127ae0
PB
2230 if (len == 0) {
2231 return NULL;
2232 }
38bee5dc 2233
e3127ae0
PB
2234 l = len;
2235 mr = address_space_translate(as, addr, &xlat, &l, is_write);
2236 if (!memory_access_is_direct(mr, is_write)) {
2237 if (bounce.buffer) {
2238 return NULL;
6d16c2f8 2239 }
e85d9db5
KW
2240 /* Avoid unbounded allocations */
2241 l = MIN(l, TARGET_PAGE_SIZE);
2242 bounce.buffer = qemu_memalign(TARGET_PAGE_SIZE, l);
e3127ae0
PB
2243 bounce.addr = addr;
2244 bounce.len = l;
d3e71559
PB
2245
2246 memory_region_ref(mr);
2247 bounce.mr = mr;
e3127ae0
PB
2248 if (!is_write) {
2249 address_space_read(as, addr, bounce.buffer, l);
8ab934f9 2250 }
6d16c2f8 2251
e3127ae0
PB
2252 *plen = l;
2253 return bounce.buffer;
2254 }
2255
2256 base = xlat;
2257 raddr = memory_region_get_ram_addr(mr);
2258
2259 for (;;) {
6d16c2f8
AL
2260 len -= l;
2261 addr += l;
e3127ae0
PB
2262 done += l;
2263 if (len == 0) {
2264 break;
2265 }
2266
2267 l = len;
2268 this_mr = address_space_translate(as, addr, &xlat, &l, is_write);
2269 if (this_mr != mr || xlat != base + done) {
2270 break;
2271 }
6d16c2f8 2272 }
e3127ae0 2273
d3e71559 2274 memory_region_ref(mr);
e3127ae0
PB
2275 *plen = done;
2276 return qemu_ram_ptr_length(raddr + base, plen);
6d16c2f8
AL
2277}
2278
ac1970fb 2279/* Unmaps a memory region previously mapped by address_space_map().
6d16c2f8
AL
2280 * Will also mark the memory as dirty if is_write == 1. access_len gives
2281 * the amount of memory that was actually read or written by the caller.
2282 */
a8170e5e
AK
2283void address_space_unmap(AddressSpace *as, void *buffer, hwaddr len,
2284 int is_write, hwaddr access_len)
6d16c2f8
AL
2285{
2286 if (buffer != bounce.buffer) {
d3e71559
PB
2287 MemoryRegion *mr;
2288 ram_addr_t addr1;
2289
2290 mr = qemu_ram_addr_from_host(buffer, &addr1);
2291 assert(mr != NULL);
6d16c2f8 2292 if (is_write) {
6d16c2f8
AL
2293 while (access_len) {
2294 unsigned l;
2295 l = TARGET_PAGE_SIZE;
2296 if (l > access_len)
2297 l = access_len;
51d7a9eb 2298 invalidate_and_set_dirty(addr1, l);
6d16c2f8
AL
2299 addr1 += l;
2300 access_len -= l;
2301 }
2302 }
868bb33f 2303 if (xen_enabled()) {
e41d7c69 2304 xen_invalidate_map_cache_entry(buffer);
050a0ddf 2305 }
d3e71559 2306 memory_region_unref(mr);
6d16c2f8
AL
2307 return;
2308 }
2309 if (is_write) {
ac1970fb 2310 address_space_write(as, bounce.addr, bounce.buffer, access_len);
6d16c2f8 2311 }
f8a83245 2312 qemu_vfree(bounce.buffer);
6d16c2f8 2313 bounce.buffer = NULL;
d3e71559 2314 memory_region_unref(bounce.mr);
ba223c29 2315 cpu_notify_map_clients();
6d16c2f8 2316}
d0ecd2aa 2317
a8170e5e
AK
2318void *cpu_physical_memory_map(hwaddr addr,
2319 hwaddr *plen,
ac1970fb
AK
2320 int is_write)
2321{
2322 return address_space_map(&address_space_memory, addr, plen, is_write);
2323}
2324
a8170e5e
AK
2325void cpu_physical_memory_unmap(void *buffer, hwaddr len,
2326 int is_write, hwaddr access_len)
ac1970fb
AK
2327{
2328 return address_space_unmap(&address_space_memory, buffer, len, is_write, access_len);
2329}
2330
8df1cd07 2331/* warning: addr must be aligned */
a8170e5e 2332static inline uint32_t ldl_phys_internal(hwaddr addr,
1e78bcc1 2333 enum device_endian endian)
8df1cd07 2334{
8df1cd07 2335 uint8_t *ptr;
791af8c8 2336 uint64_t val;
5c8a00ce 2337 MemoryRegion *mr;
149f54b5
PB
2338 hwaddr l = 4;
2339 hwaddr addr1;
8df1cd07 2340
5c8a00ce
PB
2341 mr = address_space_translate(&address_space_memory, addr, &addr1, &l,
2342 false);
2343 if (l < 4 || !memory_access_is_direct(mr, false)) {
8df1cd07 2344 /* I/O case */
5c8a00ce 2345 io_mem_read(mr, addr1, &val, 4);
1e78bcc1
AG
2346#if defined(TARGET_WORDS_BIGENDIAN)
2347 if (endian == DEVICE_LITTLE_ENDIAN) {
2348 val = bswap32(val);
2349 }
2350#else
2351 if (endian == DEVICE_BIG_ENDIAN) {
2352 val = bswap32(val);
2353 }
2354#endif
8df1cd07
FB
2355 } else {
2356 /* RAM case */
5c8a00ce 2357 ptr = qemu_get_ram_ptr((memory_region_get_ram_addr(mr)
06ef3525 2358 & TARGET_PAGE_MASK)
149f54b5 2359 + addr1);
1e78bcc1
AG
2360 switch (endian) {
2361 case DEVICE_LITTLE_ENDIAN:
2362 val = ldl_le_p(ptr);
2363 break;
2364 case DEVICE_BIG_ENDIAN:
2365 val = ldl_be_p(ptr);
2366 break;
2367 default:
2368 val = ldl_p(ptr);
2369 break;
2370 }
8df1cd07
FB
2371 }
2372 return val;
2373}
2374
a8170e5e 2375uint32_t ldl_phys(hwaddr addr)
1e78bcc1
AG
2376{
2377 return ldl_phys_internal(addr, DEVICE_NATIVE_ENDIAN);
2378}
2379
a8170e5e 2380uint32_t ldl_le_phys(hwaddr addr)
1e78bcc1
AG
2381{
2382 return ldl_phys_internal(addr, DEVICE_LITTLE_ENDIAN);
2383}
2384
a8170e5e 2385uint32_t ldl_be_phys(hwaddr addr)
1e78bcc1
AG
2386{
2387 return ldl_phys_internal(addr, DEVICE_BIG_ENDIAN);
2388}
2389
84b7b8e7 2390/* warning: addr must be aligned */
a8170e5e 2391static inline uint64_t ldq_phys_internal(hwaddr addr,
1e78bcc1 2392 enum device_endian endian)
84b7b8e7 2393{
84b7b8e7
FB
2394 uint8_t *ptr;
2395 uint64_t val;
5c8a00ce 2396 MemoryRegion *mr;
149f54b5
PB
2397 hwaddr l = 8;
2398 hwaddr addr1;
84b7b8e7 2399
5c8a00ce
PB
2400 mr = address_space_translate(&address_space_memory, addr, &addr1, &l,
2401 false);
2402 if (l < 8 || !memory_access_is_direct(mr, false)) {
84b7b8e7 2403 /* I/O case */
5c8a00ce 2404 io_mem_read(mr, addr1, &val, 8);
968a5627
PB
2405#if defined(TARGET_WORDS_BIGENDIAN)
2406 if (endian == DEVICE_LITTLE_ENDIAN) {
2407 val = bswap64(val);
2408 }
2409#else
2410 if (endian == DEVICE_BIG_ENDIAN) {
2411 val = bswap64(val);
2412 }
84b7b8e7
FB
2413#endif
2414 } else {
2415 /* RAM case */
5c8a00ce 2416 ptr = qemu_get_ram_ptr((memory_region_get_ram_addr(mr)
06ef3525 2417 & TARGET_PAGE_MASK)
149f54b5 2418 + addr1);
1e78bcc1
AG
2419 switch (endian) {
2420 case DEVICE_LITTLE_ENDIAN:
2421 val = ldq_le_p(ptr);
2422 break;
2423 case DEVICE_BIG_ENDIAN:
2424 val = ldq_be_p(ptr);
2425 break;
2426 default:
2427 val = ldq_p(ptr);
2428 break;
2429 }
84b7b8e7
FB
2430 }
2431 return val;
2432}
2433
a8170e5e 2434uint64_t ldq_phys(hwaddr addr)
1e78bcc1
AG
2435{
2436 return ldq_phys_internal(addr, DEVICE_NATIVE_ENDIAN);
2437}
2438
a8170e5e 2439uint64_t ldq_le_phys(hwaddr addr)
1e78bcc1
AG
2440{
2441 return ldq_phys_internal(addr, DEVICE_LITTLE_ENDIAN);
2442}
2443
a8170e5e 2444uint64_t ldq_be_phys(hwaddr addr)
1e78bcc1
AG
2445{
2446 return ldq_phys_internal(addr, DEVICE_BIG_ENDIAN);
2447}
2448
aab33094 2449/* XXX: optimize */
a8170e5e 2450uint32_t ldub_phys(hwaddr addr)
aab33094
FB
2451{
2452 uint8_t val;
2453 cpu_physical_memory_read(addr, &val, 1);
2454 return val;
2455}
2456
733f0b02 2457/* warning: addr must be aligned */
a8170e5e 2458static inline uint32_t lduw_phys_internal(hwaddr addr,
1e78bcc1 2459 enum device_endian endian)
aab33094 2460{
733f0b02
MT
2461 uint8_t *ptr;
2462 uint64_t val;
5c8a00ce 2463 MemoryRegion *mr;
149f54b5
PB
2464 hwaddr l = 2;
2465 hwaddr addr1;
733f0b02 2466
5c8a00ce
PB
2467 mr = address_space_translate(&address_space_memory, addr, &addr1, &l,
2468 false);
2469 if (l < 2 || !memory_access_is_direct(mr, false)) {
733f0b02 2470 /* I/O case */
5c8a00ce 2471 io_mem_read(mr, addr1, &val, 2);
1e78bcc1
AG
2472#if defined(TARGET_WORDS_BIGENDIAN)
2473 if (endian == DEVICE_LITTLE_ENDIAN) {
2474 val = bswap16(val);
2475 }
2476#else
2477 if (endian == DEVICE_BIG_ENDIAN) {
2478 val = bswap16(val);
2479 }
2480#endif
733f0b02
MT
2481 } else {
2482 /* RAM case */
5c8a00ce 2483 ptr = qemu_get_ram_ptr((memory_region_get_ram_addr(mr)
06ef3525 2484 & TARGET_PAGE_MASK)
149f54b5 2485 + addr1);
1e78bcc1
AG
2486 switch (endian) {
2487 case DEVICE_LITTLE_ENDIAN:
2488 val = lduw_le_p(ptr);
2489 break;
2490 case DEVICE_BIG_ENDIAN:
2491 val = lduw_be_p(ptr);
2492 break;
2493 default:
2494 val = lduw_p(ptr);
2495 break;
2496 }
733f0b02
MT
2497 }
2498 return val;
aab33094
FB
2499}
2500
a8170e5e 2501uint32_t lduw_phys(hwaddr addr)
1e78bcc1
AG
2502{
2503 return lduw_phys_internal(addr, DEVICE_NATIVE_ENDIAN);
2504}
2505
a8170e5e 2506uint32_t lduw_le_phys(hwaddr addr)
1e78bcc1
AG
2507{
2508 return lduw_phys_internal(addr, DEVICE_LITTLE_ENDIAN);
2509}
2510
a8170e5e 2511uint32_t lduw_be_phys(hwaddr addr)
1e78bcc1
AG
2512{
2513 return lduw_phys_internal(addr, DEVICE_BIG_ENDIAN);
2514}
2515
8df1cd07
FB
2516/* warning: addr must be aligned. The ram page is not masked as dirty
2517 and the code inside is not invalidated. It is useful if the dirty
2518 bits are used to track modified PTEs */
a8170e5e 2519void stl_phys_notdirty(hwaddr addr, uint32_t val)
8df1cd07 2520{
8df1cd07 2521 uint8_t *ptr;
5c8a00ce 2522 MemoryRegion *mr;
149f54b5
PB
2523 hwaddr l = 4;
2524 hwaddr addr1;
8df1cd07 2525
5c8a00ce
PB
2526 mr = address_space_translate(&address_space_memory, addr, &addr1, &l,
2527 true);
2528 if (l < 4 || !memory_access_is_direct(mr, true)) {
2529 io_mem_write(mr, addr1, val, 4);
8df1cd07 2530 } else {
5c8a00ce 2531 addr1 += memory_region_get_ram_addr(mr) & TARGET_PAGE_MASK;
5579c7f3 2532 ptr = qemu_get_ram_ptr(addr1);
8df1cd07 2533 stl_p(ptr, val);
74576198
AL
2534
2535 if (unlikely(in_migration)) {
a2cd8c85 2536 if (cpu_physical_memory_is_clean(addr1)) {
74576198
AL
2537 /* invalidate code */
2538 tb_invalidate_phys_page_range(addr1, addr1 + 4, 0);
2539 /* set dirty bit */
52159192
JQ
2540 cpu_physical_memory_set_dirty_flag(addr1,
2541 DIRTY_MEMORY_MIGRATION);
2542 cpu_physical_memory_set_dirty_flag(addr1, DIRTY_MEMORY_VGA);
74576198
AL
2543 }
2544 }
8df1cd07
FB
2545 }
2546}
2547
2548/* warning: addr must be aligned */
a8170e5e 2549static inline void stl_phys_internal(hwaddr addr, uint32_t val,
1e78bcc1 2550 enum device_endian endian)
8df1cd07 2551{
8df1cd07 2552 uint8_t *ptr;
5c8a00ce 2553 MemoryRegion *mr;
149f54b5
PB
2554 hwaddr l = 4;
2555 hwaddr addr1;
8df1cd07 2556
5c8a00ce
PB
2557 mr = address_space_translate(&address_space_memory, addr, &addr1, &l,
2558 true);
2559 if (l < 4 || !memory_access_is_direct(mr, true)) {
1e78bcc1
AG
2560#if defined(TARGET_WORDS_BIGENDIAN)
2561 if (endian == DEVICE_LITTLE_ENDIAN) {
2562 val = bswap32(val);
2563 }
2564#else
2565 if (endian == DEVICE_BIG_ENDIAN) {
2566 val = bswap32(val);
2567 }
2568#endif
5c8a00ce 2569 io_mem_write(mr, addr1, val, 4);
8df1cd07 2570 } else {
8df1cd07 2571 /* RAM case */
5c8a00ce 2572 addr1 += memory_region_get_ram_addr(mr) & TARGET_PAGE_MASK;
5579c7f3 2573 ptr = qemu_get_ram_ptr(addr1);
1e78bcc1
AG
2574 switch (endian) {
2575 case DEVICE_LITTLE_ENDIAN:
2576 stl_le_p(ptr, val);
2577 break;
2578 case DEVICE_BIG_ENDIAN:
2579 stl_be_p(ptr, val);
2580 break;
2581 default:
2582 stl_p(ptr, val);
2583 break;
2584 }
51d7a9eb 2585 invalidate_and_set_dirty(addr1, 4);
8df1cd07
FB
2586 }
2587}
2588
a8170e5e 2589void stl_phys(hwaddr addr, uint32_t val)
1e78bcc1
AG
2590{
2591 stl_phys_internal(addr, val, DEVICE_NATIVE_ENDIAN);
2592}
2593
a8170e5e 2594void stl_le_phys(hwaddr addr, uint32_t val)
1e78bcc1
AG
2595{
2596 stl_phys_internal(addr, val, DEVICE_LITTLE_ENDIAN);
2597}
2598
a8170e5e 2599void stl_be_phys(hwaddr addr, uint32_t val)
1e78bcc1
AG
2600{
2601 stl_phys_internal(addr, val, DEVICE_BIG_ENDIAN);
2602}
2603
aab33094 2604/* XXX: optimize */
a8170e5e 2605void stb_phys(hwaddr addr, uint32_t val)
aab33094
FB
2606{
2607 uint8_t v = val;
2608 cpu_physical_memory_write(addr, &v, 1);
2609}
2610
733f0b02 2611/* warning: addr must be aligned */
a8170e5e 2612static inline void stw_phys_internal(hwaddr addr, uint32_t val,
1e78bcc1 2613 enum device_endian endian)
aab33094 2614{
733f0b02 2615 uint8_t *ptr;
5c8a00ce 2616 MemoryRegion *mr;
149f54b5
PB
2617 hwaddr l = 2;
2618 hwaddr addr1;
733f0b02 2619
5c8a00ce
PB
2620 mr = address_space_translate(&address_space_memory, addr, &addr1, &l,
2621 true);
2622 if (l < 2 || !memory_access_is_direct(mr, true)) {
1e78bcc1
AG
2623#if defined(TARGET_WORDS_BIGENDIAN)
2624 if (endian == DEVICE_LITTLE_ENDIAN) {
2625 val = bswap16(val);
2626 }
2627#else
2628 if (endian == DEVICE_BIG_ENDIAN) {
2629 val = bswap16(val);
2630 }
2631#endif
5c8a00ce 2632 io_mem_write(mr, addr1, val, 2);
733f0b02 2633 } else {
733f0b02 2634 /* RAM case */
5c8a00ce 2635 addr1 += memory_region_get_ram_addr(mr) & TARGET_PAGE_MASK;
733f0b02 2636 ptr = qemu_get_ram_ptr(addr1);
1e78bcc1
AG
2637 switch (endian) {
2638 case DEVICE_LITTLE_ENDIAN:
2639 stw_le_p(ptr, val);
2640 break;
2641 case DEVICE_BIG_ENDIAN:
2642 stw_be_p(ptr, val);
2643 break;
2644 default:
2645 stw_p(ptr, val);
2646 break;
2647 }
51d7a9eb 2648 invalidate_and_set_dirty(addr1, 2);
733f0b02 2649 }
aab33094
FB
2650}
2651
a8170e5e 2652void stw_phys(hwaddr addr, uint32_t val)
1e78bcc1
AG
2653{
2654 stw_phys_internal(addr, val, DEVICE_NATIVE_ENDIAN);
2655}
2656
a8170e5e 2657void stw_le_phys(hwaddr addr, uint32_t val)
1e78bcc1
AG
2658{
2659 stw_phys_internal(addr, val, DEVICE_LITTLE_ENDIAN);
2660}
2661
a8170e5e 2662void stw_be_phys(hwaddr addr, uint32_t val)
1e78bcc1
AG
2663{
2664 stw_phys_internal(addr, val, DEVICE_BIG_ENDIAN);
2665}
2666
aab33094 2667/* XXX: optimize */
a8170e5e 2668void stq_phys(hwaddr addr, uint64_t val)
aab33094
FB
2669{
2670 val = tswap64(val);
71d2b725 2671 cpu_physical_memory_write(addr, &val, 8);
aab33094
FB
2672}
2673
a8170e5e 2674void stq_le_phys(hwaddr addr, uint64_t val)
1e78bcc1
AG
2675{
2676 val = cpu_to_le64(val);
2677 cpu_physical_memory_write(addr, &val, 8);
2678}
2679
a8170e5e 2680void stq_be_phys(hwaddr addr, uint64_t val)
1e78bcc1
AG
2681{
2682 val = cpu_to_be64(val);
2683 cpu_physical_memory_write(addr, &val, 8);
2684}
2685
5e2972fd 2686/* virtual memory access for debug (includes writing to ROM) */
f17ec444 2687int cpu_memory_rw_debug(CPUState *cpu, target_ulong addr,
b448f2f3 2688 uint8_t *buf, int len, int is_write)
13eb76e0
FB
2689{
2690 int l;
a8170e5e 2691 hwaddr phys_addr;
9b3c35e0 2692 target_ulong page;
13eb76e0
FB
2693
2694 while (len > 0) {
2695 page = addr & TARGET_PAGE_MASK;
f17ec444 2696 phys_addr = cpu_get_phys_page_debug(cpu, page);
13eb76e0
FB
2697 /* if no physical page mapped, return an error */
2698 if (phys_addr == -1)
2699 return -1;
2700 l = (page + TARGET_PAGE_SIZE) - addr;
2701 if (l > len)
2702 l = len;
5e2972fd 2703 phys_addr += (addr & ~TARGET_PAGE_MASK);
5e2972fd
AL
2704 if (is_write)
2705 cpu_physical_memory_write_rom(phys_addr, buf, l);
2706 else
5e2972fd 2707 cpu_physical_memory_rw(phys_addr, buf, l, is_write);
13eb76e0
FB
2708 len -= l;
2709 buf += l;
2710 addr += l;
2711 }
2712 return 0;
2713}
a68fe89c 2714#endif
13eb76e0 2715
8e4a424b
BS
2716#if !defined(CONFIG_USER_ONLY)
2717
2718/*
2719 * A helper function for the _utterly broken_ virtio device model to find out if
2720 * it's running on a big endian machine. Don't do this at home kids!
2721 */
2722bool virtio_is_big_endian(void);
2723bool virtio_is_big_endian(void)
2724{
2725#if defined(TARGET_WORDS_BIGENDIAN)
2726 return true;
2727#else
2728 return false;
2729#endif
2730}
2731
2732#endif
2733
76f35538 2734#ifndef CONFIG_USER_ONLY
a8170e5e 2735bool cpu_physical_memory_is_io(hwaddr phys_addr)
76f35538 2736{
5c8a00ce 2737 MemoryRegion*mr;
149f54b5 2738 hwaddr l = 1;
76f35538 2739
5c8a00ce
PB
2740 mr = address_space_translate(&address_space_memory,
2741 phys_addr, &phys_addr, &l, false);
76f35538 2742
5c8a00ce
PB
2743 return !(memory_region_is_ram(mr) ||
2744 memory_region_is_romd(mr));
76f35538 2745}
bd2fa51f
MH
2746
2747void qemu_ram_foreach_block(RAMBlockIterFunc func, void *opaque)
2748{
2749 RAMBlock *block;
2750
2751 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
2752 func(block->host, block->offset, block->length, opaque);
2753 }
2754}
ec3f8c99 2755#endif