/*
 *  Common CPU TLB handling
 *
 *  Copyright (c) 2003 Fabrice Bellard
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 */

#include "qemu/osdep.h"
#include "qemu/main-loop.h"
#include "cpu.h"
#include "exec/exec-all.h"
#include "exec/memory.h"
#include "exec/address-spaces.h"
#include "exec/cpu_ldst.h"
#include "exec/cputlb.h"
#include "exec/memory-internal.h"
#include "exec/ram_addr.h"
#include "tcg/tcg.h"
#include "qemu/error-report.h"
#include "exec/log.h"
#include "exec/helper-proto.h"
#include "qemu/atomic.h"
#include "qemu/atomic128.h"

/* DEBUG defines, enable DEBUG_TLB_LOG to log to the CPU_LOG_MMU target */
/* #define DEBUG_TLB */
/* #define DEBUG_TLB_LOG */

#ifdef DEBUG_TLB
# define DEBUG_TLB_GATE 1
# ifdef DEBUG_TLB_LOG
#  define DEBUG_TLB_LOG_GATE 1
# else
#  define DEBUG_TLB_LOG_GATE 0
# endif
#else
# define DEBUG_TLB_GATE 0
# define DEBUG_TLB_LOG_GATE 0
#endif

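/*
 * The gates above are 0/1 constants rather than #ifdefs around the callers,
 * so the debug code below is always parsed and type-checked; when a gate is
 * zero the compiler eliminates the dead branch entirely.
 */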
#define tlb_debug(fmt, ...) do { \
    if (DEBUG_TLB_LOG_GATE) { \
        qemu_log_mask(CPU_LOG_MMU, "%s: " fmt, __func__, \
                      ## __VA_ARGS__); \
    } else if (DEBUG_TLB_GATE) { \
        fprintf(stderr, "%s: " fmt, __func__, ## __VA_ARGS__); \
    } \
} while (0)

#define assert_cpu_is_self(cpu) do {                              \
        if (DEBUG_TLB_GATE) {                                     \
            g_assert(!(cpu)->created || qemu_cpu_is_self(cpu));   \
        }                                                         \
    } while (0)

/* run_on_cpu_data.target_ptr should always be big enough for a
 * target_ulong even on 32-bit builds */
QEMU_BUILD_BUG_ON(sizeof(target_ulong) > sizeof(run_on_cpu_data));

/* We currently can't handle more than 16 bits in the MMUIDX bitmask. */
QEMU_BUILD_BUG_ON(NB_MMU_MODES > 16);
#define ALL_MMUIDX_BITS ((1 << NB_MMU_MODES) - 1)

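/*
 * Size in bytes of the mmu_idx'th dynamic TLB. tlb_mask holds
 * (n_entries - 1) << CPU_TLB_ENTRY_BITS, so adding one entry's worth of
 * bytes recovers the full table size.
 */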
static inline size_t sizeof_tlb(CPUArchState *env, uintptr_t mmu_idx)
{
    return env->tlb_mask[mmu_idx] + (1 << CPU_TLB_ENTRY_BITS);
}

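/* Begin a new observation window for the TLB resize heuristic below. */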
static void tlb_window_reset(CPUTLBWindow *window, int64_t ns,
                             size_t max_entries)
{
    window->begin_ns = ns;
    window->max_entries = max_entries;
}

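/*
 * Allocate each MMU mode's TLB at the default dynamic size, starting with
 * an empty sizing window; called once per vCPU from tlb_init().
 */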
static void tlb_dyn_init(CPUArchState *env)
{
    int i;

    for (i = 0; i < NB_MMU_MODES; i++) {
        CPUTLBDesc *desc = &env->tlb_d[i];
        size_t n_entries = 1 << CPU_TLB_DYN_DEFAULT_BITS;

        tlb_window_reset(&desc->window, get_clock_realtime(), 0);
        desc->n_used_entries = 0;
        env->tlb_mask[i] = (n_entries - 1) << CPU_TLB_ENTRY_BITS;
        env->tlb_table[i] = g_new(CPUTLBEntry, n_entries);
        env->iotlb[i] = g_new(CPUIOTLBEntry, n_entries);
    }
}

/**
 * tlb_mmu_resize_locked() - perform TLB resize bookkeeping; resize if necessary
 * @env: CPU that owns the TLB
 * @mmu_idx: MMU index of the TLB
 *
 * Called with tlb_lock held.
 *
 * We have two main constraints when resizing a TLB: (1) we only resize it
 * on a TLB flush (otherwise we'd have to take a perf hit by either rehashing
 * the array or unnecessarily flushing it), which means we do not control how
 * frequently the resizing can occur; (2) we don't have access to the guest's
 * future scheduling decisions, and therefore have to decide the magnitude of
 * the resize based on past observations.
 *
 * In general, a memory-hungry process can benefit greatly from an appropriately
 * sized TLB, since a guest TLB miss is very expensive. This doesn't mean that
 * we just have to make the TLB as large as possible; while an oversized TLB
 * results in minimal TLB miss rates, it also takes longer to be flushed
 * (flushes can be _very_ frequent), and the reduced locality can also hurt
 * performance.
 *
 * To achieve near-optimal performance for all kinds of workloads, we:
 *
 * 1. Aggressively increase the size of the TLB when the use rate of the
 * TLB being flushed is high, since it is likely that in the near future this
 * memory-hungry process will execute again, and its memory hungriness will
 * probably be similar.
 *
 * 2. Slowly reduce the size of the TLB as the use rate declines over a
 * reasonably large time window. The rationale is that if in such a time window
 * we have not observed a high TLB use rate, it is likely that we won't observe
 * it in the near future. In that case, once a time window expires we downsize
 * the TLB to match the maximum use rate observed in the window.
 *
 * 3. Try to keep the maximum use rate in a time window in the 30-70% range,
 * since in that range performance is likely near-optimal. Recall that the TLB
 * is direct mapped, so we want the use rate to be low (or at least not too
 * high), since otherwise we are likely to have a significant amount of
 * conflict misses.
 */
static void tlb_mmu_resize_locked(CPUArchState *env, int mmu_idx)
{
    CPUTLBDesc *desc = &env->tlb_d[mmu_idx];
    size_t old_size = tlb_n_entries(env, mmu_idx);
    size_t rate;
    size_t new_size = old_size;
    int64_t now = get_clock_realtime();
    int64_t window_len_ms = 100;
    int64_t window_len_ns = window_len_ms * 1000 * 1000;
    bool window_expired = now > desc->window.begin_ns + window_len_ns;

    if (desc->n_used_entries > desc->window.max_entries) {
        desc->window.max_entries = desc->n_used_entries;
    }
    rate = desc->window.max_entries * 100 / old_size;

    if (rate > 70) {
        new_size = MIN(old_size << 1, 1 << CPU_TLB_DYN_MAX_BITS);
    } else if (rate < 30 && window_expired) {
        size_t ceil = pow2ceil(desc->window.max_entries);
        size_t expected_rate = desc->window.max_entries * 100 / ceil;

        /*
         * Avoid undersizing when the max number of entries seen is just below
         * a pow2. For instance, if max_entries == 1025, the expected use rate
         * would be 1025/2048==50%. However, if max_entries == 1023, we'd get
         * 1023/1024==99.9% use rate, so we'd likely end up doubling the size
         * later. Thus, make sure that the expected use rate remains below 70%.
         * (and since we double the size, that means the lowest rate we'd
         * expect to get is 35%, which is still in the 30-70% range where
         * we consider that the size is appropriate.)
         */
        if (expected_rate > 70) {
            ceil *= 2;
        }
        new_size = MAX(ceil, 1 << CPU_TLB_DYN_MIN_BITS);
    }

    if (new_size == old_size) {
        if (window_expired) {
            tlb_window_reset(&desc->window, now, desc->n_used_entries);
        }
        return;
    }

    g_free(env->tlb_table[mmu_idx]);
    g_free(env->iotlb[mmu_idx]);

    tlb_window_reset(&desc->window, now, 0);
    /* desc->n_used_entries is cleared by the caller */
    env->tlb_mask[mmu_idx] = (new_size - 1) << CPU_TLB_ENTRY_BITS;
    env->tlb_table[mmu_idx] = g_try_new(CPUTLBEntry, new_size);
    env->iotlb[mmu_idx] = g_try_new(CPUIOTLBEntry, new_size);
    /*
     * If the allocations fail, try smaller sizes. We just freed some
     * memory, so going back to half of new_size has a good chance of working.
     * Increased memory pressure elsewhere in the system might cause the
     * allocations to fail though, so we progressively reduce the allocation
     * size, aborting if we cannot even allocate the smallest TLB we support.
     */
    while (env->tlb_table[mmu_idx] == NULL || env->iotlb[mmu_idx] == NULL) {
        if (new_size == (1 << CPU_TLB_DYN_MIN_BITS)) {
            error_report("%s: %s", __func__, strerror(errno));
            abort();
        }
        new_size = MAX(new_size >> 1, 1 << CPU_TLB_DYN_MIN_BITS);
        env->tlb_mask[mmu_idx] = (new_size - 1) << CPU_TLB_ENTRY_BITS;

        g_free(env->tlb_table[mmu_idx]);
        g_free(env->iotlb[mmu_idx]);
        env->tlb_table[mmu_idx] = g_try_new(CPUTLBEntry, new_size);
        env->iotlb[mmu_idx] = g_try_new(CPUIOTLBEntry, new_size);
    }
}

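/*
 * Flush (and possibly resize) one mode's main table; called with tlb_c.lock
 * held. Setting every byte to -1 makes each comparator field an address
 * that can never match, cf. tlb_entry_is_empty() below.
 */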
static inline void tlb_table_flush_by_mmuidx(CPUArchState *env, int mmu_idx)
{
    tlb_mmu_resize_locked(env, mmu_idx);
    memset(env->tlb_table[mmu_idx], -1, sizeof_tlb(env, mmu_idx));
    env->tlb_d[mmu_idx].n_used_entries = 0;
}

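/* Use-rate bookkeeping for the resize heuristic; callers hold tlb_c.lock. */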
static inline void tlb_n_used_entries_inc(CPUArchState *env, uintptr_t mmu_idx)
{
    env->tlb_d[mmu_idx].n_used_entries++;
}

static inline void tlb_n_used_entries_dec(CPUArchState *env, uintptr_t mmu_idx)
{
    env->tlb_d[mmu_idx].n_used_entries--;
}

void tlb_init(CPUState *cpu)
{
    CPUArchState *env = cpu->env_ptr;

    qemu_spin_init(&env->tlb_c.lock);

    /* Ensure that cpu_reset performs a full flush.  */
    env->tlb_c.dirty = ALL_MMUIDX_BITS;

    tlb_dyn_init(env);
}

/* flush_all_helper: run fn across all cpus
 *
 * Queues fn as async work on every CPU except src; src itself is left to
 * the caller, which either runs fn directly or (in the *_synced variants)
 * queues it as "safe" work, creating a synchronisation point where all
 * queued work is finished before execution starts again.
 */
static void flush_all_helper(CPUState *src, run_on_cpu_func fn,
                             run_on_cpu_data d)
{
    CPUState *cpu;

    CPU_FOREACH(cpu) {
        if (cpu != src) {
            async_run_on_cpu(cpu, fn, d);
        }
    }
}

void tlb_flush_counts(size_t *pfull, size_t *ppart, size_t *pelide)
{
    CPUState *cpu;
    size_t full = 0, part = 0, elide = 0;

    CPU_FOREACH(cpu) {
        CPUArchState *env = cpu->env_ptr;

        full += atomic_read(&env->tlb_c.full_flush_count);
        part += atomic_read(&env->tlb_c.part_flush_count);
        elide += atomic_read(&env->tlb_c.elide_flush_count);
    }
    *pfull = full;
    *ppart = part;
    *pelide = elide;
}

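/*
 * Reset one mode's main table, victim TLB and large-page tracking; called
 * with tlb_c.lock held.
 */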
static void tlb_flush_one_mmuidx_locked(CPUArchState *env, int mmu_idx)
{
    tlb_table_flush_by_mmuidx(env, mmu_idx);
    memset(env->tlb_v_table[mmu_idx], -1, sizeof(env->tlb_v_table[0]));
    env->tlb_d[mmu_idx].large_page_addr = -1;
    env->tlb_d[mmu_idx].large_page_mask = -1;
    env->tlb_d[mmu_idx].vindex = 0;
}

static void tlb_flush_by_mmuidx_async_work(CPUState *cpu, run_on_cpu_data data)
{
    CPUArchState *env = cpu->env_ptr;
    uint16_t asked = data.host_int;
    uint16_t all_dirty, work, to_clean;

    assert_cpu_is_self(cpu);

    tlb_debug("mmu_idx:0x%04" PRIx16 "\n", asked);

    qemu_spin_lock(&env->tlb_c.lock);

    all_dirty = env->tlb_c.dirty;
    to_clean = asked & all_dirty;
    all_dirty &= ~to_clean;
    env->tlb_c.dirty = all_dirty;

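    /*
     * Process one requested-and-dirty mmu_idx per iteration:
     * "work &= work - 1" clears the lowest set bit, which ctz32()
     * has just selected.
     */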
    for (work = to_clean; work != 0; work &= work - 1) {
        int mmu_idx = ctz32(work);
        tlb_flush_one_mmuidx_locked(env, mmu_idx);
    }

    qemu_spin_unlock(&env->tlb_c.lock);

    cpu_tb_jmp_cache_clear(cpu);

    if (to_clean == ALL_MMUIDX_BITS) {
        atomic_set(&env->tlb_c.full_flush_count,
                   env->tlb_c.full_flush_count + 1);
    } else {
        atomic_set(&env->tlb_c.part_flush_count,
                   env->tlb_c.part_flush_count + ctpop16(to_clean));
        if (to_clean != asked) {
            atomic_set(&env->tlb_c.elide_flush_count,
                       env->tlb_c.elide_flush_count +
                       ctpop16(asked & ~to_clean));
        }
    }
}

void tlb_flush_by_mmuidx(CPUState *cpu, uint16_t idxmap)
{
    tlb_debug("mmu_idx: 0x%" PRIx16 "\n", idxmap);

    if (cpu->created && !qemu_cpu_is_self(cpu)) {
        async_run_on_cpu(cpu, tlb_flush_by_mmuidx_async_work,
                         RUN_ON_CPU_HOST_INT(idxmap));
    } else {
        tlb_flush_by_mmuidx_async_work(cpu, RUN_ON_CPU_HOST_INT(idxmap));
    }
}

void tlb_flush(CPUState *cpu)
{
    tlb_flush_by_mmuidx(cpu, ALL_MMUIDX_BITS);
}

void tlb_flush_by_mmuidx_all_cpus(CPUState *src_cpu, uint16_t idxmap)
{
    const run_on_cpu_func fn = tlb_flush_by_mmuidx_async_work;

    tlb_debug("mmu_idx: 0x%"PRIx16"\n", idxmap);

    flush_all_helper(src_cpu, fn, RUN_ON_CPU_HOST_INT(idxmap));
    fn(src_cpu, RUN_ON_CPU_HOST_INT(idxmap));
}

void tlb_flush_all_cpus(CPUState *src_cpu)
{
    tlb_flush_by_mmuidx_all_cpus(src_cpu, ALL_MMUIDX_BITS);
}

void tlb_flush_by_mmuidx_all_cpus_synced(CPUState *src_cpu, uint16_t idxmap)
{
    const run_on_cpu_func fn = tlb_flush_by_mmuidx_async_work;

    tlb_debug("mmu_idx: 0x%"PRIx16"\n", idxmap);

    flush_all_helper(src_cpu, fn, RUN_ON_CPU_HOST_INT(idxmap));
    async_safe_run_on_cpu(src_cpu, fn, RUN_ON_CPU_HOST_INT(idxmap));
}

void tlb_flush_all_cpus_synced(CPUState *src_cpu)
{
    tlb_flush_by_mmuidx_all_cpus_synced(src_cpu, ALL_MMUIDX_BITS);
}

static inline bool tlb_hit_page_anyprot(CPUTLBEntry *tlb_entry,
                                        target_ulong page)
{
    return tlb_hit_page(tlb_entry->addr_read, page) ||
           tlb_hit_page(tlb_addr_write(tlb_entry), page) ||
           tlb_hit_page(tlb_entry->addr_code, page);
}

/**
 * tlb_entry_is_empty - return true if the entry is not in use
 * @te: pointer to CPUTLBEntry
 */
static inline bool tlb_entry_is_empty(const CPUTLBEntry *te)
{
    return te->addr_read == -1 && te->addr_write == -1 && te->addr_code == -1;
}

/* Called with tlb_c.lock held */
static inline bool tlb_flush_entry_locked(CPUTLBEntry *tlb_entry,
                                          target_ulong page)
{
    if (tlb_hit_page_anyprot(tlb_entry, page)) {
        memset(tlb_entry, -1, sizeof(*tlb_entry));
        return true;
    }
    return false;
}

/* Called with tlb_c.lock held */
static inline void tlb_flush_vtlb_page_locked(CPUArchState *env, int mmu_idx,
                                              target_ulong page)
{
    int k;

    assert_cpu_is_self(ENV_GET_CPU(env));
    for (k = 0; k < CPU_VTLB_SIZE; k++) {
        if (tlb_flush_entry_locked(&env->tlb_v_table[mmu_idx][k], page)) {
            tlb_n_used_entries_dec(env, mmu_idx);
        }
    }
}

static void tlb_flush_page_locked(CPUArchState *env, int midx,
                                  target_ulong page)
{
    target_ulong lp_addr = env->tlb_d[midx].large_page_addr;
    target_ulong lp_mask = env->tlb_d[midx].large_page_mask;

    /* Check if we need to flush due to large pages.  */
    if ((page & lp_mask) == lp_addr) {
        tlb_debug("forcing full flush midx %d ("
                  TARGET_FMT_lx "/" TARGET_FMT_lx ")\n",
                  midx, lp_addr, lp_mask);
        tlb_flush_one_mmuidx_locked(env, midx);
    } else {
        if (tlb_flush_entry_locked(tlb_entry(env, midx, page), page)) {
            tlb_n_used_entries_dec(env, midx);
        }
        tlb_flush_vtlb_page_locked(env, midx, page);
    }
}

/* Since we are going to hijack the bottom bits of the page address for a
 * mmuidx bit mask, the build must fail if that is not possible.
 */
QEMU_BUILD_BUG_ON(NB_MMU_MODES > TARGET_PAGE_BITS_MIN);

static void tlb_flush_page_by_mmuidx_async_work(CPUState *cpu,
                                                run_on_cpu_data data)
{
    CPUArchState *env = cpu->env_ptr;
    target_ulong addr_and_mmuidx = (target_ulong) data.target_ptr;
    target_ulong addr = addr_and_mmuidx & TARGET_PAGE_MASK;
    unsigned long mmu_idx_bitmap = addr_and_mmuidx & ALL_MMUIDX_BITS;
    int mmu_idx;

    assert_cpu_is_self(cpu);

    tlb_debug("page addr:" TARGET_FMT_lx " mmu_map:0x%lx\n",
              addr, mmu_idx_bitmap);

    qemu_spin_lock(&env->tlb_c.lock);
    for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
        if (test_bit(mmu_idx, &mmu_idx_bitmap)) {
            tlb_flush_page_locked(env, mmu_idx, addr);
        }
    }
    qemu_spin_unlock(&env->tlb_c.lock);

    tb_flush_jmp_cache(cpu, addr);
}

void tlb_flush_page_by_mmuidx(CPUState *cpu, target_ulong addr, uint16_t idxmap)
{
    target_ulong addr_and_mmu_idx;

    tlb_debug("addr: "TARGET_FMT_lx" mmu_idx:%" PRIx16 "\n", addr, idxmap);

    /* This should already be page aligned */
    addr_and_mmu_idx = addr & TARGET_PAGE_MASK;
    addr_and_mmu_idx |= idxmap;

    if (!qemu_cpu_is_self(cpu)) {
        async_run_on_cpu(cpu, tlb_flush_page_by_mmuidx_async_work,
                         RUN_ON_CPU_TARGET_PTR(addr_and_mmu_idx));
    } else {
        tlb_flush_page_by_mmuidx_async_work(
            cpu, RUN_ON_CPU_TARGET_PTR(addr_and_mmu_idx));
    }
}

void tlb_flush_page(CPUState *cpu, target_ulong addr)
{
    tlb_flush_page_by_mmuidx(cpu, addr, ALL_MMUIDX_BITS);
}

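/*
 * As a usage sketch (with made-up index names, not real QEMU identifiers):
 * a target with separate kernel and user MMU modes could drop one page from
 * both at once with
 *
 *     tlb_flush_page_by_mmuidx(cs, addr,
 *                              (1 << MMU_KERNEL_IDX) | (1 << MMU_USER_IDX));
 */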
void tlb_flush_page_by_mmuidx_all_cpus(CPUState *src_cpu, target_ulong addr,
                                       uint16_t idxmap)
{
    const run_on_cpu_func fn = tlb_flush_page_by_mmuidx_async_work;
    target_ulong addr_and_mmu_idx;

    tlb_debug("addr: "TARGET_FMT_lx" mmu_idx:%"PRIx16"\n", addr, idxmap);

    /* This should already be page aligned */
    addr_and_mmu_idx = addr & TARGET_PAGE_MASK;
    addr_and_mmu_idx |= idxmap;

    flush_all_helper(src_cpu, fn, RUN_ON_CPU_TARGET_PTR(addr_and_mmu_idx));
    fn(src_cpu, RUN_ON_CPU_TARGET_PTR(addr_and_mmu_idx));
}

void tlb_flush_page_all_cpus(CPUState *src, target_ulong addr)
{
    tlb_flush_page_by_mmuidx_all_cpus(src, addr, ALL_MMUIDX_BITS);
}

void tlb_flush_page_by_mmuidx_all_cpus_synced(CPUState *src_cpu,
                                              target_ulong addr,
                                              uint16_t idxmap)
{
    const run_on_cpu_func fn = tlb_flush_page_by_mmuidx_async_work;
    target_ulong addr_and_mmu_idx;

    tlb_debug("addr: "TARGET_FMT_lx" mmu_idx:%"PRIx16"\n", addr, idxmap);

    /* This should already be page aligned */
    addr_and_mmu_idx = addr & TARGET_PAGE_MASK;
    addr_and_mmu_idx |= idxmap;

    flush_all_helper(src_cpu, fn, RUN_ON_CPU_TARGET_PTR(addr_and_mmu_idx));
    async_safe_run_on_cpu(src_cpu, fn, RUN_ON_CPU_TARGET_PTR(addr_and_mmu_idx));
}

void tlb_flush_page_all_cpus_synced(CPUState *src, target_ulong addr)
{
    tlb_flush_page_by_mmuidx_all_cpus_synced(src, addr, ALL_MMUIDX_BITS);
}

/* update the TLBs so that writes to code in the virtual page 'addr'
   can be detected */
void tlb_protect_code(ram_addr_t ram_addr)
{
    cpu_physical_memory_test_and_clear_dirty(ram_addr, TARGET_PAGE_SIZE,
                                             DIRTY_MEMORY_CODE);
}

/* update the TLB so that writes in physical page 'ram_addr' are no longer
   tested for self-modifying code */
void tlb_unprotect_code(ram_addr_t ram_addr)
{
    cpu_physical_memory_set_dirty_flag(ram_addr, DIRTY_MEMORY_CODE);
}


/*
 * Dirty write flag handling
 *
 * When the TCG code writes to a location it looks up the address in
 * the TLB and uses that data to compute the final address. If any of
 * the lower bits of the address are set then the slow path is forced.
 * There are a number of reasons to do this but for normal RAM the
 * most usual is detecting writes to code regions which may invalidate
 * generated code.
 *
 * Other vCPUs might be reading their TLBs during guest execution, so we update
 * te->addr_write with atomic_set. We don't need to worry about this for
 * oversized guests as MTTCG is disabled for them.
 *
 * Called with tlb_c.lock held.
 */
static void tlb_reset_dirty_range_locked(CPUTLBEntry *tlb_entry,
                                         uintptr_t start, uintptr_t length)
{
    uintptr_t addr = tlb_entry->addr_write;

    if ((addr & (TLB_INVALID_MASK | TLB_MMIO | TLB_NOTDIRTY)) == 0) {
        addr &= TARGET_PAGE_MASK;
        addr += tlb_entry->addend;
        if ((addr - start) < length) {
#if TCG_OVERSIZED_GUEST
            tlb_entry->addr_write |= TLB_NOTDIRTY;
#else
            atomic_set(&tlb_entry->addr_write,
                       tlb_entry->addr_write | TLB_NOTDIRTY);
#endif
        }
    }
}

/*
 * Called with tlb_c.lock held.
 * Called only from the vCPU context, i.e. the TLB's owner thread.
 */
static inline void copy_tlb_helper_locked(CPUTLBEntry *d, const CPUTLBEntry *s)
{
    *d = *s;
}

/* This is a cross vCPU call (i.e. another vCPU resetting the flags of
 * the target vCPU).
 * We must take tlb_c.lock to avoid racing with another vCPU update. The only
 * thing actually updated is the target TLB entry ->addr_write flags.
 */
void tlb_reset_dirty(CPUState *cpu, ram_addr_t start1, ram_addr_t length)
{
    CPUArchState *env;

    int mmu_idx;

    env = cpu->env_ptr;
    qemu_spin_lock(&env->tlb_c.lock);
    for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
        unsigned int i;
        unsigned int n = tlb_n_entries(env, mmu_idx);

        for (i = 0; i < n; i++) {
            tlb_reset_dirty_range_locked(&env->tlb_table[mmu_idx][i], start1,
                                         length);
        }

        for (i = 0; i < CPU_VTLB_SIZE; i++) {
            tlb_reset_dirty_range_locked(&env->tlb_v_table[mmu_idx][i], start1,
                                         length);
        }
    }
    qemu_spin_unlock(&env->tlb_c.lock);
}

/* Called with tlb_c.lock held */
static inline void tlb_set_dirty1_locked(CPUTLBEntry *tlb_entry,
                                         target_ulong vaddr)
{
    if (tlb_entry->addr_write == (vaddr | TLB_NOTDIRTY)) {
        tlb_entry->addr_write = vaddr;
    }
}

/* update the TLB corresponding to virtual page vaddr
   so that it is no longer dirty */
void tlb_set_dirty(CPUState *cpu, target_ulong vaddr)
{
    CPUArchState *env = cpu->env_ptr;
    int mmu_idx;

    assert_cpu_is_self(cpu);

    vaddr &= TARGET_PAGE_MASK;
    qemu_spin_lock(&env->tlb_c.lock);
    for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
        tlb_set_dirty1_locked(tlb_entry(env, mmu_idx, vaddr), vaddr);
    }

    for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
        int k;
        for (k = 0; k < CPU_VTLB_SIZE; k++) {
            tlb_set_dirty1_locked(&env->tlb_v_table[mmu_idx][k], vaddr);
        }
    }
    qemu_spin_unlock(&env->tlb_c.lock);
}

/* Our TLB does not support large pages, so remember the area covered by
   large pages and trigger a full TLB flush if these are invalidated.  */
static void tlb_add_large_page(CPUArchState *env, int mmu_idx,
                               target_ulong vaddr, target_ulong size)
{
    target_ulong lp_addr = env->tlb_d[mmu_idx].large_page_addr;
    target_ulong lp_mask = ~(size - 1);

    if (lp_addr == (target_ulong)-1) {
        /* No previous large page.  */
        lp_addr = vaddr;
    } else {
        /* Extend the existing region to include the new page.
           This is a compromise between unnecessary flushes and
           the cost of maintaining a full variable size TLB.  */
        lp_mask &= env->tlb_d[mmu_idx].large_page_mask;
        while (((lp_addr ^ vaddr) & lp_mask) != 0) {
            lp_mask <<= 1;
        }
    }
    env->tlb_d[mmu_idx].large_page_addr = lp_addr & lp_mask;
    env->tlb_d[mmu_idx].large_page_mask = lp_mask;
}

/* Add a new TLB entry. At most one entry for a given virtual address
 * is permitted. Only a single TARGET_PAGE_SIZE region is mapped; the
 * supplied size is only used by tlb_flush_page.
 *
 * Called from TCG-generated code, which is under an RCU read-side
 * critical section.
 */
void tlb_set_page_with_attrs(CPUState *cpu, target_ulong vaddr,
                             hwaddr paddr, MemTxAttrs attrs, int prot,
                             int mmu_idx, target_ulong size)
{
    CPUArchState *env = cpu->env_ptr;
    MemoryRegionSection *section;
    unsigned int index;
    target_ulong address;
    target_ulong code_address;
    uintptr_t addend;
    CPUTLBEntry *te, tn;
    hwaddr iotlb, xlat, sz, paddr_page;
    target_ulong vaddr_page;
    int asidx = cpu_asidx_from_attrs(cpu, attrs);

    assert_cpu_is_self(cpu);

    if (size <= TARGET_PAGE_SIZE) {
        sz = TARGET_PAGE_SIZE;
    } else {
        tlb_add_large_page(env, mmu_idx, vaddr, size);
        sz = size;
    }
    vaddr_page = vaddr & TARGET_PAGE_MASK;
    paddr_page = paddr & TARGET_PAGE_MASK;

    section = address_space_translate_for_iotlb(cpu, asidx, paddr_page,
                                                &xlat, &sz, attrs, &prot);
    assert(sz >= TARGET_PAGE_SIZE);

    tlb_debug("vaddr=" TARGET_FMT_lx " paddr=0x" TARGET_FMT_plx
              " prot=%x idx=%d\n",
              vaddr, paddr, prot, mmu_idx);

    address = vaddr_page;
    if (size < TARGET_PAGE_SIZE) {
        /*
         * Slow-path the TLB entries; we will repeat the MMU check and TLB
         * fill on every access.
         */
        address |= TLB_RECHECK;
    }
    if (!memory_region_is_ram(section->mr) &&
        !memory_region_is_romd(section->mr)) {
        /* IO memory case */
        address |= TLB_MMIO;
        addend = 0;
    } else {
        /* TLB_MMIO for rom/romd handled below */
        addend = (uintptr_t)memory_region_get_ram_ptr(section->mr) + xlat;
    }

    code_address = address;
    iotlb = memory_region_section_get_iotlb(cpu, section, vaddr_page,
                                            paddr_page, xlat, prot, &address);

    index = tlb_index(env, mmu_idx, vaddr_page);
    te = tlb_entry(env, mmu_idx, vaddr_page);

    /*
     * Hold the TLB lock for the rest of the function. We could acquire/release
     * the lock several times in the function, but it is faster to amortize the
     * acquisition cost by acquiring it just once. Note that this leads to
     * a longer critical section, but this is not a concern since the TLB lock
     * is unlikely to be contended.
     */
    qemu_spin_lock(&env->tlb_c.lock);

    /* Note that the tlb is no longer clean.  */
    env->tlb_c.dirty |= 1 << mmu_idx;

    /* Make sure there's no cached translation for the new page.  */
    tlb_flush_vtlb_page_locked(env, mmu_idx, vaddr_page);

    /*
     * Only evict the old entry to the victim tlb if it's for a
     * different page; otherwise just overwrite the stale data.
     */
    if (!tlb_hit_page_anyprot(te, vaddr_page) && !tlb_entry_is_empty(te)) {
        unsigned vidx = env->tlb_d[mmu_idx].vindex++ % CPU_VTLB_SIZE;
        CPUTLBEntry *tv = &env->tlb_v_table[mmu_idx][vidx];

        /* Evict the old entry into the victim tlb.  */
        copy_tlb_helper_locked(tv, te);
        env->iotlb_v[mmu_idx][vidx] = env->iotlb[mmu_idx][index];
        tlb_n_used_entries_dec(env, mmu_idx);
    }

    /* refill the tlb */
    /*
     * At this point iotlb contains a physical section number in the lower
     * TARGET_PAGE_BITS, and either
     *  + the ram_addr_t of the page base of the target RAM (if NOTDIRTY or ROM)
     *  + the offset within section->mr of the page base (otherwise)
     * We subtract the vaddr_page (which is page aligned and thus won't
     * disturb the low bits) to give an offset which can be added to the
     * (non-page-aligned) vaddr of the eventual memory access to get
     * the MemoryRegion offset for the access. Note that the vaddr we
     * subtract here is that of the page base, and not the same as the
     * vaddr we add back in io_readx()/io_writex()/get_page_addr_code().
     */
    env->iotlb[mmu_idx][index].addr = iotlb - vaddr_page;
    env->iotlb[mmu_idx][index].attrs = attrs;

    /* Now calculate the new entry */
    tn.addend = addend - vaddr_page;
    if (prot & PAGE_READ) {
        tn.addr_read = address;
    } else {
        tn.addr_read = -1;
    }

    if (prot & PAGE_EXEC) {
        tn.addr_code = code_address;
    } else {
        tn.addr_code = -1;
    }

    tn.addr_write = -1;
    if (prot & PAGE_WRITE) {
        if ((memory_region_is_ram(section->mr) && section->readonly)
            || memory_region_is_romd(section->mr)) {
            /* Write access calls the I/O callback.  */
            tn.addr_write = address | TLB_MMIO;
        } else if (memory_region_is_ram(section->mr)
                   && cpu_physical_memory_is_clean(
                       memory_region_get_ram_addr(section->mr) + xlat)) {
            tn.addr_write = address | TLB_NOTDIRTY;
        } else {
            tn.addr_write = address;
        }
        if (prot & PAGE_WRITE_INV) {
            tn.addr_write |= TLB_INVALID_MASK;
        }
    }

    copy_tlb_helper_locked(te, &tn);
    tlb_n_used_entries_inc(env, mmu_idx);
    qemu_spin_unlock(&env->tlb_c.lock);
}

/* Add a new TLB entry, but without specifying the memory
 * transaction attributes to be used.
 */
void tlb_set_page(CPUState *cpu, target_ulong vaddr,
                  hwaddr paddr, int prot,
                  int mmu_idx, target_ulong size)
{
    tlb_set_page_with_attrs(cpu, vaddr, paddr, MEMTXATTRS_UNSPECIFIED,
                            prot, mmu_idx, size);
}

static inline ram_addr_t qemu_ram_addr_from_host_nofail(void *ptr)
{
    ram_addr_t ram_addr;

    ram_addr = qemu_ram_addr_from_host(ptr);
    if (ram_addr == RAM_ADDR_INVALID) {
        error_report("Bad ram pointer %p", ptr);
        abort();
    }
    return ram_addr;
}

static uint64_t io_readx(CPUArchState *env, CPUIOTLBEntry *iotlbentry,
                         int mmu_idx,
                         target_ulong addr, uintptr_t retaddr,
                         bool recheck, MMUAccessType access_type, int size)
{
    CPUState *cpu = ENV_GET_CPU(env);
    hwaddr mr_offset;
    MemoryRegionSection *section;
    MemoryRegion *mr;
    uint64_t val;
    bool locked = false;
    MemTxResult r;

    if (recheck) {
        /*
         * This is a TLB_RECHECK access, where the MMU protection
         * covers a smaller range than a target page, and we must
         * repeat the MMU check here. This tlb_fill() call might
         * longjump out if this access should cause a guest exception.
         */
        CPUTLBEntry *entry;
        target_ulong tlb_addr;

        tlb_fill(cpu, addr, size, MMU_DATA_LOAD, mmu_idx, retaddr);

        entry = tlb_entry(env, mmu_idx, addr);
        tlb_addr = entry->addr_read;
        if (!(tlb_addr & ~(TARGET_PAGE_MASK | TLB_RECHECK))) {
            /* RAM access */
            uintptr_t haddr = addr + entry->addend;

            return ldn_p((void *)haddr, size);
        }
        /* Fall through for handling IO accesses */
    }

    section = iotlb_to_section(cpu, iotlbentry->addr, iotlbentry->attrs);
    mr = section->mr;
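    /*
     * iotlbentry->addr was stored as (iotlb - vaddr_page) by
     * tlb_set_page_with_attrs(), so adding the access vaddr back yields
     * the offset within mr; see the long comment there.
     */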
    mr_offset = (iotlbentry->addr & TARGET_PAGE_MASK) + addr;
    cpu->mem_io_pc = retaddr;
    if (mr != &io_mem_rom && mr != &io_mem_notdirty && !cpu->can_do_io) {
        cpu_io_recompile(cpu, retaddr);
    }

    cpu->mem_io_vaddr = addr;
    cpu->mem_io_access_type = access_type;

    if (mr->global_locking && !qemu_mutex_iothread_locked()) {
        qemu_mutex_lock_iothread();
        locked = true;
    }
    r = memory_region_dispatch_read(mr, mr_offset,
                                    &val, size, iotlbentry->attrs);
    if (r != MEMTX_OK) {
        hwaddr physaddr = mr_offset +
            section->offset_within_address_space -
            section->offset_within_region;

        cpu_transaction_failed(cpu, physaddr, addr, size, access_type,
                               mmu_idx, iotlbentry->attrs, r, retaddr);
    }
    if (locked) {
        qemu_mutex_unlock_iothread();
    }

    return val;
}

static void io_writex(CPUArchState *env, CPUIOTLBEntry *iotlbentry,
                      int mmu_idx,
                      uint64_t val, target_ulong addr,
                      uintptr_t retaddr, bool recheck, int size)
{
    CPUState *cpu = ENV_GET_CPU(env);
    hwaddr mr_offset;
    MemoryRegionSection *section;
    MemoryRegion *mr;
    bool locked = false;
    MemTxResult r;

    if (recheck) {
        /*
         * This is a TLB_RECHECK access, where the MMU protection
         * covers a smaller range than a target page, and we must
         * repeat the MMU check here. This tlb_fill() call might
         * longjump out if this access should cause a guest exception.
         */
        CPUTLBEntry *entry;
        target_ulong tlb_addr;

        tlb_fill(cpu, addr, size, MMU_DATA_STORE, mmu_idx, retaddr);

        entry = tlb_entry(env, mmu_idx, addr);
        tlb_addr = tlb_addr_write(entry);
        if (!(tlb_addr & ~(TARGET_PAGE_MASK | TLB_RECHECK))) {
            /* RAM access */
            uintptr_t haddr = addr + entry->addend;

            stn_p((void *)haddr, size, val);
            return;
        }
        /* Fall through for handling IO accesses */
    }

    section = iotlb_to_section(cpu, iotlbentry->addr, iotlbentry->attrs);
    mr = section->mr;
    mr_offset = (iotlbentry->addr & TARGET_PAGE_MASK) + addr;
    if (mr != &io_mem_rom && mr != &io_mem_notdirty && !cpu->can_do_io) {
        cpu_io_recompile(cpu, retaddr);
    }
    cpu->mem_io_vaddr = addr;
    cpu->mem_io_pc = retaddr;

    if (mr->global_locking && !qemu_mutex_iothread_locked()) {
        qemu_mutex_lock_iothread();
        locked = true;
    }
    r = memory_region_dispatch_write(mr, mr_offset,
                                     val, size, iotlbentry->attrs);
    if (r != MEMTX_OK) {
        hwaddr physaddr = mr_offset +
            section->offset_within_address_space -
            section->offset_within_region;

        cpu_transaction_failed(cpu, physaddr, addr, size, MMU_DATA_STORE,
                               mmu_idx, iotlbentry->attrs, r, retaddr);
    }
    if (locked) {
        qemu_mutex_unlock_iothread();
    }
}

990d9bb58e5SYang Zhong /* Return true if ADDR is present in the victim tlb; if so, the entry has
991d9bb58e5SYang Zhong    been copied back to the main tlb.  */
992d9bb58e5SYang Zhong static bool victim_tlb_hit(CPUArchState *env, size_t mmu_idx, size_t index,
993d9bb58e5SYang Zhong                            size_t elt_ofs, target_ulong page)
994d9bb58e5SYang Zhong {
995d9bb58e5SYang Zhong     size_t vidx;
99671aec354SEmilio G. Cota 
99771aec354SEmilio G. Cota     assert_cpu_is_self(ENV_GET_CPU(env));
998d9bb58e5SYang Zhong     for (vidx = 0; vidx < CPU_VTLB_SIZE; ++vidx) {
999d9bb58e5SYang Zhong         CPUTLBEntry *vtlb = &env->tlb_v_table[mmu_idx][vidx];
1000403f290cSEmilio G. Cota         target_ulong cmp;
1001403f290cSEmilio G. Cota 
1002403f290cSEmilio G. Cota         /* elt_ofs might correspond to .addr_write, so use atomic_read */
1003403f290cSEmilio G. Cota #if TCG_OVERSIZED_GUEST
1004403f290cSEmilio G. Cota         cmp = *(target_ulong *)((uintptr_t)vtlb + elt_ofs);
1005403f290cSEmilio G. Cota #else
1006403f290cSEmilio G. Cota         cmp = atomic_read((target_ulong *)((uintptr_t)vtlb + elt_ofs));
1007403f290cSEmilio G. Cota #endif
1008d9bb58e5SYang Zhong 
1009d9bb58e5SYang Zhong         if (cmp == page) {
1010d9bb58e5SYang Zhong             /* Found entry in victim tlb, swap tlb and iotlb.  */
1011d9bb58e5SYang Zhong             CPUTLBEntry tmptlb, *tlb = &env->tlb_table[mmu_idx][index];
1012d9bb58e5SYang Zhong 
101353d28455SRichard Henderson             qemu_spin_lock(&env->tlb_c.lock);
101471aec354SEmilio G. Cota             copy_tlb_helper_locked(&tmptlb, tlb);
101571aec354SEmilio G. Cota             copy_tlb_helper_locked(tlb, vtlb);
101671aec354SEmilio G. Cota             copy_tlb_helper_locked(vtlb, &tmptlb);
101753d28455SRichard Henderson             qemu_spin_unlock(&env->tlb_c.lock);
1018d9bb58e5SYang Zhong 
1019d9bb58e5SYang Zhong             CPUIOTLBEntry tmpio, *io = &env->iotlb[mmu_idx][index];
1020d9bb58e5SYang Zhong             CPUIOTLBEntry *vio = &env->iotlb_v[mmu_idx][vidx];
1021d9bb58e5SYang Zhong             tmpio = *io; *io = *vio; *vio = tmpio;
1022d9bb58e5SYang Zhong             return true;
1023d9bb58e5SYang Zhong         }
1024d9bb58e5SYang Zhong     }
1025d9bb58e5SYang Zhong     return false;
1026d9bb58e5SYang Zhong }
1027d9bb58e5SYang Zhong 
1028d9bb58e5SYang Zhong /* Macro to call the above, with local variables from the use context.  */
1029d9bb58e5SYang Zhong #define VICTIM_TLB_HIT(TY, ADDR) \
1030d9bb58e5SYang Zhong   victim_tlb_hit(env, mmu_idx, index, offsetof(CPUTLBEntry, TY), \
1031d9bb58e5SYang Zhong                  (ADDR) & TARGET_PAGE_MASK)
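/* Illustrative expansion, relying on 'env', 'mmu_idx' and 'index' being in
 * scope at the call site (as they are in the helpers below):
 *
 *   VICTIM_TLB_HIT(addr_write, addr)
 * becomes
 *   victim_tlb_hit(env, mmu_idx, index,
 *                  offsetof(CPUTLBEntry, addr_write),
 *                  (addr) & TARGET_PAGE_MASK)
 */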
1032d9bb58e5SYang Zhong 
1033f2553f04SKONRAD Frederic /* NOTE: this function can trigger an exception */
1034f2553f04SKONRAD Frederic /* NOTE2: the returned address is not exactly the physical address: it
1035f2553f04SKONRAD Frederic  * is actually a ram_addr_t (in system mode; the user mode emulation
1036f2553f04SKONRAD Frederic  * version of this function returns a guest virtual address).
1037f2553f04SKONRAD Frederic  */
1038f2553f04SKONRAD Frederic tb_page_addr_t get_page_addr_code(CPUArchState *env, target_ulong addr)
1039f2553f04SKONRAD Frederic {
1040383beda9SRichard Henderson     uintptr_t mmu_idx = cpu_mmu_index(env, true);
1041383beda9SRichard Henderson     uintptr_t index = tlb_index(env, mmu_idx, addr);
1042383beda9SRichard Henderson     CPUTLBEntry *entry = tlb_entry(env, mmu_idx, addr);
1043f2553f04SKONRAD Frederic     void *p;
1044f2553f04SKONRAD Frederic 
1045383beda9SRichard Henderson     if (unlikely(!tlb_hit(entry->addr_code, addr))) {
1046b493ccf1SPeter Maydell         if (!VICTIM_TLB_HIT(addr_code, addr)) {
104798670d47SLaurent Vivier             tlb_fill(ENV_GET_CPU(env), addr, 0, MMU_INST_FETCH, mmu_idx, 0);
104871b9a453SKONRAD Frederic         }
1049383beda9SRichard Henderson         assert(tlb_hit(entry->addr_code, addr));
1050f2553f04SKONRAD Frederic     }
105155df6fcfSPeter Maydell 
1052383beda9SRichard Henderson     if (unlikely(entry->addr_code & (TLB_RECHECK | TLB_MMIO))) {
105355df6fcfSPeter Maydell         /*
105455a7cb14SPeter Maydell          * Return -1 if we can't translate and execute from an entire
105555a7cb14SPeter Maydell          * page of RAM here, which will cause us to execute by loading
105655a7cb14SPeter Maydell          * and translating one insn at a time, without caching:
105755a7cb14SPeter Maydell          *  - TLB_RECHECK: means the MMU protection covers a smaller range
105855a7cb14SPeter Maydell          *    than a target page, so we must redo the MMU check every insn
105955a7cb14SPeter Maydell          *  - TLB_MMIO: region is not backed by RAM
106055df6fcfSPeter Maydell          */
106120cb6ae4SPeter Maydell         return -1;
106255df6fcfSPeter Maydell     }
106355df6fcfSPeter Maydell 
1064383beda9SRichard Henderson     p = (void *)((uintptr_t)addr + entry->addend);
1065f2553f04SKONRAD Frederic     return qemu_ram_addr_from_host_nofail(p);
1066f2553f04SKONRAD Frederic }
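/* Illustrative (hypothetical) caller pattern: probe the code page and fall
 * back to uncached, insn-at-a-time execution when -1 is returned:
 *
 *   tb_page_addr_t phys_pc = get_page_addr_code(env, pc);
 *   if (phys_pc == -1) {
 *       ... build an uncached, single-insn TB ...
 *   }
 */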
1067f2553f04SKONRAD Frederic 
1068d9bb58e5SYang Zhong /* Probe for whether the specified guest write access is permitted.
1069d9bb58e5SYang Zhong  * If it is not permitted then an exception will be taken in the same
1070d9bb58e5SYang Zhong  * way as if this were a real write access (and we will not return).
1071d9bb58e5SYang Zhong  * Otherwise the function will return, and there will be a valid
1072d9bb58e5SYang Zhong  * entry in the TLB for this access.
1073d9bb58e5SYang Zhong  */
107498670d47SLaurent Vivier void probe_write(CPUArchState *env, target_ulong addr, int size, int mmu_idx,
1075d9bb58e5SYang Zhong                  uintptr_t retaddr)
1076d9bb58e5SYang Zhong {
1077383beda9SRichard Henderson     uintptr_t index = tlb_index(env, mmu_idx, addr);
1078383beda9SRichard Henderson     CPUTLBEntry *entry = tlb_entry(env, mmu_idx, addr);
1079d9bb58e5SYang Zhong 
1080403f290cSEmilio G. Cota     if (!tlb_hit(tlb_addr_write(entry), addr)) {
1081d9bb58e5SYang Zhong         /* TLB entry is for a different page */
1082d9bb58e5SYang Zhong         if (!VICTIM_TLB_HIT(addr_write, addr)) {
108398670d47SLaurent Vivier             tlb_fill(ENV_GET_CPU(env), addr, size, MMU_DATA_STORE,
108498670d47SLaurent Vivier                      mmu_idx, retaddr);
1085d9bb58e5SYang Zhong         }
1086d9bb58e5SYang Zhong     }
1087d9bb58e5SYang Zhong }
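/* Sketch of a typical use from a target helper (hypothetical call site):
 * probe the whole destination first, so that any fault is raised before
 * partial state has been committed:
 *
 *   probe_write(env, addr, 8, cpu_mmu_index(env, false), GETPC());
 */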
1088d9bb58e5SYang Zhong 
1089d9bb58e5SYang Zhong /* Probe for a read-modify-write atomic operation.  Do not allow unaligned
1090d9bb58e5SYang Zhong  * operations or I/O operations to proceed.  Return the host address.  */
1091d9bb58e5SYang Zhong static void *atomic_mmu_lookup(CPUArchState *env, target_ulong addr,
109234d49937SPeter Maydell                                TCGMemOpIdx oi, uintptr_t retaddr,
109334d49937SPeter Maydell                                NotDirtyInfo *ndi)
1094d9bb58e5SYang Zhong {
1095d9bb58e5SYang Zhong     size_t mmu_idx = get_mmuidx(oi);
1096383beda9SRichard Henderson     uintptr_t index = tlb_index(env, mmu_idx, addr);
1097383beda9SRichard Henderson     CPUTLBEntry *tlbe = tlb_entry(env, mmu_idx, addr);
1098403f290cSEmilio G. Cota     target_ulong tlb_addr = tlb_addr_write(tlbe);
1099d9bb58e5SYang Zhong     TCGMemOp mop = get_memop(oi);
1100d9bb58e5SYang Zhong     int a_bits = get_alignment_bits(mop);
1101d9bb58e5SYang Zhong     int s_bits = mop & MO_SIZE;
110234d49937SPeter Maydell     void *hostaddr;
1103d9bb58e5SYang Zhong 
1104d9bb58e5SYang Zhong     /* Adjust the given return address.  */
1105d9bb58e5SYang Zhong     retaddr -= GETPC_ADJ;
1106d9bb58e5SYang Zhong 
1107d9bb58e5SYang Zhong     /* Enforce guest required alignment.  */
1108d9bb58e5SYang Zhong     if (unlikely(a_bits > 0 && (addr & ((1 << a_bits) - 1)))) {
1109d9bb58e5SYang Zhong         /* ??? Maybe indicate atomic op to cpu_unaligned_access */
1110d9bb58e5SYang Zhong         cpu_unaligned_access(ENV_GET_CPU(env), addr, MMU_DATA_STORE,
1111d9bb58e5SYang Zhong                              mmu_idx, retaddr);
1112d9bb58e5SYang Zhong     }
1113d9bb58e5SYang Zhong 
1114d9bb58e5SYang Zhong     /* Enforce qemu required alignment.  */
1115d9bb58e5SYang Zhong     if (unlikely(addr & ((1 << s_bits) - 1))) {
1116d9bb58e5SYang Zhong         /* We get here if guest alignment was not requested,
1117d9bb58e5SYang Zhong            or was not enforced by cpu_unaligned_access above.
1118d9bb58e5SYang Zhong            We might widen the access and emulate, but for now
1119d9bb58e5SYang Zhong            mark an exception and exit the cpu loop.  */
1120d9bb58e5SYang Zhong         goto stop_the_world;
1121d9bb58e5SYang Zhong     }
1122d9bb58e5SYang Zhong 
1123d9bb58e5SYang Zhong     /* Check TLB entry and enforce page permissions.  */
1124334692bcSPeter Maydell     if (!tlb_hit(tlb_addr, addr)) {
1125d9bb58e5SYang Zhong         if (!VICTIM_TLB_HIT(addr_write, addr)) {
112698670d47SLaurent Vivier             tlb_fill(ENV_GET_CPU(env), addr, 1 << s_bits, MMU_DATA_STORE,
112798670d47SLaurent Vivier                      mmu_idx, retaddr);
1128d9bb58e5SYang Zhong         }
1129403f290cSEmilio G. Cota         tlb_addr = tlb_addr_write(tlbe) & ~TLB_INVALID_MASK;
1130d9bb58e5SYang Zhong     }
1131d9bb58e5SYang Zhong 
113255df6fcfSPeter Maydell     /* Notice an IO access or a needs-MMU-lookup access */
113355df6fcfSPeter Maydell     if (unlikely(tlb_addr & (TLB_MMIO | TLB_RECHECK))) {
1134d9bb58e5SYang Zhong         /* There's really nothing that can be done to
1135d9bb58e5SYang Zhong            support this apart from stop-the-world.  */
1136d9bb58e5SYang Zhong         goto stop_the_world;
1137d9bb58e5SYang Zhong     }
1138d9bb58e5SYang Zhong 
1139d9bb58e5SYang Zhong     /* Let the guest notice RMW on a write-only page.  */
114034d49937SPeter Maydell     if (unlikely(tlbe->addr_read != (tlb_addr & ~TLB_NOTDIRTY))) {
114198670d47SLaurent Vivier         tlb_fill(ENV_GET_CPU(env), addr, 1 << s_bits, MMU_DATA_LOAD,
114298670d47SLaurent Vivier                  mmu_idx, retaddr);
1143d9bb58e5SYang Zhong         /* Since we don't support reads and writes to different addresses,
1144d9bb58e5SYang Zhong            and we do have the proper page loaded for write, this shouldn't
1145d9bb58e5SYang Zhong            ever return.  But just in case, handle via stop-the-world.  */
1146d9bb58e5SYang Zhong         goto stop_the_world;
1147d9bb58e5SYang Zhong     }
1148d9bb58e5SYang Zhong 
114934d49937SPeter Maydell     hostaddr = (void *)((uintptr_t)addr + tlbe->addend);
115034d49937SPeter Maydell 
115134d49937SPeter Maydell     ndi->active = false;
115234d49937SPeter Maydell     if (unlikely(tlb_addr & TLB_NOTDIRTY)) {
115334d49937SPeter Maydell         ndi->active = true;
115434d49937SPeter Maydell         memory_notdirty_write_prepare(ndi, ENV_GET_CPU(env), addr,
115534d49937SPeter Maydell                                       qemu_ram_addr_from_host_nofail(hostaddr),
115634d49937SPeter Maydell                                       1 << s_bits);
115734d49937SPeter Maydell     }
115834d49937SPeter Maydell 
115934d49937SPeter Maydell     return hostaddr;
1160d9bb58e5SYang Zhong 
1161d9bb58e5SYang Zhong  stop_the_world:
1162d9bb58e5SYang Zhong     cpu_loop_exit_atomic(ENV_GET_CPU(env), retaddr);
1163d9bb58e5SYang Zhong }
1164d9bb58e5SYang Zhong 
1165d9bb58e5SYang Zhong #ifdef TARGET_WORDS_BIGENDIAN
1166d9bb58e5SYang Zhong # define TGT_BE(X)  (X)
1167d9bb58e5SYang Zhong # define TGT_LE(X)  BSWAP(X)
1168d9bb58e5SYang Zhong #else
1169d9bb58e5SYang Zhong # define TGT_BE(X)  BSWAP(X)
1170d9bb58e5SYang Zhong # define TGT_LE(X)  (X)
1171d9bb58e5SYang Zhong #endif
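/* E.g. for a big-endian target TGT_BE(X) is the identity and TGT_LE(X)
 * byte-swaps, and vice versa for a little-endian target, so a value in the
 * target's native order can be reinterpreted in either explicit endianness.
 */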
1172d9bb58e5SYang Zhong 
1173d9bb58e5SYang Zhong #define MMUSUFFIX _mmu
1174d9bb58e5SYang Zhong 
1175d9bb58e5SYang Zhong #define DATA_SIZE 1
1176d9bb58e5SYang Zhong #include "softmmu_template.h"
1177d9bb58e5SYang Zhong 
1178d9bb58e5SYang Zhong #define DATA_SIZE 2
1179d9bb58e5SYang Zhong #include "softmmu_template.h"
1180d9bb58e5SYang Zhong 
1181d9bb58e5SYang Zhong #define DATA_SIZE 4
1182d9bb58e5SYang Zhong #include "softmmu_template.h"
1183d9bb58e5SYang Zhong 
1184d9bb58e5SYang Zhong #define DATA_SIZE 8
1185d9bb58e5SYang Zhong #include "softmmu_template.h"
1186d9bb58e5SYang Zhong 
1187d9bb58e5SYang Zhong /* The first set of helpers allows OI and RETADDR to be passed in, which
1188d9bb58e5SYang Zhong    makes them callable from other helpers.  */
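/* For example (illustrative, not exhaustive): with DATA_SIZE 4 the atomic
 * template generates an entry point roughly of the form
 *
 *   uint32_t helper_atomic_cmpxchgl_le_mmu(CPUArchState *env,
 *                                          target_ulong addr,
 *                                          uint32_t cmpv, uint32_t newv,
 *                                          TCGMemOpIdx oi, uintptr_t retaddr);
 *
 * where the trailing oi/retaddr pair comes from EXTRA_ARGS below.
 */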
1189d9bb58e5SYang Zhong 
1190d9bb58e5SYang Zhong #define EXTRA_ARGS     , TCGMemOpIdx oi, uintptr_t retaddr
1191d9bb58e5SYang Zhong #define ATOMIC_NAME(X) \
1192d9bb58e5SYang Zhong     HELPER(glue(glue(glue(atomic_ ## X, SUFFIX), END), _mmu))
119334d49937SPeter Maydell #define ATOMIC_MMU_DECLS NotDirtyInfo ndi
119434d49937SPeter Maydell #define ATOMIC_MMU_LOOKUP atomic_mmu_lookup(env, addr, oi, retaddr, &ndi)
119534d49937SPeter Maydell #define ATOMIC_MMU_CLEANUP                              \
119634d49937SPeter Maydell     do {                                                \
119734d49937SPeter Maydell         if (unlikely(ndi.active)) {                     \
119834d49937SPeter Maydell             memory_notdirty_write_complete(&ndi);       \
119934d49937SPeter Maydell         }                                               \
120034d49937SPeter Maydell     } while (0)
1201d9bb58e5SYang Zhong 
1202d9bb58e5SYang Zhong #define DATA_SIZE 1
1203d9bb58e5SYang Zhong #include "atomic_template.h"
1204d9bb58e5SYang Zhong 
1205d9bb58e5SYang Zhong #define DATA_SIZE 2
1206d9bb58e5SYang Zhong #include "atomic_template.h"
1207d9bb58e5SYang Zhong 
1208d9bb58e5SYang Zhong #define DATA_SIZE 4
1209d9bb58e5SYang Zhong #include "atomic_template.h"
1210d9bb58e5SYang Zhong 
1211d9bb58e5SYang Zhong #ifdef CONFIG_ATOMIC64
1212d9bb58e5SYang Zhong #define DATA_SIZE 8
1213d9bb58e5SYang Zhong #include "atomic_template.h"
1214d9bb58e5SYang Zhong #endif
1215d9bb58e5SYang Zhong 
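/* The 16-byte helpers are only compiled when the host provides 128-bit
 * compare-and-swap or atomic load/store primitives, per the test below.
 */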
1216e6cd4bb5SRichard Henderson #if HAVE_CMPXCHG128 || HAVE_ATOMIC128
1217d9bb58e5SYang Zhong #define DATA_SIZE 16
1218d9bb58e5SYang Zhong #include "atomic_template.h"
1219d9bb58e5SYang Zhong #endif
1220d9bb58e5SYang Zhong 
1221d9bb58e5SYang Zhong /* The second set of helpers is directly callable from TCG as helpers.  */
1222d9bb58e5SYang Zhong 
1223d9bb58e5SYang Zhong #undef EXTRA_ARGS
1224d9bb58e5SYang Zhong #undef ATOMIC_NAME
1225d9bb58e5SYang Zhong #undef ATOMIC_MMU_LOOKUP
1226d9bb58e5SYang Zhong #define EXTRA_ARGS         , TCGMemOpIdx oi
1227d9bb58e5SYang Zhong #define ATOMIC_NAME(X)     HELPER(glue(glue(atomic_ ## X, SUFFIX), END))
122834d49937SPeter Maydell #define ATOMIC_MMU_LOOKUP  atomic_mmu_lookup(env, addr, oi, GETPC(), &ndi)
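/* Illustrative difference from the first set: with GETPC() supplying the
 * return address internally, the TCG-facing prototypes drop the explicit
 * retaddr parameter, e.g. roughly
 *
 *   uint32_t helper_atomic_fetch_addl_le(CPUArchState *env, target_ulong addr,
 *                                        uint32_t val, TCGMemOpIdx oi);
 */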
1229d9bb58e5SYang Zhong 
1230d9bb58e5SYang Zhong #define DATA_SIZE 1
1231d9bb58e5SYang Zhong #include "atomic_template.h"
1232d9bb58e5SYang Zhong 
1233d9bb58e5SYang Zhong #define DATA_SIZE 2
1234d9bb58e5SYang Zhong #include "atomic_template.h"
1235d9bb58e5SYang Zhong 
1236d9bb58e5SYang Zhong #define DATA_SIZE 4
1237d9bb58e5SYang Zhong #include "atomic_template.h"
1238d9bb58e5SYang Zhong 
1239d9bb58e5SYang Zhong #ifdef CONFIG_ATOMIC64
1240d9bb58e5SYang Zhong #define DATA_SIZE 8
1241d9bb58e5SYang Zhong #include "atomic_template.h"
1242d9bb58e5SYang Zhong #endif
1243d9bb58e5SYang Zhong 
1244d9bb58e5SYang Zhong /* Code access functions.  */
1245d9bb58e5SYang Zhong 
1246d9bb58e5SYang Zhong #undef MMUSUFFIX
1247d9bb58e5SYang Zhong #define MMUSUFFIX _cmmu
1248d9bb58e5SYang Zhong #undef GETPC
1249d9bb58e5SYang Zhong #define GETPC() ((uintptr_t)0)
1250d9bb58e5SYang Zhong #define SOFTMMU_CODE_ACCESS
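/* With SOFTMMU_CODE_ACCESS defined, softmmu_template.h emits the read-only
 * instruction-fetch variants, distinguished by the _cmmu suffix (assuming
 * the usual naming, e.g. helper_le_ldl_cmmu for a 4-byte little-endian
 * fetch).  GETPC() is forced to 0 because these run at translation time,
 * outside generated code, so there is no host return address to unwind.
 */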
1251d9bb58e5SYang Zhong 
1252d9bb58e5SYang Zhong #define DATA_SIZE 1
1253d9bb58e5SYang Zhong #include "softmmu_template.h"
1254d9bb58e5SYang Zhong 
1255d9bb58e5SYang Zhong #define DATA_SIZE 2
1256d9bb58e5SYang Zhong #include "softmmu_template.h"
1257d9bb58e5SYang Zhong 
1258d9bb58e5SYang Zhong #define DATA_SIZE 4
1259d9bb58e5SYang Zhong #include "softmmu_template.h"
1260d9bb58e5SYang Zhong 
1261d9bb58e5SYang Zhong #define DATA_SIZE 8
1262d9bb58e5SYang Zhong #include "softmmu_template.h"
1263