2014-03-28 19:42:10 +01:00
|
|
|
/*
|
|
|
|
* Software MMU support
|
|
|
|
*
|
|
|
|
* This library is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
|
|
* License as published by the Free Software Foundation; either
|
2020-10-23 14:33:53 +02:00
|
|
|
* version 2.1 of the License, or (at your option) any later version.
|
2014-03-28 19:42:10 +01:00
|
|
|
*
|
|
|
|
* This library is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* Lesser General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
|
|
* License along with this library; if not, see <http://www.gnu.org/licenses/>.
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Generate inline load/store functions for all MMU modes (typically
|
|
|
|
* at least _user and _kernel) as well as _data versions, for all data
|
|
|
|
* sizes.
|
|
|
|
*
|
|
|
|
* Used by target op helpers.
|
|
|
|
*
|
2015-01-20 16:19:35 +01:00
|
|
|
* The syntax for the accessors is:
|
|
|
|
*
|
2020-05-08 17:43:46 +02:00
|
|
|
* load: cpu_ld{sign}{size}{end}_{mmusuffix}(env, ptr)
|
|
|
|
* cpu_ld{sign}{size}{end}_{mmusuffix}_ra(env, ptr, retaddr)
|
|
|
|
* cpu_ld{sign}{size}{end}_mmuidx_ra(env, ptr, mmu_idx, retaddr)
|
2015-01-20 16:19:35 +01:00
|
|
|
*
|
2020-05-08 17:43:46 +02:00
|
|
|
* store: cpu_st{size}{end}_{mmusuffix}(env, ptr, val)
|
|
|
|
* cpu_st{size}{end}_{mmusuffix}_ra(env, ptr, val, retaddr)
|
|
|
|
* cpu_st{size}{end}_mmuidx_ra(env, ptr, val, mmu_idx, retaddr)
|
2015-01-20 16:19:35 +01:00
|
|
|
*
|
|
|
|
* sign is:
|
|
|
|
* (empty): for 32 and 64 bit sizes
|
|
|
|
* u : unsigned
|
|
|
|
* s : signed
|
|
|
|
*
|
|
|
|
* size is:
|
|
|
|
* b: 8 bits
|
|
|
|
* w: 16 bits
|
|
|
|
* l: 32 bits
|
|
|
|
* q: 64 bits
|
|
|
|
*
|
2020-05-08 17:43:46 +02:00
|
|
|
* end is:
|
|
|
|
* (empty): for target native endian, or for 8 bit access
|
|
|
|
* _be: for forced big endian
|
|
|
|
* _le: for forced little endian
|
|
|
|
*
|
2019-12-10 06:10:04 +01:00
|
|
|
* mmusuffix is one of the generic suffixes "data" or "code", or "mmuidx".
|
|
|
|
* The "mmuidx" suffix carries an extra mmu_idx argument that specifies
|
|
|
|
* the index to use; the "data" and "code" suffixes take the index from
|
|
|
|
* cpu_mmu_index().
|
2014-03-28 19:42:10 +01:00
|
|
|
*/
|
|
|
|
#ifndef CPU_LDST_H
|
|
|
|
#define CPU_LDST_H
|
|
|
|
|
2014-03-28 19:11:26 +01:00
|
|
|
#if defined(CONFIG_USER_ONLY)
|
2018-08-14 19:12:17 +02:00
|
|
|
/*
 * sparc32plus has a 64-bit long but a 32-bit address space, which can
 * give wrong results with g2h() and h2g().  The width of abi_ptr is
 * therefore chosen from TARGET_VIRT_ADDR_SPACE_BITS.
 *
 * TARGET_ABI_FMT_ptr is the printf conversion matching abi_ptr; both
 * branches use the <inttypes.h> macro for the exact fixed-width type.
 */
#if TARGET_VIRT_ADDR_SPACE_BITS <= 32
typedef uint32_t abi_ptr;
#define TARGET_ABI_FMT_ptr "%"PRIx32
#else
typedef uint64_t abi_ptr;
#define TARGET_ABI_FMT_ptr "%"PRIx64
#endif
|
|
|
|
|
2021-02-12 19:48:42 +01:00
|
|
|
#ifndef TARGET_TAGGED_ADDRESSES
|
|
|
|
static inline abi_ptr cpu_untagged_addr(CPUState *cs, abi_ptr x)
|
|
|
|
{
|
|
|
|
return x;
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2014-03-28 19:11:26 +01:00
|
|
|
/* All direct uses of g2h and h2g need to go away for usermode softmmu. */
|
2021-02-12 19:48:43 +01:00
|
|
|
/*
 * Convert guest address @x to a host pointer by adding guest_base.
 * No untagging is applied to @x here.
 */
static inline void *g2h_untagged(abi_ptr x)
{
    const uintptr_t guest_addr = (uintptr_t)x;

    return (void *)(guest_addr + guest_base);
}
|
|
|
|
|
|
|
|
/*
 * Convert guest address @x to a host pointer: the address is first
 * passed through cpu_untagged_addr() for @cs, then through
 * g2h_untagged().
 */
static inline void *g2h(CPUState *cs, abi_ptr x)
{
    abi_ptr untagged = cpu_untagged_addr(cs, x);

    return g2h_untagged(untagged);
}
|
2014-03-28 19:11:26 +01:00
|
|
|
|
2021-02-12 19:48:46 +01:00
|
|
|
/* Return true if @x does not exceed GUEST_ADDR_MAX. */
static inline bool guest_addr_valid_untagged(abi_ulong x)
{
    return !(x > GUEST_ADDR_MAX);
}
|
2018-03-07 22:50:10 +01:00
|
|
|
|
2021-02-12 19:48:46 +01:00
|
|
|
/*
 * Return true if the @len bytes starting at @start all lie at or below
 * GUEST_ADDR_MAX.  The comparisons are arranged so that start + len is
 * never computed directly.
 */
static inline bool guest_range_valid_untagged(abi_ulong start, abi_ulong len)
{
    /* Offset of the last byte must itself fit below the limit. */
    if (!(len - 1 <= GUEST_ADDR_MAX)) {
        return false;
    }

    return start <= GUEST_ADDR_MAX - len + 1;
}
|
2014-03-28 19:11:26 +01:00
|
|
|
|
2021-02-12 19:48:40 +01:00
|
|
|
/*
 * h2g_valid(x): non-zero if host address @x, once guest_base is
 * subtracted, is no greater than GUEST_ADDR_MAX.  Always non-zero when
 * HOST_LONG_BITS <= TARGET_VIRT_ADDR_SPACE_BITS.
 */
#define h2g_valid(x) \
    (!(HOST_LONG_BITS > TARGET_VIRT_ADDR_SPACE_BITS && \
       (uintptr_t)(x) - guest_base > GUEST_ADDR_MAX))
|
|
|
|
|
2014-03-28 19:11:26 +01:00
|
|
|
/*
 * h2g_nocheck(x): subtract guest_base from host address @x and convert
 * the result to abi_ptr, without any range check.  The difference is
 * narrowed to uintptr_t before the final conversion.
 */
#define h2g_nocheck(x) \
    ((abi_ptr)(uintptr_t)((uintptr_t)(x) - guest_base))
|
|
|
|
|
|
|
|
/*
 * h2g(x): checked variant of h2g_nocheck(): assert that host address
 * @x passes h2g_valid(), then yield the h2g_nocheck() result.
 *
 * The argument is captured once in a local so that an expression with
 * side effects is not evaluated twice (once by the assertion and once
 * by the conversion).  Both h2g_valid() and h2g_nocheck() cast their
 * argument to uintptr_t, so converting up front does not change the
 * value they see.
 */
#define h2g(x) ({ \
    const uintptr_t h2g_host_ = (uintptr_t)(x); \
    /* Check if given address fits target address space */ \
    assert(h2g_valid(h2g_host_)); \
    h2g_nocheck(h2g_host_); \
})
|
2018-08-14 19:12:17 +02:00
|
|
|
#else
|
|
|
|
/*
 * Without CONFIG_USER_ONLY, abi_ptr is simply target_ulong and is
 * printed with the matching TARGET_ABI_FMT_lx format.
 */
typedef target_ulong abi_ptr;
#define TARGET_ABI_FMT_ptr TARGET_ABI_FMT_lx
|
2014-03-28 19:42:10 +01:00
|
|
|
#endif
|
|
|
|
|
2019-12-11 21:31:36 +01:00
|
|
|
/*
 * "data" loads, named cpu_ld{sign}{size}{end}_data.
 * Unsigned and 32-bit loads return uint32_t, signed loads return int,
 * and 64-bit loads return uint64_t.
 */

/* 8-bit (no endianness suffix). */
uint32_t cpu_ldub_data(CPUArchState *env, abi_ptr ptr);
int      cpu_ldsb_data(CPUArchState *env, abi_ptr ptr);

/* Forced big-endian. */
uint32_t cpu_lduw_be_data(CPUArchState *env, abi_ptr ptr);
int      cpu_ldsw_be_data(CPUArchState *env, abi_ptr ptr);
uint32_t cpu_ldl_be_data(CPUArchState *env, abi_ptr ptr);
uint64_t cpu_ldq_be_data(CPUArchState *env, abi_ptr ptr);

/* Forced little-endian. */
uint32_t cpu_lduw_le_data(CPUArchState *env, abi_ptr ptr);
int      cpu_ldsw_le_data(CPUArchState *env, abi_ptr ptr);
uint32_t cpu_ldl_le_data(CPUArchState *env, abi_ptr ptr);
uint64_t cpu_ldq_le_data(CPUArchState *env, abi_ptr ptr);

/* The same loads with an extra return-address argument (_ra). */
uint32_t cpu_ldub_data_ra(CPUArchState *env, abi_ptr ptr, uintptr_t ra);
int      cpu_ldsb_data_ra(CPUArchState *env, abi_ptr ptr, uintptr_t ra);

uint32_t cpu_lduw_be_data_ra(CPUArchState *env, abi_ptr ptr, uintptr_t ra);
int      cpu_ldsw_be_data_ra(CPUArchState *env, abi_ptr ptr, uintptr_t ra);
uint32_t cpu_ldl_be_data_ra(CPUArchState *env, abi_ptr ptr, uintptr_t ra);
uint64_t cpu_ldq_be_data_ra(CPUArchState *env, abi_ptr ptr, uintptr_t ra);

uint32_t cpu_lduw_le_data_ra(CPUArchState *env, abi_ptr ptr, uintptr_t ra);
int      cpu_ldsw_le_data_ra(CPUArchState *env, abi_ptr ptr, uintptr_t ra);
uint32_t cpu_ldl_le_data_ra(CPUArchState *env, abi_ptr ptr, uintptr_t ra);
uint64_t cpu_ldq_le_data_ra(CPUArchState *env, abi_ptr ptr, uintptr_t ra);
|
2019-12-11 21:31:36 +01:00
|
|
|
|
|
|
|
/*
 * "data" stores, named cpu_st{size}{end}_data.
 * 8/16/32-bit stores take a uint32_t value, 64-bit stores a uint64_t.
 */

/* 8-bit (no endianness suffix). */
void cpu_stb_data(CPUArchState *env, abi_ptr ptr, uint32_t val);

/* Forced big-endian. */
void cpu_stw_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val);
void cpu_stl_be_data(CPUArchState *env, abi_ptr ptr, uint32_t val);
void cpu_stq_be_data(CPUArchState *env, abi_ptr ptr, uint64_t val);

/* Forced little-endian. */
void cpu_stw_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val);
void cpu_stl_le_data(CPUArchState *env, abi_ptr ptr, uint32_t val);
void cpu_stq_le_data(CPUArchState *env, abi_ptr ptr, uint64_t val);

/* The same stores with an extra return-address argument (_ra). */
void cpu_stb_data_ra(CPUArchState *env, abi_ptr ptr,
                     uint32_t val, uintptr_t ra);

void cpu_stw_be_data_ra(CPUArchState *env, abi_ptr ptr,
                        uint32_t val, uintptr_t ra);
void cpu_stl_be_data_ra(CPUArchState *env, abi_ptr ptr,
                        uint32_t val, uintptr_t ra);
void cpu_stq_be_data_ra(CPUArchState *env, abi_ptr ptr,
                        uint64_t val, uintptr_t ra);

void cpu_stw_le_data_ra(CPUArchState *env, abi_ptr ptr,
                        uint32_t val, uintptr_t ra);
void cpu_stl_le_data_ra(CPUArchState *env, abi_ptr ptr,
                        uint32_t val, uintptr_t ra);
void cpu_stq_le_data_ra(CPUArchState *env, abi_ptr ptr,
                        uint64_t val, uintptr_t ra);
|
2014-03-28 19:11:26 +01:00
|
|
|
|
2019-12-11 19:33:26 +01:00
|
|
|
#if defined(CONFIG_USER_ONLY)
|
|
|
|
|
|
|
|
/*
 * Per-thread value written by set_helper_retaddr() and reset to 0 by
 * clear_helper_retaddr(); it is the data made visible to the SIGSEGV
 * handler around helper memory accesses.
 */
extern __thread uintptr_t helper_retaddr;
|
|
|
|
|
|
|
|
static inline void set_helper_retaddr(uintptr_t ra)
|
|
|
|
{
|
|
|
|
helper_retaddr = ra;
|
|
|
|
/*
|
|
|
|
* Ensure that this write is visible to the SIGSEGV handler that
|
|
|
|
* may be invoked due to a subsequent invalid memory operation.
|
|
|
|
*/
|
|
|
|
signal_barrier();
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void clear_helper_retaddr(void)
|
|
|
|
{
|
|
|
|
/*
|
|
|
|
* Ensure that previous memory operations have succeeded before
|
|
|
|
* removing the data visible to the signal handler.
|
|
|
|
*/
|
|
|
|
signal_barrier();
|
|
|
|
helper_retaddr = 0;
|
|
|
|
}
|
|
|
|
|
2019-12-10 06:10:04 +01:00
|
|
|
/*
|
|
|
|
* Provide the same *_mmuidx_ra interface as for softmmu.
|
|
|
|
* The mmu_idx argument is ignored.
|
|
|
|
*/
|
|
|
|
|
|
|
|
/* User-only: unsigned 8-bit load; @mmu_idx is ignored. */
static inline uint32_t cpu_ldub_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                          int mmu_idx, uintptr_t ra)
{
    uint32_t loaded;

    (void)mmu_idx;
    loaded = cpu_ldub_data_ra(env, addr, ra);
    return loaded;
}
|
|
|
|
|
2020-05-08 17:43:46 +02:00
|
|
|
/* User-only: signed 8-bit load; @mmu_idx is ignored. */
static inline int cpu_ldsb_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                     int mmu_idx, uintptr_t ra)
{
    int loaded;

    (void)mmu_idx;
    loaded = cpu_ldsb_data_ra(env, addr, ra);
    return loaded;
}
|
|
|
|
|
2020-05-08 17:43:46 +02:00
|
|
|
/* User-only: unsigned 16-bit big-endian load; @mmu_idx is ignored. */
static inline uint32_t cpu_lduw_be_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                             int mmu_idx, uintptr_t ra)
{
    uint32_t loaded;

    (void)mmu_idx;
    loaded = cpu_lduw_be_data_ra(env, addr, ra);
    return loaded;
}
|
|
|
|
|
2020-05-08 17:43:46 +02:00
|
|
|
/* User-only: signed 16-bit big-endian load; @mmu_idx is ignored. */
static inline int cpu_ldsw_be_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                        int mmu_idx, uintptr_t ra)
{
    int loaded;

    (void)mmu_idx;
    loaded = cpu_ldsw_be_data_ra(env, addr, ra);
    return loaded;
}
|
|
|
|
|
2020-05-08 17:43:46 +02:00
|
|
|
/* User-only: 32-bit big-endian load; @mmu_idx is ignored. */
static inline uint32_t cpu_ldl_be_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                            int mmu_idx, uintptr_t ra)
{
    uint32_t loaded;

    (void)mmu_idx;
    loaded = cpu_ldl_be_data_ra(env, addr, ra);
    return loaded;
}
|
|
|
|
|
2020-05-08 17:43:46 +02:00
|
|
|
/* User-only: 64-bit big-endian load; @mmu_idx is ignored. */
static inline uint64_t cpu_ldq_be_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                            int mmu_idx, uintptr_t ra)
{
    uint64_t loaded;

    (void)mmu_idx;
    loaded = cpu_ldq_be_data_ra(env, addr, ra);
    return loaded;
}
|
|
|
|
|
|
|
|
/* User-only: unsigned 16-bit little-endian load; @mmu_idx is ignored. */
static inline uint32_t cpu_lduw_le_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                             int mmu_idx, uintptr_t ra)
{
    uint32_t loaded;

    (void)mmu_idx;
    loaded = cpu_lduw_le_data_ra(env, addr, ra);
    return loaded;
}
|
|
|
|
|
|
|
|
/* User-only: signed 16-bit little-endian load; @mmu_idx is ignored. */
static inline int cpu_ldsw_le_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                        int mmu_idx, uintptr_t ra)
{
    int loaded;

    (void)mmu_idx;
    loaded = cpu_ldsw_le_data_ra(env, addr, ra);
    return loaded;
}
|
|
|
|
|
|
|
|
/* User-only: 32-bit little-endian load; @mmu_idx is ignored. */
static inline uint32_t cpu_ldl_le_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                            int mmu_idx, uintptr_t ra)
{
    uint32_t loaded;

    (void)mmu_idx;
    loaded = cpu_ldl_le_data_ra(env, addr, ra);
    return loaded;
}
|
|
|
|
|
|
|
|
/* User-only: 64-bit little-endian load; @mmu_idx is ignored. */
static inline uint64_t cpu_ldq_le_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                            int mmu_idx, uintptr_t ra)
{
    uint64_t loaded;

    (void)mmu_idx;
    loaded = cpu_ldq_le_data_ra(env, addr, ra);
    return loaded;
}
|
|
|
|
|
|
|
|
/* User-only: 8-bit store; @mmu_idx is ignored. */
static inline void cpu_stb_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                     uint32_t val, int mmu_idx, uintptr_t ra)
{
    (void)mmu_idx;

    cpu_stb_data_ra(env, addr, val, ra);
}
|
|
|
|
|
2020-05-08 17:43:46 +02:00
|
|
|
/* User-only: 16-bit big-endian store; @mmu_idx is ignored. */
static inline void cpu_stw_be_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                        uint32_t val, int mmu_idx,
                                        uintptr_t ra)
{
    (void)mmu_idx;

    cpu_stw_be_data_ra(env, addr, val, ra);
}
|
|
|
|
|
2020-05-08 17:43:46 +02:00
|
|
|
/* User-only: 32-bit big-endian store; @mmu_idx is ignored. */
static inline void cpu_stl_be_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                        uint32_t val, int mmu_idx,
                                        uintptr_t ra)
{
    (void)mmu_idx;

    cpu_stl_be_data_ra(env, addr, val, ra);
}
|
|
|
|
|
|
|
|
/* User-only: 64-bit big-endian store; @mmu_idx is ignored. */
static inline void cpu_stq_be_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                        uint64_t val, int mmu_idx,
                                        uintptr_t ra)
{
    (void)mmu_idx;

    cpu_stq_be_data_ra(env, addr, val, ra);
}
|
|
|
|
|
|
|
|
/* User-only: 16-bit little-endian store; @mmu_idx is ignored. */
static inline void cpu_stw_le_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                        uint32_t val, int mmu_idx,
                                        uintptr_t ra)
{
    (void)mmu_idx;

    cpu_stw_le_data_ra(env, addr, val, ra);
}
|
|
|
|
|
|
|
|
/* User-only: 32-bit little-endian store; @mmu_idx is ignored. */
static inline void cpu_stl_le_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                        uint32_t val, int mmu_idx,
                                        uintptr_t ra)
{
    (void)mmu_idx;

    cpu_stl_le_data_ra(env, addr, val, ra);
}
|
|
|
|
|
2020-05-08 17:43:46 +02:00
|
|
|
/* User-only: 64-bit little-endian store; @mmu_idx is ignored. */
static inline void cpu_stq_le_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                                        uint64_t val, int mmu_idx,
                                        uintptr_t ra)
{
    (void)mmu_idx;

    cpu_stq_le_data_ra(env, addr, val, ra);
}
|
|
|
|
|
2014-03-28 19:11:26 +01:00
|
|
|
#else
|
|
|
|
|
2019-12-09 22:49:58 +01:00
|
|
|
/* Needed for TCG_OVERSIZED_GUEST */
|
2020-01-01 12:23:00 +01:00
|
|
|
#include "tcg/tcg.h"
|
2014-03-28 19:11:26 +01:00
|
|
|
|
cputlb: read CPUTLBEntry.addr_write atomically
Updates can come from other threads, so readers that do not
take tlb_lock must use atomic_read to avoid undefined
behaviour (UB).
This completes the conversion to tlb_lock. This conversion results
on average in no performance loss, as the following experiments
(run on an Intel i7-6700K CPU @ 4.00GHz) show.
1. aarch64 bootup+shutdown test:
- Before:
Performance counter stats for 'taskset -c 0 ../img/aarch64/die.sh' (10 runs):
7487.087786 task-clock (msec) # 0.998 CPUs utilized ( +- 0.12% )
31,574,905,303 cycles # 4.217 GHz ( +- 0.12% )
57,097,908,812 instructions # 1.81 insns per cycle ( +- 0.08% )
10,255,415,367 branches # 1369.747 M/sec ( +- 0.08% )
173,278,962 branch-misses # 1.69% of all branches ( +- 0.18% )
7.504481349 seconds time elapsed ( +- 0.14% )
- After:
Performance counter stats for 'taskset -c 0 ../img/aarch64/die.sh' (10 runs):
7462.441328 task-clock (msec) # 0.998 CPUs utilized ( +- 0.07% )
31,478,476,520 cycles # 4.218 GHz ( +- 0.07% )
57,017,330,084 instructions # 1.81 insns per cycle ( +- 0.05% )
10,251,929,667 branches # 1373.804 M/sec ( +- 0.05% )
173,023,787 branch-misses # 1.69% of all branches ( +- 0.11% )
7.474970463 seconds time elapsed ( +- 0.07% )
2. SPEC06int:
SPEC06int (test set)
[Y axis: Speedup over master]
1.15 +-+----+------+------+------+------+------+-------+------+------+------+------+------+------+----+-+
| |
1.1 +-+.................................+++.............................+ tlb-lock-v2 (m+++x) +-+
| +++ | +++ tlb-lock-v3 (spinl|ck) |
| +++ | | +++ +++ | | |
1.05 +-+....+++...........####.........|####.+++.|......|.....###....+++...........+++....###.........+-+
| ### ++#| # |# |# ***### +++### +++#+# | +++ | #|# ### |
1 +-+++***+#++++####+++#++#++++++++++#++#+*+*++#++++#+#+****+#++++###++++###++++###++++#+#++++#+#+++-+
| *+* # #++# *** # #### *** # * *++# ****+# *| * # ****|# |# # #|# #+# # # |
0.95 +-+..*.*.#....#..#.*|*..#...#..#.*|*..#.*.*..#.*|.*.#.*++*.#.*++*+#.****.#....#+#....#.#..++#.#..+-+
| * * # # # *|* # # # *|* # * * # *++* # * * # * * # * |* # ++# # # # *** # |
| * * # ++# # *+* # # # *|* # * * # * * # * * # * * # *++* # **** # ++# # * * # |
0.9 +-+..*.*.#...|#..#.*.*..#.++#..#.*|*..#.*.*..#.*..*.#.*..*.#.*..*.#.*..*.#.*.|*.#...|#.#..*.*.#..+-+
| * * # *** # * * # |# # *+* # * * # * * # * * # * * # * * # *++* # |# # * * # |
0.85 +-+..*.*.#..*|*..#.*.*..#.***..#.*.*..#.*.*..#.*..*.#.*..*.#.*..*.#.*..*.#.*..*.#.****.#..*.*.#..+-+
| * * # *+* # * * # *|* # * * # * * # * * # * * # * * # * * # * * # * |* # * * # |
| * * # * * # * * # *+* # * * # * * # * * # * * # * * # * * # * * # * |* # * * # |
0.8 +-+..*.*.#..*.*..#.*.*..#.*.*..#.*.*..#.*.*..#.*..*.#.*..*.#.*..*.#.*..*.#.*..*.#.*++*.#..*.*.#..+-+
| * * # * * # * * # * * # * * # * * # * * # * * # * * # * * # * * # * * # * * # |
0.75 +-+--***##--***###-***###-***###-***###-***###-****##-****##-****##-****##-****##-****##--***##--+-+
400.perlben401.bzip2403.gcc429.m445.gob456.hmme45462.libqua464.h26471.omnet473483.xalancbmkgeomean
png: https://imgur.com/a/BHzpPTW
Notes:
- tlb-lock-v2 corresponds to an implementation with a mutex.
- tlb-lock-v3 corresponds to the current implementation, i.e.
a spinlock and a single lock acquisition in tlb_set_page_with_attrs.
Signed-off-by: Emilio G. Cota <cota@braap.org>
Message-Id: <20181016153840.25877-1-cota@braap.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
2018-10-16 17:38:40 +02:00
|
|
|
static inline target_ulong tlb_addr_write(const CPUTLBEntry *entry)
|
|
|
|
{
|
|
|
|
#if TCG_OVERSIZED_GUEST
|
|
|
|
return entry->addr_write;
|
|
|
|
#else
|
2020-09-23 12:56:46 +02:00
|
|
|
return qatomic_read(&entry->addr_write);
|
cputlb: read CPUTLBEntry.addr_write atomically
Updates can come from other threads, so readers that do not
take tlb_lock must use atomic_read to avoid undefined
behaviour (UB).
This completes the conversion to tlb_lock. This conversion results
on average in no performance loss, as the following experiments
(run on an Intel i7-6700K CPU @ 4.00GHz) show.
1. aarch64 bootup+shutdown test:
- Before:
Performance counter stats for 'taskset -c 0 ../img/aarch64/die.sh' (10 runs):
7487.087786 task-clock (msec) # 0.998 CPUs utilized ( +- 0.12% )
31,574,905,303 cycles # 4.217 GHz ( +- 0.12% )
57,097,908,812 instructions # 1.81 insns per cycle ( +- 0.08% )
10,255,415,367 branches # 1369.747 M/sec ( +- 0.08% )
173,278,962 branch-misses # 1.69% of all branches ( +- 0.18% )
7.504481349 seconds time elapsed ( +- 0.14% )
- After:
Performance counter stats for 'taskset -c 0 ../img/aarch64/die.sh' (10 runs):
7462.441328 task-clock (msec) # 0.998 CPUs utilized ( +- 0.07% )
31,478,476,520 cycles # 4.218 GHz ( +- 0.07% )
57,017,330,084 instructions # 1.81 insns per cycle ( +- 0.05% )
10,251,929,667 branches # 1373.804 M/sec ( +- 0.05% )
173,023,787 branch-misses # 1.69% of all branches ( +- 0.11% )
7.474970463 seconds time elapsed ( +- 0.07% )
2. SPEC06int:
SPEC06int (test set)
[Y axis: Speedup over master]
1.15 +-+----+------+------+------+------+------+-------+------+------+------+------+------+------+----+-+
| |
1.1 +-+.................................+++.............................+ tlb-lock-v2 (m+++x) +-+
| +++ | +++ tlb-lock-v3 (spinl|ck) |
| +++ | | +++ +++ | | |
1.05 +-+....+++...........####.........|####.+++.|......|.....###....+++...........+++....###.........+-+
| ### ++#| # |# |# ***### +++### +++#+# | +++ | #|# ### |
1 +-+++***+#++++####+++#++#++++++++++#++#+*+*++#++++#+#+****+#++++###++++###++++###++++#+#++++#+#+++-+
| *+* # #++# *** # #### *** # * *++# ****+# *| * # ****|# |# # #|# #+# # # |
0.95 +-+..*.*.#....#..#.*|*..#...#..#.*|*..#.*.*..#.*|.*.#.*++*.#.*++*+#.****.#....#+#....#.#..++#.#..+-+
| * * # # # *|* # # # *|* # * * # *++* # * * # * * # * |* # ++# # # # *** # |
| * * # ++# # *+* # # # *|* # * * # * * # * * # * * # *++* # **** # ++# # * * # |
0.9 +-+..*.*.#...|#..#.*.*..#.++#..#.*|*..#.*.*..#.*..*.#.*..*.#.*..*.#.*..*.#.*.|*.#...|#.#..*.*.#..+-+
| * * # *** # * * # |# # *+* # * * # * * # * * # * * # * * # *++* # |# # * * # |
0.85 +-+..*.*.#..*|*..#.*.*..#.***..#.*.*..#.*.*..#.*..*.#.*..*.#.*..*.#.*..*.#.*..*.#.****.#..*.*.#..+-+
| * * # *+* # * * # *|* # * * # * * # * * # * * # * * # * * # * * # * |* # * * # |
| * * # * * # * * # *+* # * * # * * # * * # * * # * * # * * # * * # * |* # * * # |
0.8 +-+..*.*.#..*.*..#.*.*..#.*.*..#.*.*..#.*.*..#.*..*.#.*..*.#.*..*.#.*..*.#.*..*.#.*++*.#..*.*.#..+-+
| * * # * * # * * # * * # * * # * * # * * # * * # * * # * * # * * # * * # * * # |
0.75 +-+--***##--***###-***###-***###-***###-***###-****##-****##-****##-****##-****##-****##--***##--+-+
400.perlben401.bzip2403.gcc429.m445.gob456.hmme45462.libqua464.h26471.omnet473483.xalancbmkgeomean
png: https://imgur.com/a/BHzpPTW
Notes:
- tlb-lock-v2 corresponds to an implementation with a mutex.
- tlb-lock-v3 corresponds to the current implementation, i.e.
a spinlock and a single lock acquisition in tlb_set_page_with_attrs.
Signed-off-by: Emilio G. Cota <cota@braap.org>
Message-Id: <20181016153840.25877-1-cota@braap.org>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
2018-10-16 17:38:40 +02:00
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2019-01-16 18:01:13 +01:00
|
|
|
/* Find the TLB index corresponding to the mmu_idx + address pair. */
|
|
|
|
static inline uintptr_t tlb_index(CPUArchState *env, uintptr_t mmu_idx,
|
|
|
|
target_ulong addr)
|
|
|
|
{
|
2019-03-22 21:52:09 +01:00
|
|
|
uintptr_t size_mask = env_tlb(env)->f[mmu_idx].mask >> CPU_TLB_ENTRY_BITS;
|
2019-01-16 18:01:13 +01:00
|
|
|
|
|
|
|
return (addr >> TARGET_PAGE_BITS) & size_mask;
|
|
|
|
}
|
|
|
|
|
2018-10-09 19:51:25 +02:00
|
|
|
/* Find the TLB entry corresponding to the mmu_idx + address pair. */
|
|
|
|
static inline CPUTLBEntry *tlb_entry(CPUArchState *env, uintptr_t mmu_idx,
|
|
|
|
target_ulong addr)
|
|
|
|
{
|
2019-03-22 21:52:09 +01:00
|
|
|
return &env_tlb(env)->f[mmu_idx].table[tlb_index(env, mmu_idx, addr)];
|
2018-10-09 19:51:25 +02:00
|
|
|
}
|
|
|
|
|
2019-12-09 22:49:58 +01:00
|
|
|
/*
 * Loads taking an explicit @mmu_idx and return address @ra,
 * named cpu_ld{sign}{size}{end}_mmuidx_ra.
 */

/* 8-bit (no endianness suffix). */
uint32_t cpu_ldub_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                            int mmu_idx, uintptr_t ra);
int      cpu_ldsb_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                            int mmu_idx, uintptr_t ra);

/* Forced big-endian. */
uint32_t cpu_lduw_be_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                               int mmu_idx, uintptr_t ra);
int      cpu_ldsw_be_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                               int mmu_idx, uintptr_t ra);
uint32_t cpu_ldl_be_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                              int mmu_idx, uintptr_t ra);
uint64_t cpu_ldq_be_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                              int mmu_idx, uintptr_t ra);

/* Forced little-endian. */
uint32_t cpu_lduw_le_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                               int mmu_idx, uintptr_t ra);
int      cpu_ldsw_le_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                               int mmu_idx, uintptr_t ra);
uint32_t cpu_ldl_le_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                              int mmu_idx, uintptr_t ra);
uint64_t cpu_ldq_le_mmuidx_ra(CPUArchState *env, abi_ptr addr,
                              int mmu_idx, uintptr_t ra);
|
2019-12-09 22:49:58 +01:00
|
|
|
|
|
|
|
/*
 * Stores taking an explicit @mmu_idx and return address @retaddr,
 * named cpu_st{size}{end}_mmuidx_ra.
 */

/* 8-bit (no endianness suffix). */
void cpu_stb_mmuidx_ra(CPUArchState *env, abi_ptr addr, uint32_t val,
                       int mmu_idx, uintptr_t retaddr);

/* Forced big-endian. */
void cpu_stw_be_mmuidx_ra(CPUArchState *env, abi_ptr addr, uint32_t val,
                          int mmu_idx, uintptr_t retaddr);
void cpu_stl_be_mmuidx_ra(CPUArchState *env, abi_ptr addr, uint32_t val,
                          int mmu_idx, uintptr_t retaddr);
void cpu_stq_be_mmuidx_ra(CPUArchState *env, abi_ptr addr, uint64_t val,
                          int mmu_idx, uintptr_t retaddr);

/* Forced little-endian. */
void cpu_stw_le_mmuidx_ra(CPUArchState *env, abi_ptr addr, uint32_t val,
                          int mmu_idx, uintptr_t retaddr);
void cpu_stl_le_mmuidx_ra(CPUArchState *env, abi_ptr addr, uint32_t val,
                          int mmu_idx, uintptr_t retaddr);
void cpu_stq_le_mmuidx_ra(CPUArchState *env, abi_ptr addr, uint64_t val,
                          int mmu_idx, uintptr_t retaddr);
|
2019-12-09 22:49:58 +01:00
|
|
|
|
2019-12-11 21:31:36 +01:00
|
|
|
#endif /* defined(CONFIG_USER_ONLY) */
|
|
|
|
|
2020-05-08 17:43:46 +02:00
|
|
|
/*
 * Accessor names without an explicit _be/_le part are aliases for the
 * explicit-endian functions, chosen by TARGET_WORDS_BIGENDIAN.
 * The aliases are grouped by access size.
 */
#ifdef TARGET_WORDS_BIGENDIAN
/* 16-bit loads */
# define cpu_lduw_data        cpu_lduw_be_data
# define cpu_lduw_data_ra     cpu_lduw_be_data_ra
# define cpu_lduw_mmuidx_ra   cpu_lduw_be_mmuidx_ra
# define cpu_ldsw_data        cpu_ldsw_be_data
# define cpu_ldsw_data_ra     cpu_ldsw_be_data_ra
# define cpu_ldsw_mmuidx_ra   cpu_ldsw_be_mmuidx_ra
/* 32-bit loads */
# define cpu_ldl_data         cpu_ldl_be_data
# define cpu_ldl_data_ra      cpu_ldl_be_data_ra
# define cpu_ldl_mmuidx_ra    cpu_ldl_be_mmuidx_ra
/* 64-bit loads */
# define cpu_ldq_data         cpu_ldq_be_data
# define cpu_ldq_data_ra      cpu_ldq_be_data_ra
# define cpu_ldq_mmuidx_ra    cpu_ldq_be_mmuidx_ra
/* 16-bit stores */
# define cpu_stw_data         cpu_stw_be_data
# define cpu_stw_data_ra      cpu_stw_be_data_ra
# define cpu_stw_mmuidx_ra    cpu_stw_be_mmuidx_ra
/* 32-bit stores */
# define cpu_stl_data         cpu_stl_be_data
# define cpu_stl_data_ra      cpu_stl_be_data_ra
# define cpu_stl_mmuidx_ra    cpu_stl_be_mmuidx_ra
/* 64-bit stores */
# define cpu_stq_data         cpu_stq_be_data
# define cpu_stq_data_ra      cpu_stq_be_data_ra
# define cpu_stq_mmuidx_ra    cpu_stq_be_mmuidx_ra
#else
/* 16-bit loads */
# define cpu_lduw_data        cpu_lduw_le_data
# define cpu_lduw_data_ra     cpu_lduw_le_data_ra
# define cpu_lduw_mmuidx_ra   cpu_lduw_le_mmuidx_ra
# define cpu_ldsw_data        cpu_ldsw_le_data
# define cpu_ldsw_data_ra     cpu_ldsw_le_data_ra
# define cpu_ldsw_mmuidx_ra   cpu_ldsw_le_mmuidx_ra
/* 32-bit loads */
# define cpu_ldl_data         cpu_ldl_le_data
# define cpu_ldl_data_ra      cpu_ldl_le_data_ra
# define cpu_ldl_mmuidx_ra    cpu_ldl_le_mmuidx_ra
/* 64-bit loads */
# define cpu_ldq_data         cpu_ldq_le_data
# define cpu_ldq_data_ra      cpu_ldq_le_data_ra
# define cpu_ldq_mmuidx_ra    cpu_ldq_le_mmuidx_ra
/* 16-bit stores */
# define cpu_stw_data         cpu_stw_le_data
# define cpu_stw_data_ra      cpu_stw_le_data_ra
# define cpu_stw_mmuidx_ra    cpu_stw_le_mmuidx_ra
/* 32-bit stores */
# define cpu_stl_data         cpu_stl_le_data
# define cpu_stl_data_ra      cpu_stl_le_data_ra
# define cpu_stl_mmuidx_ra    cpu_stl_le_mmuidx_ra
/* 64-bit stores */
# define cpu_stq_data         cpu_stq_le_data
# define cpu_stq_data_ra      cpu_stq_le_data_ra
# define cpu_stq_mmuidx_ra    cpu_stq_le_mmuidx_ra
#endif
|
|
|
|
|
2019-12-11 20:25:10 +01:00
|
|
|
/* "code" loads: unsigned 8/16-bit, 32-bit and 64-bit variants. */
uint32_t cpu_ldub_code(CPUArchState *env, abi_ptr addr);
uint32_t cpu_lduw_code(CPUArchState *env, abi_ptr addr);
uint32_t cpu_ldl_code(CPUArchState *env, abi_ptr addr);
uint64_t cpu_ldq_code(CPUArchState *env, abi_ptr addr);
|
2014-03-28 19:11:26 +01:00
|
|
|
|
2019-12-11 20:25:10 +01:00
|
|
|
/*
 * Signed 8-bit "code" load: the cpu_ldub_code() result is converted
 * to int8_t and then widened to int.
 */
static inline int cpu_ldsb_code(CPUArchState *env, abi_ptr addr)
{
    const int8_t byte = (int8_t)cpu_ldub_code(env, addr);

    return byte;
}
|
2014-03-28 19:11:26 +01:00
|
|
|
|
2019-12-11 20:25:10 +01:00
|
|
|
/*
 * Signed 16-bit "code" load: the cpu_lduw_code() result is converted
 * to int16_t and then widened to int.
 */
static inline int cpu_ldsw_code(CPUArchState *env, abi_ptr addr)
{
    const int16_t half = (int16_t)cpu_lduw_code(env, addr);

    return half;
}
|
2014-03-28 19:11:26 +01:00
|
|
|
|
|
|
|
/**
|
|
|
|
* tlb_vaddr_to_host:
|
|
|
|
* @env: CPUArchState
|
|
|
|
* @addr: guest virtual address to look up
|
|
|
|
* @access_type: 0 for read, 1 for write, 2 for execute
|
|
|
|
* @mmu_idx: MMU index to use for lookup
|
|
|
|
*
|
|
|
|
* Look up the specified guest virtual address in the TCG softmmu TLB.
|
2019-04-03 05:16:56 +02:00
|
|
|
* If it can be translated to a host virtual address suitable for direct RAM
|
|
|
|
* access, without causing a guest exception, then return it.
|
|
|
|
* Otherwise (TLB entry is for an I/O access, guest software
|
|
|
|
* TLB fill required, etc) return NULL.
|
2014-03-28 19:11:26 +01:00
|
|
|
*/
|
2019-04-03 05:16:56 +02:00
|
|
|
#ifdef CONFIG_USER_ONLY
|
2018-08-14 19:12:17 +02:00
|
|
|
static inline void *tlb_vaddr_to_host(CPUArchState *env, abi_ptr addr,
|
2019-04-03 05:16:56 +02:00
|
|
|
MMUAccessType access_type, int mmu_idx)
|
2014-03-28 19:11:26 +01:00
|
|
|
{
|
2021-02-12 19:48:43 +01:00
|
|
|
return g2h(env_cpu(env), addr);
|
2015-06-13 00:45:49 +02:00
|
|
|
}
|
2019-04-03 05:16:56 +02:00
|
|
|
#else
|
|
|
|
void *tlb_vaddr_to_host(CPUArchState *env, abi_ptr addr,
|
|
|
|
MMUAccessType access_type, int mmu_idx);
|
|
|
|
#endif
|
2014-03-28 19:11:26 +01:00
|
|
|
|
2014-03-28 19:42:10 +01:00
|
|
|
#endif /* CPU_LDST_H */
|