2013-09-03 21:12:03 +02:00
|
|
|
#ifndef TARGET_ARM_TRANSLATE_H
|
|
|
|
#define TARGET_ARM_TRANSLATE_H
|
|
|
|
|
2023-04-02 05:38:32 +02:00
|
|
|
#include "cpu.h"
|
|
|
|
#include "tcg/tcg-op.h"
|
|
|
|
#include "tcg/tcg-op-gvec.h"
|
2023-04-02 06:12:50 +02:00
|
|
|
#include "exec/exec-all.h"
|
2017-07-14 10:21:37 +02:00
|
|
|
#include "exec/translator.h"
|
2023-03-29 20:41:03 +02:00
|
|
|
#include "exec/helper-gen.h"
|
2019-08-15 10:46:42 +02:00
|
|
|
#include "internals.h"
|
2017-07-14 10:21:37 +02:00
|
|
|
|
|
|
|
|
2013-09-03 21:12:03 +02:00
|
|
|
/* internal defines */
|
2022-10-20 05:06:41 +02:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Save pc_save across a branch, so that we may restore the value from
|
|
|
|
* before the branch at the point the label is emitted.
|
|
|
|
*/
|
|
|
|
typedef struct DisasLabel {
|
|
|
|
TCGLabel *label;
|
|
|
|
target_ulong pc_save;
|
|
|
|
} DisasLabel;
|
|
|
|
|
2013-09-03 21:12:03 +02:00
|
|
|
typedef struct DisasContext {
|
2017-07-14 11:01:59 +02:00
|
|
|
DisasContextBase base;
|
2018-10-24 08:50:16 +02:00
|
|
|
const ARMISARegisters *isar;
|
2017-07-14 11:01:59 +02:00
|
|
|
|
2019-08-15 10:46:43 +02:00
|
|
|
/* The address of the current instruction being translated. */
|
|
|
|
target_ulong pc_curr;
|
2022-10-20 05:06:41 +02:00
|
|
|
/*
|
2023-02-27 14:51:41 +01:00
|
|
|
* For CF_PCREL, the full value of cpu_pc is not known
|
2022-10-20 05:06:41 +02:00
|
|
|
* (although the page offset is known). For convenience, the
|
|
|
|
* translation loop uses the full virtual address that triggered
|
|
|
|
* the translation, from base.pc_start through pc_curr.
|
|
|
|
* For efficiency, we do not update cpu_pc for every instruction.
|
|
|
|
* Instead, pc_save has the value of pc_curr at the time of the
|
|
|
|
* last update to cpu_pc, which allows us to compute the addend
|
|
|
|
* needed to bring cpu_pc current: pc_curr - pc_save.
|
|
|
|
* If cpu_pc now contains the destination of an indirect branch,
|
|
|
|
* pc_save contains -1 to indicate that relative updates are no
|
|
|
|
* longer possible.
|
|
|
|
*/
|
|
|
|
target_ulong pc_save;
|
2018-04-10 17:09:52 +02:00
|
|
|
target_ulong page_start;
|
2013-09-03 21:12:10 +02:00
|
|
|
uint32_t insn;
|
2013-09-03 21:12:03 +02:00
|
|
|
/* Nonzero if this instruction has been conditionally skipped. */
|
|
|
|
int condjmp;
|
|
|
|
/* The label that will be jumped to when the instruction is skipped. */
|
2022-10-20 05:06:41 +02:00
|
|
|
DisasLabel condlabel;
|
2013-09-03 21:12:03 +02:00
|
|
|
/* Thumb-2 conditional execution bits. */
|
|
|
|
int condexec_mask;
|
|
|
|
int condexec_cond;
|
target/arm: Add handling for PSR.ECI/ICI
On A-profile, PSR bits [15:10][26:25] are always the IT state bits.
On M-profile, some of the reserved encodings of the IT state are used
to instead indicate partial progress through instructions that were
interrupted partway through by an exception and can be resumed.
These resumable instructions fall into two categories:
(1) load/store multiple instructions, where these bits are called
"ICI" and specify the register in the ldm/stm list where execution
should resume. (Specifically: LDM, STM, VLDM, VSTM, VLLDM, VLSTM,
CLRM, VSCCLRM.)
(2) MVE instructions subject to beatwise execution, where these bits
are called "ECI" and specify which beats in this and possibly also
the following MVE insn have been executed.
There are also a few insns (LE, LETP, and BKPT) which do not use the
ICI/ECI bits but must leave them alone.
Otherwise, we should raise an INVSTATE UsageFault for any attempt to
execute an insn with non-zero ICI/ECI bits.
So far we have been able to ignore ECI/ICI, because the architecture
allows the IMPDEF choice of "always restart load/store multiple from
the beginning regardless of ICI state", so the only thing we have
been missing is that we don't raise the INVSTATE fault for bad guest
code. However, MVE requires that we honour ECI bits and do not
rexecute beats of an insn that have already been executed.
Add the support in the decoder for handling ECI/ICI:
* identify the ECI/ICI case in the CONDEXEC TB flags
* when a load/store multiple insn succeeds, it updates the ECI/ICI
state (both in DisasContext and in the CPU state), and sets a flag
to say that the ECI/ICI state was handled
* if we find that the insn we just decoded did not handle the
ECI/ICI state, we delete all the code that we just generated for
it and instead emit the code to raise the INVFAULT. This allows
us to avoid having to update every non-MVE non-LDM/STM insn to
make it check for "is ECI/ICI set?".
We continue with our existing IMPDEF choice of not caring about the
ICI state for the load/store multiples and simply restarting them
from the beginning. Because we don't allow interrupts in the middle
of an insn, the only way we would see this state is if the guest set
ICI manually on return from an exception handler, so it's a corner
case which doesn't merit optimisation.
ICI update for LDM/STM is simple -- it always zeroes the state. ECI
update for MVE beatwise insns will be a little more complex, since
the ECI state may include information for the following insn.
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
Message-id: 20210614151007.4545-5-peter.maydell@linaro.org
2021-06-14 17:09:14 +02:00
|
|
|
/* M-profile ECI/ICI exception-continuable instruction state */
|
|
|
|
int eci;
|
|
|
|
/*
|
|
|
|
* trans_ functions for insns which are continuable should set this true
|
|
|
|
* after decode (ie after any UNDEF checks)
|
|
|
|
*/
|
|
|
|
bool eci_handled;
|
2016-03-04 12:30:19 +01:00
|
|
|
int sctlr_b;
|
2019-08-23 20:10:58 +02:00
|
|
|
MemOp be_data;
|
2013-09-03 21:12:03 +02:00
|
|
|
#if !defined(CONFIG_USER_ONLY)
|
|
|
|
int user;
|
|
|
|
#endif
|
2015-02-05 14:37:23 +01:00
|
|
|
ARMMMUIdx mmu_idx; /* MMU index to use for normal loads/stores */
|
2019-02-05 17:52:39 +01:00
|
|
|
uint8_t tbii; /* TBI1|TBI0 for insns */
|
|
|
|
uint8_t tbid; /* TBI1|TBI0 for data */
|
2020-06-26 05:31:06 +02:00
|
|
|
uint8_t tcma; /* TCMA1|TCMA0 for MTE */
|
2014-12-11 13:07:48 +01:00
|
|
|
bool ns; /* Use non-secure CPREG bank on access */
|
2015-05-29 12:28:53 +02:00
|
|
|
int fp_excp_el; /* FP exception EL or 0 if enabled */
|
2018-01-23 04:53:49 +01:00
|
|
|
int sve_excp_el; /* SVE exception EL or 0 if enabled */
|
2022-06-20 19:51:46 +02:00
|
|
|
int sme_excp_el; /* SME exception EL or 0 if enabled */
|
2022-06-08 20:38:54 +02:00
|
|
|
int vl; /* current vector length in bytes */
|
2022-06-20 19:52:03 +02:00
|
|
|
int svl; /* current streaming vector length in bytes */
|
2014-04-15 20:18:39 +02:00
|
|
|
bool vfp_enabled; /* FP enabled via FPSCR.EN */
|
2013-09-03 21:12:03 +02:00
|
|
|
int vec_len;
|
|
|
|
int vec_stride;
|
2017-04-20 18:32:31 +02:00
|
|
|
bool v7m_handler_mode;
|
2017-09-07 14:54:54 +02:00
|
|
|
bool v8m_secure; /* true if v8M and we're in Secure mode */
|
2018-10-08 15:55:04 +02:00
|
|
|
bool v8m_stackcheck; /* true if we need to perform v8M stack limit checks */
|
2019-04-29 18:36:01 +02:00
|
|
|
bool v8m_fpccr_s_wrong; /* true if v8M FPCCR.S != v8m_secure */
|
2019-04-29 18:36:01 +02:00
|
|
|
bool v7m_new_fp_ctxt_needed; /* ASPEN set but no active FP context */
|
2019-04-29 18:36:02 +02:00
|
|
|
bool v7m_lspact; /* FPCCR.LSPACT set */
|
2014-04-15 20:18:38 +02:00
|
|
|
/* Immediate value in AArch32 SVC insn; must be set if is_jmp == DISAS_SWI
|
|
|
|
* so that top level loop can generate correct syndrome information.
|
|
|
|
*/
|
|
|
|
uint32_t svc_imm;
|
2014-10-24 13:19:14 +02:00
|
|
|
int current_el;
|
2014-01-04 23:15:44 +01:00
|
|
|
GHashTable *cp_regs;
|
2014-03-17 17:31:47 +01:00
|
|
|
uint64_t features; /* CPU features bits */
|
2022-04-17 19:43:31 +02:00
|
|
|
bool aarch64;
|
2022-04-17 19:43:34 +02:00
|
|
|
bool thumb;
|
2023-06-06 11:19:35 +02:00
|
|
|
bool lse2;
|
2014-04-15 20:18:40 +02:00
|
|
|
/* Because unallocated encodings generate different exception syndrome
|
|
|
|
* information from traps due to FP being disabled, we can't do a single
|
|
|
|
* "is fp access disabled" check at a high level in the decode tree.
|
|
|
|
* To help in catching bugs where the access check was forgotten in some
|
|
|
|
* code path, we set this flag when the access check is done, and assert
|
|
|
|
* that it is set at the point where we actually touch the FP regs.
|
|
|
|
*/
|
|
|
|
bool fp_access_checked;
|
2020-08-28 11:02:47 +02:00
|
|
|
bool sve_access_checked;
|
2014-08-19 19:56:26 +02:00
|
|
|
/* ARMv8 single-step state (this is distinct from the QEMU gdbstub
|
|
|
|
* single-step support).
|
|
|
|
*/
|
|
|
|
bool ss_active;
|
|
|
|
bool pstate_ss;
|
|
|
|
/* True if the insn just emitted was a load-exclusive instruction
|
|
|
|
* (necessary for syndrome information for single step exceptions),
|
|
|
|
* ie A64 LDX*, LDAX*, A32/T32 LDREX*, LDAEX*.
|
|
|
|
*/
|
|
|
|
bool is_ldex;
|
2020-02-07 15:04:26 +01:00
|
|
|
/* True if AccType_UNPRIV should be used for LDTR et al */
|
|
|
|
bool unpriv;
|
2019-01-21 11:23:11 +01:00
|
|
|
/* True if v8.3-PAuth is active. */
|
|
|
|
bool pauth_active;
|
2020-06-26 05:31:06 +02:00
|
|
|
/* True if v8.5-MTE access to tags is enabled. */
|
|
|
|
bool ata;
|
|
|
|
/* True if v8.5-MTE tag checks affect the PE; index with is_unpriv. */
|
|
|
|
bool mte_active[2];
|
2019-02-05 17:52:36 +01:00
|
|
|
/* True with v8.5-BTI and SCTLR_ELx.BT* set. */
|
|
|
|
bool bt;
|
2019-12-01 13:20:17 +01:00
|
|
|
/* True if any CP15 access is trapped by HSTR_EL2 */
|
|
|
|
bool hstr_active;
|
2021-04-19 22:22:36 +02:00
|
|
|
/* True if memory operations require alignment */
|
|
|
|
bool align_mem;
|
2021-09-13 17:07:24 +02:00
|
|
|
/* True if PSTATE.IL is set */
|
|
|
|
bool pstate_il;
|
2022-06-20 19:51:52 +02:00
|
|
|
/* True if PSTATE.SM is set. */
|
|
|
|
bool pstate_sm;
|
|
|
|
/* True if PSTATE.ZA is set. */
|
|
|
|
bool pstate_za;
|
2022-07-08 17:14:58 +02:00
|
|
|
/* True if non-streaming insns should raise an SME Streaming exception. */
|
|
|
|
bool sme_trap_nonstreaming;
|
|
|
|
/* True if the current instruction is non-streaming. */
|
|
|
|
bool is_nonstreaming;
|
2021-09-13 11:54:31 +02:00
|
|
|
/* True if MVE insns are definitely not predicated by VPR or LTPSIZE */
|
|
|
|
bool mve_no_pred;
|
2023-01-30 19:24:45 +01:00
|
|
|
/* True if fine-grained traps are active */
|
|
|
|
bool fgt_active;
|
2023-01-30 19:24:56 +01:00
|
|
|
/* True if fine-grained trap on ERET is enabled */
|
|
|
|
bool fgt_eret;
|
2023-01-30 19:24:57 +01:00
|
|
|
/* True if fine-grained trap on SVC is enabled */
|
|
|
|
bool fgt_svc;
|
2019-02-05 17:52:37 +01:00
|
|
|
/*
|
|
|
|
* >= 0, a copy of PSTATE.BTYPE, which will be 0 without v8.5-BTI.
|
|
|
|
* < 0, set by the current instruction.
|
|
|
|
*/
|
|
|
|
int8_t btype;
|
2020-06-26 05:31:17 +02:00
|
|
|
/* A copy of cpu->dcz_blocksize. */
|
|
|
|
uint8_t dcz_blocksize;
|
2019-02-05 17:52:37 +01:00
|
|
|
/* True if this page is guarded. */
|
|
|
|
bool guarded_page;
|
2014-09-29 19:48:48 +02:00
|
|
|
/* Bottom two bits of XScale c15_cpar coprocessor access control reg */
|
|
|
|
int c15_cpar;
|
2017-11-02 15:19:14 +01:00
|
|
|
/* TCG op of the current insn_start. */
|
|
|
|
TCGOp *insn_start;
|
2013-09-03 21:12:03 +02:00
|
|
|
} DisasContext;
|
|
|
|
|
2015-09-14 15:39:47 +02:00
|
|
|
typedef struct DisasCompare {
|
|
|
|
TCGCond cond;
|
|
|
|
TCGv_i32 value;
|
|
|
|
} DisasCompare;
|
|
|
|
|
2015-09-14 15:39:47 +02:00
|
|
|
/* Share the TCG temporaries common between 32 and 64 bit modes. */
|
|
|
|
extern TCGv_i32 cpu_NF, cpu_ZF, cpu_CF, cpu_VF;
|
|
|
|
extern TCGv_i64 cpu_exclusive_addr;
|
|
|
|
extern TCGv_i64 cpu_exclusive_val;
|
2013-09-03 21:12:04 +02:00
|
|
|
|
2021-04-30 15:27:28 +02:00
|
|
|
/*
|
|
|
|
* Constant expanders for the decoders.
|
|
|
|
*/
|
|
|
|
|
|
|
|
/* Decoder constant expander: return the negation of @x (@s is unused). */
static inline int negate(DisasContext *s, int x)
{
    return -x;
}
|
|
|
|
|
2021-06-17 14:16:03 +02:00
|
|
|
/* Decoder constant expander: return @x + 1 (@s is unused). */
static inline int plus_1(DisasContext *s, int x)
{
    return 1 + x;
}
|
|
|
|
|
2021-04-30 15:27:28 +02:00
|
|
|
/* Decoder constant expander: return @x + 2 (@s is unused). */
static inline int plus_2(DisasContext *s, int x)
{
    return 2 + x;
}
|
|
|
|
|
2022-07-08 17:15:14 +02:00
|
|
|
/* Decoder constant expander: return @x + 12 (@s is unused). */
static inline int plus_12(DisasContext *s, int x)
{
    return 12 + x;
}
|
|
|
|
|
2021-04-30 15:27:28 +02:00
|
|
|
/* Decoder constant expander: return @x multiplied by 2 (@s is unused). */
static inline int times_2(DisasContext *s, int x)
{
    return 2 * x;
}
|
|
|
|
|
|
|
|
/* Decoder constant expander: return @x multiplied by 4 (@s is unused). */
static inline int times_4(DisasContext *s, int x)
{
    return 4 * x;
}
|
|
|
|
|
2021-06-17 14:16:03 +02:00
|
|
|
/* Decoder constant expander: return 2 * @x + 1 (@s is unused). */
static inline int times_2_plus_1(DisasContext *s, int x)
{
    return 2 * x + 1;
}
|
|
|
|
|
2021-06-28 15:58:25 +02:00
|
|
|
/* Decoder constant expander: reverse-subtract, return 64 - @x (@s is unused). */
static inline int rsub_64(DisasContext *s, int x)
{
    return 64 - x;
}
|
|
|
|
|
|
|
|
/* Decoder constant expander: reverse-subtract, return 32 - @x (@s is unused). */
static inline int rsub_32(DisasContext *s, int x)
{
    return 32 - x;
}
|
|
|
|
|
|
|
|
/* Decoder constant expander: reverse-subtract, return 16 - @x (@s is unused). */
static inline int rsub_16(DisasContext *s, int x)
{
    return 16 - x;
}
|
|
|
|
|
|
|
|
/* Decoder constant expander: reverse-subtract, return 8 - @x (@s is unused). */
static inline int rsub_8(DisasContext *s, int x)
{
    return 8 - x;
}
|
|
|
|
|
2023-05-12 16:40:52 +02:00
|
|
|
/* Decoder constant expander: return @x shifted left by 12 bits (@s is unused). */
static inline int shl_12(DisasContext *s, int x)
{
    return x << 12;
}
|
|
|
|
|
2021-09-01 10:02:34 +02:00
|
|
|
/*
 * Decoder constant expander: map the encoded size @x to a MO_* value,
 * where 0 means fp32 and 1 means fp16.  The result is MO_32 - @x.
 */
static inline int neon_3same_fp_size(DisasContext *s, int x)
{
    return MO_32 - x;
}
|
|
|
|
|
2014-03-17 17:31:47 +01:00
|
|
|
/*
 * Test bit number @feature of the dc->features bitmask.
 * Returns 1 if the bit is set, 0 otherwise.
 */
static inline int arm_dc_feature(DisasContext *dc, int feature)
{
    const uint64_t feature_bit = 1ULL << feature;

    return (dc->features & feature_bit) != 0;
}
|
|
|
|
|
2014-05-27 18:09:50 +02:00
|
|
|
/*
 * Return s->mmu_idx (the MMU index used for normal loads/stores)
 * converted by arm_to_core_mmu_idx().
 */
static inline int get_mem_index(DisasContext *s)
{
    ARMMMUIdx arm_idx = s->mmu_idx;

    return arm_to_core_mmu_idx(arm_idx);
}
|
|
|
|
|
2018-01-25 12:45:28 +01:00
|
|
|
/*
 * Record syndrome value @syn as parameter 2 of the current insn_start op.
 *
 * May be called at most once per insn_start: s->insn_start is cleared
 * afterwards and asserted non-NULL on entry.
 */
static inline void disas_set_insn_syndrome(DisasContext *s, uint32_t syn)
{
    /*
     * Not all of the syndrome needs saving, so mask and shift out the
     * unneeded bits to help the sleb128 encoder do a better job.
     */
    syn = (syn & ARM_INSN_START_WORD2_MASK) >> ARM_INSN_START_WORD2_SHIFT;

    /* Check and then clear insn_start to catch multiple updates. */
    assert(s->insn_start != NULL);
    tcg_set_insn_start_param(s->insn_start, 2, syn);
    s->insn_start = NULL;
}
|
|
|
|
|
2022-10-20 05:06:33 +02:00
|
|
|
/*
 * Return the distance from s->pc_curr (the instruction currently being
 * translated) to s->base.pc_next.
 */
static inline int curr_insn_len(DisasContext *s)
{
    return s->base.pc_next - s->pc_curr;
}
|
|
|
|
|
2017-07-14 10:21:37 +02:00
|
|
|
/* is_jmp field values */
|
|
|
|
#define DISAS_JUMP DISAS_TARGET_0 /* only pc was modified dynamically */
|
2020-06-26 05:31:03 +02:00
|
|
|
/* CPU state was modified dynamically; exit to main loop for interrupts. */
|
|
|
|
#define DISAS_UPDATE_EXIT DISAS_TARGET_1
|
2013-12-17 20:42:31 +01:00
|
|
|
/* These instructions trap after executing, so the A32/T32 decoder must
|
|
|
|
* defer them until after the conditional execution state has been updated.
|
|
|
|
* WFI also needs special handling when single-stepping.
|
|
|
|
*/
|
2017-07-14 10:21:37 +02:00
|
|
|
#define DISAS_WFI DISAS_TARGET_2
|
|
|
|
#define DISAS_SWI DISAS_TARGET_3
|
2014-03-10 15:56:30 +01:00
|
|
|
/* WFE */
|
2017-07-14 10:21:37 +02:00
|
|
|
#define DISAS_WFE DISAS_TARGET_4
|
|
|
|
#define DISAS_HVC DISAS_TARGET_5
|
|
|
|
#define DISAS_SMC DISAS_TARGET_6
|
|
|
|
#define DISAS_YIELD DISAS_TARGET_7
|
arm: Implement M profile exception return properly
On M profile, return from exceptions happen when code in Handler mode
executes one of the following function call return instructions:
* POP or LDM which loads the PC
* LDR to PC
* BX register
and the new PC value is 0xFFxxxxxx.
QEMU tries to implement this by not treating the instruction
specially but then catching the attempt to execute from the magic
address value. This is not ideal, because:
* there are guest visible differences from the architecturally
specified behaviour (for instance jumping to 0xFFxxxxxx via a
different instruction should not cause an exception return but it
will in the QEMU implementation)
* we have to account for it in various places (like refusing to take
an interrupt if the PC is at a magic value, and making sure that
the MPU doesn't deny execution at the magic value addresses)
Drop these hacks, and instead implement exception return the way the
architecture specifies -- by having the relevant instructions check
for the magic value and raise the 'do an exception return' QEMU
internal exception immediately.
The effect on the generated code is minor:
bx lr, old code (and new code for Thread mode):
TCG:
mov_i32 tmp5,r14
movi_i32 tmp6,$0xfffffffffffffffe
and_i32 pc,tmp5,tmp6
movi_i32 tmp6,$0x1
and_i32 tmp5,tmp5,tmp6
st_i32 tmp5,env,$0x218
exit_tb $0x0
set_label $L0
exit_tb $0x7f2aabd61993
x86_64 generated code:
0x7f2aabe87019: mov %ebx,%ebp
0x7f2aabe8701b: and $0xfffffffffffffffe,%ebp
0x7f2aabe8701e: mov %ebp,0x3c(%r14)
0x7f2aabe87022: and $0x1,%ebx
0x7f2aabe87025: mov %ebx,0x218(%r14)
0x7f2aabe8702c: xor %eax,%eax
0x7f2aabe8702e: jmpq 0x7f2aabe7c016
bx lr, new code when in Handler mode:
TCG:
mov_i32 tmp5,r14
movi_i32 tmp6,$0xfffffffffffffffe
and_i32 pc,tmp5,tmp6
movi_i32 tmp6,$0x1
and_i32 tmp5,tmp5,tmp6
st_i32 tmp5,env,$0x218
movi_i32 tmp5,$0xffffffffff000000
brcond_i32 pc,tmp5,geu,$L1
exit_tb $0x0
set_label $L1
movi_i32 tmp5,$0x8
call exception_internal,$0x0,$0,env,tmp5
x86_64 generated code:
0x7fe8fa1264e3: mov %ebp,%ebx
0x7fe8fa1264e5: and $0xfffffffffffffffe,%ebx
0x7fe8fa1264e8: mov %ebx,0x3c(%r14)
0x7fe8fa1264ec: and $0x1,%ebp
0x7fe8fa1264ef: mov %ebp,0x218(%r14)
0x7fe8fa1264f6: cmp $0xff000000,%ebx
0x7fe8fa1264fc: jae 0x7fe8fa126509
0x7fe8fa126502: xor %eax,%eax
0x7fe8fa126504: jmpq 0x7fe8fa122016
0x7fe8fa126509: mov %r14,%rdi
0x7fe8fa12650c: mov $0x8,%esi
0x7fe8fa126511: mov $0x56095dbeccf5,%r10
0x7fe8fa12651b: callq *%r10
which is a difference of one cmp/branch-not-taken. This will
be lost in the noise of having to exit generated code and
look up the next TB anyway.
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
Reviewed-by: Richard Henderson <rth@twiddle.net>
Reviewed-by: Philippe Mathieu-Daudé <f4bug@amsat.org>
Message-id: 1491844419-12485-9-git-send-email-peter.maydell@linaro.org
2017-04-20 18:32:31 +02:00
|
|
|
/* M profile branch which might be an exception return (and so needs
|
|
|
|
* custom end-of-TB code)
|
|
|
|
*/
|
2017-07-14 10:21:37 +02:00
|
|
|
#define DISAS_BX_EXCRET DISAS_TARGET_8
|
2020-06-26 05:31:03 +02:00
|
|
|
/*
|
|
|
|
* For instructions which want an immediate exit to the main loop, as opposed
|
|
|
|
* to attempting to use lookup_and_goto_ptr. Unlike DISAS_UPDATE_EXIT, this
|
|
|
|
* doesn't write the PC on exiting the translation loop so you need to ensure
|
2022-10-20 05:06:35 +02:00
|
|
|
* something (gen_a64_update_pc or runtime helper) has done so before we reach
|
2020-06-26 05:31:03 +02:00
|
|
|
* return from cpu_tb_exec.
|
2017-04-27 05:29:20 +02:00
|
|
|
*/
|
2017-07-14 10:21:37 +02:00
|
|
|
#define DISAS_EXIT DISAS_TARGET_9
|
2020-06-26 05:31:04 +02:00
|
|
|
/* CPU state was modified dynamically; no need to exit, but do not chain. */
|
|
|
|
#define DISAS_UPDATE_NOCHAIN DISAS_TARGET_10
|
2013-12-17 20:42:31 +01:00
|
|
|
|
2013-09-03 21:12:10 +02:00
|
|
|
#ifdef TARGET_AARCH64
|
|
|
|
void a64_translate_init(void);
|
2022-10-20 05:06:35 +02:00
|
|
|
void gen_a64_update_pc(DisasContext *s, target_long diff);
|
2017-07-14 11:58:33 +02:00
|
|
|
extern const TranslatorOps aarch64_translator_ops;
|
2013-09-03 21:12:10 +02:00
|
|
|
#else
|
|
|
|
/* Empty stand-in used when TARGET_AARCH64 is not defined. */
static inline void a64_translate_init(void)
{
    /* Nothing to do without AArch64 support. */
}
|
|
|
|
|
2022-10-20 05:06:35 +02:00
|
|
|
/* Empty stand-in used when TARGET_AARCH64 is not defined; arguments are ignored. */
static inline void gen_a64_update_pc(DisasContext *s, target_long diff)
{
    /* Nothing to do without AArch64 support. */
}
|
|
|
|
#endif
|
|
|
|
|
2015-09-14 15:39:47 +02:00
|
|
|
void arm_test_cc(DisasCompare *cmp, int cc);
|
|
|
|
void arm_jump_cc(DisasCompare *cmp, TCGLabel *label);
|
2015-02-13 21:51:55 +01:00
|
|
|
void arm_gen_test_cc(int cc, TCGLabel *label);
|
2021-04-19 22:22:48 +02:00
|
|
|
MemOp pow2_align(unsigned i);
|
2021-04-30 15:27:29 +02:00
|
|
|
void unallocated_encoding(DisasContext *s);
|
2022-10-20 05:06:36 +02:00
|
|
|
void gen_exception_insn_el(DisasContext *s, target_long pc_diff, int excp,
|
2022-06-10 15:32:32 +02:00
|
|
|
uint32_t syn, uint32_t target_el);
|
2022-10-20 05:06:36 +02:00
|
|
|
void gen_exception_insn(DisasContext *s, target_long pc_diff,
|
|
|
|
int excp, uint32_t syn);
|
2013-12-17 20:42:33 +01:00
|
|
|
|
2018-05-07 14:17:16 +02:00
|
|
|
/* Return state of Alternate Half-precision flag, caller frees result */
|
|
|
|
static inline TCGv_i32 get_ahp_flag(void)
|
|
|
|
{
|
|
|
|
TCGv_i32 ret = tcg_temp_new_i32();
|
|
|
|
|
|
|
|
tcg_gen_ld_i32(ret, cpu_env,
|
|
|
|
offsetof(CPUARMState, vfp.xregs[ARM_VFP_FPSCR]));
|
|
|
|
tcg_gen_extract_i32(ret, ret, 26, 1);
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2019-03-01 21:04:56 +01:00
|
|
|
/* Set bits within PSTATE. */
|
|
|
|
static inline void set_pstate_bits(uint32_t bits)
|
|
|
|
{
|
|
|
|
TCGv_i32 p = tcg_temp_new_i32();
|
|
|
|
|
|
|
|
tcg_debug_assert(!(bits & CACHED_PSTATE_BITS));
|
|
|
|
|
|
|
|
tcg_gen_ld_i32(p, cpu_env, offsetof(CPUARMState, pstate));
|
|
|
|
tcg_gen_ori_i32(p, p, bits);
|
|
|
|
tcg_gen_st_i32(p, cpu_env, offsetof(CPUARMState, pstate));
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Clear bits within PSTATE. */
|
|
|
|
static inline void clear_pstate_bits(uint32_t bits)
|
|
|
|
{
|
|
|
|
TCGv_i32 p = tcg_temp_new_i32();
|
|
|
|
|
|
|
|
tcg_debug_assert(!(bits & CACHED_PSTATE_BITS));
|
|
|
|
|
|
|
|
tcg_gen_ld_i32(p, cpu_env, offsetof(CPUARMState, pstate));
|
|
|
|
tcg_gen_andi_i32(p, p, ~bits);
|
|
|
|
tcg_gen_st_i32(p, cpu_env, offsetof(CPUARMState, pstate));
|
|
|
|
}
|
|
|
|
|
|
|
|
/* If the singlestep state is Active-not-pending, advance to Active-pending. */
|
|
|
|
static inline void gen_ss_advance(DisasContext *s)
|
|
|
|
{
|
|
|
|
if (s->ss_active) {
|
|
|
|
s->pstate_ss = 0;
|
|
|
|
clear_pstate_bits(PSTATE_SS);
|
|
|
|
}
|
|
|
|
}
|
2018-10-24 08:50:19 +02:00
|
|
|
|
2019-08-15 10:46:42 +02:00
|
|
|
/* Generate an architectural singlestep exception */
|
|
|
|
static inline void gen_swstep_exception(DisasContext *s, int isv, int ex)
|
|
|
|
{
|
2022-06-10 15:32:32 +02:00
|
|
|
/* Fill in the same_el field of the syndrome in the helper. */
|
|
|
|
uint32_t syn = syn_swstep(false, isv, ex);
|
|
|
|
gen_helper_exception_swstep(cpu_env, tcg_constant_i32(syn));
|
2019-08-15 10:46:42 +02:00
|
|
|
}
|
|
|
|
|
2019-06-13 18:39:06 +02:00
|
|
|
/*
|
|
|
|
* Given a VFP floating point constant encoded into an 8 bit immediate in an
|
|
|
|
* instruction, expand it to the actual constant value of the specified
|
|
|
|
* size, as per the VFPExpandImm() pseudocode in the Arm ARM.
|
|
|
|
*/
|
|
|
|
uint64_t vfp_expand_imm(int size, uint8_t imm8);
|
|
|
|
|
2018-10-24 08:50:19 +02:00
|
|
|
/* Vector operations shared between ARM and AArch64. */
|
2020-05-13 18:32:35 +02:00
|
|
|
void gen_gvec_ceq0(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_clt0(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_cgt0(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_cle0(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_cge0(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
|
2020-05-13 18:32:36 +02:00
|
|
|
void gen_gvec_mla(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_mls(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
|
2020-05-13 18:32:38 +02:00
|
|
|
void gen_gvec_cmtst(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_sshl(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_ushl(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
|
2018-10-24 08:50:20 +02:00
|
|
|
void gen_cmtst_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
|
2020-02-16 22:42:29 +01:00
|
|
|
void gen_ushl_i32(TCGv_i32 d, TCGv_i32 a, TCGv_i32 b);
|
|
|
|
void gen_sshl_i32(TCGv_i32 d, TCGv_i32 a, TCGv_i32 b);
|
|
|
|
void gen_ushl_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
|
|
|
|
void gen_sshl_i64(TCGv_i64 d, TCGv_i64 a, TCGv_i64 b);
|
2018-10-24 08:50:19 +02:00
|
|
|
|
2020-05-13 18:32:39 +02:00
|
|
|
void gen_gvec_uqadd_qc(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_sqadd_qc(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_uqsub_qc(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_sqsub_qc(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
|
2020-05-13 18:32:30 +02:00
|
|
|
void gen_gvec_ssra(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
int64_t shift, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_usra(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
int64_t shift, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
|
2020-05-13 18:32:31 +02:00
|
|
|
void gen_gvec_srshr(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
int64_t shift, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_urshr(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
int64_t shift, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_srsra(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
int64_t shift, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_ursra(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
int64_t shift, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
|
2020-05-13 18:32:32 +02:00
|
|
|
void gen_gvec_sri(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
int64_t shift, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_sli(unsigned vece, uint32_t rd_ofs, uint32_t rm_ofs,
|
|
|
|
int64_t shift, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
|
2020-05-13 18:32:41 +02:00
|
|
|
void gen_gvec_sqrdmlah_qc(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_sqrdmlsh_qc(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
|
2020-05-13 18:32:44 +02:00
|
|
|
void gen_gvec_sabd(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_uabd(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
|
2020-05-13 18:32:45 +02:00
|
|
|
void gen_gvec_saba(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
void gen_gvec_uaba(unsigned vece, uint32_t rd_ofs, uint32_t rn_ofs,
|
|
|
|
uint32_t rm_ofs, uint32_t opr_sz, uint32_t max_sz);
|
|
|
|
|
2018-10-24 08:50:16 +02:00
|
|
|
/*
 * Forward to the isar_feature_* tests given a DisasContext pointer.
 *
 * Expands to a call of isar_feature_<name>() on the context's isar
 * field.  @ctx is evaluated exactly once.
 */
#define dc_isar_feature(name, ctx)                  \
    ({                                              \
        DisasContext *ctx_ = (ctx);                 \
        isar_feature_##name(ctx_->isar);            \
    })
|
|
|
|
|
2020-04-30 20:09:41 +02:00
|
|
|
/* Note that the gvec expanders operate on offsets + sizes. */
|
|
|
|
typedef void GVecGen2Fn(unsigned, uint32_t, uint32_t, uint32_t, uint32_t);
|
|
|
|
typedef void GVecGen2iFn(unsigned, uint32_t, uint32_t, int64_t,
|
|
|
|
uint32_t, uint32_t);
|
|
|
|
typedef void GVecGen3Fn(unsigned, uint32_t, uint32_t,
|
|
|
|
uint32_t, uint32_t, uint32_t);
|
|
|
|
typedef void GVecGen4Fn(unsigned, uint32_t, uint32_t, uint32_t,
|
|
|
|
uint32_t, uint32_t, uint32_t);
|
|
|
|
|
2020-04-30 20:09:49 +02:00
|
|
|
/* Function prototype for gen_ functions for calling Neon helpers */
|
2020-06-16 19:08:35 +02:00
|
|
|
typedef void NeonGenOneOpFn(TCGv_i32, TCGv_i32);
|
2020-04-30 20:09:49 +02:00
|
|
|
typedef void NeonGenOneOpEnvFn(TCGv_i32, TCGv_ptr, TCGv_i32);
|
|
|
|
typedef void NeonGenTwoOpFn(TCGv_i32, TCGv_i32, TCGv_i32);
|
|
|
|
typedef void NeonGenTwoOpEnvFn(TCGv_i32, TCGv_ptr, TCGv_i32, TCGv_i32);
|
2021-04-30 15:27:38 +02:00
|
|
|
typedef void NeonGenThreeOpEnvFn(TCGv_i32, TCGv_env, TCGv_i32,
|
|
|
|
TCGv_i32, TCGv_i32);
|
2020-04-30 20:09:49 +02:00
|
|
|
typedef void NeonGenTwo64OpFn(TCGv_i64, TCGv_i64, TCGv_i64);
|
|
|
|
typedef void NeonGenTwo64OpEnvFn(TCGv_i64, TCGv_ptr, TCGv_i64, TCGv_i64);
|
|
|
|
typedef void NeonGenNarrowFn(TCGv_i32, TCGv_i64);
|
|
|
|
typedef void NeonGenNarrowEnvFn(TCGv_i32, TCGv_ptr, TCGv_i64);
|
|
|
|
typedef void NeonGenWidenFn(TCGv_i64, TCGv_i32);
|
2020-06-16 11:32:25 +02:00
|
|
|
typedef void NeonGenTwoOpWidenFn(TCGv_i64, TCGv_i32, TCGv_i32);
|
2020-06-16 19:08:38 +02:00
|
|
|
typedef void NeonGenOneSingleOpFn(TCGv_i32, TCGv_i32, TCGv_ptr);
|
2020-06-16 19:08:33 +02:00
|
|
|
typedef void NeonGenTwoSingleOpFn(TCGv_i32, TCGv_i32, TCGv_i32, TCGv_ptr);
|
|
|
|
typedef void NeonGenTwoDoubleOpFn(TCGv_i64, TCGv_i64, TCGv_i64, TCGv_ptr);
|
2020-06-16 19:08:32 +02:00
|
|
|
typedef void NeonGenOne64OpFn(TCGv_i64, TCGv_i64);
|
2020-04-30 20:09:49 +02:00
|
|
|
typedef void CryptoTwoOpFn(TCGv_ptr, TCGv_ptr);
|
|
|
|
typedef void CryptoThreeOpIntFn(TCGv_ptr, TCGv_ptr, TCGv_i32);
|
|
|
|
typedef void CryptoThreeOpFn(TCGv_ptr, TCGv_ptr, TCGv_ptr);
|
|
|
|
typedef void AtomicThreeOpFn(TCGv_i64, TCGv_i64, TCGv_i64, TCGArg, MemOp);
|
target/arm: Implement MVE long shifts by immediate
The MVE extension to v8.1M includes some new shift instructions which
sit entirely within the non-coprocessor part of the encoding space
and which operate only on general-purpose registers. They take up
the space which was previously UNPREDICTABLE MOVS and ORRS encodings
with Rm == 13 or 15.
Implement the long shifts by immediate, which perform shifts on a
pair of general-purpose registers treated as a 64-bit quantity, with
an immediate shift count between 1 and 32.
Awkwardly, because the MOVS and ORRS trans functions do not UNDEF for
the Rm==13,15 case, we need to explicitly emit code to UNDEF for the
cases where v8.1M now requires that. (Trying to change MOVS and ORRS
is too difficult, because the functions that generate the code are
shared between a dozen different kinds of arithmetic or logical
instruction for all A32, T16 and T32 encodings, and for some insns
and some encodings Rm==13,15 are valid.)
We make the helper functions we need for UQSHLL and SQSHLL take
a 32-bit value which the helper casts to int8_t because we'll need
these helpers also for the shift-by-register insns, where the shift
count might be < 0 or > 32.
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
Message-id: 20210628135835.6690-16-peter.maydell@linaro.org
2021-06-28 15:58:32 +02:00
|
|
|
typedef void WideShiftImmFn(TCGv_i64, TCGv_i64, int64_t shift);
|
2021-06-28 15:58:33 +02:00
|
|
|
typedef void WideShiftFn(TCGv_i64, TCGv_ptr, TCGv_i64, TCGv_i32);
|
2021-06-28 15:58:34 +02:00
|
|
|
typedef void ShiftImmFn(TCGv_i32, TCGv_i32, int32_t shift);
|
2021-06-28 15:58:35 +02:00
|
|
|
typedef void ShiftFn(TCGv_i32, TCGv_ptr, TCGv_i32, TCGv_i32);
|
2020-04-30 20:09:49 +02:00
|
|
|
|
2021-04-19 22:22:31 +02:00
|
|
|
/**
|
|
|
|
* arm_tbflags_from_tb:
|
|
|
|
* @tb: the TranslationBlock
|
|
|
|
*
|
|
|
|
* Extract the flag values from @tb.
|
|
|
|
*/
|
|
|
|
static inline CPUARMTBFlags arm_tbflags_from_tb(const TranslationBlock *tb)
|
|
|
|
{
|
2021-04-19 22:22:32 +02:00
|
|
|
return (CPUARMTBFlags){ tb->flags, tb->cs_base };
|
2021-04-19 22:22:31 +02:00
|
|
|
}
|
|
|
|
|
target/arm: Replace A64 get_fpstatus_ptr() with generic fpstatus_ptr()
We currently have two versions of get_fpstatus_ptr(), which both take
an effectively boolean argument:
* the one for A64 takes "bool is_f16" to distinguish fp16 from other ops
* the one for A32/T32 takes "int neon" to distinguish Neon from other ops
This is confusing, and to implement ARMv8.2-FP16 the A32/T32 one will
need to make a four-way distinction between "non-Neon, FP16",
"non-Neon, single/double", "Neon, FP16" and "Neon, single/double".
The A64 version will then be a strict subset of the A32/T32 version.
To clean this all up, we want to go to a single implementation which
takes an enum argument with values FPST_FPCR, FPST_STD,
FPST_FPCR_F16, and FPST_STD_F16. We rename the function to
fpstatus_ptr() so that unconverted code gets a compilation error
rather than silently passing the wrong thing to the new function.
This commit implements that new API, and converts A64 to use it:
get_fpstatus_ptr(false) -> fpstatus_ptr(FPST_FPCR)
get_fpstatus_ptr(true) -> fpstatus_ptr(FPST_FPCR_F16)
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Message-id: 20200806104453.30393-2-peter.maydell@linaro.org
2020-08-06 12:44:50 +02:00
|
|
|
/*
 * Selector passed to fpstatus_ptr() to choose which float_status field
 * of the CPU state the returned pointer refers to.
 */
typedef enum ARMFPStatusFlavour {
    /* Non-FP16 operations controlled by the FPCR. */
    FPST_FPCR,
    /* Operations controlled by the FPCR where FPCR.FZ16 is to be used. */
    FPST_FPCR_F16,
    /* A32/T32 Neon operations using the "standard FPSCR value". */
    FPST_STD,
    /* As FPST_STD, but where FPCR.FZ16 is to be used. */
    FPST_STD_F16,
} ARMFPStatusFlavour;
|
|
|
|
|
|
|
|
/**
|
|
|
|
* fpstatus_ptr: return TCGv_ptr to the specified fp_status field
|
|
|
|
*
|
|
|
|
* We have multiple softfloat float_status fields in the Arm CPU state struct
|
|
|
|
* (see the comment in cpu.h for details). Return a TCGv_ptr which has
|
|
|
|
* been set up to point to the requested field in the CPU state struct.
|
|
|
|
* The options are:
|
|
|
|
*
|
|
|
|
* FPST_FPCR
|
|
|
|
* for non-FP16 operations controlled by the FPCR
|
|
|
|
* FPST_FPCR_F16
|
|
|
|
* for operations controlled by the FPCR where FPCR.FZ16 is to be used
|
|
|
|
* FPST_STD
|
|
|
|
* for A32/T32 Neon operations using the "standard FPSCR value"
|
|
|
|
* FPST_STD_F16
|
|
|
|
* as FPST_STD, but where FPCR.FZ16 is to be used
|
|
|
|
*/
|
|
|
|
static inline TCGv_ptr fpstatus_ptr(ARMFPStatusFlavour flavour)
|
|
|
|
{
|
|
|
|
TCGv_ptr statusptr = tcg_temp_new_ptr();
|
|
|
|
int offset;
|
|
|
|
|
|
|
|
switch (flavour) {
|
|
|
|
case FPST_FPCR:
|
|
|
|
offset = offsetof(CPUARMState, vfp.fp_status);
|
|
|
|
break;
|
|
|
|
case FPST_FPCR_F16:
|
|
|
|
offset = offsetof(CPUARMState, vfp.fp_status_f16);
|
|
|
|
break;
|
|
|
|
case FPST_STD:
|
|
|
|
offset = offsetof(CPUARMState, vfp.standard_fp_status);
|
|
|
|
break;
|
|
|
|
case FPST_STD_F16:
|
2020-08-06 12:44:52 +02:00
|
|
|
offset = offsetof(CPUARMState, vfp.standard_fp_status_f16);
|
|
|
|
break;
|
target/arm: Replace A64 get_fpstatus_ptr() with generic fpstatus_ptr()
We currently have two versions of get_fpstatus_ptr(), which both take
an effectively boolean argument:
* the one for A64 takes "bool is_f16" to distinguish fp16 from other ops
* the one for A32/T32 takes "int neon" to distinguish Neon from other ops
This is confusing, and to implement ARMv8.2-FP16 the A32/T32 one will
need to make a four-way distinction between "non-Neon, FP16",
"non-Neon, single/double", "Neon, FP16" and "Neon, single/double".
The A64 version will then be a strict subset of the A32/T32 version.
To clean this all up, we want to go to a single implementation which
takes an enum argument with values FPST_FPCR, FPST_STD,
FPST_FPCR_F16, and FPST_STD_F16. We rename the function to
fpstatus_ptr() so that unconverted code gets a compilation error
rather than silently passing the wrong thing to the new function.
This commit implements that new API, and converts A64 to use it:
get_fpstatus_ptr(false) -> fpstatus_ptr(FPST_FPCR)
get_fpstatus_ptr(true) -> fpstatus_ptr(FPST_FPCR_F16)
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
Reviewed-by: Alex Bennée <alex.bennee@linaro.org>
Message-id: 20200806104453.30393-2-peter.maydell@linaro.org
2020-08-06 12:44:50 +02:00
|
|
|
default:
|
|
|
|
g_assert_not_reached();
|
|
|
|
}
|
|
|
|
tcg_gen_addi_ptr(statusptr, cpu_env, offset);
|
|
|
|
return statusptr;
|
|
|
|
}
|
|
|
|
|
2021-04-19 22:22:37 +02:00
|
|
|
/**
|
2023-06-06 11:19:35 +02:00
|
|
|
* finalize_memop_atom:
|
2021-04-19 22:22:37 +02:00
|
|
|
* @s: DisasContext
|
|
|
|
* @opc: size+sign+align of the memory operation
|
2023-06-06 11:19:35 +02:00
|
|
|
* @atom: atomicity of the memory operation
|
2021-04-19 22:22:37 +02:00
|
|
|
*
|
2023-06-06 11:19:35 +02:00
|
|
|
* Build the complete MemOp for a memory operation, including alignment,
|
|
|
|
* endianness, and atomicity.
|
2021-04-19 22:22:37 +02:00
|
|
|
*
|
|
|
|
* If (op & MO_AMASK) then the operation already contains the required
|
|
|
|
* alignment, e.g. for AccType_ATOMIC. Otherwise, this an optionally
|
|
|
|
* unaligned operation, e.g. for AccType_NORMAL.
|
|
|
|
*
|
|
|
|
* In the latter case, there are configuration bits that require alignment,
|
|
|
|
* and this is applied here. Note that there is no way to indicate that
|
|
|
|
* no alignment should ever be enforced; this must be handled manually.
|
|
|
|
*/
|
2023-06-06 11:19:35 +02:00
|
|
|
static inline MemOp finalize_memop_atom(DisasContext *s, MemOp opc, MemOp atom)
|
2021-04-19 22:22:37 +02:00
|
|
|
{
|
|
|
|
if (s->align_mem && !(opc & MO_AMASK)) {
|
|
|
|
opc |= MO_ALIGN;
|
|
|
|
}
|
2023-06-06 11:19:35 +02:00
|
|
|
return opc | atom | s->be_data;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* finalize_memop:
|
|
|
|
* @s: DisasContext
|
|
|
|
* @opc: size+sign+align of the memory operation
|
|
|
|
*
|
|
|
|
* Like finalize_memop_atom, but with default atomicity.
|
|
|
|
*/
|
|
|
|
static inline MemOp finalize_memop(DisasContext *s, MemOp opc)
|
|
|
|
{
|
|
|
|
MemOp atom = s->lse2 ? MO_ATOM_WITHIN16 : MO_ATOM_IFALIGN;
|
|
|
|
return finalize_memop_atom(s, opc, atom);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* finalize_memop_pair:
|
|
|
|
* @s: DisasContext
|
|
|
|
* @opc: size+sign+align of the memory operation
|
|
|
|
*
|
|
|
|
* Like finalize_memop_atom, but with atomicity for a pair.
|
|
|
|
* C.f. Pseudocode for Mem[], operand ispair.
|
|
|
|
*/
|
|
|
|
static inline MemOp finalize_memop_pair(DisasContext *s, MemOp opc)
|
|
|
|
{
|
|
|
|
MemOp atom = s->lse2 ? MO_ATOM_WITHIN16_PAIR : MO_ATOM_IFALIGN_PAIR;
|
|
|
|
return finalize_memop_atom(s, opc, atom);
|
2021-04-19 22:22:37 +02:00
|
|
|
}
|
|
|
|
|
2021-06-28 15:58:20 +02:00
|
|
|
/**
 * asimd_imm_const: Expand an encoded SIMD constant value
 * @imm: the encoded immediate
 * @cmode: the cmode field of the encoding
 * @op: the op field of the encoding
 *
 * Returns the expanded 64-bit constant.  This is essentially the
 * pseudocode AdvSIMDExpandImm, with one addition: the boolean NOT
 * needed for VMVN and VBIC (when cmode < 14 && op == 1) is also
 * performed here.
 *
 * Notes for callers:
 *  - cmode == 15 with op == 1 is a reserved encoding for AArch32 and
 *    must be caught by the caller; for that combination this function
 *    returns the 64-bit constant value defined for AArch64.
 *  - cmode = 2,3,4,5,6,7,10,11,12,13 with imm == 0 was UNPREDICTABLE in
 *    v7A but is either not unpredictable or merely CONSTRAINED
 *    UNPREDICTABLE in v8A; an immediate constant value of 0 is produced
 *    in these cases.
 */
uint64_t asimd_imm_const(uint32_t imm, int cmode, int op);
|
|
|
|
|
2022-10-20 05:06:41 +02:00
|
|
|
/*
|
|
|
|
* gen_disas_label:
|
|
|
|
* Create a label and cache a copy of pc_save.
|
|
|
|
*/
|
|
|
|
static inline DisasLabel gen_disas_label(DisasContext *s)
|
|
|
|
{
|
|
|
|
return (DisasLabel){
|
|
|
|
.label = gen_new_label(),
|
|
|
|
.pc_save = s->pc_save,
|
|
|
|
};
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* set_disas_label:
|
|
|
|
* Emit a label and restore the cached copy of pc_save.
|
|
|
|
*/
|
|
|
|
static inline void set_disas_label(DisasContext *s, DisasLabel l)
|
|
|
|
{
|
|
|
|
gen_set_label(l.label);
|
|
|
|
s->pc_save = l.pc_save;
|
|
|
|
}
|
|
|
|
|
target/arm: Look up ARMCPRegInfo at runtime
Do not encode the pointer as a constant in the opcode stream.
This pointer is specific to the cpu that first generated the
translation, which runs into problems with both hot-pluggable
cpus and user-only threads, as cpus are removed. It's also a
potential correctness issue in the theoretical case of a
slightly heterogeneous system, because if CPU 0 generates a
TB and then CPU 1 executes it, CPU 1 will end up using CPU 0's
hash table, which might have a wrong set of registers in it.
(All our current systems are either completely homogeneous,
M-profile, or have CPUs sufficiently different that they
wouldn't be sharing TBs anyway because the differences would
show up in the TB flags, so the correctness issue is only
theoretical, not practical.)
Perform the lookup in either helper_access_check_cp_reg,
or a new helper_lookup_cp_reg.
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
Message-id: 20230106194451.1213153-3-richard.henderson@linaro.org
[PMM: added note in commit message about correctness issue]
Reviewed-by: Peter Maydell <peter.maydell@linaro.org>
Signed-off-by: Peter Maydell <peter.maydell@linaro.org>
2023-01-06 20:44:51 +01:00
|
|
|
static inline TCGv_ptr gen_lookup_cp_reg(uint32_t key)
|
|
|
|
{
|
|
|
|
TCGv_ptr ret = tcg_temp_new_ptr();
|
|
|
|
gen_helper_lookup_cp_reg(ret, cpu_env, tcg_constant_i32(key));
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2023-02-25 22:06:53 +01:00
|
|
|
/*
|
|
|
|
* Set and reset rounding mode around another operation.
|
|
|
|
*/
|
|
|
|
static inline TCGv_i32 gen_set_rmode(ARMFPRounding rmode, TCGv_ptr fpst)
|
|
|
|
{
|
|
|
|
TCGv_i32 new = tcg_constant_i32(arm_rmode_to_sf(rmode));
|
|
|
|
TCGv_i32 old = tcg_temp_new_i32();
|
|
|
|
|
|
|
|
gen_helper_set_rmode(old, new, fpst);
|
|
|
|
return old;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * gen_restore_rmode:
 * Counterpart of gen_set_rmode().  Emits a call to the set_rmode helper
 * on @fpst using @old (the temporary returned by gen_set_rmode) as the
 * mode to install; @old is also used as the helper's output operand.
 */
static inline void gen_restore_rmode(TCGv_i32 old, TCGv_ptr fpst)
{
    gen_helper_set_rmode(old, old, fpst);
}
|
|
|
|
|
2022-05-27 20:17:14 +02:00
|
|
|
/*
 * Helpers for implementing sets of trans_* functions.
 *
 * TRANS(NAME, FUNC, ...) defines trans_NAME(s, a) as a call to
 * FUNC(s, ...), forwarding the optional extra arguments.
 *
 * TRANS_FEAT(NAME, FEAT, FUNC, ...) does the same, except that
 * trans_NAME returns false without calling FUNC when
 * dc_isar_feature(FEAT, s) is false.
 */
#define TRANS(NAME, FUNC, ...)                                      \
    static bool trans_##NAME(DisasContext *s, arg_##NAME *a)        \
    {                                                               \
        return FUNC(s, __VA_ARGS__);                                \
    }
#define TRANS_FEAT(NAME, FEAT, FUNC, ...)                           \
    static bool trans_##NAME(DisasContext *s, arg_##NAME *a)        \
    {                                                               \
        if (!dc_isar_feature(FEAT, s)) {                            \
            return false;                                           \
        }                                                           \
        return FUNC(s, __VA_ARGS__);                                \
    }
|
|
|
|
|
2022-07-08 17:14:59 +02:00
|
|
|
/*
 * TRANS_FEAT_NONSTREAMING(NAME, FEAT, FUNC, ...) defines trans_NAME(s, a)
 * like a feature-gated deferral to FUNC(s, ...), but first sets
 * s->is_nonstreaming to true.  The flag is set unconditionally, before
 * the dc_isar_feature(FEAT, s) check is made.
 */
#define TRANS_FEAT_NONSTREAMING(NAME, FEAT, FUNC, ...)              \
    static bool trans_##NAME(DisasContext *s, arg_##NAME *a)        \
    {                                                               \
        s->is_nonstreaming = true;                                  \
        if (!dc_isar_feature(FEAT, s)) {                            \
            return false;                                           \
        }                                                           \
        return FUNC(s, __VA_ARGS__);                                \
    }
|
|
|
|
|
2013-09-03 21:12:03 +02:00
|
|
|
#endif /* TARGET_ARM_TRANSLATE_H */
|