target/arm/vec_helper: Handle oprsz less than 16 bytes in indexed operations
In the gvec helper functions for indexed operations, for AArch32 Neon the oprsz (total size of the vector) can be less than 16 bytes if the operation is on a D reg. Since the inner loop in these helpers always goes from 0 to segment, we must clamp it based on oprsz to avoid processing a full 16 byte segment when asked to handle an 8 byte wide vector. Signed-off-by: Peter Maydell <peter.maydell@linaro.org> Reviewed-by: Richard Henderson <richard.henderson@linaro.org> Message-id: 20200828183354.27913-43-peter.maydell@linaro.org
This commit is contained in:
parent
23afcdd251
commit
d7ce81e553
@ -1040,7 +1040,8 @@ DO_MULADD(gvec_vfms_s, float32_mulsub_f, float32)
|
||||
#define DO_MUL_IDX(NAME, TYPE, H) \
|
||||
void HELPER(NAME)(void *vd, void *vn, void *vm, uint32_t desc) \
|
||||
{ \
|
||||
intptr_t i, j, oprsz = simd_oprsz(desc), segment = 16 / sizeof(TYPE); \
|
||||
intptr_t i, j, oprsz = simd_oprsz(desc); \
|
||||
intptr_t segment = MIN(16, oprsz) / sizeof(TYPE); \
|
||||
intptr_t idx = simd_data(desc); \
|
||||
TYPE *d = vd, *n = vn, *m = vm; \
|
||||
for (i = 0; i < oprsz / sizeof(TYPE); i += segment) { \
|
||||
@ -1061,7 +1062,8 @@ DO_MUL_IDX(gvec_mul_idx_d, uint64_t, )
|
||||
#define DO_MLA_IDX(NAME, TYPE, OP, H) \
|
||||
void HELPER(NAME)(void *vd, void *vn, void *vm, void *va, uint32_t desc) \
|
||||
{ \
|
||||
intptr_t i, j, oprsz = simd_oprsz(desc), segment = 16 / sizeof(TYPE); \
|
||||
intptr_t i, j, oprsz = simd_oprsz(desc); \
|
||||
intptr_t segment = MIN(16, oprsz) / sizeof(TYPE); \
|
||||
intptr_t idx = simd_data(desc); \
|
||||
TYPE *d = vd, *n = vn, *m = vm, *a = va; \
|
||||
for (i = 0; i < oprsz / sizeof(TYPE); i += segment) { \
|
||||
@ -1086,7 +1088,8 @@ DO_MLA_IDX(gvec_mls_idx_d, uint64_t, -, )
|
||||
#define DO_FMUL_IDX(NAME, TYPE, H) \
|
||||
void HELPER(NAME)(void *vd, void *vn, void *vm, void *stat, uint32_t desc) \
|
||||
{ \
|
||||
intptr_t i, j, oprsz = simd_oprsz(desc), segment = 16 / sizeof(TYPE); \
|
||||
intptr_t i, j, oprsz = simd_oprsz(desc); \
|
||||
intptr_t segment = MIN(16, oprsz) / sizeof(TYPE); \
|
||||
intptr_t idx = simd_data(desc); \
|
||||
TYPE *d = vd, *n = vn, *m = vm; \
|
||||
for (i = 0; i < oprsz / sizeof(TYPE); i += segment) { \
|
||||
@ -1108,7 +1111,8 @@ DO_FMUL_IDX(gvec_fmul_idx_d, float64, )
|
||||
void HELPER(NAME)(void *vd, void *vn, void *vm, void *va, \
|
||||
void *stat, uint32_t desc) \
|
||||
{ \
|
||||
intptr_t i, j, oprsz = simd_oprsz(desc), segment = 16 / sizeof(TYPE); \
|
||||
intptr_t i, j, oprsz = simd_oprsz(desc); \
|
||||
intptr_t segment = MIN(16, oprsz) / sizeof(TYPE); \
|
||||
TYPE op1_neg = extract32(desc, SIMD_DATA_SHIFT, 1); \
|
||||
intptr_t idx = desc >> (SIMD_DATA_SHIFT + 1); \
|
||||
TYPE *d = vd, *n = vn, *m = vm, *a = va; \
|
||||
|
Loading…
Reference in New Issue
Block a user