mirror of
https://github.com/Motorhead1991/qemu.git
synced 2025-08-11 03:24:58 -06:00
target/riscv: rvv: Add tail agnostic for vector reduction instructions
Signed-off-by: eop Chen <eop.chen@sifive.com> Reviewed-by: Frank Chang <frank.chang@sifive.com> Reviewed-by: Weiwei Li <liweiwei@iscas.ac.cn> Acked-by: Alistair Francis <alistair.francis@wdc.com> Message-Id: <165449614532.19704.7000832880482980398-13@git.sr.ht> Signed-off-by: Alistair Francis <alistair.francis@wdc.com>
This commit is contained in:
parent
5eacf7d8a0
commit
df4f52a758
1 changed files with 20 additions and 0 deletions
|
@ -4535,6 +4535,9 @@ void HELPER(NAME)(void *vd, void *v0, void *vs1, \
|
||||||
{ \
|
{ \
|
||||||
uint32_t vm = vext_vm(desc); \
|
uint32_t vm = vext_vm(desc); \
|
||||||
uint32_t vl = env->vl; \
|
uint32_t vl = env->vl; \
|
||||||
|
uint32_t esz = sizeof(TD); \
|
||||||
|
uint32_t vlenb = simd_maxsz(desc); \
|
||||||
|
uint32_t vta = vext_vta(desc); \
|
||||||
uint32_t i; \
|
uint32_t i; \
|
||||||
TD s1 = *((TD *)vs1 + HD(0)); \
|
TD s1 = *((TD *)vs1 + HD(0)); \
|
||||||
\
|
\
|
||||||
|
@ -4547,6 +4550,8 @@ void HELPER(NAME)(void *vd, void *v0, void *vs1, \
|
||||||
} \
|
} \
|
||||||
*((TD *)vd + HD(0)) = s1; \
|
*((TD *)vd + HD(0)) = s1; \
|
||||||
env->vstart = 0; \
|
env->vstart = 0; \
|
||||||
|
/* set tail elements to 1s */ \
|
||||||
|
vext_set_elems_1s(vd, vta, esz, vlenb); \
|
||||||
}
|
}
|
||||||
|
|
||||||
/* vd[0] = sum(vs1[0], vs2[*]) */
|
/* vd[0] = sum(vs1[0], vs2[*]) */
|
||||||
|
@ -4616,6 +4621,9 @@ void HELPER(NAME)(void *vd, void *v0, void *vs1, \
|
||||||
{ \
|
{ \
|
||||||
uint32_t vm = vext_vm(desc); \
|
uint32_t vm = vext_vm(desc); \
|
||||||
uint32_t vl = env->vl; \
|
uint32_t vl = env->vl; \
|
||||||
|
uint32_t esz = sizeof(TD); \
|
||||||
|
uint32_t vlenb = simd_maxsz(desc); \
|
||||||
|
uint32_t vta = vext_vta(desc); \
|
||||||
uint32_t i; \
|
uint32_t i; \
|
||||||
TD s1 = *((TD *)vs1 + HD(0)); \
|
TD s1 = *((TD *)vs1 + HD(0)); \
|
||||||
\
|
\
|
||||||
|
@ -4628,6 +4636,8 @@ void HELPER(NAME)(void *vd, void *v0, void *vs1, \
|
||||||
} \
|
} \
|
||||||
*((TD *)vd + HD(0)) = s1; \
|
*((TD *)vd + HD(0)) = s1; \
|
||||||
env->vstart = 0; \
|
env->vstart = 0; \
|
||||||
|
/* set tail elements to 1s */ \
|
||||||
|
vext_set_elems_1s(vd, vta, esz, vlenb); \
|
||||||
}
|
}
|
||||||
|
|
||||||
/* Unordered sum */
|
/* Unordered sum */
|
||||||
|
@ -4652,6 +4662,9 @@ void HELPER(vfwredsum_vs_h)(void *vd, void *v0, void *vs1,
|
||||||
{
|
{
|
||||||
uint32_t vm = vext_vm(desc);
|
uint32_t vm = vext_vm(desc);
|
||||||
uint32_t vl = env->vl;
|
uint32_t vl = env->vl;
|
||||||
|
uint32_t esz = sizeof(uint32_t);
|
||||||
|
uint32_t vlenb = simd_maxsz(desc);
|
||||||
|
uint32_t vta = vext_vta(desc);
|
||||||
uint32_t i;
|
uint32_t i;
|
||||||
uint32_t s1 = *((uint32_t *)vs1 + H4(0));
|
uint32_t s1 = *((uint32_t *)vs1 + H4(0));
|
||||||
|
|
||||||
|
@ -4665,6 +4678,8 @@ void HELPER(vfwredsum_vs_h)(void *vd, void *v0, void *vs1,
|
||||||
}
|
}
|
||||||
*((uint32_t *)vd + H4(0)) = s1;
|
*((uint32_t *)vd + H4(0)) = s1;
|
||||||
env->vstart = 0;
|
env->vstart = 0;
|
||||||
|
/* set tail elements to 1s */
|
||||||
|
vext_set_elems_1s(vd, vta, esz, vlenb);
|
||||||
}
|
}
|
||||||
|
|
||||||
void HELPER(vfwredsum_vs_w)(void *vd, void *v0, void *vs1,
|
void HELPER(vfwredsum_vs_w)(void *vd, void *v0, void *vs1,
|
||||||
|
@ -4672,6 +4687,9 @@ void HELPER(vfwredsum_vs_w)(void *vd, void *v0, void *vs1,
|
||||||
{
|
{
|
||||||
uint32_t vm = vext_vm(desc);
|
uint32_t vm = vext_vm(desc);
|
||||||
uint32_t vl = env->vl;
|
uint32_t vl = env->vl;
|
||||||
|
uint32_t esz = sizeof(uint64_t);
|
||||||
|
uint32_t vlenb = simd_maxsz(desc);
|
||||||
|
uint32_t vta = vext_vta(desc);
|
||||||
uint32_t i;
|
uint32_t i;
|
||||||
uint64_t s1 = *((uint64_t *)vs1);
|
uint64_t s1 = *((uint64_t *)vs1);
|
||||||
|
|
||||||
|
@ -4685,6 +4703,8 @@ void HELPER(vfwredsum_vs_w)(void *vd, void *v0, void *vs1,
|
||||||
}
|
}
|
||||||
*((uint64_t *)vd) = s1;
|
*((uint64_t *)vd) = s1;
|
||||||
env->vstart = 0;
|
env->vstart = 0;
|
||||||
|
/* set tail elements to 1s */
|
||||||
|
vext_set_elems_1s(vd, vta, esz, vlenb);
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue