target/loongarch: Implement xvsllwil xvextl

This patch includes:
- XVSLLWIL.{H.B/W.H/D.W};
- XVSLLWIL.{HU.BU/WU.HU/DU.WU};
- XVEXTL.Q.D, VEXTL.QU.DU.

Signed-off-by: Song Gao <gaosong@loongson.cn>
Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
Message-Id: <20230914022645.1151356-37-gaosong@loongson.cn>
This commit is contained in:
Song Gao 2023-09-14 10:26:24 +08:00
parent ad6dc7189a
commit 6567eac7f7
No known key found for this signature in database
GPG key ID: 40A2FFF239263EDF
4 changed files with 63 additions and 21 deletions

View file

@ -2077,6 +2077,15 @@ INSN_LASX(xvrotri_h, vv_i)
INSN_LASX(xvrotri_w, vv_i) INSN_LASX(xvrotri_w, vv_i)
INSN_LASX(xvrotri_d, vv_i) INSN_LASX(xvrotri_d, vv_i)
INSN_LASX(xvsllwil_h_b, vv_i)
INSN_LASX(xvsllwil_w_h, vv_i)
INSN_LASX(xvsllwil_d_w, vv_i)
INSN_LASX(xvextl_q_d, vv)
INSN_LASX(xvsllwil_hu_bu, vv_i)
INSN_LASX(xvsllwil_wu_hu, vv_i)
INSN_LASX(xvsllwil_du_wu, vv_i)
INSN_LASX(xvextl_qu_du, vv)
INSN_LASX(xvreplgr2vr_b, vr) INSN_LASX(xvreplgr2vr_b, vr)
INSN_LASX(xvreplgr2vr_h, vr) INSN_LASX(xvreplgr2vr_h, vr)
INSN_LASX(xvreplgr2vr_w, vr) INSN_LASX(xvreplgr2vr_w, vr)

View file

@ -164,6 +164,10 @@ static bool gen_xx(DisasContext *ctx, arg_vv *a, gen_helper_gvec_2 *fn)
static bool gen_vv_i_vl(DisasContext *ctx, arg_vv_i *a, uint32_t oprsz, static bool gen_vv_i_vl(DisasContext *ctx, arg_vv_i *a, uint32_t oprsz,
gen_helper_gvec_2i *fn) gen_helper_gvec_2i *fn)
{ {
if (!check_vec(ctx, oprsz)) {
return true;
}
tcg_gen_gvec_2i_ool(vec_full_offset(a->vd), tcg_gen_gvec_2i_ool(vec_full_offset(a->vd),
vec_full_offset(a->vj), vec_full_offset(a->vj),
tcg_constant_i64(a->imm), tcg_constant_i64(a->imm),
@ -173,11 +177,12 @@ static bool gen_vv_i_vl(DisasContext *ctx, arg_vv_i *a, uint32_t oprsz,
static bool gen_vv_i(DisasContext *ctx, arg_vv_i *a, gen_helper_gvec_2i *fn) static bool gen_vv_i(DisasContext *ctx, arg_vv_i *a, gen_helper_gvec_2i *fn)
{ {
if (!check_vec(ctx, 16)) { return gen_vv_i_vl(ctx, a, 16, fn);
return true;
} }
return gen_vv_i_vl(ctx, a, 16, fn); static bool gen_xx_i(DisasContext *ctx, arg_vv_i *a, gen_helper_gvec_2i *fn)
{
return gen_vv_i_vl(ctx, a, 32, fn);
} }
static bool gen_cv(DisasContext *ctx, arg_cv *a, static bool gen_cv(DisasContext *ctx, arg_cv *a,
@ -3717,6 +3722,14 @@ TRANS(vsllwil_hu_bu, LSX, gen_vv_i, gen_helper_vsllwil_hu_bu)
TRANS(vsllwil_wu_hu, LSX, gen_vv_i, gen_helper_vsllwil_wu_hu) TRANS(vsllwil_wu_hu, LSX, gen_vv_i, gen_helper_vsllwil_wu_hu)
TRANS(vsllwil_du_wu, LSX, gen_vv_i, gen_helper_vsllwil_du_wu) TRANS(vsllwil_du_wu, LSX, gen_vv_i, gen_helper_vsllwil_du_wu)
TRANS(vextl_qu_du, LSX, gen_vv, gen_helper_vextl_qu_du) TRANS(vextl_qu_du, LSX, gen_vv, gen_helper_vextl_qu_du)
TRANS(xvsllwil_h_b, LASX, gen_xx_i, gen_helper_vsllwil_h_b)
TRANS(xvsllwil_w_h, LASX, gen_xx_i, gen_helper_vsllwil_w_h)
TRANS(xvsllwil_d_w, LASX, gen_xx_i, gen_helper_vsllwil_d_w)
TRANS(xvextl_q_d, LASX, gen_xx, gen_helper_vextl_q_d)
TRANS(xvsllwil_hu_bu, LASX, gen_xx_i, gen_helper_vsllwil_hu_bu)
TRANS(xvsllwil_wu_hu, LASX, gen_xx_i, gen_helper_vsllwil_wu_hu)
TRANS(xvsllwil_du_wu, LASX, gen_xx_i, gen_helper_vsllwil_du_wu)
TRANS(xvextl_qu_du, LASX, gen_xx, gen_helper_vextl_qu_du)
TRANS(vsrlr_b, LSX, gen_vvv, gen_helper_vsrlr_b) TRANS(vsrlr_b, LSX, gen_vvv, gen_helper_vsrlr_b)
TRANS(vsrlr_h, LSX, gen_vvv, gen_helper_vsrlr_h) TRANS(vsrlr_h, LSX, gen_vvv, gen_helper_vsrlr_h)

View file

@ -1652,6 +1652,15 @@ xvrotri_h 0111 01101010 00000 1 .... ..... ..... @vv_ui4
xvrotri_w 0111 01101010 00001 ..... ..... ..... @vv_ui5 xvrotri_w 0111 01101010 00001 ..... ..... ..... @vv_ui5
xvrotri_d 0111 01101010 0001 ...... ..... ..... @vv_ui6 xvrotri_d 0111 01101010 0001 ...... ..... ..... @vv_ui6
xvsllwil_h_b 0111 01110000 10000 01 ... ..... ..... @vv_ui3
xvsllwil_w_h 0111 01110000 10000 1 .... ..... ..... @vv_ui4
xvsllwil_d_w 0111 01110000 10001 ..... ..... ..... @vv_ui5
xvextl_q_d 0111 01110000 10010 00000 ..... ..... @vv
xvsllwil_hu_bu 0111 01110000 11000 01 ... ..... ..... @vv_ui3
xvsllwil_wu_hu 0111 01110000 11000 1 .... ..... ..... @vv_ui4
xvsllwil_du_wu 0111 01110000 11001 ..... ..... ..... @vv_ui5
xvextl_qu_du 0111 01110000 11010 00000 ..... ..... @vv
xvreplgr2vr_b 0111 01101001 11110 00000 ..... ..... @vr xvreplgr2vr_b 0111 01101001 11110 00000 ..... ..... @vr
xvreplgr2vr_h 0111 01101001 11110 00001 ..... ..... @vr xvreplgr2vr_h 0111 01101001 11110 00001 ..... ..... @vr
xvreplgr2vr_w 0111 01101001 11110 00010 ..... ..... @vr xvreplgr2vr_w 0111 01101001 11110 00010 ..... ..... @vr

View file

@ -955,34 +955,45 @@ void HELPER(vnori_b)(void *vd, void *vj, uint64_t imm, uint32_t desc)
#define VSLLWIL(NAME, BIT, E1, E2) \ #define VSLLWIL(NAME, BIT, E1, E2) \
void HELPER(NAME)(void *vd, void *vj, uint64_t imm, uint32_t desc) \ void HELPER(NAME)(void *vd, void *vj, uint64_t imm, uint32_t desc) \
{ \ { \
int i; \ int i, j, ofs; \
VReg temp; \ VReg temp = {}; \
VReg *Vd = (VReg *)vd; \ VReg *Vd = (VReg *)vd; \
VReg *Vj = (VReg *)vj; \ VReg *Vj = (VReg *)vj; \
int oprsz = simd_oprsz(desc); \
typedef __typeof(temp.E1(0)) TD; \ typedef __typeof(temp.E1(0)) TD; \
\ \
temp.D(0) = 0; \ ofs = LSX_LEN / BIT; \
temp.D(1) = 0; \ for (i = 0; i < oprsz / 16; i++) { \
for (i = 0; i < LSX_LEN/BIT; i++) { \ for (j = 0; j < ofs; j++) { \
temp.E1(i) = (TD)Vj->E2(i) << (imm % BIT); \ temp.E1(j + ofs * i) = (TD)Vj->E2(j + ofs * 2 * i) << (imm % BIT); \
} \
} \ } \
*Vd = temp; \ *Vd = temp; \
} }
void HELPER(vextl_q_d)(void *vd, void *vj, uint32_t desc) void HELPER(vextl_q_d)(void *vd, void *vj, uint32_t desc)
{ {
int i;
VReg *Vd = (VReg *)vd; VReg *Vd = (VReg *)vd;
VReg *Vj = (VReg *)vj; VReg *Vj = (VReg *)vj;
int oprsz = simd_oprsz(desc);
Vd->Q(0) = int128_makes64(Vj->D(0)); for (i = 0; i < oprsz / 16; i++) {
Vd->Q(i) = int128_makes64(Vj->D(2 * i));
}
} }
void HELPER(vextl_qu_du)(void *vd, void *vj, uint32_t desc) void HELPER(vextl_qu_du)(void *vd, void *vj, uint32_t desc)
{ {
int i;
VReg *Vd = (VReg *)vd; VReg *Vd = (VReg *)vd;
VReg *Vj = (VReg *)vj; VReg *Vj = (VReg *)vj;
int oprsz = simd_oprsz(desc);
Vd->Q(0) = int128_make64(Vj->D(0)); for (i = 0; i < oprsz / 16; i++) {
Vd->Q(i) = int128_make64(Vj->UD(2 * i));
}
} }
VSLLWIL(vsllwil_h_b, 16, H, B) VSLLWIL(vsllwil_h_b, 16, H, B)