ILVR_D2_SH(fact3, fact1, fact7, fact5, fact1, fact3);
ILVR_B4_SH(zero, top0, zero, top1, zero, top2, zero, top3,
diff0, diff2, diff4, diff6);
- SLDI_B4_0_SH(diff0, diff2, diff4, diff6, diff1, diff3, diff5, diff7, 2);
+ SLDI_B4_SH(zero, diff0, zero, diff2, zero, diff4, zero, diff6, 2,
+ diff1, diff3, diff5, diff7);
ILVR_D2_SH(diff2, diff0, diff6, diff4, diff0, diff2);
ILVR_D2_SH(diff3, diff1, diff7, diff5, diff1, diff3);
MUL2(diff1, fact0, diff3, fact2, diff1, diff3);
UNPCK_UB_SH(top2, diff4, diff5);
UNPCK_UB_SH(top3, diff6, diff7);
- SLDI_B2_SH(diff1, diff3, diff0, diff2, diff1, diff3, 2);
- SLDI_B2_SH(diff5, diff7, diff4, diff6, diff5, diff7, 2);
+ SLDI_B4_SH(diff1, diff0, diff3, diff2, diff5, diff4, diff7, diff6, 2,
+ diff1, diff3, diff5, diff7);
MUL4(diff1, fact0, diff3, fact2, diff5, fact4, diff7, fact6,
diff1, diff3, diff5, diff7);
fact6 = __msa_fill_h(fact_val3);
fact7 = __msa_fill_h(32 - fact_val3);
- SLDI_B2_UB(top1, top3, top0, top2, top1, top3, 1);
- SLDI_B2_UB(top5, top7, top4, top6, top5, top7, 1);
+ SLDI_B4_UB(top1, top0, top3, top2, top5, top4, top7, top6, 1,
+ top1, top3, top5, top7);
UNPCK_UB_SH(top0, diff0, diff1);
UNPCK_UB_SH(top1, diff2, diff3);
UNPCK_UB_SH(top2, diff4, diff5);
top2 = top1;
top6 = top5;
- SLDI_B2_UB(top1, top3, top0, top2, top1, top3, 1);
- SLDI_B2_UB(top5, top7, top4, top6, top5, top7, 1);
+ SLDI_B4_UB(top1, top0, top3, top2, top5, top4, top7, top6, 1,
+ top1, top3, top5, top7);
UNPCK_UB_SH(top0, diff0, diff1);
UNPCK_UB_SH(top1, diff2, diff3);
UNPCK_UB_SH(top2, diff4, diff5);
ILVR_D2_SH(fact3, fact1, fact7, fact5, fact1, fact3);
ILVR_B4_SH(zero, top0, zero, top1, zero, top2, zero, top3,
diff0, diff2, diff4, diff6);
- SLDI_B4_0_SH(diff0, diff2, diff4, diff6, diff1, diff3, diff5, diff7, 2);
+ SLDI_B4_SH(zero, diff0, zero, diff2, zero, diff4, zero, diff6, 2,
+ diff1, diff3, diff5, diff7);
ILVR_D2_SH(diff2, diff0, diff6, diff4, diff0, diff2);
ILVR_D2_SH(diff3, diff1, diff7, diff5, diff1, diff3);
MUL2(diff1, fact0, diff3, fact2, diff1, diff3);
UNPCK_UB_SH(top1, diff2, diff3);
UNPCK_UB_SH(top2, diff4, diff5);
UNPCK_UB_SH(top3, diff6, diff7);
- SLDI_B2_SH(diff1, diff3, diff0, diff2, diff1, diff3, 2);
- SLDI_B2_SH(diff5, diff7, diff4, diff6, diff5, diff7, 2);
+ SLDI_B4_SH(diff1, diff0, diff3, diff2, diff5, diff4, diff7, diff6, 2,
+ diff1, diff3, diff5, diff7);
MUL4(diff1, fact0, diff3, fact2, diff5, fact4, diff7, fact6,
diff1, diff3, diff5, diff7);
fact6 = __msa_fill_h(fact_val3);
fact7 = __msa_fill_h(32 - fact_val3);
- SLDI_B2_SB(top1, top3, top0, top2, top1, top3, 1);
- SLDI_B2_SB(top5, top7, top4, top6, top5, top7, 1);
+ SLDI_B4_SB(top1, top0, top3, top2, top5, top4, top7, top6, 1,
+ top1, top3, top5, top7);
UNPCK_UB_SH(top0, diff0, diff1);
UNPCK_UB_SH(top1, diff2, diff3);
top2 = top1;
top6 = top5;
- SLDI_B2_SB(top1, top3, top0, top2, top1, top3, 1);
- SLDI_B2_SB(top5, top7, top4, top6, top5, top7, 1);
+ SLDI_B4_SB(top1, top0, top3, top2, top5, top4, top7, top6, 1,
+ top1, top3, top5, top7);
UNPCK_UB_SH(top0, diff0, diff1);
UNPCK_UB_SH(top1, diff2, diff3);