Lines Matching refs:out1
206 #define LW4(psrc, stride, out0, out1, out2, out3) \ argument
209 out1 = LW((psrc) + stride); \
214 #define LW2(psrc, stride, out0, out1) \ argument
217 out1 = LW((psrc) + stride); \
227 #define LD2(psrc, stride, out0, out1) \ argument
230 out1 = LD((psrc) + stride); \
232 #define LD4(psrc, stride, out0, out1, out2, out3) \ argument
234 LD2((psrc), stride, out0, out1); \
276 #define LD_V2(RTYPE, psrc, stride, out0, out1) \ argument
279 out1 = LD_V(RTYPE, (psrc) + stride); \
287 #define LD_V3(RTYPE, psrc, stride, out0, out1, out2) \ argument
289 LD_V2(RTYPE, (psrc), stride, out0, out1); \
295 #define LD_V4(RTYPE, psrc, stride, out0, out1, out2, out3) \ argument
297 LD_V2(RTYPE, (psrc), stride, out0, out1); \
306 #define LD_V5(RTYPE, psrc, stride, out0, out1, out2, out3, out4) \ argument
308 LD_V4(RTYPE, (psrc), stride, out0, out1, out2, out3); \
314 #define LD_V6(RTYPE, psrc, stride, out0, out1, out2, out3, out4, out5) \ argument
316 LD_V4(RTYPE, (psrc), stride, out0, out1, out2, out3); \
325 out0, out1, out2, out3, out4, out5, out6) \ argument
327 LD_V5(RTYPE, (psrc), stride, out0, out1, out2, out3, out4); \
334 out0, out1, out2, out3, out4, out5, out6, out7) \ argument
336 LD_V4(RTYPE, (psrc), stride, out0, out1, out2, out3); \
346 out0, out1, out2, out3, out4, out5, out6, out7, \ argument
350 out0, out1, out2, out3, out4, out5, out6, out7); \
594 #define AVER_UB2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
597 out1 = (RTYPE) __msa_aver_u_b((v16u8) in2, (v16u8) in3); \
602 out0, out1, out2, out3) \ argument
604 AVER_UB2(RTYPE, in0, in1, in2, in3, out0, out1) \
621 #define SLDI_B2(RTYPE, d0, s0, d1, s1, slide_val, out0, out1) \ argument
624 SLDI_B(RTYPE, d1, s1, slide_val, out1) \
632 out0, out1, out2) \ argument
634 SLDI_B2(RTYPE, d0, s0, d1, s1, slide_val, out0, out1) \
642 slide_val, out0, out1, out2, out3) \ argument
644 SLDI_B2(RTYPE, d0, s0, d1, s1, slide_val, out0, out1) \
660 #define VSHF_B2(RTYPE, in0, in1, in2, in3, mask0, mask1, out0, out1) \ argument
663 out1 = (RTYPE) __msa_vshf_b((v16i8) mask1, (v16i8) in3, (v16i8) in2); \
671 out0, out1, out2) \ argument
673 VSHF_B2(RTYPE, in0, in1, in2, in3, mask0, mask1, out0, out1); \
679 out0, out1, out2, out3) \ argument
681 VSHF_B2(RTYPE, in0, in1, in0, in1, mask0, mask1, out0, out1); \
696 #define VSHF_H2(RTYPE, in0, in1, in2, in3, mask0, mask1, out0, out1) \ argument
699 out1 = (RTYPE) __msa_vshf_h((v8i16) mask1, (v8i16) in3, (v8i16) in2); \
704 out0, out1, out2) \ argument
706 VSHF_H2(RTYPE, in0, in1, in2, in3, mask0, mask1, out0, out1); \
720 #define VSHF_W2(RTYPE, in0, in1, in2, in3, mask0, mask1, out0, out1) \ argument
723 out1 = (RTYPE) __msa_vshf_w((v4i32) mask1, (v4i32) in3, (v4i32) in2); \
739 #define DOTP_UB2(RTYPE, mult0, mult1, cnst0, cnst1, out0, out1) \ argument
742 out1 = (RTYPE) __msa_dotp_u_h((v16u8) mult1, (v16u8) cnst1); \
748 out0, out1, out2, out3) \ argument
750 DOTP_UB2(RTYPE, mult0, mult1, cnst0, cnst1, out0, out1); \
767 #define DOTP_SB2(RTYPE, mult0, mult1, cnst0, cnst1, out0, out1) \ argument
770 out1 = (RTYPE) __msa_dotp_s_h((v16i8) mult1, (v16i8) cnst1); \
775 out0, out1, out2) \ argument
777 DOTP_SB2(RTYPE, mult0, mult1, cnst0, cnst1, out0, out1); \
783 cnst0, cnst1, cnst2, cnst3, out0, out1, out2, out3) \ argument
785 DOTP_SB2(RTYPE, mult0, mult1, cnst0, cnst1, out0, out1); \
802 #define DOTP_SH2(RTYPE, mult0, mult1, cnst0, cnst1, out0, out1) \ argument
805 out1 = (RTYPE) __msa_dotp_s_w((v8i16) mult1, (v8i16) cnst1); \
811 out0, out1, out2, out3) \ argument
813 DOTP_SH2(RTYPE, mult0, mult1, cnst0, cnst1, out0, out1); \
830 #define DPADD_SB2(RTYPE, mult0, mult1, cnst0, cnst1, out0, out1) \ argument
834 out1 = (RTYPE) __msa_dpadd_s_h((v8i16) out1, \
840 cnst0, cnst1, cnst2, cnst3, out0, out1, out2, out3) \ argument
842 DPADD_SB2(RTYPE, mult0, mult1, cnst0, cnst1, out0, out1); \
859 #define DPADD_UB2(RTYPE, mult0, mult1, cnst0, cnst1, out0, out1) \ argument
863 out1 = (RTYPE) __msa_dpadd_u_h((v8u16) out1, \
880 #define DPADD_SH2(RTYPE, mult0, mult1, cnst0, cnst1, out0, out1) \ argument
884 out1 = (RTYPE) __msa_dpadd_s_w((v4i32) out1, \
890 cnst0, cnst1, cnst2, cnst3, out0, out1, out2, out3) \ argument
892 DPADD_SH2(RTYPE, mult0, mult1, cnst0, cnst1, out0, out1); \
1043 #define HADD_SB2(RTYPE, in0, in1, out0, out1) \ argument
1046 out1 = (RTYPE) __msa_hadd_s_h((v16i8) in1, (v16i8) in1); \
1050 #define HADD_SB4(RTYPE, in0, in1, in2, in3, out0, out1, out2, out3) \ argument
1052 HADD_SB2(RTYPE, in0, in1, out0, out1); \
1066 #define HADD_UB2(RTYPE, in0, in1, out0, out1) \ argument
1069 out1 = (RTYPE) __msa_hadd_u_h((v16u8) in1, (v16u8) in1); \
1073 #define HADD_UB3(RTYPE, in0, in1, in2, out0, out1, out2) \ argument
1075 HADD_UB2(RTYPE, in0, in1, out0, out1); \
1080 #define HADD_UB4(RTYPE, in0, in1, in2, in3, out0, out1, out2, out3) \ argument
1082 HADD_UB2(RTYPE, in0, in1, out0, out1); \
1097 #define HSUB_UB2(RTYPE, in0, in1, out0, out1) \ argument
1100 out1 = (RTYPE) __msa_hsub_u_h((v16u8) in1, (v16u8) in1); \
1105 #define HSUB_UB4(RTYPE, in0, in1, in2, in3, out0, out1, out2, out3) \ argument
1107 HSUB_UB2(RTYPE, in0, in1, out0, out1); \
1197 #define ILVEV_B2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1200 out1 = (RTYPE) __msa_ilvev_b((v16i8) in3, (v16i8) in2); \
1216 #define ILVEV_H2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1219 out1 = (RTYPE) __msa_ilvev_h((v8i16) in3, (v8i16) in2); \
1234 #define ILVEV_W2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1237 out1 = (RTYPE) __msa_ilvev_w((v4i32) in3, (v4i32) in2); \
1253 #define ILVEV_D2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1256 out1 = (RTYPE) __msa_ilvev_d((v2i64) in3, (v2i64) in2); \
1271 #define ILVL_B2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1274 out1 = (RTYPE) __msa_ilvl_b((v16i8) in2, (v16i8) in3); \
1282 out0, out1, out2, out3) \ argument
1284 ILVL_B2(RTYPE, in0, in1, in2, in3, out0, out1); \
1301 #define ILVL_H2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1304 out1 = (RTYPE) __msa_ilvl_h((v8i16) in2, (v8i16) in3); \
1310 out0, out1, out2, out3) \ argument
1312 ILVL_H2(RTYPE, in0, in1, in2, in3, out0, out1); \
1327 #define ILVL_W2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1330 out1 = (RTYPE) __msa_ilvl_w((v4i32) in2, (v4i32) in3); \
1346 #define ILVR_B2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1349 out1 = (RTYPE) __msa_ilvr_b((v16i8) in2, (v16i8) in3); \
1357 #define ILVR_B3(RTYPE, in0, in1, in2, in3, in4, in5, out0, out1, out2) \ argument
1359 ILVR_B2(RTYPE, in0, in1, in2, in3, out0, out1); \
1368 out0, out1, out2, out3) \ argument
1370 ILVR_B2(RTYPE, in0, in1, in2, in3, out0, out1); \
1381 out0, out1, out2, out3, out4, out5, out6, out7) \ argument
1384 out0, out1, out2, out3); \
1401 #define ILVR_H2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1404 out1 = (RTYPE) __msa_ilvr_h((v8i16) in2, (v8i16) in3); \
1409 #define ILVR_H3(RTYPE, in0, in1, in2, in3, in4, in5, out0, out1, out2) \ argument
1411 ILVR_H2(RTYPE, in0, in1, in2, in3, out0, out1); \
1417 out0, out1, out2, out3) \ argument
1419 ILVR_H2(RTYPE, in0, in1, in2, in3, out0, out1); \
1425 #define ILVR_W2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1428 out1 = (RTYPE) __msa_ilvr_w((v4i32) in2, (v4i32) in3); \
1435 out0, out1, out2, out3) \ argument
1437 ILVR_W2(RTYPE, in0, in1, in2, in3, out0, out1); \
1452 #define ILVR_D2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1455 out1 = (RTYPE) __msa_ilvr_d((v2i64) in2, (v2i64) in3); \
1461 #define ILVR_D3(RTYPE, in0, in1, in2, in3, in4, in5, out0, out1, out2) \ argument
1463 ILVR_D2(RTYPE, in0, in1, in2, in3, out0, out1); \
1469 out0, out1, out2, out3) \ argument
1471 ILVR_D2(RTYPE, in0, in1, in2, in3, out0, out1); \
1486 #define ILVL_D2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1489 out1 = (RTYPE) __msa_ilvl_d((v2i64) in2, (v2i64) in3); \
1504 #define ILVRL_B2(RTYPE, in0, in1, out0, out1) \ argument
1507 out1 = (RTYPE) __msa_ilvl_b((v16i8) in0, (v16i8) in1); \
1515 #define ILVRL_H2(RTYPE, in0, in1, out0, out1) \ argument
1518 out1 = (RTYPE) __msa_ilvl_h((v8i16) in0, (v8i16) in1); \
1525 #define ILVRL_W2(RTYPE, in0, in1, out0, out1) \ argument
1528 out1 = (RTYPE) __msa_ilvl_w((v4i32) in0, (v4i32) in1); \
1664 #define SPLATI_H2(RTYPE, in, idx0, idx1, out0, out1) \ argument
1667 out1 = (RTYPE) __msa_splati_h((v8i16) in, idx1); \
1673 out0, out1, out2) \ argument
1675 SPLATI_H2(RTYPE, in, idx0, idx1, out0, out1); \
1682 out0, out1, out2, out3) \ argument
1684 SPLATI_H2(RTYPE, in, idx0, idx1, out0, out1); \
1701 #define SPLATI_W2(RTYPE, in, stidx, out0, out1) \ argument
1704 out1 = (RTYPE) __msa_splati_w((v4i32) in, (stidx+1)); \
1709 #define SPLATI_W4(RTYPE, in, out0, out1, out2, out3) \ argument
1711 SPLATI_W2(RTYPE, in, 0, out0, out1); \
1728 #define PCKEV_B2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1731 out1 = (RTYPE) __msa_pckev_b((v16i8) in2, (v16i8) in3); \
1738 #define PCKEV_B3(RTYPE, in0, in1, in2, in3, in4, in5, out0, out1, out2) \ argument
1740 PCKEV_B2(RTYPE, in0, in1, in2, in3, out0, out1); \
1747 out0, out1, out2, out3) \ argument
1749 PCKEV_B2(RTYPE, in0, in1, in2, in3, out0, out1); \
1768 #define PCKEV_H2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1771 out1 = (RTYPE) __msa_pckev_h((v8i16) in2, (v8i16) in3); \
1777 out0, out1, out2, out3) \ argument
1779 PCKEV_H2(RTYPE, in0, in1, in2, in3, out0, out1); \
1796 #define PCKEV_D2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1799 out1 = (RTYPE) __msa_pckev_d((v2i64) in2, (v2i64) in3); \
1806 out0, out1, out2, out3) \ argument
1808 PCKEV_D2(RTYPE, in0, in1, in2, in3, out0, out1); \
1822 #define PCKOD_D2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1825 out1 = (RTYPE) __msa_pckod_d((v2i64) in2, (v2i64) in3); \
1906 #define ADDS_SH2(RTYPE, in0, in1, in2, in3, out0, out1) \ argument
1909 out1 = (RTYPE) __msa_adds_s_h((v8i16) in2, (v8i16) in3); \
1914 out0, out1, out2, out3) \ argument
1916 ADDS_SH2(RTYPE, in0, in1, in2, in3, out0, out1); \
2115 #define MUL2(in0, in1, in2, in3, out0, out1) \ argument
2118 out1 = in2 * in3; \
2120 #define MUL4(in0, in1, in2, in3, in4, in5, in6, in7, out0, out1, out2, out3) \ argument
2122 MUL2(in0, in1, in2, in3, out0, out1); \
2132 #define ADD2(in0, in1, in2, in3, out0, out1) \ argument
2135 out1 = in2 + in3; \
2137 #define ADD4(in0, in1, in2, in3, in4, in5, in6, in7, out0, out1, out2, out3) \ argument
2139 ADD2(in0, in1, in2, in3, out0, out1); \
2149 #define SUB2(in0, in1, in2, in3, out0, out1) \ argument
2152 out1 = in2 - in3; \
2154 #define SUB4(in0, in1, in2, in3, in4, in5, in6, in7, out0, out1, out2, out3) \ argument
2157 out1 = in2 - in3; \
2213 #define UNPCK_SB_SH(in, out0, out1) \ argument
2216 out1 = (v4i32) __builtin_msa2_w2x_hi_s_b((v16i8) in); \
2219 #define UNPCK_SB_SH(in, out0, out1) \ argument
2224 ILVRL_B2_SH(tmp_m, in, out0, out1); \
2235 #define UNPCK_UB_SH(in, out0, out1) \ argument
2239 ILVRL_B2_SH(zero_m, in, out0, out1); \
2254 #define UNPCK_SH_SW(in, out0, out1) \ argument
2257 out1 = (v4i32) __builtin_msa2_w2x_hi_s_h((v8i16) in); \
2260 #define UNPCK_SH_SW(in, out0, out1) \ argument
2265 ILVRL_H2_SW(tmp_m, in, out0, out1); \
2286 #define BUTTERFLY_4(in0, in1, in2, in3, out0, out1, out2, out3) \ argument
2289 out1 = in1 + in2; \
2301 out0, out1, out2, out3, out4, out5, out6, out7) \ argument
2304 out1 = in1 + in6; \
2321 out0, out1, out2, out3, out4, out5, out6, out7, \ argument
2325 out1 = in1 + in14; \
2349 #define TRANSPOSE4x4_UB_UB(in0, in1, in2, in3, out0, out1, out2, out3) \ argument
2358 out1 = (v16u8) __msa_sldi_b(zero_m, (v16i8) out0, 4); \
2359 out2 = (v16u8) __msa_sldi_b(zero_m, (v16i8) out1, 4); \
2370 out0, out1, out2, out3) \ argument
2382 out1 = (RTYPE) __msa_ilvl_d((v2i64) out2, (v2i64) out0); \
2397 out0, out1, out2, out3, out4, out5, out6, out7) \ argument
2410 8, out1, out3, out5, out7); \
2424 out0, out1, out2, out3) \ argument
2429 out1 = (v16u8) __msa_ilvev_d(tmp1_m, tmp0_m); \
2440 ILVEV_B2_SD(out1, out3, tmp2_m, tmp3_m, tmp0_m, tmp1_m); \
2444 tmp0_m = (v2i64) __msa_ilvod_b((v16i8) out3, (v16i8) out1); \
2446 out1 = (v16u8) __msa_ilvev_h((v8i16) tmp1_m, (v8i16) tmp0_m); \
2459 out0, out1, out2, out3, out4, out5, out6, out7) \ argument
2467 ILVEV_D2_UB(in6, in14, in7, in15, out1, out0); \
2475 out7 = (v16u8) __msa_ilvev_b((v16i8) out0, (v16i8) out1); \
2476 tmp7_m = (v16u8) __msa_ilvod_b((v16i8) out0, (v16i8) out1); \
2488 out1 = (v16u8) __msa_ilvev_w((v4i32) tmp3_m, (v4i32) tmp2_m); \
2503 #define TRANSPOSE4x4_SH_SH(in0, in1, in2, in3, out0, out1, out2, out3) \ argument
2509 out1 = (v8i16) __msa_ilvl_d((v2i64) out0, (v2i64) out0); \
2520 out0, out1, out2, out3, out4, out5, out6, out7) \ argument
2536 out1 = (RTYPE) __msa_pckod_d((v2i64) tmp0_m, (v2i64) tmp4_m); \
2550 #define TRANSPOSE4x4_SW_SW(in0, in1, in2, in3, out0, out1, out2, out3) \ argument
2558 out1 = (v4i32) __msa_ilvl_d((v2i64) s2_m, (v2i64) s0_m); \