Lines Matching refs:pitch
196 void ff_loop_filter_v_4_8_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_v_4_8_msa() argument
206 LD_UB8((src - 4 * pitch), pitch, p3, p2, p1, p0, q0, q1, q2, q3); in ff_loop_filter_v_4_8_msa()
221 SD4(p1_d, p0_d, q0_d, q1_d, (src - 2 * pitch), pitch); in ff_loop_filter_v_4_8_msa()
225 void ff_loop_filter_v_44_16_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_v_44_16_msa() argument
234 LD_UB8((src - 4 * pitch), pitch, p3, p2, p1, p0, q0, q1, q2, q3); in ff_loop_filter_v_44_16_msa()
252 ST_UB4(p1, p0, q0, q1, (src - 2 * pitch), pitch); in ff_loop_filter_v_44_16_msa()
255 void ff_loop_filter_v_8_8_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_v_8_8_msa() argument
270 LD_UB8((src - 4 * pitch), pitch, p3, p2, p1, p0, q0, q1, q2, q3); in ff_loop_filter_v_8_8_msa()
290 SD4(p1_d, p0_d, q0_d, q1_d, (src - 2 * pitch), pitch); in ff_loop_filter_v_8_8_msa()
319 src -= 3 * pitch; in ff_loop_filter_v_8_8_msa()
321 SD4(p2_d, p1_d, p0_d, q0_d, src, pitch); in ff_loop_filter_v_8_8_msa()
322 src += (4 * pitch); in ff_loop_filter_v_8_8_msa()
324 src += pitch; in ff_loop_filter_v_8_8_msa()
329 void ff_loop_filter_v_88_16_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_v_88_16_msa() argument
346 LD_UB8(src - (4 * pitch), pitch, p3, p2, p1, p0, q0, q1, q2, q3); in ff_loop_filter_v_88_16_msa()
369 ST_UB4(p1_out, p0_out, q0_out, q1_out, (src - 2 * pitch), pitch); in ff_loop_filter_v_88_16_msa()
399 src -= 3 * pitch; in ff_loop_filter_v_88_16_msa()
401 ST_UB4(p2_out, p1_out, p0_out, q0_out, src, pitch); in ff_loop_filter_v_88_16_msa()
402 src += (4 * pitch); in ff_loop_filter_v_88_16_msa()
403 ST_UB2(q1_out, q2_out, src, pitch); in ff_loop_filter_v_88_16_msa()
404 src += (2 * pitch); in ff_loop_filter_v_88_16_msa()
408 void ff_loop_filter_v_84_16_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_v_84_16_msa() argument
422 LD_UB8(src - (4 * pitch), pitch, p3, p2, p1, p0, q0, q1, q2, q3); in ff_loop_filter_v_84_16_msa()
447 ST_UB4(p1_out, p0_out, q0_out, q1_out, (src - 2 * pitch), pitch); in ff_loop_filter_v_84_16_msa()
470 src -= 3 * pitch; in ff_loop_filter_v_84_16_msa()
472 ST_UB4(p2_out, p1_out, p0_out, q0_out, src, pitch); in ff_loop_filter_v_84_16_msa()
473 src += (4 * pitch); in ff_loop_filter_v_84_16_msa()
474 ST_UB2(q1_out, q2_out, src, pitch); in ff_loop_filter_v_84_16_msa()
475 src += (2 * pitch); in ff_loop_filter_v_84_16_msa()
479 void ff_loop_filter_v_48_16_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_v_48_16_msa() argument
493 LD_UB8(src - (4 * pitch), pitch, p3, p2, p1, p0, q0, q1, q2, q3); in ff_loop_filter_v_48_16_msa()
518 ST_UB4(p1_out, p0_out, q0_out, q1_out, (src - 2 * pitch), pitch); in ff_loop_filter_v_48_16_msa()
542 src -= 3 * pitch; in ff_loop_filter_v_48_16_msa()
544 ST_UB4(p2_out, p1_out, p0_out, q0_out, src, pitch); in ff_loop_filter_v_48_16_msa()
545 src += (4 * pitch); in ff_loop_filter_v_48_16_msa()
546 ST_UB2(q1_out, q2_out, src, pitch); in ff_loop_filter_v_48_16_msa()
547 src += (2 * pitch); in ff_loop_filter_v_48_16_msa()
551 static int32_t vp9_hz_lpf_t4_and_t8_16w(uint8_t *src, ptrdiff_t pitch, in vp9_hz_lpf_t4_and_t8_16w() argument
569 LD_UB8(src - (4 * pitch), pitch, p3, p2, p1, p0, q0, q1, q2, q3); in vp9_hz_lpf_t4_and_t8_16w()
584 ST_UB4(p1_out, p0_out, q0_out, q1_out, (src - 2 * pitch), pitch); in vp9_hz_lpf_t4_and_t8_16w()
626 static void vp9_hz_lpf_t16_16w(uint8_t *src, ptrdiff_t pitch, uint8_t *filter48) in vp9_hz_lpf_t16_16w() argument
644 LD_UB8((src - 8 * pitch), pitch, p7, p6, p5, p4, p3, p2, p1, p0); in vp9_hz_lpf_t16_16w()
645 LD_UB8(src, pitch, q0, q1, q2, q3, q4, q5, q6, q7); in vp9_hz_lpf_t16_16w()
653 src -= 3 * pitch; in vp9_hz_lpf_t16_16w()
654 ST_UB4(p2, p1, p0, q0, src, pitch); in vp9_hz_lpf_t16_16w()
655 src += (4 * pitch); in vp9_hz_lpf_t16_16w()
656 ST_UB2(q1, q2, src, pitch); in vp9_hz_lpf_t16_16w()
658 src -= 7 * pitch; in vp9_hz_lpf_t16_16w()
701 src += pitch; in vp9_hz_lpf_t16_16w()
721 src += pitch; in vp9_hz_lpf_t16_16w()
741 src += pitch; in vp9_hz_lpf_t16_16w()
761 src += pitch; in vp9_hz_lpf_t16_16w()
782 src += pitch; in vp9_hz_lpf_t16_16w()
803 src += pitch; in vp9_hz_lpf_t16_16w()
824 src += pitch; in vp9_hz_lpf_t16_16w()
845 src += pitch; in vp9_hz_lpf_t16_16w()
864 src += pitch; in vp9_hz_lpf_t16_16w()
883 src += pitch; in vp9_hz_lpf_t16_16w()
901 src += pitch; in vp9_hz_lpf_t16_16w()
919 src += pitch; in vp9_hz_lpf_t16_16w()
937 src += pitch; in vp9_hz_lpf_t16_16w()
958 void ff_loop_filter_v_16_16_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_v_16_16_msa() argument
966 early_exit = vp9_hz_lpf_t4_and_t8_16w(src, pitch, &filter48[0], in ff_loop_filter_v_16_16_msa()
970 vp9_hz_lpf_t16_16w(src, pitch, filter48); in ff_loop_filter_v_16_16_msa()
974 void ff_loop_filter_v_16_8_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_v_16_8_msa() argument
993 LD_UB8((src - 4 * pitch), pitch, p3, p2, p1, p0, q0, q1, q2, q3); in ff_loop_filter_v_16_8_msa()
1013 SD4(p1_d, p0_d, q0_d, q1_d, src - 2 * pitch, pitch); in ff_loop_filter_v_16_8_msa()
1039 LD_UB4((src - 8 * pitch), pitch, p7, p6, p5, p4); in ff_loop_filter_v_16_8_msa()
1040 LD_UB4(src + (4 * pitch), pitch, q4, q5, q6, q7); in ff_loop_filter_v_16_8_msa()
1053 SD4(p2_d, p1_d, p0_d, q0_d, src - 3 * pitch, pitch); in ff_loop_filter_v_16_8_msa()
1054 SD(q1_d, src + pitch); in ff_loop_filter_v_16_8_msa()
1055 SD(q2_d, src + 2 * pitch); in ff_loop_filter_v_16_8_msa()
1067 src -= 7 * pitch; in ff_loop_filter_v_16_8_msa()
1084 src += pitch; in ff_loop_filter_v_16_8_msa()
1086 src += pitch; in ff_loop_filter_v_16_8_msa()
1102 src += pitch; in ff_loop_filter_v_16_8_msa()
1104 src += pitch; in ff_loop_filter_v_16_8_msa()
1120 src += pitch; in ff_loop_filter_v_16_8_msa()
1122 src += pitch; in ff_loop_filter_v_16_8_msa()
1138 src += pitch; in ff_loop_filter_v_16_8_msa()
1140 src += pitch; in ff_loop_filter_v_16_8_msa()
1156 src += pitch; in ff_loop_filter_v_16_8_msa()
1158 src += pitch; in ff_loop_filter_v_16_8_msa()
1174 src += pitch; in ff_loop_filter_v_16_8_msa()
1176 src += pitch; in ff_loop_filter_v_16_8_msa()
1192 src += pitch; in ff_loop_filter_v_16_8_msa()
1198 void ff_loop_filter_h_4_8_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_h_4_8_msa() argument
1207 LD_UB8((src - 4), pitch, p3, p2, p1, p0, q0, q1, q2, q3); in ff_loop_filter_h_4_8_msa()
1222 ST_W8(vec2, vec3, 0, 1, 2, 3, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_4_8_msa()
1225 void ff_loop_filter_h_44_16_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_h_44_16_msa() argument
1237 LD_UB8(src - 4, pitch, row0, row1, row2, row3, row4, row5, row6, row7); in ff_loop_filter_h_44_16_msa()
1238 LD_UB8(src - 4 + (8 * pitch), pitch, in ff_loop_filter_h_44_16_msa()
1267 ST_W8(tmp2, tmp3, 0, 1, 2, 3, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_44_16_msa()
1268 ST_W8(tmp4, tmp5, 0, 1, 2, 3, 0, 1, 2, 3, src + 8 * pitch, pitch); in ff_loop_filter_h_44_16_msa()
1271 void ff_loop_filter_h_8_8_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_h_8_8_msa() argument
1286 LD_UB8(src - 4, pitch, p3, p2, p1, p0, q0, q1, q2, q3); in ff_loop_filter_h_8_8_msa()
1313 ST_W8(vec2, vec3, 0, 1, 2, 3, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_8_8_msa()
1341 ST_W4(vec2, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_8_8_msa()
1342 ST_H4(vec4, 0, 1, 2, 3, src + 4, pitch); in ff_loop_filter_h_8_8_msa()
1343 src += (4 * pitch); in ff_loop_filter_h_8_8_msa()
1344 ST_W4(vec3, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_8_8_msa()
1345 ST_H4(vec4, 4, 5, 6, 7, src + 4, pitch); in ff_loop_filter_h_8_8_msa()
1349 void ff_loop_filter_h_88_16_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_h_88_16_msa() argument
1370 LD_UB8(temp_src, pitch, p0, p1, p2, p3, row4, row5, row6, row7); in ff_loop_filter_h_88_16_msa()
1371 temp_src += (8 * pitch); in ff_loop_filter_h_88_16_msa()
1372 LD_UB8(temp_src, pitch, q3, q2, q1, q0, row12, row13, row14, row15); in ff_loop_filter_h_88_16_msa()
1408 ST_W8(vec2, vec3, 0, 1, 2, 3, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_88_16_msa()
1409 ST_W8(vec4, vec5, 0, 1, 2, 3, 0, 1, 2, 3, src + 8 * pitch, pitch); in ff_loop_filter_h_88_16_msa()
1448 ST_W4(vec3, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_88_16_msa()
1449 ST_H4(vec2, 0, 1, 2, 3, src + 4, pitch); in ff_loop_filter_h_88_16_msa()
1450 src += (4 * pitch); in ff_loop_filter_h_88_16_msa()
1451 ST_W4(vec4, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_88_16_msa()
1452 ST_H4(vec2, 4, 5, 6, 7, src + 4, pitch); in ff_loop_filter_h_88_16_msa()
1453 src += (4 * pitch); in ff_loop_filter_h_88_16_msa()
1454 ST_W4(vec6, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_88_16_msa()
1455 ST_H4(vec5, 0, 1, 2, 3, src + 4, pitch); in ff_loop_filter_h_88_16_msa()
1456 src += (4 * pitch); in ff_loop_filter_h_88_16_msa()
1457 ST_W4(vec7, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_88_16_msa()
1458 ST_H4(vec5, 4, 5, 6, 7, src + 4, pitch); in ff_loop_filter_h_88_16_msa()
1462 void ff_loop_filter_h_84_16_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_h_84_16_msa() argument
1480 LD_UB8(temp_src, pitch, p0, p1, p2, p3, row4, row5, row6, row7); in ff_loop_filter_h_84_16_msa()
1481 temp_src += (8 * pitch); in ff_loop_filter_h_84_16_msa()
1482 LD_UB8(temp_src, pitch, q3, q2, q1, q0, row12, row13, row14, row15); in ff_loop_filter_h_84_16_msa()
1520 ST_W8(vec2, vec3, 0, 1, 2, 3, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_84_16_msa()
1521 ST_W8(vec4, vec5, 0, 1, 2, 3, 0, 1, 2, 3, src + 8 * pitch, pitch); in ff_loop_filter_h_84_16_msa()
1551 ST_W4(vec3, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_84_16_msa()
1552 ST_H4(vec2, 0, 1, 2, 3, src + 4, pitch); in ff_loop_filter_h_84_16_msa()
1553 src += (4 * pitch); in ff_loop_filter_h_84_16_msa()
1554 ST_W4(vec4, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_84_16_msa()
1555 ST_H4(vec2, 4, 5, 6, 7, src + 4, pitch); in ff_loop_filter_h_84_16_msa()
1556 src += (4 * pitch); in ff_loop_filter_h_84_16_msa()
1557 ST_W4(vec6, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_84_16_msa()
1558 ST_H4(vec5, 0, 1, 2, 3, src + 4, pitch); in ff_loop_filter_h_84_16_msa()
1559 src += (4 * pitch); in ff_loop_filter_h_84_16_msa()
1560 ST_W4(vec7, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_84_16_msa()
1561 ST_H4(vec5, 4, 5, 6, 7, src + 4, pitch); in ff_loop_filter_h_84_16_msa()
1565 void ff_loop_filter_h_48_16_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_h_48_16_msa() argument
1583 LD_UB8(temp_src, pitch, p0, p1, p2, p3, row4, row5, row6, row7); in ff_loop_filter_h_48_16_msa()
1584 temp_src += (8 * pitch); in ff_loop_filter_h_48_16_msa()
1585 LD_UB8(temp_src, pitch, q3, q2, q1, q0, row12, row13, row14, row15); in ff_loop_filter_h_48_16_msa()
1623 ST_W8(vec2, vec3, 0, 1, 2, 3, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_48_16_msa()
1624 ST_W8(vec4, vec5, 0, 1, 2, 3, 0, 1, 2, 3, src + 8 * pitch, pitch); in ff_loop_filter_h_48_16_msa()
1656 ST_W4(vec3, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_48_16_msa()
1657 ST_H4(vec2, 0, 1, 2, 3, src + 4, pitch); in ff_loop_filter_h_48_16_msa()
1658 src += (4 * pitch); in ff_loop_filter_h_48_16_msa()
1659 ST_W4(vec4, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_48_16_msa()
1660 ST_H4(vec2, 4, 5, 6, 7, src + 4, pitch); in ff_loop_filter_h_48_16_msa()
1661 src += (4 * pitch); in ff_loop_filter_h_48_16_msa()
1662 ST_W4(vec6, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_48_16_msa()
1663 ST_H4(vec5, 0, 1, 2, 3, src + 4, pitch); in ff_loop_filter_h_48_16_msa()
1664 src += (4 * pitch); in ff_loop_filter_h_48_16_msa()
1665 ST_W4(vec7, 0, 1, 2, 3, src, pitch); in ff_loop_filter_h_48_16_msa()
1666 ST_H4(vec5, 4, 5, 6, 7, src + 4, pitch); in ff_loop_filter_h_48_16_msa()
1842 static int32_t vp9_vt_lpf_t16_8w(uint8_t *src, uint8_t *src_org, ptrdiff_t pitch, in vp9_vt_lpf_t16_8w() argument
1874 ST_W4(vec3, 0, 1, 2, 3, src_org, pitch); in vp9_vt_lpf_t16_8w()
1875 ST_H4(vec2, 0, 1, 2, 3, (src_org + 4), pitch); in vp9_vt_lpf_t16_8w()
1876 src_org += (4 * pitch); in vp9_vt_lpf_t16_8w()
1877 ST_W4(vec4, 0, 1, 2, 3, src_org, pitch); in vp9_vt_lpf_t16_8w()
1878 ST_H4(vec2, 4, 5, 6, 7, (src_org + 4), pitch); in vp9_vt_lpf_t16_8w()
2066 void ff_loop_filter_h_16_8_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_h_16_8_msa() argument
2075 vp9_transpose_16x8_to_8x16(src - 8, pitch, transposed_input, 16); in ff_loop_filter_h_16_8_msa()
2078 &filter48[0], src, pitch, in ff_loop_filter_h_16_8_msa()
2082 early_exit = vp9_vt_lpf_t16_8w((transposed_input + 16 * 8), src, pitch, in ff_loop_filter_h_16_8_msa()
2086 vp9_transpose_8x16_to_16x8(transposed_input, 16, src - 8, pitch); in ff_loop_filter_h_16_8_msa()
2092 uint8_t *src_org, ptrdiff_t pitch, in vp9_vt_lpf_t4_and_t8_16w() argument
2133 ST_W8(vec2, vec3, 0, 1, 2, 3, 0, 1, 2, 3, src_org, pitch); in vp9_vt_lpf_t4_and_t8_16w()
2134 ST_W8(vec4, vec5, 0, 1, 2, 3, 0, 1, 2, 3, src_org + 8 * pitch, pitch); in vp9_vt_lpf_t4_and_t8_16w()
2175 static int32_t vp9_vt_lpf_t16_16w(uint8_t *src, uint8_t *src_org, ptrdiff_t pitch, in vp9_vt_lpf_t16_16w() argument
2213 ST_W4(vec3, 0, 1, 2, 3, src_org, pitch); in vp9_vt_lpf_t16_16w()
2214 ST_H4(vec2, 0, 1, 2, 3, (src_org + 4), pitch); in vp9_vt_lpf_t16_16w()
2215 src_org += (4 * pitch); in vp9_vt_lpf_t16_16w()
2216 ST_W4(vec4, 0, 1, 2, 3, src_org, pitch); in vp9_vt_lpf_t16_16w()
2217 ST_H4(vec2, 4, 5, 6, 7, (src_org + 4), pitch); in vp9_vt_lpf_t16_16w()
2218 src_org += (4 * pitch); in vp9_vt_lpf_t16_16w()
2219 ST_W4(vec6, 0, 1, 2, 3, src_org, pitch); in vp9_vt_lpf_t16_16w()
2220 ST_H4(vec5, 0, 1, 2, 3, (src_org + 4), pitch); in vp9_vt_lpf_t16_16w()
2221 src_org += (4 * pitch); in vp9_vt_lpf_t16_16w()
2222 ST_W4(vec7, 0, 1, 2, 3, src_org, pitch); in vp9_vt_lpf_t16_16w()
2223 ST_H4(vec5, 4, 5, 6, 7, (src_org + 4), pitch); in vp9_vt_lpf_t16_16w()
2502 void ff_loop_filter_h_16_16_msa(uint8_t *src, ptrdiff_t pitch, in ff_loop_filter_h_16_16_msa() argument
2511 vp9_transpose_16x16((src - 8), pitch, &transposed_input[0], 16); in ff_loop_filter_h_16_16_msa()
2514 &filter48[0], src, pitch, in ff_loop_filter_h_16_16_msa()
2518 early_exit = vp9_vt_lpf_t16_16w((transposed_input + 16 * 8), src, pitch, in ff_loop_filter_h_16_16_msa()
2522 vp9_transpose_16x16(transposed_input, 16, (src - 8), pitch); in ff_loop_filter_h_16_16_msa()