Lines Matching refs:src
159 static void common_hz_8t_4x4_msa(const uint8_t *src, int32_t src_stride,
168 src -= 3;
178 LD_SB4(src, src_stride, src0, src1, src2, src3);
188 static void common_hz_8t_4x8_msa(const uint8_t *src, int32_t src_stride,
198 src -= 3;
208 LD_SB4(src, src_stride, src0, src1, src2, src3);
210 src += (4 * src_stride);
213 LD_SB4(src, src_stride, src0, src1, src2, src3);
225 static void common_hz_8t_4w_msa(const uint8_t *src, int32_t src_stride,
230 common_hz_8t_4x4_msa(src, src_stride, dst, dst_stride, filter);
232 common_hz_8t_4x8_msa(src, src_stride, dst, dst_stride, filter);
236 static void common_hz_8t_8x4_msa(const uint8_t *src, int32_t src_stride,
245 src -= 3;
255 LD_SB4(src, src_stride, src0, src1, src2, src3);
267 static void common_hz_8t_8x8mult_msa(const uint8_t *src, int32_t src_stride,
277 src -= 3;
288 LD_SB4(src, src_stride, src0, src1, src2, src3);
290 src += (4 * src_stride);
303 static void common_hz_8t_8w_msa(const uint8_t *src, int32_t src_stride,
308 common_hz_8t_8x4_msa(src, src_stride, dst, dst_stride, filter);
310 common_hz_8t_8x8mult_msa(src, src_stride, dst, dst_stride, filter,
315 static void common_hz_8t_16w_msa(const uint8_t *src, int32_t src_stride,
325 src -= 3;
336 LD_SB2(src, src_stride, src0, src2);
337 LD_SB2(src + 8, src_stride, src1, src3);
339 src += (2 * src_stride);
354 static void common_hz_8t_32w_msa(const uint8_t *src, int32_t src_stride,
364 src -= 3;
375 src0 = LD_SB(src);
376 src2 = LD_SB(src + 16);
377 src3 = LD_SB(src + 24);
379 src += src_stride;
387 src0 = LD_SB(src);
388 src2 = LD_SB(src + 16);
389 src3 = LD_SB(src + 24);
391 src += src_stride;
413 static void common_hz_8t_64w_msa(const uint8_t *src, int32_t src_stride,
423 src -= 3;
434 src0 = LD_SB(src);
435 src2 = LD_SB(src + 16);
436 src3 = LD_SB(src + 24);
450 src0 = LD_SB(src + 32);
451 src2 = LD_SB(src + 48);
452 src3 = LD_SB(src + 56);
454 src += src_stride;
470 static void common_vt_8t_4w_msa(const uint8_t *src, int32_t src_stride,
482 src -= (3 * src_stride);
487 LD_SB7(src, src_stride, src0, src1, src2, src3, src4, src5, src6);
488 src += (7 * src_stride);
498 LD_SB4(src, src_stride, src7, src8, src9, src10);
499 src += (4 * src_stride);
522 static void common_vt_8t_8w_msa(const uint8_t *src, int32_t src_stride,
533 src -= (3 * src_stride);
538 LD_SB7(src, src_stride, src0, src1, src2, src3, src4, src5, src6);
540 src += (7 * src_stride);
546 LD_SB4(src, src_stride, src7, src8, src9, src10);
548 src += (4 * src_stride);
577 static void common_vt_8t_16w_msa(const uint8_t *src, int32_t src_stride,
590 src -= (3 * src_stride);
595 LD_SB7(src, src_stride, src0, src1, src2, src3, src4, src5, src6);
597 src += (7 * src_stride);
606 LD_SB4(src, src_stride, src7, src8, src9, src10);
608 src += (4 * src_stride);
656 static void common_vt_8t_16w_mult_msa(const uint8_t *src, int32_t src_stride,
672 src -= (3 * src_stride);
678 src_tmp = src;
740 src += 16;
745 static void common_vt_8t_32w_msa(const uint8_t *src, int32_t src_stride,
749 common_vt_8t_16w_mult_msa(src, src_stride, dst, dst_stride, filter, height,
753 static void common_vt_8t_64w_msa(const uint8_t *src, int32_t src_stride,
757 common_vt_8t_16w_mult_msa(src, src_stride, dst, dst_stride, filter, height,
761 static void common_hv_8ht_8vt_4w_msa(const uint8_t *src, int32_t src_stride,
776 src -= (3 + 3 * src_stride);
786 LD_SB7(src, src_stride, src0, src1, src2, src3, src4, src5, src6);
788 src += (7 * src_stride);
807 LD_SB4(src, src_stride, src7, src8, src9, src10);
809 src += (4 * src_stride);
837 static void common_hv_8ht_8vt_8w_msa(const uint8_t *src, int32_t src_stride,
853 src -= (3 + 3 * src_stride);
863 LD_SB7(src, src_stride, src0, src1, src2, src3, src4, src5, src6);
864 src += (7 * src_stride);
890 LD_SB4(src, src_stride, src7, src8, src9, src10);
891 src += (4 * src_stride);
935 static void common_hv_8ht_8vt_16w_msa(const uint8_t *src, int32_t src_stride,
944 common_hv_8ht_8vt_8w_msa(src, src_stride, dst, dst_stride, filter_horiz,
947 src += 8;
952 static void common_hv_8ht_8vt_32w_msa(const uint8_t *src, int32_t src_stride,
961 common_hv_8ht_8vt_8w_msa(src, src_stride, dst, dst_stride, filter_horiz,
964 src += 8;
969 static void common_hv_8ht_8vt_64w_msa(const uint8_t *src, int32_t src_stride,
978 common_hv_8ht_8vt_8w_msa(src, src_stride, dst, dst_stride, filter_horiz,
981 src += 8;
986 static void common_hz_8t_and_aver_dst_4x4_msa(const uint8_t *src,
998 src -= 3;
1008 LD_SB4(src, src_stride, src0, src1, src2, src3);
1021 static void common_hz_8t_and_aver_dst_4x8_msa(const uint8_t *src,
1033 src -= 3;
1043 LD_SB4(src, src_stride, src0, src1, src2, src3);
1045 src += (4 * src_stride);
1052 LD_SB4(src, src_stride, src0, src1, src2, src3);
1066 static void common_hz_8t_and_aver_dst_4w_msa(const uint8_t *src,
1073 common_hz_8t_and_aver_dst_4x4_msa(src, src_stride, dst, dst_stride,
1076 common_hz_8t_and_aver_dst_4x8_msa(src, src_stride, dst, dst_stride,
1081 static void common_hz_8t_and_aver_dst_8w_msa(const uint8_t *src,
1094 src -= 3;
1105 LD_SB4(src, src_stride, src0, src1, src2, src3);
1107 src += (4 * src_stride);
1122 static void common_hz_8t_and_aver_dst_16w_msa(const uint8_t *src,
1136 src -= 3;
1147 LD_SB2(src, src_stride, src0, src2);
1148 LD_SB2(src + 8, src_stride, src1, src3);
1149 src += (2 * src_stride);
1180 static void common_hz_8t_and_aver_dst_32w_msa(const uint8_t *src,
1194 src -= 3;
1205 src0 = LD_SB(src);
1206 src2 = LD_SB(src + 16);
1207 src3 = LD_SB(src + 24);
1209 src += src_stride;
1239 static void common_hz_8t_and_aver_dst_64w_msa(const uint8_t *src,
1253 src -= 3;
1265 src0 = LD_SB(&src[cnt << 5]);
1266 src2 = LD_SB(&src[16 + (cnt << 5)]);
1267 src3 = LD_SB(&src[24 + (cnt << 5)]);
1296 src += src_stride;
1301 static void common_vt_8t_and_aver_dst_4w_msa(const uint8_t *src,
1316 src -= (3 * src_stride);
1321 LD_SB7(src, src_stride, src0, src1, src2, src3, src4, src5, src6);
1322 src += (7 * src_stride);
1332 LD_SB4(src, src_stride, src7, src8, src9, src10);
1333 src += (4 * src_stride);
1360 static void common_vt_8t_and_aver_dst_8w_msa(const uint8_t *src,
1374 src -= (3 * src_stride);
1379 LD_SB7(src, src_stride, src0, src1, src2, src3, src4, src5, src6);
1380 src += (7 * src_stride);
1388 LD_SB4(src, src_stride, src7, src8, src9, src10);
1389 src += (4 * src_stride);
1421 static void common_vt_8t_and_aver_dst_16w_mult_msa(const uint8_t *src,
1440 src -= (3 * src_stride);
1446 src_tmp = src;
1513 src += 16;
1518 static void common_vt_8t_and_aver_dst_16w_msa(const uint8_t *src,
1524 common_vt_8t_and_aver_dst_16w_mult_msa(src, src_stride, dst, dst_stride,
1528 static void common_vt_8t_and_aver_dst_32w_msa(const uint8_t *src,
1534 common_vt_8t_and_aver_dst_16w_mult_msa(src, src_stride, dst, dst_stride,
1538 static void common_vt_8t_and_aver_dst_64w_msa(const uint8_t *src,
1544 common_vt_8t_and_aver_dst_16w_mult_msa(src, src_stride, dst, dst_stride,
1548 static void common_hv_8ht_8vt_and_aver_dst_4w_msa(const uint8_t *src,
1566 src -= (3 + 3 * src_stride);
1576 LD_SB7(src, src_stride, src0, src1, src2, src3, src4, src5, src6);
1578 src += (7 * src_stride);
1597 LD_SB4(src, src_stride, src7, src8, src9, src10);
1599 src += (4 * src_stride);
1631 static void common_hv_8ht_8vt_and_aver_dst_8w_msa(const uint8_t *src,
1650 src -= (3 + 3 * src_stride);
1660 LD_SB7(src, src_stride, src0, src1, src2, src3, src4, src5, src6);
1661 src += (7 * src_stride);
1687 LD_SB4(src, src_stride, src7, src8, src9, src10);
1689 src += (4 * src_stride);
1735 static void common_hv_8ht_8vt_and_aver_dst_16w_msa(const uint8_t *src,
1746 common_hv_8ht_8vt_and_aver_dst_8w_msa(src, src_stride, dst, dst_stride,
1750 src += 8;
1755 static void common_hv_8ht_8vt_and_aver_dst_32w_msa(const uint8_t *src,
1766 common_hv_8ht_8vt_and_aver_dst_8w_msa(src, src_stride, dst, dst_stride,
1770 src += 8;
1775 static void common_hv_8ht_8vt_and_aver_dst_64w_msa(const uint8_t *src,
1786 common_hv_8ht_8vt_and_aver_dst_8w_msa(src, src_stride, dst, dst_stride,
1790 src += 8;
1795 static void common_hz_2t_4x4_msa(const uint8_t *src, int32_t src_stride,
1809 LD_SB4(src, src_stride, src0, src1, src2, src3);
1818 static void common_hz_2t_4x8_msa(const uint8_t *src, int32_t src_stride,
1833 LD_SB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
1848 const uint8_t *src, ptrdiff_t src_stride,
1854 common_hz_2t_4x4_msa(src, src_stride, dst, dst_stride, filter);
1856 common_hz_2t_4x8_msa(src, src_stride, dst, dst_stride, filter);
1860 static void common_hz_2t_8x4_msa(const uint8_t *src, int32_t src_stride,
1874 LD_SB4(src, src_stride, src0, src1, src2, src3);
1884 static void common_hz_2t_8x8mult_msa(const uint8_t *src, int32_t src_stride,
1898 LD_SB4(src, src_stride, src0, src1, src2, src3);
1899 src += (4 * src_stride);
1906 LD_SB4(src, src_stride, src0, src1, src2, src3);
1907 src += (4 * src_stride);
1922 LD_SB4(src, src_stride, src0, src1, src2, src3);
1923 src += (4 * src_stride);
1930 LD_SB4(src, src_stride, src0, src1, src2, src3);
1931 src += (4 * src_stride);
1947 const uint8_t *src, ptrdiff_t src_stride,
1953 common_hz_2t_8x4_msa(src, src_stride, dst, dst_stride, filter);
1955 common_hz_2t_8x8mult_msa(src, src_stride, dst, dst_stride, filter,
1961 const uint8_t *src, ptrdiff_t src_stride,
1978 LD_SB4(src, src_stride, src0, src2, src4, src6);
1979 LD_SB4(src + 8, src_stride, src1, src3, src5, src7);
1980 src += (4 * src_stride);
2002 LD_SB4(src, src_stride, src0, src2, src4, src6);
2003 LD_SB4(src + 8, src_stride, src1, src3, src5, src7);
2004 src += (4 * src_stride);
2028 const uint8_t *src, ptrdiff_t src_stride,
2044 src0 = LD_SB(src);
2045 src2 = LD_SB(src + 16);
2046 src3 = LD_SB(src + 24);
2048 src += src_stride;
2049 src4 = LD_SB(src);
2050 src6 = LD_SB(src + 16);
2051 src7 = LD_SB(src + 24);
2053 src += src_stride;
2075 const uint8_t *src, ptrdiff_t src_stride,
2091 src0 = LD_SB(src);
2092 src2 = LD_SB(src + 16);
2093 src4 = LD_SB(src + 32);
2094 src6 = LD_SB(src + 48);
2095 src7 = LD_SB(src + 56);
2097 src += src_stride;
2117 static void common_vt_2t_4x4_msa(const uint8_t *src, int32_t src_stride,
2130 LD_SB5(src, src_stride, src0, src1, src2, src3, src4);
2131 src += (5 * src_stride);
2143 static void common_vt_2t_4x8_msa(const uint8_t *src, int32_t src_stride,
2157 LD_SB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
2158 src += (8 * src_stride);
2160 src8 = LD_SB(src);
2161 src += src_stride;
2178 const uint8_t *src, ptrdiff_t src_stride,
2184 common_vt_2t_4x4_msa(src, src_stride, dst, dst_stride, filter);
2186 common_vt_2t_4x8_msa(src, src_stride, dst, dst_stride, filter);
2190 static void common_vt_2t_8x4_msa(const uint8_t *src, int32_t src_stride,
2203 LD_UB5(src, src_stride, src0, src1, src2, src3, src4);
2214 static void common_vt_2t_8x8mult_msa(const uint8_t *src, int32_t src_stride,
2229 src0 = LD_UB(src);
2230 src += src_stride;
2233 LD_UB8(src, src_stride, src1, src2, src3, src4, src5, src6, src7, src8);
2234 src += (8 * src_stride);
2260 const uint8_t *src, ptrdiff_t src_stride,
2266 common_vt_2t_8x4_msa(src, src_stride, dst, dst_stride, filter);
2268 common_vt_2t_8x8mult_msa(src, src_stride, dst, dst_stride, filter,
2274 const uint8_t *src, ptrdiff_t src_stride,
2288 src0 = LD_UB(src);
2289 src += src_stride;
2292 LD_UB4(src, src_stride, src1, src2, src3, src4);
2293 src += (4 * src_stride);
2328 const uint8_t *src, ptrdiff_t src_stride,
2342 src0 = LD_UB(src);
2343 src5 = LD_UB(src + 16);
2344 src += src_stride;
2347 LD_UB4(src, src_stride, src1, src2, src3, src4);
2351 LD_UB4(src + 16, src_stride, src6, src7, src8, src9);
2352 src += (4 * src_stride);
2406 const uint8_t *src, ptrdiff_t src_stride,
2420 LD_UB4(src, 16, src0, src3, src6, src9);
2421 src += src_stride;
2424 LD_UB2(src, src_stride, src1, src2);
2425 LD_UB2(src + 16, src_stride, src4, src5);
2426 LD_UB2(src + 32, src_stride, src7, src8);
2427 LD_UB2(src + 48, src_stride, src10, src11);
2428 src += (2 * src_stride);
2486 static void common_hv_2ht_2vt_4x4_msa(const uint8_t *src, int32_t src_stride,
2503 LD_SB5(src, src_stride, src0, src1, src2, src3, src4);
2519 static void common_hv_2ht_2vt_4x8_msa(const uint8_t *src, int32_t src_stride,
2538 LD_SB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
2539 src += (8 * src_stride);
2540 src8 = LD_SB(src);
2566 const uint8_t *src, ptrdiff_t src_stride,
2573 common_hv_2ht_2vt_4x4_msa(src, src_stride, dst, dst_stride,
2576 common_hv_2ht_2vt_4x8_msa(src, src_stride, dst, dst_stride,
2581 static void common_hv_2ht_2vt_8x4_msa(const uint8_t *src, int32_t src_stride,
2599 LD_SB5(src, src_stride, src0, src1, src2, src3, src4);
2624 static void common_hv_2ht_2vt_8x8mult_msa(const uint8_t *src, int32_t src_stride,
2644 src0 = LD_SB(src);
2645 src += src_stride;
2650 LD_SB4(src, src_stride, src1, src2, src3, src4);
2651 src += (4 * src_stride);
2669 LD_SB4(src, src_stride, src1, src2, src3, src4);
2670 src += (4 * src_stride);
2704 const uint8_t *src, ptrdiff_t src_stride,
2711 common_hv_2ht_2vt_8x4_msa(src, src_stride, dst, dst_stride,
2714 common_hv_2ht_2vt_8x8mult_msa(src, src_stride, dst, dst_stride,
2720 const uint8_t *src, ptrdiff_t src_stride,
2740 LD_SB2(src, 8, src0, src1);
2741 src += src_stride;
2748 LD_SB4(src, src_stride, src0, src2, src4, src6);
2749 LD_SB4(src + 8, src_stride, src1, src3, src5, src7);
2750 src += (4 * src_stride);
2791 const uint8_t *src, ptrdiff_t src_stride,
2797 ff_put_bilin_16hv_msa(dst, dst_stride, src, src_stride, height, mx, my);
2799 src += 16;
2805 const uint8_t *src, ptrdiff_t src_stride,
2811 ff_put_bilin_16hv_msa(dst, dst_stride, src, src_stride, height, mx, my);
2813 src += 16;
2818 static void common_hz_2t_and_aver_dst_4x4_msa(const uint8_t *src,
2834 LD_SB4(src, src_stride, src0, src1, src2, src3);
2847 static void common_hz_2t_and_aver_dst_4x8_msa(const uint8_t *src,
2864 LD_SB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
2882 const uint8_t *src, ptrdiff_t src_stride,
2888 common_hz_2t_and_aver_dst_4x4_msa(src, src_stride, dst, dst_stride,
2891 common_hz_2t_and_aver_dst_4x8_msa(src, src_stride, dst, dst_stride,
2896 static void common_hz_2t_and_aver_dst_8x4_msa(const uint8_t *src,
2912 LD_SB4(src, src_stride, src0, src1, src2, src3);
2924 static void common_hz_2t_and_aver_dst_8x8mult_msa(const uint8_t *src,
2942 LD_SB4(src, src_stride, src0, src1, src2, src3);
2943 src += (4 * src_stride);
2952 LD_SB4(src, src_stride, src0, src1, src2, src3);
2953 src += (4 * src_stride);
2969 LD_SB4(src, src_stride, src0, src1, src2, src3);
2970 src += (4 * src_stride);
2980 LD_SB4(src, src_stride, src0, src1, src2, src3);
2997 const uint8_t *src, ptrdiff_t src_stride,
3003 common_hz_2t_and_aver_dst_8x4_msa(src, src_stride, dst, dst_stride,
3006 common_hz_2t_and_aver_dst_8x8mult_msa(src, src_stride, dst, dst_stride,
3012 const uint8_t *src, ptrdiff_t src_stride,
3028 LD_SB4(src, src_stride, src0, src2, src4, src6);
3029 LD_SB4(src + 8, src_stride, src1, src3, src5, src7);
3030 src += (4 * src_stride);
3053 LD_SB4(src, src_stride, src0, src2, src4, src6);
3054 LD_SB4(src + 8, src_stride, src1, src3, src5, src7);
3055 src += (4 * src_stride);
3080 const uint8_t *src, ptrdiff_t src_stride,
3097 src0 = LD_SB(src);
3098 src2 = LD_SB(src + 16);
3099 src3 = LD_SB(src + 24);
3101 src += src_stride;
3102 src4 = LD_SB(src);
3103 src6 = LD_SB(src + 16);
3104 src7 = LD_SB(src + 24);
3106 src += src_stride;
3130 const uint8_t *src, ptrdiff_t src_stride,
3147 LD_SB4(src, 16, src0, src2, src4, src6);
3148 src7 = LD_SB(src + 56);
3150 src += src_stride;
3171 static void common_vt_2t_and_aver_dst_4x4_msa(const uint8_t *src,
3186 LD_SB4(src, src_stride, src0, src1, src2, src3);
3187 src += (4 * src_stride);
3189 src4 = LD_SB(src);
3190 src += src_stride;
3207 static void common_vt_2t_and_aver_dst_4x8_msa(const uint8_t *src,
3223 LD_SB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
3224 src += (8 * src_stride);
3225 src8 = LD_SB(src);
3247 const uint8_t *src, ptrdiff_t src_stride,
3253 common_vt_2t_and_aver_dst_4x4_msa(src, src_stride, dst, dst_stride,
3256 common_vt_2t_and_aver_dst_4x8_msa(src, src_stride, dst, dst_stride,
3261 static void common_vt_2t_and_aver_dst_8x4_msa(const uint8_t *src,
3277 LD_UB5(src, src_stride, src0, src1, src2, src3, src4);
3290 static void common_vt_2t_and_aver_dst_8x8mult_msa(const uint8_t *src,
3309 src0 = LD_UB(src);
3310 src += src_stride;
3313 LD_UB8(src, src_stride, src1, src2, src3, src4, src5, src6, src7, src8);
3314 src += (8 * src_stride);
3346 const uint8_t *src, ptrdiff_t src_stride,
3352 common_vt_2t_and_aver_dst_8x4_msa(src, src_stride, dst, dst_stride,
3355 common_vt_2t_and_aver_dst_8x8mult_msa(src, src_stride, dst, dst_stride,
3361 const uint8_t *src, ptrdiff_t src_stride,
3374 src0 = LD_UB(src);
3375 src += src_stride;
3378 LD_UB4(src, src_stride, src1, src2, src3, src4);
3379 src += (4 * src_stride);
3415 const uint8_t *src, ptrdiff_t src_stride,
3429 LD_UB2(src, 16, src0, src5);
3430 src += src_stride;
3433 LD_UB4(src, src_stride, src1, src2, src3, src4);
3438 LD_UB4(src + 16, src_stride, src6, src7, src8, src9);
3440 src += (4 * src_stride);
3495 const uint8_t *src, ptrdiff_t src_stride,
3511 LD_UB4(src, 16, src0, src3, src6, src9);
3512 src += src_stride;
3515 LD_UB2(src, src_stride, src1, src2);
3517 LD_UB2(src + 16, src_stride, src4, src5);
3519 LD_UB2(src + 32, src_stride, src7, src8);
3521 LD_UB2(src + 48, src_stride, src10, src11);
3523 src += (2 * src_stride);
3581 static void common_hv_2ht_2vt_and_aver_dst_4x4_msa(const uint8_t *src,
3603 LD_SB5(src, src_stride, src0, src1, src2, src3, src4);
3625 static void common_hv_2ht_2vt_and_aver_dst_4x8_msa(const uint8_t *src,
3649 LD_SB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
3650 src += (8 * src_stride);
3651 src8 = LD_SB(src);
3678 const uint8_t *src, ptrdiff_t src_stride,
3685 common_hv_2ht_2vt_and_aver_dst_4x4_msa(src, src_stride, dst, dst_stride,
3688 common_hv_2ht_2vt_and_aver_dst_4x8_msa(src, src_stride, dst, dst_stride,
3693 static void common_hv_2ht_2vt_and_aver_dst_8x4_msa(const uint8_t *src,
3715 LD_SB5(src, src_stride, src0, src1, src2, src3, src4);
3716 src += (5 * src_stride);
3743 static void common_hv_2ht_2vt_and_aver_dst_8x8mult_msa(const uint8_t *src,
3767 src0 = LD_SB(src);
3768 src += src_stride;
3773 LD_SB4(src, src_stride, src1, src2, src3, src4);
3774 src += (4 * src_stride);
3806 const uint8_t *src, ptrdiff_t src_stride,
3813 common_hv_2ht_2vt_and_aver_dst_8x4_msa(src, src_stride, dst, dst_stride,
3816 common_hv_2ht_2vt_and_aver_dst_8x8mult_msa(src, src_stride,
3824 const uint8_t *src, ptrdiff_t src_stride,
3844 LD_SB2(src, 8, src0, src1);
3845 src += src_stride;
3851 LD_SB4(src, src_stride, src0, src2, src4, src6);
3852 LD_SB4(src + 8, src_stride, src1, src3, src5, src7);
3853 src += (4 * src_stride);
3895 const uint8_t *src, ptrdiff_t src_stride,
3901 ff_avg_bilin_16hv_msa(dst, dst_stride, src, src_stride, height, mx, my);
3903 src += 16;
3909 const uint8_t *src, ptrdiff_t src_stride,
3915 ff_avg_bilin_16hv_msa(dst, dst_stride, src, src_stride, height, mx, my);
3917 src += 16;
3922 static void copy_width8_msa(const uint8_t *src, int32_t src_stride,
3931 LD4(src, src_stride, out0, out1, out2, out3);
3932 src += (4 * src_stride);
3933 LD4(src, src_stride, out4, out5, out6, out7);
3934 src += (4 * src_stride);
3943 LD4(src, src_stride, out0, out1, out2, out3);
3944 src += (4 * src_stride);
3952 static void copy_width16_msa(const uint8_t *src, int32_t src_stride,
3960 LD_UB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
3963 LD_UB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
3964 src += (8 * src_stride);
3967 LD_UB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
3968 src += (8 * src_stride);
3972 LD_UB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
3973 src += (8 * src_stride);
3976 LD_UB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
3977 src += (8 * src_stride);
3980 LD_UB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
3981 src += (8 * src_stride);
3984 LD_UB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
3988 LD_UB4(src, src_stride, src0, src1, src2, src3);
3989 src += (4 * src_stride);
3996 static void copy_width32_msa(const uint8_t *src, int32_t src_stride,
4005 LD_UB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
4007 LD_UB8(src + 16, src_stride, src0, src1, src2, src3, src4, src5, src6,
4009 src += (8 * src_stride);
4016 LD_UB4(src, src_stride, src0, src1, src2, src3);
4017 LD_UB4(src + 16, src_stride, src4, src5, src6, src7);
4018 src += (4 * src_stride);
4026 static void copy_width64_msa(const uint8_t *src, int32_t src_stride,
4035 LD_UB4(src, 16, src0, src1, src2, src3);
4036 src += src_stride;
4037 LD_UB4(src, 16, src4, src5, src6, src7);
4038 src += src_stride;
4039 LD_UB4(src, 16, src8, src9, src10, src11);
4040 src += src_stride;
4041 LD_UB4(src, 16, src12, src13, src14, src15);
4042 src += src_stride;
4055 static void avg_width4_msa(const uint8_t *src, int32_t src_stride,
4063 LW4(src, src_stride, tp0, tp1, tp2, tp3);
4064 src += 4 * src_stride;
4066 LW4(src, src_stride, tp0, tp1, tp2, tp3);
4075 LW4(src, src_stride, tp0, tp1, tp2, tp3);
4084 static void avg_width8_msa(const uint8_t *src, int32_t src_stride,
4095 LD4(src, src_stride, tp0, tp1, tp2, tp3);
4096 src += 4 * src_stride;
4097 LD4(src, src_stride, tp4, tp5, tp6, tp7);
4098 src += 4 * src_stride;
4115 LD4(src, src_stride, tp0, tp1, tp2, tp3);
4126 static void avg_width16_msa(const uint8_t *src, int32_t src_stride,
4136 LD_UB8(src, src_stride, src0, src1, src2, src3, src4, src5, src6, src7);
4137 src += (8 * src_stride);
4149 LD_UB4(src, src_stride, src0, src1, src2, src3);
4150 src += (4 * src_stride);
4161 static void avg_width32_msa(const uint8_t *src, int32_t src_stride,
4174 LD_UB4(src, src_stride, src0, src2, src4, src6);
4175 LD_UB4(src + 16, src_stride, src1, src3, src5, src7);
4176 src += (4 * src_stride);
4180 LD_UB4(src, src_stride, src8, src10, src12, src14);
4181 LD_UB4(src + 16, src_stride, src9, src11, src13, src15);
4182 src += (4 * src_stride);
4205 LD_UB4(src, src_stride, src0, src2, src4, src6);
4206 LD_UB4(src + 16, src_stride, src1, src3, src5, src7);
4207 src += (4 * src_stride);
4224 static void avg_width64_msa(const uint8_t *src, int32_t src_stride,
4236 LD_UB4(src, 16, src0, src1, src2, src3);
4237 src += src_stride;
4238 LD_UB4(src, 16, src4, src5, src6, src7);
4239 src += src_stride;
4240 LD_UB4(src, 16, src8, src9, src10, src11);
4241 src += src_stride;
4242 LD_UB4(src, 16, src12, src13, src14, src15);
4243 src += src_stride;
4328 const uint8_t *src, \
4334 common_hz_8t_##SIZE##w_msa(src, srcstride, dst, dststride, filter, h); \
4338 const uint8_t *src, \
4344 common_vt_8t_##SIZE##w_msa(src, srcstride, dst, dststride, filter, h); \
4348 const uint8_t *src, \
4355 common_hv_8ht_8vt_##SIZE##w_msa(src, srcstride, dst, dststride, hfilter, \
4360 const uint8_t *src, \
4366 common_hz_8t_and_aver_dst_##SIZE##w_msa(src, srcstride, dst, \
4371 const uint8_t *src, \
4377 common_vt_8t_and_aver_dst_##SIZE##w_msa(src, srcstride, dst, dststride, \
4382 const uint8_t *src, \
4389 common_hv_8ht_8vt_and_aver_dst_##SIZE##w_msa(src, srcstride, dst, \
4396 const uint8_t *src, ptrdiff_t srcstride, \
4400 copy_width##SIZE##_msa(src, srcstride, dst, dststride, h); \
4404 const uint8_t *src, ptrdiff_t srcstride, \
4408 avg_width##SIZE##_msa(src, srcstride, dst, dststride, h); \
4413 const uint8_t *src, ptrdiff_t srcstride, \
4417 avg_width##SIZE##_msa(src, srcstride, dst, dststride, h); \