/*
 * Copyright (c) 2015 Parag Salasakar (parag.salasakar@imgtec.com)
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
20cabdff1aSopenharmony_ci
21cabdff1aSopenharmony_ci#include "libavutil/mips/generic_macros_msa.h"
22cabdff1aSopenharmony_ci#include "blockdsp_mips.h"
23cabdff1aSopenharmony_ci
24cabdff1aSopenharmony_cistatic void copy_8bit_value_width8_msa(uint8_t *src, uint8_t val,
25cabdff1aSopenharmony_ci                                       int32_t src_stride, int32_t height)
26cabdff1aSopenharmony_ci{
27cabdff1aSopenharmony_ci    int32_t cnt;
28cabdff1aSopenharmony_ci    uint64_t dst0;
29cabdff1aSopenharmony_ci    v16u8 val0;
30cabdff1aSopenharmony_ci
31cabdff1aSopenharmony_ci    val0 = (v16u8) __msa_fill_b(val);
32cabdff1aSopenharmony_ci    dst0 = __msa_copy_u_d((v2i64) val0, 0);
33cabdff1aSopenharmony_ci
34cabdff1aSopenharmony_ci    for (cnt = (height >> 2); cnt--;) {
35cabdff1aSopenharmony_ci        SD4(dst0, dst0, dst0, dst0, src, src_stride);
36cabdff1aSopenharmony_ci        src += (4 * src_stride);
37cabdff1aSopenharmony_ci    }
38cabdff1aSopenharmony_ci}
39cabdff1aSopenharmony_ci
40cabdff1aSopenharmony_cistatic void copy_8bit_value_width16_msa(uint8_t *src, uint8_t val,
41cabdff1aSopenharmony_ci                                        int32_t src_stride, int32_t height)
42cabdff1aSopenharmony_ci{
43cabdff1aSopenharmony_ci    int32_t cnt;
44cabdff1aSopenharmony_ci    v16u8 val0;
45cabdff1aSopenharmony_ci
46cabdff1aSopenharmony_ci    val0 = (v16u8) __msa_fill_b(val);
47cabdff1aSopenharmony_ci
48cabdff1aSopenharmony_ci    for (cnt = (height >> 3); cnt--;) {
49cabdff1aSopenharmony_ci        ST_UB8(val0, val0, val0, val0, val0, val0, val0, val0, src, src_stride);
50cabdff1aSopenharmony_ci        src += (8 * src_stride);
51cabdff1aSopenharmony_ci    }
52cabdff1aSopenharmony_ci}
53cabdff1aSopenharmony_ci
54cabdff1aSopenharmony_cistatic void memset_zero_16width_msa(uint8_t *src, int32_t stride,
55cabdff1aSopenharmony_ci                                    int32_t height)
56cabdff1aSopenharmony_ci{
57cabdff1aSopenharmony_ci    int8_t cnt;
58cabdff1aSopenharmony_ci    v16u8 zero = { 0 };
59cabdff1aSopenharmony_ci
60cabdff1aSopenharmony_ci    for (cnt = (height / 2); cnt--;) {
61cabdff1aSopenharmony_ci        ST_UB(zero, src);
62cabdff1aSopenharmony_ci        src += stride;
63cabdff1aSopenharmony_ci        ST_UB(zero, src);
64cabdff1aSopenharmony_ci        src += stride;
65cabdff1aSopenharmony_ci    }
66cabdff1aSopenharmony_ci}
67cabdff1aSopenharmony_ci
/*
 * Fill a 16-byte-wide block with a constant byte.
 *
 * src    - first row of the block
 * val    - byte value to store
 * stride - byte distance between rows; narrowed to int32_t for the helper
 * height - number of rows, forwarded to copy_8bit_value_width16_msa()
 */
void ff_fill_block16_msa(uint8_t *src, uint8_t val, ptrdiff_t stride, int height)
{
    /* The helper's stride and row-count parameters are 32-bit. */
    int32_t row_stride = (int32_t) stride;
    int32_t rows = height;

    copy_8bit_value_width16_msa(src, val, row_stride, rows);
}
72cabdff1aSopenharmony_ci
/*
 * Fill an 8-byte-wide block with a constant byte.
 *
 * src    - first row of the block
 * val    - byte value to store
 * stride - byte distance between rows; narrowed to int32_t for the helper
 * height - number of rows, forwarded to copy_8bit_value_width8_msa()
 */
void ff_fill_block8_msa(uint8_t *src, uint8_t val, ptrdiff_t stride, int height)
{
    /* The helper's stride and row-count parameters are 32-bit. */
    int32_t row_stride = (int32_t) stride;
    int32_t rows = height;

    copy_8bit_value_width8_msa(src, val, row_stride, rows);
}
77cabdff1aSopenharmony_ci
/*
 * Zero one coefficient block.
 *
 * The block is treated as raw bytes and cleared as 8 rows with a 16-byte
 * stride via memset_zero_16width_msa().
 */
void ff_clear_block_msa(int16_t *block)
{
    uint8_t *bytes = (uint8_t *) block;

    memset_zero_16width_msa(bytes, 16, 8);
}
82cabdff1aSopenharmony_ci
/*
 * Zero six consecutive coefficient blocks.
 *
 * The storage is treated as raw bytes and cleared as 8 * 6 rows with a
 * 16-byte stride via memset_zero_16width_msa().
 */
void ff_clear_blocks_msa(int16_t *block)
{
    uint8_t *bytes = (uint8_t *) block;

    memset_zero_16width_msa(bytes, 16, 8 * 6);
}
87