1cabdff1aSopenharmony_ci/*
2cabdff1aSopenharmony_ci * Loongson SIMD optimized blockdsp
3cabdff1aSopenharmony_ci *
4cabdff1aSopenharmony_ci * Copyright (c) 2015 Loongson Technology Corporation Limited
5cabdff1aSopenharmony_ci * Copyright (c) 2015 Zhou Xiaoyong <zhouxiaoyong@loongson.cn>
6cabdff1aSopenharmony_ci *
7cabdff1aSopenharmony_ci * This file is part of FFmpeg.
8cabdff1aSopenharmony_ci *
9cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or
10cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public
11cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either
12cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version.
13cabdff1aSopenharmony_ci *
14cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful,
15cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of
16cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
17cabdff1aSopenharmony_ci * Lesser General Public License for more details.
18cabdff1aSopenharmony_ci *
19cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public
20cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software
21cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
22cabdff1aSopenharmony_ci */
23cabdff1aSopenharmony_ci
24cabdff1aSopenharmony_ci#include "blockdsp_mips.h"
25cabdff1aSopenharmony_ci#include "libavutil/mips/mmiutils.h"
26cabdff1aSopenharmony_ci
27cabdff1aSopenharmony_civoid ff_fill_block16_mmi(uint8_t *block, uint8_t value, ptrdiff_t line_size, int h)
28cabdff1aSopenharmony_ci{
29cabdff1aSopenharmony_ci    double ftmp[1];
30cabdff1aSopenharmony_ci    DECLARE_VAR_ALL64;
31cabdff1aSopenharmony_ci
32cabdff1aSopenharmony_ci    __asm__ volatile (
33cabdff1aSopenharmony_ci        "mtc1       %[value],   %[ftmp0]                                \n\t"
34cabdff1aSopenharmony_ci        "punpcklbh  %[ftmp0],   %[ftmp0],       %[ftmp0]                \n\t"
35cabdff1aSopenharmony_ci        "punpcklbh  %[ftmp0],   %[ftmp0],       %[ftmp0]                \n\t"
36cabdff1aSopenharmony_ci        "punpcklbh  %[ftmp0],   %[ftmp0],       %[ftmp0]                \n\t"
37cabdff1aSopenharmony_ci        "1:                                                             \n\t"
38cabdff1aSopenharmony_ci        MMI_SDC1(%[ftmp0], %[block], 0x00)
39cabdff1aSopenharmony_ci        PTR_ADDI   "%[h],       %[h],           -0x01                   \n\t"
40cabdff1aSopenharmony_ci        MMI_SDC1(%[ftmp0], %[block], 0x08)
41cabdff1aSopenharmony_ci        PTR_ADDU   "%[block],   %[block],       %[line_size]            \n\t"
42cabdff1aSopenharmony_ci        "bnez       %[h],       1b                                      \n\t"
43cabdff1aSopenharmony_ci        : [ftmp0]"=&f"(ftmp[0]),
44cabdff1aSopenharmony_ci          RESTRICT_ASM_ALL64
45cabdff1aSopenharmony_ci          [block]"+&r"(block),              [h]"+&r"(h)
46cabdff1aSopenharmony_ci        : [value]"r"(value),                [line_size]"r"((mips_reg)line_size)
47cabdff1aSopenharmony_ci        : "memory"
48cabdff1aSopenharmony_ci    );
49cabdff1aSopenharmony_ci}
50cabdff1aSopenharmony_ci
51cabdff1aSopenharmony_civoid ff_fill_block8_mmi(uint8_t *block, uint8_t value, ptrdiff_t line_size, int h)
52cabdff1aSopenharmony_ci{
53cabdff1aSopenharmony_ci    double ftmp0;
54cabdff1aSopenharmony_ci    DECLARE_VAR_ALL64;
55cabdff1aSopenharmony_ci
56cabdff1aSopenharmony_ci    __asm__ volatile (
57cabdff1aSopenharmony_ci        "mtc1       %[value],   %[ftmp0]                                \n\t"
58cabdff1aSopenharmony_ci        "punpcklbh  %[ftmp0],   %[ftmp0],       %[ftmp0]                \n\t"
59cabdff1aSopenharmony_ci        "punpcklbh  %[ftmp0],   %[ftmp0],       %[ftmp0]                \n\t"
60cabdff1aSopenharmony_ci        "punpcklbh  %[ftmp0],   %[ftmp0],       %[ftmp0]                \n\t"
61cabdff1aSopenharmony_ci        "1:                                                             \n\t"
62cabdff1aSopenharmony_ci        MMI_SDC1(%[ftmp0], %[block], 0x00)
63cabdff1aSopenharmony_ci        PTR_ADDI   "%[h],       %[h],           -0x01                   \n\t"
64cabdff1aSopenharmony_ci        PTR_ADDU   "%[block],   %[block],       %[line_size]            \n\t"
65cabdff1aSopenharmony_ci        "bnez       %[h],       1b                                      \n\t"
66cabdff1aSopenharmony_ci        : [ftmp0]"=&f"(ftmp0),
67cabdff1aSopenharmony_ci          RESTRICT_ASM_ALL64
68cabdff1aSopenharmony_ci          [block]"+&r"(block),              [h]"+&r"(h)
69cabdff1aSopenharmony_ci        : [value]"r"(value),                [line_size]"r"((mips_reg)line_size)
70cabdff1aSopenharmony_ci        : "memory"
71cabdff1aSopenharmony_ci    );
72cabdff1aSopenharmony_ci}
73cabdff1aSopenharmony_ci
74cabdff1aSopenharmony_civoid ff_clear_block_mmi(int16_t *block)
75cabdff1aSopenharmony_ci{
76cabdff1aSopenharmony_ci    double ftmp[2];
77cabdff1aSopenharmony_ci
78cabdff1aSopenharmony_ci    __asm__ volatile (
79cabdff1aSopenharmony_ci        "pxor       %[ftmp0],   %[ftmp0],       %[ftmp0]                \n\t"
80cabdff1aSopenharmony_ci        "pxor       %[ftmp1],   %[ftmp1],       %[ftmp1]                \n\t"
81cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x00)
82cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x10)
83cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x20)
84cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x30)
85cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x40)
86cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x50)
87cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x60)
88cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x70)
89cabdff1aSopenharmony_ci        : [ftmp0]"=&f"(ftmp[0]),            [ftmp1]"=&f"(ftmp[1])
90cabdff1aSopenharmony_ci        : [block]"r"(block)
91cabdff1aSopenharmony_ci        : "memory"
92cabdff1aSopenharmony_ci    );
93cabdff1aSopenharmony_ci}
94cabdff1aSopenharmony_ci
95cabdff1aSopenharmony_civoid ff_clear_blocks_mmi(int16_t *block)
96cabdff1aSopenharmony_ci{
97cabdff1aSopenharmony_ci    double ftmp[2];
98cabdff1aSopenharmony_ci
99cabdff1aSopenharmony_ci    __asm__ volatile (
100cabdff1aSopenharmony_ci        "pxor       %[ftmp0],   %[ftmp0],       %[ftmp0]                \n\t"
101cabdff1aSopenharmony_ci        "pxor       %[ftmp1],   %[ftmp1],       %[ftmp1]                \n\t"
102cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x00)
103cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x10)
104cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x20)
105cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x30)
106cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x40)
107cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x50)
108cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x60)
109cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x70)
110cabdff1aSopenharmony_ci
111cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x80)
112cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x90)
113cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0xa0)
114cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0xb0)
115cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0xc0)
116cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0xd0)
117cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0xe0)
118cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0xf0)
119cabdff1aSopenharmony_ci
120cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x100)
121cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x110)
122cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x120)
123cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x130)
124cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x140)
125cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x150)
126cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x160)
127cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x170)
128cabdff1aSopenharmony_ci
129cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x180)
130cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x190)
131cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x1a0)
132cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x1b0)
133cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x1c0)
134cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x1d0)
135cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x1e0)
136cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x1f0)
137cabdff1aSopenharmony_ci
138cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x200)
139cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x210)
140cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x220)
141cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x230)
142cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x240)
143cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x250)
144cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x260)
145cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x270)
146cabdff1aSopenharmony_ci
147cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x280)
148cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x290)
149cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x2a0)
150cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x2b0)
151cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x2c0)
152cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x2d0)
153cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x2e0)
154cabdff1aSopenharmony_ci        MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x2f0)
155cabdff1aSopenharmony_ci        : [ftmp0]"=&f"(ftmp[0]),            [ftmp1]"=&f"(ftmp[1])
156cabdff1aSopenharmony_ci        : [block]"r"((uint64_t *)block)
157cabdff1aSopenharmony_ci        : "memory"
158cabdff1aSopenharmony_ci    );
159cabdff1aSopenharmony_ci}
160