1cabdff1aSopenharmony_ci/* 2cabdff1aSopenharmony_ci * Loongson SIMD optimized blockdsp 3cabdff1aSopenharmony_ci * 4cabdff1aSopenharmony_ci * Copyright (c) 2015 Loongson Technology Corporation Limited 5cabdff1aSopenharmony_ci * Copyright (c) 2015 Zhou Xiaoyong <zhouxiaoyong@loongson.cn> 6cabdff1aSopenharmony_ci * 7cabdff1aSopenharmony_ci * This file is part of FFmpeg. 8cabdff1aSopenharmony_ci * 9cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or 10cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public 11cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either 12cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version. 13cabdff1aSopenharmony_ci * 14cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful, 15cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of 16cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 17cabdff1aSopenharmony_ci * Lesser General Public License for more details. 18cabdff1aSopenharmony_ci * 19cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public 20cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software 21cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 22cabdff1aSopenharmony_ci */ 23cabdff1aSopenharmony_ci 24cabdff1aSopenharmony_ci#include "blockdsp_mips.h" 25cabdff1aSopenharmony_ci#include "libavutil/mips/mmiutils.h" 26cabdff1aSopenharmony_ci 27cabdff1aSopenharmony_civoid ff_fill_block16_mmi(uint8_t *block, uint8_t value, ptrdiff_t line_size, int h) 28cabdff1aSopenharmony_ci{ 29cabdff1aSopenharmony_ci double ftmp[1]; 30cabdff1aSopenharmony_ci DECLARE_VAR_ALL64; 31cabdff1aSopenharmony_ci 32cabdff1aSopenharmony_ci __asm__ volatile ( 33cabdff1aSopenharmony_ci "mtc1 %[value], %[ftmp0] \n\t" 34cabdff1aSopenharmony_ci "punpcklbh %[ftmp0], %[ftmp0], %[ftmp0] \n\t" 35cabdff1aSopenharmony_ci "punpcklbh %[ftmp0], %[ftmp0], %[ftmp0] \n\t" 36cabdff1aSopenharmony_ci "punpcklbh %[ftmp0], %[ftmp0], %[ftmp0] \n\t" 37cabdff1aSopenharmony_ci "1: \n\t" 38cabdff1aSopenharmony_ci MMI_SDC1(%[ftmp0], %[block], 0x00) 39cabdff1aSopenharmony_ci PTR_ADDI "%[h], %[h], -0x01 \n\t" 40cabdff1aSopenharmony_ci MMI_SDC1(%[ftmp0], %[block], 0x08) 41cabdff1aSopenharmony_ci PTR_ADDU "%[block], %[block], %[line_size] \n\t" 42cabdff1aSopenharmony_ci "bnez %[h], 1b \n\t" 43cabdff1aSopenharmony_ci : [ftmp0]"=&f"(ftmp[0]), 44cabdff1aSopenharmony_ci RESTRICT_ASM_ALL64 45cabdff1aSopenharmony_ci [block]"+&r"(block), [h]"+&r"(h) 46cabdff1aSopenharmony_ci : [value]"r"(value), [line_size]"r"((mips_reg)line_size) 47cabdff1aSopenharmony_ci : "memory" 48cabdff1aSopenharmony_ci ); 49cabdff1aSopenharmony_ci} 50cabdff1aSopenharmony_ci 51cabdff1aSopenharmony_civoid ff_fill_block8_mmi(uint8_t *block, uint8_t value, ptrdiff_t line_size, int h) 52cabdff1aSopenharmony_ci{ 53cabdff1aSopenharmony_ci double ftmp0; 54cabdff1aSopenharmony_ci DECLARE_VAR_ALL64; 55cabdff1aSopenharmony_ci 56cabdff1aSopenharmony_ci __asm__ volatile ( 57cabdff1aSopenharmony_ci "mtc1 %[value], %[ftmp0] \n\t" 58cabdff1aSopenharmony_ci "punpcklbh %[ftmp0], %[ftmp0], %[ftmp0] \n\t" 59cabdff1aSopenharmony_ci "punpcklbh %[ftmp0], %[ftmp0], %[ftmp0] \n\t" 60cabdff1aSopenharmony_ci "punpcklbh %[ftmp0], %[ftmp0], %[ftmp0] \n\t" 61cabdff1aSopenharmony_ci "1: \n\t" 62cabdff1aSopenharmony_ci MMI_SDC1(%[ftmp0], %[block], 0x00) 63cabdff1aSopenharmony_ci PTR_ADDI "%[h], %[h], -0x01 \n\t" 64cabdff1aSopenharmony_ci PTR_ADDU "%[block], %[block], %[line_size] \n\t" 65cabdff1aSopenharmony_ci "bnez %[h], 1b \n\t" 66cabdff1aSopenharmony_ci : [ftmp0]"=&f"(ftmp0), 67cabdff1aSopenharmony_ci RESTRICT_ASM_ALL64 68cabdff1aSopenharmony_ci [block]"+&r"(block), [h]"+&r"(h) 69cabdff1aSopenharmony_ci : [value]"r"(value), [line_size]"r"((mips_reg)line_size) 70cabdff1aSopenharmony_ci : "memory" 71cabdff1aSopenharmony_ci ); 72cabdff1aSopenharmony_ci} 73cabdff1aSopenharmony_ci 74cabdff1aSopenharmony_civoid ff_clear_block_mmi(int16_t *block) 75cabdff1aSopenharmony_ci{ 76cabdff1aSopenharmony_ci double ftmp[2]; 77cabdff1aSopenharmony_ci 78cabdff1aSopenharmony_ci __asm__ volatile ( 79cabdff1aSopenharmony_ci "pxor %[ftmp0], %[ftmp0], %[ftmp0] \n\t" 80cabdff1aSopenharmony_ci "pxor %[ftmp1], %[ftmp1], %[ftmp1] \n\t" 81cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x00) 82cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x10) 83cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x20) 84cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x30) 85cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x40) 86cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x50) 87cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x60) 88cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x70) 89cabdff1aSopenharmony_ci : [ftmp0]"=&f"(ftmp[0]), [ftmp1]"=&f"(ftmp[1]) 90cabdff1aSopenharmony_ci : [block]"r"(block) 91cabdff1aSopenharmony_ci : "memory" 92cabdff1aSopenharmony_ci ); 93cabdff1aSopenharmony_ci} 94cabdff1aSopenharmony_ci 95cabdff1aSopenharmony_civoid ff_clear_blocks_mmi(int16_t *block) 96cabdff1aSopenharmony_ci{ 97cabdff1aSopenharmony_ci double ftmp[2]; 98cabdff1aSopenharmony_ci 99cabdff1aSopenharmony_ci __asm__ volatile ( 100cabdff1aSopenharmony_ci "pxor %[ftmp0], %[ftmp0], %[ftmp0] \n\t" 101cabdff1aSopenharmony_ci "pxor %[ftmp1], %[ftmp1], %[ftmp1] \n\t" 102cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x00) 103cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x10) 104cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x20) 105cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x30) 106cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x40) 107cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x50) 108cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x60) 109cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x70) 110cabdff1aSopenharmony_ci 111cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x80) 112cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x90) 113cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0xa0) 114cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0xb0) 115cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0xc0) 116cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0xd0) 117cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0xe0) 118cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0xf0) 119cabdff1aSopenharmony_ci 120cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x100) 121cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x110) 122cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x120) 123cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x130) 124cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x140) 125cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x150) 126cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x160) 127cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x170) 128cabdff1aSopenharmony_ci 129cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x180) 130cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x190) 131cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x1a0) 132cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x1b0) 133cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x1c0) 134cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x1d0) 135cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x1e0) 136cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x1f0) 137cabdff1aSopenharmony_ci 138cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x200) 139cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x210) 140cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x220) 141cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x230) 142cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x240) 143cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x250) 144cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x260) 145cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x270) 146cabdff1aSopenharmony_ci 147cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x280) 148cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x290) 149cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x2a0) 150cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x2b0) 151cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x2c0) 152cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x2d0) 153cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x2e0) 154cabdff1aSopenharmony_ci MMI_SQC1(%[ftmp0], %[ftmp1], %[block], 0x2f0) 155cabdff1aSopenharmony_ci : [ftmp0]"=&f"(ftmp[0]), [ftmp1]"=&f"(ftmp[1]) 156cabdff1aSopenharmony_ci : [block]"r"((uint64_t *)block) 157cabdff1aSopenharmony_ci : "memory" 158cabdff1aSopenharmony_ci ); 159cabdff1aSopenharmony_ci} 160