1cabdff1aSopenharmony_ci/* 2cabdff1aSopenharmony_ci * Copyright (c) 2020 Reimar Döffinger 3cabdff1aSopenharmony_ci * 4cabdff1aSopenharmony_ci * This file is part of FFmpeg. 5cabdff1aSopenharmony_ci * 6cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or 7cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public 8cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either 9cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version. 10cabdff1aSopenharmony_ci * 11cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful, 12cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of 13cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14cabdff1aSopenharmony_ci * Lesser General Public License for more details. 15cabdff1aSopenharmony_ci * 16cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public 17cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software 18cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 19cabdff1aSopenharmony_ci */ 20cabdff1aSopenharmony_ci 21cabdff1aSopenharmony_ci#include <stdint.h> 22cabdff1aSopenharmony_ci 23cabdff1aSopenharmony_ci#include "libavutil/attributes.h" 24cabdff1aSopenharmony_ci#include "libavutil/cpu.h" 25cabdff1aSopenharmony_ci#include "libavutil/aarch64/cpu.h" 26cabdff1aSopenharmony_ci#include "libavcodec/hevcdsp.h" 27cabdff1aSopenharmony_ci 28cabdff1aSopenharmony_civoid ff_hevc_add_residual_4x4_8_neon(uint8_t *_dst, int16_t *coeffs, 29cabdff1aSopenharmony_ci ptrdiff_t stride); 30cabdff1aSopenharmony_civoid ff_hevc_add_residual_4x4_10_neon(uint8_t *_dst, int16_t *coeffs, 31cabdff1aSopenharmony_ci ptrdiff_t stride); 32cabdff1aSopenharmony_civoid ff_hevc_add_residual_8x8_8_neon(uint8_t *_dst, int16_t *coeffs, 33cabdff1aSopenharmony_ci ptrdiff_t stride); 34cabdff1aSopenharmony_civoid ff_hevc_add_residual_8x8_10_neon(uint8_t *_dst, int16_t *coeffs, 35cabdff1aSopenharmony_ci ptrdiff_t stride); 36cabdff1aSopenharmony_civoid ff_hevc_add_residual_16x16_8_neon(uint8_t *_dst, int16_t *coeffs, 37cabdff1aSopenharmony_ci ptrdiff_t stride); 38cabdff1aSopenharmony_civoid ff_hevc_add_residual_16x16_10_neon(uint8_t *_dst, int16_t *coeffs, 39cabdff1aSopenharmony_ci ptrdiff_t stride); 40cabdff1aSopenharmony_civoid ff_hevc_add_residual_32x32_8_neon(uint8_t *_dst, int16_t *coeffs, 41cabdff1aSopenharmony_ci ptrdiff_t stride); 42cabdff1aSopenharmony_civoid ff_hevc_add_residual_32x32_10_neon(uint8_t *_dst, int16_t *coeffs, 43cabdff1aSopenharmony_ci ptrdiff_t stride); 44cabdff1aSopenharmony_civoid ff_hevc_idct_8x8_8_neon(int16_t *coeffs, int col_limit); 45cabdff1aSopenharmony_civoid ff_hevc_idct_8x8_10_neon(int16_t *coeffs, int col_limit); 46cabdff1aSopenharmony_civoid ff_hevc_idct_16x16_8_neon(int16_t *coeffs, int col_limit); 47cabdff1aSopenharmony_civoid ff_hevc_idct_16x16_10_neon(int16_t *coeffs, int col_limit); 48cabdff1aSopenharmony_civoid ff_hevc_idct_4x4_dc_8_neon(int16_t *coeffs); 49cabdff1aSopenharmony_civoid ff_hevc_idct_8x8_dc_8_neon(int16_t *coeffs); 50cabdff1aSopenharmony_civoid ff_hevc_idct_16x16_dc_8_neon(int16_t *coeffs); 51cabdff1aSopenharmony_civoid ff_hevc_idct_32x32_dc_8_neon(int16_t *coeffs); 52cabdff1aSopenharmony_civoid ff_hevc_idct_4x4_dc_10_neon(int16_t *coeffs); 53cabdff1aSopenharmony_civoid ff_hevc_idct_8x8_dc_10_neon(int16_t *coeffs); 54cabdff1aSopenharmony_civoid ff_hevc_idct_16x16_dc_10_neon(int16_t *coeffs); 55cabdff1aSopenharmony_civoid ff_hevc_idct_32x32_dc_10_neon(int16_t *coeffs); 56cabdff1aSopenharmony_civoid ff_hevc_sao_band_filter_8x8_8_neon(uint8_t *_dst, uint8_t *_src, 57cabdff1aSopenharmony_ci ptrdiff_t stride_dst, ptrdiff_t stride_src, 58cabdff1aSopenharmony_ci int16_t *sao_offset_val, int sao_left_class, 59cabdff1aSopenharmony_ci int width, int height); 60cabdff1aSopenharmony_civoid ff_hevc_sao_edge_filter_16x16_8_neon(uint8_t *dst, uint8_t *src, ptrdiff_t stride_dst, 61cabdff1aSopenharmony_ci int16_t *sao_offset_val, int eo, int width, int height); 62cabdff1aSopenharmony_civoid ff_hevc_sao_edge_filter_8x8_8_neon(uint8_t *dst, uint8_t *src, ptrdiff_t stride_dst, 63cabdff1aSopenharmony_ci int16_t *sao_offset_val, int eo, int width, int height); 64cabdff1aSopenharmony_ci 65cabdff1aSopenharmony_ciav_cold void ff_hevc_dsp_init_aarch64(HEVCDSPContext *c, const int bit_depth) 66cabdff1aSopenharmony_ci{ 67cabdff1aSopenharmony_ci if (!have_neon(av_get_cpu_flags())) return; 68cabdff1aSopenharmony_ci 69cabdff1aSopenharmony_ci if (bit_depth == 8) { 70cabdff1aSopenharmony_ci c->add_residual[0] = ff_hevc_add_residual_4x4_8_neon; 71cabdff1aSopenharmony_ci c->add_residual[1] = ff_hevc_add_residual_8x8_8_neon; 72cabdff1aSopenharmony_ci c->add_residual[2] = ff_hevc_add_residual_16x16_8_neon; 73cabdff1aSopenharmony_ci c->add_residual[3] = ff_hevc_add_residual_32x32_8_neon; 74cabdff1aSopenharmony_ci c->idct[1] = ff_hevc_idct_8x8_8_neon; 75cabdff1aSopenharmony_ci c->idct[2] = ff_hevc_idct_16x16_8_neon; 76cabdff1aSopenharmony_ci c->idct_dc[0] = ff_hevc_idct_4x4_dc_8_neon; 77cabdff1aSopenharmony_ci c->idct_dc[1] = ff_hevc_idct_8x8_dc_8_neon; 78cabdff1aSopenharmony_ci c->idct_dc[2] = ff_hevc_idct_16x16_dc_8_neon; 79cabdff1aSopenharmony_ci c->idct_dc[3] = ff_hevc_idct_32x32_dc_8_neon; 80cabdff1aSopenharmony_ci c->sao_band_filter[0] = 81cabdff1aSopenharmony_ci c->sao_band_filter[1] = 82cabdff1aSopenharmony_ci c->sao_band_filter[2] = 83cabdff1aSopenharmony_ci c->sao_band_filter[3] = 84cabdff1aSopenharmony_ci c->sao_band_filter[4] = ff_hevc_sao_band_filter_8x8_8_neon; 85cabdff1aSopenharmony_ci c->sao_edge_filter[0] = ff_hevc_sao_edge_filter_8x8_8_neon; 86cabdff1aSopenharmony_ci c->sao_edge_filter[1] = 87cabdff1aSopenharmony_ci c->sao_edge_filter[2] = 88cabdff1aSopenharmony_ci c->sao_edge_filter[3] = 89cabdff1aSopenharmony_ci c->sao_edge_filter[4] = ff_hevc_sao_edge_filter_16x16_8_neon; 90cabdff1aSopenharmony_ci } 91cabdff1aSopenharmony_ci if (bit_depth == 10) { 92cabdff1aSopenharmony_ci c->add_residual[0] = ff_hevc_add_residual_4x4_10_neon; 93cabdff1aSopenharmony_ci c->add_residual[1] = ff_hevc_add_residual_8x8_10_neon; 94cabdff1aSopenharmony_ci c->add_residual[2] = ff_hevc_add_residual_16x16_10_neon; 95cabdff1aSopenharmony_ci c->add_residual[3] = ff_hevc_add_residual_32x32_10_neon; 96cabdff1aSopenharmony_ci c->idct[1] = ff_hevc_idct_8x8_10_neon; 97cabdff1aSopenharmony_ci c->idct[2] = ff_hevc_idct_16x16_10_neon; 98cabdff1aSopenharmony_ci c->idct_dc[0] = ff_hevc_idct_4x4_dc_10_neon; 99cabdff1aSopenharmony_ci c->idct_dc[1] = ff_hevc_idct_8x8_dc_10_neon; 100cabdff1aSopenharmony_ci c->idct_dc[2] = ff_hevc_idct_16x16_dc_10_neon; 101cabdff1aSopenharmony_ci c->idct_dc[3] = ff_hevc_idct_32x32_dc_10_neon; 102cabdff1aSopenharmony_ci } 103cabdff1aSopenharmony_ci} 104