1cabdff1aSopenharmony_ci/* 2cabdff1aSopenharmony_ci * ARM NEON optimised DSP functions 3cabdff1aSopenharmony_ci * Copyright (c) 2008 Mans Rullgard <mans@mansr.com> 4cabdff1aSopenharmony_ci * 5cabdff1aSopenharmony_ci * This file is part of FFmpeg. 6cabdff1aSopenharmony_ci * 7cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or 8cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public 9cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either 10cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version. 11cabdff1aSopenharmony_ci * 12cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful, 13cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of 14cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 15cabdff1aSopenharmony_ci * Lesser General Public License for more details. 16cabdff1aSopenharmony_ci * 17cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public 18cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software 19cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 20cabdff1aSopenharmony_ci */ 21cabdff1aSopenharmony_ci 22cabdff1aSopenharmony_ci#include <stddef.h> 23cabdff1aSopenharmony_ci#include <stdint.h> 24cabdff1aSopenharmony_ci 25cabdff1aSopenharmony_ci#include "config.h" 26cabdff1aSopenharmony_ci 27cabdff1aSopenharmony_ci#include "libavutil/attributes.h" 28cabdff1aSopenharmony_ci#include "libavutil/cpu.h" 29cabdff1aSopenharmony_ci#include "libavutil/aarch64/cpu.h" 30cabdff1aSopenharmony_ci#include "libavcodec/hpeldsp.h" 31cabdff1aSopenharmony_ci 32cabdff1aSopenharmony_civoid ff_put_pixels16_neon(uint8_t *block, const uint8_t *pixels, 33cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 34cabdff1aSopenharmony_civoid ff_put_pixels16_x2_neon(uint8_t *block, const uint8_t *pixels, 35cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 36cabdff1aSopenharmony_civoid ff_put_pixels16_y2_neon(uint8_t *block, const uint8_t *pixels, 37cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 38cabdff1aSopenharmony_civoid ff_put_pixels16_xy2_neon(uint8_t *block, const uint8_t *pixels, 39cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 40cabdff1aSopenharmony_civoid ff_put_pixels8_neon(uint8_t *block, const uint8_t *pixels, 41cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 42cabdff1aSopenharmony_civoid ff_put_pixels8_x2_neon(uint8_t *block, const uint8_t *pixels, 43cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 44cabdff1aSopenharmony_civoid ff_put_pixels8_y2_neon(uint8_t *block, const uint8_t *pixels, 45cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 46cabdff1aSopenharmony_civoid ff_put_pixels8_xy2_neon(uint8_t *block, const uint8_t *pixels, 47cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 48cabdff1aSopenharmony_ci 49cabdff1aSopenharmony_civoid ff_put_pixels16_x2_no_rnd_neon(uint8_t *block, const uint8_t *pixels, 50cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 51cabdff1aSopenharmony_civoid ff_put_pixels16_y2_no_rnd_neon(uint8_t *block, const uint8_t *pixels, 52cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 53cabdff1aSopenharmony_civoid ff_put_pixels16_xy2_no_rnd_neon(uint8_t *block, const uint8_t *pixels, 54cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 55cabdff1aSopenharmony_civoid ff_put_pixels8_x2_no_rnd_neon(uint8_t *block, const uint8_t *pixels, 56cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 57cabdff1aSopenharmony_civoid ff_put_pixels8_y2_no_rnd_neon(uint8_t *block, const uint8_t *pixels, 58cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 59cabdff1aSopenharmony_civoid ff_put_pixels8_xy2_no_rnd_neon(uint8_t *block, const uint8_t *pixels, 60cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 61cabdff1aSopenharmony_ci 62cabdff1aSopenharmony_civoid ff_avg_pixels16_neon(uint8_t *block, const uint8_t *pixels, 63cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 64cabdff1aSopenharmony_civoid ff_avg_pixels16_x2_neon(uint8_t *block, const uint8_t *pixels, 65cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 66cabdff1aSopenharmony_civoid ff_avg_pixels16_y2_neon(uint8_t *block, const uint8_t *pixels, 67cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 68cabdff1aSopenharmony_civoid ff_avg_pixels16_xy2_neon(uint8_t *block, const uint8_t *pixels, 69cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 70cabdff1aSopenharmony_civoid ff_avg_pixels8_neon(uint8_t *block, const uint8_t *pixels, 71cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 72cabdff1aSopenharmony_civoid ff_avg_pixels8_x2_neon(uint8_t *block, const uint8_t *pixels, 73cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 74cabdff1aSopenharmony_civoid ff_avg_pixels8_y2_neon(uint8_t *block, const uint8_t *pixels, 75cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 76cabdff1aSopenharmony_civoid ff_avg_pixels8_xy2_neon(uint8_t *block, const uint8_t *pixels, 77cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 78cabdff1aSopenharmony_ci 79cabdff1aSopenharmony_civoid ff_avg_pixels16_x2_no_rnd_neon(uint8_t *block, const uint8_t *pixels, 80cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 81cabdff1aSopenharmony_civoid ff_avg_pixels16_y2_no_rnd_neon(uint8_t *block, const uint8_t *pixels, 82cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 83cabdff1aSopenharmony_civoid ff_avg_pixels16_xy2_no_rnd_neon(uint8_t *block, const uint8_t *pixels, 84cabdff1aSopenharmony_ci ptrdiff_t line_size, int h); 85cabdff1aSopenharmony_ci 86cabdff1aSopenharmony_ciav_cold void ff_hpeldsp_init_aarch64(HpelDSPContext *c, int flags) 87cabdff1aSopenharmony_ci{ 88cabdff1aSopenharmony_ci int cpu_flags = av_get_cpu_flags(); 89cabdff1aSopenharmony_ci 90cabdff1aSopenharmony_ci if (have_neon(cpu_flags)) { 91cabdff1aSopenharmony_ci c->put_pixels_tab[0][0] = ff_put_pixels16_neon; 92cabdff1aSopenharmony_ci c->put_pixels_tab[0][1] = ff_put_pixels16_x2_neon; 93cabdff1aSopenharmony_ci c->put_pixels_tab[0][2] = ff_put_pixels16_y2_neon; 94cabdff1aSopenharmony_ci c->put_pixels_tab[0][3] = ff_put_pixels16_xy2_neon; 95cabdff1aSopenharmony_ci c->put_pixels_tab[1][0] = ff_put_pixels8_neon; 96cabdff1aSopenharmony_ci c->put_pixels_tab[1][1] = ff_put_pixels8_x2_neon; 97cabdff1aSopenharmony_ci c->put_pixels_tab[1][2] = ff_put_pixels8_y2_neon; 98cabdff1aSopenharmony_ci c->put_pixels_tab[1][3] = ff_put_pixels8_xy2_neon; 99cabdff1aSopenharmony_ci 100cabdff1aSopenharmony_ci c->put_no_rnd_pixels_tab[0][0] = ff_put_pixels16_neon; 101cabdff1aSopenharmony_ci c->put_no_rnd_pixels_tab[0][1] = ff_put_pixels16_x2_no_rnd_neon; 102cabdff1aSopenharmony_ci c->put_no_rnd_pixels_tab[0][2] = ff_put_pixels16_y2_no_rnd_neon; 103cabdff1aSopenharmony_ci c->put_no_rnd_pixels_tab[0][3] = ff_put_pixels16_xy2_no_rnd_neon; 104cabdff1aSopenharmony_ci c->put_no_rnd_pixels_tab[1][0] = ff_put_pixels8_neon; 105cabdff1aSopenharmony_ci c->put_no_rnd_pixels_tab[1][1] = ff_put_pixels8_x2_no_rnd_neon; 106cabdff1aSopenharmony_ci c->put_no_rnd_pixels_tab[1][2] = ff_put_pixels8_y2_no_rnd_neon; 107cabdff1aSopenharmony_ci c->put_no_rnd_pixels_tab[1][3] = ff_put_pixels8_xy2_no_rnd_neon; 108cabdff1aSopenharmony_ci 109cabdff1aSopenharmony_ci c->avg_pixels_tab[0][0] = ff_avg_pixels16_neon; 110cabdff1aSopenharmony_ci c->avg_pixels_tab[0][1] = ff_avg_pixels16_x2_neon; 111cabdff1aSopenharmony_ci c->avg_pixels_tab[0][2] = ff_avg_pixels16_y2_neon; 112cabdff1aSopenharmony_ci c->avg_pixels_tab[0][3] = ff_avg_pixels16_xy2_neon; 113cabdff1aSopenharmony_ci c->avg_pixels_tab[1][0] = ff_avg_pixels8_neon; 114cabdff1aSopenharmony_ci c->avg_pixels_tab[1][1] = ff_avg_pixels8_x2_neon; 115cabdff1aSopenharmony_ci c->avg_pixels_tab[1][2] = ff_avg_pixels8_y2_neon; 116cabdff1aSopenharmony_ci c->avg_pixels_tab[1][3] = ff_avg_pixels8_xy2_neon; 117cabdff1aSopenharmony_ci 118cabdff1aSopenharmony_ci c->avg_no_rnd_pixels_tab[0] = ff_avg_pixels16_neon; 119cabdff1aSopenharmony_ci c->avg_no_rnd_pixels_tab[1] = ff_avg_pixels16_x2_no_rnd_neon; 120cabdff1aSopenharmony_ci c->avg_no_rnd_pixels_tab[2] = ff_avg_pixels16_y2_no_rnd_neon; 121cabdff1aSopenharmony_ci c->avg_no_rnd_pixels_tab[3] = ff_avg_pixels16_xy2_no_rnd_neon; 122cabdff1aSopenharmony_ci } 123cabdff1aSopenharmony_ci} 124