1/* 2 * ARM-NEON-optimized IDCT functions 3 * Copyright (c) 2008 Mans Rullgard <mans@mansr.com> 4 * Copyright (c) 2017 Matthieu Bouron <matthieu.bouron@gmail.com> 5 * 6 * This file is part of FFmpeg. 7 * 8 * FFmpeg is free software; you can redistribute it and/or 9 * modify it under the terms of the GNU Lesser General Public 10 * License as published by the Free Software Foundation; either 11 * version 2.1 of the License, or (at your option) any later version. 12 * 13 * FFmpeg is distributed in the hope that it will be useful, 14 * but WITHOUT ANY WARRANTY; without even the implied warranty of 15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 16 * Lesser General Public License for more details. 17 * 18 * You should have received a copy of the GNU Lesser General Public 19 * License along with FFmpeg; if not, write to the Free Software 20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA 21 */ 22 23#include "libavutil/attributes.h" 24#include "libavutil/cpu.h" 25#include "libavutil/arm/cpu.h" 26#include "libavcodec/avcodec.h" 27#include "libavcodec/idctdsp.h" 28#include "idct.h" 29 30void ff_put_pixels_clamped_neon(const int16_t *, uint8_t *, ptrdiff_t); 31void ff_put_signed_pixels_clamped_neon(const int16_t *, uint8_t *, ptrdiff_t); 32void ff_add_pixels_clamped_neon(const int16_t *, uint8_t *, ptrdiff_t); 33 34av_cold void ff_idctdsp_init_aarch64(IDCTDSPContext *c, AVCodecContext *avctx, 35 unsigned high_bit_depth) 36{ 37 int cpu_flags = av_get_cpu_flags(); 38 39 if (have_neon(cpu_flags)) { 40 if (!avctx->lowres && !high_bit_depth) { 41 if (avctx->idct_algo == FF_IDCT_AUTO || 42 avctx->idct_algo == FF_IDCT_SIMPLEAUTO || 43 avctx->idct_algo == FF_IDCT_SIMPLENEON) { 44 c->idct_put = ff_simple_idct_put_neon; 45 c->idct_add = ff_simple_idct_add_neon; 46 c->idct = ff_simple_idct_neon; 47 c->perm_type = FF_IDCT_PERM_PARTTRANS; 48 } 49 } 50 51 c->add_pixels_clamped = ff_add_pixels_clamped_neon; 52 c->put_pixels_clamped = ff_put_pixels_clamped_neon; 53 c->put_signed_pixels_clamped = ff_put_signed_pixels_clamped_neon; 54 } 55} 56