1cabdff1aSopenharmony_ci/*
2cabdff1aSopenharmony_ci * Audio resampling
3cabdff1aSopenharmony_ci *
4cabdff1aSopenharmony_ci * Copyright (c) 2004-2012 Michael Niedermayer <michaelni@gmx.at>
5cabdff1aSopenharmony_ci *
6cabdff1aSopenharmony_ci * This file is part of FFmpeg.
7cabdff1aSopenharmony_ci *
8cabdff1aSopenharmony_ci * FFmpeg is free software; you can redistribute it and/or
9cabdff1aSopenharmony_ci * modify it under the terms of the GNU Lesser General Public
10cabdff1aSopenharmony_ci * License as published by the Free Software Foundation; either
11cabdff1aSopenharmony_ci * version 2.1 of the License, or (at your option) any later version.
12cabdff1aSopenharmony_ci *
13cabdff1aSopenharmony_ci * FFmpeg is distributed in the hope that it will be useful,
14cabdff1aSopenharmony_ci * but WITHOUT ANY WARRANTY; without even the implied warranty of
15cabdff1aSopenharmony_ci * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
16cabdff1aSopenharmony_ci * Lesser General Public License for more details.
17cabdff1aSopenharmony_ci *
18cabdff1aSopenharmony_ci * You should have received a copy of the GNU Lesser General Public
19cabdff1aSopenharmony_ci * License along with FFmpeg; if not, write to the Free Software
20cabdff1aSopenharmony_ci * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21cabdff1aSopenharmony_ci */
22cabdff1aSopenharmony_ci
23cabdff1aSopenharmony_ci#include "config.h"
24cabdff1aSopenharmony_ci
25cabdff1aSopenharmony_ci#include "libavutil/attributes.h"
26cabdff1aSopenharmony_ci#include "libavutil/cpu.h"
27cabdff1aSopenharmony_ci#include "libavutil/avassert.h"
28cabdff1aSopenharmony_ci
29cabdff1aSopenharmony_ci#include "libavutil/aarch64/cpu.h"
30cabdff1aSopenharmony_ci#include "libswresample/resample.h"
31cabdff1aSopenharmony_ci
32cabdff1aSopenharmony_ci#define DECLARE_RESAMPLE_COMMON_TEMPLATE(TYPE, DELEM, FELEM, FELEM2, OUT)                         \
33cabdff1aSopenharmony_ci                                                                                                  \
34cabdff1aSopenharmony_civoid ff_resample_common_apply_filter_x4_##TYPE##_neon(FELEM2 *acc, const DELEM *src,              \
35cabdff1aSopenharmony_ci                                                      const FELEM *filter, int length);           \
36cabdff1aSopenharmony_ci                                                                                                  \
37cabdff1aSopenharmony_civoid ff_resample_common_apply_filter_x8_##TYPE##_neon(FELEM2 *acc, const DELEM *src,              \
38cabdff1aSopenharmony_ci                                                      const FELEM *filter, int length);           \
39cabdff1aSopenharmony_ci                                                                                                  \
40cabdff1aSopenharmony_cistatic int ff_resample_common_##TYPE##_neon(ResampleContext *c, void *dest, const void *source,   \
41cabdff1aSopenharmony_ci                                            int n, int update_ctx)                                \
42cabdff1aSopenharmony_ci{                                                                                                 \
43cabdff1aSopenharmony_ci    DELEM *dst = dest;                                                                            \
44cabdff1aSopenharmony_ci    const DELEM *src = source;                                                                    \
45cabdff1aSopenharmony_ci    int dst_index;                                                                                \
46cabdff1aSopenharmony_ci    int index = c->index;                                                                         \
47cabdff1aSopenharmony_ci    int frac = c->frac;                                                                           \
48cabdff1aSopenharmony_ci    int sample_index = 0;                                                                         \
49cabdff1aSopenharmony_ci    int x4_aligned_filter_length = c->filter_length & ~3;                                         \
50cabdff1aSopenharmony_ci    int x8_aligned_filter_length = c->filter_length & ~7;                                         \
51cabdff1aSopenharmony_ci                                                                                                  \
52cabdff1aSopenharmony_ci    while (index >= c->phase_count) {                                                             \
53cabdff1aSopenharmony_ci        sample_index++;                                                                           \
54cabdff1aSopenharmony_ci        index -= c->phase_count;                                                                  \
55cabdff1aSopenharmony_ci    }                                                                                             \
56cabdff1aSopenharmony_ci                                                                                                  \
57cabdff1aSopenharmony_ci    for (dst_index = 0; dst_index < n; dst_index++) {                                             \
58cabdff1aSopenharmony_ci        FELEM *filter = ((FELEM *) c->filter_bank) + c->filter_alloc * index;                     \
59cabdff1aSopenharmony_ci                                                                                                  \
60cabdff1aSopenharmony_ci        FELEM2 val = 0;                                                                             \
61cabdff1aSopenharmony_ci        int i = 0;                                                                                \
62cabdff1aSopenharmony_ci        if (x8_aligned_filter_length >= 8) {                                                      \
63cabdff1aSopenharmony_ci            ff_resample_common_apply_filter_x8_##TYPE##_neon(&val, &src[sample_index],            \
64cabdff1aSopenharmony_ci                                                             filter, x8_aligned_filter_length);   \
65cabdff1aSopenharmony_ci            i += x8_aligned_filter_length;                                                        \
66cabdff1aSopenharmony_ci                                                                                                  \
67cabdff1aSopenharmony_ci        } else if (x4_aligned_filter_length >= 4) {                                               \
68cabdff1aSopenharmony_ci            ff_resample_common_apply_filter_x4_##TYPE##_neon(&val, &src[sample_index],            \
69cabdff1aSopenharmony_ci                                                             filter, x4_aligned_filter_length);   \
70cabdff1aSopenharmony_ci            i += x4_aligned_filter_length;                                                        \
71cabdff1aSopenharmony_ci        }                                                                                         \
72cabdff1aSopenharmony_ci        for (; i < c->filter_length; i++) {                                                       \
73cabdff1aSopenharmony_ci            val += src[sample_index + i] * (FELEM2)filter[i];                                     \
74cabdff1aSopenharmony_ci        }                                                                                         \
75cabdff1aSopenharmony_ci        OUT(dst[dst_index], val);                                                                 \
76cabdff1aSopenharmony_ci                                                                                                  \
77cabdff1aSopenharmony_ci        frac  += c->dst_incr_mod;                                                                 \
78cabdff1aSopenharmony_ci        index += c->dst_incr_div;                                                                 \
79cabdff1aSopenharmony_ci        if (frac >= c->src_incr) {                                                                \
80cabdff1aSopenharmony_ci            frac -= c->src_incr;                                                                  \
81cabdff1aSopenharmony_ci            index++;                                                                              \
82cabdff1aSopenharmony_ci        }                                                                                         \
83cabdff1aSopenharmony_ci                                                                                                  \
84cabdff1aSopenharmony_ci        while (index >= c->phase_count) {                                                         \
85cabdff1aSopenharmony_ci            sample_index++;                                                                       \
86cabdff1aSopenharmony_ci            index -= c->phase_count;                                                              \
87cabdff1aSopenharmony_ci        }                                                                                         \
88cabdff1aSopenharmony_ci    }                                                                                             \
89cabdff1aSopenharmony_ci                                                                                                  \
90cabdff1aSopenharmony_ci    if (update_ctx) {                                                                             \
91cabdff1aSopenharmony_ci        c->frac = frac;                                                                           \
92cabdff1aSopenharmony_ci        c->index = index;                                                                         \
93cabdff1aSopenharmony_ci    }                                                                                             \
94cabdff1aSopenharmony_ci                                                                                                  \
95cabdff1aSopenharmony_ci    return sample_index;                                                                          \
96cabdff1aSopenharmony_ci}                                                                                                 \
97cabdff1aSopenharmony_ci
98cabdff1aSopenharmony_ci#define OUT(d, v) d = v
99cabdff1aSopenharmony_ciDECLARE_RESAMPLE_COMMON_TEMPLATE(float, float, float, float, OUT)
100cabdff1aSopenharmony_ci#undef OUT
101cabdff1aSopenharmony_ci
102cabdff1aSopenharmony_ci#define OUT(d, v) (v) = ((v) + (1<<(14)))>>15; (d) = av_clip_int16(v)
103cabdff1aSopenharmony_ciDECLARE_RESAMPLE_COMMON_TEMPLATE(s16, int16_t, int16_t, int32_t, OUT)
104cabdff1aSopenharmony_ci#undef OUT
105cabdff1aSopenharmony_ci
106cabdff1aSopenharmony_ciav_cold void swri_resample_dsp_aarch64_init(ResampleContext *c)
107cabdff1aSopenharmony_ci{
108cabdff1aSopenharmony_ci    int cpu_flags = av_get_cpu_flags();
109cabdff1aSopenharmony_ci
110cabdff1aSopenharmony_ci    if (!have_neon(cpu_flags))
111cabdff1aSopenharmony_ci        return;
112cabdff1aSopenharmony_ci
113cabdff1aSopenharmony_ci    switch(c->format) {
114cabdff1aSopenharmony_ci    case AV_SAMPLE_FMT_FLTP:
115cabdff1aSopenharmony_ci        c->dsp.resample_common = ff_resample_common_float_neon;
116cabdff1aSopenharmony_ci        break;
117cabdff1aSopenharmony_ci    case AV_SAMPLE_FMT_S16P:
118cabdff1aSopenharmony_ci        c->dsp.resample_common = ff_resample_common_s16_neon;
119cabdff1aSopenharmony_ci        break;
120cabdff1aSopenharmony_ci    }
121cabdff1aSopenharmony_ci}
122