1 /*
2 * Bluetooth low-complexity, subband codec (SBC)
3 *
4 * Copyright (C) 2017 Aurelien Jacobs <aurel@gnuage.org>
5 * Copyright (C) 2008-2010 Nokia Corporation
6 * Copyright (C) 2004-2010 Marcel Holtmann <marcel@holtmann.org>
7 * Copyright (C) 2004-2005 Henryk Ploetz <henryk@ploetzli.ch>
8 * Copyright (C) 2005-2006 Brad Midgley <bmidgley@xmission.com>
9 *
10 * This file is part of FFmpeg.
11 *
12 * FFmpeg is free software; you can redistribute it and/or
13 * modify it under the terms of the GNU Lesser General Public
14 * License as published by the Free Software Foundation; either
15 * version 2.1 of the License, or (at your option) any later version.
16 *
17 * FFmpeg is distributed in the hope that it will be useful,
18 * but WITHOUT ANY WARRANTY; without even the implied warranty of
19 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20 * Lesser General Public License for more details.
21 *
22 * You should have received a copy of the GNU Lesser General Public
23 * License along with FFmpeg; if not, write to the Free Software
24 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
25 */
26
/**
 * @file
 * SBC ARM (ARMv6 and NEON) optimization for some basic "building bricks"
 */
31
32 #include "libavutil/cpu.h"
33 #include "libavutil/mem_internal.h"
34 #include "libavutil/arm/cpu.h"
35 #include "libavcodec/sbcdsp.h"
36
/*
 * ARMv6 versions of the SBC analysis routines. They are only declared in
 * this file; ff_sbcdsp_init_arm() installs them into the DSP context when
 * the CPU flags report ARMv6 support.
 */
void ff_sbc_analyze_4_armv6(const int16_t *in, int32_t *out,
                            const int16_t *consts);
void ff_sbc_analyze_8_armv6(const int16_t *in, int32_t *out,
                            const int16_t *consts);
39
40 void ff_sbc_analyze_4_neon(const int16_t *in, int32_t *out, const int16_t *consts);
41 void ff_sbc_analyze_8_neon(const int16_t *in, int32_t *out, const int16_t *consts);
42 void ff_sbc_calc_scalefactors_neon(int32_t sb_sample_f[16][2][8],
43 uint32_t scale_factor[2][8],
44 int blocks, int channels, int subbands);
45 int ff_sbc_calc_scalefactors_j_neon(int32_t sb_sample_f[16][2][8],
46 uint32_t scale_factor[2][8],
47 int blocks, int subbands);
48 int ff_sbc_enc_process_input_4s_neon(int position, const uint8_t *pcm,
49 int16_t X[2][SBC_X_BUFFER_SIZE],
50 int nsamples, int nchannels);
51 int ff_sbc_enc_process_input_8s_neon(int position, const uint8_t *pcm,
52 int16_t X[2][SBC_X_BUFFER_SIZE],
53 int nsamples, int nchannels);
54
55 DECLARE_ALIGNED(SBC_ALIGN, int32_t, ff_sbcdsp_joint_bits_mask)[8] = {
56 8, 4, 2, 1, 128, 64, 32, 16
57 };
58
/*
 * PERM(a, b, c, d) expands to a brace-enclosed initializer of eight byte
 * offsets. Each argument is the index of a 16-bit element and contributes
 * the offsets of that element's two bytes, 2 * idx and 2 * idx + 1. On
 * big-endian builds the two offsets of every pair are emitted in swapped
 * order.
 *
 * Every argument is parenthesized before it is doubled, so an expression
 * argument such as PERM(n + 1, ...) is scaled as a whole instead of being
 * split by operator precedence.
 */
#if HAVE_BIGENDIAN
#define PERM(a, b, c, d) {            \
        ((a) * 2) + 1, ((a) * 2) + 0, \
        ((b) * 2) + 1, ((b) * 2) + 0, \
        ((c) * 2) + 1, ((c) * 2) + 0, \
        ((d) * 2) + 1, ((d) * 2) + 0  \
    }
#else
#define PERM(a, b, c, d) {            \
        ((a) * 2) + 0, ((a) * 2) + 1, \
        ((b) * 2) + 0, ((b) * 2) + 1, \
        ((c) * 2) + 0, ((c) * 2) + 1, \
        ((d) * 2) + 0, ((d) * 2) + 1  \
    }
#endif
74
75 DECLARE_ALIGNED(SBC_ALIGN, uint8_t, ff_sbc_input_perm_4)[2][8] = {
76 PERM(7, 3, 6, 4),
77 PERM(0, 2, 1, 5)
78 };
79
80 DECLARE_ALIGNED(SBC_ALIGN, uint8_t, ff_sbc_input_perm_8)[4][8] = {
81 PERM(15, 7, 14, 8),
82 PERM(13, 9, 12, 10),
83 PERM(11, 3, 6, 0),
84 PERM( 5, 1, 4, 2)
85 };
86
ff_sbcdsp_init_arm(SBCDSPContext * s)87 av_cold void ff_sbcdsp_init_arm(SBCDSPContext *s)
88 {
89 int cpu_flags = av_get_cpu_flags();
90
91 if (have_armv6(cpu_flags)) {
92 s->sbc_analyze_4 = ff_sbc_analyze_4_armv6;
93 s->sbc_analyze_8 = ff_sbc_analyze_8_armv6;
94 }
95
96 if (have_neon(cpu_flags)) {
97 s->sbc_analyze_4 = ff_sbc_analyze_4_neon;
98 s->sbc_analyze_8 = ff_sbc_analyze_8_neon;
99 s->sbc_calc_scalefactors = ff_sbc_calc_scalefactors_neon;
100 s->sbc_calc_scalefactors_j = ff_sbc_calc_scalefactors_j_neon;
101 if (s->increment != 1) {
102 s->sbc_enc_process_input_4s = ff_sbc_enc_process_input_4s_neon;
103 s->sbc_enc_process_input_8s = ff_sbc_enc_process_input_8s_neon;
104 }
105 }
106 }
107