Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
Download
52867 views
1
/*
 * Copyright (C) 2011 Michael Niedermayer ([email protected])
 * Copyright (c) 2012 Justin Ruggles <[email protected]>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
21
22
#include <stdint.h>
23
24
#include "libavutil/common.h"
25
#include "libavutil/libm.h"
26
#include "libavutil/samplefmt.h"
27
#include "avresample.h"
28
#include "internal.h"
29
#include "audio_data.h"
30
#include "audio_mix.h"
31
32
/*
 * Channel positions.
 *
 * These are used as row (output channel) and column (input channel) indices
 * into the 64x64 mixing matrix in avresample_build_matrix(). That function
 * routes identical channels with (1ULL << i), so each value is expected to
 * equal the bit index of the corresponding AV_CH_* layout flag.
 */
#define FRONT_LEFT               0
#define FRONT_RIGHT              1
#define FRONT_CENTER             2
#define LOW_FREQUENCY            3
#define BACK_LEFT                4
#define BACK_RIGHT               5
#define FRONT_LEFT_OF_CENTER     6
#define FRONT_RIGHT_OF_CENTER    7
#define BACK_CENTER              8
#define SIDE_LEFT                9
#define SIDE_RIGHT              10
#define TOP_CENTER              11
#define TOP_FRONT_LEFT          12
#define TOP_FRONT_CENTER        13
#define TOP_FRONT_RIGHT         14
#define TOP_BACK_LEFT           15
#define TOP_BACK_CENTER         16
#define TOP_BACK_RIGHT          17
#define STEREO_LEFT             29
#define STEREO_RIGHT            30
#define WIDE_LEFT               31
#define WIDE_RIGHT              32
#define SURROUND_DIRECT_LEFT    33
#define SURROUND_DIRECT_RIGHT   34
#define LOW_FREQUENCY_2         35

/* Gain factor used for the dominant surround coefficient in the
 * Dolby Pro Logic II downmix. */
#define SQRT3_2      1.22474487139158904909  /* sqrt(3/2) */
60
61
/**
 * Test whether a masked channel pair is balanced.
 *
 * @param layout channel mask, normally already restricted to one
 *               left/right pair by the caller
 * @return 1 if no bit is set or if more than one bit is set,
 *         0 if exactly one bit is set
 */
static av_always_inline int even(uint64_t layout)
{
    /* layout & (layout - 1) clears the lowest set bit, so it is non-zero
     * only when at least two bits are set */
    return (!layout || !!(layout & (layout - 1)));
}
65
66
static int sane_layout(uint64_t layout)
67
{
68
/* check that there is at least 1 front speaker */
69
if (!(layout & AV_CH_LAYOUT_SURROUND))
70
return 0;
71
72
/* check for left/right symmetry */
73
if (!even(layout & (AV_CH_FRONT_LEFT | AV_CH_FRONT_RIGHT)) ||
74
!even(layout & (AV_CH_SIDE_LEFT | AV_CH_SIDE_RIGHT)) ||
75
!even(layout & (AV_CH_BACK_LEFT | AV_CH_BACK_RIGHT)) ||
76
!even(layout & (AV_CH_FRONT_LEFT_OF_CENTER | AV_CH_FRONT_RIGHT_OF_CENTER)) ||
77
!even(layout & (AV_CH_TOP_FRONT_LEFT | AV_CH_TOP_FRONT_RIGHT)) ||
78
!even(layout & (AV_CH_TOP_BACK_LEFT | AV_CH_TOP_BACK_RIGHT)) ||
79
!even(layout & (AV_CH_STEREO_LEFT | AV_CH_STEREO_RIGHT)) ||
80
!even(layout & (AV_CH_WIDE_LEFT | AV_CH_WIDE_RIGHT)) ||
81
!even(layout & (AV_CH_SURROUND_DIRECT_LEFT | AV_CH_SURROUND_DIRECT_RIGHT)))
82
return 0;
83
84
return 1;
85
}
86
87
int avresample_build_matrix(uint64_t in_layout, uint64_t out_layout,
88
double center_mix_level, double surround_mix_level,
89
double lfe_mix_level, int normalize,
90
double *matrix_out, int stride,
91
enum AVMatrixEncoding matrix_encoding)
92
{
93
int i, j, out_i, out_j;
94
double matrix[64][64] = {{0}};
95
int64_t unaccounted;
96
double maxcoef = 0;
97
int in_channels, out_channels;
98
99
if ((out_layout & AV_CH_LAYOUT_STEREO_DOWNMIX) == AV_CH_LAYOUT_STEREO_DOWNMIX) {
100
out_layout = AV_CH_LAYOUT_STEREO;
101
}
102
103
unaccounted = in_layout & ~out_layout;
104
105
in_channels = av_get_channel_layout_nb_channels( in_layout);
106
out_channels = av_get_channel_layout_nb_channels(out_layout);
107
108
memset(matrix_out, 0, out_channels * stride * sizeof(*matrix_out));
109
110
/* check if layouts are supported */
111
if (!in_layout || in_channels > AVRESAMPLE_MAX_CHANNELS)
112
return AVERROR(EINVAL);
113
if (!out_layout || out_channels > AVRESAMPLE_MAX_CHANNELS)
114
return AVERROR(EINVAL);
115
116
/* check if layouts are unbalanced or abnormal */
117
if (!sane_layout(in_layout) || !sane_layout(out_layout))
118
return AVERROR_PATCHWELCOME;
119
120
/* route matching input/output channels */
121
for (i = 0; i < 64; i++) {
122
if (in_layout & out_layout & (1ULL << i))
123
matrix[i][i] = 1.0;
124
}
125
126
/* mix front center to front left/right */
127
if (unaccounted & AV_CH_FRONT_CENTER) {
128
if ((out_layout & AV_CH_LAYOUT_STEREO) == AV_CH_LAYOUT_STEREO) {
129
if ((in_layout & AV_CH_LAYOUT_STEREO) == AV_CH_LAYOUT_STEREO) {
130
matrix[FRONT_LEFT ][FRONT_CENTER] += center_mix_level;
131
matrix[FRONT_RIGHT][FRONT_CENTER] += center_mix_level;
132
} else {
133
matrix[FRONT_LEFT ][FRONT_CENTER] += M_SQRT1_2;
134
matrix[FRONT_RIGHT][FRONT_CENTER] += M_SQRT1_2;
135
}
136
} else
137
return AVERROR_PATCHWELCOME;
138
}
139
/* mix front left/right to center */
140
if (unaccounted & AV_CH_LAYOUT_STEREO) {
141
if (out_layout & AV_CH_FRONT_CENTER) {
142
matrix[FRONT_CENTER][FRONT_LEFT ] += M_SQRT1_2;
143
matrix[FRONT_CENTER][FRONT_RIGHT] += M_SQRT1_2;
144
/* mix left/right/center to center */
145
if (in_layout & AV_CH_FRONT_CENTER)
146
matrix[FRONT_CENTER][FRONT_CENTER] = center_mix_level * M_SQRT2;
147
} else
148
return AVERROR_PATCHWELCOME;
149
}
150
/* mix back center to back, side, or front */
151
if (unaccounted & AV_CH_BACK_CENTER) {
152
if (out_layout & AV_CH_BACK_LEFT) {
153
matrix[BACK_LEFT ][BACK_CENTER] += M_SQRT1_2;
154
matrix[BACK_RIGHT][BACK_CENTER] += M_SQRT1_2;
155
} else if (out_layout & AV_CH_SIDE_LEFT) {
156
matrix[SIDE_LEFT ][BACK_CENTER] += M_SQRT1_2;
157
matrix[SIDE_RIGHT][BACK_CENTER] += M_SQRT1_2;
158
} else if (out_layout & AV_CH_FRONT_LEFT) {
159
if (matrix_encoding == AV_MATRIX_ENCODING_DOLBY ||
160
matrix_encoding == AV_MATRIX_ENCODING_DPLII) {
161
if (unaccounted & (AV_CH_BACK_LEFT | AV_CH_SIDE_LEFT)) {
162
matrix[FRONT_LEFT ][BACK_CENTER] -= surround_mix_level * M_SQRT1_2;
163
matrix[FRONT_RIGHT][BACK_CENTER] += surround_mix_level * M_SQRT1_2;
164
} else {
165
matrix[FRONT_LEFT ][BACK_CENTER] -= surround_mix_level;
166
matrix[FRONT_RIGHT][BACK_CENTER] += surround_mix_level;
167
}
168
} else {
169
matrix[FRONT_LEFT ][BACK_CENTER] += surround_mix_level * M_SQRT1_2;
170
matrix[FRONT_RIGHT][BACK_CENTER] += surround_mix_level * M_SQRT1_2;
171
}
172
} else if (out_layout & AV_CH_FRONT_CENTER) {
173
matrix[FRONT_CENTER][BACK_CENTER] += surround_mix_level * M_SQRT1_2;
174
} else
175
return AVERROR_PATCHWELCOME;
176
}
177
/* mix back left/right to back center, side, or front */
178
if (unaccounted & AV_CH_BACK_LEFT) {
179
if (out_layout & AV_CH_BACK_CENTER) {
180
matrix[BACK_CENTER][BACK_LEFT ] += M_SQRT1_2;
181
matrix[BACK_CENTER][BACK_RIGHT] += M_SQRT1_2;
182
} else if (out_layout & AV_CH_SIDE_LEFT) {
183
/* if side channels do not exist in the input, just copy back
184
channels to side channels, otherwise mix back into side */
185
if (in_layout & AV_CH_SIDE_LEFT) {
186
matrix[SIDE_LEFT ][BACK_LEFT ] += M_SQRT1_2;
187
matrix[SIDE_RIGHT][BACK_RIGHT] += M_SQRT1_2;
188
} else {
189
matrix[SIDE_LEFT ][BACK_LEFT ] += 1.0;
190
matrix[SIDE_RIGHT][BACK_RIGHT] += 1.0;
191
}
192
} else if (out_layout & AV_CH_FRONT_LEFT) {
193
if (matrix_encoding == AV_MATRIX_ENCODING_DOLBY) {
194
matrix[FRONT_LEFT ][BACK_LEFT ] -= surround_mix_level * M_SQRT1_2;
195
matrix[FRONT_LEFT ][BACK_RIGHT] -= surround_mix_level * M_SQRT1_2;
196
matrix[FRONT_RIGHT][BACK_LEFT ] += surround_mix_level * M_SQRT1_2;
197
matrix[FRONT_RIGHT][BACK_RIGHT] += surround_mix_level * M_SQRT1_2;
198
} else if (matrix_encoding == AV_MATRIX_ENCODING_DPLII) {
199
matrix[FRONT_LEFT ][BACK_LEFT ] -= surround_mix_level * SQRT3_2;
200
matrix[FRONT_LEFT ][BACK_RIGHT] -= surround_mix_level * M_SQRT1_2;
201
matrix[FRONT_RIGHT][BACK_LEFT ] += surround_mix_level * M_SQRT1_2;
202
matrix[FRONT_RIGHT][BACK_RIGHT] += surround_mix_level * SQRT3_2;
203
} else {
204
matrix[FRONT_LEFT ][BACK_LEFT ] += surround_mix_level;
205
matrix[FRONT_RIGHT][BACK_RIGHT] += surround_mix_level;
206
}
207
} else if (out_layout & AV_CH_FRONT_CENTER) {
208
matrix[FRONT_CENTER][BACK_LEFT ] += surround_mix_level * M_SQRT1_2;
209
matrix[FRONT_CENTER][BACK_RIGHT] += surround_mix_level * M_SQRT1_2;
210
} else
211
return AVERROR_PATCHWELCOME;
212
}
213
/* mix side left/right into back or front */
214
if (unaccounted & AV_CH_SIDE_LEFT) {
215
if (out_layout & AV_CH_BACK_LEFT) {
216
/* if back channels do not exist in the input, just copy side
217
channels to back channels, otherwise mix side into back */
218
if (in_layout & AV_CH_BACK_LEFT) {
219
matrix[BACK_LEFT ][SIDE_LEFT ] += M_SQRT1_2;
220
matrix[BACK_RIGHT][SIDE_RIGHT] += M_SQRT1_2;
221
} else {
222
matrix[BACK_LEFT ][SIDE_LEFT ] += 1.0;
223
matrix[BACK_RIGHT][SIDE_RIGHT] += 1.0;
224
}
225
} else if (out_layout & AV_CH_BACK_CENTER) {
226
matrix[BACK_CENTER][SIDE_LEFT ] += M_SQRT1_2;
227
matrix[BACK_CENTER][SIDE_RIGHT] += M_SQRT1_2;
228
} else if (out_layout & AV_CH_FRONT_LEFT) {
229
if (matrix_encoding == AV_MATRIX_ENCODING_DOLBY) {
230
matrix[FRONT_LEFT ][SIDE_LEFT ] -= surround_mix_level * M_SQRT1_2;
231
matrix[FRONT_LEFT ][SIDE_RIGHT] -= surround_mix_level * M_SQRT1_2;
232
matrix[FRONT_RIGHT][SIDE_LEFT ] += surround_mix_level * M_SQRT1_2;
233
matrix[FRONT_RIGHT][SIDE_RIGHT] += surround_mix_level * M_SQRT1_2;
234
} else if (matrix_encoding == AV_MATRIX_ENCODING_DPLII) {
235
matrix[FRONT_LEFT ][SIDE_LEFT ] -= surround_mix_level * SQRT3_2;
236
matrix[FRONT_LEFT ][SIDE_RIGHT] -= surround_mix_level * M_SQRT1_2;
237
matrix[FRONT_RIGHT][SIDE_LEFT ] += surround_mix_level * M_SQRT1_2;
238
matrix[FRONT_RIGHT][SIDE_RIGHT] += surround_mix_level * SQRT3_2;
239
} else {
240
matrix[FRONT_LEFT ][SIDE_LEFT ] += surround_mix_level;
241
matrix[FRONT_RIGHT][SIDE_RIGHT] += surround_mix_level;
242
}
243
} else if (out_layout & AV_CH_FRONT_CENTER) {
244
matrix[FRONT_CENTER][SIDE_LEFT ] += surround_mix_level * M_SQRT1_2;
245
matrix[FRONT_CENTER][SIDE_RIGHT] += surround_mix_level * M_SQRT1_2;
246
} else
247
return AVERROR_PATCHWELCOME;
248
}
249
/* mix left-of-center/right-of-center into front left/right or center */
250
if (unaccounted & AV_CH_FRONT_LEFT_OF_CENTER) {
251
if (out_layout & AV_CH_FRONT_LEFT) {
252
matrix[FRONT_LEFT ][FRONT_LEFT_OF_CENTER ] += 1.0;
253
matrix[FRONT_RIGHT][FRONT_RIGHT_OF_CENTER] += 1.0;
254
} else if (out_layout & AV_CH_FRONT_CENTER) {
255
matrix[FRONT_CENTER][FRONT_LEFT_OF_CENTER ] += M_SQRT1_2;
256
matrix[FRONT_CENTER][FRONT_RIGHT_OF_CENTER] += M_SQRT1_2;
257
} else
258
return AVERROR_PATCHWELCOME;
259
}
260
/* mix LFE into front left/right or center */
261
if (unaccounted & AV_CH_LOW_FREQUENCY) {
262
if (out_layout & AV_CH_FRONT_CENTER) {
263
matrix[FRONT_CENTER][LOW_FREQUENCY] += lfe_mix_level;
264
} else if (out_layout & AV_CH_FRONT_LEFT) {
265
matrix[FRONT_LEFT ][LOW_FREQUENCY] += lfe_mix_level * M_SQRT1_2;
266
matrix[FRONT_RIGHT][LOW_FREQUENCY] += lfe_mix_level * M_SQRT1_2;
267
} else
268
return AVERROR_PATCHWELCOME;
269
}
270
271
/* transfer internal matrix to output matrix and calculate maximum
272
per-channel coefficient sum */
273
for (out_i = i = 0; out_i < out_channels && i < 64; i++) {
274
double sum = 0;
275
for (out_j = j = 0; out_j < in_channels && j < 64; j++) {
276
matrix_out[out_i * stride + out_j] = matrix[i][j];
277
sum += fabs(matrix[i][j]);
278
if (in_layout & (1ULL << j))
279
out_j++;
280
}
281
maxcoef = FFMAX(maxcoef, sum);
282
if (out_layout & (1ULL << i))
283
out_i++;
284
}
285
286
/* normalize */
287
if (normalize && maxcoef > 1.0) {
288
for (i = 0; i < out_channels; i++)
289
for (j = 0; j < in_channels; j++)
290
matrix_out[i * stride + j] /= maxcoef;
291
}
292
293
return 0;
294
}
295
296