flvdec: expose metadata through the generic metadata API
[libav.git] / libavcodec / libamr.c
1 /*
2 * AMR Audio decoder stub
3 * Copyright (c) 2003 the ffmpeg project
4 *
5 * This file is part of FFmpeg.
6 *
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
11 *
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
16 *
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20 */
21
22 /** @file
23 * Adaptive Multi-Rate (AMR) Audio decoder stub.
24 *
25 * This code implements both an AMR-NarrowBand (AMR-NB) and an AMR-WideBand
26 * (AMR-WB) audio encoder/decoder through external reference code from
27 * http://www.3gpp.org/. The license of the code from 3gpp is unclear so you
28 * have to download the code separately.
29 *
30 * \section AMR-NB
31 *
32 * The float version (default) can be downloaded from:
33 * http://www.3gpp.org/ftp/Specs/archive/26_series/26.104/26104-610.zip
34 *
35 * \subsection Specification
36 * The specification for AMR-NB can be found in TS 26.071
37 * (http://www.3gpp.org/ftp/Specs/html-info/26071.htm) and some other
38 * info at http://www.3gpp.org/ftp/Specs/html-info/26-series.htm.
39 *
40 * \section AMR-WB
41 *
42 * The reference code can be downloaded from:
43 * http://www.3gpp.org/ftp/Specs/archive/26_series/26.204/26204-600.zip
44 *
45 * \subsection Specification
46 * The specification for AMR-WB can be found in TS 26.171
47 * (http://www.3gpp.org/ftp/Specs/html-info/26171.htm) and some other
48 * info at http://www.3gpp.org/ftp/Specs/html-info/26-series.htm.
49 *
50 */
51
52 #include "avcodec.h"
53
54 static void amr_decode_fix_avctx(AVCodecContext *avctx)
55 {
56 const int is_amr_wb = 1 + (avctx->codec_id == CODEC_ID_AMR_WB);
57
58 if (!avctx->sample_rate)
59 avctx->sample_rate = 8000 * is_amr_wb;
60
61 if (!avctx->channels)
62 avctx->channels = 1;
63
64 avctx->frame_size = 160 * is_amr_wb;
65 avctx->sample_fmt = SAMPLE_FMT_S16;
66 }
67
68 #if CONFIG_LIBAMR_NB
69
70 #include <amrnb/interf_dec.h>
71 #include <amrnb/interf_enc.h>
72
/* Error text logged when the requested bitrate matches no AMR-NB mode. */
static const char nb_bitrate_unsupported[] =
    "bitrate not supported: use one of "
    "4.75k, 5.15k, 5.9k, 6.7k, 7.4k, 7.95k, 10.2k or 12.2k\n";
75
76 typedef struct AMR_bitrates {
77 int rate;
78 enum Mode mode;
79 } AMR_bitrates;
80
81 /* Match desired bitrate */
82 static int getBitrateMode(int bitrate)
83 {
84 /* make the correspondance between bitrate and mode */
85 AMR_bitrates rates[] = { { 4750, MR475},
86 { 5150, MR515},
87 { 5900, MR59},
88 { 6700, MR67},
89 { 7400, MR74},
90 { 7950, MR795},
91 {10200, MR102},
92 {12200, MR122}, };
93 int i;
94
95 for (i = 0; i < 8; i++)
96 if (rates[i].rate == bitrate)
97 return rates[i].mode;
98 /* no bitrate matching, return an error */
99 return -1;
100 }
101
/**
 * Private context shared by the AMR-NB decoder and encoder wrappers.
 *
 * Both state handles are opaque pointers owned by the external library:
 * they are obtained from its *_init() calls and released with the matching
 * *_exit() calls, and are never dereferenced in this file. They are
 * therefore both stored as void *.
 */
typedef struct AMRContext {
    int   frameCount;   /* reset in init, incremented per decoded frame */
    void *decState;     /* handle returned by Decoder_Interface_init() */
    void *enstate;      /* handle returned by Encoder_Interface_init() */
    int   enc_bitrate;  /* result of getBitrateMode() for the current bit_rate */
} AMRContext;
108
109 static av_cold int amr_nb_decode_init(AVCodecContext *avctx)
110 {
111 AMRContext *s = avctx->priv_data;
112
113 s->frameCount = 0;
114 s->decState = Decoder_Interface_init();
115 if (!s->decState) {
116 av_log(avctx, AV_LOG_ERROR, "Decoder_Interface_init error\r\n");
117 return -1;
118 }
119
120 amr_decode_fix_avctx(avctx);
121
122 if (avctx->channels > 1) {
123 av_log(avctx, AV_LOG_ERROR, "amr_nb: multichannel decoding not supported\n");
124 return -1;
125 }
126
127 return 0;
128 }
129
130 static av_cold int amr_nb_decode_close(AVCodecContext *avctx)
131 {
132 AMRContext *s = avctx->priv_data;
133
134 Decoder_Interface_exit(s->decState);
135 return 0;
136 }
137
138 static int amr_nb_decode_frame(AVCodecContext *avctx, void *data,
139 int *data_size, AVPacket *avpkt)
140 {
141 const uint8_t *buf = avpkt->data;
142 int buf_size = avpkt->size;
143 AMRContext *s = avctx->priv_data;
144 const uint8_t *amrData = buf;
145 static const uint8_t block_size[16] = { 12, 13, 15, 17, 19, 20, 26, 31, 5, 0, 0, 0, 0, 0, 0, 0 };
146 enum Mode dec_mode;
147 int packet_size;
148
149 /* av_log(NULL, AV_LOG_DEBUG, "amr_decode_frame buf=%p buf_size=%d frameCount=%d!!\n",
150 buf, buf_size, s->frameCount); */
151
152 dec_mode = (buf[0] >> 3) & 0x000F;
153 packet_size = block_size[dec_mode] + 1;
154
155 if (packet_size > buf_size) {
156 av_log(avctx, AV_LOG_ERROR, "amr frame too short (%u, should be %u)\n",
157 buf_size, packet_size);
158 return -1;
159 }
160
161 s->frameCount++;
162 /* av_log(NULL, AV_LOG_DEBUG, "packet_size=%d amrData= 0x%X %X %X %X\n",
163 packet_size, amrData[0], amrData[1], amrData[2], amrData[3]); */
164 /* call decoder */
165 Decoder_Interface_Decode(s->decState, amrData, data, 0);
166 *data_size = 160 * 2;
167
168 return packet_size;
169 }
170
171 AVCodec libamr_nb_decoder = {
172 "libamr_nb",
173 CODEC_TYPE_AUDIO,
174 CODEC_ID_AMR_NB,
175 sizeof(AMRContext),
176 amr_nb_decode_init,
177 NULL,
178 amr_nb_decode_close,
179 amr_nb_decode_frame,
180 .long_name = NULL_IF_CONFIG_SMALL("libamr-nb Adaptive Multi-Rate (AMR) Narrow-Band"),
181 };
182
183 static av_cold int amr_nb_encode_init(AVCodecContext *avctx)
184 {
185 AMRContext *s = avctx->priv_data;
186
187 s->frameCount = 0;
188
189 if (avctx->sample_rate != 8000) {
190 av_log(avctx, AV_LOG_ERROR, "Only 8000Hz sample rate supported\n");
191 return -1;
192 }
193
194 if (avctx->channels != 1) {
195 av_log(avctx, AV_LOG_ERROR, "Only mono supported\n");
196 return -1;
197 }
198
199 avctx->frame_size = 160;
200 avctx->coded_frame = avcodec_alloc_frame();
201
202 s->enstate=Encoder_Interface_init(0);
203 if (!s->enstate) {
204 av_log(avctx, AV_LOG_ERROR, "Encoder_Interface_init error\n");
205 return -1;
206 }
207
208 if ((s->enc_bitrate = getBitrateMode(avctx->bit_rate)) < 0) {
209 av_log(avctx, AV_LOG_ERROR, nb_bitrate_unsupported);
210 return -1;
211 }
212
213 return 0;
214 }
215
216 static av_cold int amr_nb_encode_close(AVCodecContext *avctx)
217 {
218 AMRContext *s = avctx->priv_data;
219
220 Encoder_Interface_exit(s->enstate);
221 av_freep(&avctx->coded_frame);
222 return 0;
223 }
224
225 static int amr_nb_encode_frame(AVCodecContext *avctx,
226 unsigned char *frame/*out*/,
227 int buf_size, void *data/*in*/)
228 {
229 AMRContext *s = avctx->priv_data;
230 int written;
231
232 if ((s->enc_bitrate = getBitrateMode(avctx->bit_rate)) < 0) {
233 av_log(avctx, AV_LOG_ERROR, nb_bitrate_unsupported);
234 return -1;
235 }
236
237 written = Encoder_Interface_Encode(s->enstate, s->enc_bitrate, data,
238 frame, 0);
239 /* av_log(NULL, AV_LOG_DEBUG, "amr_nb_encode_frame encoded %u bytes, bitrate %u, first byte was %#02x\n",
240 written, s->enc_bitrate, frame[0] ); */
241
242 return written;
243 }
244
245 AVCodec libamr_nb_encoder = {
246 "libamr_nb",
247 CODEC_TYPE_AUDIO,
248 CODEC_ID_AMR_NB,
249 sizeof(AMRContext),
250 amr_nb_encode_init,
251 amr_nb_encode_frame,
252 amr_nb_encode_close,
253 NULL,
254 .sample_fmts = (enum SampleFormat[]){SAMPLE_FMT_S16,SAMPLE_FMT_NONE},
255 .long_name = NULL_IF_CONFIG_SMALL("libamr-nb Adaptive Multi-Rate (AMR) Narrow-Band"),
256 };
257
258 #endif
259
260 /* -----------AMR wideband ------------*/
261 #if CONFIG_LIBAMR_WB
262
263 #ifdef _TYPEDEF_H
264 //To avoid duplicate typedefs from typedef in amr-nb
265 #define typedef_h
266 #endif
267
268 #include <amrwb/dec_if.h>
269 #include <amrwb/if_rom.h>
270
/* Error text logged when the requested bitrate matches no AMR-WB mode. */
static const char wb_bitrate_unsupported[] =
    "bitrate not supported: use one of "
    "6.6k, 8.85k, 12.65k, 14.25k, 15.85k, "
    "18.25k, 19.85k, 23.05k, or 23.85k\n";
273
/* One row of the AMR-WB bitrate table: a bitrate paired with a mode number. */
struct AMRWB_bitrates {
    int rate;  /* bitrate value compared against the requested one */
    int mode;  /* mode number returned when the rate matches */
};
typedef struct AMRWB_bitrates AMRWB_bitrates;
278
279 typedef struct AMRWBContext {
280 int frameCount;
281 void *state;
282 int mode;
283 Word16 allow_dtx;
284 } AMRWBContext;
285
286 #if CONFIG_LIBAMR_WB_ENCODER
287
288 #include <amrwb/enc_if.h>
289
/**
 * Match the desired bitrate against the AMR-WB mode table.
 *
 * @param bitrate requested bitrate; it must equal a table entry exactly
 * @return the mode number (0..8) paired with that bitrate, or -1 when no
 *         entry matches
 */
static int getWBBitrateMode(int bitrate)
{
    /* correspondence between bitrate and mode; constant, so built once */
    static const struct {
        int rate;
        int mode;
    } rates[] = {
        {  6600, 0 },
        {  8850, 1 },
        { 12650, 2 },
        { 14250, 3 },
        { 15850, 4 },
        { 18250, 5 },
        { 19850, 6 },
        { 23050, 7 },
        { 23850, 8 },
    };
    unsigned int i;

    /* the bound is derived from the table so the two cannot drift apart */
    for (i = 0; i < sizeof(rates) / sizeof(rates[0]); i++) {
        if (rates[i].rate == bitrate)
            return rates[i].mode;
    }

    /* no bitrate matching, return an error */
    return -1;
}
310
311 static av_cold int amr_wb_encode_init(AVCodecContext *avctx)
312 {
313 AMRWBContext *s = avctx->priv_data;
314
315 s->frameCount = 0;
316
317 if (avctx->sample_rate != 16000) {
318 av_log(avctx, AV_LOG_ERROR, "Only 16000Hz sample rate supported\n");
319 return -1;
320 }
321
322 if (avctx->channels != 1) {
323 av_log(avctx, AV_LOG_ERROR, "Only mono supported\n");
324 return -1;
325 }
326
327 if ((s->mode = getWBBitrateMode(avctx->bit_rate)) < 0) {
328 av_log(avctx, AV_LOG_ERROR, wb_bitrate_unsupported);
329 return -1;
330 }
331
332 avctx->frame_size = 320;
333 avctx->coded_frame = avcodec_alloc_frame();
334
335 s->state = E_IF_init();
336 s->allow_dtx = 0;
337
338 return 0;
339 }
340
341 static int amr_wb_encode_close(AVCodecContext *avctx)
342 {
343 AMRWBContext *s = avctx->priv_data;
344
345 E_IF_exit(s->state);
346 av_freep(&avctx->coded_frame);
347 s->frameCount++;
348 return 0;
349 }
350
351 static int amr_wb_encode_frame(AVCodecContext *avctx,
352 unsigned char *frame/*out*/,
353 int buf_size, void *data/*in*/)
354 {
355 AMRWBContext *s = avctx->priv_data;
356 int size;
357
358 if ((s->mode = getWBBitrateMode(avctx->bit_rate)) < 0) {
359 av_log(avctx, AV_LOG_ERROR, wb_bitrate_unsupported);
360 return -1;
361 }
362 size = E_IF_encode(s->state, s->mode, data, frame, s->allow_dtx);
363 return size;
364 }
365
366 AVCodec libamr_wb_encoder = {
367 "libamr_wb",
368 CODEC_TYPE_AUDIO,
369 CODEC_ID_AMR_WB,
370 sizeof(AMRWBContext),
371 amr_wb_encode_init,
372 amr_wb_encode_frame,
373 amr_wb_encode_close,
374 NULL,
375 .sample_fmts = (enum SampleFormat[]){SAMPLE_FMT_S16,SAMPLE_FMT_NONE},
376 .long_name = NULL_IF_CONFIG_SMALL("libamr-wb Adaptive Multi-Rate (AMR) Wide-Band"),
377 };
378
379 #endif
380
381 static av_cold int amr_wb_decode_init(AVCodecContext *avctx)
382 {
383 AMRWBContext *s = avctx->priv_data;
384
385 s->frameCount = 0;
386 s->state = D_IF_init();
387
388 amr_decode_fix_avctx(avctx);
389
390 if (avctx->channels > 1) {
391 av_log(avctx, AV_LOG_ERROR, "amr_wb: multichannel decoding not supported\n");
392 return -1;
393 }
394
395 return 0;
396 }
397
398 static int amr_wb_decode_frame(AVCodecContext *avctx, void *data,
399 int *data_size, AVPacket *avpkt)
400 {
401 const uint8_t *buf = avpkt->data;
402 int buf_size = avpkt->size;
403 AMRWBContext *s = avctx->priv_data;
404 const uint8_t *amrData = buf;
405 int mode;
406 int packet_size;
407 static const uint8_t block_size[16] = {18, 24, 33, 37, 41, 47, 51, 59, 61, 6, 6, 0, 0, 0, 1, 1};
408
409 if (!buf_size)
410 /* nothing to do */
411 return 0;
412
413 mode = (amrData[0] >> 3) & 0x000F;
414 packet_size = block_size[mode];
415
416 if (packet_size > buf_size) {
417 av_log(avctx, AV_LOG_ERROR, "amr frame too short (%u, should be %u)\n",
418 buf_size, packet_size + 1);
419 return -1;
420 }
421
422 s->frameCount++;
423 D_IF_decode(s->state, amrData, data, _good_frame);
424 *data_size = 320 * 2;
425 return packet_size;
426 }
427
428 static int amr_wb_decode_close(AVCodecContext *avctx)
429 {
430 AMRWBContext *s = avctx->priv_data;
431
432 D_IF_exit(s->state);
433 return 0;
434 }
435
436 AVCodec libamr_wb_decoder = {
437 "libamr_wb",
438 CODEC_TYPE_AUDIO,
439 CODEC_ID_AMR_WB,
440 sizeof(AMRWBContext),
441 amr_wb_decode_init,
442 NULL,
443 amr_wb_decode_close,
444 amr_wb_decode_frame,
445 .long_name = NULL_IF_CONFIG_SMALL("libamr-wb Adaptive Multi-Rate (AMR) Wide-Band"),
446 };
447
448 #endif //CONFIG_LIBAMR_WB