changing AVCodecContext codec -> *codec in AVStream so additions to AVCodecContext...
[libav.git] / libavformat / wav.c
1 /*
2 * WAV encoder and decoder
3 * Copyright (c) 2001, 2002 Fabrice Bellard.
4 *
5 * This library is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU Lesser General Public
7 * License as published by the Free Software Foundation; either
8 * version 2 of the License, or (at your option) any later version.
9 *
10 * This library is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * Lesser General Public License for more details.
14 *
15 * You should have received a copy of the GNU Lesser General Public
16 * License along with this library; if not, write to the Free Software
17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
18 */
19 #include "avformat.h"
20 #include "avi.h"
21
22 const CodecTag codec_wav_tags[] = {
23 { CODEC_ID_MP2, 0x50 },
24 { CODEC_ID_MP3, 0x55 },
25 { CODEC_ID_AC3, 0x2000 },
26 { CODEC_ID_PCM_S16LE, 0x01 },
27 { CODEC_ID_PCM_U8, 0x01 }, /* must come after s16le in this list */
28 { CODEC_ID_PCM_ALAW, 0x06 },
29 { CODEC_ID_PCM_MULAW, 0x07 },
30 { CODEC_ID_ADPCM_MS, 0x02 },
31 { CODEC_ID_ADPCM_IMA_WAV, 0x11 },
32 { CODEC_ID_ADPCM_YAMAHA, 0x20 },
33 { CODEC_ID_ADPCM_G726, 0x45 },
34 { CODEC_ID_ADPCM_IMA_DK4, 0x61 }, /* rogue format number */
35 { CODEC_ID_ADPCM_IMA_DK3, 0x62 }, /* rogue format number */
36 { CODEC_ID_WMAV1, 0x160 },
37 { CODEC_ID_WMAV2, 0x161 },
38 { CODEC_ID_AAC, 0x706d },
39 { CODEC_ID_VORBIS, ('V'<<8)+'o' }, //HACK/FIXME, does vorbis in WAV/AVI have an (in)official id?
40 { CODEC_ID_SONIC, 0x2048 },
41 { CODEC_ID_SONIC_LS, 0x2048 },
42 { CODEC_ID_ADPCM_CT, 0x200 },
43 { CODEC_ID_ADPCM_SWF, ('S'<<8)+'F' },
44 { 0, 0 },
45 };
46
47 #ifdef CONFIG_ENCODERS
48 /* WAVEFORMATEX header */
49 /* returns the size or -1 on error */
50 int put_wav_header(ByteIOContext *pb, AVCodecContext *enc)
51 {
52 int bps, blkalign, bytespersec;
53 int hdrsize = 18;
54
55 if(!enc->codec_tag)
56 enc->codec_tag = codec_get_tag(codec_wav_tags, enc->codec_id);
57 if(!enc->codec_tag)
58 return -1;
59
60 put_le16(pb, enc->codec_tag);
61 put_le16(pb, enc->channels);
62 put_le32(pb, enc->sample_rate);
63 if (enc->codec_id == CODEC_ID_PCM_U8 ||
64 enc->codec_id == CODEC_ID_PCM_ALAW ||
65 enc->codec_id == CODEC_ID_PCM_MULAW) {
66 bps = 8;
67 } else if (enc->codec_id == CODEC_ID_MP2 || enc->codec_id == CODEC_ID_MP3) {
68 bps = 0;
69 } else if (enc->codec_id == CODEC_ID_ADPCM_IMA_WAV || enc->codec_id == CODEC_ID_ADPCM_MS || enc->codec_id == CODEC_ID_ADPCM_G726 || enc->codec_id == CODEC_ID_ADPCM_YAMAHA) { //
70 bps = 4;
71 } else {
72 bps = 16;
73 }
74
75 if (enc->codec_id == CODEC_ID_MP2 || enc->codec_id == CODEC_ID_MP3) {
76 blkalign = enc->frame_size; //this is wrong, but seems many demuxers dont work if this is set correctly
77 //blkalign = 144 * enc->bit_rate/enc->sample_rate;
78 } else if (enc->codec_id == CODEC_ID_ADPCM_G726) { //
79 blkalign = 1;
80 } else if (enc->block_align != 0) { /* specified by the codec */
81 blkalign = enc->block_align;
82 } else
83 blkalign = enc->channels*bps >> 3;
84 if (enc->codec_id == CODEC_ID_PCM_U8 ||
85 enc->codec_id == CODEC_ID_PCM_S16LE) {
86 bytespersec = enc->sample_rate * blkalign;
87 } else {
88 bytespersec = enc->bit_rate / 8;
89 }
90 put_le32(pb, bytespersec); /* bytes per second */
91 put_le16(pb, blkalign); /* block align */
92 put_le16(pb, bps); /* bits per sample */
93 if (enc->codec_id == CODEC_ID_MP3) {
94 put_le16(pb, 12); /* wav_extra_size */
95 hdrsize += 12;
96 put_le16(pb, 1); /* wID */
97 put_le32(pb, 2); /* fdwFlags */
98 put_le16(pb, 1152); /* nBlockSize */
99 put_le16(pb, 1); /* nFramesPerBlock */
100 put_le16(pb, 1393); /* nCodecDelay */
101 } else if (enc->codec_id == CODEC_ID_MP2) {
102 put_le16(pb, 22); /* wav_extra_size */
103 hdrsize += 22;
104 put_le16(pb, 2); /* fwHeadLayer */
105 put_le32(pb, enc->bit_rate); /* dwHeadBitrate */
106 put_le16(pb, enc->channels == 2 ? 1 : 8); /* fwHeadMode */
107 put_le16(pb, 0); /* fwHeadModeExt */
108 put_le16(pb, 1); /* wHeadEmphasis */
109 put_le16(pb, 16); /* fwHeadFlags */
110 put_le32(pb, 0); /* dwPTSLow */
111 put_le32(pb, 0); /* dwPTSHigh */
112 } else if (enc->codec_id == CODEC_ID_ADPCM_IMA_WAV) {
113 put_le16(pb, 2); /* wav_extra_size */
114 hdrsize += 2;
115 put_le16(pb, ((enc->block_align - 4 * enc->channels) / (4 * enc->channels)) * 8 + 1); /* wSamplesPerBlock */
116 } else if(enc->extradata_size){
117 put_le16(pb, enc->extradata_size);
118 put_buffer(pb, enc->extradata, enc->extradata_size);
119 hdrsize += enc->extradata_size;
120 if(hdrsize&1){
121 hdrsize++;
122 put_byte(pb, 0);
123 }
124 } else {
125 hdrsize -= 2;
126 }
127
128 return hdrsize;
129 }
130 #endif //CONFIG_ENCODERS
131
132 /* We could be given one of the three possible structures here:
133 * WAVEFORMAT, PCMWAVEFORMAT or WAVEFORMATEX. Each structure
134 * is an expansion of the previous one with the fields added
135 * at the bottom. PCMWAVEFORMAT adds 'WORD wBitsPerSample' and
136 * WAVEFORMATEX adds 'WORD cbSize' and basically makes itself
137 * an openended structure.
138 */
139 void get_wav_header(ByteIOContext *pb, AVCodecContext *codec, int size)
140 {
141 int id;
142
143 id = get_le16(pb);
144 codec->codec_type = CODEC_TYPE_AUDIO;
145 codec->codec_tag = id;
146 codec->channels = get_le16(pb);
147 codec->sample_rate = get_le32(pb);
148 codec->bit_rate = get_le32(pb) * 8;
149 codec->block_align = get_le16(pb);
150 if (size == 14) { /* We're dealing with plain vanilla WAVEFORMAT */
151 codec->bits_per_sample = 8;
152 }else
153 codec->bits_per_sample = get_le16(pb);
154 codec->codec_id = wav_codec_get_id(id, codec->bits_per_sample);
155
156 if (size > 16) { /* We're obviously dealing with WAVEFORMATEX */
157 codec->extradata_size = get_le16(pb);
158 if (codec->extradata_size > 0) {
159 if (codec->extradata_size > size - 18)
160 codec->extradata_size = size - 18;
161 codec->extradata = av_mallocz(codec->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE);
162 get_buffer(pb, codec->extradata, codec->extradata_size);
163 } else
164 codec->extradata_size = 0;
165
166 /* It is possible for the chunk to contain garbage at the end */
167 if (size - codec->extradata_size - 18 > 0)
168 url_fskip(pb, size - codec->extradata_size - 18);
169 }
170 }
171
172
173 int wav_codec_get_id(unsigned int tag, int bps)
174 {
175 int id;
176 id = codec_get_id(codec_wav_tags, tag);
177 if (id <= 0)
178 return id;
179 /* handle specific u8 codec */
180 if (id == CODEC_ID_PCM_S16LE && bps == 8)
181 id = CODEC_ID_PCM_U8;
182 return id;
183 }
184
185 #ifdef CONFIG_ENCODERS
186 typedef struct {
187 offset_t data;
188 } WAVContext;
189
190 static int wav_write_header(AVFormatContext *s)
191 {
192 WAVContext *wav = s->priv_data;
193 ByteIOContext *pb = &s->pb;
194 offset_t fmt;
195
196 put_tag(pb, "RIFF");
197 put_le32(pb, 0); /* file length */
198 put_tag(pb, "WAVE");
199
200 /* format header */
201 fmt = start_tag(pb, "fmt ");
202 if (put_wav_header(pb, s->streams[0]->codec) < 0) {
203 av_free(wav);
204 return -1;
205 }
206 end_tag(pb, fmt);
207
208 av_set_pts_info(s->streams[0], 64, 1, s->streams[0]->codec->sample_rate);
209
210 /* data header */
211 wav->data = start_tag(pb, "data");
212
213 put_flush_packet(pb);
214
215 return 0;
216 }
217
218 static int wav_write_packet(AVFormatContext *s, AVPacket *pkt)
219 {
220 ByteIOContext *pb = &s->pb;
221 put_buffer(pb, pkt->data, pkt->size);
222 return 0;
223 }
224
225 static int wav_write_trailer(AVFormatContext *s)
226 {
227 ByteIOContext *pb = &s->pb;
228 WAVContext *wav = s->priv_data;
229 offset_t file_size;
230
231 if (!url_is_streamed(&s->pb)) {
232 end_tag(pb, wav->data);
233
234 /* update file size */
235 file_size = url_ftell(pb);
236 url_fseek(pb, 4, SEEK_SET);
237 put_le32(pb, (uint32_t)(file_size - 8));
238 url_fseek(pb, file_size, SEEK_SET);
239
240 put_flush_packet(pb);
241 }
242 return 0;
243 }
244 #endif //CONFIG_ENCODERS
245
246 /* return the size of the found tag */
247 /* XXX: > 2GB ? */
248 static int find_tag(ByteIOContext *pb, uint32_t tag1)
249 {
250 unsigned int tag;
251 int size;
252
253 for(;;) {
254 if (url_feof(pb))
255 return -1;
256 tag = get_le32(pb);
257 size = get_le32(pb);
258 if (tag == tag1)
259 break;
260 url_fseek(pb, size, SEEK_CUR);
261 }
262 if (size < 0)
263 size = 0x7fffffff;
264 return size;
265 }
266
267 static int wav_probe(AVProbeData *p)
268 {
269 /* check file header */
270 if (p->buf_size <= 32)
271 return 0;
272 if (p->buf[0] == 'R' && p->buf[1] == 'I' &&
273 p->buf[2] == 'F' && p->buf[3] == 'F' &&
274 p->buf[8] == 'W' && p->buf[9] == 'A' &&
275 p->buf[10] == 'V' && p->buf[11] == 'E')
276 return AVPROBE_SCORE_MAX;
277 else
278 return 0;
279 }
280
281 /* wav input */
282 static int wav_read_header(AVFormatContext *s,
283 AVFormatParameters *ap)
284 {
285 int size;
286 unsigned int tag;
287 ByteIOContext *pb = &s->pb;
288 AVStream *st;
289
290 /* check RIFF header */
291 tag = get_le32(pb);
292
293 if (tag != MKTAG('R', 'I', 'F', 'F'))
294 return -1;
295 get_le32(pb); /* file size */
296 tag = get_le32(pb);
297 if (tag != MKTAG('W', 'A', 'V', 'E'))
298 return -1;
299
300 /* parse fmt header */
301 size = find_tag(pb, MKTAG('f', 'm', 't', ' '));
302 if (size < 0)
303 return -1;
304 st = av_new_stream(s, 0);
305 if (!st)
306 return AVERROR_NOMEM;
307
308 get_wav_header(pb, st->codec, size);
309 st->need_parsing = 1;
310
311 av_set_pts_info(st, 64, 1, st->codec->sample_rate);
312
313 size = find_tag(pb, MKTAG('d', 'a', 't', 'a'));
314 if (size < 0)
315 return -1;
316 return 0;
317 }
318
319 #define MAX_SIZE 4096
320
321 static int wav_read_packet(AVFormatContext *s,
322 AVPacket *pkt)
323 {
324 int ret, size;
325 AVStream *st;
326
327 if (url_feof(&s->pb))
328 return AVERROR_IO;
329 st = s->streams[0];
330
331 size = MAX_SIZE;
332 if (st->codec->block_align > 1) {
333 if (size < st->codec->block_align)
334 size = st->codec->block_align;
335 size = (size / st->codec->block_align) * st->codec->block_align;
336 }
337 if (av_new_packet(pkt, size))
338 return AVERROR_IO;
339 pkt->stream_index = 0;
340
341 ret = get_buffer(&s->pb, pkt->data, pkt->size);
342 if (ret < 0)
343 av_free_packet(pkt);
344 /* note: we need to modify the packet size here to handle the last
345 packet */
346 pkt->size = ret;
347 return ret;
348 }
349
350 static int wav_read_close(AVFormatContext *s)
351 {
352 return 0;
353 }
354
355 static int wav_read_seek(AVFormatContext *s,
356 int stream_index, int64_t timestamp, int flags)
357 {
358 AVStream *st;
359
360 st = s->streams[0];
361 switch(st->codec->codec_id) {
362 case CODEC_ID_MP2:
363 case CODEC_ID_MP3:
364 case CODEC_ID_AC3:
365 case CODEC_ID_DTS:
366 /* use generic seeking with dynamically generated indexes */
367 return -1;
368 default:
369 break;
370 }
371 return pcm_read_seek(s, stream_index, timestamp, flags);
372 }
373
374
375 static AVInputFormat wav_iformat = {
376 "wav",
377 "wav format",
378 0,
379 wav_probe,
380 wav_read_header,
381 wav_read_packet,
382 wav_read_close,
383 wav_read_seek,
384 };
385
386 #ifdef CONFIG_ENCODERS
387 static AVOutputFormat wav_oformat = {
388 "wav",
389 "wav format",
390 "audio/x-wav",
391 "wav",
392 sizeof(WAVContext),
393 CODEC_ID_PCM_S16LE,
394 CODEC_ID_NONE,
395 wav_write_header,
396 wav_write_packet,
397 wav_write_trailer,
398 };
399 #endif //CONFIG_ENCODERS
400
401 int ff_wav_init(void)
402 {
403 av_register_input_format(&wav_iformat);
404 #ifdef CONFIG_ENCODERS
405 av_register_output_format(&wav_oformat);
406 #endif //CONFIG_ENCODERS
407 return 0;
408 }