Commit | Line | Data |
---|---|---|
04d7f601 DB |
1 | /* |
2 | * copyright (c) 2002 Mark Hills <mark@pogo.org.uk> | |
3 | * | |
b78e7197 DB |
4 | * This file is part of FFmpeg. |
5 | * | |
6 | * FFmpeg is free software; you can redistribute it and/or | |
04d7f601 DB |
7 | * modify it under the terms of the GNU Lesser General Public |
8 | * License as published by the Free Software Foundation; either | |
b78e7197 | 9 | * version 2.1 of the License, or (at your option) any later version. |
04d7f601 | 10 | * |
b78e7197 | 11 | * FFmpeg is distributed in the hope that it will be useful, |
04d7f601 DB |
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
14 | * Lesser General Public License for more details. | |
15 | * | |
16 | * You should have received a copy of the GNU Lesser General Public | |
b78e7197 | 17 | * License along with FFmpeg; if not, write to the Free Software |
e5a389a1 | 18 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
04d7f601 DB |
19 | */ |
20 | ||
983e3246 | 21 | /** |
ba87f080 | 22 | * @file |
983e3246 MN |
23 | * Ogg Vorbis codec support via libvorbisenc. |
24 | * @author Mark Hills <mark@pogo.org.uk> | |
81e0d0b4 MH |
25 | */ |
26 | ||
81e0d0b4 MH |
27 | #include <vorbis/vorbisenc.h> |
28 | ||
77336a5e | 29 | #include "libavutil/opt.h" |
81e0d0b4 | 30 | #include "avcodec.h" |
2c124cb6 | 31 | #include "bytestream.h" |
9577838f | 32 | #include "vorbis.h" |
81e0d0b4 | 33 | |
3f4993f1 MN |
34 | #undef NDEBUG |
35 | #include <assert.h> | |
36 | ||
/* Number of samples per channel handed to the encoder on each call
 * (assigned to AVCodecContext.frame_size during init). */
#define OGGVORBIS_FRAME_SIZE 64

/* Capacity in bytes of the internal queue of encoded packets. */
#define BUFFER_SIZE (64 * 1024)
81e0d0b4 MH |
40 | |
41 | typedef struct OggVorbisContext { | |
77336a5e | 42 | AVClass *av_class; |
81e0d0b4 MH |
43 | vorbis_info vi ; |
44 | vorbis_dsp_state vd ; | |
45 | vorbis_block vb ; | |
6d8f985e MN |
46 | uint8_t buffer[BUFFER_SIZE]; |
47 | int buffer_index; | |
9c8f0768 | 48 | int eof; |
3aca208a MH |
49 | |
50 | /* decoder */ | |
51 | vorbis_comment vc ; | |
d76f581f | 52 | ogg_packet op; |
77336a5e MN |
53 | |
54 | double iblock; | |
81e0d0b4 MH |
55 | } OggVorbisContext ; |
56 | ||
77336a5e | 57 | static const AVOption options[]={ |
78c8b4b7 | 58 | {"iblock", "Sets the impulse block bias", offsetof(OggVorbisContext, iblock), FF_OPT_TYPE_DOUBLE, 0, -15, 0, AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_ENCODING_PARAM}, |
77336a5e MN |
59 | {NULL} |
60 | }; | |
da754858 | 61 | static const AVClass class = { "libvorbis", av_default_item_name, options, LIBAVUTIL_VERSION_INT }; |
81e0d0b4 | 62 | |
5ef251e5 | 63 | static av_cold int oggvorbis_init_encoder(vorbis_info *vi, AVCodecContext *avccontext) { |
77336a5e | 64 | OggVorbisContext *context = avccontext->priv_data ; |
13c71451 | 65 | double cfreq; |
c55427f8 | 66 | |
1ff8f2b3 | 67 | if(avccontext->flags & CODEC_FLAG_QSCALE) { |
13c71451 JR |
68 | /* variable bitrate */ |
69 | if(vorbis_encode_setup_vbr(vi, avccontext->channels, | |
1ff8f2b3 | 70 | avccontext->sample_rate, |
05276956 | 71 | avccontext->global_quality / (float)FF_QP2LAMBDA / 10.0)) |
13c71451 JR |
72 | return -1; |
73 | } else { | |
e5a5ea9e DC |
74 | int minrate = avccontext->rc_min_rate > 0 ? avccontext->rc_min_rate : -1; |
75 | int maxrate = avccontext->rc_min_rate > 0 ? avccontext->rc_max_rate : -1; | |
76 | ||
13c71451 JR |
77 | /* constant bitrate */ |
78 | if(vorbis_encode_setup_managed(vi, avccontext->channels, | |
e5a5ea9e | 79 | avccontext->sample_rate, minrate, avccontext->bit_rate, maxrate)) |
13c71451 JR |
80 | return -1; |
81 | ||
57ebbccf DC |
82 | /* variable bitrate by estimate, disable slow rate management */ |
83 | if(minrate == -1 && maxrate == -1) | |
84 | if(vorbis_encode_ctl(vi, OV_ECTL_RATEMANAGE2_SET, NULL)) | |
85 | return -1; | |
13c71451 | 86 | } |
c55427f8 | 87 | |
13c71451 JR |
88 | /* cutoff frequency */ |
89 | if(avccontext->cutoff > 0) { | |
90 | cfreq = avccontext->cutoff / 1000.0; | |
91 | if(vorbis_encode_ctl(vi, OV_ECTL_LOWPASS_SET, &cfreq)) | |
92 | return -1; | |
93 | } | |
81e0d0b4 | 94 | |
77336a5e MN |
95 | if(context->iblock){ |
96 | vorbis_encode_ctl(vi, OV_ECTL_IBLOCK_SET, &context->iblock); | |
97 | } | |
98 | ||
13c71451 | 99 | return vorbis_encode_setup_init(vi); |
81e0d0b4 MH |
100 | } |
101 | ||
/* Number of bytes needed to store a buffer of length 'l' together with its
 * length prefix: (1 + l / 255) prefix bytes followed by the 'l' data bytes. */
static int xiph_len(int l)
{
    const int prefix_bytes = 1 + l / 255;

    return prefix_bytes + l;
}
104 | ||
98a6fff9 | 105 | static av_cold int oggvorbis_encode_init(AVCodecContext *avccontext) { |
81e0d0b4 | 106 | OggVorbisContext *context = avccontext->priv_data ; |
bbb77e7c MN |
107 | ogg_packet header, header_comm, header_code; |
108 | uint8_t *p; | |
fd7242dd | 109 | unsigned int offset; |
81e0d0b4 | 110 | |
81e0d0b4 | 111 | vorbis_info_init(&context->vi) ; |
81e0d0b4 | 112 | if(oggvorbis_init_encoder(&context->vi, avccontext) < 0) { |
fb0a835f | 113 | av_log(avccontext, AV_LOG_ERROR, "oggvorbis_encode_init: init_encoder failed\n") ; |
bb270c08 | 114 | return -1 ; |
81e0d0b4 | 115 | } |
81e0d0b4 MH |
116 | vorbis_analysis_init(&context->vd, &context->vi) ; |
117 | vorbis_block_init(&context->vd, &context->vb) ; | |
118 | ||
bbb77e7c MN |
119 | vorbis_comment_init(&context->vc); |
120 | vorbis_comment_add_tag(&context->vc, "encoder", LIBAVCODEC_IDENT) ; | |
121 | ||
122 | vorbis_analysis_headerout(&context->vd, &context->vc, &header, | |
123 | &header_comm, &header_code); | |
115329f1 | 124 | |
fd7242dd PM |
125 | avccontext->extradata_size= |
126 | 1 + xiph_len(header.bytes) + xiph_len(header_comm.bytes) + | |
127 | header_code.bytes; | |
128 | p = avccontext->extradata = | |
129 | av_malloc(avccontext->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE); | |
ad2b531d MR |
130 | p[0] = 2; |
131 | offset = 1; | |
132 | offset += av_xiphlacing(&p[offset], header.bytes); | |
133 | offset += av_xiphlacing(&p[offset], header_comm.bytes); | |
134 | memcpy(&p[offset], header.packet, header.bytes); | |
135 | offset += header.bytes; | |
136 | memcpy(&p[offset], header_comm.packet, header_comm.bytes); | |
137 | offset += header_comm.bytes; | |
138 | memcpy(&p[offset], header_code.packet, header_code.bytes); | |
139 | offset += header_code.bytes; | |
fd7242dd | 140 | assert(offset == avccontext->extradata_size); |
115329f1 | 141 | |
bbb77e7c MN |
142 | /* vorbis_block_clear(&context->vb); |
143 | vorbis_dsp_clear(&context->vd); | |
144 | vorbis_info_clear(&context->vi);*/ | |
145 | vorbis_comment_clear(&context->vc); | |
115329f1 | 146 | |
81e0d0b4 | 147 | avccontext->frame_size = OGGVORBIS_FRAME_SIZE ; |
115329f1 | 148 | |
492cd3a9 MN |
149 | avccontext->coded_frame= avcodec_alloc_frame(); |
150 | avccontext->coded_frame->key_frame= 1; | |
115329f1 | 151 | |
81e0d0b4 MH |
152 | return 0 ; |
153 | } | |
154 | ||
155 | ||
3aca208a | 156 | static int oggvorbis_encode_frame(AVCodecContext *avccontext, |
bb270c08 DB |
157 | unsigned char *packets, |
158 | int buf_size, void *data) | |
81e0d0b4 MH |
159 | { |
160 | OggVorbisContext *context = avccontext->priv_data ; | |
81e0d0b4 | 161 | ogg_packet op ; |
0d00cf38 | 162 | signed short *audio = data ; |
9c8f0768 NG |
163 | int l; |
164 | ||
165 | if(data) { | |
42859ddb | 166 | const int samples = avccontext->frame_size; |
9c8f0768 | 167 | float **buffer ; |
9577838f | 168 | int c, channels = context->vi.channels; |
81e0d0b4 | 169 | |
a6080be7 | 170 | buffer = vorbis_analysis_buffer(&context->vd, samples) ; |
9577838f JD |
171 | for (c = 0; c < channels; c++) { |
172 | int co = (channels > 8) ? c : | |
173 | ff_vorbis_encoding_channel_layout_offsets[channels-1][c]; | |
a6080be7 | 174 | for(l = 0 ; l < samples ; l++) |
9577838f | 175 | buffer[c][l]=audio[l*channels+co]/32768.f; |
bb270c08 | 176 | } |
a6080be7 | 177 | vorbis_analysis_wrote(&context->vd, samples) ; |
9c8f0768 NG |
178 | } else { |
179 | if(!context->eof) | |
180 | vorbis_analysis_wrote(&context->vd, 0) ; | |
181 | context->eof = 1; | |
182 | } | |
81e0d0b4 | 183 | |
81e0d0b4 | 184 | while(vorbis_analysis_blockout(&context->vd, &context->vb) == 1) { |
bb270c08 DB |
185 | vorbis_analysis(&context->vb, NULL); |
186 | vorbis_bitrate_addblock(&context->vb) ; | |
81e0d0b4 | 187 | |
bb270c08 | 188 | while(vorbis_bitrate_flushpacket(&context->vd, &op)) { |
0afd2a92 DB |
189 | /* i'd love to say the following line is a hack, but sadly it's |
190 | * not, apparently the end of stream decision is in libogg. */ | |
d99659f0 | 191 | if(op.bytes==1 && op.e_o_s) |
6f824977 | 192 | continue; |
c426562c PM |
193 | if (context->buffer_index + sizeof(ogg_packet) + op.bytes > BUFFER_SIZE) { |
194 | av_log(avccontext, AV_LOG_ERROR, "libvorbis: buffer overflow."); | |
195 | return -1; | |
196 | } | |
6d8f985e MN |
197 | memcpy(context->buffer + context->buffer_index, &op, sizeof(ogg_packet)); |
198 | context->buffer_index += sizeof(ogg_packet); | |
199 | memcpy(context->buffer + context->buffer_index, op.packet, op.bytes); | |
200 | context->buffer_index += op.bytes; | |
201 | // av_log(avccontext, AV_LOG_DEBUG, "e%d / %d\n", context->buffer_index, op.bytes); | |
bb270c08 | 202 | } |
81e0d0b4 MH |
203 | } |
204 | ||
3f4993f1 | 205 | l=0; |
6d8f985e | 206 | if(context->buffer_index){ |
bbb77e7c | 207 | ogg_packet *op2= (ogg_packet*)context->buffer; |
6d8f985e | 208 | op2->packet = context->buffer + sizeof(ogg_packet); |
3f4993f1 | 209 | |
6f824977 | 210 | l= op2->bytes; |
42661adf | 211 | avccontext->coded_frame->pts= av_rescale_q(op2->granulepos, (AVRational){1, avccontext->sample_rate}, avccontext->time_base); |
3723f01c | 212 | //FIXME we should reorder the user supplied pts and not assume that they are spaced by 1/sample_rate |
3f4993f1 | 213 | |
c426562c PM |
214 | if (l > buf_size) { |
215 | av_log(avccontext, AV_LOG_ERROR, "libvorbis: buffer overflow."); | |
216 | return -1; | |
217 | } | |
218 | ||
6f824977 MN |
219 | memcpy(packets, op2->packet, l); |
220 | context->buffer_index -= l + sizeof(ogg_packet); | |
1204a13c | 221 | memmove(context->buffer, context->buffer + l + sizeof(ogg_packet), context->buffer_index); |
6d8f985e | 222 | // av_log(avccontext, AV_LOG_DEBUG, "E%d\n", l); |
6d8f985e MN |
223 | } |
224 | ||
3f4993f1 | 225 | return l; |
81e0d0b4 MH |
226 | } |
227 | ||
228 | ||
98a6fff9 | 229 | static av_cold int oggvorbis_encode_close(AVCodecContext *avccontext) { |
81e0d0b4 MH |
230 | OggVorbisContext *context = avccontext->priv_data ; |
231 | /* ogg_packet op ; */ | |
115329f1 | 232 | |
81e0d0b4 MH |
233 | vorbis_analysis_wrote(&context->vd, 0) ; /* notify vorbisenc this is EOF */ |
234 | ||
81e0d0b4 MH |
235 | vorbis_block_clear(&context->vb); |
236 | vorbis_dsp_clear(&context->vd); | |
237 | vorbis_info_clear(&context->vi); | |
492cd3a9 MN |
238 | |
239 | av_freep(&avccontext->coded_frame); | |
bbb77e7c | 240 | av_freep(&avccontext->extradata); |
115329f1 | 241 | |
81e0d0b4 MH |
242 | return 0 ; |
243 | } | |
244 | ||
245 | ||
d36beb3f | 246 | AVCodec ff_libvorbis_encoder = { |
d0d866e0 | 247 | "libvorbis", |
72415b2a | 248 | AVMEDIA_TYPE_AUDIO, |
81e0d0b4 MH |
249 | CODEC_ID_VORBIS, |
250 | sizeof(OggVorbisContext), | |
251 | oggvorbis_encode_init, | |
252 | oggvorbis_encode_frame, | |
6f824977 MN |
253 | oggvorbis_encode_close, |
254 | .capabilities= CODEC_CAP_DELAY, | |
5d6e4c16 | 255 | .sample_fmts = (const enum AVSampleFormat[]){AV_SAMPLE_FMT_S16,AV_SAMPLE_FMT_NONE}, |
fe4bf374 | 256 | .long_name= NULL_IF_CONFIG_SMALL("libvorbis Vorbis"), |
77336a5e | 257 | .priv_class= &class, |
3aca208a | 258 | } ; |