Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
[libav.git] / libavcodec / iff.c
CommitLineData
b9e06ddd
PR
1/*
2 * IFF PBM/ILBM bitmap decoder
3 * Copyright (c) 2010 Peter Ross <pross@xvid.org>
473147be 4 * Copyright (c) 2010 Sebastian Vater <cdgs.basty@googlemail.com>
b9e06ddd
PR
5 *
6 * This file is part of FFmpeg.
7 *
8 * FFmpeg is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
12 *
13 * FFmpeg is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
17 *
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with FFmpeg; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21 */
22
23/**
ba87f080 24 * @file
b9e06ddd
PR
25 * IFF PBM/ILBM bitmap decoder
26 */
27
28#include "bytestream.h"
29#include "avcodec.h"
005caa34 30#include "get_bits.h"
d9747e29 31#include "iff.h"
005caa34
PR
32
33typedef struct {
34 AVFrame frame;
4fe4bb61 35 int planesize;
005caa34
PR
36 uint8_t * planebuf;
37} IffContext;
b9e06ddd 38
0a9cb385
SV
39#define LUT8_PART(plane, v) \
40 AV_LE2ME64C(UINT64_C(0x0000000)<<32 | v) << plane, \
41 AV_LE2ME64C(UINT64_C(0x1000000)<<32 | v) << plane, \
42 AV_LE2ME64C(UINT64_C(0x0010000)<<32 | v) << plane, \
43 AV_LE2ME64C(UINT64_C(0x1010000)<<32 | v) << plane, \
44 AV_LE2ME64C(UINT64_C(0x0000100)<<32 | v) << plane, \
45 AV_LE2ME64C(UINT64_C(0x1000100)<<32 | v) << plane, \
46 AV_LE2ME64C(UINT64_C(0x0010100)<<32 | v) << plane, \
47 AV_LE2ME64C(UINT64_C(0x1010100)<<32 | v) << plane, \
48 AV_LE2ME64C(UINT64_C(0x0000001)<<32 | v) << plane, \
49 AV_LE2ME64C(UINT64_C(0x1000001)<<32 | v) << plane, \
50 AV_LE2ME64C(UINT64_C(0x0010001)<<32 | v) << plane, \
51 AV_LE2ME64C(UINT64_C(0x1010001)<<32 | v) << plane, \
52 AV_LE2ME64C(UINT64_C(0x0000101)<<32 | v) << plane, \
53 AV_LE2ME64C(UINT64_C(0x1000101)<<32 | v) << plane, \
54 AV_LE2ME64C(UINT64_C(0x0010101)<<32 | v) << plane, \
55 AV_LE2ME64C(UINT64_C(0x1010101)<<32 | v) << plane
56
57#define LUT8(plane) { \
58 LUT8_PART(plane, 0x0000000), \
59 LUT8_PART(plane, 0x1000000), \
60 LUT8_PART(plane, 0x0010000), \
61 LUT8_PART(plane, 0x1010000), \
62 LUT8_PART(plane, 0x0000100), \
63 LUT8_PART(plane, 0x1000100), \
64 LUT8_PART(plane, 0x0010100), \
65 LUT8_PART(plane, 0x1010100), \
66 LUT8_PART(plane, 0x0000001), \
67 LUT8_PART(plane, 0x1000001), \
68 LUT8_PART(plane, 0x0010001), \
69 LUT8_PART(plane, 0x1010001), \
70 LUT8_PART(plane, 0x0000101), \
71 LUT8_PART(plane, 0x1000101), \
72 LUT8_PART(plane, 0x0010101), \
73 LUT8_PART(plane, 0x1010101), \
74}
75
76// 8 planes * 8-bit mask
77static const uint64_t plane8_lut[8][256] = {
78 LUT8(0), LUT8(1), LUT8(2), LUT8(3),
79 LUT8(4), LUT8(5), LUT8(6), LUT8(7),
80};
81
b9e06ddd
PR
82/**
83 * Convert CMAP buffer (stored in extradata) to lavc palette format
84 */
85int ff_cmap_read_palette(AVCodecContext *avctx, uint32_t *pal)
86{
4fe4bb61 87 int count, i;
b9e06ddd
PR
88
89 if (avctx->bits_per_coded_sample > 8) {
90 av_log(avctx, AV_LOG_ERROR, "bit_per_coded_sample > 8 not supported\n");
91 return AVERROR_INVALIDDATA;
92 }
93
94 count = 1 << avctx->bits_per_coded_sample;
95 if (avctx->extradata_size < count * 3) {
96 av_log(avctx, AV_LOG_ERROR, "palette data underflow\n");
97 return AVERROR_INVALIDDATA;
98 }
99 for (i=0; i < count; i++) {
005caa34 100 pal[i] = 0xFF000000 | AV_RB24( avctx->extradata + i*3 );
b9e06ddd
PR
101 }
102 return 0;
103}
104
105static av_cold int decode_init(AVCodecContext *avctx)
106{
005caa34 107 IffContext *s = avctx->priv_data;
0edfa79b 108 int err;
005caa34
PR
109
110 if (avctx->bits_per_coded_sample <= 8) {
111 avctx->pix_fmt = PIX_FMT_PAL8;
112 } else if (avctx->bits_per_coded_sample <= 32) {
113 avctx->pix_fmt = PIX_FMT_BGR32;
114 } else {
115 return AVERROR_INVALIDDATA;
116 }
b9e06ddd 117
cfdaee45 118 s->planesize = FFALIGN(avctx->width, 16) >> 3; // Align plane size in bits to word-boundary
005caa34
PR
119 s->planebuf = av_malloc(s->planesize + FF_INPUT_BUFFER_PADDING_SIZE);
120 if (!s->planebuf)
121 return AVERROR(ENOMEM);
b9e06ddd 122
005caa34 123 s->frame.reference = 1;
0edfa79b 124 if ((err = avctx->get_buffer(avctx, &s->frame) < 0)) {
b9e06ddd 125 av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n");
0edfa79b 126 return err;
b9e06ddd 127 }
b9e06ddd 128
005caa34
PR
129 return avctx->bits_per_coded_sample <= 8 ?
130 ff_cmap_read_palette(avctx, (uint32_t*)s->frame.data[1]) : 0;
b9e06ddd
PR
131}
132
133/**
687dc355
SV
134 * Decode interleaved plane buffer up to 8bpp
135 * @param dst Destination buffer
136 * @param buf Source buffer
137 * @param buf_size
138 * @param bps bits_per_coded_sample (must be <= 8)
139 * @param plane plane number to decode as
140 */
0a9cb385 141static void decodeplane8(uint8_t *dst, const uint8_t *buf, int buf_size, int bps, int plane)
687dc355 142{
0a9cb385
SV
143 const uint64_t *lut = plane8_lut[plane];
144 for(; --buf_size != 0; dst += 8) {
145 uint64_t v = AV_RN64A(dst) | lut[*buf++];
146 AV_WN64A(dst, v);
687dc355
SV
147 }
148}
149
150/**
151 * Decode interleaved plane buffer up to 24bpp
005caa34
PR
152 * @param dst Destination buffer
153 * @param buf Source buffer
154 * @param buf_size
155 * @param bps bits_per_coded_sample
156 * @param plane plane number to decode as
b9e06ddd 157 */
687dc355
SV
158static void decodeplane32(uint32_t *dst, const uint8_t *const buf, int buf_size, int bps, int plane)
159{
160 GetBitContext gb;
4fe4bb61 161 int i;
cfdaee45 162 const int b = buf_size * 8;
687dc355 163 init_get_bits(&gb, buf, buf_size * 8);
473147be
SV
164 for(i = 0; i < b; i++) {
165 dst[i] |= get_bits1(&gb) << plane;
687dc355 166 }
b9e06ddd
PR
167}
168
169static int decode_frame_ilbm(AVCodecContext *avctx,
170 void *data, int *data_size,
171 AVPacket *avpkt)
172{
005caa34 173 IffContext *s = avctx->priv_data;
b9e06ddd 174 const uint8_t *buf = avpkt->data;
4fe4bb61 175 int buf_size = avpkt->size;
cbba8fec 176 const uint8_t *buf_end = buf+buf_size;
4fe4bb61 177 int y, plane;
b9e06ddd 178
005caa34 179 if (avctx->reget_buffer(avctx, &s->frame) < 0){
b9e06ddd
PR
180 av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n");
181 return -1;
182 }
183
fe51b5ce 184 if (avctx->pix_fmt == PIX_FMT_PAL8) {
726dc061
SV
185 for(y = 0; y < avctx->height; y++ ) {
186 uint8_t *row = &s->frame.data[0][ y*s->frame.linesize[0] ];
187 memset(row, 0, avctx->width);
188 for (plane = 0; plane < avctx->bits_per_coded_sample && buf < buf_end; plane++) {
cbba8fec 189 decodeplane8(row, buf, FFMIN(s->planesize, buf_end - buf), avctx->bits_per_coded_sample, plane);
fe51b5ce
SV
190 buf += s->planesize;
191 }
192 }
726dc061 193 } else { // PIX_FMT_BGR32
fe51b5ce
SV
194 for(y = 0; y < avctx->height; y++ ) {
195 uint8_t *row = &s->frame.data[0][y*s->frame.linesize[0]];
196 memset(row, 0, avctx->width << 2);
197 for (plane = 0; plane < avctx->bits_per_coded_sample && buf < buf_end; plane++) {
473147be 198 decodeplane32((uint32_t *) row, buf, FFMIN(s->planesize, buf_end - buf), avctx->bits_per_coded_sample, plane);
726dc061 199 buf += s->planesize;
fe51b5ce 200 }
b9e06ddd
PR
201 }
202 }
203
204 *data_size = sizeof(AVFrame);
005caa34 205 *(AVFrame*)data = s->frame;
b9e06ddd
PR
206 return buf_size;
207}
208
209static int decode_frame_byterun1(AVCodecContext *avctx,
210 void *data, int *data_size,
211 AVPacket *avpkt)
212{
005caa34 213 IffContext *s = avctx->priv_data;
b9e06ddd 214 const uint8_t *buf = avpkt->data;
4fe4bb61 215 int buf_size = avpkt->size;
b9e06ddd 216 const uint8_t *buf_end = buf+buf_size;
4fe4bb61 217 int y, plane, x;
b9e06ddd 218
005caa34 219 if (avctx->reget_buffer(avctx, &s->frame) < 0){
b9e06ddd
PR
220 av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n");
221 return -1;
222 }
223
fe51b5ce
SV
224 if (avctx->codec_tag == MKTAG('I','L','B','M')) { //interleaved
225 if (avctx->pix_fmt == PIX_FMT_PAL8) {
726dc061
SV
226 for(y = 0; y < avctx->height ; y++ ) {
227 uint8_t *row = &s->frame.data[0][ y*s->frame.linesize[0] ];
228 memset(row, 0, avctx->width);
229 for (plane = 0; plane < avctx->bits_per_coded_sample; plane++) {
230 for(x = 0; x < s->planesize && buf < buf_end; ) {
231 int8_t value = *buf++;
232 unsigned length;
233 if (value >= 0) {
234 length = value + 1;
235 memcpy(s->planebuf + x, buf, FFMIN3(length, s->planesize - x, buf_end - buf));
236 buf += length;
237 } else if (value > -128) {
238 length = -value + 1;
239 memset(s->planebuf + x, *buf++, FFMIN(length, s->planesize - x));
240 } else { //noop
241 continue;
242 }
243 x += length;
b9e06ddd 244 }
005caa34 245 decodeplane8(row, s->planebuf, s->planesize, avctx->bits_per_coded_sample, plane);
fe51b5ce
SV
246 }
247 }
726dc061 248 } else { //PIX_FMT_BGR32
fe51b5ce
SV
249 for(y = 0; y < avctx->height ; y++ ) {
250 uint8_t *row = &s->frame.data[0][y*s->frame.linesize[0]];
251 memset(row, 0, avctx->width << 2);
252 for (plane = 0; plane < avctx->bits_per_coded_sample; plane++) {
253 for(x = 0; x < s->planesize && buf < buf_end; ) {
254 int8_t value = *buf++;
255 unsigned length;
256 if (value >= 0) {
257 length = value + 1;
258 memcpy(s->planebuf + x, buf, FFMIN3(length, s->planesize - x, buf_end - buf));
259 buf += length;
260 } else if (value > -128) {
261 length = -value + 1;
262 memset(s->planebuf + x, *buf++, FFMIN(length, s->planesize - x));
263 } else { // noop
264 continue;
265 }
266 x += length;
267 }
473147be 268 decodeplane32((uint32_t *) row, s->planebuf, s->planesize, avctx->bits_per_coded_sample, plane);
005caa34 269 }
b9e06ddd 270 }
fe51b5ce 271 }
726dc061
SV
272 } else {
273 for(y = 0; y < avctx->height ; y++ ) {
274 uint8_t *row = &s->frame.data[0][y*s->frame.linesize[0]];
b9e06ddd 275 for(x = 0; x < avctx->width && buf < buf_end; ) {
9f1d760a 276 int8_t value = *buf++;
473147be 277 unsigned length;
b9e06ddd
PR
278 if (value >= 0) {
279 length = value + 1;
280 memcpy(row + x, buf, FFMIN3(length, buf_end - buf, avctx->width - x));
281 buf += length;
282 } else if (value > -128) {
283 length = -value + 1;
284 memset(row + x, *buf++, FFMIN(length, avctx->width - x));
285 } else { //noop
286 continue;
287 }
288 x += length;
289 }
290 }
291 }
292
293 *data_size = sizeof(AVFrame);
005caa34 294 *(AVFrame*)data = s->frame;
b9e06ddd
PR
295 return buf_size;
296}
297
298static av_cold int decode_end(AVCodecContext *avctx)
299{
005caa34
PR
300 IffContext *s = avctx->priv_data;
301 if (s->frame.data[0])
302 avctx->release_buffer(avctx, &s->frame);
303 av_freep(&s->planebuf);
b9e06ddd
PR
304 return 0;
305}
306
307AVCodec iff_ilbm_decoder = {
308 "iff_ilbm",
72415b2a 309 AVMEDIA_TYPE_VIDEO,
b9e06ddd 310 CODEC_ID_IFF_ILBM,
005caa34 311 sizeof(IffContext),
b9e06ddd
PR
312 decode_init,
313 NULL,
314 decode_end,
315 decode_frame_ilbm,
316 CODEC_CAP_DR1,
317 .long_name = NULL_IF_CONFIG_SMALL("IFF ILBM"),
318};
319
320AVCodec iff_byterun1_decoder = {
321 "iff_byterun1",
72415b2a 322 AVMEDIA_TYPE_VIDEO,
b9e06ddd 323 CODEC_ID_IFF_BYTERUN1,
005caa34 324 sizeof(IffContext),
b9e06ddd
PR
325 decode_init,
326 NULL,
327 decode_end,
328 decode_frame_byterun1,
329 CODEC_CAP_DR1,
330 .long_name = NULL_IF_CONFIG_SMALL("IFF ByteRun1"),
331};