Commit | Line | Data |
---|---|---|
302898fc IK |
1 | /* |
2 | * XVideo Motion Compensation | |
3 | * Copyright (c) 2003 Ivan Kalvachev | |
4 | * | |
b78e7197 DB |
5 | * This file is part of FFmpeg. |
6 | * | |
7 | * FFmpeg is free software; you can redistribute it and/or | |
302898fc IK |
8 | * modify it under the terms of the GNU Lesser General Public |
9 | * License as published by the Free Software Foundation; either | |
b78e7197 | 10 | * version 2.1 of the License, or (at your option) any later version. |
302898fc | 11 | * |
b78e7197 | 12 | * FFmpeg is distributed in the hope that it will be useful, |
302898fc IK |
13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
15 | * Lesser General Public License for more details. | |
16 | * | |
17 | * You should have received a copy of the GNU Lesser General Public | |
b78e7197 | 18 | * License along with FFmpeg; if not, write to the Free Software |
5509bffa | 19 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
302898fc IK |
20 | */ |
21 | ||
2e7b4c84 IK |
22 | #include <limits.h> |
23 | ||
2e7b4c84 IK |
24 | #include "avcodec.h" |
25 | #include "dsputil.h" | |
26 | #include "mpegvideo.h" | |
27 | ||
28 | #undef NDEBUG | |
29 | #include <assert.h> | |
30 | ||
fd949a63 | 31 | #include "xvmc.h" |
302898fc | 32 | |
a579db0c | 33 | //set s->block |
78f9a878 | 34 | void ff_xvmc_init_block(MpegEncContext *s) |
148302e7 | 35 | { |
7e2e870e | 36 | struct xvmc_render_state *render; |
c96da3ed | 37 | render = (struct xvmc_render_state*)s->current_picture.data[2]; |
3ae01928 | 38 | assert(render); |
9f00a41c | 39 | if (!render || render->magic != AV_XVMC_RENDER_MAGIC) { |
a579db0c | 40 | assert(0); |
1f7c1d14 | 41 | return; // make sure that this is a render packet |
a579db0c | 42 | } |
9f00a41c | 43 | s->block = (DCTELEM *)(render->data_blocks + render->next_free_data_block_num * 64); |
a579db0c IK |
44 | } |
45 | ||
78f9a878 | 46 | void ff_xvmc_pack_pblocks(MpegEncContext *s, int cbp) |
148302e7 | 47 | { |
7e2e870e | 48 | int i, j; |
148302e7 | 49 | const int mb_block_count = 4 + (1 << s->chroma_format); |
a579db0c | 50 | |
148302e7 DB |
51 | j = 0; |
52 | cbp <<= 12-mb_block_count; | |
53 | for (i = 0; i < mb_block_count; i++) { | |
4ec58e13 | 54 | if (cbp & (1 << 11)) |
4742762f | 55 | s->pblocks[i] = (short *)(&s->block[j++]); |
4ec58e13 | 56 | else |
39dba5e8 | 57 | s->pblocks[i] = NULL; |
bb270c08 | 58 | cbp+=cbp; |
a579db0c | 59 | } |
2e7b4c84 IK |
60 | } |
61 | ||
1f7c1d14 DB |
62 | // These functions should be called on every new field and/or frame. |
63 | // They should be safe if they are called a few times for the same field! | |
78f9a878 | 64 | int ff_xvmc_field_start(MpegEncContext*s, AVCodecContext *avctx) |
148302e7 | 65 | { |
7e2e870e | 66 | struct xvmc_render_state *render, *last, *next; |
2e7b4c84 | 67 | |
3ae01928 | 68 | assert(avctx); |
302898fc | 69 | |
c96da3ed | 70 | render = (struct xvmc_render_state*)s->current_picture.data[2]; |
3ae01928 | 71 | assert(render); |
9f00a41c | 72 | if (!render || render->magic != AV_XVMC_RENDER_MAGIC) |
a1db3b93 | 73 | return -1; // make sure that this is a render packet |
2e7b4c84 IK |
74 | |
75 | render->picture_structure = s->picture_structure; | |
9f00a41c | 76 | render->flags = s->first_field ? 0 : XVMC_SECOND_FIELD; |
2e7b4c84 | 77 | |
2d7d8cc7 | 78 | assert(render->filled_mv_blocks_num == 0); |
2e7b4c84 IK |
79 | |
80 | render->p_future_surface = NULL; | |
4ef690f5 | 81 | render->p_past_surface = NULL; |
2e7b4c84 | 82 | |
7e2e870e | 83 | switch(s->pict_type) { |
9701840b | 84 | case FF_I_TYPE: |
1f7c1d14 | 85 | return 0; // no prediction from other frames |
9701840b | 86 | case FF_B_TYPE: |
c96da3ed | 87 | next = (struct xvmc_render_state*)s->next_picture.data[2]; |
3ae01928 DB |
88 | assert(next); |
89 | if (!next) | |
148302e7 | 90 | return -1; |
ea375af8 | 91 | if (next->magic != AV_XVMC_RENDER_MAGIC) |
148302e7 | 92 | return -1; |
2e7b4c84 | 93 | render->p_future_surface = next->p_surface; |
1f7c1d14 | 94 | // no return here, going to set forward prediction |
9701840b | 95 | case FF_P_TYPE: |
c96da3ed | 96 | last = (struct xvmc_render_state*)s->last_picture.data[2]; |
63a21bc0 | 97 | if (!last) |
1f7c1d14 | 98 | last = render; // predict second field from the first |
ea375af8 | 99 | if (last->magic != AV_XVMC_RENDER_MAGIC) |
148302e7 | 100 | return -1; |
2e7b4c84 IK |
101 | render->p_past_surface = last->p_surface; |
102 | return 0; | |
5e5c247a | 103 | } |
2e7b4c84 IK |
104 | |
105 | return -1; | |
106 | } | |
107 | ||
78f9a878 | 108 | void ff_xvmc_field_end(MpegEncContext *s) |
148302e7 | 109 | { |
7e2e870e | 110 | struct xvmc_render_state *render; |
c96da3ed | 111 | render = (struct xvmc_render_state*)s->current_picture.data[2]; |
3ae01928 | 112 | assert(render); |
2e7b4c84 | 113 | |
148302e7 | 114 | if (render->filled_mv_blocks_num > 0) |
2e7b4c84 | 115 | ff_draw_horiz_band(s,0,0); |
2e7b4c84 IK |
116 | } |
117 | ||
78f9a878 | 118 | void ff_xvmc_decode_mb(MpegEncContext *s) |
148302e7 | 119 | { |
7e2e870e DB |
120 | XvMCMacroBlock *mv_block; |
121 | struct xvmc_render_state *render; | |
122 | int i, cbp, blocks_per_mb; | |
2e7b4c84 | 123 | |
39dba5e8 | 124 | const int mb_xy = s->mb_y * s->mb_stride + s->mb_x; |
2e7b4c84 IK |
125 | |
126 | ||
148302e7 | 127 | if (s->encoding) { |
8ac5c1b2 | 128 | av_log(s->avctx, AV_LOG_ERROR, "XVMC doesn't support encoding!!!\n"); |
61b76987 | 129 | return; |
2e7b4c84 IK |
130 | } |
131 | ||
1f7c1d14 | 132 | // from MPV_decode_mb(), update DC predictors for P macroblocks |
2e7b4c84 IK |
133 | if (!s->mb_intra) { |
134 | s->last_dc[0] = | |
135 | s->last_dc[1] = | |
136 | s->last_dc[2] = 128 << s->intra_dc_precision; | |
137 | } | |
138 | ||
1f7c1d14 | 139 | // MC doesn't skip blocks |
160d679c | 140 | s->mb_skipped = 0; |
2e7b4c84 IK |
141 | |
142 | ||
d15876d3 DB |
143 | // Do I need to export quant when I could not perform postprocessing? |
144 | // Anyway, it doesn't hurt. | |
2e7b4c84 IK |
145 | s->current_picture.qscale_table[mb_xy] = s->qscale; |
146 | ||
a1db3b93 | 147 | // start of XVMC-specific code |
c96da3ed | 148 | render = (struct xvmc_render_state*)s->current_picture.data[2]; |
3ae01928 | 149 | assert(render); |
7e2e870e | 150 | assert(render->magic == AV_XVMC_RENDER_MAGIC); |
2e7b4c84 | 151 | assert(render->mv_blocks); |
302898fc | 152 | |
1f7c1d14 | 153 | // take the next free macroblock |
115329f1 | 154 | mv_block = &render->mv_blocks[render->start_mv_blocks_num + |
39dba5e8 | 155 | render->filled_mv_blocks_num ]; |
2e7b4c84 | 156 | |
4ef690f5 DB |
157 | mv_block->x = s->mb_x; |
158 | mv_block->y = s->mb_y; | |
1f7c1d14 | 159 | mv_block->dct_type = s->interlaced_dct; // XVMC_DCT_TYPE_FRAME/FIELD; |
4ec58e13 | 160 | if (s->mb_intra) { |
1f7c1d14 | 161 | mv_block->macroblock_type = XVMC_MB_TYPE_INTRA; // no MC, all done |
4ec58e13 | 162 | } else { |
2e7b4c84 IK |
163 | mv_block->macroblock_type = XVMC_MB_TYPE_PATTERN; |
164 | ||
148302e7 | 165 | if (s->mv_dir & MV_DIR_FORWARD) { |
2d7d8cc7 | 166 | mv_block->macroblock_type |= XVMC_MB_TYPE_MOTION_FORWARD; |
0439c09d | 167 | // PMV[n][dir][xy] = mv[dir][n][xy] |
2e7b4c84 IK |
168 | mv_block->PMV[0][0][0] = s->mv[0][0][0]; |
169 | mv_block->PMV[0][0][1] = s->mv[0][0][1]; | |
170 | mv_block->PMV[1][0][0] = s->mv[0][1][0]; | |
171 | mv_block->PMV[1][0][1] = s->mv[0][1][1]; | |
172 | } | |
148302e7 | 173 | if (s->mv_dir & MV_DIR_BACKWARD) { |
2d7d8cc7 | 174 | mv_block->macroblock_type |= XVMC_MB_TYPE_MOTION_BACKWARD; |
2e7b4c84 IK |
175 | mv_block->PMV[0][1][0] = s->mv[1][0][0]; |
176 | mv_block->PMV[0][1][1] = s->mv[1][0][1]; | |
177 | mv_block->PMV[1][1][0] = s->mv[1][1][0]; | |
178 | mv_block->PMV[1][1][1] = s->mv[1][1][1]; | |
179 | } | |
180 | ||
181 | switch(s->mv_type){ | |
182 | case MV_TYPE_16X16: | |
183 | mv_block->motion_type = XVMC_PREDICTION_FRAME; | |
184 | break; | |
185 | case MV_TYPE_16X8: | |
186 | mv_block->motion_type = XVMC_PREDICTION_16x8; | |
187 | break; | |
188 | case MV_TYPE_FIELD: | |
189 | mv_block->motion_type = XVMC_PREDICTION_FIELD; | |
148302e7 DB |
190 | if (s->picture_structure == PICT_FRAME) { |
191 | mv_block->PMV[0][0][1] <<= 1; | |
192 | mv_block->PMV[1][0][1] <<= 1; | |
193 | mv_block->PMV[0][1][1] <<= 1; | |
194 | mv_block->PMV[1][1][1] <<= 1; | |
2e7b4c84 IK |
195 | } |
196 | break; | |
197 | case MV_TYPE_DMV: | |
198 | mv_block->motion_type = XVMC_PREDICTION_DUAL_PRIME; | |
148302e7 | 199 | if (s->picture_structure == PICT_FRAME) { |
2e7b4c84 | 200 | |
1f7c1d14 | 201 | mv_block->PMV[0][0][0] = s->mv[0][0][0]; // top from top |
81189e4f | 202 | mv_block->PMV[0][0][1] = s->mv[0][0][1] << 1; |
2e7b4c84 | 203 | |
1f7c1d14 | 204 | mv_block->PMV[0][1][0] = s->mv[0][0][0]; // bottom from bottom |
81189e4f | 205 | mv_block->PMV[0][1][1] = s->mv[0][0][1] << 1; |
2e7b4c84 | 206 | |
1f7c1d14 | 207 | mv_block->PMV[1][0][0] = s->mv[0][2][0]; // dmv00, top from bottom |
81189e4f | 208 | mv_block->PMV[1][0][1] = s->mv[0][2][1] << 1; // dmv01 |
2e7b4c84 | 209 | |
1f7c1d14 | 210 | mv_block->PMV[1][1][0] = s->mv[0][3][0]; // dmv10, bottom from top |
81189e4f | 211 | mv_block->PMV[1][1][1] = s->mv[0][3][1] << 1; // dmv11 |
2e7b4c84 | 212 | |
4ec58e13 | 213 | } else { |
1f7c1d14 DB |
214 | mv_block->PMV[0][1][0] = s->mv[0][2][0]; // dmv00 |
215 | mv_block->PMV[0][1][1] = s->mv[0][2][1]; // dmv01 | |
2e7b4c84 IK |
216 | } |
217 | break; | |
218 | default: | |
219 | assert(0); | |
220 | } | |
221 | ||
222 | mv_block->motion_vertical_field_select = 0; | |
223 | ||
1f7c1d14 | 224 | // set correct field references |
148302e7 | 225 | if (s->mv_type == MV_TYPE_FIELD || s->mv_type == MV_TYPE_16X8) { |
90509ec7 | 226 | mv_block->motion_vertical_field_select |= s->field_select[0][0]; |
7e2e870e DB |
227 | mv_block->motion_vertical_field_select |= s->field_select[1][0] << 1; |
228 | mv_block->motion_vertical_field_select |= s->field_select[0][1] << 2; | |
229 | mv_block->motion_vertical_field_select |= s->field_select[1][1] << 3; | |
2e7b4c84 | 230 | } |
1f7c1d14 | 231 | } // !intra |
a1db3b93 | 232 | // time to handle data blocks |
2e7b4c84 | 233 | mv_block->index = render->next_free_data_block_num; |
5e5c247a | 234 | |
2e7b4c84 | 235 | blocks_per_mb = 6; |
148302e7 | 236 | if (s->chroma_format >= 2) { |
4742762f | 237 | blocks_per_mb = 4 + (1 << s->chroma_format); |
2e7b4c84 | 238 | } |
5e5c247a | 239 | |
1f7c1d14 | 240 | // calculate cbp |
715731a3 | 241 | cbp = 0; |
148302e7 | 242 | for (i = 0; i < blocks_per_mb; i++) { |
2d7d8cc7 | 243 | cbp += cbp; |
148302e7 | 244 | if (s->block_last_index[i] >= 0) |
715731a3 IK |
245 | cbp++; |
246 | } | |
115329f1 | 247 | |
148302e7 | 248 | if (s->flags & CODEC_FLAG_GRAY) { |
a1db3b93 | 249 | if (s->mb_intra) { // intra frames are always full chroma blocks |
148302e7 | 250 | for (i = 4; i < blocks_per_mb; i++) { |
7e2e870e | 251 | memset(s->pblocks[i], 0, sizeof(short)*8*8); // so we need to clear them |
148302e7 DB |
252 | if (!render->unsigned_intra) |
253 | s->pblocks[i][0] = 1 << 10; | |
a579db0c | 254 | } |
4ec58e13 | 255 | } else { |
148302e7 | 256 | cbp &= 0xf << (blocks_per_mb - 4); |
1f7c1d14 | 257 | blocks_per_mb = 4; // luminance blocks only |
715731a3 | 258 | } |
a579db0c | 259 | } |
2e7b4c84 | 260 | mv_block->coded_block_pattern = cbp; |
148302e7 | 261 | if (cbp == 0) |
2e7b4c84 IK |
262 | mv_block->macroblock_type &= ~XVMC_MB_TYPE_PATTERN; |
263 | ||
148302e7 DB |
264 | for (i = 0; i < blocks_per_mb; i++) { |
265 | if (s->block_last_index[i] >= 0) { | |
7a74e067 | 266 | // I do not have unsigned_intra MOCO to test, hope it is OK. |
eba9cecc | 267 | if (s->mb_intra && (render->idct || (!render->idct && !render->unsigned_intra))) |
148302e7 DB |
268 | s->pblocks[i][0] -= 1 << 10; |
269 | if (!render->idct) { | |
a579db0c | 270 | s->dsp.idct(s->pblocks[i]); |
a1db3b93 DB |
271 | /* It is unclear if MC hardware requires pixel diff values to be |
272 | * in the range [-255;255]. TODO: Clipping if such hardware is | |
273 | * ever found. As of now it would only be an unnecessary | |
274 | * slowdown. */ | |
2e7b4c84 | 275 | } |
1f7c1d14 | 276 | // copy blocks only if the codec doesn't support pblocks reordering |
148302e7 | 277 | if (s->avctx->xvmc_acceleration == 1) { |
4742762f | 278 | memcpy(&render->data_blocks[render->next_free_data_block_num*64], |
39dba5e8 | 279 | s->pblocks[i],sizeof(short)*8*8); |
a579db0c IK |
280 | } |
281 | render->next_free_data_block_num++; | |
2e7b4c84 IK |
282 | } |
283 | } | |
284 | render->filled_mv_blocks_num++; | |
285 | ||
4ef690f5 | 286 | assert(render->filled_mv_blocks_num <= render->total_number_of_mv_blocks); |
2e7b4c84 IK |
287 | assert(render->next_free_data_block_num <= render->total_number_of_data_blocks); |
288 | ||
289 | ||
148302e7 | 290 | if (render->filled_mv_blocks_num >= render->total_number_of_mv_blocks) |
7e2e870e | 291 | ff_draw_horiz_band(s, 0, 0); |
2e7b4c84 | 292 | } |