Line data Source code
1 : /*
2 : * MJPEG encoder
3 : * Copyright (c) 2000, 2001 Fabrice Bellard
4 : * Copyright (c) 2003 Alex Beregszaszi
5 : * Copyright (c) 2003-2004 Michael Niedermayer
6 : *
7 : * Support for external huffman table, various fixes (AVID workaround),
8 : * aspecting, new decode_frame mechanism and apple mjpeg-b support
9 : * by Alex Beregszaszi
10 : *
11 : * This file is part of FFmpeg.
12 : *
13 : * FFmpeg is free software; you can redistribute it and/or
14 : * modify it under the terms of the GNU Lesser General Public
15 : * License as published by the Free Software Foundation; either
16 : * version 2.1 of the License, or (at your option) any later version.
17 : *
18 : * FFmpeg is distributed in the hope that it will be useful,
19 : * but WITHOUT ANY WARRANTY; without even the implied warranty of
20 : * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21 : * Lesser General Public License for more details.
22 : *
23 : * You should have received a copy of the GNU Lesser General Public
24 : * License along with FFmpeg; if not, write to the Free Software
25 : * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
26 : */
27 :
28 : /**
29 : * @file
30 : * MJPEG encoder.
31 : */
32 :
33 : #include "libavutil/pixdesc.h"
34 :
35 : #include "avcodec.h"
36 : #include "jpegtables.h"
37 : #include "mjpegenc_common.h"
38 : #include "mpegvideo.h"
39 : #include "mjpeg.h"
40 : #include "mjpegenc.h"
41 :
42 26 : static int alloc_huffman(MpegEncContext *s)
43 : {
44 26 : MJpegContext *m = s->mjpeg_ctx;
45 : size_t num_mbs, num_blocks, num_codes;
46 : int blocks_per_mb;
47 :
48 : // We need to init this here as the mjpeg init is called before the common init,
49 26 : s->mb_width = (s->width + 15) / 16;
50 26 : s->mb_height = (s->height + 15) / 16;
51 :
52 26 : switch (s->chroma_format) {
53 18 : case CHROMA_420: blocks_per_mb = 6; break;
54 4 : case CHROMA_422: blocks_per_mb = 8; break;
55 4 : case CHROMA_444: blocks_per_mb = 12; break;
56 0 : default: av_assert0(0);
57 : };
58 :
59 : // Make sure we have enough space to hold this frame.
60 26 : num_mbs = s->mb_width * s->mb_height;
61 26 : num_blocks = num_mbs * blocks_per_mb;
62 26 : num_codes = num_blocks * 64;
63 :
64 26 : m->huff_buffer = av_malloc_array(num_codes, sizeof(MJpegHuffmanCode));
65 26 : if (!m->huff_buffer)
66 0 : return AVERROR(ENOMEM);
67 26 : return 0;
68 : }
69 :
70 30 : av_cold int ff_mjpeg_encode_init(MpegEncContext *s)
71 : {
72 : MJpegContext *m;
73 :
74 30 : av_assert0(s->slice_context_count == 1);
75 :
76 30 : if (s->width > 65500 || s->height > 65500) {
77 0 : av_log(s, AV_LOG_ERROR, "JPEG does not support resolutions above 65500x65500\n");
78 0 : return AVERROR(EINVAL);
79 : }
80 :
81 30 : m = av_mallocz(sizeof(MJpegContext));
82 30 : if (!m)
83 0 : return AVERROR(ENOMEM);
84 :
85 30 : s->min_qcoeff=-1023;
86 30 : s->max_qcoeff= 1023;
87 :
88 : // Build default Huffman tables.
89 : // These may be overwritten later with more optimal Huffman tables, but
90 : // they are needed at least right now for some processes like trellis.
91 30 : ff_mjpeg_build_huffman_codes(m->huff_size_dc_luminance,
92 30 : m->huff_code_dc_luminance,
93 : avpriv_mjpeg_bits_dc_luminance,
94 : avpriv_mjpeg_val_dc);
95 30 : ff_mjpeg_build_huffman_codes(m->huff_size_dc_chrominance,
96 30 : m->huff_code_dc_chrominance,
97 : avpriv_mjpeg_bits_dc_chrominance,
98 : avpriv_mjpeg_val_dc);
99 30 : ff_mjpeg_build_huffman_codes(m->huff_size_ac_luminance,
100 30 : m->huff_code_ac_luminance,
101 : avpriv_mjpeg_bits_ac_luminance,
102 : avpriv_mjpeg_val_ac_luminance);
103 30 : ff_mjpeg_build_huffman_codes(m->huff_size_ac_chrominance,
104 30 : m->huff_code_ac_chrominance,
105 : avpriv_mjpeg_bits_ac_chrominance,
106 : avpriv_mjpeg_val_ac_chrominance);
107 :
108 30 : ff_init_uni_ac_vlc(m->huff_size_ac_luminance, m->uni_ac_vlc_len);
109 30 : ff_init_uni_ac_vlc(m->huff_size_ac_chrominance, m->uni_chroma_ac_vlc_len);
110 30 : s->intra_ac_vlc_length =
111 30 : s->intra_ac_vlc_last_length = m->uni_ac_vlc_len;
112 30 : s->intra_chroma_ac_vlc_length =
113 30 : s->intra_chroma_ac_vlc_last_length = m->uni_chroma_ac_vlc_len;
114 :
115 : // Buffers start out empty.
116 30 : m->huff_ncode = 0;
117 30 : s->mjpeg_ctx = m;
118 :
119 30 : if(s->huffman == HUFFMAN_TABLE_OPTIMAL)
120 26 : return alloc_huffman(s);
121 :
122 4 : return 0;
123 : }
124 :
125 30 : av_cold void ff_mjpeg_encode_close(MpegEncContext *s)
126 : {
127 30 : av_freep(&s->mjpeg_ctx->huff_buffer);
128 30 : av_freep(&s->mjpeg_ctx);
129 30 : }
130 :
131 : /**
132 : * Add code and table_id to the JPEG buffer.
133 : *
134 : * @param s The MJpegContext which contains the JPEG buffer.
135 : * @param table_id Which Huffman table the code belongs to.
136 : * @param code The encoded exponent of the coefficients and the run-bits.
137 : */
138 28811107 : static inline void ff_mjpeg_encode_code(MJpegContext *s, uint8_t table_id, int code)
139 : {
140 28811107 : MJpegHuffmanCode *c = &s->huff_buffer[s->huff_ncode++];
141 28811107 : c->table_id = table_id;
142 28811107 : c->code = code;
143 28811107 : }
144 :
145 : /**
146 : * Add the coefficient's data to the JPEG buffer.
147 : *
148 : * @param s The MJpegContext which contains the JPEG buffer.
149 : * @param table_id Which Huffman table the code belongs to.
150 : * @param val The coefficient.
151 : * @param run The run-bits.
152 : */
153 26111467 : static void ff_mjpeg_encode_coef(MJpegContext *s, uint8_t table_id, int val, int run)
154 : {
155 : int mant, code;
156 :
157 26111467 : if (val == 0) {
158 103825 : av_assert0(run == 0);
159 103825 : ff_mjpeg_encode_code(s, table_id, 0);
160 : } else {
161 26007642 : mant = val;
162 26007642 : if (val < 0) {
163 12984441 : val = -val;
164 12984441 : mant--;
165 : }
166 :
167 26007642 : code = (run << 4) | (av_log2_16bit(val) + 1);
168 :
169 26007642 : s->huff_buffer[s->huff_ncode].mant = mant;
170 26007642 : ff_mjpeg_encode_code(s, table_id, code);
171 : }
172 26111467 : }
173 :
174 : /**
175 : * Add the block's data into the JPEG buffer.
176 : *
177 : * @param s The MJpegEncContext that contains the JPEG buffer.
178 : * @param block The block.
179 : * @param n The block's index or number.
180 : */
181 2722788 : static void record_block(MpegEncContext *s, int16_t *block, int n)
182 : {
183 : int i, j, table_id;
184 : int component, dc, last_index, val, run;
185 2722788 : MJpegContext *m = s->mjpeg_ctx;
186 :
187 : /* DC coef */
188 2722788 : component = (n <= 3 ? 0 : (n&1) + 1);
189 2722788 : table_id = (n <= 3 ? 0 : 1);
190 2722788 : dc = block[0]; /* overflow is impossible */
191 2722788 : val = dc - s->last_dc[component];
192 :
193 2722788 : ff_mjpeg_encode_coef(m, table_id, val, 0);
194 :
195 2722788 : s->last_dc[component] = dc;
196 :
197 : /* AC coefs */
198 :
199 2722788 : run = 0;
200 2722788 : last_index = s->block_last_index[n];
201 2722788 : table_id |= 2;
202 :
203 52748192 : for(i=1;i<=last_index;i++) {
204 50025404 : j = s->intra_scantable.permutated[i];
205 50025404 : val = block[j];
206 :
207 50025404 : if (val == 0) {
208 26636725 : run++;
209 : } else {
210 46833996 : while (run >= 16) {
211 56638 : ff_mjpeg_encode_code(m, table_id, 0xf0);
212 56638 : run -= 16;
213 : }
214 23388679 : ff_mjpeg_encode_coef(m, table_id, val, run);
215 23388679 : run = 0;
216 : }
217 : }
218 :
219 : /* output EOB only if not already 64 values */
220 2722788 : if (last_index < 63 || run != 0)
221 2643002 : ff_mjpeg_encode_code(m, table_id, 0);
222 2722788 : }
223 :
224 359100 : static void encode_block(MpegEncContext *s, int16_t *block, int n)
225 : {
226 : int mant, nbits, code, i, j;
227 : int component, dc, run, last_index, val;
228 359100 : MJpegContext *m = s->mjpeg_ctx;
229 : uint8_t *huff_size_ac;
230 : uint16_t *huff_code_ac;
231 :
232 : /* DC coef */
233 359100 : component = (n <= 3 ? 0 : (n&1) + 1);
234 359100 : dc = block[0]; /* overflow is impossible */
235 359100 : val = dc - s->last_dc[component];
236 359100 : if (n < 4) {
237 239400 : ff_mjpeg_encode_dc(&s->pb, val, m->huff_size_dc_luminance, m->huff_code_dc_luminance);
238 239400 : huff_size_ac = m->huff_size_ac_luminance;
239 239400 : huff_code_ac = m->huff_code_ac_luminance;
240 : } else {
241 119700 : ff_mjpeg_encode_dc(&s->pb, val, m->huff_size_dc_chrominance, m->huff_code_dc_chrominance);
242 119700 : huff_size_ac = m->huff_size_ac_chrominance;
243 119700 : huff_code_ac = m->huff_code_ac_chrominance;
244 : }
245 359100 : s->last_dc[component] = dc;
246 :
247 : /* AC coefs */
248 :
249 359100 : run = 0;
250 359100 : last_index = s->block_last_index[n];
251 6879268 : for(i=1;i<=last_index;i++) {
252 6520168 : j = s->intra_scantable.permutated[i];
253 6520168 : val = block[j];
254 6520168 : if (val == 0) {
255 3000879 : run++;
256 : } else {
257 7041596 : while (run >= 16) {
258 3018 : put_bits(&s->pb, huff_size_ac[0xf0], huff_code_ac[0xf0]);
259 3018 : run -= 16;
260 : }
261 3519289 : mant = val;
262 3519289 : if (val < 0) {
263 1776140 : val = -val;
264 1776140 : mant--;
265 : }
266 :
267 3519289 : nbits= av_log2_16bit(val) + 1;
268 3519289 : code = (run << 4) | nbits;
269 :
270 3519289 : put_bits(&s->pb, huff_size_ac[code], huff_code_ac[code]);
271 :
272 3519289 : put_sbits(&s->pb, nbits, mant);
273 3519289 : run = 0;
274 : }
275 : }
276 :
277 : /* output EOB only if not already 64 values */
278 359100 : if (last_index < 63 || run != 0)
279 344417 : put_bits(&s->pb, huff_size_ac[0], huff_code_ac[0]);
280 359100 : }
281 :
282 433998 : void ff_mjpeg_encode_mb(MpegEncContext *s, int16_t block[12][64])
283 : {
284 : int i;
285 433998 : if (s->huffman == HUFFMAN_TABLE_OPTIMAL) {
286 374148 : if (s->chroma_format == CHROMA_444) {
287 59850 : record_block(s, block[0], 0);
288 59850 : record_block(s, block[2], 2);
289 59850 : record_block(s, block[4], 4);
290 59850 : record_block(s, block[8], 8);
291 59850 : record_block(s, block[5], 5);
292 59850 : record_block(s, block[9], 9);
293 :
294 59850 : if (16*s->mb_x+8 < s->width) {
295 59700 : record_block(s, block[1], 1);
296 59700 : record_block(s, block[3], 3);
297 59700 : record_block(s, block[6], 6);
298 59700 : record_block(s, block[10], 10);
299 59700 : record_block(s, block[7], 7);
300 59700 : record_block(s, block[11], 11);
301 : }
302 : } else {
303 1885788 : for(i=0;i<5;i++) {
304 1571490 : record_block(s, block[i], i);
305 : }
306 314298 : if (s->chroma_format == CHROMA_420) {
307 254448 : record_block(s, block[5], 5);
308 : } else {
309 59850 : record_block(s, block[6], 6);
310 59850 : record_block(s, block[5], 5);
311 59850 : record_block(s, block[7], 7);
312 : }
313 : }
314 : } else {
315 59850 : if (s->chroma_format == CHROMA_444) {
316 0 : encode_block(s, block[0], 0);
317 0 : encode_block(s, block[2], 2);
318 0 : encode_block(s, block[4], 4);
319 0 : encode_block(s, block[8], 8);
320 0 : encode_block(s, block[5], 5);
321 0 : encode_block(s, block[9], 9);
322 :
323 0 : if (16*s->mb_x+8 < s->width) {
324 0 : encode_block(s, block[1], 1);
325 0 : encode_block(s, block[3], 3);
326 0 : encode_block(s, block[6], 6);
327 0 : encode_block(s, block[10], 10);
328 0 : encode_block(s, block[7], 7);
329 0 : encode_block(s, block[11], 11);
330 : }
331 : } else {
332 359100 : for(i=0;i<5;i++) {
333 299250 : encode_block(s, block[i], i);
334 : }
335 59850 : if (s->chroma_format == CHROMA_420) {
336 59850 : encode_block(s, block[5], 5);
337 : } else {
338 0 : encode_block(s, block[6], 6);
339 0 : encode_block(s, block[5], 5);
340 0 : encode_block(s, block[7], 7);
341 : }
342 : }
343 :
344 59850 : s->i_tex_bits += get_bits_diff(s);
345 : }
346 433998 : }
347 :
#if CONFIG_AMV_ENCODER
// maximum over s->mjpeg_vsample[i]
#define V_MAX 2
/**
 * Encode one AMV picture.
 *
 * The input frame is cloned, each of its three planes is re-pointed at
 * its last row with a negated linesize so that the picture is encoded
 * upside-down, and the result is handed to ff_mpv_encode_picture().
 *
 * @param avctx The codec context; priv_data is the MpegEncContext.
 * @param pkt The output packet.
 * @param pic_arg The input frame.
 * @param got_packet Passed through to ff_mpv_encode_picture().
 * @return The result of ff_mpv_encode_picture(), AVERROR(ENOMEM) if the
 *         frame cannot be cloned, or AVERROR_EXPERIMENTAL when the height
 *         is not a multiple of 16 and strict compliance is above
 *         FF_COMPLIANCE_UNOFFICIAL.
 */
static int amv_encode_picture(AVCodecContext *avctx, AVPacket *pkt,
                              const AVFrame *pic_arg, int *got_packet)
{
    MpegEncContext *s = avctx->priv_data;
    AVFrame *flipped;
    int plane, ret;
    int chroma_h_shift, chroma_v_shift;

    av_pix_fmt_get_chroma_sub_sample(avctx->pix_fmt, &chroma_h_shift, &chroma_v_shift);

    if ((avctx->height & 15) && avctx->strict_std_compliance > FF_COMPLIANCE_UNOFFICIAL) {
        av_log(avctx, AV_LOG_ERROR,
               "Heights which are not a multiple of 16 might fail with some decoders, "
               "use vstrict=-1 / -strict -1 to use %d anyway.\n", avctx->height);
        av_log(avctx, AV_LOG_WARNING, "If you have a device that plays AMV videos, please test if videos "
               "with such heights work with it and report your findings to ffmpeg-devel@ffmpeg.org\n");
        return AVERROR_EXPERIMENTAL;
    }

    flipped = av_frame_clone(pic_arg);
    if (!flipped)
        return AVERROR(ENOMEM);

    // The picture has to be flipped upside-down: start every plane at its
    // last row and walk backwards.
    for (plane = 0; plane < 3; plane++) {
        int vsample = 2;

        if (plane)
            vsample = 2 >> chroma_v_shift;

        flipped->data[plane]     += flipped->linesize[plane] * (vsample * s->height / V_MAX - 1);
        flipped->linesize[plane] *= -1;
    }

    ret = ff_mpv_encode_picture(avctx, pkt, flipped, got_packet);
    av_frame_free(&flipped);

    return ret;
}
#endif
384 :
385 : #define OFFSET(x) offsetof(MpegEncContext, x)
386 : #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
387 : static const AVOption options[] = {
388 : FF_MPV_COMMON_OPTS
389 : { "pred", "Prediction method", OFFSET(pred), AV_OPT_TYPE_INT, { .i64 = 1 }, 1, 3, VE, "pred" },
390 : { "left", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 1 }, INT_MIN, INT_MAX, VE, "pred" },
391 : { "plane", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 2 }, INT_MIN, INT_MAX, VE, "pred" },
392 : { "median", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 3 }, INT_MIN, INT_MAX, VE, "pred" },
393 : { "huffman", "Huffman table strategy", OFFSET(huffman), AV_OPT_TYPE_INT, { .i64 = HUFFMAN_TABLE_OPTIMAL }, 0, NB_HUFFMAN_TABLE_OPTION - 1, VE, "huffman" },
394 : { "default", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = HUFFMAN_TABLE_DEFAULT }, INT_MIN, INT_MAX, VE, "huffman" },
395 : { "optimal", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = HUFFMAN_TABLE_OPTIMAL }, INT_MIN, INT_MAX, VE, "huffman" },
396 : { NULL},
397 : };
398 :
#if CONFIG_MJPEG_ENCODER
/* AVClass exposing the shared option table for the MJPEG encoder. */
static const AVClass mjpeg_class = {
    .class_name = "mjpeg encoder",
    .item_name  = av_default_item_name,
    .option     = options,
    .version    = LIBAVUTIL_VERSION_INT,
};

/* MJPEG encoder definition; init, encode and close are the ff_mpv_*
 * entry points, with MpegEncContext as private data. */
AVCodec ff_mjpeg_encoder = {
    .name           = "mjpeg",
    .long_name      = NULL_IF_CONFIG_SMALL("MJPEG (Motion JPEG)"),
    .type           = AVMEDIA_TYPE_VIDEO,
    .id             = AV_CODEC_ID_MJPEG,
    .priv_data_size = sizeof(MpegEncContext),
    .init           = ff_mpv_encode_init,
    .encode2        = ff_mpv_encode_picture,
    .close          = ff_mpv_encode_end,
    .capabilities   = AV_CODEC_CAP_SLICE_THREADS | AV_CODEC_CAP_FRAME_THREADS | AV_CODEC_CAP_INTRA_ONLY,
    .pix_fmts       = (const enum AVPixelFormat[]) {
        AV_PIX_FMT_YUVJ420P, AV_PIX_FMT_YUVJ422P, AV_PIX_FMT_YUVJ444P, AV_PIX_FMT_NONE
    },
    .priv_class     = &mjpeg_class,
};
#endif
423 :
#if CONFIG_AMV_ENCODER
/* AVClass exposing the shared option table for the AMV encoder. */
static const AVClass amv_class = {
    .class_name = "amv encoder",
    .item_name  = av_default_item_name,
    .option     = options,
    .version    = LIBAVUTIL_VERSION_INT,
};

/* AMV encoder definition; it differs from the MJPEG one in its encode
 * callback (amv_encode_picture) and in accepting only YUVJ420P. */
AVCodec ff_amv_encoder = {
    .name           = "amv",
    .long_name      = NULL_IF_CONFIG_SMALL("AMV Video"),
    .type           = AVMEDIA_TYPE_VIDEO,
    .id             = AV_CODEC_ID_AMV,
    .priv_data_size = sizeof(MpegEncContext),
    .init           = ff_mpv_encode_init,
    .encode2        = amv_encode_picture,
    .close          = ff_mpv_encode_end,
    .pix_fmts       = (const enum AVPixelFormat[]) {
        AV_PIX_FMT_YUVJ420P, AV_PIX_FMT_NONE
    },
    .priv_class     = &amv_class,
};
#endif
|