| /* |
| * The simplest mpeg encoder (well, it was the simplest!) |
| * Copyright (c) 2000,2001 Fabrice Bellard |
| * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at> |
| * |
| * 4MV & hq & B-frame encoding stuff by Michael Niedermayer <michaelni@gmx.at> |
| * |
| * This file is part of FFmpeg. |
| * |
| * FFmpeg is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU Lesser General Public |
| * License as published by the Free Software Foundation; either |
| * version 2.1 of the License, or (at your option) any later version. |
| * |
| * FFmpeg is distributed in the hope that it will be useful, |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| * Lesser General Public License for more details. |
| * |
| * You should have received a copy of the GNU Lesser General Public |
| * License along with FFmpeg; if not, write to the Free Software |
| * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
| */ |
| |
| /** |
| * @file |
| * The simplest mpeg encoder (well, it was the simplest!). |
| */ |
| |
| #include "libavutil/attributes.h" |
| #include "libavutil/avassert.h" |
| #include "libavutil/imgutils.h" |
| #include "libavutil/internal.h" |
| #include "libavutil/intreadwrite.h" |
| #include "libavutil/mem.h" |
| |
| #include "avcodec.h" |
| #include "blockdsp.h" |
| #include "idctdsp.h" |
| #include "mathops.h" |
| #include "mpeg_er.h" |
| #include "mpegutils.h" |
| #include "mpegvideo.h" |
| #include "mpegvideodata.h" |
| #include "libavutil/refstruct.h" |
| |
| |
/**
 * Paint h rows of 16 bytes each with the value 128.
 *
 * dsp_init() installs this in the 16-pixel-wide hpel tables when
 * FF_DEBUG_NOMC is set. src is ignored; it is only there so that the
 * signature matches the table entries.
 */
static void gray16(uint8_t *dst, const uint8_t *src, ptrdiff_t linesize, int h)
{
    /* Rows are written bottom-up. */
    for (int row = h; row--; )
        memset(dst + row * linesize, 128, 16);
}
| |
/**
 * Paint h rows of 8 bytes each with the value 128.
 *
 * dsp_init() installs this in the 8-pixel-wide hpel tables when
 * FF_DEBUG_NOMC is set. src is ignored; it is only there so that the
 * signature matches the table entries.
 */
static void gray8(uint8_t *dst, const uint8_t *src, ptrdiff_t linesize, int h)
{
    /* Rows are written bottom-up. */
    for (int row = h; row--; )
        memset(dst + row * linesize, 128, 8);
}
| |
| /* init common dct for both encoder and decoder */ |
| static av_cold void dsp_init(MpegEncContext *s) |
| { |
| ff_blockdsp_init(&s->bdsp); |
| ff_hpeldsp_init(&s->hdsp, s->avctx->flags); |
| ff_videodsp_init(&s->vdsp, s->avctx->bits_per_raw_sample); |
| |
| if (s->avctx->debug & FF_DEBUG_NOMC) { |
| int i; |
| for (i=0; i<4; i++) { |
| s->hdsp.avg_pixels_tab[0][i] = gray16; |
| s->hdsp.put_pixels_tab[0][i] = gray16; |
| s->hdsp.put_no_rnd_pixels_tab[0][i] = gray16; |
| |
| s->hdsp.avg_pixels_tab[1][i] = gray8; |
| s->hdsp.put_pixels_tab[1][i] = gray8; |
| s->hdsp.put_no_rnd_pixels_tab[1][i] = gray8; |
| } |
| } |
| } |
| |
| av_cold void ff_mpv_idct_init(MpegEncContext *s) |
| { |
| if (s->codec_id == AV_CODEC_ID_MPEG4) |
| s->idsp.mpeg4_studio_profile = s->studio_profile; |
| ff_idctdsp_init(&s->idsp, s->avctx); |
| |
| /* load & permutate scantables |
| * note: only wmv uses different ones |
| */ |
| if (s->alternate_scan) { |
| ff_init_scantable(s->idsp.idct_permutation, &s->inter_scantable, ff_alternate_vertical_scan); |
| ff_init_scantable(s->idsp.idct_permutation, &s->intra_scantable, ff_alternate_vertical_scan); |
| } else { |
| ff_init_scantable(s->idsp.idct_permutation, &s->inter_scantable, ff_zigzag_direct); |
| ff_init_scantable(s->idsp.idct_permutation, &s->intra_scantable, ff_zigzag_direct); |
| } |
| } |
| |
| av_cold int ff_mpv_init_duplicate_contexts(MpegEncContext *s) |
| { |
| const int nb_slices = s->slice_context_count; |
| const size_t slice_size = s->slice_ctx_size; |
| |
| for (int i = 1; i < nb_slices; i++) { |
| s->thread_context[i] = av_memdup(s, slice_size); |
| if (!s->thread_context[i]) |
| return AVERROR(ENOMEM); |
| s->thread_context[i]->start_mb_y = |
| (s->mb_height * (i ) + nb_slices / 2) / nb_slices; |
| s->thread_context[i]->end_mb_y = |
| (s->mb_height * (i + 1) + nb_slices / 2) / nb_slices; |
| } |
| s->start_mb_y = 0; |
| s->end_mb_y = nb_slices > 1 ? (s->mb_height + nb_slices / 2) / nb_slices |
| : s->mb_height; |
| return 0; |
| } |
| |
| static av_cold void free_duplicate_context(MpegEncContext *s) |
| { |
| if (!s) |
| return; |
| |
| av_freep(&s->sc.edge_emu_buffer); |
| av_freep(&s->sc.scratchpad_buf); |
| s->sc.obmc_scratchpad = NULL; |
| s->sc.linesize = 0; |
| } |
| |
| static av_cold void free_duplicate_contexts(MpegEncContext *s) |
| { |
| for (int i = 1; i < s->slice_context_count; i++) { |
| free_duplicate_context(s->thread_context[i]); |
| av_freep(&s->thread_context[i]); |
| } |
| free_duplicate_context(s); |
| } |
| |
| int ff_update_duplicate_context(MpegEncContext *dst, const MpegEncContext *src) |
| { |
| #define COPY(M) \ |
| M(ScratchpadContext, sc) \ |
| M(int, start_mb_y) \ |
| M(int, end_mb_y) \ |
| M(int16_t*, dc_val) \ |
| M(void*, ac_val) |
| |
| int ret; |
| // FIXME copy only needed parts |
| #define BACKUP(T, member) T member = dst->member; |
| COPY(BACKUP) |
| memcpy(dst, src, sizeof(MpegEncContext)); |
| #define RESTORE(T, member) dst->member = member; |
| COPY(RESTORE) |
| |
| ret = ff_mpv_framesize_alloc(dst->avctx, &dst->sc, dst->linesize); |
| if (ret < 0) { |
| av_log(dst->avctx, AV_LOG_ERROR, "failed to allocate context " |
| "scratch buffers.\n"); |
| return ret; |
| } |
| return 0; |
| } |
| |
| /** |
| * Set the given MpegEncContext to common defaults |
| * (same for encoding and decoding). |
| * The changed fields will not depend upon the |
| * prior state of the MpegEncContext. |
| */ |
| av_cold void ff_mpv_common_defaults(MpegEncContext *s) |
| { |
| s->chroma_qscale_table = ff_default_chroma_qscale_table; |
| s->progressive_frame = 1; |
| s->progressive_sequence = 1; |
| s->picture_structure = PICT_FRAME; |
| |
| s->slice_context_count = 1; |
| } |
| |
| static av_cold void free_buffer_pools(BufferPoolContext *pools) |
| { |
| av_refstruct_pool_uninit(&pools->mbskip_table_pool); |
| av_refstruct_pool_uninit(&pools->qscale_table_pool); |
| av_refstruct_pool_uninit(&pools->mb_type_pool); |
| av_refstruct_pool_uninit(&pools->motion_val_pool); |
| av_refstruct_pool_uninit(&pools->ref_index_pool); |
| pools->alloc_mb_height = pools->alloc_mb_width = pools->alloc_mb_stride = 0; |
| } |
| |
| av_cold int ff_mpv_init_context_frame(MpegEncContext *s) |
| { |
| int nb_slices = (HAVE_THREADS && |
| s->avctx->active_thread_type & FF_THREAD_SLICE) ? |
| s->avctx->thread_count : 1; |
| BufferPoolContext *const pools = &s->buffer_pools; |
| int y_size, c_size, yc_size, mb_array_size, mv_table_size, x, y; |
| int mb_height; |
| |
| if (s->encoding && s->avctx->slices) |
| nb_slices = s->avctx->slices; |
| |
| if (s->codec_id == AV_CODEC_ID_MPEG2VIDEO && !s->progressive_sequence) |
| s->mb_height = (s->height + 31) / 32 * 2; |
| else |
| s->mb_height = (s->height + 15) / 16; |
| |
| if (nb_slices > MAX_THREADS || (nb_slices > s->mb_height && s->mb_height)) { |
| int max_slices; |
| if (s->mb_height) |
| max_slices = FFMIN(MAX_THREADS, s->mb_height); |
| else |
| max_slices = MAX_THREADS; |
| av_log(s->avctx, AV_LOG_WARNING, "too many threads/slices (%d)," |
| " reducing to %d\n", nb_slices, max_slices); |
| nb_slices = max_slices; |
| } |
| |
| s->slice_context_count = nb_slices; |
| |
| /* VC-1 can change from being progressive to interlaced on a per-frame |
| * basis. We therefore allocate certain buffers so big that they work |
| * in both instances. */ |
| mb_height = s->msmpeg4_version == MSMP4_VC1 ? |
| FFALIGN(s->mb_height, 2) : s->mb_height; |
| |
| s->mb_width = (s->width + 15) / 16; |
| s->mb_stride = s->mb_width + 1; |
| s->b8_stride = s->mb_width * 2 + 1; |
| mb_array_size = mb_height * s->mb_stride; |
| mv_table_size = (mb_height + 2) * s->mb_stride + 1; |
| |
| /* set default edge pos, will be overridden |
| * in decode_header if needed */ |
| s->h_edge_pos = s->mb_width * 16; |
| s->v_edge_pos = s->mb_height * 16; |
| |
| s->mb_num = s->mb_width * s->mb_height; |
| |
| s->block_wrap[0] = |
| s->block_wrap[1] = |
| s->block_wrap[2] = |
| s->block_wrap[3] = s->b8_stride; |
| s->block_wrap[4] = |
| s->block_wrap[5] = s->mb_stride; |
| |
| y_size = s->b8_stride * (2 * mb_height + 1); |
| c_size = s->mb_stride * (mb_height + 1); |
| yc_size = y_size + 2 * c_size; |
| |
| if (!FF_ALLOCZ_TYPED_ARRAY(s->mb_index2xy, s->mb_num + 1)) |
| return AVERROR(ENOMEM); |
| for (y = 0; y < s->mb_height; y++) |
| for (x = 0; x < s->mb_width; x++) |
| s->mb_index2xy[x + y * s->mb_width] = x + y * s->mb_stride; |
| |
| s->mb_index2xy[s->mb_height * s->mb_width] = (s->mb_height - 1) * s->mb_stride + s->mb_width; // FIXME really needed? |
| |
| #define ALLOC_POOL(name, size, flags) do { \ |
| pools->name ##_pool = av_refstruct_pool_alloc((size), (flags)); \ |
| if (!pools->name ##_pool) \ |
| return AVERROR(ENOMEM); \ |
| } while (0) |
| |
| if (s->codec_id == AV_CODEC_ID_MPEG4 || |
| (s->avctx->flags & AV_CODEC_FLAG_INTERLACED_ME)) { |
| /* interlaced direct mode decoding tables */ |
| int16_t (*tmp)[2] = av_calloc(mv_table_size, 4 * sizeof(*tmp)); |
| if (!tmp) |
| return AVERROR(ENOMEM); |
| s->p_field_mv_table_base = tmp; |
| tmp += s->mb_stride + 1; |
| for (int i = 0; i < 2; i++) { |
| for (int j = 0; j < 2; j++) { |
| s->p_field_mv_table[i][j] = tmp; |
| tmp += mv_table_size; |
| } |
| } |
| if (s->codec_id == AV_CODEC_ID_MPEG4) { |
| ALLOC_POOL(mbskip_table, mb_array_size + 2, |
| !s->encoding ? AV_REFSTRUCT_POOL_FLAG_ZERO_EVERY_TIME : 0); |
| if (!s->encoding) { |
| /* cbp, pred_dir */ |
| if (!(s->cbp_table = av_mallocz(mb_array_size)) || |
| !(s->pred_dir_table = av_mallocz(mb_array_size))) |
| return AVERROR(ENOMEM); |
| } |
| } |
| } |
| |
| if (s->msmpeg4_version >= MSMP4_V3) { |
| s->coded_block_base = av_mallocz(y_size); |
| if (!s->coded_block_base) |
| return AVERROR(ENOMEM); |
| s->coded_block = s->coded_block_base + s->b8_stride + 1; |
| } |
| |
| if (s->h263_pred || s->h263_aic || !s->encoding) { |
| // When encoding, each slice (and therefore each thread) |
| // gets its own ac_val and dc_val buffers in order to avoid |
| // races. |
| size_t allslice_yc_size = yc_size * (s->encoding ? nb_slices : 1); |
| if (s->out_format == FMT_H263) { |
| /* ac values */ |
| if (!FF_ALLOCZ_TYPED_ARRAY(s->ac_val_base, allslice_yc_size)) |
| return AVERROR(ENOMEM); |
| s->ac_val = s->ac_val_base + s->b8_stride + 1; |
| } |
| |
| /* dc values */ |
| // MN: we need these for error resilience of intra-frames |
| // Allocating them unconditionally for decoders also means |
| // that we don't need to reinitialize when e.g. h263_aic changes. |
| |
| // y_size and therefore yc_size is always odd; allocate one element |
| // more for each encoder slice in order to be able to align each slice's |
| // dc_val to four in order to use aligned stores when cleaning dc_val. |
| allslice_yc_size += s->encoding * nb_slices; |
| if (!FF_ALLOC_TYPED_ARRAY(s->dc_val_base, allslice_yc_size)) |
| return AVERROR(ENOMEM); |
| s->dc_val = s->dc_val_base + s->b8_stride + 1; |
| for (size_t i = 0; i < allslice_yc_size; ++i) |
| s->dc_val_base[i] = 1024; |
| } |
| |
| // Note the + 1 is for a quicker MPEG-4 slice_end detection |
| if (!(s->mbskip_table = av_mallocz(mb_array_size + 2)) || |
| /* which mb is an intra block, init macroblock skip table */ |
| !(s->mbintra_table = av_mallocz(mb_array_size))) |
| return AVERROR(ENOMEM); |
| |
| ALLOC_POOL(qscale_table, mv_table_size, 0); |
| ALLOC_POOL(mb_type, mv_table_size * sizeof(uint32_t), 0); |
| |
| if (s->out_format == FMT_H263 || s->encoding || |
| (s->avctx->export_side_data & AV_CODEC_EXPORT_DATA_MVS)) { |
| const int b8_array_size = s->b8_stride * mb_height * 2; |
| int mv_size = 2 * (b8_array_size + 4) * sizeof(int16_t); |
| int ref_index_size = 4 * mb_array_size; |
| |
| /* FIXME: The output of H.263 with OBMC depends upon |
| * the earlier content of the buffer; therefore we set |
| * the flags to always reset returned buffers here. */ |
| ALLOC_POOL(motion_val, mv_size, AV_REFSTRUCT_POOL_FLAG_ZERO_EVERY_TIME); |
| ALLOC_POOL(ref_index, ref_index_size, 0); |
| } |
| #undef ALLOC_POOL |
| pools->alloc_mb_width = s->mb_width; |
| pools->alloc_mb_height = mb_height; |
| pools->alloc_mb_stride = s->mb_stride; |
| |
| return !CONFIG_MPEGVIDEODEC || s->encoding ? 0 : ff_mpeg_er_init(s); |
| } |
| |
| /** |
| * init common structure for both encoder and decoder. |
| * this assumes that some variables like width/height are already set |
| */ |
| av_cold int ff_mpv_common_init(MpegEncContext *s) |
| { |
| int ret; |
| |
| if (s->avctx->pix_fmt == AV_PIX_FMT_NONE) { |
| av_log(s->avctx, AV_LOG_ERROR, |
| "decoding to AV_PIX_FMT_NONE is not supported.\n"); |
| return AVERROR(EINVAL); |
| } |
| |
| if ((s->width || s->height) && |
| av_image_check_size(s->width, s->height, 0, s->avctx)) |
| return AVERROR(EINVAL); |
| |
| dsp_init(s); |
| |
| /* set chroma shifts */ |
| ret = av_pix_fmt_get_chroma_sub_sample(s->avctx->pix_fmt, |
| &s->chroma_x_shift, |
| &s->chroma_y_shift); |
| if (ret) |
| return ret; |
| |
| if ((ret = ff_mpv_init_context_frame(s))) |
| goto fail; |
| |
| s->context_initialized = 1; |
| s->thread_context[0] = s; |
| |
| // if (s->width && s->height) { |
| if (!s->encoding) { |
| ret = ff_mpv_init_duplicate_contexts(s); |
| if (ret < 0) |
| goto fail; |
| } |
| // } |
| |
| return 0; |
| fail: |
| ff_mpv_common_end(s); |
| return ret; |
| } |
| |
| av_cold void ff_mpv_free_context_frame(MpegEncContext *s) |
| { |
| free_duplicate_contexts(s); |
| |
| free_buffer_pools(&s->buffer_pools); |
| av_freep(&s->p_field_mv_table_base); |
| for (int i = 0; i < 2; i++) |
| for (int j = 0; j < 2; j++) |
| s->p_field_mv_table[i][j] = NULL; |
| |
| av_freep(&s->ac_val_base); |
| av_freep(&s->dc_val_base); |
| av_freep(&s->coded_block_base); |
| av_freep(&s->mbintra_table); |
| av_freep(&s->cbp_table); |
| av_freep(&s->pred_dir_table); |
| |
| av_freep(&s->mbskip_table); |
| |
| av_freep(&s->er.error_status_table); |
| av_freep(&s->er.er_temp_buffer); |
| av_freep(&s->mb_index2xy); |
| |
| s->linesize = s->uvlinesize = 0; |
| } |
| |
| av_cold void ff_mpv_common_end(MpegEncContext *s) |
| { |
| ff_mpv_free_context_frame(s); |
| if (s->slice_context_count > 1) |
| s->slice_context_count = 1; |
| |
| ff_mpv_unref_picture(&s->last_pic); |
| ff_mpv_unref_picture(&s->cur_pic); |
| ff_mpv_unref_picture(&s->next_pic); |
| |
| s->context_initialized = 0; |
| s->context_reinit = 0; |
| s->linesize = s->uvlinesize = 0; |
| } |
| |
| |
| /** |
| * Clean dc, ac for the current non-intra MB. |
| */ |
| void ff_clean_intra_table_entries(MpegEncContext *s) |
| { |
| int wrap = s->b8_stride; |
| int xy = s->block_index[0]; |
| /* chroma */ |
| unsigned uxy = s->block_index[4]; |
| unsigned vxy = s->block_index[5]; |
| int16_t *dc_val = s->dc_val; |
| |
| AV_WN32A(dc_val + xy, 1024 << 16 | 1024); |
| AV_WN32 (dc_val + xy + wrap, 1024 << 16 | 1024); |
| dc_val[uxy] = |
| dc_val[vxy] = 1024; |
| /* ac pred */ |
| int16_t (*ac_val)[16] = s->ac_val; |
| av_assume(!((uintptr_t)ac_val & 0xF)); |
| // Don't reset the upper-left luma block, as it will only ever be |
| // referenced by blocks from the same macroblock. |
| memset(ac_val[xy + 1], 0, sizeof(*ac_val)); |
| memset(ac_val[xy + wrap], 0, 2 * sizeof(*ac_val)); |
| /* ac pred */ |
| memset(ac_val[uxy], 0, sizeof(*ac_val)); |
| memset(ac_val[vxy], 0, sizeof(*ac_val)); |
| } |
| |
| void ff_init_block_index(MpegEncContext *s){ //FIXME maybe rename |
| const int linesize = s->cur_pic.linesize[0]; //not s->linesize as this would be wrong for field pics |
| const int uvlinesize = s->cur_pic.linesize[1]; |
| const int width_of_mb = (4 + (s->avctx->bits_per_raw_sample > 8)) - s->avctx->lowres; |
| const int height_of_mb = 4 - s->avctx->lowres; |
| |
| s->block_index[0]= s->b8_stride*(s->mb_y*2 ) - 2 + s->mb_x*2; |
| s->block_index[1]= s->b8_stride*(s->mb_y*2 ) - 1 + s->mb_x*2; |
| s->block_index[2]= s->b8_stride*(s->mb_y*2 + 1) - 2 + s->mb_x*2; |
| s->block_index[3]= s->b8_stride*(s->mb_y*2 + 1) - 1 + s->mb_x*2; |
| s->block_index[4]= s->mb_stride*(s->mb_y + 1) + s->b8_stride*s->mb_height*2 + s->mb_x - 1; |
| s->block_index[5]= s->mb_stride*(s->mb_y + s->mb_height + 2) + s->b8_stride*s->mb_height*2 + s->mb_x - 1; |
| //block_index is not used by mpeg2, so it is not affected by chroma_format |
| |
| s->dest[0] = s->cur_pic.data[0] + (int)((s->mb_x - 1U) << width_of_mb); |
| s->dest[1] = s->cur_pic.data[1] + (int)((s->mb_x - 1U) << (width_of_mb - s->chroma_x_shift)); |
| s->dest[2] = s->cur_pic.data[2] + (int)((s->mb_x - 1U) << (width_of_mb - s->chroma_x_shift)); |
| |
| if (s->picture_structure == PICT_FRAME) { |
| s->dest[0] += s->mb_y * linesize << height_of_mb; |
| s->dest[1] += s->mb_y * uvlinesize << (height_of_mb - s->chroma_y_shift); |
| s->dest[2] += s->mb_y * uvlinesize << (height_of_mb - s->chroma_y_shift); |
| } else { |
| s->dest[0] += (s->mb_y>>1) * linesize << height_of_mb; |
| s->dest[1] += (s->mb_y>>1) * uvlinesize << (height_of_mb - s->chroma_y_shift); |
| s->dest[2] += (s->mb_y>>1) * uvlinesize << (height_of_mb - s->chroma_y_shift); |
| av_assert1((s->mb_y&1) == (s->picture_structure == PICT_BOTTOM_FIELD)); |
| } |
| } |
| |
| /** |
| * set qscale and update qscale dependent variables. |
| */ |
| void ff_set_qscale(MpegEncContext * s, int qscale) |
| { |
| if (qscale < 1) |
| qscale = 1; |
| else if (qscale > 31) |
| qscale = 31; |
| |
| s->qscale = qscale; |
| s->chroma_qscale= s->chroma_qscale_table[qscale]; |
| |
| s->y_dc_scale= s->y_dc_scale_table[ qscale ]; |
| s->c_dc_scale= s->c_dc_scale_table[ s->chroma_qscale ]; |
| } |