/*
* Copyright (c) 2003 Michael Niedermayer
*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
/**
* @file
* ASUS V1/V2 encoder.
*/
#include "config_components.h"
#include "libavutil/attributes.h"
#include "libavutil/intreadwrite.h"
#include "libavutil/mem.h"
#include "libavutil/mem_internal.h"
#include "aandcttab.h"
#include "asv.h"
#include "avcodec.h"
#include "codec_internal.h"
#include "encode.h"
#include "fdctdsp.h"
#include "mpeg12data.h"
#include "pixblockdsp.h"
#include "put_bits.h"
typedef struct ASVEncContext {
ASVCommonContext c;
PutBitContext pb;
void (*get_pixels)(int16_t *restrict block,
const uint8_t *pixels,
ptrdiff_t stride);
PixblockDSPContext pdsp;
FDCTDSPContext fdsp;
DECLARE_ALIGNED(32, int16_t, block)[6][64];
int q_intra_matrix[64];
} ASVEncContext;
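/* Worst-case coded sizes: the per-block and per-macroblock values are in
 * bits; MAX_MB_SIZE is the larger of the two macroblock sizes rounded up
 * to bytes, and is used for packet allocation and the buffer-space assert. */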
enum {
ASV1_MAX_BLOCK_SIZE = 8 + 10 * FFMAX(2 /* skip */, 5 /* ccp */ + 4 * 11 /* level */) + 5,
ASV1_MAX_MB_SIZE = 6 * ASV1_MAX_BLOCK_SIZE,
ASV2_MAX_BLOCK_SIZE = 4 + 8 + 16 * (6 /* ccp */ + 4 * 13 /* level */),
ASV2_MAX_MB_SIZE = 6 * ASV2_MAX_BLOCK_SIZE,
MAX_MB_SIZE = (FFMAX(ASV1_MAX_MB_SIZE, ASV2_MAX_MB_SIZE) + 7) / 8
};
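/* Write one quantized level for ASV1: levels in -3..3 use the VLC table,
 * anything larger is coded as the escape code followed by 8 bits. */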
static inline void asv1_put_level(PutBitContext *pb, int level)
{
unsigned int index = level + 3;
unsigned n, code;
if (index <= 6) {
n = ff_asv_level_tab[index][1];
code = ff_asv_level_tab[index][0];
} else {
n = 3 + 8;
code = (0 /* Escape code */ << 8) | (level & 0xFF);
}
put_bits(pb, n, code);
}
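/* Write one quantized level for ASV2 (little-endian bit order): levels in
 * -31..31 use the VLC table, larger ones are escaped to 8 bits and clipped
 * to the signed 8-bit range with a warning. */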
static inline void asv2_put_level(ASVEncContext *a, PutBitContext *pb, int level)
{
unsigned int index = level + 31;
unsigned n, code;
if (index <= 62) {
n = ff_asv2_level_tab[index][1];
code = ff_asv2_level_tab[index][0];
} else {
if (level < -128 || level > 127) {
av_log(a->c.avctx, AV_LOG_WARNING, "Clipping level %d, increase qscale\n", level);
level = av_clip_int8(level);
}
n = 5 + 8;
code = (level & 0xFF) << 5 | /* Escape code */ 0;
}
put_bits_le(pb, n, code);
}
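/* Encode one 8x8 block for ASV1: write the 8-bit DC value, then quantize and
 * code the first ten 2x2 coefficient groups along the scantable, each nonzero
 * group preceded by a coded-coefficient-pattern (ccp) VLC; runs of empty
 * groups are accumulated as 2-bit skip codes, and the block ends with the
 * 5-bit end-of-block code. */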
static inline void asv1_encode_block(ASVEncContext *a, int16_t block[64])
{
put_bits(&a->pb, 8, (block[0] + 32) >> 6);
block[0] = 0;
for (unsigned i = 0, nc_bits = 0, nc_val = 0; i < 10; i++) {
const int index = ff_asv_scantab[4 * i];
int ccp = 0;
if ((block[index + 0] = (block[index + 0] *
a->q_intra_matrix[index + 0] + (1 << 15)) >> 16))
ccp |= 8;
if ((block[index + 8] = (block[index + 8] *
a->q_intra_matrix[index + 8] + (1 << 15)) >> 16))
ccp |= 4;
if ((block[index + 1] = (block[index + 1] *
a->q_intra_matrix[index + 1] + (1 << 15)) >> 16))
ccp |= 2;
if ((block[index + 9] = (block[index + 9] *
a->q_intra_matrix[index + 9] + (1 << 15)) >> 16))
ccp |= 1;
if (ccp) {
put_bits(&a->pb, nc_bits + ff_asv_ccp_tab[ccp][1],
nc_val << ff_asv_ccp_tab[ccp][1] /* Skip */ |
ff_asv_ccp_tab[ccp][0]);
nc_bits = 0;
nc_val = 0;
if (ccp & 8)
asv1_put_level(&a->pb, block[index + 0]);
if (ccp & 4)
asv1_put_level(&a->pb, block[index + 8]);
if (ccp & 2)
asv1_put_level(&a->pb, block[index + 1]);
if (ccp & 1)
asv1_put_level(&a->pb, block[index + 9]);
} else {
nc_bits += 2;
nc_val = (nc_val << 2) | 2;
}
}
put_bits(&a->pb, 5, 0xF); /* End of block */
}
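/* Encode one 8x8 block for ASV2 (little-endian bit order): scan backwards for
 * the last nonzero quantized coefficient to find how many 2x2 groups need
 * coding, write that group count together with the DC value, then code each
 * group with a DC/AC coefficient-pattern VLC followed by its nonzero levels. */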
static inline void asv2_encode_block(ASVEncContext *a, int16_t block[64])
{
int i;
int count = 0;
for (count = 63; count > 3; count--) {
const int index = ff_asv_scantab[count];
if ((block[index] * a->q_intra_matrix[index] + (1 << 15)) >> 16)
break;
}
count >>= 2;
put_bits_le(&a->pb, 4 + 8, count /* 4 bits */ |
(/* DC */(block[0] + 32) >> 6) << 4);
block[0] = 0;
for (i = 0; i <= count; i++) {
const int index = ff_asv_scantab[4 * i];
int ccp = 0;
if ((block[index + 0] = (block[index + 0] *
a->q_intra_matrix[index + 0] + (1 << 15)) >> 16))
ccp |= 8;
if ((block[index + 8] = (block[index + 8] *
a->q_intra_matrix[index + 8] + (1 << 15)) >> 16))
ccp |= 4;
if ((block[index + 1] = (block[index + 1] *
a->q_intra_matrix[index + 1] + (1 << 15)) >> 16))
ccp |= 2;
if ((block[index + 9] = (block[index + 9] *
a->q_intra_matrix[index + 9] + (1 << 15)) >> 16))
ccp |= 1;
av_assert2(i || ccp < 8);
if (i)
put_bits_le(&a->pb, ff_asv_ac_ccp_tab[ccp][1], ff_asv_ac_ccp_tab[ccp][0]);
else
put_bits_le(&a->pb, ff_asv_dc_ccp_tab[ccp][1], ff_asv_dc_ccp_tab[ccp][0]);
if (ccp) {
if (ccp & 8)
asv2_put_level(a, &a->pb, block[index + 0]);
if (ccp & 4)
asv2_put_level(a, &a->pb, block[index + 8]);
if (ccp & 2)
asv2_put_level(a, &a->pb, block[index + 1]);
if (ccp & 1)
asv2_put_level(a, &a->pb, block[index + 9]);
}
}
}
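/* Encode the six 8x8 blocks of one macroblock with the codec-specific block
 * coder; the assert guarantees the packet buffer still has room for a
 * worst-case macroblock. */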
static inline int encode_mb(ASVEncContext *a, int16_t block[6][64])
{
int i;
av_assert0(put_bytes_left(&a->pb, 0) >= MAX_MB_SIZE);
if (a->c.avctx->codec_id == AV_CODEC_ID_ASV1) {
for (i = 0; i < 6; i++)
asv1_encode_block(a, block[i]);
} else {
for (i = 0; i < 6; i++) {
asv2_encode_block(a, block[i]);
}
}
return 0;
}
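/* Fetch one 16x16 macroblock from the frame and forward-DCT it: the four luma
 * blocks always, the two chroma blocks only when gray-only coding is not
 * requested. */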
static inline void dct_get(ASVEncContext *a, const AVFrame *frame,
int mb_x, int mb_y)
{
int16_t (*block)[64] = a->block;
int linesize = frame->linesize[0];
int i;
const uint8_t *ptr_y = frame->data[0] + (mb_y * 16 * linesize) + mb_x * 16;
const uint8_t *ptr_cb = frame->data[1] + (mb_y * 8 * frame->linesize[1]) + mb_x * 8;
const uint8_t *ptr_cr = frame->data[2] + (mb_y * 8 * frame->linesize[2]) + mb_x * 8;
a->get_pixels(block[0], ptr_y, linesize);
a->get_pixels(block[1], ptr_y + 8, linesize);
a->get_pixels(block[2], ptr_y + 8 * linesize, linesize);
a->get_pixels(block[3], ptr_y + 8 * linesize + 8, linesize);
for (i = 0; i < 4; i++)
a->fdsp.fdct(block[i]);
if (!(a->c.avctx->flags & AV_CODEC_FLAG_GRAY)) {
a->get_pixels(block[4], ptr_cb, frame->linesize[1]);
a->get_pixels(block[5], ptr_cr, frame->linesize[2]);
for (i = 4; i < 6; i++)
a->fdsp.fdct(block[i]);
}
}
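/* Encode a macroblock that extends beyond the frame's right or bottom edge:
 * valid pixels are copied into the block buffer with the last valid column
 * and row replicated to fill each 8x8 block; blocks that lie completely
 * outside the visible area are zeroed so that only a DC value gets coded. */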
static void handle_partial_mb(ASVEncContext *a, const uint8_t *const data[3],
const int linesizes[3],
int valid_width, int valid_height)
{
const int nb_blocks = a->c.avctx->flags & AV_CODEC_FLAG_GRAY ? 4 : 6;
static const struct Descriptor {
uint8_t x_offset, y_offset;
uint8_t component, subsampling;
} block_descriptor[] = {
{ 0, 0, 0, 0 }, { 8, 0, 0, 0 }, { 0, 8, 0, 0 }, { 8, 8, 0, 0 },
{ 0, 0, 1, 1 }, { 0, 0, 2, 1 },
};
for (int i = 0; i < nb_blocks; ++i) {
const struct Descriptor *const desc = block_descriptor + i;
int width_avail = AV_CEIL_RSHIFT(valid_width, desc->subsampling) - desc->x_offset;
int height_avail = AV_CEIL_RSHIFT(valid_height, desc->subsampling) - desc->y_offset;
if (width_avail <= 0 || height_avail <= 0) {
// This block is outside of the visible part; don't replicate pixels,
// just zero the block, so that only the dc value will be coded.
memset(a->block[i], 0, sizeof(a->block[i]));
continue;
}
width_avail = FFMIN(width_avail, 8);
height_avail = FFMIN(height_avail, 8);
ptrdiff_t linesize = linesizes[desc->component];
const uint8_t *src = data[desc->component] + desc->y_offset * linesize + desc->x_offset;
int16_t *block = a->block[i];
for (int h = 0;; block += 8, src += linesize) {
int16_t last;
for (int w = 0; w < width_avail; ++w)
last = block[w] = src[w];
for (int w = width_avail; w < 8; ++w)
block[w] = last;
if (++h == height_avail)
break;
}
const int16_t *const last_row = block;
for (int h = height_avail; h < 8; ++h) {
block += 8;
AV_COPY128(block, last_row);
}
a->fdsp.fdct(a->block[i]);
}
encode_mb(a, a->block);
}
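/* Encode one frame: allocate a worst-case packet, pick the aligned or
 * unaligned pixel-fetch function depending on the input layout, code all
 * complete macroblocks, then handle the partial macroblocks at the right and
 * bottom edges. The output is zero-padded to a multiple of 32 bits and, for
 * ASV1, byte-swapped in 32-bit words. */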
static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,
const AVFrame *pict, int *got_packet)
{
ASVEncContext *const a = avctx->priv_data;
const ASVCommonContext *const c = &a->c;
int size, ret;
ret = ff_alloc_packet(avctx, pkt, c->mb_height * c->mb_width * MAX_MB_SIZE + 3);
if (ret < 0)
return ret;
if (!PIXBLOCKDSP_8BPP_GET_PIXELS_SUPPORTS_UNALIGNED &&
((uintptr_t)pict->data[0] & 7 || pict->linesize[0] & 7 ||
(uintptr_t)pict->data[1] & 7 || pict->linesize[1] & 7 ||
(uintptr_t)pict->data[2] & 7 || pict->linesize[2] & 7))
a->get_pixels = a->pdsp.get_pixels_unaligned;
else
a->get_pixels = a->pdsp.get_pixels;
init_put_bits(&a->pb, pkt->data, pkt->size);
for (int mb_y = 0; mb_y < c->mb_height2; mb_y++) {
for (int mb_x = 0; mb_x < c->mb_width2; mb_x++) {
dct_get(a, pict, mb_x, mb_y);
encode_mb(a, a->block);
}
}
if (avctx->width & 15) {
const uint8_t *src[3] = {
pict->data[0] + c->mb_width2 * 16,
pict->data[1] + c->mb_width2 * 8,
pict->data[2] + c->mb_width2 * 8,
};
int available_width = avctx->width & 15;
for (int mb_y = 0; mb_y < c->mb_height2; mb_y++) {
handle_partial_mb(a, src, pict->linesize, available_width, 16);
src[0] += 16 * pict->linesize[0];
src[1] += 8 * pict->linesize[1];
src[2] += 8 * pict->linesize[2];
}
}
if (avctx->height & 15) {
const uint8_t *src[3] = {
pict->data[0] + c->mb_height2 * 16 * pict->linesize[0],
pict->data[1] + c->mb_height2 * 8 * pict->linesize[1],
pict->data[2] + c->mb_height2 * 8 * pict->linesize[2],
};
int available_height = avctx->height & 15;
for (int remaining = avctx->width;; remaining -= 16) {
handle_partial_mb(a, src, pict->linesize, remaining, available_height);
if (remaining <= 16)
break;
src[0] += 16;
src[1] += 8;
src[2] += 8;
}
}
if (avctx->codec_id == AV_CODEC_ID_ASV1)
flush_put_bits(&a->pb);
else
flush_put_bits_le(&a->pb);
AV_WN32(put_bits_ptr(&a->pb), 0);
size = (put_bytes_output(&a->pb) + 3) / 4;
if (avctx->codec_id == AV_CODEC_ID_ASV1) {
c->bbdsp.bswap_buf((uint32_t *) pkt->data,
(uint32_t *) pkt->data, size);
}
pkt->size = size * 4;
*got_packet = 1;
return 0;
}
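/* Initialize the encoder: derive the inverse qscale from the requested global
 * quality, store it in the extradata together with the 'ASUS' tag, and build
 * the fixed-point quantization matrix (with AAN scaling when the ifast DCT
 * is in use). */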
static av_cold int encode_init(AVCodecContext *avctx)
{
ASVEncContext *const a = avctx->priv_data;
int i;
const int scale = avctx->codec_id == AV_CODEC_ID_ASV1 ? 1 : 2;
int inv_qscale;
ff_asv_common_init(avctx);
ff_fdctdsp_init(&a->fdsp, avctx);
ff_pixblockdsp_init(&a->pdsp, 8);
if (avctx->global_quality <= 0)
avctx->global_quality = 4 * FF_QUALITY_SCALE;
inv_qscale = (32 * scale * FF_QUALITY_SCALE +
avctx->global_quality / 2) / avctx->global_quality;
avctx->extradata = av_mallocz(8);
if (!avctx->extradata)
return AVERROR(ENOMEM);
avctx->extradata_size = 8;
AV_WL32A(avctx->extradata, inv_qscale);
AV_WL32A(avctx->extradata + 4, MKTAG('A', 'S', 'U', 'S'));
for (i = 0; i < 64; i++) {
if (a->fdsp.fdct == ff_fdct_ifast) {
int q = 32LL * scale * ff_mpeg1_default_intra_matrix[i] * ff_aanscales[i];
a->q_intra_matrix[i] = (((int64_t)inv_qscale << 30) + q / 2) / q;
} else {
int q = 32 * scale * ff_mpeg1_default_intra_matrix[i];
a->q_intra_matrix[i] = ((inv_qscale << 16) + q / 2) / q;
}
}
return 0;
}
#if CONFIG_ASV1_ENCODER
const FFCodec ff_asv1_encoder = {
.p.name = "asv1",
CODEC_LONG_NAME("ASUS V1"),
.p.type = AVMEDIA_TYPE_VIDEO,
.p.id = AV_CODEC_ID_ASV1,
.p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE,
.priv_data_size = sizeof(ASVEncContext),
.init = encode_init,
FF_CODEC_ENCODE_CB(encode_frame),
CODEC_PIXFMTS(AV_PIX_FMT_YUV420P),
.color_ranges = AVCOL_RANGE_MPEG,
};
#endif
#if CONFIG_ASV2_ENCODER
const FFCodec ff_asv2_encoder = {
.p.name = "asv2",
CODEC_LONG_NAME("ASUS V2"),
.p.type = AVMEDIA_TYPE_VIDEO,
.p.id = AV_CODEC_ID_ASV2,
.p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE,
.priv_data_size = sizeof(ASVEncContext),
.init = encode_init,
FF_CODEC_ENCODE_CB(encode_frame),
CODEC_PIXFMTS(AV_PIX_FMT_YUV420P),
.color_ranges = AVCOL_RANGE_MPEG,
};
#endif