blob: c15c3516973e4631b0c4f3a8a7f8dbd34ca2cdf1 [file] [log] [blame]
/**************************************************************************
*
* Copyright 2013 Advanced Micro Devices, Inc.
* All Rights Reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the
* "Software"), to deal in the Software without restriction, including
* without limitation the rights to use, copy, modify, merge, publish,
* distribute, sub license, and/or sell copies of the Software, and to
* permit persons to whom the Software is furnished to do so, subject to
* the following conditions:
*
* The above copyright notice and this permission notice (including the
* next paragraph) shall be included in all copies or substantial portions
* of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
* IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR
* ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*
**************************************************************************/
#include "vid_enc_common.h"
#include "vl/vl_video_buffer.h"
#include "tgsi/tgsi_text.h"
/**
 * Destroy every encode task linked into \p head.
 *
 * For each entry the reference to its bitstream resource is dropped, its
 * video buffer is destroyed through the buffer's own destroy hook, and the
 * task structure is freed.  The call is a no-op when \p head is NULL or when
 * its next pointer is NULL.
 *
 * \param head  list head whose entries are struct encode_task.
 */
void enc_ReleaseTasks(struct list_head *head)
{
   struct encode_task *task, *tmp;

   if (head == NULL || head->next == NULL)
      return;

   /* The _SAFE iterator keeps the successor in tmp, so freeing task is fine. */
   LIST_FOR_EACH_ENTRY_SAFE(task, tmp, head, list) {
      pipe_resource_reference(&task->bitstream, NULL);
      task->buf->destroy(task->buf);
      FREE(task);
   }
}
/**
 * Splice every entry of \p from onto the tail of \p to, then re-initialise
 * \p from with list_inithead().
 *
 * The four pointer updates below are order-dependent and must not be
 * rewritten with cached next/prev pointers: from->prev is re-read after the
 * second statement may have overwritten it.  When \p from is empty
 * (from->next == from) the second statement sets from->prev to the old tail
 * of \p to, so the last two statements restore \p to to its original state.
 *
 * \param from  list to drain.
 * \param to    list that receives the entries at its tail.
 */
void enc_MoveTasks(struct list_head *from, struct list_head *to)
{
/* old tail of 'to' -> first entry of 'from' */
to->prev->next = from->next;
/* first entry of 'from' -> back to old tail of 'to' */
from->next->prev = to->prev;
/* last entry of 'from' (re-read, see above) -> head of 'to' */
from->prev->next = to;
/* head of 'to' -> new tail */
to->prev = from->prev;
list_inithead(from);
}
/**
 * Write the fixed preset values used by this encoder into \p picture:
 * the picture-control constraint-set flags and three motion-estimation
 * fields (sub-mode disable mask and the IME2 search range in x and y).
 */
static void enc_GetPictureParamPreset(struct pipe_h264_enc_picture_desc *picture)
{
   /* Picture control. */
   picture->pic_ctrl.enc_constraint_set_flags = 0x00000040;

   /* Motion estimation. */
   picture->motion_est.enc_ime2_search_range_x = 0x00000001;
   picture->motion_est.enc_ime2_search_range_y = 0x00000001;
   picture->motion_est.enc_disable_sub_mode = 0x000000fe;
}
enum pipe_video_profile enc_TranslateOMXProfileToPipe(unsigned omx_profile)
{
switch (omx_profile) {
case OMX_VIDEO_AVCProfileBaseline:
return PIPE_VIDEO_PROFILE_MPEG4_AVC_BASELINE;
case OMX_VIDEO_AVCProfileMain:
return PIPE_VIDEO_PROFILE_MPEG4_AVC_MAIN;
case OMX_VIDEO_AVCProfileExtended:
return PIPE_VIDEO_PROFILE_MPEG4_AVC_EXTENDED;
case OMX_VIDEO_AVCProfileHigh:
return PIPE_VIDEO_PROFILE_MPEG4_AVC_HIGH;
case OMX_VIDEO_AVCProfileHigh10:
return PIPE_VIDEO_PROFILE_MPEG4_AVC_HIGH10;
case OMX_VIDEO_AVCProfileHigh422:
return PIPE_VIDEO_PROFILE_MPEG4_AVC_HIGH422;
case OMX_VIDEO_AVCProfileHigh444:
return PIPE_VIDEO_PROFILE_MPEG4_AVC_HIGH444;
default:
return PIPE_VIDEO_PROFILE_UNKNOWN;
}
}
/**
 * Map an OMX AVC level identifier to the two-digit level number used by the
 * pipe encoder (e.g. OMX_VIDEO_AVCLevel31 -> 31).
 *
 * Level 1 and level 1b both map to 10.  Any value that is not one of the
 * listed OMX levels is treated like level 4.2 and yields 42.
 *
 * \param omx_level  one of the OMX_VIDEO_AVCLevel* values.
 * \return the numeric level.
 */
unsigned enc_TranslateOMXLevelToPipe(unsigned omx_level)
{
   unsigned level;

   switch (omx_level) {
   case OMX_VIDEO_AVCLevel1:
   case OMX_VIDEO_AVCLevel1b:
      level = 10;
      break;
   case OMX_VIDEO_AVCLevel11:
      level = 11;
      break;
   case OMX_VIDEO_AVCLevel12:
      level = 12;
      break;
   case OMX_VIDEO_AVCLevel13:
      level = 13;
      break;
   case OMX_VIDEO_AVCLevel2:
      level = 20;
      break;
   case OMX_VIDEO_AVCLevel21:
      level = 21;
      break;
   case OMX_VIDEO_AVCLevel22:
      level = 22;
      break;
   case OMX_VIDEO_AVCLevel3:
      level = 30;
      break;
   case OMX_VIDEO_AVCLevel31:
      level = 31;
      break;
   case OMX_VIDEO_AVCLevel32:
      level = 32;
      break;
   case OMX_VIDEO_AVCLevel4:
      level = 40;
      break;
   case OMX_VIDEO_AVCLevel41:
      level = 41;
      break;
   case OMX_VIDEO_AVCLevel5:
      level = 50;
      break;
   case OMX_VIDEO_AVCLevel51:
      level = 51;
      break;
   case OMX_VIDEO_AVCLevel42:
   default:
      /* Unknown levels share the level 4.2 result. */
      level = 42;
      break;
   }

   return level;
}
/**
 * Hand the result of the oldest encode task queued on \p input over to
 * \p output.
 *
 * The first task on the input buffer's task list is moved to
 * priv->used_tasks.  If that task carries a bitstream resource, the resource
 * is transferred to the output buffer's private data, mapped through
 * priv->t_pipe, and the output header is filled in with the mapped pointer,
 * the size reported by the codec's get_feedback() hook, and the
 * end-of-frame flag.
 *
 * With ENABLE_ST_OMX_BELLAGIO, an input buffer without private data or
 * without pending tasks is simply marked empty; any used tasks are moved
 * back onto the input's task list when that list exists.
 * With ENABLE_ST_OMX_TIZONIA, the input is marked empty and the used tasks
 * are moved back after the output has been filled.
 *
 * \param priv    encoder component private data.
 * \param input   input buffer header whose tasks are consumed.
 * \param output  output buffer header that receives the bitstream.
 */
void vid_enc_BufferEncoded_common(vid_enc_PrivateType * priv, OMX_BUFFERHEADERTYPE* input, OMX_BUFFERHEADERTYPE* output)
{
   struct output_buf_private *outp = output->pOutputPortPrivate;
   struct input_buf_private *inp = input->pInputPortPrivate;
   struct encode_task *task;
   struct pipe_box box = {};
   unsigned size = 0;

#if ENABLE_ST_OMX_BELLAGIO
   if (!inp || list_is_empty(&inp->tasks)) {
      input->nFilledLen = 0; /* mark buffer as empty */
      /* Without private data there is no task list to move onto; calling
       * enc_MoveTasks() with &inp->tasks would dereference a NULL-based
       * pointer. */
      if (inp)
         enc_MoveTasks(&priv->used_tasks, &inp->tasks);
      return;
   }
#endif

   task = LIST_ENTRY(struct encode_task, inp->tasks.next, list);
   list_del(&task->list);
   list_addtail(&task->list, &priv->used_tasks);

   if (!task->bitstream)
      return;

   /* ------------- map result buffer ----------------- */

   /* Drop the mapping of whatever bitstream the output held before. */
   if (outp->transfer)
      pipe_transfer_unmap(priv->t_pipe, outp->transfer);

   /* Move the bitstream reference from the task to the output buffer. */
   pipe_resource_reference(&outp->bitstream, task->bitstream);
   pipe_resource_reference(&task->bitstream, NULL);

   box.width = outp->bitstream->width0;
   box.height = outp->bitstream->height0;
   box.depth = outp->bitstream->depth0;

   output->pBuffer = priv->t_pipe->transfer_map(priv->t_pipe, outp->bitstream, 0,
                                                PIPE_TRANSFER_READ_WRITE,
                                                &box, &outp->transfer);

   /* ------------- get size of result ----------------- */

   priv->codec->get_feedback(priv->codec, task->feedback, &size);

   output->nOffset = 0;
   output->nFilledLen = size; /* mark buffer as full */

   /* all output buffers contain exactly one frame */
   output->nFlags = OMX_BUFFERFLAG_ENDOFFRAME;

#if ENABLE_ST_OMX_TIZONIA
   input->nFilledLen = 0; /* mark buffer as empty */
   enc_MoveTasks(&priv->used_tasks, &inp->tasks);
#endif
}
/**
 * Obtain an encode task, recycling one from priv->free_tasks when possible.
 *
 * If the free list is non-empty its first entry is unlinked and returned.
 * Otherwise a zeroed task is allocated together with a progressive NV12
 * 4:2:0 video buffer sized from \p def (nFrameWidth x nFrameHeight), created
 * on priv->s_pipe.
 *
 * \param priv  encoder component private data.
 * \param def   port definition supplying the frame dimensions.
 * \return the task, or NULL if the task or its video buffer could not be
 *         allocated.
 */
struct encode_task *enc_NeedTask_common(vid_enc_PrivateType * priv, OMX_VIDEO_PORTDEFINITIONTYPE *def)
{
   struct pipe_video_buffer tmpl = {};
   struct encode_task *fresh;

   /* Fast path: reuse a previously released task. */
   if (!list_is_empty(&priv->free_tasks)) {
      struct encode_task *recycled =
         LIST_ENTRY(struct encode_task, priv->free_tasks.next, list);

      list_del(&recycled->list);
      return recycled;
   }

   /* Slow path: build a new task with its own video buffer. */
   fresh = CALLOC_STRUCT(encode_task);
   if (fresh == NULL)
      return NULL;

   tmpl.width = def->nFrameWidth;
   tmpl.height = def->nFrameHeight;
   tmpl.buffer_format = PIPE_FORMAT_NV12;
   tmpl.chroma_format = PIPE_VIDEO_CHROMA_FORMAT_420;
   tmpl.interlaced = false;

   fresh->buf = priv->s_pipe->create_video_buffer(priv->s_pipe, &tmpl);
   if (fresh->buf != NULL)
      return fresh;

   FREE(fresh);
   return NULL;
}
/**
 * Render the input video buffer into the current scaling buffer and hand the
 * scaling buffer back to the caller in place of the input.
 *
 * Each plane of \p *vbuf that has both a sampler view and a destination
 * surface is drawn with the compositor.  The source rectangle covers the
 * full frame from \p def for plane 0 and half of it in each direction for
 * the remaining planes.  On success \p *size is set from the configured
 * scale dimensions, \p *vbuf is replaced with the scaling buffer, and the
 * scaling-buffer index advances round-robin.
 *
 * The call leaves \p *vbuf and \p *size untouched (no scaling is done) when
 * no scaling buffer exists for the current index, or when the sampler views
 * or destination surfaces cannot be obtained.
 *
 * \param priv  encoder component private data.
 * \param def   port definition supplying the source frame dimensions.
 * \param vbuf  in: source buffer; out: scaled buffer on success.
 * \param size  out: size associated with the scaled buffer on success.
 */
void enc_ScaleInput_common(vid_enc_PrivateType * priv, OMX_VIDEO_PORTDEFINITIONTYPE *def,
                           struct pipe_video_buffer **vbuf, unsigned *size)
{
   struct pipe_video_buffer *src_buf = *vbuf;
   struct pipe_video_buffer *dst_buf;
   struct vl_compositor *compositor = &priv->compositor;
   struct vl_compositor_state *s = &priv->cstate;
   struct pipe_sampler_view **views;
   struct pipe_surface **dst_surface;
   unsigned i;

   dst_buf = priv->scale_buffer[priv->current_scale_buffer];
   if (!dst_buf)
      return;

   /* Both hooks hand back arrays that are indexed below; bail out instead
    * of dereferencing NULL if either one fails. */
   views = src_buf->get_sampler_view_planes(src_buf);
   if (!views)
      return;

   dst_surface = dst_buf->get_surfaces(dst_buf);
   if (!dst_surface)
      return;

   vl_compositor_clear_layers(s);

   for (i = 0; i < VL_MAX_SURFACES; ++i) {
      struct u_rect src_rect;

      if (!views[i] || !dst_surface[i])
         continue;

      src_rect.x0 = 0;
      src_rect.y0 = 0;
      src_rect.x1 = def->nFrameWidth;
      src_rect.y1 = def->nFrameHeight;
      /* Planes after the first are sampled at half resolution. */
      if (i > 0) {
         src_rect.x1 /= 2;
         src_rect.y1 /= 2;
      }

      vl_compositor_set_rgba_layer(s, compositor, 0, views[i], &src_rect, NULL, NULL);
      vl_compositor_render(s, compositor, dst_surface[i], NULL, false);
   }

   *size = priv->scale.xWidth * priv->scale.xHeight * 2;
   *vbuf = priv->scale_buffer[priv->current_scale_buffer++];
   priv->current_scale_buffer %= OMX_VID_ENC_NUM_SCALING_BUFFERS;
}
/**
 * Fill the rate-control and per-picture fields of \p picture from the
 * component state in \p priv.
 *
 * - The OMX control-rate mode selects the pipe rate-control method; any
 *   mode not handled explicitly disables rate control.
 * - The frame rate is taken from the upper 16 bits of priv->frame_rate and
 *   scaled by the default denominator.
 * - When rate control is enabled, the target bitrate is clamped to
 *   [OMX_VID_ENC_BITRATE_MIN, OMX_VID_ENC_BITRATE_MAX]; peak bitrate,
 *   VBV buffer size and per-picture bit budgets are derived from it.
 * - Quantiser values, frame number and reference indices are copied from
 *   \p priv, VUI is enabled when a non-zero frame rate is known, and the
 *   fixed presets are applied last.
 *
 * \param priv     encoder component private data.
 * \param picture  picture descriptor to fill in.
 */
void enc_ControlPicture_common(vid_enc_PrivateType * priv, struct pipe_h264_enc_picture_desc *picture)
{
   struct pipe_h264_enc_rate_control *rc = &picture->rate_ctrl;

   /* Translate the OMX control-rate mode of the port. */
   switch (priv->bitrate.eControlRate) {
   case OMX_Video_ControlRateVariable:
      rc->rate_ctrl_method = PIPE_H264_ENC_RATE_CONTROL_METHOD_VARIABLE;
      break;
   case OMX_Video_ControlRateConstant:
      rc->rate_ctrl_method = PIPE_H264_ENC_RATE_CONTROL_METHOD_CONSTANT;
      break;
   case OMX_Video_ControlRateVariableSkipFrames:
      rc->rate_ctrl_method = PIPE_H264_ENC_RATE_CONTROL_METHOD_VARIABLE_SKIP;
      break;
   case OMX_Video_ControlRateConstantSkipFrames:
      rc->rate_ctrl_method = PIPE_H264_ENC_RATE_CONTROL_METHOD_CONSTANT_SKIP;
      break;
   default:
      rc->rate_ctrl_method = PIPE_H264_ENC_RATE_CONTROL_METHOD_DISABLE;
      break;
   }

   rc->frame_rate_den = OMX_VID_ENC_CONTROL_FRAME_RATE_DEN_DEFAULT;
   rc->frame_rate_num = ((priv->frame_rate) >> 16) * rc->frame_rate_den;

   if (rc->rate_ctrl_method != PIPE_H264_ENC_RATE_CONTROL_METHOD_DISABLE) {
      /* Clamp the requested bitrate into the supported range. */
      if (priv->bitrate.nTargetBitrate < OMX_VID_ENC_BITRATE_MIN)
         rc->target_bitrate = OMX_VID_ENC_BITRATE_MIN;
      else if (priv->bitrate.nTargetBitrate >= OMX_VID_ENC_BITRATE_MAX)
         rc->target_bitrate = OMX_VID_ENC_BITRATE_MAX;
      else
         rc->target_bitrate = priv->bitrate.nTargetBitrate;

      rc->peak_bitrate = rc->target_bitrate;

      /* Below the median bitrate the VBV buffer is 2.75x the target,
       * capped at the median; otherwise it equals the target. */
      if (rc->target_bitrate >= OMX_VID_ENC_BITRATE_MEDIAN)
         rc->vbv_buffer_size = rc->target_bitrate;
      else
         rc->vbv_buffer_size = MIN2((rc->target_bitrate * 2.75), OMX_VID_ENC_BITRATE_MEDIAN);

      /* Bits per picture = bitrate * den / num, computed in 64 bits; with
       * an unknown frame rate the whole bitrate is used. */
      if (!rc->frame_rate_num) {
         rc->target_bits_picture = rc->target_bitrate;
      } else {
         unsigned long long bits = rc->target_bitrate;

         bits *= rc->frame_rate_den;
         rc->target_bits_picture = bits / rc->frame_rate_num;
      }

      rc->peak_bits_picture_integer = rc->target_bits_picture;
      rc->peak_bits_picture_fraction = 0;
   }

   /* Per-picture state copied straight from the component. */
   picture->frame_num = priv->frame_num;
   picture->ref_idx_l0 = priv->ref_idx_l0;
   picture->ref_idx_l1 = priv->ref_idx_l1;

   picture->quant_i_frames = priv->quant.nQpI;
   picture->quant_p_frames = priv->quant.nQpP;
   picture->quant_b_frames = priv->quant.nQpB;

   picture->enable_vui = (picture->rate_ctrl.frame_rate_num != 0);

   enc_GetPictureParamPreset(picture);
}
/**
 * Translate a TGSI text shader and create a compute state object from it.
 *
 * \param pipe    context used to create the compute state.
 * \param source  TGSI shader in text form.
 * \return the driver's compute state handle, or NULL if the text could not
 *         be translated (which also trips an assertion in debug builds).
 */
static void *create_compute_state(struct pipe_context *pipe,
                                  const char *source)
{
   struct tgsi_token tokens[1024];
   struct pipe_compute_state state = {0};

   if (tgsi_text_translate(source, tokens, ARRAY_SIZE(tokens))) {
      state.prog = tokens;
      state.ir_type = PIPE_SHADER_IR_TGSI;
      return pipe->create_compute_state(pipe, &state);
   }

   assert(false);
   return NULL;
}
/**
 * Create the two compute shaders used to copy an input frame into a video
 * buffer and store them in priv->copy_y_shader / priv->copy_uv_shader.
 *
 * Nothing is created when the screen does not report
 * PIPE_CAP_COMPUTE_GRID_INFO_LAST_BLOCK, because the copies are launched
 * with a partial last block.
 *
 * \param priv  encoder component private data.
 */
void enc_InitCompute_common(vid_enc_PrivateType *priv)
{
   /* Copies one R8 texel per thread from IMAGE[0] to IMAGE[1]. */
   static const char *y_copy_src =
      "COMP\n"
      "PROPERTY CS_FIXED_BLOCK_WIDTH 64\n"
      "PROPERTY CS_FIXED_BLOCK_HEIGHT 1\n"
      "PROPERTY CS_FIXED_BLOCK_DEPTH 1\n"
      "DCL SV[0], THREAD_ID\n"
      "DCL SV[1], BLOCK_ID\n"
      "DCL IMAGE[0], 2D, PIPE_FORMAT_R8_UINT\n"
      "DCL IMAGE[1], 2D, PIPE_FORMAT_R8_UINT, WR\n"
      "DCL TEMP[0..1]\n"
      "IMM[0] UINT32 {64, 0, 0, 0}\n"
      "UMAD TEMP[0].x, SV[1], IMM[0], SV[0]\n"
      "MOV TEMP[0].y, SV[1]\n"
      "LOAD TEMP[1].x, IMAGE[0], TEMP[0], 2D, PIPE_FORMAT_R8_UINT\n"
      "STORE IMAGE[1].x, TEMP[0], TEMP[1], 2D, PIPE_FORMAT_R8_UINT\n"
      "END\n";

   /* Reads two adjacent R8 texels (U, V) from IMAGE[0] and stores them as
    * one R8G8 texel in IMAGE[2]. */
   static const char *uv_copy_src =
      "COMP\n"
      "PROPERTY CS_FIXED_BLOCK_WIDTH 64\n"
      "PROPERTY CS_FIXED_BLOCK_HEIGHT 1\n"
      "PROPERTY CS_FIXED_BLOCK_DEPTH 1\n"
      "DCL SV[0], THREAD_ID\n"
      "DCL SV[1], BLOCK_ID\n"
      "DCL IMAGE[0], 2D, PIPE_FORMAT_R8_UINT\n"
      "DCL IMAGE[2], 2D, PIPE_FORMAT_R8G8_UINT, WR\n"
      "DCL CONST[0][0]\n" /* .x = offset of the UV portion in the y direction */
      "DCL TEMP[0..4]\n"
      "IMM[0] UINT32 {64, 0, 2, 1}\n"
      /* Destination R8G8 coordinates */
      "UMAD TEMP[0].x, SV[1], IMM[0], SV[0]\n"
      "MOV TEMP[0].y, SV[1]\n"
      /* Source R8 coordinates of U */
      "UMUL TEMP[1].x, TEMP[0], IMM[0].zzzz\n"
      "UADD TEMP[1].y, TEMP[0], CONST[0].xxxx\n"
      /* Source R8 coordinates of V */
      "UADD TEMP[2].x, TEMP[1], IMM[0].wwww\n"
      "MOV TEMP[2].y, TEMP[1]\n"
      "LOAD TEMP[3].x, IMAGE[0], TEMP[1], 2D, PIPE_FORMAT_R8_UINT\n"
      "LOAD TEMP[4].x, IMAGE[0], TEMP[2], 2D, PIPE_FORMAT_R8_UINT\n"
      "MOV TEMP[3].y, TEMP[4].xxxx\n"
      "STORE IMAGE[2], TEMP[0], TEMP[3], 2D, PIPE_FORMAT_R8G8_UINT\n"
      "END\n";

   struct pipe_context *ctx = priv->s_pipe;
   struct pipe_screen *scr = ctx->screen;

   /* We need the partial last block support. */
   if (scr->get_param(scr, PIPE_CAP_COMPUTE_GRID_INFO_LAST_BLOCK) == 0)
      return;

   priv->copy_y_shader = create_compute_state(ctx, y_copy_src);
   priv->copy_uv_shader = create_compute_state(ctx, uv_copy_src);
}
/**
 * Delete the Y and UV copy compute shaders, if they were created.
 *
 * Each shader handle in \p priv is passed to the context's
 * delete_compute_state() hook only when it is non-NULL.
 *
 * \param priv  encoder component private data.
 */
void enc_ReleaseCompute_common(vid_enc_PrivateType *priv)
{
   struct pipe_context *ctx = priv->s_pipe;

   if (priv->copy_y_shader != NULL)
      ctx->delete_compute_state(ctx, priv->copy_y_shader);

   if (priv->copy_uv_shader != NULL)
      ctx->delete_compute_state(ctx, priv->copy_uv_shader);
}
/**
 * Upload the frame held in OMX buffer \p buf into video buffer \p vbuf.
 *
 * Two cases are handled, depending on whether the input buffer's private
 * data carries a pipe resource:
 *
 * - No resource: the luma plane and the chroma plane are uploaded from
 *   buf->pBuffer with texture_subdata(), the chroma data starting
 *   nStride * nFrameHeight bytes into the buffer.
 * - Resource present: the resource is unmapped, copied on the GPU into the
 *   two resources of \p vbuf (with the compute shaders when both exist,
 *   otherwise with resource_copy_region() plus two blits), the context is
 *   flushed, and the resource is mapped again for writing, with
 *   buf->pBuffer updated to the new mapping.
 *
 * \param priv  encoder component private data.
 * \param def   port definition supplying frame width, height and stride.
 * \param buf   OMX input buffer header.
 * \param vbuf  destination video buffer.
 * \return OMX_ErrorInsufficientResources if the sampler views of \p vbuf
 *         cannot be obtained in the upload case, OMX_ErrorNone otherwise.
 */
OMX_ERRORTYPE enc_LoadImage_common(vid_enc_PrivateType * priv, OMX_VIDEO_PORTDEFINITIONTYPE *def,
                                   OMX_BUFFERHEADERTYPE *buf,
                                   struct pipe_video_buffer *vbuf)
{
   struct pipe_context *pipe = priv->s_pipe;
   struct pipe_box box = {};
   struct input_buf_private *inp = buf->pInputPortPrivate;

   if (!inp->resource) {
      struct pipe_sampler_view **views;
      void *ptr;

      views = vbuf->get_sampler_view_planes(vbuf);
      if (!views)
         return OMX_ErrorInsufficientResources;

      /* Luma plane: full frame size, starting at the top of the buffer. */
      ptr = buf->pBuffer;
      box.width = def->nFrameWidth;
      box.height = def->nFrameHeight;
      box.depth = 1;
      pipe->texture_subdata(pipe, views[0]->texture, 0,
                            PIPE_TRANSFER_WRITE, &box,
                            ptr, def->nStride, 0);

      /* Chroma plane: half size, located right after the luma rows
       * (box.height still holds the luma height here). */
      ptr = ((uint8_t*)buf->pBuffer) + (def->nStride * box.height);
      box.width = def->nFrameWidth / 2;
      box.height = def->nFrameHeight / 2;
      box.depth = 1;
      pipe->texture_subdata(pipe, views[1]->texture, 0,
                            PIPE_TRANSFER_WRITE, &box,
                            ptr, def->nStride, 0);
   } else {
      struct vl_video_buffer *dst_buf = (struct vl_video_buffer *)vbuf;

      pipe_transfer_unmap(pipe, inp->transfer);

      /* inp->resource uses PIPE_FORMAT_I8 and the layout looks like this:
       *
       * def->nFrameWidth = 4, def->nFrameHeight = 4:
       * |----|
       * |YYYY|
       * |YYYY|
       * |YYYY|
       * |YYYY|
       * |UVUV|
       * |UVUV|
       * |----|
       *
       * The copy has 2 steps:
       * - Copy Y to dst_buf->resources[0] as R8.
       * - Copy UV to dst_buf->resources[1] as R8G8.
       */
      if (priv->copy_y_shader && priv->copy_uv_shader) {
         /* Compute path */

         /* Set shader images for both copies. */
         struct pipe_image_view image[3] = {0};
         image[0].resource = inp->resource;
         image[0].shader_access = image[0].access = PIPE_IMAGE_ACCESS_READ;
         image[0].format = PIPE_FORMAT_R8_UINT;

         image[1].resource = dst_buf->resources[0];
         image[1].shader_access = image[1].access = PIPE_IMAGE_ACCESS_WRITE;
         image[1].format = PIPE_FORMAT_R8_UINT;

         /* The UV destination needs its own access flags; previously
          * image[1].access was assigned a second time here, leaving
          * image[2].access at zero. */
         image[2].resource = dst_buf->resources[1];
         image[2].shader_access = image[2].access = PIPE_IMAGE_ACCESS_WRITE;
         image[2].format = PIPE_FORMAT_R8G8_UINT;

         pipe->set_shader_images(pipe, PIPE_SHADER_COMPUTE, 0, 3, image);

         /* Set the constant buffer. */
         uint32_t constants[4] = {def->nFrameHeight};
         struct pipe_constant_buffer cb = {};

         cb.buffer_size = sizeof(constants);
         cb.user_buffer = constants;
         pipe->set_constant_buffer(pipe, PIPE_SHADER_COMPUTE, 0, &cb);

         /* Use the optimal block size for the linear image layout. */
         struct pipe_grid_info info = {};
         info.block[0] = 64;
         info.block[1] = 1;
         info.block[2] = 1;
         info.grid[2] = 1;

         /* Copy Y */
         pipe->bind_compute_state(pipe, priv->copy_y_shader);

         info.grid[0] = DIV_ROUND_UP(def->nFrameWidth, 64);
         info.grid[1] = def->nFrameHeight;
         info.last_block[0] = def->nFrameWidth % 64;
         pipe->launch_grid(pipe, &info);

         /* Copy UV */
         pipe->bind_compute_state(pipe, priv->copy_uv_shader);

         info.grid[0] = DIV_ROUND_UP(def->nFrameWidth / 2, 64);
         info.grid[1] = def->nFrameHeight / 2;
         info.last_block[0] = (def->nFrameWidth / 2) % 64;
         pipe->launch_grid(pipe, &info);

         /* Make the result visible to all clients. */
         pipe->memory_barrier(pipe, PIPE_BARRIER_ALL);

         /* Unbind. */
         pipe->set_shader_images(pipe, PIPE_SHADER_COMPUTE, 0, 3, NULL);
         pipe->set_constant_buffer(pipe, PIPE_SHADER_COMPUTE, 0, NULL);
         pipe->bind_compute_state(pipe, NULL);
      } else {
         /* Graphics path */
         struct pipe_blit_info blit;

         box.width = def->nFrameWidth;
         box.height = def->nFrameHeight;
         box.depth = 1;

         /* Copy Y */
         pipe->resource_copy_region(pipe,
                                    dst_buf->resources[0],
                                    0, 0, 0, 0, inp->resource, 0, &box);

         /* Copy U */
         memset(&blit, 0, sizeof(blit));
         blit.src.resource = inp->resource;
         blit.src.format = inp->resource->format;

         /* NOTE(review): x = -1 here and x = 0 for V presumably shift the
          * nearest-filtered 2:1 downscale so that it picks the U resp. V
          * byte of each pair - confirm against the blit sampling rules. */
         blit.src.box.x = -1;
         blit.src.box.y = def->nFrameHeight;
         blit.src.box.width = def->nFrameWidth;
         blit.src.box.height = def->nFrameHeight / 2 ;
         blit.src.box.depth = 1;

         blit.dst.resource = dst_buf->resources[1];
         blit.dst.format = blit.dst.resource->format;

         blit.dst.box.width = def->nFrameWidth / 2;
         blit.dst.box.height = def->nFrameHeight / 2;
         blit.dst.box.depth = 1;
         blit.filter = PIPE_TEX_FILTER_NEAREST;

         blit.mask = PIPE_MASK_R;
         pipe->blit(pipe, &blit);

         /* Copy V */
         blit.src.box.x = 0;
         blit.mask = PIPE_MASK_G;
         pipe->blit(pipe, &blit);
      }

      pipe->flush(pipe, NULL, 0);

      /* Map the whole input resource again so the client can refill it. */
      box.width = inp->resource->width0;
      box.height = inp->resource->height0;
      box.depth = inp->resource->depth0;
      buf->pBuffer = pipe->transfer_map(pipe, inp->resource, 0,
                                        PIPE_TRANSFER_WRITE, &box,
                                        &inp->transfer);
   }

   return OMX_ErrorNone;
}