blob: a399be55160ab31140d7beb8dec2486fba6e7d4e [file] [log] [blame]
/*************************************************************************/ /*!
@File
@Title RGX firmware interface structures
@Copyright Copyright (c) Imagination Technologies Ltd. All Rights Reserved
@Description RGX firmware interface structures shared by both host client
and host server
@License MIT
The contents of this file are subject to the MIT license as set out below.
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:
The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.
This License is also included in this distribution in the file called
"MIT-COPYING".
EXCEPT AS OTHERWISE STATED IN A NEGOTIATED AGREEMENT: (A) THE SOFTWARE IS
PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING
BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR
PURPOSE AND NONINFRINGEMENT; AND (B) IN NO EVENT SHALL THE AUTHORS OR
COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER
IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*/ /**************************************************************************/
#if !defined (__RGX_FWIF_SHARED_H__)
#define __RGX_FWIF_SHARED_H__
#if defined(__KERNEL__) && defined(LINUX) && !defined(__GENKSYMS__)
#define __pvrsrv_defined_struct_enum__
#include <services_kernel_client.h>
#endif
#include "img_types.h"
#include "rgx_common.h"
#include "devicemem_typedefs.h"
/*
* Firmware binary block unit in bytes.
* Raw data stored in FW binary will be aligned on this size.
*/
#define FW_BLOCK_SIZE 4096L
/* Offset for BVNC struct from the end of the FW binary */
#define FW_BVNC_BACKWARDS_OFFSET (FW_BLOCK_SIZE)
/*!
******************************************************************************
* Device state flags
*****************************************************************************/
#define RGXKMIF_DEVICE_STATE_ZERO_FREELIST (0x1 << 0) /*!< Zeroing the physical pages of reconstructed free lists */
/*
* #define RGXKMIF_DEVICE_STATE_FTRACE_EN (0x1 << 1)
* Removed this obsolete flag from DDK.
*/
#define RGXKMIF_DEVICE_STATE_DISABLE_DW_LOGGING_EN (0x1 << 2) /*!< Used to disable the Devices Watchdog logging */
#define RGXKMIF_DEVICE_STATE_DUST_REQUEST_INJECT_EN (0x1 << 3) /*!< Used for validation to inject dust requests every TA/3D kick */
#define RGXKMIF_DEVICE_STATE_HWPERF_HOST_EN (0x1 << 4) /*!< Used to enable host-side-only HWPerf stream */
/* Required memory alignment for 64-bit variables accessible by Meta
(the gcc meta aligns 64-bit vars to 64-bit; therefore, mem shared between
the host and meta that contains 64-bit vars has to maintain this aligment)*/
#define RGXFWIF_FWALLOC_ALIGN sizeof(IMG_UINT64)
typedef struct _RGXFWIF_DEV_VIRTADDR_
{
IMG_UINT32 ui32Addr;
} RGXFWIF_DEV_VIRTADDR;
typedef struct _RGXFWIF_DMA_ADDR_
{
IMG_DEV_VIRTADDR RGXFW_ALIGN psDevVirtAddr;
RGXFWIF_DEV_VIRTADDR pbyFWAddr;
} UNCACHED_ALIGN RGXFWIF_DMA_ADDR;
typedef IMG_UINT8 RGXFWIF_CCCB;
typedef RGXFWIF_DEV_VIRTADDR PRGXFWIF_CCCB;
typedef RGXFWIF_DEV_VIRTADDR PRGXFWIF_CCCB_CTL;
typedef RGXFWIF_DEV_VIRTADDR PRGXFWIF_RENDER_TARGET;
typedef RGXFWIF_DEV_VIRTADDR PRGXFWIF_HWRTDATA;
typedef RGXFWIF_DEV_VIRTADDR PRGXFWIF_FREELIST;
typedef RGXFWIF_DEV_VIRTADDR PRGXFWIF_RAY_FRAME_DATA;
typedef RGXFWIF_DEV_VIRTADDR PRGXFWIF_RPM_FREELIST;
typedef RGXFWIF_DEV_VIRTADDR PRGXFWIF_RTA_CTL;
typedef RGXFWIF_DEV_VIRTADDR PRGXFWIF_UFO_ADDR;
typedef RGXFWIF_DEV_VIRTADDR PRGXFWIF_CLEANUP_CTL;
typedef RGXFWIF_DEV_VIRTADDR PRGXFWIF_TIMESTAMP_ADDR;
/* FIXME PRGXFWIF_UFO_ADDR and RGXFWIF_UFO should move back into rgx_fwif_client.h */
typedef struct _RGXFWIF_UFO_
{
PRGXFWIF_UFO_ADDR puiAddrUFO;
IMG_UINT32 ui32Value;
} RGXFWIF_UFO;
/*!
Last reset reason for a context.
*/
typedef enum _RGXFWIF_CONTEXT_RESET_REASON_
{
RGXFWIF_CONTEXT_RESET_REASON_NONE = 0, /*!< No reset reason recorded */
RGXFWIF_CONTEXT_RESET_REASON_GUILTY_LOCKUP = 1, /*!< Caused a reset due to locking up */
RGXFWIF_CONTEXT_RESET_REASON_INNOCENT_LOCKUP = 2, /*!< Affected by another context locking up */
RGXFWIF_CONTEXT_RESET_REASON_GUILTY_OVERRUNING = 3, /*!< Overran the global deadline */
RGXFWIF_CONTEXT_RESET_REASON_INNOCENT_OVERRUNING = 4, /*!< Affected by another context overrunning */
RGXFWIF_CONTEXT_RESET_REASON_HARD_CONTEXT_SWITCH = 5, /*!< Forced reset to ensure scheduling requirements */
} RGXFWIF_CONTEXT_RESET_REASON;
/*!
HWRTData state the render is in
*/
typedef enum
{
RGXFWIF_RTDATA_STATE_NONE = 0,
RGXFWIF_RTDATA_STATE_KICKTA,
RGXFWIF_RTDATA_STATE_KICKTAFIRST,
RGXFWIF_RTDATA_STATE_TAFINISHED,
RGXFWIF_RTDATA_STATE_KICK3D,
RGXFWIF_RTDATA_STATE_3DFINISHED,
RGXFWIF_RTDATA_STATE_TAOUTOFMEM,
RGXFWIF_RTDATA_STATE_PARTIALRENDERFINISHED,
RGXFWIF_RTDATA_STATE_HWR /*!< In case of HWR, we can't set the RTDATA state to NONE,
as this will cause any TA to become a first TA.
To ensure all related TA's are skipped, we use the HWR state */
} RGXFWIF_RTDATA_STATE;
typedef struct _RGXFWIF_CLEANUP_CTL_
{
IMG_UINT32 ui32SubmittedCommands; /*!< Number of commands received by the FW */
IMG_UINT32 ui32ExecutedCommands; /*!< Number of commands executed by the FW */
} UNCACHED_ALIGN RGXFWIF_CLEANUP_CTL;
/*!
* Client Circular Command Buffer (CCCB) control structure.
* This is shared between the Server and the Firmware and holds byte offsets
* into the CCCB as well as the wrapping mask to aid wrap around. A given
* snapshot of this queue with Cmd 1 running on the GPU might be:
*
* Roff Doff Woff
* [..........|-1----------|=2===|=3===|=4===|~5~~~~|~6~~~~|~7~~~~|..........]
* < runnable commands >< !ready to run >
*
* Cmd 1 : Currently executing on the GPU data master.
* Cmd 2,3,4: Fence dependencies met, commands runnable.
* Cmd 5... : Fence dependency not met yet.
*/
typedef struct _RGXFWIF_CCCB_CTL_
{
IMG_UINT32 ui32WriteOffset; /*!< Host write offset into CCB. This
* must be aligned to 16 bytes. */
IMG_UINT32 ui32ReadOffset; /*!< Firmware read offset into CCB.
Points to the command that is
* runnable on GPU, if R!=W */
IMG_UINT32 ui32DepOffset; /*!< Firmware fence dependency offset.
* Points to commands not ready, i.e.
* fence dependencies are not met. */
IMG_UINT32 ui32WrapMask; /*!< Offset wrapping mask, total capacity
* in bytes of the CCB-1 */
} UNCACHED_ALIGN RGXFWIF_CCCB_CTL;
typedef enum
{
RGXFW_LOCAL_FREELIST = 0,
RGXFW_GLOBAL_FREELIST = 1,
RGXFW_FREELIST_TYPE_LAST = RGXFW_GLOBAL_FREELIST,
} RGXFW_FREELIST_TYPE;
#define RGXFW_MAX_FREELISTS (RGXFW_FREELIST_TYPE_LAST + 1)
typedef struct _RGXFWIF_RTA_CTL_
{
IMG_UINT32 ui32RenderTargetIndex; //Render number
IMG_UINT32 ui32CurrentRenderTarget; //index in RTA
IMG_UINT32 ui32ActiveRenderTargets; //total active RTs
IMG_UINT32 ui32CumulActiveRenderTargets; //total active RTs from the first TA kick, for OOM
RGXFWIF_DEV_VIRTADDR sValidRenderTargets; //Array of valid RT indices
RGXFWIF_DEV_VIRTADDR sNumRenders; //Array of number of occurred partial renders per render target
IMG_UINT16 ui16MaxRTs; //Number of render targets in the array
} UNCACHED_ALIGN RGXFWIF_RTA_CTL;
typedef struct _RGXFWIF_FREELIST_
{
IMG_DEV_VIRTADDR RGXFW_ALIGN psFreeListDevVAddr;
IMG_UINT64 RGXFW_ALIGN ui64CurrentDevVAddr;
IMG_UINT32 ui32CurrentStackTop;
IMG_UINT32 ui32MaxPages;
IMG_UINT32 ui32GrowPages;
IMG_UINT32 ui32CurrentPages; /* HW pages */
IMG_UINT32 ui32AllocatedPageCount;
IMG_UINT32 ui32AllocatedMMUPageCount;
IMG_UINT32 ui32HWRCounter;
IMG_UINT32 ui32FreeListID;
IMG_BOOL bGrowPending;
IMG_UINT32 ui32ReadyPages; /* Pages that should be used only when OOM is reached */
} UNCACHED_ALIGN RGXFWIF_FREELIST;
typedef enum
{
RGXFW_RPM_SHF_FREELIST = 0,
RGXFW_RPM_SHG_FREELIST = 1,
} RGXFW_RPM_FREELIST_TYPE;
#define RGXFW_MAX_RPM_FREELISTS (2)
typedef struct _RGXFWIF_RPM_FREELIST_
{
IMG_DEV_VIRTADDR RGXFW_ALIGN sFreeListDevVAddr; /*!< device base address */
//IMG_DEV_VIRTADDR RGXFW_ALIGN sRPMPageListDevVAddr; /*!< device base address for RPM pages in-use */
IMG_UINT32 sSyncAddr; /*!< Free list sync object for OOM event */
IMG_UINT32 ui32MaxPages; /*!< maximum size */
IMG_UINT32 ui32GrowPages; /*!< grow size = maximum pages which may be added later */
IMG_UINT32 ui32CurrentPages; /*!< number of pages */
IMG_UINT32 ui32ReadOffset; /*!< head: where to read alloc'd pages */
IMG_UINT32 ui32WriteOffset; /*!< tail: where to write de-alloc'd pages */
IMG_BOOL bReadToggle; /*!< toggle bit for circular buffer */
IMG_BOOL bWriteToggle;
IMG_UINT32 ui32AllocatedPageCount; /*!< TODO: not sure yet if this is useful */
IMG_UINT32 ui32HWRCounter;
IMG_UINT32 ui32FreeListID; /*!< unique ID per device, e.g. rolling counter */
IMG_BOOL bGrowPending; /*!< FW is waiting for host to grow the freelist */
} UNCACHED_ALIGN RGXFWIF_RPM_FREELIST;
typedef struct _RGXFWIF_RAY_FRAME_DATA_
{
/* state manager for shared state between vertex and ray processing */
/* TODO: not sure if this will be useful, link it here for now */
IMG_UINT32 sRPMFreeLists[RGXFW_MAX_RPM_FREELISTS];
IMG_BOOL bAbortOccurred;
/* cleanup state.
* Both the SHG and RTU must complete or discard any outstanding work
* which references this frame data.
*/
RGXFWIF_CLEANUP_CTL sCleanupStateSHG;
RGXFWIF_CLEANUP_CTL sCleanupStateRTU;
IMG_UINT32 ui32CleanupStatus;
#define HWFRAMEDATA_SHG_CLEAN (1 << 0)
#define HWFRAMEDATA_RTU_CLEAN (1 << 1)
} UNCACHED_ALIGN RGXFWIF_RAY_FRAME_DATA;
typedef struct _RGXFWIF_RENDER_TARGET_
{
IMG_DEV_VIRTADDR RGXFW_ALIGN psVHeapTableDevVAddr; /*!< VHeap Data Store */
IMG_BOOL bTACachesNeedZeroing; /*!< Whether RTC and TPC caches (on mem) need to be zeroed on next first TA kick */
} UNCACHED_ALIGN RGXFWIF_RENDER_TARGET;
typedef struct _RGXFWIF_HWRTDATA_
{
RGXFWIF_RTDATA_STATE eState;
IMG_UINT32 ui32NumPartialRenders; /*!< Number of partial renders. Used to setup ZLS bits correctly */
IMG_BOOL bLastWasPartial; /*!< Whether the last render was a partial render */
IMG_DEV_VIRTADDR RGXFW_ALIGN psPMMListDevVAddr; /*!< MList Data Store */
IMG_UINT64 RGXFW_ALIGN ui64VCECatBase[4];
IMG_UINT64 RGXFW_ALIGN ui64VCELastCatBase[4];
IMG_UINT64 RGXFW_ALIGN ui64TECatBase[4];
IMG_UINT64 RGXFW_ALIGN ui64TELastCatBase[4];
IMG_UINT64 RGXFW_ALIGN ui64AlistCatBase;
IMG_UINT64 RGXFW_ALIGN ui64AlistLastCatBase;
IMG_UINT64 RGXFW_ALIGN ui64PMAListStackPointer;
IMG_UINT32 ui32PMMListStackPointer;
PRGXFWIF_FREELIST RGXFW_ALIGN apsFreeLists[RGXFW_MAX_FREELISTS];
IMG_UINT32 aui32FreeListHWRSnapshot[RGXFW_MAX_FREELISTS];
PRGXFWIF_RENDER_TARGET psParentRenderTarget;
RGXFWIF_CLEANUP_CTL sTACleanupState;
RGXFWIF_CLEANUP_CTL s3DCleanupState;
IMG_UINT32 ui32CleanupStatus;
#define HWRTDATA_TA_CLEAN (1 << 0)
#define HWRTDATA_3D_CLEAN (1 << 1)
PRGXFWIF_RTA_CTL psRTACtl;
IMG_UINT32 bHasLastTA;
IMG_BOOL bPartialRendered;
IMG_UINT32 ui32PPPScreen;
IMG_UINT32 ui32PPPGridOffset;
IMG_UINT64 RGXFW_ALIGN ui64PPPMultiSampleCtl;
IMG_UINT32 ui32TPCStride;
IMG_DEV_VIRTADDR RGXFW_ALIGN sTailPtrsDevVAddr;
IMG_UINT32 ui32TPCSize;
IMG_UINT32 ui32TEScreen;
IMG_UINT32 ui32MTileStride;
IMG_UINT32 ui32TEAA;
IMG_UINT32 ui32TEMTILE1;
IMG_UINT32 ui32TEMTILE2;
IMG_UINT32 ui32ISPMergeLowerX;
IMG_UINT32 ui32ISPMergeLowerY;
IMG_UINT32 ui32ISPMergeUpperX;
IMG_UINT32 ui32ISPMergeUpperY;
IMG_UINT32 ui32ISPMergeScaleX;
IMG_UINT32 ui32ISPMergeScaleY;
IMG_BOOL bDisableTileReordering;
#if defined(RGX_FIRMWARE)
struct _RGXFWIF_FWCOMMONCONTEXT_* psOwnerTA;
#else
RGXFWIF_DEV_VIRTADDR pui32OwnerTANotUsedByHost;
#endif
#if defined(FIX_HW_BRN_65101)
IMG_BOOL bNeedBRN65101Blit;
#endif
#if defined(FIX_HW_BRN_67182)
IMG_BOOL bNeedBRN67182SecondRender;
#endif
} UNCACHED_ALIGN RGXFWIF_HWRTDATA;
typedef enum
{
RGXFWIF_PRBUFFER_START = 0,
RGXFWIF_PRBUFFER_ZBUFFER = 0,
RGXFWIF_PRBUFFER_SBUFFER,
RGXFWIF_PRBUFFER_MSAABUFFER,
RGXFWIF_PRBUFFER_MAXSUPPORTED,
}RGXFWIF_PRBUFFER_TYPE;
typedef enum
{
RGXFWIF_PRBUFFER_UNBACKED = 0,
RGXFWIF_PRBUFFER_BACKED,
RGXFWIF_PRBUFFER_BACKING_PENDING,
RGXFWIF_PRBUFFER_UNBACKING_PENDING,
}RGXFWIF_PRBUFFER_STATE;
typedef struct _RGXFWIF_PRBUFFER_
{
IMG_UINT32 ui32BufferID; /*!< Buffer ID*/
IMG_BOOL bOnDemand; /*!< Needs On-demand Z/S/MSAA Buffer allocation */
RGXFWIF_PRBUFFER_STATE eState; /*!< Z/S/MSAA -Buffer state */
RGXFWIF_CLEANUP_CTL sCleanupState; /*!< Cleanup state */
} UNCACHED_ALIGN RGXFWIF_PRBUFFER;
/* Number of BIF tiling configurations / heaps */
#define RGXFWIF_NUM_BIF_TILING_CONFIGS 4
/*!
*****************************************************************************
* RGX Compatibility checks
*****************************************************************************/
/* WARNING: RGXFWIF_COMPCHECKS_BVNC_V_LEN_MAX can be increased only and
always equal to (N * sizeof(IMG_UINT32) - 1) */
#define RGXFWIF_COMPCHECKS_BVNC_V_LEN_MAX 7
/* WARNING: Whenever the layout of RGXFWIF_COMPCHECKS_BVNC is a subject of change,
following define should be increased by 1 to indicate to compatibility logic,
that layout has changed */
#define RGXFWIF_COMPCHECKS_LAYOUT_VERSION 2
typedef struct _RGXFWIF_COMPCHECKS_BVNC_
{
IMG_UINT32 ui32LayoutVersion; /* WARNING: This field must be defined as first one in this structure */
IMG_UINT32 ui32VLenMax;
IMG_UINT64 RGXFW_ALIGN ui64BNC;
IMG_CHAR aszV[RGXFWIF_COMPCHECKS_BVNC_V_LEN_MAX + 1];
} UNCACHED_ALIGN RGXFWIF_COMPCHECKS_BVNC;
#define RGXFWIF_COMPCHECKS_BVNC_DECLARE_AND_INIT(name) \
RGXFWIF_COMPCHECKS_BVNC name = { \
RGXFWIF_COMPCHECKS_LAYOUT_VERSION, \
RGXFWIF_COMPCHECKS_BVNC_V_LEN_MAX, \
0, \
{ 0 }, \
}
#define RGXFWIF_COMPCHECKS_BVNC_INIT(name) \
do { \
(name).ui32LayoutVersion = RGXFWIF_COMPCHECKS_LAYOUT_VERSION; \
(name).ui32VLenMax = RGXFWIF_COMPCHECKS_BVNC_V_LEN_MAX; \
(name).ui64BNC = 0; \
(name).aszV[0] = 0; \
} while (0)
typedef struct _RGXFWIF_COMPCHECKS_
{
RGXFWIF_COMPCHECKS_BVNC sHWBVNC; /*!< hardware BNC (from the RGX registers) */
RGXFWIF_COMPCHECKS_BVNC sFWBVNC; /*!< firmware BNC */
IMG_UINT32 ui32FWProcessorVersion; /*!< identifier of the MIPS/META version */
IMG_UINT32 ui32DDKVersion; /*!< software DDK version */
IMG_UINT32 ui32DDKBuild; /*!< software DDK build no. */
IMG_UINT32 ui32BuildOptions; /*!< build options bit-field */
IMG_BOOL bUpdated; /*!< Information is valid */
} UNCACHED_ALIGN RGXFWIF_COMPCHECKS;
#define GET_CCB_SPACE(WOff, ROff, CCBSize) \
((((ROff) - (WOff)) + ((CCBSize) - 1)) & ((CCBSize) - 1))
#define UPDATE_CCB_OFFSET(Off, PacketSize, CCBSize) \
(Off) = (((Off) + (PacketSize)) & ((CCBSize) - 1))
#define RESERVED_CCB_SPACE (sizeof(IMG_UINT32))
/* Defines relating to the per-context CCBs */
/* This size is to be used when a client CCB is found to consume very negligible space
* (e.g. a few hundred bytes to few KBs - less than a page). In such a case, instead of
* allocating CCB of size of only a few KBs, we allocate at-least this much to be future
* risk-free. */
#define MIN_SAFE_CCB_SIZE_LOG2 13 /* 8K (2 Pages) */
#define RGX_TQ3D_CCB_SIZE_LOG2 PVRSRV_RGX_LOG2_CLIENT_CCB_SIZE_TQ3D
static_assert(RGX_TQ3D_CCB_SIZE_LOG2 >= MIN_SAFE_CCB_SIZE_LOG2, "TQ3D CCB size is too small");
#define RGX_TQ2D_CCB_SIZE_LOG2 PVRSRV_RGX_LOG2_CLIENT_CCB_SIZE_TQ2D
static_assert(RGX_TQ2D_CCB_SIZE_LOG2 >= MIN_SAFE_CCB_SIZE_LOG2, "TQ2D CCB size is too small");
#define RGX_CDM_CCB_SIZE_LOG2 PVRSRV_RGX_LOG2_CLIENT_CCB_SIZE_CDM
static_assert(RGX_CDM_CCB_SIZE_LOG2 >= MIN_SAFE_CCB_SIZE_LOG2, "CDM CCB size is too small");
#define RGX_TA_CCB_SIZE_LOG2 PVRSRV_RGX_LOG2_CLIENT_CCB_SIZE_TA
static_assert(RGX_TA_CCB_SIZE_LOG2 >= MIN_SAFE_CCB_SIZE_LOG2, "TA CCB size is too small");
#define RGX_3D_CCB_SIZE_LOG2 PVRSRV_RGX_LOG2_CLIENT_CCB_SIZE_3D
static_assert(RGX_3D_CCB_SIZE_LOG2 >= MIN_SAFE_CCB_SIZE_LOG2, "3D CCB size is too small");
#define RGX_KICKSYNC_CCB_SIZE_LOG2 PVRSRV_RGX_LOG2_CLIENT_CCB_SIZE_KICKSYNC
static_assert(RGX_KICKSYNC_CCB_SIZE_LOG2 >= MIN_SAFE_CCB_SIZE_LOG2, "KickSync CCB size is too small");
#define RGX_RTU_CCB_SIZE_LOG2 PVRSRV_RGX_LOG2_CLIENT_CCB_SIZE_RTU
static_assert(RGX_RTU_CCB_SIZE_LOG2 >= MIN_SAFE_CCB_SIZE_LOG2, "RTU CCB size is too small");
/*!
******************************************************************************
* Defines for CMD_TYPE corruption detection and forward compatibility check
*****************************************************************************/
/* CMD_TYPE 32bit contains:
* 31:16 Reserved for magic value to detect corruption (16 bits)
* 15 Reserved for RGX_CCB_TYPE_TASK (1 bit)
* 14:0 Bits available for CMD_TYPEs (15 bits) */
/* Magic value to detect corruption */
#define RGX_CMD_MAGIC_DWORD (0x2ABCU)
#define RGX_CMD_MAGIC_DWORD_MASK (0xFFFF0000U)
#define RGX_CMD_MAGIC_DWORD_SHIFT (16U)
#define RGX_CMD_MAGIC_DWORD_SHIFTED (RGX_CMD_MAGIC_DWORD << RGX_CMD_MAGIC_DWORD_SHIFT)
/* Maximum number of CMD_TYPEs supported = 32767 (i.e. 15 bits length) */
#define RGX_CMD_TYPE_LENGTH (15U)
#define RGX_CMD_TYPE_MASK (0x00007FFFU)
#define RGX_CMD_TYPE_SHIFT (0U)
/*!
******************************************************************************
* Client CCB commands for RGX
*****************************************************************************/
#define RGX_CCB_TYPE_TASK (1U << 15)
#define RGX_CCB_FWALLOC_ALIGN(size) (((size) + (RGXFWIF_FWALLOC_ALIGN-1)) & ~(RGXFWIF_FWALLOC_ALIGN - 1))
typedef enum _RGXFWIF_CCB_CMD_TYPE_
{
RGXFWIF_CCB_CMD_TYPE_TA = 201 | RGX_CMD_MAGIC_DWORD_SHIFTED | RGX_CCB_TYPE_TASK,
RGXFWIF_CCB_CMD_TYPE_3D = 202 | RGX_CMD_MAGIC_DWORD_SHIFTED | RGX_CCB_TYPE_TASK,
RGXFWIF_CCB_CMD_TYPE_CDM = 203 | RGX_CMD_MAGIC_DWORD_SHIFTED | RGX_CCB_TYPE_TASK,
RGXFWIF_CCB_CMD_TYPE_TQ_3D = 204 | RGX_CMD_MAGIC_DWORD_SHIFTED | RGX_CCB_TYPE_TASK,
RGXFWIF_CCB_CMD_TYPE_TQ_2D = 205 | RGX_CMD_MAGIC_DWORD_SHIFTED | RGX_CCB_TYPE_TASK,
RGXFWIF_CCB_CMD_TYPE_3D_PR = 206 | RGX_CMD_MAGIC_DWORD_SHIFTED | RGX_CCB_TYPE_TASK,
RGXFWIF_CCB_CMD_TYPE_NULL = 207 | RGX_CMD_MAGIC_DWORD_SHIFTED | RGX_CCB_TYPE_TASK,
RGXFWIF_CCB_CMD_TYPE_SHG = 208 | RGX_CMD_MAGIC_DWORD_SHIFTED | RGX_CCB_TYPE_TASK,
RGXFWIF_CCB_CMD_TYPE_RTU = 209 | RGX_CMD_MAGIC_DWORD_SHIFTED | RGX_CCB_TYPE_TASK,
RGXFWIF_CCB_CMD_TYPE_RTU_FC = 210 | RGX_CMD_MAGIC_DWORD_SHIFTED | RGX_CCB_TYPE_TASK,
RGXFWIF_CCB_CMD_TYPE_PRE_TIMESTAMP = 211 | RGX_CMD_MAGIC_DWORD_SHIFTED | RGX_CCB_TYPE_TASK,
RGXFWIF_CCB_CMD_TYPE_TQ_TDM = 212 | RGX_CMD_MAGIC_DWORD_SHIFTED | RGX_CCB_TYPE_TASK,
/* Leave a gap between CCB specific commands and generic commands */
RGXFWIF_CCB_CMD_TYPE_FENCE = 213 | RGX_CMD_MAGIC_DWORD_SHIFTED,
RGXFWIF_CCB_CMD_TYPE_UPDATE = 214 | RGX_CMD_MAGIC_DWORD_SHIFTED,
RGXFWIF_CCB_CMD_TYPE_RMW_UPDATE = 215 | RGX_CMD_MAGIC_DWORD_SHIFTED,
RGXFWIF_CCB_CMD_TYPE_FENCE_PR = 216 | RGX_CMD_MAGIC_DWORD_SHIFTED,
RGXFWIF_CCB_CMD_TYPE_PRIORITY = 217 | RGX_CMD_MAGIC_DWORD_SHIFTED,
/* Pre and Post timestamp commands are supposed to sandwich the DM cmd. The
padding code with the CCB wrap upsets the FW if we don't have the task type
bit cleared for POST_TIMESTAMPs. That's why we have 2 different cmd types.
*/
RGXFWIF_CCB_CMD_TYPE_POST_TIMESTAMP = 218 | RGX_CMD_MAGIC_DWORD_SHIFTED,
RGXFWIF_CCB_CMD_TYPE_UNFENCED_UPDATE = 219 | RGX_CMD_MAGIC_DWORD_SHIFTED,
RGXFWIF_CCB_CMD_TYPE_UNFENCED_RMW_UPDATE = 220 | RGX_CMD_MAGIC_DWORD_SHIFTED,
RGXFWIF_CCB_CMD_TYPE_PADDING = 221 | RGX_CMD_MAGIC_DWORD_SHIFTED,
} RGXFWIF_CCB_CMD_TYPE;
typedef struct _RGXFWIF_WORKEST_KICK_DATA_
{
/* Index for the KM Workload estimation return data array */
IMG_UINT64 RGXFW_ALIGN ui64ReturnDataIndex;
/* Deadline for the workload */
IMG_UINT64 RGXFW_ALIGN ui64Deadline;
/* Predicted time taken to do the work in cycles */
IMG_UINT64 RGXFW_ALIGN ui64CyclesPrediction;
} RGXFWIF_WORKEST_KICK_DATA;
typedef struct _RGXFWIF_CCB_CMD_HEADER_
{
RGXFWIF_CCB_CMD_TYPE eCmdType;
IMG_UINT32 ui32CmdSize;
IMG_UINT32 ui32ExtJobRef; /*!< external job reference - provided by client and used in debug for tracking submitted work */
IMG_UINT32 ui32IntJobRef; /*!< internal job reference - generated by services and used in debug for tracking submitted work */
RGXFWIF_WORKEST_KICK_DATA sWorkEstKickData; /*!< Workload Estimation - Workload Estimation Data */
IMG_DEV_VIRTADDR sRobustnessResetReason; /*!< Address to write reset reason to */
IMG_UINT32 ui32SubmissionOrdinal; /*!< 'Timestamp' indicating order of command submission */
} RGXFWIF_CCB_CMD_HEADER;
typedef enum _RGXFWIF_REG_CFG_TYPE_
{
RGXFWIF_REG_CFG_TYPE_PWR_ON=0, /* Sidekick power event */
RGXFWIF_REG_CFG_TYPE_DUST_CHANGE, /* Rascal / dust power event */
RGXFWIF_REG_CFG_TYPE_TA, /* TA kick */
RGXFWIF_REG_CFG_TYPE_3D, /* 3D kick */
RGXFWIF_REG_CFG_TYPE_CDM, /* Compute kick */
RGXFWIF_REG_CFG_TYPE_TLA, /* TLA kick */
RGXFWIF_REG_CFG_TYPE_TDM, /* TDM kick */
RGXFWIF_REG_CFG_TYPE_ALL /* Applies to all types. Keep as last element */
} RGXFWIF_REG_CFG_TYPE;
typedef struct _RGXFWIF_REG_CFG_REC_
{
IMG_UINT64 ui64Addr;
IMG_UINT64 ui64Mask;
IMG_UINT64 ui64Value;
} RGXFWIF_REG_CFG_REC;
typedef struct _RGXFWIF_TIME_CORR_
{
IMG_UINT64 RGXFW_ALIGN ui64OSTimeStamp;
IMG_UINT64 RGXFW_ALIGN ui64OSMonoTimeStamp;
IMG_UINT64 RGXFW_ALIGN ui64CRTimeStamp;
/* Utility variable used to convert CR timer deltas to OS timer deltas (nS),
* where the deltas are relative to the timestamps above:
* deltaOS = (deltaCR * K) >> decimal_shift, see full explanation below */
IMG_UINT64 RGXFW_ALIGN ui64CRDeltaToOSDeltaKNs;
IMG_UINT32 ui32CoreClockSpeed;
} UNCACHED_ALIGN RGXFWIF_TIME_CORR;
/* These macros are used to help converting FW timestamps to the Host time domain.
* On the FW the RGX_CR_TIMER counter is used to keep track of the time;
* it increments by 1 every 256 GPU clock ticks, so the general formula
* to perform the conversion is:
*
* [ GPU clock speed in Hz, if (scale == 10^9) then deltaOS is in nS,
* otherwise if (scale == 10^6) then deltaOS is in uS ]
*
* deltaCR * 256 256 * scale
* deltaOS = --------------- * scale = deltaCR * K [ K = --------------- ]
* GPUclockspeed GPUclockspeed
*
* The actual K is multiplied by 2^20 (and deltaCR * K is divided by 2^20)
* to get some better accuracy and to avoid returning 0 in the integer
* division 256000000/GPUfreq if GPUfreq is greater than 256MHz.
* This is the same as keeping K as a decimal number.
*
* The maximum deltaOS is slightly more than 5hrs for all GPU frequencies
* (deltaCR * K is more or less a constant), and it's relative to
* the base OS timestamp sampled as a part of the timer correlation data.
* This base is refreshed on GPU power-on, DVFS transition and
* periodic frequency calibration (executed every few seconds if the FW is
* doing some work), so as long as the GPU is doing something and one of these
* events is triggered then deltaCR * K will not overflow and deltaOS will be
* correct.
*/
#define RGXFWIF_CRDELTA_TO_OSDELTA_ACCURACY_SHIFT (20)
/*
* Calibrated GPU frequencies are rounded to the nearest multiple of 1 KHz
* before use, to reduce the noise introduced by calculations done with
* imperfect operands (correlated timers not sampled at exactly the same time,
* GPU CR timer incrementing only once every 256 GPU cycles).
* This also helps reducing the variation between consecutive calculations.
*/
#define RGXFWIF_CONVERT_TO_KHZ(freq) (((freq) + 500) / 1000)
#define RGXFWIF_ROUND_TO_KHZ(freq) ((((freq) + 500) / 1000) * 1000)
#define RGXFWIF_GET_CRDELTA_TO_OSDELTA_K_NS(clockfreq, remainder) \
OSDivide64r64((256000000ULL << RGXFWIF_CRDELTA_TO_OSDELTA_ACCURACY_SHIFT), \
RGXFWIF_CONVERT_TO_KHZ(clockfreq), \
&(remainder))
#define RGXFWIF_GET_DELTA_OSTIME_NS(deltaCR, K) \
( ((deltaCR) * (K)) >> RGXFWIF_CRDELTA_TO_OSDELTA_ACCURACY_SHIFT)
#define RGXFWIF_GET_DELTA_OSTIME_US(deltacr, clockfreq, remainder) \
OSDivide64r64((deltacr) * 256000, \
RGXFWIF_CONVERT_TO_KHZ(clockfreq), \
&(remainder))
/* Use this macro to get a more realistic GPU core clock speed than
* the one given by the upper layers (used when doing GPU frequency
* calibration)
*/
#define RGXFWIF_GET_GPU_CLOCK_FREQUENCY_HZ(deltacr_us, deltaos_us, remainder) \
OSDivide64((deltacr_us) * 256000000, (deltaos_us), &(remainder))
/*
The maximum configurable size via RGX_FW_HEAP_SHIFT is
32MiB (1<<25) and the minimum is 4MiB (1<<22); the
default firmware heap size is set to maximum 32MiB.
*/
#if (RGX_FW_HEAP_SHIFT < 22 || RGX_FW_HEAP_SHIFT > 25)
#error "RGX_FW_HEAP_SHIFT is outside valid range [22, 25]"
#endif
#endif /* __RGX_FWIF_SHARED_H__ */
/******************************************************************************
End of file (rgx_fwif_shared.h)
******************************************************************************/