/* * Copyright (c) 2011 Intel Corporation. All Rights Reserved. * Copyright (c) Imagination Technologies Limited, UK * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the * "Software"), to deal in the Software without restriction, including * without limitation the rights to use, copy, modify, merge, publish, * distribute, sub license, and/or sell copies of the Software, and to * permit persons to whom the Software is furnished to do so, subject to * the following conditions: * * The above copyright notice and this permission notice (including the * next paragraph) shall be included in all copies or substantial portions * of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. * IN NO EVENT SHALL PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. * * Authors: * Edward Lin <edward.lin@intel.com> * */ #include <unistd.h> #include <stdio.h> #include <memory.h> #include "psb_drv_video.h" #include "psb_drv_debug.h" #include "tng_hostdefs.h" #include "tng_hostcode.h" #include "tng_hostair.h" /*********************************************************************************** * Function Name : functions of pi8AIR_Table table ************************************************************************************/ VAStatus tng_air_buf_create(context_ENC_p ctx) { IMG_UINT32 ui32MbNum = (ctx->ui16PictureHeight * ctx->ui16Width) >> 8; ctx->sAirInfo.pi8AIR_Table = (IMG_INT8 *)malloc(ui32MbNum); drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: ui32MbNum = %d\n", __FUNCTION__, ui32MbNum); if (!ctx->sAirInfo.pi8AIR_Table) { drv_debug_msg(VIDEO_DEBUG_ERROR, "\nERROR: Error allocating Adaptive Intra Refresh table of Application context (APP_SetVideoParams)"); return VA_STATUS_ERROR_ALLOCATION_FAILED; } memset(ctx->sAirInfo.pi8AIR_Table, 0, ui32MbNum); return VA_STATUS_SUCCESS; } static void tng_air_buf_clear(context_ENC_p ctx) { #if 0 IMG_UINT32 ui32MbNum = (ctx->ui16PictureHeight * ctx->ui16Width) >> 8; drv_debug_msg(VIDEO_DEBUG_ERROR,"%s: ui32MbNum = %d, ctx->sAirInfo.pi8AIR_Table = 0x%08x\n", __FUNCTION__, ui32MbNum, ctx->sAirInfo.pi8AIR_Table); memset(ctx->sAirInfo.pi8AIR_Table, 0, ui32MbNum); drv_debug_msg(VIDEO_DEBUG_ERROR,"%s: ui32MbNum = %d, ctx->sAirInfo.pi8AIR_Table = 0x%08x\n", __FUNCTION__, ui32MbNum, ctx->sAirInfo.pi8AIR_Table); #endif tng_cmdbuf_insert_command(ctx->obj_context, ctx->ui32StreamID, MTX_CMDID_SW_AIR_BUF_CLEAR, 0, 0, 0); return ; } void tng_air_buf_free(context_ENC_p ctx) { if (ctx->sAirInfo.pi8AIR_Table != NULL) free(ctx->sAirInfo.pi8AIR_Table); return ; } /*********************************************************************************** * Function Name : functions for input control ************************************************************************************/ static IMG_UINT16 tng__rand(context_ENC_p ctx) { IMG_UINT16 ui16ret = 0; ctx->ui32pseudo_rand_seed = (IMG_UINT32) ((ctx->ui32pseudo_rand_seed * 1103515245 + 12345) & 0xffffffff); //Using mask, just in case ui16ret = (IMG_UINT16)(ctx->ui32pseudo_rand_seed / 65536) % 32768; return ui16ret; } //APP_FillSliceMap IMG_UINT32 tng_fill_slice_map(context_ENC_p ctx, IMG_INT32 i32SlotNum, IMG_UINT32 ui32StreamIndex) { context_ENC_mem *ps_mem = &(ctx->ctx_mem[ui32StreamIndex]); unsigned char *pvBuffer; IMG_UINT8 ui8SlicesPerPicture; IMG_UINT8 ui8HalfWaySlice; IMG_UINT32 ui32HalfwayBU; ui8SlicesPerPicture = ctx->ui8SlicesPerPicture; ui32HalfwayBU = 0; ui8HalfWaySlice=ui8SlicesPerPicture/2; drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: slot num = %d, aso = %d\n", __FUNCTION__, i32SlotNum, ctx->bArbitrarySO); drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: stream id = %d, addr = 0x%x\n", __FUNCTION__, ui32StreamIndex, ps_mem->bufs_slice_map.virtual_addr); psb_buffer_map(&(ps_mem->bufs_slice_map), &(ps_mem->bufs_slice_map.virtual_addr)); if (ps_mem->bufs_slice_map.virtual_addr == NULL) { drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping slice map\n", __FUNCTION__); goto out1; } pvBuffer = (unsigned char*)(ps_mem->bufs_slice_map.virtual_addr + (i32SlotNum * ctx->ctx_mem_size.slice_map)); if (pvBuffer == NULL) { drv_debug_msg(VIDEO_DEBUG_ERROR, "%s: pvBuffer == NULL\n", __FUNCTION__); goto out1; } if (ctx->bArbitrarySO) { IMG_UINT8 ui8Index; IMG_UINT8 ui32FirstBUInSlice; IMG_UINT8 ui8SizeInKicks; IMG_UINT8 ui8TotalBUs; IMG_UINT8 aui8SliceNumbers[MAX_SLICESPERPIC]; memset(aui8SliceNumbers, 0, MAX_SLICESPERPIC); ui8SlicesPerPicture = tng__rand(ctx) % ctx->ui8SlicesPerPicture + 1; // Fill slice map // Fill number of slices * pvBuffer = ui8SlicesPerPicture; pvBuffer++; for (ui8Index = 0; ui8Index < ui8SlicesPerPicture; ui8Index++) aui8SliceNumbers[ui8Index] = ui8Index; // randomise slice numbers for (ui8Index = 0; ui8Index < 20; ui8Index++) { IMG_UINT8 ui8FirstCandidate; IMG_UINT8 ui8SecondCandidate; IMG_UINT8 ui8Temp; ui8FirstCandidate = tng__rand(ctx) % ui8SlicesPerPicture; ui8SecondCandidate = tng__rand(ctx) % ui8SlicesPerPicture; ui8Temp = aui8SliceNumbers[ui8FirstCandidate]; aui8SliceNumbers[ui8FirstCandidate] = aui8SliceNumbers[ui8SecondCandidate]; aui8SliceNumbers[ui8SecondCandidate] = ui8Temp; } ui8TotalBUs = (ctx->ui16PictureHeight / 16) * (ctx->ui16Width / 16) / ctx->sRCParams.ui32BUSize; ui32FirstBUInSlice = 0; for (ui8Index = 0; ui8Index < ui8SlicesPerPicture - 1; ui8Index++) { IMG_UINT32 ui32BUsCalc; if (ui8Index==ui8HalfWaySlice) ui32HalfwayBU=ui32FirstBUInSlice; ui32BUsCalc=(ui8TotalBUs - 1 * (ui8SlicesPerPicture - ui8Index)); if(ui32BUsCalc) ui8SizeInKicks = tng__rand(ctx) %ui32BUsCalc + 1; else ui8SizeInKicks = 1; ui8TotalBUs -= ui8SizeInKicks; // slice number * pvBuffer = aui8SliceNumbers[ui8Index]; pvBuffer++; // SizeInKicks BU * pvBuffer = ui8SizeInKicks; pvBuffer++; ui32FirstBUInSlice += (IMG_UINT32) ui8SizeInKicks; } ui8SizeInKicks = ui8TotalBUs; // slice number * pvBuffer = aui8SliceNumbers[ui8SlicesPerPicture - 1]; pvBuffer++; // last BU * pvBuffer = ui8SizeInKicks; pvBuffer++; } else { // Fill standard Slice Map (non arbitrary) IMG_UINT8 ui8Index; IMG_UINT8 ui8SliceNumber; IMG_UINT8 ui32FirstBUInSlice; IMG_UINT8 ui8SizeInKicks; IMG_UINT32 ui32SliceHeight; // Fill number of slices * pvBuffer = ui8SlicesPerPicture; pvBuffer++; ui32SliceHeight = (ctx->ui16PictureHeight / ctx->ui8SlicesPerPicture) & ~15; ui32FirstBUInSlice = 0; ui8SliceNumber = 0; for (ui8Index = 0; ui8Index < ui8SlicesPerPicture - 1; ui8Index++) { if (ui8Index==ui8HalfWaySlice) ui32HalfwayBU=ui32FirstBUInSlice; ui8SizeInKicks = ((ui32SliceHeight / 16)*(ctx->ui16Width/16))/ctx->sRCParams.ui32BUSize; // slice number * pvBuffer = ui8SliceNumber; pvBuffer++; // SizeInKicks BU * pvBuffer = ui8SizeInKicks; pvBuffer++; ui8SliceNumber++; ui32FirstBUInSlice += (IMG_UINT32) ui8SizeInKicks; } ui32SliceHeight = ctx->ui16PictureHeight - ui32SliceHeight * (ctx->ui8SlicesPerPicture - 1); if (ui8Index==ui8HalfWaySlice) ui32HalfwayBU=ui32FirstBUInSlice; ui8SizeInKicks = ((ui32SliceHeight / 16)*(ctx->ui16Width/16))/ctx->sRCParams.ui32BUSize; // slice number * pvBuffer = ui8SliceNumber; pvBuffer++; // last BU * pvBuffer = ui8SizeInKicks; pvBuffer++; } out1: psb_buffer_unmap(&(ps_mem->bufs_slice_map)); ctx->ui32HalfWayBU[i32SlotNum] = ui32HalfwayBU; drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: ui32HalfWayBU = %d\n", __FUNCTION__, ctx->ui32HalfWayBU[i32SlotNum]); return ui32HalfwayBU; } //IMG_V_GetInpCtrlBuf static VAStatus tng__map_inp_ctrl_buf( context_ENC_p ctx, IMG_UINT8 ui8SlotNumber, IMG_UINT8 **ppsInpCtrlBuf) { VAStatus vaStatus = VA_STATUS_SUCCESS; context_ENC_mem* ps_mem = &(ctx->ctx_mem[0]); context_ENC_mem_size *ps_mem_size = &(ctx->ctx_mem_size); if (ppsInpCtrlBuf == NULL) { drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: ppsInpCtrlBuf == NULL\n", __FUNCTION__); return VA_STATUS_ERROR_INVALID_PARAMETER; } *ppsInpCtrlBuf = NULL; // Not enabled // if enabled, return the input-control buffer corresponding to this slot if (ctx->bEnableInpCtrl) { vaStatus = psb_buffer_map(&(ps_mem->bufs_mb_ctrl_in_params), ppsInpCtrlBuf); if (vaStatus == VA_STATUS_SUCCESS) *ppsInpCtrlBuf += ui8SlotNumber * ps_mem_size->mb_ctrl_in_params; else psb_buffer_unmap(&(ps_mem->bufs_mb_ctrl_in_params)); } return vaStatus; } static VAStatus tng__unmap_inp_ctrl_buf( context_ENC_p ctx, IMG_UINT8 __maybe_unused ui8SlotNumber, IMG_UINT8 **ppsInpCtrlBuf) { VAStatus vaStatus = VA_STATUS_SUCCESS; context_ENC_mem* ps_mem = &(ctx->ctx_mem[0]); // if enabled, return the input-control buffer corresponding to this slot if (*ppsInpCtrlBuf != NULL) { psb_buffer_unmap(&(ps_mem->bufs_mb_ctrl_in_params)); *ppsInpCtrlBuf = NULL; // Not enabled } return vaStatus; } //APP_FillInpCtrlBuf #define DEFAULT_INTER_INTRA_SCALE_TBL_IDX (0) #define DEFAULT_CODED_SKIPPED_SCALE_TBL_IDX (0) #define DEFAULT_INPUT_QP (0xF) #define SIZEOF_MB_IN_CTRL_PARAM (2) static void tng__fill_inp_ctrl_buf( context_ENC_p ctx, IMG_UINT8 *pInpCtrlBuf, IMG_INT16 i16IntraRefresh, IMG_INT8* pi8QP, IMG_UINT32 __maybe_unused ui32HalfWayBU) { IMG_PVOID pvBuffer; IMG_UINT32 ui32MBFrameWidth; IMG_UINT32 ui32MBPictureHeight; IMG_UINT32 ui32MBSliceHeight; IMG_UINT16 ui16DefaultParam; IMG_UINT16 ui16IntraParam; IMG_BOOL bRefresh=IMG_FALSE; IMG_UINT32 ui32CurrentIndex; IMG_UINT32 ui32MBx, ui32MBy; IMG_UINT16 *pui16MBParam; IMG_INT8 i8QPInit; IMG_INT8 i8QP; IMG_INT8 iMaxQP; #ifdef BRN_30324 IMG_UINT32 ui32HalfWayMB=ui32HalfWayBU * ctx->sRCParams.ui32BUSize; #endif if (pi8QP == NULL) { drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: start QP == NULL\n", __FUNCTION__); return ; } drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: start QP = %d\n", __FUNCTION__, *pi8QP); if (i16IntraRefresh > 0) { bRefresh=IMG_TRUE; } iMaxQP = 31; if (ctx->eStandard == IMG_STANDARD_H264) { iMaxQP = 51; } if(pi8QP) { i8QPInit = * pi8QP; } else { i8QPInit = DEFAULT_INPUT_QP; } // get the buffer // IMG_C_GetBuffer(psActiveContext->hContext, pInpCtrlBuf, &pvBuffer,IMG_TRUE); pvBuffer = (IMG_PVOID) pInpCtrlBuf; //fill data ui32MBFrameWidth = (ctx->ui16Width/16); ui32MBPictureHeight = (ctx->ui16PictureHeight/16); ui32MBSliceHeight = (ui32MBPictureHeight/ctx->ui8SlicesPerPicture); pui16MBParam = (IMG_UINT16 *)pvBuffer; ui32CurrentIndex=0; for(ui32MBy = 0; ui32MBy < (IMG_UINT32)(ctx->ui16PictureHeight / 16); ui32MBy++) { for(ui32MBx = 0; ui32MBx < ui32MBFrameWidth; ui32MBx++) { IMG_UINT16 ui16MBParam = 0; #ifdef BRN_30324 if (ui32HalfWayMB && ui32CurrentIndex == ui32HalfWayMB) if (ctx->ui8SlicesPerPicture > 1 && ctx->i32NumPipes > 1) { ui32CurrentIndex=(((ui32CurrentIndex)+31)&(~31)); } #endif i8QP = i8QPInit + ((tng__rand(ctx)%6)-3); i8QP = tng__max(tng__min(i8QP, iMaxQP), ctx->sRCParams.iMinQP); ui16DefaultParam = ( i8QP<<10) | (3 <<7) |(3<<4); ui16IntraParam = ( i8QP<<10) | (0 <<7) |(0<<4); ui16MBParam = ui16DefaultParam; if (bRefresh) { if ((IMG_INT32)ui32CurrentIndex > ctx->i32LastCIRIndex) { ctx->i32LastCIRIndex = ui32CurrentIndex; ui16MBParam = ui16IntraParam; i16IntraRefresh--; if(i16IntraRefresh <= 0) bRefresh = IMG_FALSE; } } pui16MBParam[ui32CurrentIndex++] = ui16MBParam; } } if (bRefresh) { ctx->i32LastCIRIndex = -1; while (i16IntraRefresh) { i8QP = i8QPInit + ((tng__rand(ctx)%6)-3); i8QP = tng__max(tng__min(i8QP, iMaxQP), ctx->sRCParams.iMinQP); ui16IntraParam = ( i8QP<<10) |(0 <<7) |(0<<4); pui16MBParam[++ctx->i32LastCIRIndex] = ui16IntraParam; i16IntraRefresh--; } } drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: end QP = %d\n", __FUNCTION__, *pi8QP); //release buffer //IMG_C_ReleaseBuffer(psActiveContext->hContext, pInpCtrlBuf,IMG_TRUE); return ; } /*********************************************************************************** * Function Name : APP_FillInputControl * Inputs : psContext * Description : Fills input control buffer for a given source picture ************************************************************************************/ static void tng__fill_input_control( context_ENC_p ctx, IMG_UINT8 ui8SlotNum, IMG_UINT32 __maybe_unused ui32HalfWayBU) { IMG_UINT8 * pInpCtrlBuf = NULL; IMG_INT8 i8InitialQp = ctx->sRCParams.ui32InitialQp; // Get pointer to MB Control buffer for current source buffer (if input control is enabled, otherwise buffer is NULL) // Please refer to kernel tng_setup_cir_buf() /* tng__map_inp_ctrl_buf(ctx, ui8SlotNum, &pInpCtrlBuf); if (pInpCtrlBuf!= IMG_NULL) { tng__fill_inp_ctrl_buf(ctx, pInpCtrlBuf,(IMG_INT16)(ctx->ui16IntraRefresh), &i8InitialQp, ui32HalfWayBU); } tng__unmap_inp_ctrl_buf(ctx, ui8SlotNum, &pInpCtrlBuf); */ tng_cmdbuf_insert_command(ctx->obj_context, ctx->ui32StreamID, MTX_CMDID_SW_FILL_INPUT_CTRL, ui8SlotNum, 0, 0); return ; } static void tng__send_air_inp_ctrl_buf(context_ENC_p ctx, IMG_INT8 *pInpCtrlBuf) { //IMG_PVOID pvICBuffer; IMG_UINT16 ui16IntraParam; //IMG_BOOL bRefresh = IMG_FALSE; IMG_UINT32 ui32CurrentCnt, ui32SentCnt; IMG_UINT32 ui32MBMaxSize; IMG_UINT16 *pui16MBParam; IMG_UINT32 ui32NewScanPos, ui32Skip; #ifdef ADAPTIVE_INTRA_REFRESH_DEBUG_OUTPUT IMG_CHAR TmpOutputTble[396]; //Debug only #endif ui16IntraParam = (0 << 7) | (0 << 4); if (ctx->ui32FrameCount[0] < 1) return; // get the buffer pui16MBParam = (IMG_UINT16 *) pInpCtrlBuf; //fill data ui32MBMaxSize = (IMG_UINT32)(ctx->ui16PictureHeight / 16) * (IMG_UINT32)(ctx->ui16Width / 16); ui32CurrentCnt = 0; if (ctx->sAirInfo.i16AIRSkipCnt >= 0) ui32Skip = ctx->sAirInfo.i16AIRSkipCnt; else //ui32Skip=APP_Rand() % psActiveContext->sAirInfo.i32NumAIRSPerFrame; // Pseudorandom skip. ui32Skip = (ctx->ui32FrameCount[0] & 0x7) + 1; // Pseudorandom skip. #ifdef ADAPTIVE_INTRA_REFRESH_DEBUG_OUTPUT { IMG_UINT32 tsp; if (fp) { fp = fopen("SADvals.txt", "a"); } else { fp = fopen("SADvals.txt", "w"); } fprintf(fp, "\n---------------------------------------------------------------------------\n"); fprintf(fp, "SENDING SADvals (skip:%i)\n", ui32Skip); for (tsp = 0; tsp < ui32MBMaxSize; tsp++) { if (ctx->sAirInfo.pi8AIR_Table[tsp] > 0) { TmpOutputTble[tsp] = 'x'; } else { TmpOutputTble[tsp] = 'o'; } } } #endif ui32NewScanPos = (IMG_UINT32) (ctx->sAirInfo.ui16AIRScanPos + ui32Skip) % ui32MBMaxSize; ui32CurrentCnt = ui32SentCnt = 0; while (ui32CurrentCnt < ui32MBMaxSize && ((ctx->sAirInfo.i32NumAIRSPerFrame == 0) || ui32SentCnt < (IMG_UINT32) ctx->sAirInfo.i32NumAIRSPerFrame)) { IMG_UINT16 ui16MBParam; if (ctx->sAirInfo.pi8AIR_Table[ui32NewScanPos] >= 0) { // Mark the entry as 'touched' ctx->sAirInfo.pi8AIR_Table[ui32NewScanPos] = -1 - ctx->sAirInfo.pi8AIR_Table[ui32NewScanPos]; if (ctx->sAirInfo.pi8AIR_Table[ui32NewScanPos] < -1) { ui16MBParam = pui16MBParam[ui32NewScanPos] & (0xFF << 10); ui16MBParam |= ui16IntraParam; pui16MBParam[ui32NewScanPos] = ui16MBParam; ctx->sAirInfo.pi8AIR_Table[ui32NewScanPos]++; #ifdef ADAPTIVE_INTRA_REFRESH_DEBUG_OUTPUT TmpOutputTble[ui32NewScanPos]='I'; #endif ui32NewScanPos += ui32Skip; ui32SentCnt++; } ui32CurrentCnt++; } ui32NewScanPos++; ui32NewScanPos = ui32NewScanPos % ui32MBMaxSize; if (ui32NewScanPos == ctx->sAirInfo.ui16AIRScanPos) { /* we have looped around */ break; } } ctx->sAirInfo.ui16AIRScanPos = ui32NewScanPos; #ifdef ADAPTIVE_INTRA_REFRESH_DEBUG_OUTPUT { IMG_UINT32 tsp; for (tsp = 0; tsp < ui32MBMaxSize; tsp++) { if (tsp % ((IMG_UINT32)(ctx->ui16Width/16)) == 0) { fprintf(fp, "\n%c", TmpOutputTble[tsp]); } else { fprintf(fp, "%c", TmpOutputTble[tsp]); } } fprintf(fp, "\n---------------------------------------------------------------------------\n"); fclose(fp); } #endif drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: end\n", __FUNCTION__); return ; } // Adaptive Intra Refresh (AIR) - send the AIR values to the next bufferk // APP_UpdateAdaptiveIntraRefresh_Send static void tng__update_air_send(context_ENC_p ctx, IMG_UINT8 ui8SlotNum) { IMG_UINT8 *pInpCtrlBuf = NULL; drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: start\n", __FUNCTION__); // Get pointer to MB Control buffer for current source buffer (if input control is enabled, otherwise buffer is NULL) #if 0 tng__map_inp_ctrl_buf(ctx, ui8SlotNum, &pInpCtrlBuf); if(pInpCtrlBuf!= IMG_NULL) { tng__send_air_inp_ctrl_buf(ctx, (IMG_INT8 *)pInpCtrlBuf); } tng__unmap_inp_ctrl_buf(ctx, ui8SlotNum, &pInpCtrlBuf); drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: end\n", __FUNCTION__); #endif tng_cmdbuf_insert_command(ctx->obj_context, ctx->ui32StreamID, MTX_CMDID_SW_UPDATE_AIR_SEND, ui8SlotNum, 0, 0); return ; } /*********************************************************************************** * Function Name : functions for output control ************************************************************************************/ //IMG_V_GetFirstPassOutBuf VAStatus tng__map_first_pass_out_buf( context_ENC_p ctx, IMG_UINT8 __maybe_unused ui8SlotNumber, IMG_UINT8 **ppsFirstPassOutBuf) { VAStatus vaStatus = VA_STATUS_SUCCESS; context_ENC_mem* ps_mem = &(ctx->ctx_mem[0]); if (ppsFirstPassOutBuf == NULL) { drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: ppsFirstPassOutBuf == NULL\n", __FUNCTION__); return VA_STATUS_ERROR_INVALID_PARAMETER; } *ppsFirstPassOutBuf = NULL; // Not enabled // if enabled, return the input-control buffer corresponding to this slot if (ctx->bEnableInpCtrl) { vaStatus = psb_buffer_map(&(ps_mem->bufs_first_pass_out_params), ppsFirstPassOutBuf); if (vaStatus != VA_STATUS_SUCCESS) psb_buffer_unmap(&(ps_mem->bufs_first_pass_out_params)); } return vaStatus; } VAStatus tng__unmap_first_pass_out_buf( context_ENC_p ctx, IMG_UINT8 __maybe_unused ui8SlotNumber, IMG_UINT8 **ppsFirstPassOutBuf) { VAStatus vaStatus = VA_STATUS_SUCCESS; context_ENC_mem* ps_mem = &(ctx->ctx_mem[0]); // if enabled, return the input-control buffer corresponding to this slot if (*ppsFirstPassOutBuf != NULL) { psb_buffer_unmap(&(ps_mem->bufs_first_pass_out_params)); *ppsFirstPassOutBuf = NULL; // Not enabled } return vaStatus; } //IMG_V_GetBestMBDecisionOutBuf VAStatus tng__map_best_mb_decision_out_buf( context_ENC_p ctx, IMG_UINT8 __maybe_unused ui8SlotNumber, IMG_UINT8 **ppsBestMBDecisionOutBuf) { VAStatus vaStatus = VA_STATUS_SUCCESS; context_ENC_mem* ps_mem = &(ctx->ctx_mem[0]); // if enabled, return the input-control buffer corresponding to this slot if (ctx->bEnableInpCtrl) vaStatus = psb_buffer_map(&(ps_mem->bufs_first_pass_out_best_multipass_param), ppsBestMBDecisionOutBuf); else *ppsBestMBDecisionOutBuf = NULL; // Not enabled return vaStatus; } VAStatus tng__unmap_best_mb_decision_out_buf( context_ENC_p ctx, IMG_UINT8 __maybe_unused ui8SlotNumber, IMG_UINT8 **ppsBestMBDecisionOutBuf) { VAStatus vaStatus = VA_STATUS_SUCCESS; context_ENC_mem* ps_mem = &(ctx->ctx_mem[0]); // if enabled, return the input-control buffer corresponding to this slot if (*ppsBestMBDecisionOutBuf != NULL) { psb_buffer_unmap(&(ps_mem->bufs_first_pass_out_best_multipass_param)); *ppsBestMBDecisionOutBuf = NULL; // Not enabled } return vaStatus; } // Calculate Adaptive Intra Refresh (AIR) static void tng__calc_air_inp_ctrl_buf(context_ENC_p ctx, IMG_UINT8 *pFirstPassOutBuf, IMG_UINT8 *pBestMBDecisionCtrlBuf) { IMG_UINT8 *pSADPointer; IMG_UINT8 *pvSADBuffer; IMG_UINT8 ui8IsAlreadyIntra; IMG_UINT32 ui32MBFrameWidth; IMG_UINT32 ui32MBPictureHeight; IMG_UINT16 ui16IntraParam; IMG_UINT32 ui32MBx, ui32MBy; IMG_UINT32 ui32SADParam; IMG_UINT32 ui32tSAD_Threshold, ui32tSAD_ThresholdLo, ui32tSAD_ThresholdHi; IMG_UINT32 ui32MaxMBs, ui32NumMBsOverThreshold, ui32NumMBsOverLo, ui32NumMBsOverHi; IMG_BEST_MULTIPASS_MB_PARAMS *psBestMB_Params; IMG_FIRST_STAGE_MB_PARAMS *psFirstMB_Params; ui16IntraParam = (0 << 7) | (0 << 4); ui32NumMBsOverThreshold = ui32NumMBsOverLo = ui32NumMBsOverHi = 0; //drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: start\n", __FUNCTION__); // if (psActiveContext->ui32EncodeSent < (IMG_UINT32)psActiveContext->ui8MaxSourceSlots + 1) // if (ctx->ui32FrameCount[0] < (IMG_UINT32)(ctx->ui8SlotsInUse + 1)) // return; drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: start\n", __FUNCTION__); //fill data ui32MBFrameWidth = (ctx->ui16Width/16); ui32MBPictureHeight = (ctx->ui16PictureHeight/16); // get the SAD results buffer (either IPE0 and IPE1 results or, preferably, the more accurate Best Multipass SAD results) if (pBestMBDecisionCtrlBuf) { pvSADBuffer = pBestMBDecisionCtrlBuf; drv_debug_msg(VIDEO_DEBUG_GENERAL,"AIR active: Using Best Multipass SAD values "); //#ifdef MULTIPASS_MV_PLACEMENT_ISSUE_FIXED if ((ctx->ui8EnableSelStatsFlags & ESF_MP_BEST_MOTION_VECTOR_STATS)) //#endif { // The actual Param structures (which contain SADs) are located after the Multipass Motion Vector entries pvSADBuffer += (ui32MBPictureHeight * (ui32MBFrameWidth) * sizeof(IMG_BEST_MULTIPASS_MB_PARAMS_IPMV)); } } else { pvSADBuffer = pFirstPassOutBuf; drv_debug_msg(VIDEO_DEBUG_GENERAL,"AIR active: Using IPE SAD values "); } if (ctx->sAirInfo.i32NumAIRSPerFrame == 0) ui32MaxMBs = ui32MBFrameWidth * ui32MBPictureHeight; // Default to ALL MB's in frame else if (ctx->sAirInfo.i32NumAIRSPerFrame < 0) ctx->sAirInfo.i32NumAIRSPerFrame = ui32MaxMBs = ((ui32MBFrameWidth * ui32MBPictureHeight) + 99) / 100; // Default to 1% of MB's in frame (min 1) else ui32MaxMBs = ctx->sAirInfo.i32NumAIRSPerFrame; pSADPointer = (IMG_UINT8 *)pvSADBuffer; if (ctx->sAirInfo.i32SAD_Threshold >= 0) ui32tSAD_Threshold = (IMG_UINT16)ctx->sAirInfo.i32SAD_Threshold; else { // Running auto adjust threshold adjust mode if (ctx->sAirInfo.i32SAD_Threshold == -1) { // This will occur only the first time if (pBestMBDecisionCtrlBuf) { psBestMB_Params=(IMG_BEST_MULTIPASS_MB_PARAMS *) pSADPointer; // Auto seed the threshold with the first value ui32SADParam = psBestMB_Params->ui32SAD_Inter_MBInfo & IMG_BEST_MULTIPASS_SAD_MASK; } else { psFirstMB_Params=(IMG_FIRST_STAGE_MB_PARAMS *) pSADPointer; // Auto seed the threshold with the first value ui32SADParam = (IMG_UINT32) psFirstMB_Params->ui16Ipe0Sad; } ctx->sAirInfo.i32SAD_Threshold = -1 - ui32SADParam; // Negative numbers indicate auto-adjusting threshold } ui32tSAD_Threshold = (IMG_UINT32) - (ctx->sAirInfo.i32SAD_Threshold + 1); } ui32tSAD_ThresholdLo = ui32tSAD_Threshold / 2; ui32tSAD_ThresholdHi = ui32tSAD_Threshold + ui32tSAD_ThresholdLo; drv_debug_msg(VIDEO_DEBUG_GENERAL,"Th:%u, MaxMbs:%u, Skp:%i\n", (unsigned int)ui32tSAD_Threshold, (unsigned int)ui32MaxMBs, ctx->sAirInfo.i16AIRSkipCnt); #ifdef ADAPTIVE_INTRA_REFRESH_DEBUG_OUTPUT if (fp) fp=fopen("SADvals.txt","a"); else fp=fopen("SADvals.txt","w"); if (ctx->sAirInfo.i32SAD_Threshold>=0) if (ctx->sAirInfo.i32NumAIRSPerFrame>0) fprintf(fp, "S_SADThreshold: %i MaxMBs: %i\n", ui32tSAD_Threshold, ui32MaxMBs); else fprintf(fp, "S_SADThreshold: %i MaxMBs: NA\n", ui32tSAD_Threshold, ui32MaxMBs); else fprintf(fp, "V_SADThreshold: %i MaxMBs: %i\n", ui32tSAD_Threshold, ui32MaxMBs); if (pBestMBDecisionCtrlBuf) fprintf(fp, "Using Best Multipass SAD values\n"); else fprintf(fp, "Using Motion Search Data IPE SAD values\n"); #endif // This loop could be optimised to a single counter if necessary, retaining for clarity for (ui32MBy = 0; ui32MBy < ui32MBPictureHeight; ui32MBy++) { for( ui32MBx=0; ui32MBx<ui32MBFrameWidth; ui32MBx++) { #ifdef ADAPTIVE_INTRA_REFRESH_DEBUG_OUTPUT IMG_CHAR cMarked; cMarked='_'; #endif // Turn all negative table values to positive (reset 'touched' state of a block that may have been set in APP_SendAIRInpCtrlBuf()) if (ctx->sAirInfo.pi8AIR_Table[ui32MBy * ui32MBFrameWidth + ui32MBx] < 0) ctx->sAirInfo.pi8AIR_Table[ui32MBy * ui32MBFrameWidth + ui32MBx] = -1 - ctx->sAirInfo.pi8AIR_Table[ui32MBy * ui32MBFrameWidth + ui32MBx]; // This will read the SAD value from the buffer (either IPE0 SAD or the superior Best multipass parameter structure SAD value) if (pBestMBDecisionCtrlBuf) { psBestMB_Params = (IMG_BEST_MULTIPASS_MB_PARAMS *) pSADPointer; ui32SADParam = psBestMB_Params->ui32SAD_Inter_MBInfo & IMG_BEST_MULTIPASS_SAD_MASK; if ((psBestMB_Params->ui32SAD_Intra_MBInfo & IMG_BEST_MULTIPASS_MB_TYPE_MASK) >> IMG_BEST_MULTIPASS_MB_TYPE_SHIFT == 1) ui8IsAlreadyIntra = 1; else ui8IsAlreadyIntra = 0; pSADPointer=(IMG_UINT8 *) &(psBestMB_Params[1]); } else { psFirstMB_Params=(IMG_FIRST_STAGE_MB_PARAMS *) pSADPointer; ui32SADParam = (IMG_UINT32) psFirstMB_Params->ui16Ipe0Sad; ui32SADParam += (IMG_UINT32) psFirstMB_Params->ui16Ipe1Sad; ui32SADParam /= 2; ui8IsAlreadyIntra = 0; // We don't have the information to determine this pSADPointer=(IMG_UINT8 *) &(psFirstMB_Params[1]); } if (ui32SADParam >= ui32tSAD_ThresholdLo) { ui32NumMBsOverLo++; if (ui32SADParam >= ui32tSAD_Threshold) { #ifdef ADAPTIVE_INTRA_REFRESH_DEBUG_OUTPUT cMarked='i'; #endif // if (!ui8IsAlreadyIntra) // Don't mark this block if it's just been encoded as an Intra block anyway // (results seem better without this condition anyway) { ctx->sAirInfo.pi8AIR_Table[ui32MBy * ui32MBFrameWidth + ui32MBx]++; #ifdef ADAPTIVE_INTRA_REFRESH_DEBUG_OUTPUT cMarked='I'; #endif } ui32NumMBsOverThreshold++; if (ui32SADParam >= ui32tSAD_ThresholdHi) ui32NumMBsOverHi++; } } #ifdef ADAPTIVE_INTRA_REFRESH_DEBUG_OUTPUT fprintf(fp,"%4x[%i]%c, ",ui32SADParam, ctx->sAirInfo.pi8AIR_Table[ui32MBy * ui32MBFrameWidth + ui32MBx], cMarked); #endif } pSADPointer=(IMG_UINT8 *) ALIGN_64(((IMG_UINT32) pSADPointer)); #ifdef ADAPTIVE_INTRA_REFRESH_DEBUG_OUTPUT fprintf(fp,"\n"); #endif } // Test and process running adaptive threshold case if (ctx->sAirInfo.i32SAD_Threshold < 0) { // Adjust our threshold (to indicate it's auto-adjustable store it as a negative value minus 1) if (ui32NumMBsOverLo <= ui32MaxMBs) ctx->sAirInfo.i32SAD_Threshold = (IMG_INT32) - ((IMG_INT32)ui32tSAD_ThresholdLo) - 1; else if (ui32NumMBsOverHi >= ui32MaxMBs) ctx->sAirInfo.i32SAD_Threshold = (IMG_INT32) - ((IMG_INT32)ui32tSAD_ThresholdHi) - 1; else { if (ui32MaxMBs < ui32NumMBsOverThreshold) { ctx->sAirInfo.i32SAD_Threshold = ((IMG_INT32)ui32tSAD_ThresholdHi - (IMG_INT32)ui32tSAD_Threshold); ctx->sAirInfo.i32SAD_Threshold *= ((IMG_INT32)ui32MaxMBs - (IMG_INT32)ui32NumMBsOverThreshold); ctx->sAirInfo.i32SAD_Threshold /= ((IMG_INT32)ui32NumMBsOverHi - (IMG_INT32)ui32NumMBsOverThreshold); ctx->sAirInfo.i32SAD_Threshold += ui32tSAD_Threshold; } else { ctx->sAirInfo.i32SAD_Threshold = ((IMG_INT32)ui32tSAD_Threshold - (IMG_INT32)ui32tSAD_ThresholdLo); ctx->sAirInfo.i32SAD_Threshold *= ((IMG_INT32)ui32MaxMBs - (IMG_INT32)ui32NumMBsOverLo); ctx->sAirInfo.i32SAD_Threshold /= ((IMG_INT32)ui32NumMBsOverThreshold - (IMG_INT32)ui32NumMBsOverLo); ctx->sAirInfo.i32SAD_Threshold += ui32tSAD_ThresholdLo; } ctx->sAirInfo.i32SAD_Threshold = -ctx->sAirInfo.i32SAD_Threshold - 1; } #ifdef ADAPTIVE_INTRA_REFRESH_DEBUG_OUTPUT fprintf(fp,"THRESHOLDS ADJUSTMENT\nThrLo:%i ThrMid:%i ThrHi:%i\nMBsLo:%i MBsMid:%i MBsHi:%i\n",ui32tSAD_ThresholdLo, ui32tSAD_Threshold, ui32tSAD_ThresholdHi, ui32NumMBsOverLo, ui32NumMBsOverThreshold, ui32NumMBsOverHi); fprintf(fp,"Target No. MB's:%i\nThreshold adjusted to: %i\n",ui32MaxMBs, -(ctx->sAirInfo.i32SAD_Threshold)); #endif } #ifdef ADAPTIVE_INTRA_REFRESH_DEBUG_OUTPUT fprintf(fp,"\n MBs tagged:%i\n", ui32NumMBsOverThreshold); fclose(fp); #endif drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: end\n", __FUNCTION__); return; } // Adaptive Intra Refresh (AIR) - Calculate the new AIR values based upon Motion Search feedback // APP_UpdateAdaptiveIntraRefresh_Calc static void tng_update_air_calc(context_ENC_p ctx, IMG_UINT8 ui8SlotNum) { IMG_UINT8 *pFirstPassOutBuf = NULL; IMG_UINT8 *pBestMBDecisionCtrlBuf = NULL; #if 0 // Get pointer to MB Control buffer for current source buffer (if input control is enabled, otherwise buffer is NULL) tng__map_first_pass_out_buf(ctx, ui8SlotNum, &pFirstPassOutBuf); tng__map_best_mb_decision_out_buf(ctx, ui8SlotNum, &pBestMBDecisionCtrlBuf); if(pFirstPassOutBuf || pBestMBDecisionCtrlBuf) tng__calc_air_inp_ctrl_buf (ctx, pFirstPassOutBuf, pBestMBDecisionCtrlBuf); tng__unmap_first_pass_out_buf(ctx, ui8SlotNum, &pFirstPassOutBuf); tng__unmap_best_mb_decision_out_buf(ctx, ui8SlotNum, &pBestMBDecisionCtrlBuf); #endif tng_cmdbuf_insert_command(ctx->obj_context, ctx->ui32StreamID, MTX_CMDID_SW_UPDATE_AIR_CALC, ui8SlotNum, 0, 0); } /*********************************************************************************** * Function Name : * Inputs : * Description : ************************************************************************************/ void tng_air_set_input_control(context_ENC_p ctx, IMG_UINT8 __maybe_unused ui8StreamID) { IMG_UINT8 ui8SlotIndex = ctx->ui8SlotsCoded; drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: slot index = %d\n", __FUNCTION__, ctx->ui8SlotsCoded); //IMG_UINT32 ui32HalfWayBU; //ui32HalfWayBU = tng_fill_slice_map(ctx, ui8SlotIndex, ui8StreamID); ////////////////////////////// INPUT CONTROL // Add input control stuff here tng__fill_input_control(ctx, ui8SlotIndex, ctx->ui32HalfWayBU[ui8SlotIndex]); // Adaptive Intra Refresh (AIR) - send the AIR values to the next buffer if (ctx->bEnableAIR) tng__update_air_send(ctx, ui8SlotIndex); } /*********************************************************************************** * Function Name : * Inputs : * Description : ************************************************************************************/ void tng_air_set_output_control(context_ENC_p ctx, IMG_UINT8 __maybe_unused ui8StreamID) { IMG_UINT8 ui8SlotIndex = ctx->ui8SlotsCoded; drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: slot index = %d\n", __FUNCTION__, ctx->ui8SlotsCoded); if ((ctx->eFrameType == IMG_INTRA_IDR) || (ctx->eFrameType == IMG_INTRA_FRAME)) tng_air_buf_clear(ctx); else tng_update_air_calc(ctx, ui8SlotIndex); return; }