/*
 * Subversion Repositories Kolibri OS
 *
 * Compare Revisions
 *
 * Regard whitespace Rev 5563 → Rev 5564
 *
 * /contrib/sdk/sources/Mesa/mesa-10.6.0/src/gallium/drivers/radeon/radeon_vce_40_2_2.c
 * 0,0 → 1,452
 */
/**************************************************************************
*
* Copyright 2013 Advanced Micro Devices, Inc.
* All Rights Reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the
* "Software"), to deal in the Software without restriction, including
* without limitation the rights to use, copy, modify, merge, publish,
* distribute, sub license, and/or sell copies of the Software, and to
* permit persons to whom the Software is furnished to do so, subject to
* the following conditions:
*
* The above copyright notice and this permission notice (including the
* next paragraph) shall be included in all copies or substantial portions
* of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
* IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR
* ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*
**************************************************************************/
 
/*
* Authors:
* Christian König <christian.koenig@amd.com>
*
*/
 
#include <stdio.h>
 
#include "pipe/p_video_codec.h"
 
#include "util/u_video.h"
#include "util/u_memory.h"
 
#include "vl/vl_video_buffer.h"
 
#include "r600_pipe_common.h"
#include "radeon_video.h"
#include "radeon_vce.h"
 
/*
 * Values written as "encProfile" by create(), which indexes this table with
 * (enc->base.profile - PIPE_VIDEO_PROFILE_MPEG4_AVC_BASELINE).
 * NOTE(review): the numbers look like H.264 profile_idc codes (66 = Baseline,
 * 77 = Main, 88 = Extended, 100 = High, ...), and the table presumably has to
 * follow the order of the PIPE_VIDEO_PROFILE_MPEG4_AVC_* enumerators --
 * confirm against the enum definition.
 */
static const unsigned profiles[7] = { 66, 77, 88, 100, 110, 122, 244 };
 
static struct rvce_cpb_slot *current_slot(struct rvce_encoder *enc)
{
return LIST_ENTRY(struct rvce_cpb_slot, enc->cpb_slots.prev, list);
}
 
static struct rvce_cpb_slot *l0_slot(struct rvce_encoder *enc)
{
return LIST_ENTRY(struct rvce_cpb_slot, enc->cpb_slots.next, list);
}
 
static struct rvce_cpb_slot *l1_slot(struct rvce_encoder *enc)
{
return LIST_ENTRY(struct rvce_cpb_slot, enc->cpb_slots.next->next, list);
}
 
/*
 * Compute the luma and chroma offsets for the frame stored in a CPB slot.
 *
 * One frame occupies row_bytes * (rows + rows / 2) units, where row_bytes is
 * the luma pitch passed through align(..., 128) and rows is the luma height
 * passed through align(..., 16). Slot N starts at N times that size; its
 * chroma data starts row_bytes * rows after the luma data.
 *
 * enc           - encoder whose luma surface supplies pitch and height
 * slot          - CPB slot; only slot->index is read
 * luma_offset   - out: start of the slot's luma data
 * chroma_offset - out: start of the slot's chroma data
 */
static void frame_offset(struct rvce_encoder *enc, struct rvce_cpb_slot *slot,
			 unsigned *luma_offset, unsigned *chroma_offset)
{
	const unsigned row_bytes = align(enc->luma->level[0].pitch_bytes, 128);
	const unsigned rows = align(enc->luma->npix_y, 16);
	const unsigned luma_bytes = row_bytes * rows;
	const unsigned frame_bytes = row_bytes * (rows + rows / 2);
	const unsigned base = slot->index * frame_bytes;

	*luma_offset = base;
	*chroma_offset = base + luma_bytes;
}
 
/* Emit the "session cmd" block (command 0x00000001) carrying enc->stream_handle. */
static void session(struct rvce_encoder *enc)
{
RVCE_BEGIN(0x00000001); // session cmd
RVCE_CS(enc->stream_handle);
RVCE_END();
}
 
/*
 * Emit a "task info" block (command 0x00000002).
 *
 * Only taskOperation varies: offsetOfNextTaskInfo is always written as
 * 0xffffffff and the remaining four fields as zero. Within this file the
 * callers pass 0 from create(), 3 from encode() and 1 from destroy().
 */
static void task_info(struct rvce_encoder *enc, uint32_t taskOperation)
{
RVCE_BEGIN(0x00000002); // task info
RVCE_CS(0xffffffff); // offsetOfNextTaskInfo
RVCE_CS(taskOperation); // taskOperation
RVCE_CS(0x00000000); // referencePictureDependency
RVCE_CS(0x00000000); // collocateFlagDependency
RVCE_CS(0x00000000); // feedbackIndex
RVCE_CS(0x00000000); // videoBitstreamRingIndex
RVCE_END();
}
 
/*
 * Emit the "feedback buffer" block (command 0x05000005).
 *
 * The feedbackRingAddressHi slot is filled through RVCE_WRITE using the
 * cs_buf and domains of enc->fb's resource; the low address word is written
 * as 0 and the ring size as 1.
 */
static void feedback(struct rvce_encoder *enc)
{
RVCE_BEGIN(0x05000005); // feedback buffer
RVCE_WRITE(enc->fb->res->cs_buf, enc->fb->res->domains); // feedbackRingAddressHi
RVCE_CS(0x00000000); // feedbackRingAddressLo
RVCE_CS(0x00000001); // feedbackRingSize
RVCE_END();
}
 
static void create(struct rvce_encoder *enc)
{
task_info(enc, 0x00000000);
 
RVCE_BEGIN(0x01000001); // create cmd
RVCE_CS(0x00000000); // encUseCircularBuffer
RVCE_CS(profiles[enc->base.profile -
PIPE_VIDEO_PROFILE_MPEG4_AVC_BASELINE]); // encProfile
RVCE_CS(enc->base.level); // encLevel
RVCE_CS(0x00000000); // encPicStructRestriction
RVCE_CS(enc->base.width); // encImageWidth
RVCE_CS(enc->base.height); // encImageHeight
RVCE_CS(enc->luma->level[0].pitch_bytes); // encRefPicLumaPitch
RVCE_CS(enc->chroma->level[0].pitch_bytes); // encRefPicChromaPitch
RVCE_CS(align(enc->luma->npix_y, 16) / 8); // encRefYHeightInQw
RVCE_CS(0x00000000); // encRefPic(Addr|Array)Mode, encPicStructRestriction, disableRDO
RVCE_END();
}
 
/*
 * Emit the "rate control" block (command 0x04000005).
 *
 * The method, target/peak bitrate, frame rate numerator and denominator,
 * VBV buffer size and per-picture bit budgets are copied from
 * enc->pic.rate_ctrl; the I/P/B QPs come from enc->pic.quant_*_frames.
 * encMaxQP is fixed at 0x33 (51) and every other field is written as zero.
 */
static void rate_control(struct rvce_encoder *enc)
{
RVCE_BEGIN(0x04000005); // rate control
RVCE_CS(enc->pic.rate_ctrl.rate_ctrl_method); // encRateControlMethod
RVCE_CS(enc->pic.rate_ctrl.target_bitrate); // encRateControlTargetBitRate
RVCE_CS(enc->pic.rate_ctrl.peak_bitrate); // encRateControlPeakBitRate
RVCE_CS(enc->pic.rate_ctrl.frame_rate_num); // encRateControlFrameRateNum
RVCE_CS(0x00000000); // encGOPSize
RVCE_CS(enc->pic.quant_i_frames); // encQP_I
RVCE_CS(enc->pic.quant_p_frames); // encQP_P
RVCE_CS(enc->pic.quant_b_frames); // encQP_B
RVCE_CS(enc->pic.rate_ctrl.vbv_buffer_size); // encVBVBufferSize
RVCE_CS(enc->pic.rate_ctrl.frame_rate_den); // encRateControlFrameRateDen
RVCE_CS(0x00000000); // encVBVBufferLevel
RVCE_CS(0x00000000); // encMaxAUSize
RVCE_CS(0x00000000); // encQPInitialMode
RVCE_CS(enc->pic.rate_ctrl.target_bits_picture); // encTargetBitsPerPicture
RVCE_CS(enc->pic.rate_ctrl.peak_bits_picture_integer); // encPeakBitsPerPictureInteger
RVCE_CS(enc->pic.rate_ctrl.peak_bits_picture_fraction); // encPeakBitsPerPictureFractional
RVCE_CS(0x00000000); // encMinQP
RVCE_CS(0x00000033); // encMaxQP
RVCE_CS(0x00000000); // encSkipFrameEnable
RVCE_CS(0x00000000); // encFillerDataEnable
RVCE_CS(0x00000000); // encEnforceHRD
RVCE_CS(0x00000000); // encBPicsDeltaQP
RVCE_CS(0x00000000); // encReferenceBPicsDeltaQP
RVCE_CS(0x00000000); // encRateControlReInitDisable
RVCE_END();
}
 
/*
 * Emit the "config extension" block (command 0x04000001) with
 * encEnablePerfLogging written as 3.
 */
static void config_extension(struct rvce_encoder *enc)
{
RVCE_BEGIN(0x04000001); // config extension
RVCE_CS(0x00000003); // encEnablePerfLogging
RVCE_END();
}
 
/*
 * Emit the "pic control" block (command 0x04000002).
 *
 * encNumMBsPerSlice is (aligned width / 16) * (aligned height / 16), where
 * each dimension is first passed through align(..., 16). The right and
 * bottom crop offsets are half of the difference between the aligned and the
 * real dimension. The B-picture pattern and the reference frame counts are
 * derived from enc->base.max_references; all remaining fields are constants.
 */
static void pic_control(struct rvce_encoder *enc)
{
unsigned encNumMBsPerSlice;

// one slice covers the whole aligned frame
encNumMBsPerSlice = align(enc->base.width, 16) / 16;
encNumMBsPerSlice *= align(enc->base.height, 16) / 16;

RVCE_BEGIN(0x04000002); // pic control
RVCE_CS(0x00000000); // encUseConstrainedIntraPred
RVCE_CS(0x00000000); // encCABACEnable
RVCE_CS(0x00000000); // encCABACIDC
RVCE_CS(0x00000000); // encLoopFilterDisable
RVCE_CS(0x00000000); // encLFBetaOffset
RVCE_CS(0x00000000); // encLFAlphaC0Offset
RVCE_CS(0x00000000); // encCropLeftOffset
// NOTE(review): the >> 1 suggests crop offsets are counted in units of two pixels -- confirm
RVCE_CS((align(enc->base.width, 16) - enc->base.width) >> 1); // encCropRightOffset
RVCE_CS(0x00000000); // encCropTopOffset
RVCE_CS((align(enc->base.height, 16) - enc->base.height) >> 1); // encCropBottomOffset
RVCE_CS(encNumMBsPerSlice); // encNumMBsPerSlice
RVCE_CS(0x00000000); // encIntraRefreshNumMBsPerSlot
RVCE_CS(0x00000000); // encForceIntraRefresh
RVCE_CS(0x00000000); // encForceIMBPeriod
RVCE_CS(0x00000000); // encPicOrderCntType
RVCE_CS(0x00000000); // log2_max_pic_order_cnt_lsb_minus4
RVCE_CS(0x00000000); // encSPSID
RVCE_CS(0x00000000); // encPPSID
RVCE_CS(0x00000040); // encConstraintSetFlags
RVCE_CS(MAX2(enc->base.max_references, 1) - 1); // encBPicPattern
RVCE_CS(0x00000000); // weightPredModeBPicture
RVCE_CS(MIN2(enc->base.max_references, 2)); // encNumberOfReferenceFrames
RVCE_CS(enc->base.max_references + 1); // encMaxNumRefFrames
RVCE_CS(0x00000001); // encNumDefaultActiveRefL0
RVCE_CS(0x00000001); // encNumDefaultActiveRefL1
RVCE_CS(0x00000000); // encSliceMode
RVCE_CS(0x00000000); // encMaxSliceSize
RVCE_END();
}
 
/*
 * Emit the "motion estimation" block (command 0x04000007).
 *
 * Nothing is read from the encoder state here; every field is a fixed
 * constant.
 */
static void motion_estimation(struct rvce_encoder *enc)
{
RVCE_BEGIN(0x04000007); // motion estimation
RVCE_CS(0x00000001); // encIMEDecimationSearch
RVCE_CS(0x00000001); // motionEstHalfPixel
RVCE_CS(0x00000000); // motionEstQuarterPixel
RVCE_CS(0x00000000); // disableFavorPMVPoint
RVCE_CS(0x00000000); // forceZeroPointCenter
RVCE_CS(0x00000000); // LSMVert
RVCE_CS(0x00000010); // encSearchRangeX
RVCE_CS(0x00000010); // encSearchRangeY
RVCE_CS(0x00000010); // encSearch1RangeX
RVCE_CS(0x00000010); // encSearch1RangeY
RVCE_CS(0x00000000); // disable16x16Frame1
RVCE_CS(0x00000000); // disableSATD
RVCE_CS(0x00000000); // enableAMD
RVCE_CS(0x000000fe); // encDisableSubMode
RVCE_CS(0x00000000); // encIMESkipX
RVCE_CS(0x00000000); // encIMESkipY
RVCE_CS(0x00000000); // encEnImeOverwDisSubm
RVCE_CS(0x00000000); // encImeOverwDisSubmNo
RVCE_CS(0x00000001); // encIME2SearchRangeX
RVCE_CS(0x00000001); // encIME2SearchRangeY
RVCE_CS(0x00000000); // parallelModeSpeedupEnable
RVCE_CS(0x00000000); // fme0_encDisableSubMode
RVCE_CS(0x00000000); // fme1_encDisableSubMode
RVCE_CS(0x00000000); // imeSWSpeedupEnable
RVCE_END();
}
 
/*
 * Emit the "rdo" block (command 0x04000008); all seventeen fields are
 * written as zero.
 */
static void rdo(struct rvce_encoder *enc)
{
RVCE_BEGIN(0x04000008); // rdo
RVCE_CS(0x00000000); // encDisableTbePredIFrame
RVCE_CS(0x00000000); // encDisableTbePredPFrame
RVCE_CS(0x00000000); // useFmeInterpolY
RVCE_CS(0x00000000); // useFmeInterpolUV
RVCE_CS(0x00000000); // useFmeIntrapolY
RVCE_CS(0x00000000); // useFmeIntrapolUV
RVCE_CS(0x00000000); // useFmeInterpolY_1
RVCE_CS(0x00000000); // useFmeInterpolUV_1
RVCE_CS(0x00000000); // useFmeIntrapolY_1
RVCE_CS(0x00000000); // useFmeIntrapolUV_1
RVCE_CS(0x00000000); // enc16x16CostAdj
RVCE_CS(0x00000000); // encSkipCostAdj
RVCE_CS(0x00000000); // encForce16x16skip
RVCE_CS(0x00000000); // encDisableThresholdCalcA
RVCE_CS(0x00000000); // encLumaCoeffCost
RVCE_CS(0x00000000); // encLumaMBCoeffCost
RVCE_CS(0x00000000); // encChromaCoeffCost
RVCE_END();
}
 
/*
 * Emit the "vui" block (command 0x04000009).
 *
 * Only the timing info depends on encoder state: numUnitsInTick is
 * frame_rate_den and timeScale is frame_rate_num * 2, both taken from
 * enc->pic.rate_ctrl. Every other field is a fixed constant.
 */
static void vui(struct rvce_encoder *enc)
{
int i;

RVCE_BEGIN(0x04000009); // vui
RVCE_CS(0x00000000); //aspectRatioInfoPresentFlag
RVCE_CS(0x00000000); //aspectRatioInfo.aspectRatioIdc
RVCE_CS(0x00000000); //aspectRatioInfo.sarWidth
RVCE_CS(0x00000000); //aspectRatioInfo.sarHeight
RVCE_CS(0x00000000); //overscanInfoPresentFlag
RVCE_CS(0x00000000); //overScanInfo.overscanAppropFlag
RVCE_CS(0x00000000); //videoSignalTypePresentFlag
RVCE_CS(0x00000005); //videoSignalTypeInfo.videoFormat
RVCE_CS(0x00000000); //videoSignalTypeInfo.videoFullRangeFlag
RVCE_CS(0x00000000); //videoSignalTypeInfo.colorDescriptionPresentFlag
RVCE_CS(0x00000002); //videoSignalTypeInfo.colorPrim
RVCE_CS(0x00000002); //videoSignalTypeInfo.transferChar
RVCE_CS(0x00000002); //videoSignalTypeInfo.matrixCoef
RVCE_CS(0x00000000); //chromaLocInfoPresentFlag
RVCE_CS(0x00000000); //chromaLocInfo.chromaLocTop
RVCE_CS(0x00000000); //chromaLocInfo.chromaLocBottom
RVCE_CS(0x00000001); //timingInfoPresentFlag
RVCE_CS(enc->pic.rate_ctrl.frame_rate_den); //timingInfo.numUnitsInTick
RVCE_CS(enc->pic.rate_ctrl.frame_rate_num * 2); //timingInfo.timeScale;
RVCE_CS(0x00000001); //timingInfo.fixedFrameRateFlag
RVCE_CS(0x00000000); //nalHRDParametersPresentFlag
RVCE_CS(0x00000000); //hrdParam.cpbCntMinus1
RVCE_CS(0x00000004); //hrdParam.bitRateScale
RVCE_CS(0x00000006); //hrdParam.cpbSizeScale
// 32 zeroed (bitRateValueMinus, cpbSizeValueMinus, cbrFlag) triples
for (i = 0; i < 32; i++) {
RVCE_CS(0x00000000); //hrdParam.bitRateValueMinus
RVCE_CS(0x00000000); //hrdParam.cpbSizeValueMinus
RVCE_CS(0x00000000); //hrdParam.cbrFlag
}
RVCE_CS(0x00000017); //hrdParam.initialCpbRemovalDelayLengthMinus1
RVCE_CS(0x00000017); //hrdParam.cpbRemovalDelayLengthMinus1
RVCE_CS(0x00000017); //hrdParam.dpbOutputDelayLengthMinus1
RVCE_CS(0x00000018); //hrdParam.timeOffsetLength
RVCE_CS(0x00000000); //lowDelayHRDFlag
RVCE_CS(0x00000000); //picStructPresentFlag
RVCE_CS(0x00000000); //bitstreamRestrictionPresentFlag
RVCE_CS(0x00000001); //bitstreamRestrictions.motionVectorsOverPicBoundariesFlag
RVCE_CS(0x00000002); //bitstreamRestrictions.maxBytesPerPicDenom
RVCE_CS(0x00000001); //bitstreamRestrictions.maxBitsPerMbDenom
RVCE_CS(0x00000010); //bitstreamRestrictions.log2MaxMvLengthHori
RVCE_CS(0x00000010); //bitstreamRestrictions.log2MaxMvLengthVert
RVCE_CS(0x00000003); //bitstreamRestrictions.numReorderFrames
RVCE_CS(0x00000003); //bitstreamRestrictions.maxDecFrameBuffering
RVCE_END();
}
 
/*
 * Emit the commands for encoding one picture: a task info block
 * (operation 3), the "context buffer" block (0x05000001), the "video
 * bitstream buffer" block (0x05000004) and the "encode" block (0x03000001).
 *
 * Reference picture L0[0] is filled from l0_slot() for P and B pictures and
 * L1[0] from l1_slot() for B pictures; otherwise the entry is zeroed with
 * both offsets set to 0xffffffff. L0[1] is always written in that empty
 * form. The reconstructed picture offsets come from current_slot().
 */
static void encode(struct rvce_encoder *enc)
{
int i;
unsigned luma_offset, chroma_offset;

task_info(enc, 0x00000003);

RVCE_BEGIN(0x05000001); // context buffer
RVCE_READWRITE(enc->cpb.res->cs_buf, enc->cpb.res->domains); // encodeContextAddressHi
RVCE_CS(0x00000000); // encodeContextAddressLo
RVCE_END();

RVCE_BEGIN(0x05000004); // video bitstream buffer
RVCE_WRITE(enc->bs_handle, RADEON_DOMAIN_GTT); // videoBitstreamRingAddressHi
RVCE_CS(0x00000000); // videoBitstreamRingAddressLo
RVCE_CS(enc->bs_size); // videoBitstreamRingSize
RVCE_END();

RVCE_BEGIN(0x03000001); // encode
RVCE_CS(0x00000000); // insertHeaders
RVCE_CS(0x00000000); // pictureStructure
RVCE_CS(enc->bs_size); // allowedMaxBitstreamSize
RVCE_CS(0x00000000); // forceRefreshMap
RVCE_CS(0x00000000); // insertAUD
RVCE_CS(0x00000000); // endOfSequence
RVCE_CS(0x00000000); // endOfStream
RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM); // inputPictureLumaAddressHi
RVCE_CS(enc->luma->level[0].offset); // inputPictureLumaAddressLo
RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM); // inputPictureChromaAddressHi
RVCE_CS(enc->chroma->level[0].offset); // inputPictureChromaAddressLo
RVCE_CS(align(enc->luma->npix_y, 16)); // encInputFrameYPitch
RVCE_CS(enc->luma->level[0].pitch_bytes); // encInputPicLumaPitch
RVCE_CS(enc->chroma->level[0].pitch_bytes); // encInputPicChromaPitch
RVCE_CS(0x00000000); // encInputPic(Addr|Array)Mode
RVCE_CS(0x00000000); // encInputPicTileConfig
RVCE_CS(enc->pic.picture_type); // encPicType
RVCE_CS(enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_IDR); // encIdrFlag
RVCE_CS(0x00000000); // encIdrPicId
RVCE_CS(0x00000000); // encMGSKeyPic
RVCE_CS(!enc->pic.not_referenced); // encReferenceFlag
RVCE_CS(0x00000000); // encTemporalLayerIndex
RVCE_CS(0x00000000); // num_ref_idx_active_override_flag
RVCE_CS(0x00000000); // num_ref_idx_l0_active_minus1
RVCE_CS(0x00000000); // num_ref_idx_l1_active_minus1

// i temporarily holds frame_num - ref_idx_l0; for a P picture with a
// difference above 1 the first modification entry is (op 1, difference - 1)
i = enc->pic.frame_num - enc->pic.ref_idx_l0;
if (i > 1 && enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_P) {
RVCE_CS(0x00000001); // encRefListModificationOp
RVCE_CS(i - 1); // encRefListModificationNum
} else {
RVCE_CS(0x00000000); // encRefListModificationOp
RVCE_CS(0x00000000); // encRefListModificationNum
}

// the other three ref list modification entries are always empty
for (i = 0; i < 3; ++i) {
RVCE_CS(0x00000000); // encRefListModificationOp
RVCE_CS(0x00000000); // encRefListModificationNum
}
// four empty decoded picture marking entries
for (i = 0; i < 4; ++i) {
RVCE_CS(0x00000000); // encDecodedPictureMarkingOp
RVCE_CS(0x00000000); // encDecodedPictureMarkingNum
RVCE_CS(0x00000000); // encDecodedPictureMarkingIdx
RVCE_CS(0x00000000); // encDecodedRefBasePictureMarkingOp
RVCE_CS(0x00000000); // encDecodedRefBasePictureMarkingNum
}

// encReferencePictureL0[0]
RVCE_CS(0x00000000); // pictureStructure
if(enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_P ||
enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_B) {
struct rvce_cpb_slot *l0 = l0_slot(enc);
frame_offset(enc, l0, &luma_offset, &chroma_offset);
RVCE_CS(l0->picture_type); // encPicType
RVCE_CS(l0->frame_num); // frameNumber
RVCE_CS(l0->pic_order_cnt); // pictureOrderCount
RVCE_CS(luma_offset); // lumaOffset
RVCE_CS(chroma_offset); // chromaOffset
} else {
RVCE_CS(0x00000000); // encPicType
RVCE_CS(0x00000000); // frameNumber
RVCE_CS(0x00000000); // pictureOrderCount
RVCE_CS(0xffffffff); // lumaOffset
RVCE_CS(0xffffffff); // chromaOffset
}

// encReferencePictureL0[1]
RVCE_CS(0x00000000); // pictureStructure
RVCE_CS(0x00000000); // encPicType
RVCE_CS(0x00000000); // frameNumber
RVCE_CS(0x00000000); // pictureOrderCount
RVCE_CS(0xffffffff); // lumaOffset
RVCE_CS(0xffffffff); // chromaOffset

// encReferencePictureL1[0]
RVCE_CS(0x00000000); // pictureStructure
if(enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_B) {
struct rvce_cpb_slot *l1 = l1_slot(enc);
frame_offset(enc, l1, &luma_offset, &chroma_offset);
RVCE_CS(l1->picture_type); // encPicType
RVCE_CS(l1->frame_num); // frameNumber
RVCE_CS(l1->pic_order_cnt); // pictureOrderCount
RVCE_CS(luma_offset); // lumaOffset
RVCE_CS(chroma_offset); // chromaOffset
} else {
RVCE_CS(0x00000000); // encPicType
RVCE_CS(0x00000000); // frameNumber
RVCE_CS(0x00000000); // pictureOrderCount
RVCE_CS(0xffffffff); // lumaOffset
RVCE_CS(0xffffffff); // chromaOffset
}

// the reconstructed picture goes to the slot returned by current_slot()
frame_offset(enc, current_slot(enc), &luma_offset, &chroma_offset);
RVCE_CS(luma_offset); // encReconstructedLumaOffset
RVCE_CS(chroma_offset); // encReconstructedChromaOffset
RVCE_CS(0x00000000); // encColocBufferOffset
RVCE_CS(0x00000000); // encReconstructedRefBasePictureLumaOffset
RVCE_CS(0x00000000); // encReconstructedRefBasePictureChromaOffset
RVCE_CS(0x00000000); // encReferenceRefBasePictureLumaOffset
RVCE_CS(0x00000000); // encReferenceRefBasePictureChromaOffset
RVCE_CS(0x00000000); // pictureCount
RVCE_CS(enc->pic.frame_num); // frameNumber
RVCE_CS(enc->pic.pic_order_cnt); // pictureOrderCount
RVCE_CS(0x00000000); // numIPicRemainInRCGOP
RVCE_CS(0x00000000); // numPPicRemainInRCGOP
RVCE_CS(0x00000000); // numBPicRemainInRCGOP
RVCE_CS(0x00000000); // numIRPicRemainInRCGOP
RVCE_CS(0x00000000); // enableIntraRefresh
RVCE_END();
}
 
/*
 * Emit a task info block (operation 1) followed by a "destroy" block
 * (command 0x02000001) that carries no payload.
 */
static void destroy(struct rvce_encoder *enc)
{
task_info(enc, 0x00000001);

RVCE_BEGIN(0x02000001); // destroy
RVCE_END();
}
 
/*
 * Install this file's static command emitters into the callback members of
 * the given encoder. Each member is assigned the function of the same name.
 */
void radeon_vce_40_2_2_init(struct rvce_encoder *enc)
{
	/* blocks that begin with a task info */
	enc->create = create;
	enc->encode = encode;
	enc->destroy = destroy;

	/* single-block emitters */
	enc->session = session;
	enc->feedback = feedback;
	enc->rate_control = rate_control;
	enc->config_extension = config_extension;
	enc->pic_control = pic_control;
	enc->motion_estimation = motion_estimation;
	enc->rdo = rdo;
	enc->vui = vui;
}