/************************************************************************** * * Copyright 2013 Advanced Micro Devices, Inc. * All Rights Reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the * "Software"), to deal in the Software without restriction, including * without limitation the rights to use, copy, modify, merge, publish, * distribute, sub license, and/or sell copies of the Software, and to * permit persons to whom the Software is furnished to do so, subject to * the following conditions: * * The above copyright notice and this permission notice (including the * next paragraph) shall be included in all copies or substantial portions * of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. * IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. * **************************************************************************/ #include "pipe/p_video_codec.h" #include "radeon_vce.h" #include "radeon_video.h" #include "si_pipe.h" #include "util/u_memory.h" #include "util/u_video.h" #include "vl/vl_video_buffer.h" #include static void session(struct rvce_encoder *enc) { RVCE_BEGIN(0x00000001); // session cmd RVCE_CS(enc->stream_handle); RVCE_END(); } static void task_info(struct rvce_encoder *enc, uint32_t op, uint32_t dep, uint32_t fb_idx, uint32_t ring_idx) { RVCE_BEGIN(0x00000002); // task info if (op == 0x3) { if (enc->task_info_idx) { uint32_t offs = enc->cs->current.cdw - enc->task_info_idx + 3; // Update offsetOfNextTaskInfo enc->cs->current.buf[enc->task_info_idx] = offs; } enc->task_info_idx = enc->cs->current.cdw; } RVCE_CS(0xffffffff); // offsetOfNextTaskInfo RVCE_CS(op); // taskOperation RVCE_CS(dep); // referencePictureDependency RVCE_CS(0x00000000); // collocateFlagDependency RVCE_CS(fb_idx); // feedbackIndex RVCE_CS(ring_idx); // videoBitstreamRingIndex RVCE_END(); } static void feedback(struct rvce_encoder *enc) { RVCE_BEGIN(0x05000005); // feedback buffer RVCE_WRITE(enc->fb->res->buf, enc->fb->res->domains, 0x0); // feedbackRingAddressHi/Lo RVCE_CS(0x00000001); // feedbackRingSize RVCE_END(); } static void create(struct rvce_encoder *enc) { enc->task_info(enc, 0x00000000, 0, 0, 0); RVCE_BEGIN(0x01000001); // create cmd RVCE_CS(0x00000000); // encUseCircularBuffer RVCE_CS(u_get_h264_profile_idc(enc->base.profile)); // encProfile RVCE_CS(enc->base.level); // encLevel RVCE_CS(0x00000000); // encPicStructRestriction RVCE_CS(enc->base.width); // encImageWidth RVCE_CS(enc->base.height); // encImageHeight RVCE_CS(enc->luma->u.legacy.level[0].nblk_x * enc->luma->bpe); // encRefPicLumaPitch RVCE_CS(enc->chroma->u.legacy.level[0].nblk_x * enc->chroma->bpe); // encRefPicChromaPitch RVCE_CS(align(enc->luma->u.legacy.level[0].nblk_y, 16) / 8); // encRefYHeightInQw RVCE_CS(0x00000000); // encRefPic(Addr|Array)Mode, encPicStructRestriction, disableRDO RVCE_END(); } static void rate_control(struct rvce_encoder *enc) { RVCE_BEGIN(0x04000005); // rate control RVCE_CS(enc->pic.rate_ctrl.rate_ctrl_method); // encRateControlMethod RVCE_CS(enc->pic.rate_ctrl.target_bitrate); // encRateControlTargetBitRate RVCE_CS(enc->pic.rate_ctrl.peak_bitrate); // encRateControlPeakBitRate RVCE_CS(enc->pic.rate_ctrl.frame_rate_num); // encRateControlFrameRateNum RVCE_CS(0x00000000); // encGOPSize RVCE_CS(enc->pic.quant_i_frames); // encQP_I RVCE_CS(enc->pic.quant_p_frames); // encQP_P RVCE_CS(enc->pic.quant_b_frames); // encQP_B RVCE_CS(enc->pic.rate_ctrl.vbv_buffer_size); // encVBVBufferSize RVCE_CS(enc->pic.rate_ctrl.frame_rate_den); // encRateControlFrameRateDen RVCE_CS(0x00000000); // encVBVBufferLevel RVCE_CS(0x00000000); // encMaxAUSize RVCE_CS(0x00000000); // encQPInitialMode RVCE_CS(enc->pic.rate_ctrl.target_bits_picture); // encTargetBitsPerPicture RVCE_CS(enc->pic.rate_ctrl.peak_bits_picture_integer); // encPeakBitsPerPictureInteger RVCE_CS(enc->pic.rate_ctrl.peak_bits_picture_fraction); // encPeakBitsPerPictureFractional RVCE_CS(0x00000000); // encMinQP RVCE_CS(0x00000033); // encMaxQP RVCE_CS(0x00000000); // encSkipFrameEnable RVCE_CS(0x00000000); // encFillerDataEnable RVCE_CS(0x00000000); // encEnforceHRD RVCE_CS(0x00000000); // encBPicsDeltaQP RVCE_CS(0x00000000); // encReferenceBPicsDeltaQP RVCE_CS(0x00000000); // encRateControlReInitDisable RVCE_END(); } static void config_extension(struct rvce_encoder *enc) { RVCE_BEGIN(0x04000001); // config extension RVCE_CS(0x00000003); // encEnablePerfLogging RVCE_END(); } static void pic_control(struct rvce_encoder *enc) { unsigned encNumMBsPerSlice; encNumMBsPerSlice = align(enc->base.width, 16) / 16; encNumMBsPerSlice *= align(enc->base.height, 16) / 16; RVCE_BEGIN(0x04000002); // pic control RVCE_CS(0x00000000); // encUseConstrainedIntraPred RVCE_CS(0x00000000); // encCABACEnable RVCE_CS(0x00000000); // encCABACIDC RVCE_CS(0x00000000); // encLoopFilterDisable RVCE_CS(0x00000000); // encLFBetaOffset RVCE_CS(0x00000000); // encLFAlphaC0Offset RVCE_CS(0x00000000); // encCropLeftOffset RVCE_CS((align(enc->base.width, 16) - enc->base.width) >> 1); // encCropRightOffset RVCE_CS(0x00000000); // encCropTopOffset RVCE_CS((align(enc->base.height, 16) - enc->base.height) >> 1); // encCropBottomOffset RVCE_CS(encNumMBsPerSlice); // encNumMBsPerSlice RVCE_CS(0x00000000); // encIntraRefreshNumMBsPerSlot RVCE_CS(0x00000000); // encForceIntraRefresh RVCE_CS(0x00000000); // encForceIMBPeriod RVCE_CS(0x00000000); // encPicOrderCntType RVCE_CS(0x00000000); // log2_max_pic_order_cnt_lsb_minus4 RVCE_CS(0x00000000); // encSPSID RVCE_CS(0x00000000); // encPPSID RVCE_CS(0x00000040); // encConstraintSetFlags RVCE_CS(MAX2(enc->base.max_references, 1) - 1); // encBPicPattern RVCE_CS(0x00000000); // weightPredModeBPicture RVCE_CS(MIN2(enc->base.max_references, 2)); // encNumberOfReferenceFrames RVCE_CS(enc->base.max_references + 1); // encMaxNumRefFrames RVCE_CS(0x00000001); // encNumDefaultActiveRefL0 RVCE_CS(0x00000001); // encNumDefaultActiveRefL1 RVCE_CS(0x00000000); // encSliceMode RVCE_CS(0x00000000); // encMaxSliceSize RVCE_END(); } static void motion_estimation(struct rvce_encoder *enc) { RVCE_BEGIN(0x04000007); // motion estimation RVCE_CS(0x00000001); // encIMEDecimationSearch RVCE_CS(0x00000001); // motionEstHalfPixel RVCE_CS(0x00000000); // motionEstQuarterPixel RVCE_CS(0x00000000); // disableFavorPMVPoint RVCE_CS(0x00000000); // forceZeroPointCenter RVCE_CS(0x00000000); // LSMVert RVCE_CS(0x00000010); // encSearchRangeX RVCE_CS(0x00000010); // encSearchRangeY RVCE_CS(0x00000010); // encSearch1RangeX RVCE_CS(0x00000010); // encSearch1RangeY RVCE_CS(0x00000000); // disable16x16Frame1 RVCE_CS(0x00000000); // disableSATD RVCE_CS(0x00000000); // enableAMD RVCE_CS(0x000000fe); // encDisableSubMode RVCE_CS(0x00000000); // encIMESkipX RVCE_CS(0x00000000); // encIMESkipY RVCE_CS(0x00000000); // encEnImeOverwDisSubm RVCE_CS(0x00000000); // encImeOverwDisSubmNo RVCE_CS(0x00000001); // encIME2SearchRangeX RVCE_CS(0x00000001); // encIME2SearchRangeY RVCE_CS(0x00000000); // parallelModeSpeedupEnable RVCE_CS(0x00000000); // fme0_encDisableSubMode RVCE_CS(0x00000000); // fme1_encDisableSubMode RVCE_CS(0x00000000); // imeSWSpeedupEnable RVCE_END(); } static void rdo(struct rvce_encoder *enc) { RVCE_BEGIN(0x04000008); // rdo RVCE_CS(0x00000000); // encDisableTbePredIFrame RVCE_CS(0x00000000); // encDisableTbePredPFrame RVCE_CS(0x00000000); // useFmeInterpolY RVCE_CS(0x00000000); // useFmeInterpolUV RVCE_CS(0x00000000); // useFmeIntrapolY RVCE_CS(0x00000000); // useFmeIntrapolUV RVCE_CS(0x00000000); // useFmeInterpolY_1 RVCE_CS(0x00000000); // useFmeInterpolUV_1 RVCE_CS(0x00000000); // useFmeIntrapolY_1 RVCE_CS(0x00000000); // useFmeIntrapolUV_1 RVCE_CS(0x00000000); // enc16x16CostAdj RVCE_CS(0x00000000); // encSkipCostAdj RVCE_CS(0x00000000); // encForce16x16skip RVCE_CS(0x00000000); // encDisableThresholdCalcA RVCE_CS(0x00000000); // encLumaCoeffCost RVCE_CS(0x00000000); // encLumaMBCoeffCost RVCE_CS(0x00000000); // encChromaCoeffCost RVCE_END(); } static void vui(struct rvce_encoder *enc) { int i; if (!enc->pic.rate_ctrl.frame_rate_num) return; RVCE_BEGIN(0x04000009); // vui RVCE_CS(0x00000000); // aspectRatioInfoPresentFlag RVCE_CS(0x00000000); // aspectRatioInfo.aspectRatioIdc RVCE_CS(0x00000000); // aspectRatioInfo.sarWidth RVCE_CS(0x00000000); // aspectRatioInfo.sarHeight RVCE_CS(0x00000000); // overscanInfoPresentFlag RVCE_CS(0x00000000); // overScanInfo.overscanAppropFlag RVCE_CS(0x00000000); // videoSignalTypePresentFlag RVCE_CS(0x00000005); // videoSignalTypeInfo.videoFormat RVCE_CS(0x00000000); // videoSignalTypeInfo.videoFullRangeFlag RVCE_CS(0x00000000); // videoSignalTypeInfo.colorDescriptionPresentFlag RVCE_CS(0x00000002); // videoSignalTypeInfo.colorPrim RVCE_CS(0x00000002); // videoSignalTypeInfo.transferChar RVCE_CS(0x00000002); // videoSignalTypeInfo.matrixCoef RVCE_CS(0x00000000); // chromaLocInfoPresentFlag RVCE_CS(0x00000000); // chromaLocInfo.chromaLocTop RVCE_CS(0x00000000); // chromaLocInfo.chromaLocBottom RVCE_CS(0x00000001); // timingInfoPresentFlag RVCE_CS(enc->pic.rate_ctrl.frame_rate_den); // timingInfo.numUnitsInTick RVCE_CS(enc->pic.rate_ctrl.frame_rate_num * 2); // timingInfo.timeScale; RVCE_CS(0x00000001); // timingInfo.fixedFrameRateFlag RVCE_CS(0x00000000); // nalHRDParametersPresentFlag RVCE_CS(0x00000000); // hrdParam.cpbCntMinus1 RVCE_CS(0x00000004); // hrdParam.bitRateScale RVCE_CS(0x00000006); // hrdParam.cpbSizeScale for (i = 0; i < 32; i++) { RVCE_CS(0x00000000); // hrdParam.bitRateValueMinus RVCE_CS(0x00000000); // hrdParam.cpbSizeValueMinus RVCE_CS(0x00000000); // hrdParam.cbrFlag } RVCE_CS(0x00000017); // hrdParam.initialCpbRemovalDelayLengthMinus1 RVCE_CS(0x00000017); // hrdParam.cpbRemovalDelayLengthMinus1 RVCE_CS(0x00000017); // hrdParam.dpbOutputDelayLengthMinus1 RVCE_CS(0x00000018); // hrdParam.timeOffsetLength RVCE_CS(0x00000000); // lowDelayHRDFlag RVCE_CS(0x00000000); // picStructPresentFlag RVCE_CS(0x00000000); // bitstreamRestrictionPresentFlag RVCE_CS(0x00000001); // bitstreamRestrictions.motionVectorsOverPicBoundariesFlag RVCE_CS(0x00000002); // bitstreamRestrictions.maxBytesPerPicDenom RVCE_CS(0x00000001); // bitstreamRestrictions.maxBitsPerMbDenom RVCE_CS(0x00000010); // bitstreamRestrictions.log2MaxMvLengthHori RVCE_CS(0x00000010); // bitstreamRestrictions.log2MaxMvLengthVert RVCE_CS(0x00000003); // bitstreamRestrictions.numReorderFrames RVCE_CS(0x00000003); // bitstreamRestrictions.maxDecFrameBuffering RVCE_END(); } static void config(struct rvce_encoder *enc) { enc->task_info(enc, 0x00000002, 0, 0xffffffff, 0); enc->rate_control(enc); enc->config_extension(enc); enc->motion_estimation(enc); enc->rdo(enc); if (enc->use_vui) enc->vui(enc); enc->pic_control(enc); } static void encode(struct rvce_encoder *enc) { signed luma_offset, chroma_offset; int i; enc->task_info(enc, 0x00000003, 0, 0, 0); RVCE_BEGIN(0x05000001); // context buffer RVCE_READWRITE(enc->cpb.res->buf, enc->cpb.res->domains, 0x0); // encodeContextAddressHi/Lo RVCE_END(); RVCE_BEGIN(0x05000004); // video bitstream buffer RVCE_WRITE(enc->bs_handle, RADEON_DOMAIN_GTT, 0x0); // videoBitstreamRingAddressHi/Lo RVCE_CS(enc->bs_size); // videoBitstreamRingSize RVCE_END(); RVCE_BEGIN(0x03000001); // encode RVCE_CS(0x00000000); // insertHeaders RVCE_CS(0x00000000); // pictureStructure RVCE_CS(enc->bs_size); // allowedMaxBitstreamSize RVCE_CS(0x00000000); // forceRefreshMap RVCE_CS(0x00000000); // insertAUD RVCE_CS(0x00000000); // endOfSequence RVCE_CS(0x00000000); // endOfStream RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM, enc->luma->u.legacy.level[0].offset); // inputPictureLumaAddressHi/Lo RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM, enc->chroma->u.legacy.level[0].offset); // inputPictureChromaAddressHi/Lo RVCE_CS(align(enc->luma->u.legacy.level[0].nblk_y, 16)); // encInputFrameYPitch RVCE_CS(enc->luma->u.legacy.level[0].nblk_x * enc->luma->bpe); // encInputPicLumaPitch RVCE_CS(enc->chroma->u.legacy.level[0].nblk_x * enc->chroma->bpe); // encInputPicChromaPitch RVCE_CS(0x00000000); // encInputPic(Addr|Array)Mode RVCE_CS(0x00000000); // encInputPicTileConfig RVCE_CS(enc->pic.picture_type); // encPicType RVCE_CS(enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_IDR); // encIdrFlag RVCE_CS(0x00000000); // encIdrPicId RVCE_CS(0x00000000); // encMGSKeyPic RVCE_CS(!enc->pic.not_referenced); // encReferenceFlag RVCE_CS(0x00000000); // encTemporalLayerIndex RVCE_CS(0x00000000); // num_ref_idx_active_override_flag RVCE_CS(0x00000000); // num_ref_idx_l0_active_minus1 RVCE_CS(0x00000000); // num_ref_idx_l1_active_minus1 i = enc->pic.frame_num - enc->pic.ref_idx_l0; if (i > 1 && enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_P) { RVCE_CS(0x00000001); // encRefListModificationOp RVCE_CS(i - 1); // encRefListModificationNum } else { RVCE_CS(0x00000000); // encRefListModificationOp RVCE_CS(0x00000000); // encRefListModificationNum } for (i = 0; i < 3; ++i) { RVCE_CS(0x00000000); // encRefListModificationOp RVCE_CS(0x00000000); // encRefListModificationNum } for (i = 0; i < 4; ++i) { RVCE_CS(0x00000000); // encDecodedPictureMarkingOp RVCE_CS(0x00000000); // encDecodedPictureMarkingNum RVCE_CS(0x00000000); // encDecodedPictureMarkingIdx RVCE_CS(0x00000000); // encDecodedRefBasePictureMarkingOp RVCE_CS(0x00000000); // encDecodedRefBasePictureMarkingNum } // encReferencePictureL0[0] RVCE_CS(0x00000000); // pictureStructure if (enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_P || enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_B) { struct rvce_cpb_slot *l0 = si_l0_slot(enc); si_vce_frame_offset(enc, l0, &luma_offset, &chroma_offset); RVCE_CS(l0->picture_type); // encPicType RVCE_CS(l0->frame_num); // frameNumber RVCE_CS(l0->pic_order_cnt); // pictureOrderCount RVCE_CS(luma_offset); // lumaOffset RVCE_CS(chroma_offset); // chromaOffset } else { RVCE_CS(0x00000000); // encPicType RVCE_CS(0x00000000); // frameNumber RVCE_CS(0x00000000); // pictureOrderCount RVCE_CS(0xffffffff); // lumaOffset RVCE_CS(0xffffffff); // chromaOffset } // encReferencePictureL0[1] RVCE_CS(0x00000000); // pictureStructure RVCE_CS(0x00000000); // encPicType RVCE_CS(0x00000000); // frameNumber RVCE_CS(0x00000000); // pictureOrderCount RVCE_CS(0xffffffff); // lumaOffset RVCE_CS(0xffffffff); // chromaOffset // encReferencePictureL1[0] RVCE_CS(0x00000000); // pictureStructure if (enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_B) { struct rvce_cpb_slot *l1 = si_l1_slot(enc); si_vce_frame_offset(enc, l1, &luma_offset, &chroma_offset); RVCE_CS(l1->picture_type); // encPicType RVCE_CS(l1->frame_num); // frameNumber RVCE_CS(l1->pic_order_cnt); // pictureOrderCount RVCE_CS(luma_offset); // lumaOffset RVCE_CS(chroma_offset); // chromaOffset } else { RVCE_CS(0x00000000); // encPicType RVCE_CS(0x00000000); // frameNumber RVCE_CS(0x00000000); // pictureOrderCount RVCE_CS(0xffffffff); // lumaOffset RVCE_CS(0xffffffff); // chromaOffset } si_vce_frame_offset(enc, si_current_slot(enc), &luma_offset, &chroma_offset); RVCE_CS(luma_offset); // encReconstructedLumaOffset RVCE_CS(chroma_offset); // encReconstructedChromaOffset RVCE_CS(0x00000000); // encColocBufferOffset RVCE_CS(0x00000000); // encReconstructedRefBasePictureLumaOffset RVCE_CS(0x00000000); // encReconstructedRefBasePictureChromaOffset RVCE_CS(0x00000000); // encReferenceRefBasePictureLumaOffset RVCE_CS(0x00000000); // encReferenceRefBasePictureChromaOffset RVCE_CS(0x00000000); // pictureCount RVCE_CS(enc->pic.frame_num); // frameNumber RVCE_CS(enc->pic.pic_order_cnt); // pictureOrderCount RVCE_CS(0x00000000); // numIPicRemainInRCGOP RVCE_CS(0x00000000); // numPPicRemainInRCGOP RVCE_CS(0x00000000); // numBPicRemainInRCGOP RVCE_CS(0x00000000); // numIRPicRemainInRCGOP RVCE_CS(0x00000000); // enableIntraRefresh RVCE_END(); } static void destroy(struct rvce_encoder *enc) { enc->task_info(enc, 0x00000001, 0, 0, 0); feedback(enc); RVCE_BEGIN(0x02000001); // destroy RVCE_END(); } void si_vce_40_2_2_get_param(struct rvce_encoder *enc, struct pipe_h264_enc_picture_desc *pic) { } void si_vce_40_2_2_init(struct rvce_encoder *enc) { enc->session = session; enc->task_info = task_info; enc->create = create; enc->feedback = feedback; enc->rate_control = rate_control; enc->config_extension = config_extension; enc->pic_control = pic_control; enc->motion_estimation = motion_estimation; enc->rdo = rdo; enc->vui = vui; enc->config = config; enc->encode = encode; enc->destroy = destroy; enc->si_get_pic_param = si_vce_40_2_2_get_param; }