gallium/radeon: remove radeon_surf_level::pitch_bytes
[mesa.git] / src / gallium / drivers / radeon / radeon_vce_40_2_2.c
index 33a58f3e8e90ba38c97e78c6c6538beb6726aa4f..358c0fcf9dfc7f15bbccbafde665215739112366 100644 (file)
 
 #include "vl/vl_video_buffer.h"
 
-#include "../../winsys/radeon/drm/radeon_winsys.h"
+#include "r600_pipe_common.h"
 #include "radeon_video.h"
 #include "radeon_vce.h"
 
+static const unsigned profiles[7] = { 66, 77, 88, 100, 110, 122, 244 }; // encProfile lookup, indexed by (profile - PIPE_VIDEO_PROFILE_MPEG4_AVC_BASELINE); values look like H.264 profile_idc numbers - confirm enum order
+
 static void session(struct rvce_encoder *enc)
 {
        RVCE_BEGIN(0x00000001); // session cmd
@@ -51,41 +53,50 @@ static void session(struct rvce_encoder *enc)
        RVCE_END();
 }
 
-static void task_info(struct rvce_encoder *enc, uint32_t taskOperation)
+static void task_info(struct rvce_encoder *enc, uint32_t op,
+                     uint32_t dep, uint32_t fb_idx, uint32_t ring_idx)
 {
        /*
         * Emits a "task info" package: a 0xffffffff placeholder for
         * offsetOfNextTaskInfo, then op, dep, a zero collocateFlagDependency,
         * fb_idx and ring_idx.
         *
         * For op 0x3 only: if an earlier task info position was recorded in
         * enc->task_info_idx, that command-stream dword is overwritten with
         * the distance to the current position, and the current position is
         * then recorded for the next call.
         */
        RVCE_BEGIN(0x00000002); // task info
+       if (op == 0x3) {
+               if (enc->task_info_idx) {
+                       uint32_t offs = enc->cs->current.cdw - enc->task_info_idx + 3; // NOTE(review): the +3 is not explained here - presumably package header dwords, confirm against RVCE_BEGIN
+                       // Update offsetOfNextTaskInfo of the previously recorded task info
+                       enc->cs->current.buf[enc->task_info_idx] = offs;
+               }
+               enc->task_info_idx = enc->cs->current.cdw; // presumably the slot the placeholder below is written to - confirm RVCE_CS semantics
+       }
        RVCE_CS(0xffffffff); // offsetOfNextTaskInfo
-       RVCE_CS(taskOperation); // taskOperation
-       RVCE_CS(0x00000000); // referencePictureDependency
+       RVCE_CS(op); // taskOperation
+       RVCE_CS(dep); // referencePictureDependency
        RVCE_CS(0x00000000); // collocateFlagDependency
-       RVCE_CS(0x00000000); // feedbackIndex
-       RVCE_CS(0x00000000); // videoBitstreamRingIndex
+       RVCE_CS(fb_idx); // feedbackIndex
+       RVCE_CS(ring_idx); // videoBitstreamRingIndex
        RVCE_END();
 }
 
 /*
  * Emits the feedback buffer package: the address of enc->fb's buffer
  * (offset 0x0) followed by a feedback ring size of 1.
  */
 static void feedback(struct rvce_encoder *enc)
 {
        RVCE_BEGIN(0x05000005); // feedback buffer
-       RVCE_WRITE(enc->fb->cs_handle, enc->fb->domain); // feedbackRingAddressHi
-       RVCE_CS(0x00000000); // feedbackRingAddressLo
+       RVCE_WRITE(enc->fb->res->buf, enc->fb->res->domains, 0x0); // feedbackRingAddressHi/Lo (the third argument replaces the separate Lo dword)
        RVCE_CS(0x00000001); // feedbackRingSize
        RVCE_END();
 }
 
 /*
  * Emits a task info with operation 0 followed by the "create" package,
  * which carries the profile, level, picture size and reference picture
  * pitches taken from enc->base and the luma/chroma surfaces.
  */
 static void create(struct rvce_encoder *enc)
 {
-       task_info(enc, 0x00000000);
+       enc->task_info(enc, 0x00000000, 0, 0, 0); // now dispatched through the per-encoder function pointer
 
        RVCE_BEGIN(0x01000001); // create cmd
        RVCE_CS(0x00000000); // encUseCircularBuffer
-       RVCE_CS(0x00000041); // encProfile
-       RVCE_CS(0x0000000a); // encLevel
+       RVCE_CS(profiles[enc->base.profile -
+               PIPE_VIDEO_PROFILE_MPEG4_AVC_BASELINE]); // encProfile; NOTE(review): index is not range-checked against the 7-entry table
+       RVCE_CS(enc->base.level); // encLevel
        RVCE_CS(0x00000000); // encPicStructRestriction
        RVCE_CS(enc->base.width); // encImageWidth
        RVCE_CS(enc->base.height); // encImageHeight
-       RVCE_CS(enc->luma->level[0].pitch_bytes); // encRefPicLumaPitch
-       RVCE_CS(enc->chroma->level[0].pitch_bytes); // encRefPicChromaPitch
-       RVCE_CS(align(enc->luma->npix_y, 16) / 8); // encRefYHeightInQw
+       RVCE_CS(enc->luma->level[0].nblk_x * enc->luma->bpe); // encRefPicLumaPitch (computed in place of the removed pitch_bytes)
+       RVCE_CS(enc->chroma->level[0].nblk_x * enc->chroma->bpe); // encRefPicChromaPitch (computed in place of the removed pitch_bytes)
+       RVCE_CS(align(enc->luma->level[0].nblk_y, 16) / 8); // encRefYHeightInQw
        RVCE_CS(0x00000000); // encRefPic(Addr|Array)Mode, encPicStructRestriction, disableRDO
        RVCE_END();
 }
@@ -154,12 +165,12 @@ static void pic_control(struct rvce_encoder *enc)
        RVCE_CS(0x00000000); // encSPSID
        RVCE_CS(0x00000000); // encPPSID
        RVCE_CS(0x00000040); // encConstraintSetFlags
-       RVCE_CS(0x00000000); // encBPicPattern
+       RVCE_CS(MAX2(enc->base.max_references, 1) - 1); // encBPicPattern
        RVCE_CS(0x00000000); // weightPredModeBPicture
        RVCE_CS(MIN2(enc->base.max_references, 2)); // encNumberOfReferenceFrames
        RVCE_CS(enc->base.max_references + 1); // encMaxNumRefFrames
-       RVCE_CS(0x00000000); // encNumDefaultActiveRefL0
-       RVCE_CS(0x00000000); // encNumDefaultActiveRefL1
+       RVCE_CS(0x00000001); // encNumDefaultActiveRefL0
+       RVCE_CS(0x00000001); // encNumDefaultActiveRefL1
        RVCE_CS(0x00000000); // encSliceMode
        RVCE_CS(0x00000000); // encMaxSliceSize
        RVCE_END();
@@ -218,32 +229,85 @@ static void rdo(struct rvce_encoder *enc)
        RVCE_END();
 }
 
-static void frame_offset(struct rvce_encoder *enc, unsigned frame_num,
-                        unsigned *luma_offset, unsigned *chroma_offset)
+static void vui(struct rvce_encoder *enc)
 {
        /*
         * New in this change: emits the "vui" package. Nothing is emitted
         * when enc->pic.rate_ctrl.frame_rate_num is zero. Apart from the two
         * timing fields taken from enc->pic.rate_ctrl, every field is a
         * hard-coded constant.
         * (The removed lines below are the old local frame_offset() helper;
         * callers in this file now use rvce_frame_offset() instead.)
         */
-       unsigned pitch = align(enc->luma->level[0].pitch_bytes, 128);
-       unsigned vpitch = align(enc->luma->npix_y, 16);
-       unsigned fsize = pitch * (vpitch + vpitch / 2);
+       int i;
+
+       if (!enc->pic.rate_ctrl.frame_rate_num) // no frame rate supplied: skip the package entirely
+               return;
 
-       *luma_offset = (frame_num % RVCE_NUM_CPB_FRAMES) * fsize;
-       *chroma_offset = *luma_offset + pitch * vpitch;
+       RVCE_BEGIN(0x04000009); // vui
+       RVCE_CS(0x00000000); //aspectRatioInfoPresentFlag
+       RVCE_CS(0x00000000); //aspectRatioInfo.aspectRatioIdc
+       RVCE_CS(0x00000000); //aspectRatioInfo.sarWidth
+       RVCE_CS(0x00000000); //aspectRatioInfo.sarHeight
+       RVCE_CS(0x00000000); //overscanInfoPresentFlag
+       RVCE_CS(0x00000000); //overScanInfo.overscanAppropFlag
+       RVCE_CS(0x00000000); //videoSignalTypePresentFlag
+       RVCE_CS(0x00000005); //videoSignalTypeInfo.videoFormat
+       RVCE_CS(0x00000000); //videoSignalTypeInfo.videoFullRangeFlag
+       RVCE_CS(0x00000000); //videoSignalTypeInfo.colorDescriptionPresentFlag
+       RVCE_CS(0x00000002); //videoSignalTypeInfo.colorPrim
+       RVCE_CS(0x00000002); //videoSignalTypeInfo.transferChar
+       RVCE_CS(0x00000002); //videoSignalTypeInfo.matrixCoef
+       RVCE_CS(0x00000000); //chromaLocInfoPresentFlag
+       RVCE_CS(0x00000000); //chromaLocInfo.chromaLocTop
+       RVCE_CS(0x00000000); //chromaLocInfo.chromaLocBottom
+       RVCE_CS(0x00000001); //timingInfoPresentFlag
+       RVCE_CS(enc->pic.rate_ctrl.frame_rate_den); //timingInfo.numUnitsInTick
+       RVCE_CS(enc->pic.rate_ctrl.frame_rate_num * 2); //timingInfo.timeScale (x2: presumably because H.264 VUI timing counts two ticks per frame - confirm)
+       RVCE_CS(0x00000001); //timingInfo.fixedFrameRateFlag
+       RVCE_CS(0x00000000); //nalHRDParametersPresentFlag
+       RVCE_CS(0x00000000); //hrdParam.cpbCntMinus1
+       RVCE_CS(0x00000004); //hrdParam.bitRateScale
+       RVCE_CS(0x00000006); //hrdParam.cpbSizeScale
+       for (i = 0; i < 32; i++) { // 32 all-zero (bitRate, cpbSize, cbrFlag) triples
+               RVCE_CS(0x00000000); //hrdParam.bitRateValueMinus
+               RVCE_CS(0x00000000); //hrdParam.cpbSizeValueMinus
+               RVCE_CS(0x00000000); //hrdParam.cbrFlag
+       }
+       RVCE_CS(0x00000017); //hrdParam.initialCpbRemovalDelayLengthMinus1
+       RVCE_CS(0x00000017); //hrdParam.cpbRemovalDelayLengthMinus1
+       RVCE_CS(0x00000017); //hrdParam.dpbOutputDelayLengthMinus1
+       RVCE_CS(0x00000018); //hrdParam.timeOffsetLength
+       RVCE_CS(0x00000000); //lowDelayHRDFlag
+       RVCE_CS(0x00000000); //picStructPresentFlag
+       RVCE_CS(0x00000000); //bitstreamRestrictionPresentFlag
+       RVCE_CS(0x00000001); //bitstreamRestrictions.motionVectorsOverPicBoundariesFlag
+       RVCE_CS(0x00000002); //bitstreamRestrictions.maxBytesPerPicDenom
+       RVCE_CS(0x00000001); //bitstreamRestrictions.maxBitsPerMbDenom
+       RVCE_CS(0x00000010); //bitstreamRestrictions.log2MaxMvLengthHori
+       RVCE_CS(0x00000010); //bitstreamRestrictions.log2MaxMvLengthVert
+       RVCE_CS(0x00000003); //bitstreamRestrictions.numReorderFrames
+       RVCE_CS(0x00000003); //bitstreamRestrictions.maxDecFrameBuffering
+       RVCE_END();
+}
+
+static void config(struct rvce_encoder *enc)
+{
        /*
         * Emits a task info with operation 2, then calls the encoder's
         * configuration hooks in a fixed order: rate control, config
         * extension, motion estimation, RDO, optionally VUI, and finally
         * picture control. All calls go through enc's function pointers.
         */
+       enc->task_info(enc, 0x00000002, 0, 0xffffffff, 0); // fb_idx is 0xffffffff for this task
+       enc->rate_control(enc);
+       enc->config_extension(enc);
+       enc->motion_estimation(enc);
+       enc->rdo(enc);
+       if (enc->use_vui) // the VUI package is only emitted when enabled on the encoder
+               enc->vui(enc);
+       enc->pic_control(enc);
 }
 
 static void encode(struct rvce_encoder *enc)
 {
+       signed luma_offset, chroma_offset;
        int i;
-       unsigned luma_offset, chroma_offset;
 
-       task_info(enc, 0x00000003);
+       enc->task_info(enc, 0x00000003, 0, 0, 0);
 
        RVCE_BEGIN(0x05000001); // context buffer
-       RVCE_READWRITE(enc->cpb.cs_handle, enc->cpb.domain); // encodeContextAddressHi
-       RVCE_CS(0x00000000); // encodeContextAddressLo
+       RVCE_READWRITE(enc->cpb.res->buf, enc->cpb.res->domains, 0x0); // encodeContextAddressHi/Lo
        RVCE_END();
 
        RVCE_BEGIN(0x05000004); // video bitstream buffer
-       RVCE_WRITE(enc->bs_handle, RADEON_DOMAIN_GTT); // videoBitstreamRingAddressHi
-       RVCE_CS(0x00000000); // videoBitstreamRingAddressLo
+       RVCE_WRITE(enc->bs_handle, RADEON_DOMAIN_GTT, 0x0); // videoBitstreamRingAddressHi/Lo
        RVCE_CS(enc->bs_size); // videoBitstreamRingSize
        RVCE_END();
 
@@ -255,25 +319,35 @@ static void encode(struct rvce_encoder *enc)
        RVCE_CS(0x00000000); // insertAUD
        RVCE_CS(0x00000000); // endOfSequence
        RVCE_CS(0x00000000); // endOfStream
-       RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM); // inputPictureLumaAddressHi
-       RVCE_CS(enc->luma->level[0].offset); // inputPictureLumaAddressLo
-       RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM); // inputPictureChromaAddressHi
-       RVCE_CS(enc->chroma->level[0].offset); // inputPictureChromaAddressLo
-       RVCE_CS(align(enc->luma->npix_y, 16)); // encInputFrameYPitch
-       RVCE_CS(enc->luma->level[0].pitch_bytes); // encInputPicLumaPitch
-       RVCE_CS(enc->chroma->level[0].pitch_bytes); // encInputPicChromaPitch
+       RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM,
+                 enc->luma->level[0].offset); // inputPictureLumaAddressHi/Lo
+       RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM,
+                 enc->chroma->level[0].offset); // inputPictureChromaAddressHi/Lo
+       RVCE_CS(align(enc->luma->level[0].nblk_y, 16)); // encInputFrameYPitch
+       RVCE_CS(enc->luma->level[0].nblk_x * enc->luma->bpe); // encInputPicLumaPitch
+       RVCE_CS(enc->chroma->level[0].nblk_x * enc->chroma->bpe); // encInputPicChromaPitch
        RVCE_CS(0x00000000); // encInputPic(Addr|Array)Mode
        RVCE_CS(0x00000000); // encInputPicTileConfig
        RVCE_CS(enc->pic.picture_type); // encPicType
-       RVCE_CS(enc->pic.picture_type == 3); // encIdrFlag
+       RVCE_CS(enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_IDR); // encIdrFlag
        RVCE_CS(0x00000000); // encIdrPicId
        RVCE_CS(0x00000000); // encMGSKeyPic
-       RVCE_CS(0x00000001); // encReferenceFlag
+       RVCE_CS(!enc->pic.not_referenced); // encReferenceFlag
        RVCE_CS(0x00000000); // encTemporalLayerIndex
        RVCE_CS(0x00000000); // num_ref_idx_active_override_flag
        RVCE_CS(0x00000000); // num_ref_idx_l0_active_minus1
        RVCE_CS(0x00000000); // num_ref_idx_l1_active_minus1
-       for (i = 0; i < 4; ++i) {
+
+       i = enc->pic.frame_num - enc->pic.ref_idx_l0;
+       if (i > 1 && enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_P) {
+               RVCE_CS(0x00000001); // encRefListModificationOp
+               RVCE_CS(i - 1);      // encRefListModificationNum
+       } else {
+               RVCE_CS(0x00000000); // encRefListModificationOp
+               RVCE_CS(0x00000000); // encRefListModificationNum
+       }
+
+       for (i = 0; i < 3; ++i) {
                RVCE_CS(0x00000000); // encRefListModificationOp
                RVCE_CS(0x00000000); // encRefListModificationNum
        }
@@ -281,40 +355,56 @@ static void encode(struct rvce_encoder *enc)
                RVCE_CS(0x00000000); // encDecodedPictureMarkingOp
                RVCE_CS(0x00000000); // encDecodedPictureMarkingNum
                RVCE_CS(0x00000000); // encDecodedPictureMarkingIdx
-       }
-       for (i = 0; i < 4; ++i) {
                RVCE_CS(0x00000000); // encDecodedRefBasePictureMarkingOp
                RVCE_CS(0x00000000); // encDecodedRefBasePictureMarkingNum
        }
 
+       // encReferencePictureL0[0]
        RVCE_CS(0x00000000); // pictureStructure
-
-       if (enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_IDR) { 
+       if(enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_P ||
+          enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_B) {
+               struct rvce_cpb_slot *l0 = l0_slot(enc);
+               rvce_frame_offset(enc, l0, &luma_offset, &chroma_offset);
+               RVCE_CS(l0->picture_type); // encPicType
+               RVCE_CS(l0->frame_num); // frameNumber
+               RVCE_CS(l0->pic_order_cnt); // pictureOrderCount
+               RVCE_CS(luma_offset); // lumaOffset
+               RVCE_CS(chroma_offset); // chromaOffset
+       } else {
                RVCE_CS(0x00000000); // encPicType
                RVCE_CS(0x00000000); // frameNumber
                RVCE_CS(0x00000000); // pictureOrderCount
                RVCE_CS(0xffffffff); // lumaOffset
                RVCE_CS(0xffffffff); // chromaOffset
        }
-       else if(enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_P) {
-               frame_offset(enc, enc->pic.ref_idx_l0, &luma_offset, &chroma_offset);
-               RVCE_CS(0x00000000); // encPicType
-               // TODO: Stores these in the CPB backtrack
-               RVCE_CS(enc->pic.frame_num - 1); // frameNumber
-               RVCE_CS(enc->pic.frame_num - 1); // pictureOrderCount
+
+       // encReferencePictureL0[1]
+       RVCE_CS(0x00000000); // pictureStructure
+       RVCE_CS(0x00000000); // encPicType
+       RVCE_CS(0x00000000); // frameNumber
+       RVCE_CS(0x00000000); // pictureOrderCount
+       RVCE_CS(0xffffffff); // lumaOffset
+       RVCE_CS(0xffffffff); // chromaOffset
+
+       // encReferencePictureL1[0]
+       RVCE_CS(0x00000000); // pictureStructure
+       if(enc->pic.picture_type == PIPE_H264_ENC_PICTURE_TYPE_B) {
+               struct rvce_cpb_slot *l1 = l1_slot(enc);
+               rvce_frame_offset(enc, l1, &luma_offset, &chroma_offset);
+               RVCE_CS(l1->picture_type); // encPicType
+               RVCE_CS(l1->frame_num); // frameNumber
+               RVCE_CS(l1->pic_order_cnt); // pictureOrderCount
                RVCE_CS(luma_offset); // lumaOffset
                RVCE_CS(chroma_offset); // chromaOffset
-       }
-       for (i = 0; i < 2; ++i) {
-               RVCE_CS(0x00000000); // pictureStructure
+       } else {
                RVCE_CS(0x00000000); // encPicType
                RVCE_CS(0x00000000); // frameNumber
                RVCE_CS(0x00000000); // pictureOrderCount
                RVCE_CS(0xffffffff); // lumaOffset
                RVCE_CS(0xffffffff); // chromaOffset
        }
-       
-       frame_offset(enc, enc->pic.frame_num, &luma_offset, &chroma_offset);
+
+       rvce_frame_offset(enc, current_slot(enc), &luma_offset, &chroma_offset);
        RVCE_CS(luma_offset); // encReconstructedLumaOffset
        RVCE_CS(chroma_offset); // encReconstructedChromaOffset
        RVCE_CS(0x00000000); // encColocBufferOffset
@@ -335,15 +425,20 @@ static void encode(struct rvce_encoder *enc)
 
 /*
  * Emits a task info with operation 1 followed by an empty "destroy"
  * package.
  */
 static void destroy(struct rvce_encoder *enc)
 {
-       task_info(enc, 0x00000001);
+       enc->task_info(enc, 0x00000001, 0, 0, 0); // now dispatched through the per-encoder function pointer
 
        RVCE_BEGIN(0x02000001); // destroy
        RVCE_END();
 }
 
+void radeon_vce_40_2_2_get_param(struct rvce_encoder *enc, struct pipe_h264_enc_picture_desc *pic)
+{
        /* Empty body: this version copies nothing from pic into enc. */
+}
+
 void radeon_vce_40_2_2_init(struct rvce_encoder *enc)
 {
        enc->session = session;
+       enc->task_info = task_info;
        enc->create = create;
        enc->feedback = feedback;
        enc->rate_control = rate_control;
@@ -351,6 +446,8 @@ void radeon_vce_40_2_2_init(struct rvce_encoder *enc)
        enc->pic_control = pic_control;
        enc->motion_estimation = motion_estimation;
        enc->rdo = rdo;
+       enc->vui = vui;
+       enc->config = config;
        enc->encode = encode;
        enc->destroy = destroy;
 }