/**************************************************************************
 *
 * Copyright 2013 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
 * IN NO EVENT SHALL THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR
 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 **************************************************************************/
/*
 * Authors:
 *      Christian König <christian.koenig@amd.com>
 */
36 #include "pipe/p_video_codec.h"
38 #include "util/u_video.h"
39 #include "util/u_memory.h"
41 #include "vl/vl_video_buffer.h"
43 #include "r600_pipe_common.h"
44 #include "radeon_video.h"
45 #include "radeon_vce.h"
/*
 * Values written to the firmware's encProfile field by create().
 * The table is indexed by (profile - PIPE_VIDEO_PROFILE_MPEG4_AVC_BASELINE).
 * NOTE(review): the numbers look like H.264 profile_idc codes (66 = Baseline,
 * 77 = Main, 88 = Extended, 100 = High, ...); confirm that the order matches
 * the pipe_video_profile enum.
 */
static const unsigned profiles[7] = { 66, 77, 88, 100, 110, 122, 244 };
49 static void session(struct rvce_encoder
*enc
)
51 RVCE_BEGIN(0x00000001); // session cmd
52 RVCE_CS(enc
->stream_handle
);
/**
 * Emit the task info command (0x00000002).
 *
 * @param enc            encoder whose command stream is written
 * @param taskOperation  operation code stored in the taskOperation field;
 *                       callers in this file pass 0 (create), 1 (destroy)
 *                       and 3 (encode)
 *
 * All other fields are fixed: offsetOfNextTaskInfo is 0xffffffff and the
 * dependency/index fields are zero.
 */
static void task_info(struct rvce_encoder *enc, uint32_t taskOperation)
{
	RVCE_BEGIN(0x00000002); // task info
	RVCE_CS(0xffffffff); // offsetOfNextTaskInfo
	RVCE_CS(taskOperation); // taskOperation
	RVCE_CS(0x00000000); // referencePictureDependency
	RVCE_CS(0x00000000); // collocateFlagDependency
	RVCE_CS(0x00000000); // feedbackIndex
	RVCE_CS(0x00000000); // videoBitstreamRingIndex
	RVCE_END();
}
68 static void feedback(struct rvce_encoder
*enc
)
70 RVCE_BEGIN(0x05000005); // feedback buffer
71 RVCE_WRITE(enc
->fb
->res
->cs_buf
, enc
->fb
->res
->domains
, 0x0); // feedbackRingAddressHi/Lo
72 RVCE_CS(0x00000001); // feedbackRingSize
76 static void create(struct rvce_encoder
*enc
)
78 task_info(enc
, 0x00000000);
80 RVCE_BEGIN(0x01000001); // create cmd
81 RVCE_CS(0x00000000); // encUseCircularBuffer
82 RVCE_CS(profiles
[enc
->base
.profile
-
83 PIPE_VIDEO_PROFILE_MPEG4_AVC_BASELINE
]); // encProfile
84 RVCE_CS(enc
->base
.level
); // encLevel
85 RVCE_CS(0x00000000); // encPicStructRestriction
86 RVCE_CS(enc
->base
.width
); // encImageWidth
87 RVCE_CS(enc
->base
.height
); // encImageHeight
88 RVCE_CS(enc
->luma
->level
[0].pitch_bytes
); // encRefPicLumaPitch
89 RVCE_CS(enc
->chroma
->level
[0].pitch_bytes
); // encRefPicChromaPitch
90 RVCE_CS(align(enc
->luma
->npix_y
, 16) / 8); // encRefYHeightInQw
91 RVCE_CS(0x00000000); // encRefPic(Addr|Array)Mode, encPicStructRestriction, disableRDO
95 static void rate_control(struct rvce_encoder
*enc
)
97 RVCE_BEGIN(0x04000005); // rate control
98 RVCE_CS(enc
->pic
.rate_ctrl
.rate_ctrl_method
); // encRateControlMethod
99 RVCE_CS(enc
->pic
.rate_ctrl
.target_bitrate
); // encRateControlTargetBitRate
100 RVCE_CS(enc
->pic
.rate_ctrl
.peak_bitrate
); // encRateControlPeakBitRate
101 RVCE_CS(enc
->pic
.rate_ctrl
.frame_rate_num
); // encRateControlFrameRateNum
102 RVCE_CS(0x00000000); // encGOPSize
103 RVCE_CS(enc
->pic
.quant_i_frames
); // encQP_I
104 RVCE_CS(enc
->pic
.quant_p_frames
); // encQP_P
105 RVCE_CS(enc
->pic
.quant_b_frames
); // encQP_B
106 RVCE_CS(enc
->pic
.rate_ctrl
.vbv_buffer_size
); // encVBVBufferSize
107 RVCE_CS(enc
->pic
.rate_ctrl
.frame_rate_den
); // encRateControlFrameRateDen
108 RVCE_CS(0x00000000); // encVBVBufferLevel
109 RVCE_CS(0x00000000); // encMaxAUSize
110 RVCE_CS(0x00000000); // encQPInitialMode
111 RVCE_CS(enc
->pic
.rate_ctrl
.target_bits_picture
); // encTargetBitsPerPicture
112 RVCE_CS(enc
->pic
.rate_ctrl
.peak_bits_picture_integer
); // encPeakBitsPerPictureInteger
113 RVCE_CS(enc
->pic
.rate_ctrl
.peak_bits_picture_fraction
); // encPeakBitsPerPictureFractional
114 RVCE_CS(0x00000000); // encMinQP
115 RVCE_CS(0x00000033); // encMaxQP
116 RVCE_CS(0x00000000); // encSkipFrameEnable
117 RVCE_CS(0x00000000); // encFillerDataEnable
118 RVCE_CS(0x00000000); // encEnforceHRD
119 RVCE_CS(0x00000000); // encBPicsDeltaQP
120 RVCE_CS(0x00000000); // encReferenceBPicsDeltaQP
121 RVCE_CS(0x00000000); // encRateControlReInitDisable
/**
 * Emit the config extension command (0x04000001) with
 * encEnablePerfLogging set to 3.
 */
static void config_extension(struct rvce_encoder *enc)
{
	RVCE_BEGIN(0x04000001); // config extension
	RVCE_CS(0x00000003); // encEnablePerfLogging
	RVCE_END();
}
132 static void pic_control(struct rvce_encoder
*enc
)
134 unsigned encNumMBsPerSlice
;
136 encNumMBsPerSlice
= align(enc
->base
.width
, 16) / 16;
137 encNumMBsPerSlice
*= align(enc
->base
.height
, 16) / 16;
139 RVCE_BEGIN(0x04000002); // pic control
140 RVCE_CS(0x00000000); // encUseConstrainedIntraPred
141 RVCE_CS(0x00000000); // encCABACEnable
142 RVCE_CS(0x00000000); // encCABACIDC
143 RVCE_CS(0x00000000); // encLoopFilterDisable
144 RVCE_CS(0x00000000); // encLFBetaOffset
145 RVCE_CS(0x00000000); // encLFAlphaC0Offset
146 RVCE_CS(0x00000000); // encCropLeftOffset
147 RVCE_CS((align(enc
->base
.width
, 16) - enc
->base
.width
) >> 1); // encCropRightOffset
148 RVCE_CS(0x00000000); // encCropTopOffset
149 RVCE_CS((align(enc
->base
.height
, 16) - enc
->base
.height
) >> 1); // encCropBottomOffset
150 RVCE_CS(encNumMBsPerSlice
); // encNumMBsPerSlice
151 RVCE_CS(0x00000000); // encIntraRefreshNumMBsPerSlot
152 RVCE_CS(0x00000000); // encForceIntraRefresh
153 RVCE_CS(0x00000000); // encForceIMBPeriod
154 RVCE_CS(0x00000000); // encPicOrderCntType
155 RVCE_CS(0x00000000); // log2_max_pic_order_cnt_lsb_minus4
156 RVCE_CS(0x00000000); // encSPSID
157 RVCE_CS(0x00000000); // encPPSID
158 RVCE_CS(0x00000040); // encConstraintSetFlags
159 RVCE_CS(MAX2(enc
->base
.max_references
, 1) - 1); // encBPicPattern
160 RVCE_CS(0x00000000); // weightPredModeBPicture
161 RVCE_CS(MIN2(enc
->base
.max_references
, 2)); // encNumberOfReferenceFrames
162 RVCE_CS(enc
->base
.max_references
+ 1); // encMaxNumRefFrames
163 RVCE_CS(0x00000001); // encNumDefaultActiveRefL0
164 RVCE_CS(0x00000001); // encNumDefaultActiveRefL1
165 RVCE_CS(0x00000000); // encSliceMode
166 RVCE_CS(0x00000000); // encMaxSliceSize
/**
 * Emit the motion estimation command (0x04000007).
 *
 * Every field is a fixed constant; nothing is read from the encoder state
 * apart from the command stream itself.
 */
static void motion_estimation(struct rvce_encoder *enc)
{
	RVCE_BEGIN(0x04000007); // motion estimation
	RVCE_CS(0x00000001); // encIMEDecimationSearch
	RVCE_CS(0x00000001); // motionEstHalfPixel
	RVCE_CS(0x00000000); // motionEstQuarterPixel
	RVCE_CS(0x00000000); // disableFavorPMVPoint
	RVCE_CS(0x00000000); // forceZeroPointCenter
	RVCE_CS(0x00000000); // LSMVert
	RVCE_CS(0x00000010); // encSearchRangeX
	RVCE_CS(0x00000010); // encSearchRangeY
	RVCE_CS(0x00000010); // encSearch1RangeX
	RVCE_CS(0x00000010); // encSearch1RangeY
	RVCE_CS(0x00000000); // disable16x16Frame1
	RVCE_CS(0x00000000); // disableSATD
	RVCE_CS(0x00000000); // enableAMD
	RVCE_CS(0x000000fe); // encDisableSubMode
	RVCE_CS(0x00000000); // encIMESkipX
	RVCE_CS(0x00000000); // encIMESkipY
	RVCE_CS(0x00000000); // encEnImeOverwDisSubm
	RVCE_CS(0x00000000); // encImeOverwDisSubmNo
	RVCE_CS(0x00000001); // encIME2SearchRangeX
	RVCE_CS(0x00000001); // encIME2SearchRangeY
	RVCE_CS(0x00000000); // parallelModeSpeedupEnable
	RVCE_CS(0x00000000); // fme0_encDisableSubMode
	RVCE_CS(0x00000000); // fme1_encDisableSubMode
	RVCE_CS(0x00000000); // imeSWSpeedupEnable
	RVCE_END();
}
/**
 * Emit the rdo command (0x04000008) with all 17 fields set to zero.
 */
static void rdo(struct rvce_encoder *enc)
{
	RVCE_BEGIN(0x04000008); // rdo
	RVCE_CS(0x00000000); // encDisableTbePredIFrame
	RVCE_CS(0x00000000); // encDisableTbePredPFrame
	RVCE_CS(0x00000000); // useFmeInterpolY
	RVCE_CS(0x00000000); // useFmeInterpolUV
	RVCE_CS(0x00000000); // useFmeIntrapolY
	RVCE_CS(0x00000000); // useFmeIntrapolUV
	RVCE_CS(0x00000000); // useFmeInterpolY_1
	RVCE_CS(0x00000000); // useFmeInterpolUV_1
	RVCE_CS(0x00000000); // useFmeIntrapolY_1
	RVCE_CS(0x00000000); // useFmeIntrapolUV_1
	RVCE_CS(0x00000000); // enc16x16CostAdj
	RVCE_CS(0x00000000); // encSkipCostAdj
	RVCE_CS(0x00000000); // encForce16x16skip
	RVCE_CS(0x00000000); // encDisableThresholdCalcA
	RVCE_CS(0x00000000); // encLumaCoeffCost
	RVCE_CS(0x00000000); // encLumaMBCoeffCost
	RVCE_CS(0x00000000); // encChromaCoeffCost
	RVCE_END();
}
223 static void vui(struct rvce_encoder
*enc
)
227 RVCE_BEGIN(0x04000009); // vui
228 RVCE_CS(0x00000000); //aspectRatioInfoPresentFlag
229 RVCE_CS(0x00000000); //aspectRatioInfo.aspectRatioIdc
230 RVCE_CS(0x00000000); //aspectRatioInfo.sarWidth
231 RVCE_CS(0x00000000); //aspectRatioInfo.sarHeight
232 RVCE_CS(0x00000000); //overscanInfoPresentFlag
233 RVCE_CS(0x00000000); //overScanInfo.overscanAppropFlag
234 RVCE_CS(0x00000000); //videoSignalTypePresentFlag
235 RVCE_CS(0x00000005); //videoSignalTypeInfo.videoFormat
236 RVCE_CS(0x00000000); //videoSignalTypeInfo.videoFullRangeFlag
237 RVCE_CS(0x00000000); //videoSignalTypeInfo.colorDescriptionPresentFlag
238 RVCE_CS(0x00000002); //videoSignalTypeInfo.colorPrim
239 RVCE_CS(0x00000002); //videoSignalTypeInfo.transferChar
240 RVCE_CS(0x00000002); //videoSignalTypeInfo.matrixCoef
241 RVCE_CS(0x00000000); //chromaLocInfoPresentFlag
242 RVCE_CS(0x00000000); //chromaLocInfo.chromaLocTop
243 RVCE_CS(0x00000000); //chromaLocInfo.chromaLocBottom
244 RVCE_CS(0x00000001); //timingInfoPresentFlag
245 RVCE_CS(enc
->pic
.rate_ctrl
.frame_rate_den
); //timingInfo.numUnitsInTick
246 RVCE_CS(enc
->pic
.rate_ctrl
.frame_rate_num
* 2); //timingInfo.timeScale;
247 RVCE_CS(0x00000001); //timingInfo.fixedFrameRateFlag
248 RVCE_CS(0x00000000); //nalHRDParametersPresentFlag
249 RVCE_CS(0x00000000); //hrdParam.cpbCntMinus1
250 RVCE_CS(0x00000004); //hrdParam.bitRateScale
251 RVCE_CS(0x00000006); //hrdParam.cpbSizeScale
252 for (i
= 0; i
< 32; i
++) {
253 RVCE_CS(0x00000000); //hrdParam.bitRateValueMinus
254 RVCE_CS(0x00000000); //hrdParam.cpbSizeValueMinus
255 RVCE_CS(0x00000000); //hrdParam.cbrFlag
257 RVCE_CS(0x00000017); //hrdParam.initialCpbRemovalDelayLengthMinus1
258 RVCE_CS(0x00000017); //hrdParam.cpbRemovalDelayLengthMinus1
259 RVCE_CS(0x00000017); //hrdParam.dpbOutputDelayLengthMinus1
260 RVCE_CS(0x00000018); //hrdParam.timeOffsetLength
261 RVCE_CS(0x00000000); //lowDelayHRDFlag
262 RVCE_CS(0x00000000); //picStructPresentFlag
263 RVCE_CS(0x00000000); //bitstreamRestrictionPresentFlag
264 RVCE_CS(0x00000001); //bitstreamRestrictions.motionVectorsOverPicBoundariesFlag
265 RVCE_CS(0x00000002); //bitstreamRestrictions.maxBytesPerPicDenom
266 RVCE_CS(0x00000001); //bitstreamRestrictions.maxBitsPerMbDenom
267 RVCE_CS(0x00000010); //bitstreamRestrictions.log2MaxMvLengthHori
268 RVCE_CS(0x00000010); //bitstreamRestrictions.log2MaxMvLengthVert
269 RVCE_CS(0x00000003); //bitstreamRestrictions.numReorderFrames
270 RVCE_CS(0x00000003); //bitstreamRestrictions.maxDecFrameBuffering
274 static void encode(struct rvce_encoder
*enc
)
277 unsigned luma_offset
, chroma_offset
;
279 task_info(enc
, 0x00000003);
281 RVCE_BEGIN(0x05000001); // context buffer
282 RVCE_READWRITE(enc
->cpb
.res
->cs_buf
, enc
->cpb
.res
->domains
, 0x0); // encodeContextAddressHi/Lo
285 RVCE_BEGIN(0x05000004); // video bitstream buffer
286 RVCE_WRITE(enc
->bs_handle
, RADEON_DOMAIN_GTT
, 0x0); // videoBitstreamRingAddressHi/Lo
287 RVCE_CS(enc
->bs_size
); // videoBitstreamRingSize
290 RVCE_BEGIN(0x03000001); // encode
291 RVCE_CS(0x00000000); // insertHeaders
292 RVCE_CS(0x00000000); // pictureStructure
293 RVCE_CS(enc
->bs_size
); // allowedMaxBitstreamSize
294 RVCE_CS(0x00000000); // forceRefreshMap
295 RVCE_CS(0x00000000); // insertAUD
296 RVCE_CS(0x00000000); // endOfSequence
297 RVCE_CS(0x00000000); // endOfStream
298 RVCE_READ(enc
->handle
, RADEON_DOMAIN_VRAM
,
299 enc
->luma
->level
[0].offset
); // inputPictureLumaAddressHi/Lo
300 RVCE_READ(enc
->handle
, RADEON_DOMAIN_VRAM
,
301 enc
->chroma
->level
[0].offset
); // inputPictureChromaAddressHi/Lo
302 RVCE_CS(align(enc
->luma
->npix_y
, 16)); // encInputFrameYPitch
303 RVCE_CS(enc
->luma
->level
[0].pitch_bytes
); // encInputPicLumaPitch
304 RVCE_CS(enc
->chroma
->level
[0].pitch_bytes
); // encInputPicChromaPitch
305 RVCE_CS(0x00000000); // encInputPic(Addr|Array)Mode
306 RVCE_CS(0x00000000); // encInputPicTileConfig
307 RVCE_CS(enc
->pic
.picture_type
); // encPicType
308 RVCE_CS(enc
->pic
.picture_type
== PIPE_H264_ENC_PICTURE_TYPE_IDR
); // encIdrFlag
309 RVCE_CS(0x00000000); // encIdrPicId
310 RVCE_CS(0x00000000); // encMGSKeyPic
311 RVCE_CS(!enc
->pic
.not_referenced
); // encReferenceFlag
312 RVCE_CS(0x00000000); // encTemporalLayerIndex
313 RVCE_CS(0x00000000); // num_ref_idx_active_override_flag
314 RVCE_CS(0x00000000); // num_ref_idx_l0_active_minus1
315 RVCE_CS(0x00000000); // num_ref_idx_l1_active_minus1
317 i
= enc
->pic
.frame_num
- enc
->pic
.ref_idx_l0
;
318 if (i
> 1 && enc
->pic
.picture_type
== PIPE_H264_ENC_PICTURE_TYPE_P
) {
319 RVCE_CS(0x00000001); // encRefListModificationOp
320 RVCE_CS(i
- 1); // encRefListModificationNum
322 RVCE_CS(0x00000000); // encRefListModificationOp
323 RVCE_CS(0x00000000); // encRefListModificationNum
326 for (i
= 0; i
< 3; ++i
) {
327 RVCE_CS(0x00000000); // encRefListModificationOp
328 RVCE_CS(0x00000000); // encRefListModificationNum
330 for (i
= 0; i
< 4; ++i
) {
331 RVCE_CS(0x00000000); // encDecodedPictureMarkingOp
332 RVCE_CS(0x00000000); // encDecodedPictureMarkingNum
333 RVCE_CS(0x00000000); // encDecodedPictureMarkingIdx
334 RVCE_CS(0x00000000); // encDecodedRefBasePictureMarkingOp
335 RVCE_CS(0x00000000); // encDecodedRefBasePictureMarkingNum
338 // encReferencePictureL0[0]
339 RVCE_CS(0x00000000); // pictureStructure
340 if(enc
->pic
.picture_type
== PIPE_H264_ENC_PICTURE_TYPE_P
||
341 enc
->pic
.picture_type
== PIPE_H264_ENC_PICTURE_TYPE_B
) {
342 struct rvce_cpb_slot
*l0
= l0_slot(enc
);
343 rvce_frame_offset(enc
, l0
, &luma_offset
, &chroma_offset
);
344 RVCE_CS(l0
->picture_type
); // encPicType
345 RVCE_CS(l0
->frame_num
); // frameNumber
346 RVCE_CS(l0
->pic_order_cnt
); // pictureOrderCount
347 RVCE_CS(luma_offset
); // lumaOffset
348 RVCE_CS(chroma_offset
); // chromaOffset
350 RVCE_CS(0x00000000); // encPicType
351 RVCE_CS(0x00000000); // frameNumber
352 RVCE_CS(0x00000000); // pictureOrderCount
353 RVCE_CS(0xffffffff); // lumaOffset
354 RVCE_CS(0xffffffff); // chromaOffset
357 // encReferencePictureL0[1]
358 RVCE_CS(0x00000000); // pictureStructure
359 RVCE_CS(0x00000000); // encPicType
360 RVCE_CS(0x00000000); // frameNumber
361 RVCE_CS(0x00000000); // pictureOrderCount
362 RVCE_CS(0xffffffff); // lumaOffset
363 RVCE_CS(0xffffffff); // chromaOffset
365 // encReferencePictureL1[0]
366 RVCE_CS(0x00000000); // pictureStructure
367 if(enc
->pic
.picture_type
== PIPE_H264_ENC_PICTURE_TYPE_B
) {
368 struct rvce_cpb_slot
*l1
= l1_slot(enc
);
369 rvce_frame_offset(enc
, l1
, &luma_offset
, &chroma_offset
);
370 RVCE_CS(l1
->picture_type
); // encPicType
371 RVCE_CS(l1
->frame_num
); // frameNumber
372 RVCE_CS(l1
->pic_order_cnt
); // pictureOrderCount
373 RVCE_CS(luma_offset
); // lumaOffset
374 RVCE_CS(chroma_offset
); // chromaOffset
376 RVCE_CS(0x00000000); // encPicType
377 RVCE_CS(0x00000000); // frameNumber
378 RVCE_CS(0x00000000); // pictureOrderCount
379 RVCE_CS(0xffffffff); // lumaOffset
380 RVCE_CS(0xffffffff); // chromaOffset
383 rvce_frame_offset(enc
, current_slot(enc
), &luma_offset
, &chroma_offset
);
384 RVCE_CS(luma_offset
); // encReconstructedLumaOffset
385 RVCE_CS(chroma_offset
); // encReconstructedChromaOffset
386 RVCE_CS(0x00000000); // encColocBufferOffset
387 RVCE_CS(0x00000000); // encReconstructedRefBasePictureLumaOffset
388 RVCE_CS(0x00000000); // encReconstructedRefBasePictureChromaOffset
389 RVCE_CS(0x00000000); // encReferenceRefBasePictureLumaOffset
390 RVCE_CS(0x00000000); // encReferenceRefBasePictureChromaOffset
391 RVCE_CS(0x00000000); // pictureCount
392 RVCE_CS(enc
->pic
.frame_num
); // frameNumber
393 RVCE_CS(enc
->pic
.pic_order_cnt
); // pictureOrderCount
394 RVCE_CS(0x00000000); // numIPicRemainInRCGOP
395 RVCE_CS(0x00000000); // numPPicRemainInRCGOP
396 RVCE_CS(0x00000000); // numBPicRemainInRCGOP
397 RVCE_CS(0x00000000); // numIRPicRemainInRCGOP
398 RVCE_CS(0x00000000); // enableIntraRefresh
/**
 * Emit task info (operation 1) followed by the payload-less destroy
 * command (0x02000001).
 */
static void destroy(struct rvce_encoder *enc)
{
	task_info(enc, 0x00000001);

	RVCE_BEGIN(0x02000001); // destroy
	RVCE_END();
}
410 void radeon_vce_40_2_2_init(struct rvce_encoder
*enc
)
412 enc
->session
= session
;
413 enc
->create
= create
;
414 enc
->feedback
= feedback
;
415 enc
->rate_control
= rate_control
;
416 enc
->config_extension
= config_extension
;
417 enc
->pic_control
= pic_control
;
418 enc
->motion_estimation
= motion_estimation
;
421 enc
->encode
= encode
;
422 enc
->destroy
= destroy
;