st/vdpau: Provide YV12 to NV12 putBits conversion v2
[mesa.git] / src / gallium / auxiliary / util / u_video.h
1 /**************************************************************************
2 *
3 * Copyright 2009 Younes Manton.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 #ifndef U_VIDEO_H
29 #define U_VIDEO_H
30
31 #include "pipe/p_defines.h"
32 #include "pipe/p_video_enums.h"
33
34 /* u_reduce_video_profile() needs these */
35 #include "pipe/p_compiler.h"
36 #include "util/u_debug.h"
37 #include "util/u_math.h"
38
39 #ifdef __cplusplus
40 extern "C" {
41 #endif
42
43 static inline enum pipe_video_format
44 u_reduce_video_profile(enum pipe_video_profile profile)
45 {
46 switch (profile)
47 {
48 case PIPE_VIDEO_PROFILE_MPEG1:
49 case PIPE_VIDEO_PROFILE_MPEG2_SIMPLE:
50 case PIPE_VIDEO_PROFILE_MPEG2_MAIN:
51 return PIPE_VIDEO_FORMAT_MPEG12;
52
53 case PIPE_VIDEO_PROFILE_MPEG4_SIMPLE:
54 case PIPE_VIDEO_PROFILE_MPEG4_ADVANCED_SIMPLE:
55 return PIPE_VIDEO_FORMAT_MPEG4;
56
57 case PIPE_VIDEO_PROFILE_VC1_SIMPLE:
58 case PIPE_VIDEO_PROFILE_VC1_MAIN:
59 case PIPE_VIDEO_PROFILE_VC1_ADVANCED:
60 return PIPE_VIDEO_FORMAT_VC1;
61
62 case PIPE_VIDEO_PROFILE_MPEG4_AVC_BASELINE:
63 case PIPE_VIDEO_PROFILE_MPEG4_AVC_CONSTRAINED_BASELINE:
64 case PIPE_VIDEO_PROFILE_MPEG4_AVC_MAIN:
65 case PIPE_VIDEO_PROFILE_MPEG4_AVC_EXTENDED:
66 case PIPE_VIDEO_PROFILE_MPEG4_AVC_HIGH:
67 case PIPE_VIDEO_PROFILE_MPEG4_AVC_HIGH10:
68 case PIPE_VIDEO_PROFILE_MPEG4_AVC_HIGH422:
69 case PIPE_VIDEO_PROFILE_MPEG4_AVC_HIGH444:
70 return PIPE_VIDEO_FORMAT_MPEG4_AVC;
71
72 case PIPE_VIDEO_PROFILE_HEVC_MAIN:
73 case PIPE_VIDEO_PROFILE_HEVC_MAIN_10:
74 case PIPE_VIDEO_PROFILE_HEVC_MAIN_STILL:
75 case PIPE_VIDEO_PROFILE_HEVC_MAIN_12:
76 case PIPE_VIDEO_PROFILE_HEVC_MAIN_444:
77 return PIPE_VIDEO_FORMAT_HEVC;
78
79 default:
80 return PIPE_VIDEO_FORMAT_UNKNOWN;
81 }
82 }
83
/**
 * \brief Split interleaved chroma byte pairs into two separate planes
 *
 * For every source row, the first byte of each pair is written to
 * destination plane 2 and the second byte to destination plane 1.
 *
 * \param destination_data[in] The plane data pointers; entries 1 and 2 are
 *                             written through.
 * \param destination_pitches[in] The plane pitches; entries 1 and 2 are read.
 * \param src_plane[in] Not read by this function.
 * \param src_field[in] Index of the first destination line to write.
 * \param src_stride[in] Byte distance between two source rows.
 * \param num_fields[in] Destination lines advanced per source row.
 * \param src[in] The interleaved source data.
 * \param width[in] Number of byte pairs per row.
 * \param height[in] Number of rows to copy.
 */
static inline void
u_copy_nv12_to_yv12(void *const *destination_data,
                    uint32_t const *destination_pitches,
                    int src_plane, int src_field,
                    int src_stride, int num_fields,
                    uint8_t const *src,
                    int width, int height)
{
   const uint32_t u_pitch = destination_pitches[2];
   const uint32_t v_pitch = destination_pitches[1];
   /* Skipping (num_fields - 1) lines per row keeps the output in one field. */
   const unsigned u_step = u_pitch * num_fields;
   const unsigned v_step = v_pitch * num_fields;
   uint8_t *u_row = (uint8_t *)destination_data[2] + u_pitch * src_field;
   uint8_t *v_row = (uint8_t *)destination_data[1] + v_pitch * src_field;
   int row, col;

   /* TODO: SIMD */
   for (row = 0; row < height; ++row) {
      const uint8_t *pair = src;

      for (col = 0; col < width; ++col) {
         u_row[col] = *pair++;
         v_row[col] = *pair++;
      }

      u_row += u_step;
      v_row += v_step;
      src += src_stride;
   }
}
109
/**
 * \brief Copy YV12 chroma data while converting it to NV12
 *
 * Given a set of YV12 source pointers and pitches, copy the data to a
 * layout typical for NV12 video buffers: for every row, bytes from source
 * plane 2 and source plane 1 are interleaved pairwise into dst.
 *
 * \param source_data[in] The plane data pointers. Array of 3; only entries
 *                        1 and 2 are read.
 * \param source_pitches[in] The plane pitches. Array of 3; only entries
 *                           1 and 2 are read.
 * \param dst_plane[in] The destination plane to copy to. For NV12 always 1.
 *                      Not read by this function.
 * \param dst_field[in] The destination field if interlaced. Selects the
 *                      first source line that is read.
 * \param dst_stride[in] The destination stride for this plane.
 * \param num_fields[in] The number of fields in the video buffer. Source
 *                       lines advanced per destination row.
 * \param dst[out] The destination plane pointer.
 * \param width[in] The source plane width.
 * \param height[in] The source plane height.
 */
static inline void
u_copy_nv12_from_yv12(const void *const *source_data,
                      uint32_t const *source_pitches,
                      int dst_plane, int dst_field,
                      int dst_stride, int num_fields,
                      uint8_t *dst,
                      int width, int height)
{
   int x, y;
   unsigned u_stride = source_pitches[2] * num_fields;
   unsigned v_stride = source_pitches[1] * num_fields;
   /* The source planes are only read, so keep them const-qualified. */
   const uint8_t *u_src = (const uint8_t *)source_data[2] + source_pitches[2] * dst_field;
   const uint8_t *v_src = (const uint8_t *)source_data[1] + source_pitches[1] * dst_field;

   /* TODO: SIMD */
   for (y = 0; y < height; y++) {
      for (x = 0; x < width; x++) {
         dst[2*x] = u_src[x];
         dst[2*x+1] = v_src[x];
      }
      u_src += u_stride;
      v_src += v_stride;
      dst += dst_stride;
   }
}
151
/**
 * \brief Copy one separate chroma plane into an interleaved chroma plane
 *
 * Each source byte is stored into every second byte of destination plane 1.
 * The byte position inside each pair is (2 - src_plane), so source plane 2
 * fills the first byte of each pair and source plane 1 the second.
 *
 * \param destination_data[in] The plane data pointers; entry 1 is written
 *                             through.
 * \param destination_pitches[in] The plane pitches; entry 1 is read.
 * \param src_plane[in] Index of the source plane being copied.
 * \param src_field[in] Index of the first destination line to write.
 * \param src_stride[in] Byte distance between two source rows.
 * \param num_fields[in] Destination lines advanced per source row.
 * \param src[in] The source plane data.
 * \param width[in] Number of source bytes per row.
 * \param height[in] Number of rows to copy.
 */
static inline void
u_copy_yv12_to_nv12(void *const *destination_data,
                    uint32_t const *destination_pitches,
                    int src_plane, int src_field,
                    int src_stride, int num_fields,
                    uint8_t const *src,
                    int width, int height)
{
   const unsigned byte_in_pair = 2 - src_plane;
   const unsigned line_step = destination_pitches[1] * num_fields;
   uint8_t *line = (uint8_t *)destination_data[1] + destination_pitches[1] * src_field;
   int row, col;

   /* TODO: SIMD */
   for (row = 0; row < height; ++row, line += line_step, src += src_stride) {
      for (col = 0; col < width; ++col)
         line[2 * col + byte_in_pair] = src[col];
   }
}
174
175 static inline void
176 u_copy_yv12_img_to_nv12_surf(ubyte *const *src,
177 ubyte *dst,
178 unsigned width,
179 unsigned height,
180 unsigned src_stride,
181 unsigned dst_stride,
182 int field)
183 {
184 if (field == 0) {
185 ubyte *src_0 = src[field];
186 for (int i = 0; i < height ; i++) {
187 memcpy(dst, src_0, width);
188 dst += dst_stride;
189 src_0 += src_stride;
190 }
191 } else if (field == 1) {
192 const ubyte *src_1 = src[field];
193 const ubyte *src_2 = src[field+1];
194 bool odd = true;
195 for (unsigned i = 0; i < height ; i++) {
196 for (unsigned j = 0; j < width*2 ; j++) {
197 if (odd == false) {
198 dst[j] = src_1[j/2];
199 odd = true;
200 } else {
201 dst[j] = src_2[j/2];
202 odd = false;
203 }
204 }
205 dst += dst_stride;
206 src_1 += src_stride;
207 src_2 += src_stride;
208 }
209 }
210 }
211
/**
 * \brief Copy packed data while swapping the two bytes of every byte pair
 *
 * Each group of four source bytes b0 b1 b2 b3 is stored to destination
 * plane 0 as b1 b0 b3 b2.
 *
 * \param destination_data[in] The plane data pointers; entry 0 is written
 *                             through.
 * \param destination_pitches[in] The plane pitches; entry 0 is read.
 * \param src_plane[in] Not read by this function.
 * \param src_field[in] Index of the first destination line to write.
 * \param src_stride[in] Byte distance between two source rows.
 * \param num_fields[in] Destination lines advanced per source row.
 * \param src[in] The packed source data.
 * \param width[in] Number of four-byte groups per row.
 * \param height[in] Number of rows to copy.
 */
static inline void
u_copy_swap422_packed(void *const *destination_data,
                      uint32_t const *destination_pitches,
                      int src_plane, int src_field,
                      int src_stride, int num_fields,
                      uint8_t const *src,
                      int width, int height)
{
   const unsigned line_step = destination_pitches[0] * num_fields;
   uint8_t *line = (uint8_t *)destination_data[0] + destination_pitches[0] * src_field;
   int row, group;

   /* TODO: SIMD */
   for (row = 0; row < height; ++row) {
      const uint8_t *in = src;
      uint8_t *out = line;

      for (group = 0; group < width; ++group, in += 4, out += 4) {
         out[0] = in[1];
         out[1] = in[0];
         out[2] = in[3];
         out[3] = in[2];
      }

      line += line_step;
      src += src_stride;
   }
}
236
/**
 * \brief Pick an H.264 level number from the picture size and reference count
 *
 * \param width[in] Picture width; rounded up to a multiple of 16 before use.
 * \param height[in] Picture height; rounded up to a multiple of 16 before use.
 * \param max_reference[in,out] Requested number of reference frames. Clamped
 *                              to at most 16 and written back.
 *
 * \return One of 30, 31, 32, 41, 42, 50, 51 or 52, chosen from the number of
 *         macroblocks needed to hold all reference frames.
 */
static inline uint32_t
u_get_h264_level(uint32_t width, uint32_t height, uint32_t *max_reference)
{
   /* The calculation is based on "Decoded picture buffering" section
      from http://en.wikipedia.org/wiki/H.264/MPEG-4_AVC */
   static const struct {
      uint32_t dpb_mbs_limit;
      uint32_t level;
   } limits[] = {
      {   8100, 30 },
      {  18000, 31 },
      {  20480, 32 },
      {  32768, 41 },
      {  34816, 42 },
      { 110400, 50 },
      { 184320, 51 },
   };
   uint32_t mbs_wide, mbs_high, max_dpb_mbs;
   unsigned i;

   mbs_wide = align(width, 16) / 16;
   mbs_high = align(height, 16) / 16;

   /* Max references will be used for calculation of the number of DPB
      buffers in the UVD driver, where the limit of max references is 16.
      Some clients, like the mpv application for VA-API, request more
      references than that, so the value is capped at 16 here. */
   *max_reference = MIN2(*max_reference, 16);
   max_dpb_mbs = mbs_wide * mbs_high * *max_reference;

   /* The first entry whose limit is large enough wins. */
   for (i = 0; i < sizeof(limits) / sizeof(limits[0]); i++) {
      if (max_dpb_mbs <= limits[i].dpb_mbs_limit)
         return limits[i].level;
   }

   return 52;
}
271
272 #ifdef __cplusplus
273 }
274 #endif
275
276 #endif /* U_VIDEO_H */