1 /**************************************************************************
3 * Copyright 2009 Younes Manton.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
31 #include <util/u_memory.h>
32 #include <util/u_rect.h>
33 #include <util/u_video.h>
35 #include "vl_mpeg12_decoder.h"
36 #include "vl_defines.h"
38 #define SCALE_FACTOR_SNORM (32768.0f / 256.0f)
39 #define SCALE_FACTOR_SSCALED (1.0f / 256.0f)
41 struct format_config
{
42 enum pipe_format zscan_source_format
;
43 enum pipe_format idct_source_format
;
44 enum pipe_format mc_source_format
;
50 static const struct format_config bitstream_format_config
[] = {
51 { PIPE_FORMAT_R16_SSCALED
, PIPE_FORMAT_R16G16B16A16_SSCALED
, PIPE_FORMAT_R16G16B16A16_FLOAT
, 1.0f
, SCALE_FACTOR_SSCALED
},
52 { PIPE_FORMAT_R16_SSCALED
, PIPE_FORMAT_R16G16B16A16_SSCALED
, PIPE_FORMAT_R16G16B16A16_SSCALED
, 1.0f
, SCALE_FACTOR_SSCALED
},
53 { PIPE_FORMAT_R16_SNORM
, PIPE_FORMAT_R16G16B16A16_SNORM
, PIPE_FORMAT_R16G16B16A16_FLOAT
, 1.0f
, SCALE_FACTOR_SNORM
},
54 { PIPE_FORMAT_R16_SNORM
, PIPE_FORMAT_R16G16B16A16_SNORM
, PIPE_FORMAT_R16G16B16A16_SNORM
, 1.0f
, SCALE_FACTOR_SNORM
}
57 static const unsigned num_bitstream_format_configs
=
58 sizeof(bitstream_format_config
) / sizeof(struct format_config
);
60 static const struct format_config idct_format_config
[] = {
61 { PIPE_FORMAT_R16_SSCALED
, PIPE_FORMAT_R16G16B16A16_SSCALED
, PIPE_FORMAT_R16G16B16A16_FLOAT
, 1.0f
, SCALE_FACTOR_SSCALED
},
62 { PIPE_FORMAT_R16_SSCALED
, PIPE_FORMAT_R16G16B16A16_SSCALED
, PIPE_FORMAT_R16G16B16A16_SSCALED
, 1.0f
, SCALE_FACTOR_SSCALED
},
63 { PIPE_FORMAT_R16_SNORM
, PIPE_FORMAT_R16G16B16A16_SNORM
, PIPE_FORMAT_R16G16B16A16_FLOAT
, 1.0f
, SCALE_FACTOR_SNORM
},
64 { PIPE_FORMAT_R16_SNORM
, PIPE_FORMAT_R16G16B16A16_SNORM
, PIPE_FORMAT_R16G16B16A16_SNORM
, 1.0f
, SCALE_FACTOR_SNORM
}
67 static const unsigned num_idct_format_configs
=
68 sizeof(idct_format_config
) / sizeof(struct format_config
);
70 static const struct format_config mc_format_config
[] = {
71 //{ PIPE_FORMAT_R16_SSCALED, PIPE_FORMAT_NONE, PIPE_FORMAT_R16_SSCALED, 0.0f, SCALE_FACTOR_SSCALED },
72 { PIPE_FORMAT_R16_SNORM
, PIPE_FORMAT_NONE
, PIPE_FORMAT_R16_SNORM
, 0.0f
, SCALE_FACTOR_SNORM
}
75 static const unsigned num_mc_format_configs
=
76 sizeof(mc_format_config
) / sizeof(struct format_config
);
79 init_zscan_buffer(struct vl_mpeg12_buffer
*buffer
)
81 enum pipe_format formats
[3];
83 struct pipe_sampler_view
**source
;
84 struct pipe_surface
**destination
;
86 struct vl_mpeg12_decoder
*dec
;
92 dec
= (struct vl_mpeg12_decoder
*)buffer
->base
.decoder
;
94 formats
[0] = formats
[1] = formats
[2] = dec
->zscan_source_format
;
95 buffer
->zscan_source
= vl_video_buffer_create_ex
98 dec
->blocks_per_line
* BLOCK_WIDTH
* BLOCK_HEIGHT
,
99 align(dec
->num_blocks
, dec
->blocks_per_line
) / dec
->blocks_per_line
,
100 1, PIPE_VIDEO_CHROMA_FORMAT_444
, formats
, PIPE_USAGE_STATIC
103 if (!buffer
->zscan_source
)
106 source
= buffer
->zscan_source
->get_sampler_view_planes(buffer
->zscan_source
);
110 if (dec
->base
.entrypoint
<= PIPE_VIDEO_ENTRYPOINT_IDCT
)
111 destination
= dec
->idct_source
->get_surfaces(dec
->idct_source
);
113 destination
= dec
->mc_source
->get_surfaces(dec
->mc_source
);
118 for (i
= 0; i
< VL_MAX_PLANES
; ++i
)
119 if (!vl_zscan_init_buffer(i
== 0 ? &dec
->zscan_y
: &dec
->zscan_c
,
120 &buffer
->zscan
[i
], source
[i
], destination
[i
]))
127 vl_zscan_cleanup_buffer(&buffer
->zscan
[i
- 1]);
131 buffer
->zscan_source
->destroy(buffer
->zscan_source
);
138 cleanup_zscan_buffer(struct vl_mpeg12_buffer
*buffer
)
144 for (i
= 0; i
< VL_MAX_PLANES
; ++i
)
145 vl_zscan_cleanup_buffer(&buffer
->zscan
[i
]);
146 buffer
->zscan_source
->destroy(buffer
->zscan_source
);
150 init_idct_buffer(struct vl_mpeg12_buffer
*buffer
)
152 struct pipe_sampler_view
**idct_source_sv
, **mc_source_sv
;
154 struct vl_mpeg12_decoder
*dec
;
160 dec
= (struct vl_mpeg12_decoder
*)buffer
->base
.decoder
;
162 idct_source_sv
= dec
->idct_source
->get_sampler_view_planes(dec
->idct_source
);
164 goto error_source_sv
;
166 mc_source_sv
= dec
->mc_source
->get_sampler_view_planes(dec
->mc_source
);
168 goto error_mc_source_sv
;
170 for (i
= 0; i
< 3; ++i
)
171 if (!vl_idct_init_buffer(i
== 0 ? &dec
->idct_y
: &dec
->idct_c
,
172 &buffer
->idct
[i
], idct_source_sv
[i
],
180 vl_idct_cleanup_buffer(&buffer
->idct
[i
- 1]);
188 cleanup_idct_buffer(struct vl_mpeg12_buffer
*buf
)
190 struct vl_mpeg12_decoder
*dec
;
195 dec
= (struct vl_mpeg12_decoder
*)buf
->base
.decoder
;
198 for (i
= 0; i
< 3; ++i
)
199 vl_idct_cleanup_buffer(&buf
->idct
[0]);
203 init_mc_buffer(struct vl_mpeg12_buffer
*buf
)
205 struct vl_mpeg12_decoder
*dec
;
209 dec
= (struct vl_mpeg12_decoder
*)buf
->base
.decoder
;
212 if(!vl_mc_init_buffer(&dec
->mc_y
, &buf
->mc
[0]))
215 if(!vl_mc_init_buffer(&dec
->mc_c
, &buf
->mc
[1]))
218 if(!vl_mc_init_buffer(&dec
->mc_c
, &buf
->mc
[2]))
224 vl_mc_cleanup_buffer(&buf
->mc
[1]);
227 vl_mc_cleanup_buffer(&buf
->mc
[0]);
234 cleanup_mc_buffer(struct vl_mpeg12_buffer
*buf
)
240 for (i
= 0; i
< VL_MAX_PLANES
; ++i
)
241 vl_mc_cleanup_buffer(&buf
->mc
[i
]);
245 vl_mpeg12_buffer_destroy(struct pipe_video_decode_buffer
*buffer
)
247 struct vl_mpeg12_buffer
*buf
= (struct vl_mpeg12_buffer
*)buffer
;
248 struct vl_mpeg12_decoder
*dec
;
252 dec
= (struct vl_mpeg12_decoder
*)buf
->base
.decoder
;
255 cleanup_zscan_buffer(buf
);
257 if (dec
->base
.entrypoint
<= PIPE_VIDEO_ENTRYPOINT_IDCT
)
258 cleanup_idct_buffer(buf
);
260 cleanup_mc_buffer(buf
);
262 vl_vb_cleanup(&buf
->vertex_stream
);
/*
 * Prepare a decode buffer for a new frame.
 *
 * Maps the vertex stream, then for every plane of the zscan source creates
 * a write/discard transfer on the plane's texture and maps it, storing the
 * transfer in buf->tex_transfer[] and the mapping in buf->texels[].
 * For PIPE_VIDEO_ENTRYPOINT_BITSTREAM the YCbCr streams, the mapped texels
 * and the motion vector streams are handed to the bitstream parser.
 *
 * NOTE(review): this listing omits several original lines (the embedded
 * line numbers skip), among them the return type, the declaration of `i`,
 * the initializer of `rect` and the last get_transfer() argument.
 */
268 vl_mpeg12_buffer_begin_frame(struct pipe_video_decode_buffer
*buffer
)
270 struct vl_mpeg12_buffer
*buf
= (struct vl_mpeg12_buffer
*)buffer
;
271 struct vl_mpeg12_decoder
*dec
;
273 struct pipe_sampler_view
**sampler_views
;
278 dec
= (struct vl_mpeg12_decoder
*)buf
->base
.decoder
;
/* Map the vertex stream so it can be filled while the frame is decoded. */
281 vl_vb_map(&buf
->vertex_stream
, dec
->base
.context
);
283 sampler_views
= buf
->zscan_source
->get_sampler_view_planes(buf
->zscan_source
);
285 assert(sampler_views
);
/* Map the texture behind every plane of the zscan source for writing. */
287 for (i
= 0; i
< VL_MAX_PLANES
; ++i
) {
288 struct pipe_resource
*tex
= sampler_views
[i
]->texture
;
/* NOTE(review): the box initializer is not visible in this listing;
 * presumably it covers the whole texture - confirm against the original. */
289 struct pipe_box rect
=
/* PIPE_TRANSFER_DISCARD: the previous texture contents are not needed. */
297 buf
->tex_transfer
[i
] = dec
->base
.context
->get_transfer
299 dec
->base
.context
, tex
,
300 0, PIPE_TRANSFER_WRITE
| PIPE_TRANSFER_DISCARD
,
/* NOTE(review): neither the transfer nor the mapping is checked for
 * failure in the visible code. */
304 buf
->texels
[i
] = dec
->base
.context
->transfer_map(dec
->base
.context
, buf
->tex_transfer
[i
]);
/* Bitstream entrypoint: collect the stream pointers of the vertex stream
 * and pass them, with the mapped texels, to the bitstream parser. */
307 if (dec
->base
.entrypoint
== PIPE_VIDEO_ENTRYPOINT_BITSTREAM
) {
308 struct pipe_ycbcr_block
*ycbcr_stream
[VL_MAX_PLANES
];
309 struct pipe_motionvector
*mv_stream
[VL_MAX_REF_FRAMES
];
311 for (i
= 0; i
< VL_MAX_PLANES
; ++i
)
312 ycbcr_stream
[i
] = vl_vb_get_ycbcr_stream(&buf
->vertex_stream
, i
);
314 for (i
= 0; i
< VL_MAX_REF_FRAMES
; ++i
)
315 mv_stream
[i
] = vl_vb_get_mv_stream(&buf
->vertex_stream
, i
);
317 vl_mpg12_bs_set_buffers(&buf
->bs
, ycbcr_stream
, buf
->texels
, mv_stream
);
/* Select the linear zscan layout for every plane.
 * NOTE(review): presumably the `else` branch of the entrypoint test above
 * (the line between is not visible) - confirm. */
320 for (i
= 0; i
< VL_MAX_PLANES
; ++i
)
321 vl_zscan_set_layout(&buf
->zscan
[i
], dec
->zscan_linear
);
326 vl_mpeg12_buffer_set_quant_matrix(struct pipe_video_decode_buffer
*buffer
,
327 const uint8_t intra_matrix
[64],
328 const uint8_t non_intra_matrix
[64])
330 struct vl_mpeg12_buffer
*buf
= (struct vl_mpeg12_buffer
*)buffer
;
333 for (i
= 0; i
< VL_MAX_PLANES
; ++i
) {
334 vl_zscan_upload_quant(&buf
->zscan
[i
], intra_matrix
, true);
335 vl_zscan_upload_quant(&buf
->zscan
[i
], non_intra_matrix
, false);
339 static struct pipe_ycbcr_block
*
340 vl_mpeg12_buffer_get_ycbcr_stream(struct pipe_video_decode_buffer
*buffer
, int component
)
342 struct vl_mpeg12_buffer
*buf
= (struct vl_mpeg12_buffer
*)buffer
;
346 return vl_vb_get_ycbcr_stream(&buf
->vertex_stream
, component
);
/*
 * Return the texel pointer stored in buf->texels[] for one component.
 * That array is filled by vl_mpeg12_buffer_begin_frame() with the result
 * of mapping each plane's texture.
 *
 * `component` must be below VL_MAX_PLANES (asserted).
 *
 * NOTE(review): the return type line is not part of this listing.
 */
350 vl_mpeg12_buffer_get_ycbcr_buffer(struct pipe_video_decode_buffer
*buffer
, int component
)
352 struct vl_mpeg12_buffer
*buf
= (struct vl_mpeg12_buffer
*)buffer
;
/* NOTE(review): `component` is a signed int; a negative value passes this
 * assert - confirm callers never pass one. */
355 assert(component
< VL_MAX_PLANES
);
357 return buf
->texels
[component
];
/*
 * Return the motion vector stream stride of the decode buffer's vertex
 * stream; forwards to vl_vb_get_mv_stream_stride().
 *
 * NOTE(review): the return type line is not part of this listing.
 */
361 vl_mpeg12_buffer_get_mv_stream_stride(struct pipe_video_decode_buffer
*buffer
)
363 struct vl_mpeg12_buffer
*buf
= (struct vl_mpeg12_buffer
*)buffer
;
367 return vl_vb_get_mv_stream_stride(&buf
->vertex_stream
);
370 static struct pipe_motionvector
*
371 vl_mpeg12_buffer_get_mv_stream(struct pipe_video_decode_buffer
*buffer
, int ref_frame
)
373 struct vl_mpeg12_buffer
*buf
= (struct vl_mpeg12_buffer
*)buffer
;
377 return vl_vb_get_mv_stream(&buf
->vertex_stream
, ref_frame
);
381 vl_mpeg12_buffer_decode_bitstream(struct pipe_video_decode_buffer
*buffer
,
382 unsigned num_bytes
, const void *data
,
383 struct pipe_picture_desc
*picture
,
384 unsigned num_ycbcr_blocks
[3])
386 struct vl_mpeg12_buffer
*buf
= (struct vl_mpeg12_buffer
*)buffer
;
387 struct pipe_mpeg12_picture_desc
*pic
= (struct pipe_mpeg12_picture_desc
*)picture
;
389 struct vl_mpeg12_decoder
*dec
;
394 dec
= (struct vl_mpeg12_decoder
*)buf
->base
.decoder
;
397 for (i
= 0; i
< VL_MAX_PLANES
; ++i
)
398 vl_zscan_set_layout(&buf
->zscan
[i
], pic
->alternate_scan
? dec
->zscan_alternate
: dec
->zscan_normal
);
400 vl_mpg12_bs_decode(&buf
->bs
, num_bytes
, data
, pic
, num_ycbcr_blocks
);
404 vl_mpeg12_buffer_end_frame(struct pipe_video_decode_buffer
*buffer
)
406 struct vl_mpeg12_buffer
*buf
= (struct vl_mpeg12_buffer
*)buffer
;
407 struct vl_mpeg12_decoder
*dec
;
412 dec
= (struct vl_mpeg12_decoder
*)buf
->base
.decoder
;
415 vl_vb_unmap(&buf
->vertex_stream
, dec
->base
.context
);
417 for (i
= 0; i
< VL_MAX_PLANES
; ++i
) {
418 dec
->base
.context
->transfer_unmap(dec
->base
.context
, buf
->tex_transfer
[i
]);
419 dec
->base
.context
->transfer_destroy(dec
->base
.context
, buf
->tex_transfer
[i
]);
424 vl_mpeg12_destroy(struct pipe_video_decoder
*decoder
)
426 struct vl_mpeg12_decoder
*dec
= (struct vl_mpeg12_decoder
*)decoder
;
430 /* Asserted in softpipe_delete_fs_state() for some reason */
431 dec
->base
.context
->bind_vs_state(dec
->base
.context
, NULL
);
432 dec
->base
.context
->bind_fs_state(dec
->base
.context
, NULL
);
434 dec
->base
.context
->delete_depth_stencil_alpha_state(dec
->base
.context
, dec
->dsa
);
435 dec
->base
.context
->delete_sampler_state(dec
->base
.context
, dec
->sampler_ycbcr
);
437 vl_mc_cleanup(&dec
->mc_y
);
438 vl_mc_cleanup(&dec
->mc_c
);
439 dec
->mc_source
->destroy(dec
->mc_source
);
441 if (dec
->base
.entrypoint
<= PIPE_VIDEO_ENTRYPOINT_IDCT
) {
442 vl_idct_cleanup(&dec
->idct_y
);
443 vl_idct_cleanup(&dec
->idct_c
);
444 dec
->idct_source
->destroy(dec
->idct_source
);
447 vl_zscan_cleanup(&dec
->zscan_y
);
448 vl_zscan_cleanup(&dec
->zscan_c
);
450 dec
->base
.context
->delete_vertex_elements_state(dec
->base
.context
, dec
->ves_ycbcr
);
451 dec
->base
.context
->delete_vertex_elements_state(dec
->base
.context
, dec
->ves_mv
);
453 pipe_resource_reference(&dec
->quads
.buffer
, NULL
);
454 pipe_resource_reference(&dec
->pos
.buffer
, NULL
);
455 pipe_resource_reference(&dec
->block_num
.buffer
, NULL
);
457 pipe_sampler_view_reference(&dec
->zscan_linear
, NULL
);
458 pipe_sampler_view_reference(&dec
->zscan_normal
, NULL
);
459 pipe_sampler_view_reference(&dec
->zscan_alternate
, NULL
);
464 static struct pipe_video_decode_buffer
*
465 vl_mpeg12_create_buffer(struct pipe_video_decoder
*decoder
)
467 struct vl_mpeg12_decoder
*dec
= (struct vl_mpeg12_decoder
*)decoder
;
468 struct vl_mpeg12_buffer
*buffer
;
472 buffer
= CALLOC_STRUCT(vl_mpeg12_buffer
);
476 buffer
->base
.decoder
= decoder
;
477 buffer
->base
.destroy
= vl_mpeg12_buffer_destroy
;
478 buffer
->base
.begin_frame
= vl_mpeg12_buffer_begin_frame
;
479 buffer
->base
.set_quant_matrix
= vl_mpeg12_buffer_set_quant_matrix
;
480 buffer
->base
.get_ycbcr_stream
= vl_mpeg12_buffer_get_ycbcr_stream
;
481 buffer
->base
.get_ycbcr_buffer
= vl_mpeg12_buffer_get_ycbcr_buffer
;
482 buffer
->base
.get_mv_stream_stride
= vl_mpeg12_buffer_get_mv_stream_stride
;
483 buffer
->base
.get_mv_stream
= vl_mpeg12_buffer_get_mv_stream
;
484 buffer
->base
.decode_bitstream
= vl_mpeg12_buffer_decode_bitstream
;
485 buffer
->base
.end_frame
= vl_mpeg12_buffer_end_frame
;
487 if (!vl_vb_init(&buffer
->vertex_stream
, dec
->base
.context
,
488 dec
->base
.width
/ MACROBLOCK_WIDTH
,
489 dec
->base
.height
/ MACROBLOCK_HEIGHT
))
490 goto error_vertex_buffer
;
492 if (!init_mc_buffer(buffer
))
495 if (dec
->base
.entrypoint
<= PIPE_VIDEO_ENTRYPOINT_IDCT
)
496 if (!init_idct_buffer(buffer
))
499 if (!init_zscan_buffer(buffer
))
502 if (dec
->base
.entrypoint
== PIPE_VIDEO_ENTRYPOINT_BITSTREAM
)
503 vl_mpg12_bs_init(&buffer
->bs
,
504 dec
->base
.width
/ MACROBLOCK_WIDTH
,
505 dec
->base
.height
/ MACROBLOCK_HEIGHT
);
507 return &buffer
->base
;
510 if (dec
->base
.entrypoint
<= PIPE_VIDEO_ENTRYPOINT_IDCT
)
511 cleanup_idct_buffer(buffer
);
514 cleanup_mc_buffer(buffer
);
517 vl_vb_cleanup(&buffer
->vertex_stream
);
525 vl_mpeg12_decoder_flush_buffer(struct pipe_video_decode_buffer
*buffer
,
526 unsigned num_ycbcr_blocks
[3],
527 struct pipe_video_buffer
*refs
[2],
528 struct pipe_video_buffer
*dst
)
530 struct vl_mpeg12_buffer
*buf
= (struct vl_mpeg12_buffer
*)buffer
;
531 struct vl_mpeg12_decoder
*dec
;
533 struct pipe_sampler_view
**sv
[VL_MAX_REF_FRAMES
], **mc_source_sv
;
534 struct pipe_surface
**surfaces
;
536 struct pipe_vertex_buffer vb
[3];
538 unsigned i
, j
, component
;
539 unsigned nr_components
;
543 dec
= (struct vl_mpeg12_decoder
*)buf
->base
.decoder
;
546 for (i
= 0; i
< 2; ++i
)
547 sv
[i
] = refs
[i
] ? refs
[i
]->get_sampler_view_planes(refs
[i
]) : NULL
;
552 surfaces
= dst
->get_surfaces(dst
);
554 dec
->base
.context
->bind_vertex_elements_state(dec
->base
.context
, dec
->ves_mv
);
555 for (i
= 0; i
< VL_MAX_PLANES
; ++i
) {
556 if (!surfaces
[i
]) continue;
558 vl_mc_set_surface(&buf
->mc
[i
], surfaces
[i
]);
560 for (j
= 0; j
< VL_MAX_REF_FRAMES
; ++j
) {
561 if (!sv
[j
]) continue;
563 vb
[2] = vl_vb_get_mv(&buf
->vertex_stream
, j
);;
564 dec
->base
.context
->set_vertex_buffers(dec
->base
.context
, 3, vb
);
566 vl_mc_render_ref(&buf
->mc
[i
], sv
[j
][i
]);
570 vb
[2] = dec
->block_num
;
572 dec
->base
.context
->bind_vertex_elements_state(dec
->base
.context
, dec
->ves_ycbcr
);
573 for (i
= 0; i
< VL_MAX_PLANES
; ++i
) {
574 if (!num_ycbcr_blocks
[i
]) continue;
576 vb
[1] = vl_vb_get_ycbcr(&buf
->vertex_stream
, i
);
577 dec
->base
.context
->set_vertex_buffers(dec
->base
.context
, 3, vb
);
579 vl_zscan_render(&buf
->zscan
[i
] , num_ycbcr_blocks
[i
]);
581 if (dec
->base
.entrypoint
<= PIPE_VIDEO_ENTRYPOINT_IDCT
)
582 vl_idct_flush(&buf
->idct
[i
], num_ycbcr_blocks
[i
]);
585 mc_source_sv
= dec
->mc_source
->get_sampler_view_planes(dec
->mc_source
);
586 for (i
= 0, component
= 0; i
< VL_MAX_PLANES
; ++i
) {
587 if (!surfaces
[i
]) continue;
589 nr_components
= util_format_get_nr_components(surfaces
[i
]->texture
->format
);
590 for (j
= 0; j
< nr_components
; ++j
, ++component
) {
591 if (!num_ycbcr_blocks
[i
]) continue;
593 vb
[1] = vl_vb_get_ycbcr(&buf
->vertex_stream
, component
);
594 dec
->base
.context
->set_vertex_buffers(dec
->base
.context
, 3, vb
);
596 if (dec
->base
.entrypoint
<= PIPE_VIDEO_ENTRYPOINT_IDCT
)
597 vl_idct_prepare_stage2(&buf
->idct
[component
]);
599 dec
->base
.context
->set_fragment_sampler_views(dec
->base
.context
, 1, &mc_source_sv
[component
]);
600 dec
->base
.context
->bind_fragment_sampler_states(dec
->base
.context
, 1, &dec
->sampler_ycbcr
);
602 vl_mc_render_ycbcr(&buf
->mc
[i
], j
, num_ycbcr_blocks
[component
]);
608 init_pipe_state(struct vl_mpeg12_decoder
*dec
)
610 struct pipe_depth_stencil_alpha_state dsa
;
611 struct pipe_sampler_state sampler
;
616 memset(&dsa
, 0, sizeof dsa
);
617 dsa
.depth
.enabled
= 0;
618 dsa
.depth
.writemask
= 0;
619 dsa
.depth
.func
= PIPE_FUNC_ALWAYS
;
620 for (i
= 0; i
< 2; ++i
) {
621 dsa
.stencil
[i
].enabled
= 0;
622 dsa
.stencil
[i
].func
= PIPE_FUNC_ALWAYS
;
623 dsa
.stencil
[i
].fail_op
= PIPE_STENCIL_OP_KEEP
;
624 dsa
.stencil
[i
].zpass_op
= PIPE_STENCIL_OP_KEEP
;
625 dsa
.stencil
[i
].zfail_op
= PIPE_STENCIL_OP_KEEP
;
626 dsa
.stencil
[i
].valuemask
= 0;
627 dsa
.stencil
[i
].writemask
= 0;
629 dsa
.alpha
.enabled
= 0;
630 dsa
.alpha
.func
= PIPE_FUNC_ALWAYS
;
631 dsa
.alpha
.ref_value
= 0;
632 dec
->dsa
= dec
->base
.context
->create_depth_stencil_alpha_state(dec
->base
.context
, &dsa
);
633 dec
->base
.context
->bind_depth_stencil_alpha_state(dec
->base
.context
, dec
->dsa
);
635 memset(&sampler
, 0, sizeof(sampler
));
636 sampler
.wrap_s
= PIPE_TEX_WRAP_CLAMP_TO_EDGE
;
637 sampler
.wrap_t
= PIPE_TEX_WRAP_CLAMP_TO_EDGE
;
638 sampler
.wrap_r
= PIPE_TEX_WRAP_CLAMP_TO_BORDER
;
639 sampler
.min_img_filter
= PIPE_TEX_FILTER_NEAREST
;
640 sampler
.min_mip_filter
= PIPE_TEX_MIPFILTER_NONE
;
641 sampler
.mag_img_filter
= PIPE_TEX_FILTER_NEAREST
;
642 sampler
.compare_mode
= PIPE_TEX_COMPARE_NONE
;
643 sampler
.compare_func
= PIPE_FUNC_ALWAYS
;
644 sampler
.normalized_coords
= 1;
645 dec
->sampler_ycbcr
= dec
->base
.context
->create_sampler_state(dec
->base
.context
, &sampler
);
646 if (!dec
->sampler_ycbcr
)
652 static const struct format_config
*
653 find_format_config(struct vl_mpeg12_decoder
*dec
, const struct format_config configs
[], unsigned num_configs
)
655 struct pipe_screen
*screen
;
660 screen
= dec
->base
.context
->screen
;
662 for (i
= 0; i
< num_configs
; ++i
) {
663 if (!screen
->is_format_supported(screen
, configs
[i
].zscan_source_format
, PIPE_TEXTURE_2D
,
664 1, PIPE_BIND_SAMPLER_VIEW
))
667 if (configs
[i
].idct_source_format
!= PIPE_FORMAT_NONE
) {
668 if (!screen
->is_format_supported(screen
, configs
[i
].idct_source_format
, PIPE_TEXTURE_2D
,
669 1, PIPE_BIND_SAMPLER_VIEW
| PIPE_BIND_RENDER_TARGET
))
672 if (!screen
->is_format_supported(screen
, configs
[i
].mc_source_format
, PIPE_TEXTURE_3D
,
673 1, PIPE_BIND_SAMPLER_VIEW
| PIPE_BIND_RENDER_TARGET
))
676 if (!screen
->is_format_supported(screen
, configs
[i
].mc_source_format
, PIPE_TEXTURE_2D
,
677 1, PIPE_BIND_SAMPLER_VIEW
| PIPE_BIND_RENDER_TARGET
))
687 init_zscan(struct vl_mpeg12_decoder
*dec
, const struct format_config
* format_config
)
689 unsigned num_channels
;
693 dec
->zscan_source_format
= format_config
->zscan_source_format
;
694 dec
->zscan_linear
= vl_zscan_layout(dec
->base
.context
, vl_zscan_linear
, dec
->blocks_per_line
);
695 dec
->zscan_normal
= vl_zscan_layout(dec
->base
.context
, vl_zscan_normal
, dec
->blocks_per_line
);
696 dec
->zscan_alternate
= vl_zscan_layout(dec
->base
.context
, vl_zscan_alternate
, dec
->blocks_per_line
);
698 num_channels
= dec
->base
.entrypoint
<= PIPE_VIDEO_ENTRYPOINT_IDCT
? 4 : 1;
700 if (!vl_zscan_init(&dec
->zscan_y
, dec
->base
.context
, dec
->base
.width
, dec
->base
.height
,
701 dec
->blocks_per_line
, dec
->num_blocks
, num_channels
))
704 if (!vl_zscan_init(&dec
->zscan_c
, dec
->base
.context
, dec
->chroma_width
, dec
->chroma_height
,
705 dec
->blocks_per_line
, dec
->num_blocks
, num_channels
))
712 init_idct(struct vl_mpeg12_decoder
*dec
, const struct format_config
* format_config
)
714 unsigned nr_of_idct_render_targets
, max_inst
;
715 enum pipe_format formats
[3];
717 struct pipe_sampler_view
*matrix
= NULL
;
719 nr_of_idct_render_targets
= dec
->base
.context
->screen
->get_param
721 dec
->base
.context
->screen
, PIPE_CAP_MAX_RENDER_TARGETS
724 max_inst
= dec
->base
.context
->screen
->get_shader_param
726 dec
->base
.context
->screen
, PIPE_SHADER_FRAGMENT
, PIPE_SHADER_CAP_MAX_INSTRUCTIONS
729 // Just assume we need 32 inst per render target, not 100% true, but should work in most cases
730 if (nr_of_idct_render_targets
>= 4 && max_inst
>= 32*4)
731 // more than 4 render targets usually doesn't makes any seens
732 nr_of_idct_render_targets
= 4;
734 nr_of_idct_render_targets
= 1;
736 formats
[0] = formats
[1] = formats
[2] = format_config
->idct_source_format
;
737 dec
->idct_source
= vl_video_buffer_create_ex
739 dec
->base
.context
, dec
->base
.width
/ 4, dec
->base
.height
, 1,
740 dec
->base
.chroma_format
, formats
, PIPE_USAGE_STATIC
743 if (!dec
->idct_source
)
744 goto error_idct_source
;
746 formats
[0] = formats
[1] = formats
[2] = format_config
->mc_source_format
;
747 dec
->mc_source
= vl_video_buffer_create_ex
749 dec
->base
.context
, dec
->base
.width
/ nr_of_idct_render_targets
,
750 dec
->base
.height
/ 4, nr_of_idct_render_targets
,
751 dec
->base
.chroma_format
, formats
, PIPE_USAGE_STATIC
755 goto error_mc_source
;
757 if (!(matrix
= vl_idct_upload_matrix(dec
->base
.context
, format_config
->idct_scale
)))
760 if (!vl_idct_init(&dec
->idct_y
, dec
->base
.context
, dec
->base
.width
, dec
->base
.height
,
761 nr_of_idct_render_targets
, matrix
, matrix
))
764 if(!vl_idct_init(&dec
->idct_c
, dec
->base
.context
, dec
->chroma_width
, dec
->chroma_height
,
765 nr_of_idct_render_targets
, matrix
, matrix
))
768 pipe_sampler_view_reference(&matrix
, NULL
);
773 vl_idct_cleanup(&dec
->idct_y
);
776 pipe_sampler_view_reference(&matrix
, NULL
);
779 dec
->mc_source
->destroy(dec
->mc_source
);
782 dec
->idct_source
->destroy(dec
->idct_source
);
789 init_mc_source_widthout_idct(struct vl_mpeg12_decoder
*dec
, const struct format_config
* format_config
)
791 enum pipe_format formats
[3];
793 formats
[0] = formats
[1] = formats
[2] = format_config
->mc_source_format
;
794 dec
->mc_source
= vl_video_buffer_create_ex
796 dec
->base
.context
, dec
->base
.width
, dec
->base
.height
, 1,
797 dec
->base
.chroma_format
, formats
, PIPE_USAGE_STATIC
800 return dec
->mc_source
!= NULL
;
/*
 * Vertex shader callback handed to vl_mc_init() by
 * vl_create_mpeg12_decoder(); `priv` is the decoder.
 *
 * For entrypoints up to and including PIPE_VIDEO_ENTRYPOINT_IDCT it lets
 * the IDCT object matching `mc` (idct_y for &dec->mc_y, idct_c otherwise)
 * emit its stage 2 vertex shader code. The remaining visible statements
 * declare a generic output at `first_output` and copy the XY components of
 * `tex` into it.
 *
 * NOTE(review): this listing omits several original lines, among them the
 * return type and the declaration of the `tex` parameter.
 */
804 mc_vert_shader_callback(void *priv
, struct vl_mc
*mc
,
805 struct ureg_program
*shader
,
806 unsigned first_output
,
809 struct vl_mpeg12_decoder
*dec
= priv
;
810 struct ureg_dst o_vtex
;
815 if (dec
->base
.entrypoint
<= PIPE_VIDEO_ENTRYPOINT_IDCT
) {
/* Luma and chroma use separate IDCT objects; pick the one paired with mc. */
816 struct vl_idct
*idct
= mc
== &dec
->mc_y
? &dec
->idct_y
: &dec
->idct_c
;
817 vl_idct_stage2_vert_shader(idct
, shader
, first_output
, tex
);
/* NOTE(review): presumably the `else` branch (no IDCT stage) - the line
 * between is not visible; confirm. */
819 o_vtex
= ureg_DECL_output(shader
, TGSI_SEMANTIC_GENERIC
, first_output
);
820 ureg_MOV(shader
, ureg_writemask(o_vtex
, TGSI_WRITEMASK_XY
), ureg_src(tex
));
/*
 * Fragment shader callback handed to vl_mc_init() by
 * vl_create_mpeg12_decoder(); `priv` is the decoder.
 *
 * For entrypoints up to and including PIPE_VIDEO_ENTRYPOINT_IDCT it lets
 * the IDCT object matching `mc` (idct_y for &dec->mc_y, idct_c otherwise)
 * emit its stage 2 fragment shader code. The remaining visible statements
 * declare a linearly interpolated generic input at `first_input` and
 * sampler 0, and fetch a 2D texel into `dst`.
 *
 * NOTE(review): this listing omits several original lines, among them the
 * return type and the declaration of the `dst` parameter.
 */
825 mc_frag_shader_callback(void *priv
, struct vl_mc
*mc
,
826 struct ureg_program
*shader
,
827 unsigned first_input
,
830 struct vl_mpeg12_decoder
*dec
= priv
;
831 struct ureg_src src
, sampler
;
836 if (dec
->base
.entrypoint
<= PIPE_VIDEO_ENTRYPOINT_IDCT
) {
/* Luma and chroma use separate IDCT objects; pick the one paired with mc. */
837 struct vl_idct
*idct
= mc
== &dec
->mc_y
? &dec
->idct_y
: &dec
->idct_c
;
838 vl_idct_stage2_frag_shader(idct
, shader
, first_input
, dst
);
/* NOTE(review): presumably the `else` branch (no IDCT stage) - the line
 * between is not visible; confirm. */
840 src
= ureg_DECL_fs_input(shader
, TGSI_SEMANTIC_GENERIC
, first_input
, TGSI_INTERPOLATE_LINEAR
);
841 sampler
= ureg_DECL_sampler(shader
, 0);
842 ureg_TEX(shader
, dst
, TGSI_TEXTURE_2D
, src
, sampler
);
846 struct pipe_video_decoder
*
847 vl_create_mpeg12_decoder(struct pipe_context
*context
,
848 enum pipe_video_profile profile
,
849 enum pipe_video_entrypoint entrypoint
,
850 enum pipe_video_chroma_format chroma_format
,
851 unsigned width
, unsigned height
)
853 const unsigned block_size_pixels
= BLOCK_WIDTH
* BLOCK_HEIGHT
;
854 const struct format_config
*format_config
;
855 struct vl_mpeg12_decoder
*dec
;
857 assert(u_reduce_video_profile(profile
) == PIPE_VIDEO_CODEC_MPEG12
);
859 dec
= CALLOC_STRUCT(vl_mpeg12_decoder
);
864 dec
->base
.context
= context
;
865 dec
->base
.profile
= profile
;
866 dec
->base
.entrypoint
= entrypoint
;
867 dec
->base
.chroma_format
= chroma_format
;
868 dec
->base
.width
= width
;
869 dec
->base
.height
= height
;
871 dec
->base
.destroy
= vl_mpeg12_destroy
;
872 dec
->base
.create_buffer
= vl_mpeg12_create_buffer
;
873 dec
->base
.flush_buffer
= vl_mpeg12_decoder_flush_buffer
;
875 dec
->blocks_per_line
= MAX2(util_next_power_of_two(dec
->base
.width
) / block_size_pixels
, 4);
876 dec
->num_blocks
= (dec
->base
.width
* dec
->base
.height
) / block_size_pixels
;
878 dec
->quads
= vl_vb_upload_quads(dec
->base
.context
);
879 dec
->pos
= vl_vb_upload_pos(
881 dec
->base
.width
/ MACROBLOCK_WIDTH
,
882 dec
->base
.height
/ MACROBLOCK_HEIGHT
884 dec
->block_num
= vl_vb_upload_block_num(dec
->base
.context
, dec
->num_blocks
);
886 dec
->ves_ycbcr
= vl_vb_get_ves_ycbcr(dec
->base
.context
);
887 dec
->ves_mv
= vl_vb_get_ves_mv(dec
->base
.context
);
889 /* TODO: Implement 422, 444 */
890 assert(dec
->base
.chroma_format
== PIPE_VIDEO_CHROMA_FORMAT_420
);
892 if (dec
->base
.chroma_format
== PIPE_VIDEO_CHROMA_FORMAT_420
) {
893 dec
->chroma_width
= dec
->base
.width
/ 2;
894 dec
->chroma_height
= dec
->base
.height
/ 2;
895 } else if (dec
->base
.chroma_format
== PIPE_VIDEO_CHROMA_FORMAT_422
) {
896 dec
->chroma_width
= dec
->base
.width
;
897 dec
->chroma_height
= dec
->base
.height
/ 2;
899 dec
->chroma_width
= dec
->base
.width
;
900 dec
->chroma_height
= dec
->base
.height
;
903 switch (entrypoint
) {
904 case PIPE_VIDEO_ENTRYPOINT_BITSTREAM
:
905 format_config
= find_format_config(dec
, bitstream_format_config
, num_bitstream_format_configs
);
908 case PIPE_VIDEO_ENTRYPOINT_IDCT
:
909 format_config
= find_format_config(dec
, idct_format_config
, num_idct_format_configs
);
912 case PIPE_VIDEO_ENTRYPOINT_MC
:
913 format_config
= find_format_config(dec
, mc_format_config
, num_mc_format_configs
);
924 if (!init_zscan(dec
, format_config
))
927 if (entrypoint
<= PIPE_VIDEO_ENTRYPOINT_IDCT
) {
928 if (!init_idct(dec
, format_config
))
931 if (!init_mc_source_widthout_idct(dec
, format_config
))
935 if (!vl_mc_init(&dec
->mc_y
, dec
->base
.context
, dec
->base
.width
, dec
->base
.height
,
936 MACROBLOCK_HEIGHT
, format_config
->mc_scale
,
937 mc_vert_shader_callback
, mc_frag_shader_callback
, dec
))
941 if (!vl_mc_init(&dec
->mc_c
, dec
->base
.context
, dec
->base
.width
, dec
->base
.height
,
942 BLOCK_HEIGHT
, format_config
->mc_scale
,
943 mc_vert_shader_callback
, mc_frag_shader_callback
, dec
))
946 if (!init_pipe_state(dec
))
947 goto error_pipe_state
;
952 vl_mc_cleanup(&dec
->mc_c
);
955 vl_mc_cleanup(&dec
->mc_y
);
958 if (entrypoint
<= PIPE_VIDEO_ENTRYPOINT_IDCT
) {
959 vl_idct_cleanup(&dec
->idct_y
);
960 vl_idct_cleanup(&dec
->idct_c
);
961 dec
->idct_source
->destroy(dec
->idct_source
);
963 dec
->mc_source
->destroy(dec
->mc_source
);
966 vl_zscan_cleanup(&dec
->zscan_y
);
967 vl_zscan_cleanup(&dec
->zscan_c
);