2 * Copyright (c) 2017-2019 Lima Project
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sub license,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the
12 * next paragraph) shall be included in all copies or substantial portions
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
25 #include "util/u_memory.h"
26 #include "util/ralloc.h"
27 #include "util/u_debug.h"
29 #include "tgsi/tgsi_dump.h"
30 #include "compiler/nir/nir.h"
31 #include "nir/tgsi_to_nir.h"
33 #include "pipe/p_state.h"
35 #include "lima_screen.h"
36 #include "lima_context.h"
37 #include "lima_program.h"
39 #include "ir/lima_ir.h"
/* NIR compiler options for the vertex stage; this is the object that
 * lima_program_get_compiler_options() returns for PIPE_SHADER_VERTEX.
 * NOTE(review): the initializer's fields are not visible in this extract. */
41 static const nir_shader_compiler_options vs_nir_options
= {
52 /* could be implemented by clamp */
/* NIR compiler options for the fragment stage; this is the object that
 * lima_program_get_compiler_options() returns for PIPE_SHADER_FRAGMENT.
 * NOTE(review): only the .lower_vector_cmp field is visible in this extract;
 * the remaining initializer fields need to be checked in the full file. */
59 static const nir_shader_compiler_options fs_nir_options
= {
71 .lower_vector_cmp
= true,
/* Options passed to nir_lower_tex by lima_program_optimize_fs_nir().
 * NOTE(review): the initializer's fields are not visible in this extract. */
74 static const struct nir_lower_tex_options tex_options
= {
/* Select the NIR compiler options for a shader stage: PIPE_SHADER_VERTEX
 * yields a pointer to vs_nir_options and PIPE_SHADER_FRAGMENT a pointer to
 * fs_nir_options.
 * NOTE(review): the return type, the switch header and any default case are
 * not visible in this extract -- confirm how other stages are handled. */
79 lima_program_get_compiler_options(enum pipe_shader_type shader
)
82 case PIPE_SHADER_VERTEX
:
83 return &vs_nir_options
;
84 case PIPE_SHADER_FRAGMENT
:
85 return &fs_nir_options
;
/* Size callback handed to nir_lower_io by both optimize functions in this
 * file. The result is whatever glsl_count_attribute_slots() reports for
 * `type` with its second argument fixed to false. The `bindless` parameter
 * is not used by the visible code. */
92 type_size(const struct glsl_type
*type
, bool bindless
)
94 return glsl_count_attribute_slots(type
, false);
/* Run the vertex-shader NIR pass pipeline on `s`, in this order:
 * lowering passes, a block of optimization passes that report into
 * `progress`, int/bool-to-float lowering followed by another algebraic
 * pass, and a final cleanup that leaves SSA form.
 * NOTE(review): the declaration of `progress` and whatever loop construct
 * surrounds the NIR_PASS(progress, ...) groups are not visible in this
 * extract -- presumably they repeat until no pass reports progress; confirm
 * against the full file. */
98 lima_program_optimize_vs_nir(struct nir_shader
*s
)
/* Lowering: viewport transform, I/O for all variable modes (sized by
 * type_size), then scalarization of constants, uniforms and shader
 * inputs/outputs. */
102 NIR_PASS_V(s
, nir_lower_viewport_transform
);
103 NIR_PASS_V(s
, nir_lower_io
, nir_var_all
, type_size
, 0);
104 NIR_PASS_V(s
, nir_lower_load_const_to_scalar
);
105 NIR_PASS_V(s
, lima_nir_lower_uniform_to_scalar
);
106 NIR_PASS_V(s
, nir_lower_io_to_scalar
,
107 nir_var_shader_in
|nir_var_shader_out
);
/* Optimization passes. nir_lower_alu_to_scalar is given NULL here, whereas
 * the fragment path passes an explicit opcode set. */
112 NIR_PASS_V(s
, nir_lower_vars_to_ssa
);
113 NIR_PASS(progress
, s
, nir_lower_alu_to_scalar
, NULL
);
114 NIR_PASS(progress
, s
, nir_lower_phis_to_scalar
);
115 NIR_PASS(progress
, s
, nir_copy_prop
);
116 NIR_PASS(progress
, s
, nir_opt_remove_phis
);
117 NIR_PASS(progress
, s
, nir_opt_dce
);
118 NIR_PASS(progress
, s
, nir_opt_dead_cf
);
119 NIR_PASS(progress
, s
, nir_opt_cse
);
120 NIR_PASS(progress
, s
, nir_opt_peephole_select
, 8, true, true);
121 NIR_PASS(progress
, s
, nir_opt_algebraic
);
122 NIR_PASS(progress
, s
, nir_opt_constant_folding
);
123 NIR_PASS(progress
, s
, nir_opt_undef
);
124 NIR_PASS(progress
, s
, nir_opt_loop_unroll
,
127 nir_var_function_temp
);
/* Convert integer and boolean operations to float ones. */
130 NIR_PASS_V(s
, nir_lower_int_to_float
);
131 NIR_PASS_V(s
, nir_lower_bool_to_float
);
133 /* Some ops must be lowered after being converted from int ops,
134 * so re-run nir_opt_algebraic after int lowering. */
137 NIR_PASS(progress
, s
, nir_opt_algebraic
);
/* Final cleanup: propagate copies, drop dead code, turn locals into
 * registers, leave SSA form and remove dead function-temp variables. */
140 NIR_PASS_V(s
, nir_copy_prop
);
141 NIR_PASS_V(s
, nir_opt_dce
);
142 NIR_PASS_V(s
, nir_lower_locals_to_regs
);
143 NIR_PASS_V(s
, nir_convert_from_ssa
, true);
144 NIR_PASS_V(s
, nir_remove_dead_variables
, nir_var_function_temp
);
/* Run the fragment-shader NIR pass pipeline on `s`, in this order:
 * build the `alu_lower` opcode set, lowering passes, a block of
 * optimization passes that report into `progress`, int/bool-to-float
 * lowering, trig scaling, source-modifier lowering, and a final cleanup
 * that leaves SSA form and lowers vecs to moves.
 * NOTE(review): the declaration of `progress` and whatever loop construct
 * surrounds the NIR_PASS(progress, ...) groups are not visible in this
 * extract -- presumably they repeat until no pass reports progress; confirm
 * against the full file. */
149 lima_program_optimize_fs_nir(struct nir_shader
*s
)
/* Opcode bitset, zero-initialised and sized by nir_num_opcodes. It is later
 * passed to nir_lower_alu_to_scalar; presumably it names the ALU opcodes
 * that pass should scalarize -- confirm against the pass's documentation. */
151 BITSET_DECLARE(alu_lower
, nir_num_opcodes
) = {0};
154 BITSET_SET(alu_lower
, nir_op_frcp
);
155 BITSET_SET(alu_lower
, nir_op_frsq
);
156 BITSET_SET(alu_lower
, nir_op_flog2
);
157 BITSET_SET(alu_lower
, nir_op_fexp2
);
158 BITSET_SET(alu_lower
, nir_op_fsqrt
);
159 BITSET_SET(alu_lower
, nir_op_fsin
);
160 BITSET_SET(alu_lower
, nir_op_fcos
);
161 /* nir vec4 fcsel assumes that each component of the condition will be
162 * used to select the same component from the two options, but lima
163 * can't implement that since we only have 1 component condition */
164 BITSET_SET(alu_lower
, nir_op_fcsel
);
165 BITSET_SET(alu_lower
, nir_op_bcsel
);
/* Lowering: fragcoord w transform, I/O for all variable modes (sized by
 * type_size), registers to SSA, and texture lowering with tex_options. */
167 NIR_PASS_V(s
, nir_lower_fragcoord_wtrans
);
168 NIR_PASS_V(s
, nir_lower_io
, nir_var_all
, type_size
, 0);
169 NIR_PASS_V(s
, nir_lower_regs_to_ssa
);
170 NIR_PASS_V(s
, nir_lower_tex
, &tex_options
);
/* Optimization passes; unlike the vertex path this block starts with
 * nir_opt_vectorize and hands alu_lower to nir_lower_alu_to_scalar. */
174 NIR_PASS(progress
, s
, nir_opt_vectorize
);
180 NIR_PASS_V(s
, nir_lower_vars_to_ssa
);
181 NIR_PASS(progress
, s
, nir_lower_alu_to_scalar
, alu_lower
);
182 NIR_PASS(progress
, s
, nir_lower_phis_to_scalar
);
183 NIR_PASS(progress
, s
, nir_copy_prop
);
184 NIR_PASS(progress
, s
, nir_opt_remove_phis
);
185 NIR_PASS(progress
, s
, nir_opt_dce
);
186 NIR_PASS(progress
, s
, nir_opt_dead_cf
);
187 NIR_PASS(progress
, s
, nir_opt_cse
);
188 NIR_PASS(progress
, s
, nir_opt_peephole_select
, 8, true, true);
189 NIR_PASS(progress
, s
, nir_opt_algebraic
);
190 NIR_PASS(progress
, s
, nir_opt_constant_folding
);
191 NIR_PASS(progress
, s
, nir_opt_undef
);
192 NIR_PASS(progress
, s
, nir_opt_loop_unroll
,
195 nir_var_function_temp
);
/* Convert integer and boolean operations to float ones. */
198 NIR_PASS_V(s
, nir_lower_int_to_float
);
199 NIR_PASS_V(s
, nir_lower_bool_to_float
);
201 /* Some ops must be lowered after being converted from int ops,
202 * so re-run nir_opt_algebraic after int lowering. */
205 NIR_PASS(progress
, s
, nir_opt_algebraic
);
208 /* Must be run after optimization loop */
209 NIR_PASS_V(s
, lima_nir_scale_trig
);
211 /* Lower modifiers */
212 NIR_PASS_V(s
, nir_lower_to_source_mods
, nir_lower_all_source_mods
);
213 NIR_PASS_V(s
, nir_copy_prop
);
214 NIR_PASS_V(s
, nir_opt_dce
);
/* Final cleanup: turn locals into registers, leave SSA form, remove dead
 * function-temp variables, then rewrite vec sources and lower vecs to
 * moves. */
216 NIR_PASS_V(s
, nir_lower_locals_to_regs
);
217 NIR_PASS_V(s
, nir_convert_from_ssa
, true);
218 NIR_PASS_V(s
, nir_remove_dead_variables
, nir_var_function_temp
);
220 NIR_PASS_V(s
, nir_move_vec_src_uses_to_dest
);
221 NIR_PASS_V(s
, nir_lower_vec_to_movs
);
/* Create the fragment shader state for `cso`; installed as the context's
 * create_fs_state hook by lima_program_init().
 *
 * Visible steps: allocate a lima_fs_shader_state with rzalloc (NULL as its
 * first argument), obtain a NIR shader (from the TGSI tokens via
 * tgsi_to_nir when the IR type is TGSI), run lima_program_optimize_fs_nir
 * on it, print it to stdout when LIMA_DEBUG_PP is set in lima_debug, and
 * compile it with ppir_compile_nir using screen->pp_ra and &ctx->debug.
 *
 * NOTE(review): the allocation check, the declaration of `nir`, the body of
 * the PIPE_SHADER_IR_NIR branch, the handling of a failed compile and the
 * return statements are not visible in this extract. Also confirm who owns
 * and frees the NIR shader produced by tgsi_to_nir. */
227 lima_create_fs_state(struct pipe_context
*pctx
,
228 const struct pipe_shader_state
*cso
)
230 struct lima_context
*ctx
= lima_context(pctx
);
231 struct lima_screen
*screen
= lima_screen(pctx
->screen
);
232 struct lima_fs_shader_state
*so
= rzalloc(NULL
, struct lima_fs_shader_state
);
238 if (cso
->type
== PIPE_SHADER_IR_NIR
)
/* Presumably the else branch: anything that is not NIR must be TGSI. */
241 assert(cso
->type
== PIPE_SHADER_IR_TGSI
);
243 nir
= tgsi_to_nir(cso
->tokens
, pctx
->screen
);
246 lima_program_optimize_fs_nir(nir
);
248 if (lima_debug
& LIMA_DEBUG_PP
)
249 nir_print_shader(nir
, stdout
);
251 if (!ppir_compile_nir(so
, nir
, screen
->pp_ra
, &ctx
->debug
)) {
/* bind_fs_state hook: flags the fragment shader as dirty by OR-ing
 * LIMA_CONTEXT_DIRTY_SHADER_FRAG into ctx->dirty.
 * NOTE(review): the statement that stores `hwcso` in the context is not
 * visible in this extract -- confirm against the full file. */
260 lima_bind_fs_state(struct pipe_context
*pctx
, void *hwcso
)
262 struct lima_context
*ctx
= lima_context(pctx
);
265 ctx
->dirty
|= LIMA_CONTEXT_DIRTY_SHADER_FRAG
;
/* delete_fs_state hook: treats `hwcso` as a lima_fs_shader_state and
 * releases its buffer object with lima_bo_free.
 * NOTE(review): whether the call is guarded by a NULL check on so->bo and
 * whether `so` itself is freed afterwards is not visible in this extract. */
269 lima_delete_fs_state(struct pipe_context
*pctx
, void *hwcso
)
271 struct lima_fs_shader_state
*so
= hwcso
;
274 lima_bo_free(so
->bo
);
/* Upload the current vertex shader (ctx->vs) into a buffer object:
 * create a BO of vs->shader_size bytes, copy vs->shader into its mapping,
 * then ralloc_free the CPU-side copy. A message is written to stderr on the
 * BO-creation failure path.
 * NOTE(review): the conditions guarding these statements (e.g. whether a BO
 * already exists, the failure test after lima_bo_create) and the return
 * statements are not visible in this extract. In the visible code the
 * result of lima_bo_map() goes straight into memcpy -- confirm it cannot be
 * NULL here. */
280 lima_update_vs_state(struct lima_context
*ctx
)
282 struct lima_vs_shader_state
*vs
= ctx
->vs
;
284 struct lima_screen
*screen
= lima_screen(ctx
->base
.screen
);
285 vs
->bo
= lima_bo_create(screen
, vs
->shader_size
, 0);
287 fprintf(stderr
, "lima: create vs shader bo fail\n");
291 memcpy(lima_bo_map(vs
->bo
), vs
->shader
, vs
->shader_size
);
292 ralloc_free(vs
->shader
);
/* Upload the current fragment shader (ctx->fs) into a buffer object:
 * create a BO of fs->shader_size bytes, copy fs->shader into its mapping,
 * then ralloc_free the CPU-side copy. A message is written to stderr on the
 * BO-creation failure path. Finally ctx->pp_max_stack_size is raised to at
 * least ctx->fs->stack_size.
 * NOTE(review): the conditions guarding these statements and the return
 * statements are not visible in this extract. In the visible code the
 * result of lima_bo_map() goes straight into memcpy -- confirm it cannot be
 * NULL here. */
300 lima_update_fs_state(struct lima_context
*ctx
)
302 struct lima_fs_shader_state
*fs
= ctx
->fs
;
304 struct lima_screen
*screen
= lima_screen(ctx
->base
.screen
);
305 fs
->bo
= lima_bo_create(screen
, fs
->shader_size
, 0);
307 fprintf(stderr
, "lima: create fs shader bo fail\n");
311 memcpy(lima_bo_map(fs
->bo
), fs
->shader
, fs
->shader_size
);
312 ralloc_free(fs
->shader
);
/* Keep the context-wide maximum stack size up to date. */
316 ctx
->pp_max_stack_size
= MAX2(ctx
->pp_max_stack_size
, ctx
->fs
->stack_size
);
/* Create the vertex shader state for `cso`; installed as the context's
 * create_vs_state hook by lima_program_init().
 *
 * Visible steps: allocate a lima_vs_shader_state with rzalloc (NULL as its
 * first argument), obtain a NIR shader (from the TGSI tokens via
 * tgsi_to_nir when the IR type is TGSI), run lima_program_optimize_vs_nir
 * on it, print it to stdout when LIMA_DEBUG_GP is set in lima_debug, and
 * compile it with gpir_compile_nir using &ctx->debug.
 *
 * NOTE(review): the allocation check, the declaration of `nir`, the body of
 * the PIPE_SHADER_IR_NIR branch, the handling of a failed compile and the
 * return statements are not visible in this extract. Also confirm who owns
 * and frees the NIR shader produced by tgsi_to_nir. */
322 lima_create_vs_state(struct pipe_context
*pctx
,
323 const struct pipe_shader_state
*cso
)
325 struct lima_context
*ctx
= lima_context(pctx
);
326 struct lima_vs_shader_state
*so
= rzalloc(NULL
, struct lima_vs_shader_state
);
332 if (cso
->type
== PIPE_SHADER_IR_NIR
)
/* Presumably the else branch: anything that is not NIR must be TGSI. */
335 assert(cso
->type
== PIPE_SHADER_IR_TGSI
);
337 nir
= tgsi_to_nir(cso
->tokens
, pctx
->screen
);
340 lima_program_optimize_vs_nir(nir
);
342 if (lima_debug
& LIMA_DEBUG_GP
)
343 nir_print_shader(nir
, stdout
);
345 if (!gpir_compile_nir(so
, nir
, &ctx
->debug
)) {
/* bind_vs_state hook: flags the vertex shader as dirty by OR-ing
 * LIMA_CONTEXT_DIRTY_SHADER_VERT into ctx->dirty.
 * NOTE(review): the statement that stores `hwcso` in the context is not
 * visible in this extract -- confirm against the full file. */
354 lima_bind_vs_state(struct pipe_context
*pctx
, void *hwcso
)
356 struct lima_context
*ctx
= lima_context(pctx
);
359 ctx
->dirty
|= LIMA_CONTEXT_DIRTY_SHADER_VERT
;
/* delete_vs_state hook: treats `hwcso` as a lima_vs_shader_state and
 * releases its buffer object with lima_bo_free.
 * NOTE(review): whether the call is guarded by a NULL check on so->bo and
 * whether `so` itself is freed afterwards is not visible in this extract. */
363 lima_delete_vs_state(struct pipe_context
*pctx
, void *hwcso
)
365 struct lima_vs_shader_state
*so
= hwcso
;
368 lima_bo_free(so
->bo
);
/* Install this file's shader-state callbacks on the context: the
 * create/bind/delete hooks for fragment shaders, then the same three for
 * vertex shaders, all stored in ctx->base. */
374 lima_program_init(struct lima_context
*ctx
)
376 ctx
->base
.create_fs_state
= lima_create_fs_state
;
377 ctx
->base
.bind_fs_state
= lima_bind_fs_state
;
378 ctx
->base
.delete_fs_state
= lima_delete_fs_state
;
380 ctx
->base
.create_vs_state
= lima_create_vs_state
;
381 ctx
->base
.bind_vs_state
= lima_bind_vs_state
;
382 ctx
->base
.delete_vs_state
= lima_delete_vs_state
;