/*
 * Copyright © 2012 Vincent Lejeune
 * Copyright © 2012 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 */
#include <string.h>

#include "program/hash_table.h"
/**
 * \file lower_output_reads.cpp
 *
 * In GLSL, shader output variables (such as varyings) can be both read and
 * written.  However, on some hardware, reading an output register causes
 * trouble.
 *
 * This pass creates temporary shadow copies of every (used) shader output,
 * and replaces all accesses to use those instead.  It also adds code to the
 * main() function to copy the final values to the actual shader outputs.
 */
42 class output_read_remover
: public ir_hierarchical_visitor
{
45 * A hash table mapping from the original ir_variable shader outputs
46 * (ir_var_shader_out mode) to the new temporaries to be used instead.
48 hash_table
*replacements
;
54 output_read_remover(unsigned stage
);
55 ~output_read_remover();
56 virtual ir_visitor_status
visit(class ir_dereference_variable
*);
57 virtual ir_visitor_status
visit_leave(class ir_emit_vertex
*);
58 virtual ir_visitor_status
visit_leave(class ir_return
*);
59 virtual ir_visitor_status
visit_leave(class ir_function_signature
*);
62 } /* anonymous namespace */
65 * Hash function for the output variables - computes the hash of the name.
66 * NOTE: We're using the name string to ensure that the hash doesn't depend
67 * on any random factors, otherwise the output_read_remover could produce
68 * the random order of the assignments.
70 * NOTE: If you want to reuse this function please take into account that
71 * generally the names of the variables are non-unique.
74 hash_table_var_hash(const void *key
)
76 const ir_variable
* var
= static_cast<const ir_variable
*>(key
);
77 return hash_table_string_hash(var
->name
);
80 output_read_remover::output_read_remover(unsigned stage
)
83 mem_ctx
= ralloc_context(NULL
);
85 hash_table_ctor(0, hash_table_var_hash
, hash_table_pointer_compare
);
88 output_read_remover::~output_read_remover()
90 hash_table_dtor(replacements
);
95 output_read_remover::visit(ir_dereference_variable
*ir
)
97 if (ir
->var
->data
.mode
!= ir_var_shader_out
)
98 return visit_continue
;
99 if (stage
== MESA_SHADER_TESS_CTRL
)
100 return visit_continue
;
102 ir_variable
*temp
= (ir_variable
*) hash_table_find(replacements
, ir
->var
);
104 /* If we don't have an existing temporary, create one. */
106 void *var_ctx
= ralloc_parent(ir
->var
);
107 temp
= new(var_ctx
) ir_variable(ir
->var
->type
, ir
->var
->name
,
109 hash_table_insert(replacements
, temp
, ir
->var
);
110 ir
->var
->insert_after(temp
);
113 /* Update the dereference to use the temporary */
116 return visit_continue
;
120 * Create an assignment to copy a temporary value back to the actual output.
122 static ir_assignment
*
123 copy(void *ctx
, ir_variable
*output
, ir_variable
*temp
)
125 ir_dereference_variable
*lhs
= new(ctx
) ir_dereference_variable(output
);
126 ir_dereference_variable
*rhs
= new(ctx
) ir_dereference_variable(temp
);
127 return new(ctx
) ir_assignment(lhs
, rhs
);
130 /** Insert a copy-back assignment before a "return" statement or a call to
134 emit_return_copy(const void *key
, void *data
, void *closure
)
136 ir_return
*ir
= (ir_return
*) closure
;
137 ir
->insert_before(copy(ir
, (ir_variable
*) key
, (ir_variable
*) data
));
140 /** Insert a copy-back assignment at the end of the main() function */
142 emit_main_copy(const void *key
, void *data
, void *closure
)
144 ir_function_signature
*sig
= (ir_function_signature
*) closure
;
145 sig
->body
.push_tail(copy(sig
, (ir_variable
*) key
, (ir_variable
*) data
));
149 output_read_remover::visit_leave(ir_return
*ir
)
151 hash_table_call_foreach(replacements
, emit_return_copy
, ir
);
152 return visit_continue
;
156 output_read_remover::visit_leave(ir_emit_vertex
*ir
)
158 hash_table_call_foreach(replacements
, emit_return_copy
, ir
);
159 hash_table_clear(replacements
);
160 return visit_continue
;
164 output_read_remover::visit_leave(ir_function_signature
*sig
)
166 if (strcmp(sig
->function_name(), "main") != 0)
167 return visit_continue
;
169 hash_table_call_foreach(replacements
, emit_main_copy
, sig
);
170 return visit_continue
;
174 lower_output_reads(unsigned stage
, exec_list
*instructions
)
176 output_read_remover
v(stage
);
177 visit_list_elements(&v
, instructions
);