/*
 * Copyright © 2012 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */
24 #include <gtest/gtest.h>
/**
 * Convenience wrapper around _register_coalesce(): forwards \p v unchanged
 * and supplies the name of the calling function (__func__) as the label
 * argument, so each test does not have to spell out its own name.
 */
#define register_coalesce(v) _register_coalesce(v, __func__)
34 class register_coalesce_test
: public ::testing::Test
{
38 struct brw_context
*brw
;
39 struct brw_device_info
*devinfo
;
40 struct gl_context
*ctx
;
41 struct gl_shader_program
*shader_prog
;
42 struct brw_vertex_program
*vp
;
47 class register_coalesce_vec4_visitor
: public vec4_visitor
50 register_coalesce_vec4_visitor(struct brw_context
*brw
,
51 struct gl_shader_program
*shader_prog
)
52 : vec4_visitor(brw
, NULL
, NULL
, NULL
, NULL
, shader_prog
,
53 MESA_SHADER_VERTEX
, NULL
,
54 false /* no_spills */,
55 ST_NONE
, ST_NONE
, ST_NONE
)
60 virtual dst_reg
*make_reg_for_system_value(ir_variable
*ir
)
62 unreachable("Not reached");
65 virtual void setup_payload()
67 unreachable("Not reached");
70 virtual void emit_prolog()
72 unreachable("Not reached");
75 virtual void emit_program_code()
77 unreachable("Not reached");
80 virtual void emit_thread_end()
82 unreachable("Not reached");
85 virtual void emit_urb_write_header(int mrf
)
87 unreachable("Not reached");
90 virtual vec4_instruction
*emit_urb_write_opcode(bool complete
)
92 unreachable("Not reached");
97 void register_coalesce_test::SetUp()
99 brw
= (struct brw_context
*)calloc(1, sizeof(*brw
));
100 devinfo
= (struct brw_device_info
*)calloc(1, sizeof(*brw
));
101 brw
->intelScreen
= (struct intel_screen
*)calloc(1, sizeof(*brw
->intelScreen
));
102 brw
->intelScreen
->devinfo
= devinfo
;
105 vp
= ralloc(NULL
, struct brw_vertex_program
);
107 shader_prog
= ralloc(NULL
, struct gl_shader_program
);
109 v
= new register_coalesce_vec4_visitor(brw
, shader_prog
);
111 _mesa_init_vertex_program(ctx
, &vp
->program
, GL_VERTEX_SHADER
, 0);
113 brw
->gen
= devinfo
->gen
= 4;
117 _register_coalesce(vec4_visitor
*v
, const char *func
)
122 printf("%s: instructions before:\n", func
);
123 v
->dump_instructions();
127 v
->opt_register_coalesce();
130 printf("%s: instructions after:\n", func
);
131 v
->dump_instructions();
135 TEST_F(register_coalesce_test
, test_compute_to_mrf
)
137 src_reg something
= src_reg(v
, glsl_type::float_type
);
138 dst_reg temp
= dst_reg(v
, glsl_type::float_type
);
141 dst_reg m0
= dst_reg(MRF
, 0);
142 m0
.writemask
= WRITEMASK_X
;
143 m0
.type
= BRW_REGISTER_TYPE_F
;
145 vec4_instruction
*mul
= v
->emit(v
->MUL(temp
, something
, src_reg(1.0f
)));
146 v
->emit(v
->MOV(m0
, src_reg(temp
)));
148 register_coalesce(v
);
150 EXPECT_EQ(mul
->dst
.file
, MRF
);
154 TEST_F(register_coalesce_test
, test_multiple_use
)
156 src_reg something
= src_reg(v
, glsl_type::float_type
);
157 dst_reg temp
= dst_reg(v
, glsl_type::vec4_type
);
160 dst_reg m0
= dst_reg(MRF
, 0);
161 m0
.writemask
= WRITEMASK_X
;
162 m0
.type
= BRW_REGISTER_TYPE_F
;
164 dst_reg m1
= dst_reg(MRF
, 1);
165 m1
.writemask
= WRITEMASK_XYZW
;
166 m1
.type
= BRW_REGISTER_TYPE_F
;
168 src_reg src
= src_reg(temp
);
169 vec4_instruction
*mul
= v
->emit(v
->MUL(temp
, something
, src_reg(1.0f
)));
170 src
.swizzle
= BRW_SWIZZLE_XXXX
;
171 v
->emit(v
->MOV(m0
, src
));
172 src
.swizzle
= BRW_SWIZZLE_XYZW
;
173 v
->emit(v
->MOV(m1
, src
));
175 register_coalesce(v
);
177 EXPECT_NE(mul
->dst
.file
, MRF
);
180 TEST_F(register_coalesce_test
, test_dp4_mrf
)
182 src_reg some_src_1
= src_reg(v
, glsl_type::vec4_type
);
183 src_reg some_src_2
= src_reg(v
, glsl_type::vec4_type
);
186 dst_reg m0
= dst_reg(MRF
, 0);
187 m0
.writemask
= WRITEMASK_Y
;
188 m0
.type
= BRW_REGISTER_TYPE_F
;
190 dst_reg temp
= dst_reg(v
, glsl_type::float_type
);
192 vec4_instruction
*dp4
= v
->emit(v
->DP4(temp
, some_src_1
, some_src_2
));
193 v
->emit(v
->MOV(m0
, src_reg(temp
)));
195 register_coalesce(v
);
197 EXPECT_EQ(dp4
->dst
.file
, MRF
);
198 EXPECT_EQ(dp4
->dst
.writemask
, WRITEMASK_Y
);
201 TEST_F(register_coalesce_test
, test_dp4_grf
)
203 src_reg some_src_1
= src_reg(v
, glsl_type::vec4_type
);
204 src_reg some_src_2
= src_reg(v
, glsl_type::vec4_type
);
207 dst_reg to
= dst_reg(v
, glsl_type::vec4_type
);
208 dst_reg temp
= dst_reg(v
, glsl_type::float_type
);
210 vec4_instruction
*dp4
= v
->emit(v
->DP4(temp
, some_src_1
, some_src_2
));
211 to
.writemask
= WRITEMASK_Y
;
212 v
->emit(v
->MOV(to
, src_reg(temp
)));
214 /* if we don't do something with the result, the automatic dead code
215 * elimination will remove all our instructions.
217 src_reg src
= src_reg(to
);
219 v
->emit(v
->MOV(dst_reg(MRF
, 0), src
));
221 register_coalesce(v
);
223 EXPECT_EQ(dp4
->dst
.reg
, to
.reg
);
224 EXPECT_EQ(dp4
->dst
.writemask
, WRITEMASK_Y
);
227 TEST_F(register_coalesce_test
, test_channel_mul_grf
)
229 src_reg some_src_1
= src_reg(v
, glsl_type::vec4_type
);
230 src_reg some_src_2
= src_reg(v
, glsl_type::vec4_type
);
233 dst_reg to
= dst_reg(v
, glsl_type::vec4_type
);
234 dst_reg temp
= dst_reg(v
, glsl_type::float_type
);
236 vec4_instruction
*mul
= v
->emit(v
->MUL(temp
, some_src_1
, some_src_2
));
237 to
.writemask
= WRITEMASK_Y
;
238 v
->emit(v
->MOV(to
, src_reg(temp
)));
240 /* if we don't do something with the result, the automatic dead code
241 * elimination will remove all our instructions.
243 src_reg src
= src_reg(to
);
245 v
->emit(v
->MOV(dst_reg(MRF
, 0), src
));
247 register_coalesce(v
);
249 EXPECT_EQ(mul
->dst
.reg
, to
.reg
);