2 * Copyright 2010 Jerome Glisse <glisse@freedesktop.org>
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the Software.
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
28 #include "r600_context.h"
/*
 * Emit the control-flow (CF) instruction for one shader node into
 * rshader->bcode.
 *
 * Two encodings are visible below, each writing two consecutive dwords at
 * bcode[id++]:
 *   - a vertex-fetch CF instruction (SQ_CF_WORD0 / SQ_CF_WORD1, CF_INST_VTX)
 *     whose COUNT field is rnode->nfetch - 1;
 *   - an ALU CF instruction (SQ_CF_ALU_WORD0 / SQ_CF_ALU_WORD1, CF_INST_ALU)
 *     whose COUNT field is rnode->nslot - 1.
 * Both set BARRIER to 1 and use rnode->cf_addr >> 1 as the ADDR field.
 *
 * NOTE(review): the remaining parameter(s), the declaration of `id`, the
 * statement that selects between the two encodings and the return value are
 * not visible in this excerpt. The caller passes `&id` as the third argument,
 * so `id` is presumably a local copy of a caller-owned dword cursor -- confirm
 * against the full file.
 */
31 static int r700_shader_cf_node_bytecode(struct r600_shader
*rshader
,
32 struct r600_shader_node
*rnode
,
/* Vertex-fetch form: ADDR is cf_addr halved (presumably the field counts
 * two-dword units -- TODO confirm), COUNT is stored as "number - 1". */
38 rshader
->bcode
[id
++] = S_SQ_CF_WORD0_ADDR(rnode
->cf_addr
>> 1);
39 rshader
->bcode
[id
++] = S_SQ_CF_WORD1_CF_INST(V_SQ_CF_WORD1_SQ_CF_INST_VTX
) |
40 S_SQ_CF_WORD1_BARRIER(1) |
41 S_SQ_CF_WORD1_COUNT(rnode
->nfetch
- 1);
/* ALU form: same ADDR computation, COUNT taken from the node's slot count. */
43 rshader
->bcode
[id
++] = S_SQ_CF_ALU_WORD0_ADDR(rnode
->cf_addr
>> 1);
44 rshader
->bcode
[id
++] = S_SQ_CF_ALU_WORD1_CF_INST(V_SQ_CF_ALU_WORD1_SQ_CF_INST_ALU
) |
45 S_SQ_CF_ALU_WORD1_BARRIER(1) |
46 S_SQ_CF_ALU_WORD1_COUNT(rnode
->nslot
- 1);
/*
 * Emit the two-dword CF export instruction for one shader output vector.
 *
 * Visible behaviour:
 *   - r600_shader_find_gpr(rshader, v, 0, &out) fills `out`; out.sel is then
 *     used as the RW_GPR field of the export.
 *   - bcode[id + 0] gets RW_GPR and ELEM_SIZE(3); bcode[id + 1] gets the
 *     X/Y/Z/W swizzle selectors 0/1/2/3, BARRIER(1), CF_INST EXPORT_DONE and
 *     END_OF_PROGRAM(end).
 *   - Depending on the semantic, ARRAY_BASE and TYPE are then OR-ed into
 *     bcode[id + 0] (position, color, generic -- see the cases below).
 *   - For parameter exports the output is also recorded in
 *     rshader->output[] and rshader->noutput is incremented.
 *   - An "unsupported" message is printed to stderr on the remaining path.
 *
 * NOTE(review): the parameters after `rshader` (the call site passes
 * `v, &id, end`), the switch expression, the `else`/`break`/`default`
 * keywords, the check on `r` and the return statements are not visible in
 * this excerpt -- confirm the exact control flow against the full file.
 */
52 static int r700_shader_cf_output_bytecode(struct r600_shader
*rshader
,
57 struct r600_shader_operand out
;
/* Look up the operand backing output vector v; result is returned in out. */
61 r
= r600_shader_find_gpr(rshader
, v
, 0, &out
);
/* Word 0: source GPR for the export plus element size. */
64 rshader
->bcode
[id
+ 0] = S_SQ_CF_ALLOC_EXPORT_WORD0_RW_GPR(out
.sel
) |
65 S_SQ_CF_ALLOC_EXPORT_WORD0_ELEM_SIZE(3);
/* Word 1: swizzle selectors 0,1,2,3 for X,Y,Z,W; `end` goes into the
 * END_OF_PROGRAM field. */
66 rshader
->bcode
[id
+ 1] = S_SQ_CF_ALLOC_EXPORT_WORD1_SWIZ_SEL_X(0) |
67 S_SQ_CF_ALLOC_EXPORT_WORD1_SWIZ_SEL_Y(1) |
68 S_SQ_CF_ALLOC_EXPORT_WORD1_SWIZ_SEL_Z(2) |
69 S_SQ_CF_ALLOC_EXPORT_WORD1_SWIZ_SEL_W(3) |
70 S_SQ_CF_ALLOC_EXPORT_WORD1_BARRIER(1) |
71 S_SQ_CF_ALLOC_EXPORT_WORD1_CF_INST(V_SQ_CF_ALLOC_EXPORT_WORD1_SQ_CF_INST_EXPORT_DONE
) |
72 S_SQ_CF_ALLOC_EXPORT_WORD1_END_OF_PROGRAM(end
);
/* Position semantic: exported with type EXPORT_POS at array base 60. */
74 case C_SEMANTIC_POSITION
:
75 rshader
->bcode
[id
+ 0] |= S_SQ_CF_ALLOC_EXPORT_WORD0_ARRAY_BASE(60) |
76 S_SQ_CF_ALLOC_EXPORT_WORD0_TYPE(V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_POS
);
/* Color semantic: in a vertex shader it is recorded in output[] and exported
 * as a parameter at the next free index (noutput is post-incremented). */
78 case C_SEMANTIC_COLOR
:
79 if (rshader
->cshader
.type
== C_PROGRAM_TYPE_VS
) {
80 rshader
->output
[rshader
->noutput
].gpr
= out
.sel
;
81 rshader
->output
[rshader
->noutput
].sid
= v
->sid
;
82 rshader
->output
[rshader
->noutput
].name
= v
->name
;
83 rshader
->bcode
[id
+ 0] |= S_SQ_CF_ALLOC_EXPORT_WORD0_ARRAY_BASE(rshader
->noutput
++) |
84 S_SQ_CF_ALLOC_EXPORT_WORD0_TYPE(V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_PARAM
);
/* Presumably the non-vertex-shader branch (the `else` is not visible):
 * export as a pixel output at array base 0. */
86 rshader
->bcode
[id
+ 0] |= S_SQ_CF_ALLOC_EXPORT_WORD0_ARRAY_BASE(0) |
87 S_SQ_CF_ALLOC_EXPORT_WORD0_TYPE(V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_PIXEL
);
/* Generic semantic: always recorded in output[] and exported as a
 * parameter, same bookkeeping as the vertex-shader color case. */
90 case C_SEMANTIC_GENERIC
:
91 rshader
->output
[rshader
->noutput
].gpr
= out
.sel
;
92 rshader
->output
[rshader
->noutput
].sid
= v
->sid
;
93 rshader
->output
[rshader
->noutput
].name
= v
->name
;
94 rshader
->bcode
[id
+ 0] |= S_SQ_CF_ALLOC_EXPORT_WORD0_ARRAY_BASE(rshader
->noutput
++) |
95 S_SQ_CF_ALLOC_EXPORT_WORD0_TYPE(V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_PARAM
);
/* Presumably the default case: report the unhandled semantic on stderr. */
98 fprintf(stderr
, "%s:%d unsupported\n", __func__
, __LINE__
);
/*
 * Encode one ALU instruction (`alu`) as two dwords appended to
 * rshader->bcode at bcode[id++].
 *
 * Two encodings are visible:
 *   - a three-source form: WORD0 carries src[0]/src[1] sel and chan plus the
 *     LAST flag; WORD1 carries the destination GPR/chan, src[2] sel/chan/neg
 *     and the opcode in the OP3 instruction field;
 *   - a two-source form: WORD0 additionally carries the src[0]/src[1] neg
 *     flags; WORD1 carries the destination GPR/chan, the src[0]/src[1] abs
 *     flags, WRITE_MASK(1) and the opcode in the OP2 instruction field.
 * Both forms set BANK_SWIZZLE to 0.
 *
 * NOTE(review): the last parameter (the call site passes `&id`), the
 * declaration of `id`, the condition that chooses between the two forms and
 * the return value are not visible in this excerpt.
 */
105 static int r700_shader_alu_bytecode(struct r600_shader
*rshader
,
106 struct r600_shader_node
*rnode
,
107 struct r600_shader_inst
*alu
,
112 /* don't replace gpr by pv or ps for destination register */
/* Three-source (OP3) form.
 * NOTE(review): unlike the two-source form below, WORD0 here does not encode
 * src[0].neg / src[1].neg -- confirm whether that omission is intentional. */
114 rshader
->bcode
[id
++] = S_SQ_ALU_WORD0_SRC0_SEL(alu
->src
[0].sel
) |
115 S_SQ_ALU_WORD0_SRC0_CHAN(alu
->src
[0].chan
) |
116 S_SQ_ALU_WORD0_SRC1_SEL(alu
->src
[1].sel
) |
117 S_SQ_ALU_WORD0_SRC1_CHAN(alu
->src
[1].chan
) |
118 S_SQ_ALU_WORD0_LAST(alu
->last
);
119 rshader
->bcode
[id
++] = S_SQ_ALU_WORD1_DST_GPR(alu
->dst
.sel
) |
120 S_SQ_ALU_WORD1_DST_CHAN(alu
->dst
.chan
) |
121 S_SQ_ALU_WORD1_OP3_SRC2_SEL(alu
->src
[2].sel
) |
122 S_SQ_ALU_WORD1_OP3_SRC2_CHAN(alu
->src
[2].chan
) |
123 S_SQ_ALU_WORD1_OP3_SRC2_NEG(alu
->src
[2].neg
) |
124 S_SQ_ALU_WORD1_OP3_ALU_INST(alu
->opcode
) |
125 S_SQ_ALU_WORD1_BANK_SWIZZLE(0);
/* Two-source (OP2) form: neg flags go in WORD0, abs flags and the write
 * mask go in WORD1. */
127 rshader
->bcode
[id
++] = S_SQ_ALU_WORD0_SRC0_SEL(alu
->src
[0].sel
) |
128 S_SQ_ALU_WORD0_SRC0_CHAN(alu
->src
[0].chan
) |
129 S_SQ_ALU_WORD0_SRC0_NEG(alu
->src
[0].neg
) |
130 S_SQ_ALU_WORD0_SRC1_SEL(alu
->src
[1].sel
) |
131 S_SQ_ALU_WORD0_SRC1_CHAN(alu
->src
[1].chan
) |
132 S_SQ_ALU_WORD0_SRC1_NEG(alu
->src
[1].neg
) |
133 S_SQ_ALU_WORD0_LAST(alu
->last
);
134 rshader
->bcode
[id
++] = S_SQ_ALU_WORD1_DST_GPR(alu
->dst
.sel
) |
135 S_SQ_ALU_WORD1_DST_CHAN(alu
->dst
.chan
) |
136 S_SQ_ALU_WORD1_OP2_SRC0_ABS(alu
->src
[0].abs
) |
137 S_SQ_ALU_WORD1_OP2_SRC1_ABS(alu
->src
[1].abs
) |
138 S_SQ_ALU_WORD1_OP2_WRITE_MASK(1) |
139 S_SQ_ALU_WORD1_OP2_ALU_INST(alu
->opcode
) |
140 S_SQ_ALU_WORD1_BANK_SWIZZLE(0);
/*
 * Translate rshader->cshader into R700 bytecode stored in rshader->bcode.
 *
 * Visible sequence:
 *   1. r600_shader_register(), r600_shader_translate_rec() on the shader
 *      entry, and r600_shader_legalize(); each has a diagnostic printed to
 *      stderr ("register allocation failed", "translation failed",
 *      "legalize failed").
 *   2. r600_shader_node_place(), then bcode is allocated as ndw * 4 bytes
 *      and checked against NULL.
 *   3. For every node: vertex fetches are encoded with
 *      r600_shader_vfetch_bytecode(); for every ALU group each instruction
 *      is encoded with r700_shader_alu_bytecode() and the group's literals
 *      are appended verbatim.
 *   4. For every node: its CF instruction is emitted with
 *      r700_shader_cf_node_bytecode().
 *   5. For every output vector: r700_shader_cf_output_bytecode() is called
 *      with `end`.
 *   6. For every input vector: an entry of rshader->input[] is filled in.
 *
 * NOTE(review): the declarations and initial values of `id`, `i`, `v`, `end`
 * and `r`, the conditions guarding the error messages, what happens after
 * each failure (including a NULL bcode), and the end of the function are not
 * visible in this excerpt; the definition may continue past the last line
 * shown here.
 */
146 int r700_shader_translate(struct r600_shader
*rshader
)
148 struct c_shader
*shader
= &rshader
->cshader
;
149 struct r600_shader_node
*rnode
;
150 struct r600_shader_vfetch
*vfetch
;
151 struct r600_shader_alu
*alu
;
/* Preparation passes; the checks on `r` between them are not visible. */
156 r
= r600_shader_register(rshader
);
158 fprintf(stderr
, "%s %d register allocation failed\n", __FILE__
, __LINE__
);
161 r
= r600_shader_translate_rec(rshader
, &shader
->entry
);
163 fprintf(stderr
, "%s %d translation failed\n", __FILE__
, __LINE__
);
166 r
= r600_shader_legalize(rshader
);
168 fprintf(stderr
, "%s %d legalize failed\n", __FILE__
, __LINE__
);
171 r600_shader_node_place(rshader
);
/* Bytecode buffer: ndw entries of 4 bytes each. */
172 rshader
->bcode
= malloc(rshader
->ndw
* 4);
173 if (rshader
->bcode
== NULL
)
/* Per-node instruction words: fetches first, then ALU groups. */
175 c_list_for_each(rnode
, &rshader
->nodes
) {
177 c_list_for_each(vfetch
, &rnode
->vfetch
) {
178 r
= r600_shader_vfetch_bytecode(rshader
, rnode
, vfetch
, &id
);
182 c_list_for_each(alu
, &rnode
->alu
) {
183 for (i
= 0; i
< alu
->nalu
; i
++) {
184 r
= r700_shader_alu_bytecode(rshader
, rnode
, &alu
->alu
[i
], &id
);
/* Literal constants of the ALU group follow its instructions. */
188 for (i
= 0; i
< alu
->nliteral
; i
++) {
189 rshader
->bcode
[id
++] = alu
->literal
[i
];
/* Second walk over the nodes: emit one CF instruction per node. */
194 c_list_for_each(rnode
, &rshader
->nodes
) {
195 r
= r700_shader_cf_node_bytecode(rshader
, rnode
, &id
);
/* Export instructions, one per output vector. */
199 c_list_for_each(v
, &rshader
->cshader
.files
[C_FILE_OUTPUT
].vectors
) {
/* v->next being the list head presumably identifies the last output vector;
 * the statement under this `if` is not visible (likely sets `end`). */
201 if (v
->next
== &rshader
->cshader
.files
[C_FILE_OUTPUT
].vectors
)
203 r
= r700_shader_cf_output_bytecode(rshader
, v
, &id
, end
);
/* Record shader inputs: the GPR index assigned is the current input count. */
207 c_list_for_each(v
, &rshader
->cshader
.files
[C_FILE_INPUT
].vectors
) {
208 rshader
->input
[rshader
->ninput
].gpr
= rshader
->ninput
;
209 rshader
->input
[rshader
->ninput
].sid
= v
->sid
;
210 rshader
->input
[rshader
->ninput
].name
= v
->name
;