2 * Copyright © 2017 Intel Corporation
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
25 #include "brw_eu_defines.h"
26 #include "dev/gen_device_info.h"
31 BRW_HW_REG_TYPE_UD
= 0,
32 BRW_HW_REG_TYPE_D
= 1,
33 BRW_HW_REG_TYPE_UW
= 2,
34 BRW_HW_REG_TYPE_W
= 3,
35 BRW_HW_REG_TYPE_F
= 7,
36 GEN8_HW_REG_TYPE_UQ
= 8,
37 GEN8_HW_REG_TYPE_Q
= 9,
39 BRW_HW_REG_TYPE_UB
= 4,
40 BRW_HW_REG_TYPE_B
= 5,
41 GEN7_HW_REG_TYPE_DF
= 6,
42 GEN8_HW_REG_TYPE_HF
= 10,
44 GEN11_HW_REG_TYPE_UD
= 0,
45 GEN11_HW_REG_TYPE_D
= 1,
46 GEN11_HW_REG_TYPE_UW
= 2,
47 GEN11_HW_REG_TYPE_W
= 3,
48 GEN11_HW_REG_TYPE_UB
= 4,
49 GEN11_HW_REG_TYPE_B
= 5,
50 GEN11_HW_REG_TYPE_UQ
= 6,
51 GEN11_HW_REG_TYPE_Q
= 7,
52 GEN11_HW_REG_TYPE_HF
= 8,
53 GEN11_HW_REG_TYPE_F
= 9,
54 GEN11_HW_REG_TYPE_DF
= 10,
55 GEN11_HW_REG_TYPE_NF
= 11,
59 BRW_HW_IMM_TYPE_UD
= 0,
60 BRW_HW_IMM_TYPE_D
= 1,
61 BRW_HW_IMM_TYPE_UW
= 2,
62 BRW_HW_IMM_TYPE_W
= 3,
63 BRW_HW_IMM_TYPE_F
= 7,
64 GEN8_HW_IMM_TYPE_UQ
= 8,
65 GEN8_HW_IMM_TYPE_Q
= 9,
67 BRW_HW_IMM_TYPE_UV
= 4,
68 BRW_HW_IMM_TYPE_VF
= 5,
69 BRW_HW_IMM_TYPE_V
= 6,
70 GEN8_HW_IMM_TYPE_DF
= 10,
71 GEN8_HW_IMM_TYPE_HF
= 11,
73 GEN11_HW_IMM_TYPE_UD
= 0,
74 GEN11_HW_IMM_TYPE_D
= 1,
75 GEN11_HW_IMM_TYPE_UW
= 2,
76 GEN11_HW_IMM_TYPE_W
= 3,
77 GEN11_HW_IMM_TYPE_UV
= 4,
78 GEN11_HW_IMM_TYPE_V
= 5,
79 GEN11_HW_IMM_TYPE_UQ
= 6,
80 GEN11_HW_IMM_TYPE_Q
= 7,
81 GEN11_HW_IMM_TYPE_HF
= 8,
82 GEN11_HW_IMM_TYPE_F
= 9,
83 GEN11_HW_IMM_TYPE_DF
= 10,
84 GEN11_HW_IMM_TYPE_VF
= 11,
87 static const struct hw_type
{
88 enum hw_reg_type reg_type
;
89 enum hw_imm_type imm_type
;
91 [0 ... BRW_REGISTER_TYPE_LAST
] = { INVALID
, INVALID
},
93 [BRW_REGISTER_TYPE_DF
] = { GEN7_HW_REG_TYPE_DF
, GEN8_HW_IMM_TYPE_DF
},
94 [BRW_REGISTER_TYPE_F
] = { BRW_HW_REG_TYPE_F
, BRW_HW_IMM_TYPE_F
},
95 [BRW_REGISTER_TYPE_HF
] = { GEN8_HW_REG_TYPE_HF
, GEN8_HW_IMM_TYPE_HF
},
96 [BRW_REGISTER_TYPE_VF
] = { INVALID
, BRW_HW_IMM_TYPE_VF
},
98 [BRW_REGISTER_TYPE_Q
] = { GEN8_HW_REG_TYPE_Q
, GEN8_HW_IMM_TYPE_Q
},
99 [BRW_REGISTER_TYPE_UQ
] = { GEN8_HW_REG_TYPE_UQ
, GEN8_HW_IMM_TYPE_UQ
},
100 [BRW_REGISTER_TYPE_D
] = { BRW_HW_REG_TYPE_D
, BRW_HW_IMM_TYPE_D
},
101 [BRW_REGISTER_TYPE_UD
] = { BRW_HW_REG_TYPE_UD
, BRW_HW_IMM_TYPE_UD
},
102 [BRW_REGISTER_TYPE_W
] = { BRW_HW_REG_TYPE_W
, BRW_HW_IMM_TYPE_W
},
103 [BRW_REGISTER_TYPE_UW
] = { BRW_HW_REG_TYPE_UW
, BRW_HW_IMM_TYPE_UW
},
104 [BRW_REGISTER_TYPE_B
] = { BRW_HW_REG_TYPE_B
, INVALID
},
105 [BRW_REGISTER_TYPE_UB
] = { BRW_HW_REG_TYPE_UB
, INVALID
},
106 [BRW_REGISTER_TYPE_V
] = { INVALID
, BRW_HW_IMM_TYPE_V
},
107 [BRW_REGISTER_TYPE_UV
] = { INVALID
, BRW_HW_IMM_TYPE_UV
},
108 }, gen11_hw_type
[] = {
109 [BRW_REGISTER_TYPE_NF
] = { GEN11_HW_REG_TYPE_NF
, INVALID
},
110 [BRW_REGISTER_TYPE_DF
] = { GEN11_HW_REG_TYPE_DF
, GEN11_HW_IMM_TYPE_DF
},
111 [BRW_REGISTER_TYPE_F
] = { GEN11_HW_REG_TYPE_F
, GEN11_HW_IMM_TYPE_F
},
112 [BRW_REGISTER_TYPE_HF
] = { GEN11_HW_REG_TYPE_HF
, GEN11_HW_IMM_TYPE_HF
},
113 [BRW_REGISTER_TYPE_VF
] = { INVALID
, GEN11_HW_IMM_TYPE_VF
},
115 [BRW_REGISTER_TYPE_Q
] = { GEN11_HW_REG_TYPE_Q
, GEN11_HW_IMM_TYPE_Q
},
116 [BRW_REGISTER_TYPE_UQ
] = { GEN11_HW_REG_TYPE_UQ
, GEN11_HW_IMM_TYPE_UQ
},
117 [BRW_REGISTER_TYPE_D
] = { GEN11_HW_REG_TYPE_D
, GEN11_HW_IMM_TYPE_D
},
118 [BRW_REGISTER_TYPE_UD
] = { GEN11_HW_REG_TYPE_UD
, GEN11_HW_IMM_TYPE_UD
},
119 [BRW_REGISTER_TYPE_W
] = { GEN11_HW_REG_TYPE_W
, GEN11_HW_IMM_TYPE_W
},
120 [BRW_REGISTER_TYPE_UW
] = { GEN11_HW_REG_TYPE_UW
, GEN11_HW_IMM_TYPE_UW
},
121 [BRW_REGISTER_TYPE_B
] = { GEN11_HW_REG_TYPE_B
, INVALID
},
122 [BRW_REGISTER_TYPE_UB
] = { GEN11_HW_REG_TYPE_UB
, INVALID
},
123 [BRW_REGISTER_TYPE_V
] = { INVALID
, GEN11_HW_IMM_TYPE_V
},
124 [BRW_REGISTER_TYPE_UV
] = { INVALID
, GEN11_HW_IMM_TYPE_UV
},
127 /* SNB adds 3-src instructions (MAD and LRP) that only operate on floats, so
128 * the types were implied. IVB adds BFE and BFI2 that operate on doublewords
129 * and unsigned doublewords, so a new field is also available in the da3src
130 * struct (part of struct brw_instruction.bits1 in brw_structs.h) to select
131 * dst and shared-src types.
133 * CNL adds support for 3-src instructions in align1 mode, and with it support
134 * for most register types.
136 enum hw_3src_reg_type
{
137 GEN7_3SRC_TYPE_F
= 0,
138 GEN7_3SRC_TYPE_D
= 1,
139 GEN7_3SRC_TYPE_UD
= 2,
140 GEN7_3SRC_TYPE_DF
= 3,
142 /** When ExecutionDatatype is 1: @{ */
143 GEN10_ALIGN1_3SRC_REG_TYPE_HF
= 0b000,
144 GEN10_ALIGN1_3SRC_REG_TYPE_F
= 0b001,
145 GEN10_ALIGN1_3SRC_REG_TYPE_DF
= 0b010,
146 GEN11_ALIGN1_3SRC_REG_TYPE_NF
= 0b011,
149 /** When ExecutionDatatype is 0: @{ */
150 GEN10_ALIGN1_3SRC_REG_TYPE_UD
= 0b000,
151 GEN10_ALIGN1_3SRC_REG_TYPE_D
= 0b001,
152 GEN10_ALIGN1_3SRC_REG_TYPE_UW
= 0b010,
153 GEN10_ALIGN1_3SRC_REG_TYPE_W
= 0b011,
154 GEN10_ALIGN1_3SRC_REG_TYPE_UB
= 0b100,
155 GEN10_ALIGN1_3SRC_REG_TYPE_B
= 0b101,
159 static const struct hw_3src_type
{
160 enum hw_3src_reg_type reg_type
;
161 enum gen10_align1_3src_exec_type exec_type
;
162 } gen7_hw_3src_type
[] = {
163 [0 ... BRW_REGISTER_TYPE_LAST
] = { INVALID
},
165 [BRW_REGISTER_TYPE_F
] = { GEN7_3SRC_TYPE_F
},
166 [BRW_REGISTER_TYPE_D
] = { GEN7_3SRC_TYPE_D
},
167 [BRW_REGISTER_TYPE_UD
] = { GEN7_3SRC_TYPE_UD
},
168 [BRW_REGISTER_TYPE_DF
] = { GEN7_3SRC_TYPE_DF
},
169 }, gen10_hw_3src_align1_type
[] = {
170 #define E(x) BRW_ALIGN1_3SRC_EXEC_TYPE_##x
171 [0 ... BRW_REGISTER_TYPE_LAST
] = { INVALID
},
173 [BRW_REGISTER_TYPE_NF
] = { GEN11_ALIGN1_3SRC_REG_TYPE_NF
, E(FLOAT
) },
174 [BRW_REGISTER_TYPE_DF
] = { GEN10_ALIGN1_3SRC_REG_TYPE_DF
, E(FLOAT
) },
175 [BRW_REGISTER_TYPE_F
] = { GEN10_ALIGN1_3SRC_REG_TYPE_F
, E(FLOAT
) },
176 [BRW_REGISTER_TYPE_HF
] = { GEN10_ALIGN1_3SRC_REG_TYPE_HF
, E(FLOAT
) },
178 [BRW_REGISTER_TYPE_D
] = { GEN10_ALIGN1_3SRC_REG_TYPE_D
, E(INT
) },
179 [BRW_REGISTER_TYPE_UD
] = { GEN10_ALIGN1_3SRC_REG_TYPE_UD
, E(INT
) },
180 [BRW_REGISTER_TYPE_W
] = { GEN10_ALIGN1_3SRC_REG_TYPE_W
, E(INT
) },
181 [BRW_REGISTER_TYPE_UW
] = { GEN10_ALIGN1_3SRC_REG_TYPE_UW
, E(INT
) },
182 [BRW_REGISTER_TYPE_B
] = { GEN10_ALIGN1_3SRC_REG_TYPE_B
, E(INT
) },
183 [BRW_REGISTER_TYPE_UB
] = { GEN10_ALIGN1_3SRC_REG_TYPE_UB
, E(INT
) },
188 * Convert a brw_reg_type enumeration value into the hardware representation.
190 * The hardware encoding may depend on whether the value is an immediate.
193 brw_reg_type_to_hw_type(const struct gen_device_info
*devinfo
,
194 enum brw_reg_file file
,
195 enum brw_reg_type type
)
197 const struct hw_type
*table
;
199 if (devinfo
->gen
>= 11) {
200 assert(type
< ARRAY_SIZE(gen11_hw_type
));
201 table
= gen11_hw_type
;
203 assert(type
< ARRAY_SIZE(gen4_hw_type
));
204 table
= gen4_hw_type
;
207 assert(devinfo
->has_64bit_types
|| brw_reg_type_to_size(type
) < 8 ||
208 type
== BRW_REGISTER_TYPE_NF
);
210 if (file
== BRW_IMMEDIATE_VALUE
) {
211 assert(table
[type
].imm_type
!= (enum hw_imm_type
)INVALID
);
212 return table
[type
].imm_type
;
214 assert(table
[type
].reg_type
!= (enum hw_reg_type
)INVALID
);
215 return table
[type
].reg_type
;
220 * Convert the hardware representation into a brw_reg_type enumeration value.
222 * The hardware encoding may depend on whether the value is an immediate.
225 brw_hw_type_to_reg_type(const struct gen_device_info
*devinfo
,
226 enum brw_reg_file file
, unsigned hw_type
)
228 const struct hw_type
*table
;
230 if (devinfo
->gen
>= 11) {
231 table
= gen11_hw_type
;
233 table
= gen4_hw_type
;
236 if (file
== BRW_IMMEDIATE_VALUE
) {
237 for (enum brw_reg_type i
= 0; i
<= BRW_REGISTER_TYPE_LAST
; i
++) {
238 if (table
[i
].imm_type
== (enum hw_imm_type
)hw_type
) {
243 for (enum brw_reg_type i
= 0; i
<= BRW_REGISTER_TYPE_LAST
; i
++) {
244 if (table
[i
].reg_type
== (enum hw_reg_type
)hw_type
) {
249 unreachable("not reached");
253 * Convert a brw_reg_type enumeration value into the hardware representation
254 * for a 3-src align16 instruction
257 brw_reg_type_to_a16_hw_3src_type(const struct gen_device_info
*devinfo
,
258 enum brw_reg_type type
)
260 assert(type
< ARRAY_SIZE(gen7_hw_3src_type
));
261 assert(gen7_hw_3src_type
[type
].reg_type
!= (enum hw_3src_reg_type
)INVALID
);
262 return gen7_hw_3src_type
[type
].reg_type
;
266 * Convert a brw_reg_type enumeration value into the hardware representation
267 * for a 3-src align1 instruction
270 brw_reg_type_to_a1_hw_3src_type(const struct gen_device_info
*devinfo
,
271 enum brw_reg_type type
)
273 assert(type
< ARRAY_SIZE(gen10_hw_3src_align1_type
));
274 assert(gen10_hw_3src_align1_type
[type
].reg_type
!= (enum hw_3src_reg_type
)INVALID
);
275 return gen10_hw_3src_align1_type
[type
].reg_type
;
279 * Convert the hardware representation for a 3-src align16 instruction into a
280 * brw_reg_type enumeration value.
283 brw_a16_hw_3src_type_to_reg_type(const struct gen_device_info
*devinfo
,
286 for (enum brw_reg_type i
= 0; i
<= BRW_REGISTER_TYPE_LAST
; i
++) {
287 if (gen7_hw_3src_type
[i
].reg_type
== hw_type
) {
291 unreachable("not reached");
295 * Convert the hardware representation for a 3-src align1 instruction into a
296 * brw_reg_type enumeration value.
299 brw_a1_hw_3src_type_to_reg_type(const struct gen_device_info
*devinfo
,
300 unsigned hw_type
, unsigned exec_type
)
302 for (enum brw_reg_type i
= 0; i
<= BRW_REGISTER_TYPE_LAST
; i
++) {
303 if (gen10_hw_3src_align1_type
[i
].reg_type
== hw_type
&&
304 gen10_hw_3src_align1_type
[i
].exec_type
== exec_type
) {
308 unreachable("not reached");
312 * Return the element size given a register type.
315 brw_reg_type_to_size(enum brw_reg_type type
)
317 static const unsigned type_size
[] = {
318 [BRW_REGISTER_TYPE_NF
] = 8,
319 [BRW_REGISTER_TYPE_DF
] = 8,
320 [BRW_REGISTER_TYPE_F
] = 4,
321 [BRW_REGISTER_TYPE_HF
] = 2,
322 [BRW_REGISTER_TYPE_VF
] = 4,
324 [BRW_REGISTER_TYPE_Q
] = 8,
325 [BRW_REGISTER_TYPE_UQ
] = 8,
326 [BRW_REGISTER_TYPE_D
] = 4,
327 [BRW_REGISTER_TYPE_UD
] = 4,
328 [BRW_REGISTER_TYPE_W
] = 2,
329 [BRW_REGISTER_TYPE_UW
] = 2,
330 [BRW_REGISTER_TYPE_B
] = 1,
331 [BRW_REGISTER_TYPE_UB
] = 1,
332 [BRW_REGISTER_TYPE_V
] = 2,
333 [BRW_REGISTER_TYPE_UV
] = 2,
335 return type_size
[type
];
339 * Converts a BRW_REGISTER_TYPE_* enum to a short string (F, UD, and so on).
341 * This is different than reg_encoding from brw_disasm.c in that it operates
342 * on the abstract enum values, rather than the generation-specific encoding.
345 brw_reg_type_to_letters(enum brw_reg_type type
)
347 static const char letters
[][3] = {
348 [BRW_REGISTER_TYPE_NF
] = "NF",
349 [BRW_REGISTER_TYPE_DF
] = "DF",
350 [BRW_REGISTER_TYPE_F
] = "F",
351 [BRW_REGISTER_TYPE_HF
] = "HF",
352 [BRW_REGISTER_TYPE_VF
] = "VF",
354 [BRW_REGISTER_TYPE_Q
] = "Q",
355 [BRW_REGISTER_TYPE_UQ
] = "UQ",
356 [BRW_REGISTER_TYPE_D
] = "D",
357 [BRW_REGISTER_TYPE_UD
] = "UD",
358 [BRW_REGISTER_TYPE_W
] = "W",
359 [BRW_REGISTER_TYPE_UW
] = "UW",
360 [BRW_REGISTER_TYPE_B
] = "B",
361 [BRW_REGISTER_TYPE_UB
] = "UB",
362 [BRW_REGISTER_TYPE_V
] = "V",
363 [BRW_REGISTER_TYPE_UV
] = "UV",
365 assert(type
< ARRAY_SIZE(letters
));
366 return letters
[type
];