Revert "i965: Add 'wait' instruction support"
[mesa.git] / src / mesa / drivers / dri / i965 / brw_reg.h
1 /*
2 Copyright (C) Intel Corp. 2006. All Rights Reserved.
3 Intel funded Tungsten Graphics to
4 develop this 3D driver.
5
6 Permission is hereby granted, free of charge, to any person obtaining
7 a copy of this software and associated documentation files (the
8 "Software"), to deal in the Software without restriction, including
9 without limitation the rights to use, copy, modify, merge, publish,
10 distribute, sublicense, and/or sell copies of the Software, and to
11 permit persons to whom the Software is furnished to do so, subject to
12 the following conditions:
13
14 The above copyright notice and this permission notice (including the
15 next paragraph) shall be included in all copies or substantial
16 portions of the Software.
17
18 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
19 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
21 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
22 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
23 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
24 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25
26 **********************************************************************/
27 /*
28 * Authors:
29 * Keith Whitwell <keithw@vmware.com>
30 */
31
32 /** @file brw_reg.h
33 *
34 * This file defines struct brw_reg, which is our representation for EU
35 * registers. They're not a hardware specific format, just an abstraction
36 * that intends to capture the full flexibility of the hardware registers.
37 *
38 * The brw_eu_emit.c layer's brw_set_dest/brw_set_src[01] functions encode
39 * the abstract brw_reg type into the actual hardware instruction encoding.
40 */
41
42 #ifndef BRW_REG_H
43 #define BRW_REG_H
44
45 #include <stdbool.h>
46 #include "main/imports.h"
47 #include "main/compiler.h"
48 #include "program/prog_instruction.h"
49 #include "brw_defines.h"
50
51 #ifdef __cplusplus
52 extern "C" {
53 #endif
54
55 /** Number of general purpose registers (VS, WM, etc) */
56 #define BRW_MAX_GRF 128
57
58 /**
59 * First GRF used for the MRF hack.
60 *
61 * On gen7, MRFs are no longer used, and contiguous GRFs are used instead. We
62 * haven't converted our compiler to be aware of this, so it asks for MRFs and
63 * brw_eu_emit.c quietly converts them to be accesses of the top GRFs. The
64 * register allocators have to be careful of this to avoid corrupting the "MRF"s
65 * with actual GRF allocations.
66 */
67 #define GEN7_MRF_HACK_START 112
68
69 /** Number of message register file registers */
70 #define BRW_MAX_MRF 16
71
72 #define BRW_SWIZZLE4(a,b,c,d) (((a)<<0) | ((b)<<2) | ((c)<<4) | ((d)<<6))
73 #define BRW_GET_SWZ(swz, idx) (((swz) >> ((idx)*2)) & 0x3)
74
75 #define BRW_SWIZZLE_NOOP BRW_SWIZZLE4(0,1,2,3)
76 #define BRW_SWIZZLE_XYZW BRW_SWIZZLE4(0,1,2,3)
77 #define BRW_SWIZZLE_XXXX BRW_SWIZZLE4(0,0,0,0)
78 #define BRW_SWIZZLE_YYYY BRW_SWIZZLE4(1,1,1,1)
79 #define BRW_SWIZZLE_ZZZZ BRW_SWIZZLE4(2,2,2,2)
80 #define BRW_SWIZZLE_WWWW BRW_SWIZZLE4(3,3,3,3)
81 #define BRW_SWIZZLE_XYXY BRW_SWIZZLE4(0,1,0,1)
82 #define BRW_SWIZZLE_YZXW BRW_SWIZZLE4(1,2,0,3)
83 #define BRW_SWIZZLE_ZXYW BRW_SWIZZLE4(2,0,1,3)
84 #define BRW_SWIZZLE_ZWZW BRW_SWIZZLE4(2,3,2,3)
85
86 static inline bool
87 brw_is_single_value_swizzle(int swiz)
88 {
89 return (swiz == BRW_SWIZZLE_XXXX ||
90 swiz == BRW_SWIZZLE_YYYY ||
91 swiz == BRW_SWIZZLE_ZZZZ ||
92 swiz == BRW_SWIZZLE_WWWW);
93 }
94
95 enum PACKED brw_reg_type {
96 BRW_REGISTER_TYPE_UD = 0,
97 BRW_REGISTER_TYPE_D,
98 BRW_REGISTER_TYPE_UW,
99 BRW_REGISTER_TYPE_W,
100 BRW_REGISTER_TYPE_F,
101
102 /** Non-immediates only: @{ */
103 BRW_REGISTER_TYPE_UB,
104 BRW_REGISTER_TYPE_B,
105 /** @} */
106
107 /** Immediates only: @{ */
108 BRW_REGISTER_TYPE_UV,
109 BRW_REGISTER_TYPE_V,
110 BRW_REGISTER_TYPE_VF,
111 /** @} */
112
113 BRW_REGISTER_TYPE_DF, /* Gen7+ (no immediates until Gen8+) */
114
115 /* Gen8+ */
116 BRW_REGISTER_TYPE_HF,
117 BRW_REGISTER_TYPE_UQ,
118 BRW_REGISTER_TYPE_Q,
119 };
120
121 unsigned brw_reg_type_to_hw_type(const struct brw_context *brw,
122 enum brw_reg_type type, unsigned file);
123 const char *brw_reg_type_letters(unsigned brw_reg_type);
124
125 #define REG_SIZE (8*4)
126
127 /* These aren't hardware structs, just something useful for us to pass around:
128 *
129 * Align1 operation has a lot of control over input ranges. Used in
130 * WM programs to implement shaders decomposed into "channel serial"
131 * or "structure of array" form:
132 */
133 struct brw_reg {
134 unsigned type:4;
135 unsigned file:2;
136 unsigned nr:8;
137 unsigned subnr:5; /* :1 in align16 */
138 unsigned negate:1; /* source only */
139 unsigned abs:1; /* source only */
140 unsigned vstride:4; /* source only */
141 unsigned width:3; /* src only, align1 only */
142 unsigned hstride:2; /* align1 only */
143 unsigned address_mode:1; /* relative addressing, hopefully! */
144 unsigned pad0:1;
145
146 union {
147 struct {
148 unsigned swizzle:8; /* src only, align16 only */
149 unsigned writemask:4; /* dest only, align16 only */
150 int indirect_offset:10; /* relative addressing offset */
151 unsigned pad1:10; /* two dwords total */
152 } bits;
153
154 float f;
155 int d;
156 unsigned ud;
157 } dw1;
158 };
159
160
161 struct brw_indirect {
162 unsigned addr_subnr:4;
163 int addr_offset:10;
164 unsigned pad:18;
165 };
166
167
168 static inline int
169 type_sz(unsigned type)
170 {
171 switch(type) {
172 case BRW_REGISTER_TYPE_UD:
173 case BRW_REGISTER_TYPE_D:
174 case BRW_REGISTER_TYPE_F:
175 return 4;
176 case BRW_REGISTER_TYPE_UW:
177 case BRW_REGISTER_TYPE_W:
178 return 2;
179 case BRW_REGISTER_TYPE_UB:
180 case BRW_REGISTER_TYPE_B:
181 return 1;
182 default:
183 return 0;
184 }
185 }
186
187 static inline bool
188 type_is_signed(unsigned type)
189 {
190 switch(type) {
191 case BRW_REGISTER_TYPE_D:
192 case BRW_REGISTER_TYPE_W:
193 case BRW_REGISTER_TYPE_F:
194 case BRW_REGISTER_TYPE_B:
195 case BRW_REGISTER_TYPE_V:
196 case BRW_REGISTER_TYPE_VF:
197 case BRW_REGISTER_TYPE_DF:
198 case BRW_REGISTER_TYPE_HF:
199 case BRW_REGISTER_TYPE_Q:
200 return true;
201
202 case BRW_REGISTER_TYPE_UD:
203 case BRW_REGISTER_TYPE_UW:
204 case BRW_REGISTER_TYPE_UB:
205 case BRW_REGISTER_TYPE_UV:
206 case BRW_REGISTER_TYPE_UQ:
207 return false;
208
209 default:
210 assert(!"Unreachable.");
211 return false;
212 }
213 }
214
215 /**
216 * Construct a brw_reg.
217 * \param file one of the BRW_x_REGISTER_FILE values
218 * \param nr register number/index
219 * \param subnr register sub number
220 * \param type one of BRW_REGISTER_TYPE_x
221 * \param vstride one of BRW_VERTICAL_STRIDE_x
222 * \param width one of BRW_WIDTH_x
223 * \param hstride one of BRW_HORIZONTAL_STRIDE_x
224 * \param swizzle one of BRW_SWIZZLE_x
225 * \param writemask WRITEMASK_X/Y/Z/W bitfield
226 */
227 static inline struct brw_reg
228 brw_reg(unsigned file,
229 unsigned nr,
230 unsigned subnr,
231 unsigned type,
232 unsigned vstride,
233 unsigned width,
234 unsigned hstride,
235 unsigned swizzle,
236 unsigned writemask)
237 {
238 struct brw_reg reg;
239 if (file == BRW_GENERAL_REGISTER_FILE)
240 assert(nr < BRW_MAX_GRF);
241 else if (file == BRW_MESSAGE_REGISTER_FILE)
242 assert((nr & ~(1 << 7)) < BRW_MAX_MRF);
243 else if (file == BRW_ARCHITECTURE_REGISTER_FILE)
244 assert(nr <= BRW_ARF_TIMESTAMP);
245
246 reg.type = type;
247 reg.file = file;
248 reg.nr = nr;
249 reg.subnr = subnr * type_sz(type);
250 reg.negate = 0;
251 reg.abs = 0;
252 reg.vstride = vstride;
253 reg.width = width;
254 reg.hstride = hstride;
255 reg.address_mode = BRW_ADDRESS_DIRECT;
256 reg.pad0 = 0;
257
258 /* Could do better: If the reg is r5.3<0;1,0>, we probably want to
259 * set swizzle and writemask to W, as the lower bits of subnr will
260 * be lost when converted to align16. This is probably too much to
261 * keep track of as you'd want it adjusted by suboffset(), etc.
262 * Perhaps fix up when converting to align16?
263 */
264 reg.dw1.bits.swizzle = swizzle;
265 reg.dw1.bits.writemask = writemask;
266 reg.dw1.bits.indirect_offset = 0;
267 reg.dw1.bits.pad1 = 0;
268 return reg;
269 }
270
271 /** Construct float[16] register */
272 static inline struct brw_reg
273 brw_vec16_reg(unsigned file, unsigned nr, unsigned subnr)
274 {
275 return brw_reg(file,
276 nr,
277 subnr,
278 BRW_REGISTER_TYPE_F,
279 BRW_VERTICAL_STRIDE_16,
280 BRW_WIDTH_16,
281 BRW_HORIZONTAL_STRIDE_1,
282 BRW_SWIZZLE_XYZW,
283 WRITEMASK_XYZW);
284 }
285
286 /** Construct float[8] register */
287 static inline struct brw_reg
288 brw_vec8_reg(unsigned file, unsigned nr, unsigned subnr)
289 {
290 return brw_reg(file,
291 nr,
292 subnr,
293 BRW_REGISTER_TYPE_F,
294 BRW_VERTICAL_STRIDE_8,
295 BRW_WIDTH_8,
296 BRW_HORIZONTAL_STRIDE_1,
297 BRW_SWIZZLE_XYZW,
298 WRITEMASK_XYZW);
299 }
300
301 /** Construct float[4] register */
302 static inline struct brw_reg
303 brw_vec4_reg(unsigned file, unsigned nr, unsigned subnr)
304 {
305 return brw_reg(file,
306 nr,
307 subnr,
308 BRW_REGISTER_TYPE_F,
309 BRW_VERTICAL_STRIDE_4,
310 BRW_WIDTH_4,
311 BRW_HORIZONTAL_STRIDE_1,
312 BRW_SWIZZLE_XYZW,
313 WRITEMASK_XYZW);
314 }
315
316 /** Construct float[2] register */
317 static inline struct brw_reg
318 brw_vec2_reg(unsigned file, unsigned nr, unsigned subnr)
319 {
320 return brw_reg(file,
321 nr,
322 subnr,
323 BRW_REGISTER_TYPE_F,
324 BRW_VERTICAL_STRIDE_2,
325 BRW_WIDTH_2,
326 BRW_HORIZONTAL_STRIDE_1,
327 BRW_SWIZZLE_XYXY,
328 WRITEMASK_XY);
329 }
330
331 /** Construct float[1] register */
332 static inline struct brw_reg
333 brw_vec1_reg(unsigned file, unsigned nr, unsigned subnr)
334 {
335 return brw_reg(file,
336 nr,
337 subnr,
338 BRW_REGISTER_TYPE_F,
339 BRW_VERTICAL_STRIDE_0,
340 BRW_WIDTH_1,
341 BRW_HORIZONTAL_STRIDE_0,
342 BRW_SWIZZLE_XXXX,
343 WRITEMASK_X);
344 }
345
346 static inline struct brw_reg
347 brw_vecn_reg(unsigned width, unsigned file, unsigned nr, unsigned subnr)
348 {
349 switch (width) {
350 case 1:
351 return brw_vec1_reg(file, nr, subnr);
352 case 2:
353 return brw_vec2_reg(file, nr, subnr);
354 case 4:
355 return brw_vec4_reg(file, nr, subnr);
356 case 8:
357 return brw_vec8_reg(file, nr, subnr);
358 case 16:
359 return brw_vec16_reg(file, nr, subnr);
360 default:
361 assert(!"Invalid register width");
362 }
363 unreachable();
364 }
365
366 static inline struct brw_reg
367 retype(struct brw_reg reg, unsigned type)
368 {
369 reg.type = type;
370 return reg;
371 }
372
373 static inline struct brw_reg
374 sechalf(struct brw_reg reg)
375 {
376 if (reg.vstride)
377 reg.nr++;
378 return reg;
379 }
380
381 static inline struct brw_reg
382 suboffset(struct brw_reg reg, unsigned delta)
383 {
384 reg.subnr += delta * type_sz(reg.type);
385 return reg;
386 }
387
388
389 static inline struct brw_reg
390 offset(struct brw_reg reg, unsigned delta)
391 {
392 reg.nr += delta;
393 return reg;
394 }
395
396
397 static inline struct brw_reg
398 byte_offset(struct brw_reg reg, unsigned bytes)
399 {
400 unsigned newoffset = reg.nr * REG_SIZE + reg.subnr + bytes;
401 reg.nr = newoffset / REG_SIZE;
402 reg.subnr = newoffset % REG_SIZE;
403 return reg;
404 }
405
406
407 /** Construct unsigned word[16] register */
408 static inline struct brw_reg
409 brw_uw16_reg(unsigned file, unsigned nr, unsigned subnr)
410 {
411 return suboffset(retype(brw_vec16_reg(file, nr, 0), BRW_REGISTER_TYPE_UW), subnr);
412 }
413
414 /** Construct unsigned word[8] register */
415 static inline struct brw_reg
416 brw_uw8_reg(unsigned file, unsigned nr, unsigned subnr)
417 {
418 return suboffset(retype(brw_vec8_reg(file, nr, 0), BRW_REGISTER_TYPE_UW), subnr);
419 }
420
421 /** Construct unsigned word[1] register */
422 static inline struct brw_reg
423 brw_uw1_reg(unsigned file, unsigned nr, unsigned subnr)
424 {
425 return suboffset(retype(brw_vec1_reg(file, nr, 0), BRW_REGISTER_TYPE_UW), subnr);
426 }
427
428 static inline struct brw_reg
429 brw_imm_reg(unsigned type)
430 {
431 return brw_reg(BRW_IMMEDIATE_VALUE,
432 0,
433 0,
434 type,
435 BRW_VERTICAL_STRIDE_0,
436 BRW_WIDTH_1,
437 BRW_HORIZONTAL_STRIDE_0,
438 0,
439 0);
440 }
441
442 /** Construct float immediate register */
443 static inline struct brw_reg
444 brw_imm_f(float f)
445 {
446 struct brw_reg imm = brw_imm_reg(BRW_REGISTER_TYPE_F);
447 imm.dw1.f = f;
448 return imm;
449 }
450
451 /** Construct integer immediate register */
452 static inline struct brw_reg
453 brw_imm_d(int d)
454 {
455 struct brw_reg imm = brw_imm_reg(BRW_REGISTER_TYPE_D);
456 imm.dw1.d = d;
457 return imm;
458 }
459
460 /** Construct uint immediate register */
461 static inline struct brw_reg
462 brw_imm_ud(unsigned ud)
463 {
464 struct brw_reg imm = brw_imm_reg(BRW_REGISTER_TYPE_UD);
465 imm.dw1.ud = ud;
466 return imm;
467 }
468
469 /** Construct ushort immediate register */
470 static inline struct brw_reg
471 brw_imm_uw(uint16_t uw)
472 {
473 struct brw_reg imm = brw_imm_reg(BRW_REGISTER_TYPE_UW);
474 imm.dw1.ud = uw | (uw << 16);
475 return imm;
476 }
477
478 /** Construct short immediate register */
479 static inline struct brw_reg
480 brw_imm_w(int16_t w)
481 {
482 struct brw_reg imm = brw_imm_reg(BRW_REGISTER_TYPE_W);
483 imm.dw1.d = w | (w << 16);
484 return imm;
485 }
486
487 /* brw_imm_b and brw_imm_ub aren't supported by hardware - the type
488 * numbers alias with _V and _VF below:
489 */
490
491 /** Construct vector of eight signed half-byte values */
492 static inline struct brw_reg
493 brw_imm_v(unsigned v)
494 {
495 struct brw_reg imm = brw_imm_reg(BRW_REGISTER_TYPE_V);
496 imm.vstride = BRW_VERTICAL_STRIDE_0;
497 imm.width = BRW_WIDTH_8;
498 imm.hstride = BRW_HORIZONTAL_STRIDE_1;
499 imm.dw1.ud = v;
500 return imm;
501 }
502
503 /** Construct vector of four 8-bit float values */
504 static inline struct brw_reg
505 brw_imm_vf(unsigned v)
506 {
507 struct brw_reg imm = brw_imm_reg(BRW_REGISTER_TYPE_VF);
508 imm.vstride = BRW_VERTICAL_STRIDE_0;
509 imm.width = BRW_WIDTH_4;
510 imm.hstride = BRW_HORIZONTAL_STRIDE_1;
511 imm.dw1.ud = v;
512 return imm;
513 }
514
515 /**
516 * Convert an integer into a "restricted" 8-bit float, used in vector
517 * immediates. The 8-bit floating point format has a sign bit, an
518 * excess-3 3-bit exponent, and a 4-bit mantissa. All integer values
519 * from -31 to 31 can be represented exactly.
520 */
521 static inline uint8_t
522 int_to_float8(int x)
523 {
524 if (x == 0) {
525 return 0;
526 } else if (x < 0) {
527 return 1 << 7 | int_to_float8(-x);
528 } else {
529 const unsigned exponent = _mesa_logbase2(x);
530 const unsigned mantissa = (x - (1 << exponent)) << (4 - exponent);
531 assert(exponent <= 4);
532 return (exponent + 3) << 4 | mantissa;
533 }
534 }
535
536 /**
537 * Construct a floating-point packed vector immediate from its integer
538 * values. \sa int_to_float8()
539 */
540 static inline struct brw_reg
541 brw_imm_vf4(int v0, int v1, int v2, int v3)
542 {
543 return brw_imm_vf((int_to_float8(v0) << 0) |
544 (int_to_float8(v1) << 8) |
545 (int_to_float8(v2) << 16) |
546 (int_to_float8(v3) << 24));
547 }
548
549
550 static inline struct brw_reg
551 brw_address(struct brw_reg reg)
552 {
553 return brw_imm_uw(reg.nr * REG_SIZE + reg.subnr);
554 }
555
556 /** Construct float[1] general-purpose register */
557 static inline struct brw_reg
558 brw_vec1_grf(unsigned nr, unsigned subnr)
559 {
560 return brw_vec1_reg(BRW_GENERAL_REGISTER_FILE, nr, subnr);
561 }
562
563 /** Construct float[2] general-purpose register */
564 static inline struct brw_reg
565 brw_vec2_grf(unsigned nr, unsigned subnr)
566 {
567 return brw_vec2_reg(BRW_GENERAL_REGISTER_FILE, nr, subnr);
568 }
569
570 /** Construct float[4] general-purpose register */
571 static inline struct brw_reg
572 brw_vec4_grf(unsigned nr, unsigned subnr)
573 {
574 return brw_vec4_reg(BRW_GENERAL_REGISTER_FILE, nr, subnr);
575 }
576
577 /** Construct float[8] general-purpose register */
578 static inline struct brw_reg
579 brw_vec8_grf(unsigned nr, unsigned subnr)
580 {
581 return brw_vec8_reg(BRW_GENERAL_REGISTER_FILE, nr, subnr);
582 }
583
584
585 static inline struct brw_reg
586 brw_uw8_grf(unsigned nr, unsigned subnr)
587 {
588 return brw_uw8_reg(BRW_GENERAL_REGISTER_FILE, nr, subnr);
589 }
590
591 static inline struct brw_reg
592 brw_uw16_grf(unsigned nr, unsigned subnr)
593 {
594 return brw_uw16_reg(BRW_GENERAL_REGISTER_FILE, nr, subnr);
595 }
596
597
598 /** Construct null register (usually used for setting condition codes) */
599 static inline struct brw_reg
600 brw_null_reg(void)
601 {
602 return brw_vec8_reg(BRW_ARCHITECTURE_REGISTER_FILE, BRW_ARF_NULL, 0);
603 }
604
605 static inline struct brw_reg
606 brw_address_reg(unsigned subnr)
607 {
608 return brw_uw1_reg(BRW_ARCHITECTURE_REGISTER_FILE, BRW_ARF_ADDRESS, subnr);
609 }
610
611 /* If/else instructions break in align16 mode if writemask & swizzle
612 * aren't xyzw. This goes against the convention for other scalar
613 * regs:
614 */
615 static inline struct brw_reg
616 brw_ip_reg(void)
617 {
618 return brw_reg(BRW_ARCHITECTURE_REGISTER_FILE,
619 BRW_ARF_IP,
620 0,
621 BRW_REGISTER_TYPE_UD,
622 BRW_VERTICAL_STRIDE_4, /* ? */
623 BRW_WIDTH_1,
624 BRW_HORIZONTAL_STRIDE_0,
625 BRW_SWIZZLE_XYZW, /* NOTE! */
626 WRITEMASK_XYZW); /* NOTE! */
627 }
628
629 static inline struct brw_reg
630 brw_acc_reg(void)
631 {
632 return brw_vec8_reg(BRW_ARCHITECTURE_REGISTER_FILE, BRW_ARF_ACCUMULATOR, 0);
633 }
634
635 static inline struct brw_reg
636 brw_flag_reg(int reg, int subreg)
637 {
638 return brw_uw1_reg(BRW_ARCHITECTURE_REGISTER_FILE,
639 BRW_ARF_FLAG + reg, subreg);
640 }
641
642
643 static inline struct brw_reg
644 brw_mask_reg(unsigned subnr)
645 {
646 return brw_uw1_reg(BRW_ARCHITECTURE_REGISTER_FILE, BRW_ARF_MASK, subnr);
647 }
648
649 static inline struct brw_reg
650 brw_message_reg(unsigned nr)
651 {
652 assert((nr & ~(1 << 7)) < BRW_MAX_MRF);
653 return brw_vec8_reg(BRW_MESSAGE_REGISTER_FILE, nr, 0);
654 }
655
656 static inline struct brw_reg
657 brw_uvec_mrf(unsigned width, unsigned nr, unsigned subnr)
658 {
659 return retype(brw_vecn_reg(width, BRW_MESSAGE_REGISTER_FILE, nr, subnr),
660 BRW_REGISTER_TYPE_UD);
661 }
662
663 /* This is almost always called with a numeric constant argument, so
664 * make things easy to evaluate at compile time:
665 */
666 static inline unsigned cvt(unsigned val)
667 {
668 switch (val) {
669 case 0: return 0;
670 case 1: return 1;
671 case 2: return 2;
672 case 4: return 3;
673 case 8: return 4;
674 case 16: return 5;
675 case 32: return 6;
676 }
677 return 0;
678 }
679
680 static inline struct brw_reg
681 stride(struct brw_reg reg, unsigned vstride, unsigned width, unsigned hstride)
682 {
683 reg.vstride = cvt(vstride);
684 reg.width = cvt(width) - 1;
685 reg.hstride = cvt(hstride);
686 return reg;
687 }
688
689
690 static inline struct brw_reg
691 vec16(struct brw_reg reg)
692 {
693 return stride(reg, 16,16,1);
694 }
695
696 static inline struct brw_reg
697 vec8(struct brw_reg reg)
698 {
699 return stride(reg, 8,8,1);
700 }
701
702 static inline struct brw_reg
703 vec4(struct brw_reg reg)
704 {
705 return stride(reg, 4,4,1);
706 }
707
708 static inline struct brw_reg
709 vec2(struct brw_reg reg)
710 {
711 return stride(reg, 2,2,1);
712 }
713
714 static inline struct brw_reg
715 vec1(struct brw_reg reg)
716 {
717 return stride(reg, 0,1,0);
718 }
719
720
721 static inline struct brw_reg
722 get_element(struct brw_reg reg, unsigned elt)
723 {
724 return vec1(suboffset(reg, elt));
725 }
726
727 static inline struct brw_reg
728 get_element_ud(struct brw_reg reg, unsigned elt)
729 {
730 return vec1(suboffset(retype(reg, BRW_REGISTER_TYPE_UD), elt));
731 }
732
733 static inline struct brw_reg
734 get_element_d(struct brw_reg reg, unsigned elt)
735 {
736 return vec1(suboffset(retype(reg, BRW_REGISTER_TYPE_D), elt));
737 }
738
739
740 static inline struct brw_reg
741 brw_swizzle(struct brw_reg reg, unsigned x, unsigned y, unsigned z, unsigned w)
742 {
743 assert(reg.file != BRW_IMMEDIATE_VALUE);
744
745 reg.dw1.bits.swizzle = BRW_SWIZZLE4(BRW_GET_SWZ(reg.dw1.bits.swizzle, x),
746 BRW_GET_SWZ(reg.dw1.bits.swizzle, y),
747 BRW_GET_SWZ(reg.dw1.bits.swizzle, z),
748 BRW_GET_SWZ(reg.dw1.bits.swizzle, w));
749 return reg;
750 }
751
752
753 static inline struct brw_reg
754 brw_swizzle1(struct brw_reg reg, unsigned x)
755 {
756 return brw_swizzle(reg, x, x, x, x);
757 }
758
759 static inline struct brw_reg
760 brw_writemask(struct brw_reg reg, unsigned mask)
761 {
762 assert(reg.file != BRW_IMMEDIATE_VALUE);
763 reg.dw1.bits.writemask &= mask;
764 return reg;
765 }
766
767 static inline struct brw_reg
768 brw_set_writemask(struct brw_reg reg, unsigned mask)
769 {
770 assert(reg.file != BRW_IMMEDIATE_VALUE);
771 reg.dw1.bits.writemask = mask;
772 return reg;
773 }
774
775 static inline struct brw_reg
776 negate(struct brw_reg reg)
777 {
778 reg.negate ^= 1;
779 return reg;
780 }
781
782 static inline struct brw_reg
783 brw_abs(struct brw_reg reg)
784 {
785 reg.abs = 1;
786 reg.negate = 0;
787 return reg;
788 }
789
790 /************************************************************************/
791
792 static inline struct brw_reg
793 brw_vec4_indirect(unsigned subnr, int offset)
794 {
795 struct brw_reg reg = brw_vec4_grf(0, 0);
796 reg.subnr = subnr;
797 reg.address_mode = BRW_ADDRESS_REGISTER_INDIRECT_REGISTER;
798 reg.dw1.bits.indirect_offset = offset;
799 return reg;
800 }
801
802 static inline struct brw_reg
803 brw_vec1_indirect(unsigned subnr, int offset)
804 {
805 struct brw_reg reg = brw_vec1_grf(0, 0);
806 reg.subnr = subnr;
807 reg.address_mode = BRW_ADDRESS_REGISTER_INDIRECT_REGISTER;
808 reg.dw1.bits.indirect_offset = offset;
809 return reg;
810 }
811
812 static inline struct brw_reg
813 deref_4f(struct brw_indirect ptr, int offset)
814 {
815 return brw_vec4_indirect(ptr.addr_subnr, ptr.addr_offset + offset);
816 }
817
818 static inline struct brw_reg
819 deref_1f(struct brw_indirect ptr, int offset)
820 {
821 return brw_vec1_indirect(ptr.addr_subnr, ptr.addr_offset + offset);
822 }
823
824 static inline struct brw_reg
825 deref_4b(struct brw_indirect ptr, int offset)
826 {
827 return retype(deref_4f(ptr, offset), BRW_REGISTER_TYPE_B);
828 }
829
830 static inline struct brw_reg
831 deref_1uw(struct brw_indirect ptr, int offset)
832 {
833 return retype(deref_1f(ptr, offset), BRW_REGISTER_TYPE_UW);
834 }
835
836 static inline struct brw_reg
837 deref_1d(struct brw_indirect ptr, int offset)
838 {
839 return retype(deref_1f(ptr, offset), BRW_REGISTER_TYPE_D);
840 }
841
842 static inline struct brw_reg
843 deref_1ud(struct brw_indirect ptr, int offset)
844 {
845 return retype(deref_1f(ptr, offset), BRW_REGISTER_TYPE_UD);
846 }
847
848 static inline struct brw_reg
849 get_addr_reg(struct brw_indirect ptr)
850 {
851 return brw_address_reg(ptr.addr_subnr);
852 }
853
854 static inline struct brw_indirect
855 brw_indirect_offset(struct brw_indirect ptr, int offset)
856 {
857 ptr.addr_offset += offset;
858 return ptr;
859 }
860
861 static inline struct brw_indirect
862 brw_indirect(unsigned addr_subnr, int offset)
863 {
864 struct brw_indirect ptr;
865 ptr.addr_subnr = addr_subnr;
866 ptr.addr_offset = offset;
867 ptr.pad = 0;
868 return ptr;
869 }
870
871 #ifdef __cplusplus
872 }
873 #endif
874
875 #endif