Merge remote branch 'origin/nv50-compiler'
[mesa.git] / src / gallium / drivers / nv50 / nv50_program.h
1 /*
2 * Copyright 2010 Ben Skeggs
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
18 * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF
19 * OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
20 * SOFTWARE.
21 */
22
23 #ifndef __NV50_PROG_H__
24 #define __NV50_PROG_H__
25
26 #include "pipe/p_state.h"
27 #include "tgsi/tgsi_scan.h"
28
/*
 * Upper bound on the TGSI TEMP registers tracked per subroutine; it sizes the
 * argv/retv tables in struct nv50_subroutine.
 */
#define NV50_CAP_MAX_PROGRAM_TEMPS 64
30
31 struct nv50_varying {
32 uint8_t id; /* tgsi index */
33 uint8_t hw; /* hw index, nv50 wants flat FP inputs last */
34
35 uint8_t mask : 4;
36 uint8_t linear : 1;
37 uint8_t pad : 3;
38
39 ubyte sn; /* semantic name */
40 ubyte si; /* semantic index */
41 };
42
43 struct nv50_program {
44 struct pipe_shader_state pipe;
45
46 ubyte type;
47 boolean translated;
48
49 struct nouveau_bo *bo;
50 struct nouveau_stateobj *so;
51
52 uint32_t *code;
53 unsigned code_size;
54 unsigned code_start; /* offset inside bo */
55 uint32_t *immd;
56 unsigned immd_size;
57 unsigned parm_size; /* size limit of uniform buffer */
58
59 ubyte max_gpr; /* REG_ALLOC_TEMP */
60 ubyte max_out; /* REG_ALLOC_RESULT or FP_RESULT_COUNT */
61
62 ubyte in_nr;
63 ubyte out_nr;
64 struct nv50_varying in[16];
65 struct nv50_varying out[16];
66
67 struct {
68 uint32_t attrs[3]; /* VP_ATTR_EN_0,1 and VP_GP_BUILTIN_ATTR_EN */
69 ubyte psiz;
70 ubyte bfc[2];
71 ubyte edgeflag;
72 ubyte clpd;
73 ubyte clpd_nr;
74 } vp;
75
76 struct {
77 uint32_t flags[2]; /* 0x19a8, 196c */
78 uint32_t interp; /* 0x1988 */
79 uint32_t colors; /* 0x1904 */
80 } fp;
81
82 struct {
83 ubyte primid; /* primitive id output register */
84 uint8_t vert_count;
85 uint8_t prim_type; /* point, line strip or tri strip */
86 } gp;
87
88 void *fixups;
89 unsigned num_fixups;
90 };
91
/*
 * Interpolation mode flags. Each value occupies its own bit, so they can be
 * OR'ed together.
 * NOTE(review): presumably the values stored in
 * nv50_translation_info.interp_mode[] - confirm against the users.
 */
#define NV50_INTERP_LINEAR   (1 << 0)
#define NV50_INTERP_FLAT     (1 << 1)
#define NV50_INTERP_CENTROID (1 << 2)
95
96 /* analyze TGSI and see which TEMP[] are used as subroutine inputs/outputs */
97 struct nv50_subroutine {
98 unsigned id;
99 unsigned pos;
100 /* function inputs and outputs */
101 uint32_t argv[NV50_CAP_MAX_PROGRAM_TEMPS][4];
102 uint32_t retv[NV50_CAP_MAX_PROGRAM_TEMPS][4];
103 };
104
105 struct nv50_translation_info {
106 struct nv50_program *p;
107 unsigned inst_nr;
108 struct tgsi_full_instruction *insns;
109 ubyte input_file;
110 ubyte output_file;
111 ubyte input_map[PIPE_MAX_SHADER_INPUTS][4];
112 ubyte output_map[PIPE_MAX_SHADER_OUTPUTS][4];
113 ubyte interp_mode[PIPE_MAX_SHADER_INPUTS];
114 int input_access[PIPE_MAX_SHADER_INPUTS][4];
115 int output_access[PIPE_MAX_SHADER_OUTPUTS][4];
116 boolean indirect_inputs;
117 boolean indirect_outputs;
118 boolean store_to_memory;
119 struct tgsi_shader_info scan;
120 uint32_t *immd32;
121 unsigned immd32_nr;
122 ubyte *immd32_ty;
123 ubyte edgeflag_out;
124 struct nv50_subroutine *subr;
125 unsigned subr_nr;
126 };
127
128 int nv50_generate_code(struct nv50_translation_info *ti);
129 boolean nv50_program_tx(struct nv50_program *p);
130
131 #endif /* __NV50_PROG_H__ */