Merge branch 'sprite-coord'
[mesa.git] / src / gallium / drivers / nv50 / nv50_program.h
1 /*
2 * Copyright 2010 Ben Skeggs
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
18 * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF
19 * OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
20 * SOFTWARE.
21 */
22
23 #ifndef __NV50_PROG_H__
24 #define __NV50_PROG_H__
25
26 #include "pipe/p_state.h"
27 #include "tgsi/tgsi_scan.h"
28
/* Sizes the first dimension of nv50_subroutine::argv and ::retv, i.e. the
 * number of TEMP[] rows the subroutine input/output analysis can record. */
29 #define NV50_CAP_MAX_PROGRAM_TEMPS 64
30
/* One entry of nv50_program::in[] / ::out[]: ties a TGSI index and semantic
 * to a hardware index, plus a few flags packed into an 8-bit bitfield. */
31 struct nv50_varying {
32 uint8_t id; /* tgsi index */
33 uint8_t hw; /* hw index, nv50 wants flat FP inputs last */
34
35 unsigned mask : 4; /* NOTE(review): presumably one bit per component -- confirm */
36 unsigned linear : 1; /* NOTE(review): presumably requests linear interpolation -- confirm */
37 unsigned pad : 3; /* rounds the bitfield up to 8 bits (4 + 1 + 3) */
38
39 ubyte sn; /* semantic name */
40 ubyte si; /* semantic index */
41 };
42
/* Driver-side representation of one shader program: the gallium shader state,
 * the code and immediate buffers, register usage, the input/output varying
 * tables, per-stage (vp / fp / gp) data and relocation records. */
43 struct nv50_program {
44 struct pipe_shader_state pipe;
45
46 ubyte type; /* NOTE(review): presumably the shader stage -- confirm against users */
47 boolean translated; /* NOTE(review): presumably set once nv50_program_tx() has run -- confirm */
48 boolean uses_lmem; /* NOTE(review): presumably "uses local memory" -- confirm */
49
50 struct nouveau_bo *bo; /* buffer object; code_start below is an offset inside it */
51 struct nouveau_stateobj *so;
52
53 uint32_t *code;
54 unsigned code_size; /* NOTE(review): unit (bytes vs. 32-bit words) not visible here */
55 unsigned code_start; /* offset inside bo */
56 uint32_t *immd;
57 unsigned immd_size; /* NOTE(review): unit (bytes vs. 32-bit words) not visible here */
58 unsigned parm_size; /* size limit of uniform buffer */
59
60 ubyte max_gpr; /* REG_ALLOC_TEMP */
61 ubyte max_out; /* REG_ALLOC_RESULT or FP_RESULT_COUNT */
62
63 ubyte in_nr; /* NOTE(review): presumably the number of used entries in in[] */
64 ubyte out_nr; /* NOTE(review): presumably the number of used entries in out[] */
65 struct nv50_varying in[16];
66 struct nv50_varying out[16];
67
/* vertex program specific data */
68 struct {
69 uint32_t attrs[3]; /* VP_ATTR_EN_0,1 and VP_GP_BUILTIN_ATTR_EN */
70 ubyte psiz;
71 ubyte bfc[2];
72 ubyte edgeflag;
73 ubyte clpd;
74 ubyte clpd_nr;
75 } vp;
76
/* fragment program specific data; the comments give hardware method offsets */
77 struct {
78 uint32_t flags[2]; /* 0x19a8, 0x196c */
79 uint32_t interp; /* 0x1988 */
80 uint32_t colors; /* 0x1904 */
81 } fp;
82
/* geometry program specific data */
83 struct {
84 ubyte primid; /* primitive id output register */
85 uint8_t vert_count;
86 uint8_t prim_type; /* point, line strip or tri strip */
87 } gp;
88
89 /* relocation records */
90 void *fixups; /* opaque here: the record type is not declared in this header */
91 unsigned num_fixups;
92 };
93
/* Interpolation flags. Each value is a distinct single bit, so they can be
 * combined with bitwise OR.
 * NOTE(review): presumably the values stored in
 * nv50_translation_info::interp_mode[] -- confirm against the translator. */
94 #define NV50_INTERP_LINEAR (1 << 0)
95 #define NV50_INTERP_FLAT (1 << 1)
96 #define NV50_INTERP_CENTROID (1 << 2)
97
98 /* analyze TGSI and see which TEMP[] are used as subroutine inputs/outputs */
/* Per-subroutine result of that analysis. argv and retv each hold
 * NV50_CAP_MAX_PROGRAM_TEMPS rows of four 32-bit words.
 * NOTE(review): the four columns presumably map to the x/y/z/w components of
 * a TEMP -- confirm against the code that fills them. */
99 struct nv50_subroutine {
100 unsigned id;
101 unsigned pos; /* NOTE(review): presumably the subroutine's position in the instruction stream -- confirm */
102 /* function inputs and outputs */
103 uint32_t argv[NV50_CAP_MAX_PROGRAM_TEMPS][4];
104 uint32_t retv[NV50_CAP_MAX_PROGRAM_TEMPS][4];
105 };
106
/* State describing one program while it is being translated; this is the
 * argument type of nv50_generate_code(). It bundles the target program, the
 * TGSI instructions and scan results, input/output mapping tables, the
 * collected 32-bit immediates and the subroutine table. */
107 struct nv50_translation_info {
108 struct nv50_program *p; /* program being translated */
109 unsigned inst_nr; /* NOTE(review): presumably the number of entries in insns */
110 struct tgsi_full_instruction *insns;
111 ubyte input_file; /* NOTE(review): presumably the register file inputs are read from -- confirm */
112 ubyte output_file; /* NOTE(review): presumably the register file outputs are written to -- confirm */
113 ubyte input_map[PIPE_MAX_SHADER_INPUTS][4]; /* one row per shader input, four entries each */
114 ubyte output_map[PIPE_MAX_SHADER_OUTPUTS][4]; /* one row per shader output, four entries each */
115 ubyte interp_mode[PIPE_MAX_SHADER_INPUTS]; /* NOTE(review): presumably NV50_INTERP_* flags per input -- confirm */
116 int input_access[PIPE_MAX_SHADER_INPUTS][4]; /* NOTE(review): meaning of the stored ints is not visible here */
117 int output_access[PIPE_MAX_SHADER_OUTPUTS][4]; /* NOTE(review): meaning of the stored ints is not visible here */
118 boolean indirect_inputs;
119 boolean indirect_outputs;
120 boolean store_to_memory;
121 struct tgsi_shader_info scan;
122 uint32_t *immd32;
123 unsigned immd32_nr; /* NOTE(review): presumably the number of entries in immd32 */
124 ubyte *immd32_ty; /* NOTE(review): presumably a type tag per immd32 entry -- confirm */
125 ubyte edgeflag_out;
126 struct nv50_subroutine *subr;
127 unsigned subr_nr; /* NOTE(review): presumably the number of entries in subr */
128 };
129
/* Entry points implemented outside this header; the notes below are hedged
 * because the definitions are not visible from here. */

/* NOTE(review): presumably generates hardware code for ti->p from the
 * information in ti; the meaning of the int return value (0 on success?) must
 * be confirmed in the implementation. */
130 int nv50_generate_code(struct nv50_translation_info *ti);
131
/* NOTE(review): presumably applies p's relocation records (fixups) using the
 * given code and data base addresses -- confirm in the implementation. */
132 void nv50_relocate_program(struct nv50_program *p,
133 uint32_t code_base, uint32_t data_base);
134
/* NOTE(review): presumably translates p and reports success as a boolean --
 * confirm in the implementation. */
135 boolean nv50_program_tx(struct nv50_program *p);
136
137 #endif /* __NV50_PROG_H__ */