freedreno/a3xx: only emit dirty consts
[mesa.git] / src / gallium / drivers / nouveau / nvc0 / nvc0_screen.h
1 #ifndef __NVC0_SCREEN_H__
2 #define __NVC0_SCREEN_H__
3
4 #include "nouveau_screen.h"
5 #include "nouveau_mm.h"
6 #include "nouveau_fence.h"
7 #include "nouveau_heap.h"
8
9 #include "nv_object.xml.h"
10
11 #include "nvc0/nvc0_winsys.h"
12 #include "nvc0/nvc0_stateobj.h"
13
14 #define NVC0_TIC_MAX_ENTRIES 2048
15 #define NVC0_TSC_MAX_ENTRIES 2048
16
17 /* doesn't count reserved slots (for auxiliary constants, immediates, etc.) */
18 #define NVC0_MAX_PIPE_CONSTBUFS 14
19 #define NVE4_MAX_PIPE_CONSTBUFS_COMPUTE 7
20
21 #define NVC0_MAX_SURFACE_SLOTS 16
22
23 #define NVC0_MAX_VIEWPORTS 16
24
25
26 struct nvc0_context;
27
28 struct nvc0_blitter;
29
30 struct nvc0_screen {
31 struct nouveau_screen base;
32
33 struct nvc0_context *cur_ctx;
34
35 int num_occlusion_queries_active;
36
37 struct nouveau_bo *text;
38 struct nouveau_bo *parm; /* for COMPUTE */
39 struct nouveau_bo *uniform_bo; /* for 3D */
40 struct nouveau_bo *tls;
41 struct nouveau_bo *txc; /* TIC (offset 0) and TSC (65536) */
42 struct nouveau_bo *poly_cache;
43
44 uint16_t mp_count;
45 uint16_t mp_count_compute; /* magic reg can make compute use fewer MPs */
46
47 struct nouveau_heap *text_heap;
48 struct nouveau_heap *lib_code; /* allocated from text_heap */
49
50 struct nvc0_blitter *blitter;
51
52 struct {
53 void **entries;
54 int next;
55 uint32_t lock[NVC0_TIC_MAX_ENTRIES / 32];
56 } tic;
57
58 struct {
59 void **entries;
60 int next;
61 uint32_t lock[NVC0_TSC_MAX_ENTRIES / 32];
62 } tsc;
63
64 struct {
65 struct nouveau_bo *bo;
66 uint32_t *map;
67 } fence;
68
69 struct {
70 struct nvc0_program *prog; /* compute state object to read MP counters */
71 struct pipe_query *mp_counter[8]; /* counter to query allocation */
72 uint8_t num_mp_pm_active[2];
73 boolean mp_counters_enabled;
74 } pm;
75
76 struct nouveau_mman *mm_VRAM_fe0;
77
78 struct nouveau_object *eng3d; /* sqrt(1/2)|kepler> + sqrt(1/2)|fermi> */
79 struct nouveau_object *eng2d;
80 struct nouveau_object *m2mf;
81 struct nouveau_object *compute;
82 struct nouveau_object *nvsw;
83 };
84
85 static INLINE struct nvc0_screen *
86 nvc0_screen(struct pipe_screen *screen)
87 {
88 return (struct nvc0_screen *)screen;
89 }
90
91
92 /* Performance counter queries:
93 */
94 #define NVE4_PM_QUERY_COUNT 49
95 #define NVE4_PM_QUERY(i) (PIPE_QUERY_DRIVER_SPECIFIC + (i))
96 #define NVE4_PM_QUERY_LAST NVE4_PM_QUERY(NVE4_PM_QUERY_COUNT - 1)
97 #define NVE4_PM_QUERY_PROF_TRIGGER_0 0
98 #define NVE4_PM_QUERY_PROF_TRIGGER_1 1
99 #define NVE4_PM_QUERY_PROF_TRIGGER_2 2
100 #define NVE4_PM_QUERY_PROF_TRIGGER_3 3
101 #define NVE4_PM_QUERY_PROF_TRIGGER_4 4
102 #define NVE4_PM_QUERY_PROF_TRIGGER_5 5
103 #define NVE4_PM_QUERY_PROF_TRIGGER_6 6
104 #define NVE4_PM_QUERY_PROF_TRIGGER_7 7
105 #define NVE4_PM_QUERY_LAUNCHED_WARPS 8
106 #define NVE4_PM_QUERY_LAUNCHED_THREADS 9
107 #define NVE4_PM_QUERY_LAUNCHED_CTA 10
108 #define NVE4_PM_QUERY_INST_ISSUED1 11
109 #define NVE4_PM_QUERY_INST_ISSUED2 12
110 #define NVE4_PM_QUERY_INST_EXECUTED 13
111 #define NVE4_PM_QUERY_LD_LOCAL 14
112 #define NVE4_PM_QUERY_ST_LOCAL 15
113 #define NVE4_PM_QUERY_LD_SHARED 16
114 #define NVE4_PM_QUERY_ST_SHARED 17
115 #define NVE4_PM_QUERY_L1_LOCAL_LOAD_HIT 18
116 #define NVE4_PM_QUERY_L1_LOCAL_LOAD_MISS 19
117 #define NVE4_PM_QUERY_L1_LOCAL_STORE_HIT 20
118 #define NVE4_PM_QUERY_L1_LOCAL_STORE_MISS 21
119 #define NVE4_PM_QUERY_GLD_REQUEST 22
120 #define NVE4_PM_QUERY_GST_REQUEST 23
121 #define NVE4_PM_QUERY_L1_GLOBAL_LOAD_HIT 24
122 #define NVE4_PM_QUERY_L1_GLOBAL_LOAD_MISS 25
123 #define NVE4_PM_QUERY_GLD_TRANSACTIONS_UNCACHED 26
124 #define NVE4_PM_QUERY_GST_TRANSACTIONS 27
125 #define NVE4_PM_QUERY_BRANCH 28
126 #define NVE4_PM_QUERY_BRANCH_DIVERGENT 29
127 #define NVE4_PM_QUERY_ACTIVE_WARPS 30
128 #define NVE4_PM_QUERY_ACTIVE_CYCLES 31
129 #define NVE4_PM_QUERY_INST_ISSUED 32
130 #define NVE4_PM_QUERY_ATOM_COUNT 33
131 #define NVE4_PM_QUERY_GRED_COUNT 34
132 #define NVE4_PM_QUERY_LD_SHARED_REPLAY 35
133 #define NVE4_PM_QUERY_ST_SHARED_REPLAY 36
134 #define NVE4_PM_QUERY_LD_LOCAL_TRANSACTIONS 37
135 #define NVE4_PM_QUERY_ST_LOCAL_TRANSACTIONS 38
136 #define NVE4_PM_QUERY_L1_LD_SHARED_TRANSACTIONS 39
137 #define NVE4_PM_QUERY_L1_ST_SHARED_TRANSACTIONS 40
138 #define NVE4_PM_QUERY_GLD_MEM_DIV_REPLAY 41
139 #define NVE4_PM_QUERY_GST_MEM_DIV_REPLAY 42
140 #define NVE4_PM_QUERY_METRIC_IPC 43
141 #define NVE4_PM_QUERY_METRIC_IPAC 44
142 #define NVE4_PM_QUERY_METRIC_IPEC 45
143 #define NVE4_PM_QUERY_METRIC_MP_OCCUPANCY 46
144 #define NVE4_PM_QUERY_METRIC_MP_EFFICIENCY 47
145 #define NVE4_PM_QUERY_METRIC_INST_REPLAY_OHEAD 48
146
147 /*
148 #define NVE4_PM_QUERY_GR_IDLE 50
149 #define NVE4_PM_QUERY_BSP_IDLE 51
150 #define NVE4_PM_QUERY_VP_IDLE 52
151 #define NVE4_PM_QUERY_PPP_IDLE 53
152 #define NVE4_PM_QUERY_CE0_IDLE 54
153 #define NVE4_PM_QUERY_CE1_IDLE 55
154 #define NVE4_PM_QUERY_CE2_IDLE 56
155 */
156 /* L2 queries (PCOUNTER) */
157 /*
158 #define NVE4_PM_QUERY_L2_SUBP_WRITE_L1_SECTOR_QUERIES 57
159 ...
160 */
161 /* TEX queries (PCOUNTER) */
162 /*
163 #define NVE4_PM_QUERY_TEX0_CACHE_SECTOR_QUERIES 58
164 ...
165 */
166
167 #define NVC0_PM_QUERY_COUNT 31
168 #define NVC0_PM_QUERY(i) (PIPE_QUERY_DRIVER_SPECIFIC + 2048 + (i))
169 #define NVC0_PM_QUERY_LAST NVC0_PM_QUERY(NVC0_PM_QUERY_COUNT - 1)
170 #define NVC0_PM_QUERY_INST_EXECUTED 0
171 #define NVC0_PM_QUERY_BRANCH 1
172 #define NVC0_PM_QUERY_BRANCH_DIVERGENT 2
173 #define NVC0_PM_QUERY_ACTIVE_WARPS 3
174 #define NVC0_PM_QUERY_ACTIVE_CYCLES 4
175 #define NVC0_PM_QUERY_LAUNCHED_WARPS 5
176 #define NVC0_PM_QUERY_LAUNCHED_THREADS 6
177 #define NVC0_PM_QUERY_LD_SHARED 7
178 #define NVC0_PM_QUERY_ST_SHARED 8
179 #define NVC0_PM_QUERY_LD_LOCAL 9
180 #define NVC0_PM_QUERY_ST_LOCAL 10
181 #define NVC0_PM_QUERY_GRED_COUNT 11
182 #define NVC0_PM_QUERY_ATOM_COUNT 12
183 #define NVC0_PM_QUERY_GLD_REQUEST 13
184 #define NVC0_PM_QUERY_GST_REQUEST 14
185 #define NVC0_PM_QUERY_INST_ISSUED1_0 15
186 #define NVC0_PM_QUERY_INST_ISSUED1_1 16
187 #define NVC0_PM_QUERY_INST_ISSUED2_0 17
188 #define NVC0_PM_QUERY_INST_ISSUED2_1 18
189 #define NVC0_PM_QUERY_TH_INST_EXECUTED_0 19
190 #define NVC0_PM_QUERY_TH_INST_EXECUTED_1 20
191 #define NVC0_PM_QUERY_TH_INST_EXECUTED_2 21
192 #define NVC0_PM_QUERY_TH_INST_EXECUTED_3 22
193 #define NVC0_PM_QUERY_PROF_TRIGGER_0 23
194 #define NVC0_PM_QUERY_PROF_TRIGGER_1 24
195 #define NVC0_PM_QUERY_PROF_TRIGGER_2 25
196 #define NVC0_PM_QUERY_PROF_TRIGGER_3 26
197 #define NVC0_PM_QUERY_PROF_TRIGGER_4 27
198 #define NVC0_PM_QUERY_PROF_TRIGGER_5 28
199 #define NVC0_PM_QUERY_PROF_TRIGGER_6 29
200 #define NVC0_PM_QUERY_PROF_TRIGGER_7 30
201
202 /* Driver statistics queries:
203 */
204 #ifdef NOUVEAU_ENABLE_DRIVER_STATISTICS
205
206 #define NVC0_QUERY_DRV_STAT(i) (PIPE_QUERY_DRIVER_SPECIFIC + 1024 + (i))
207 #define NVC0_QUERY_DRV_STAT_COUNT 29
208 #define NVC0_QUERY_DRV_STAT_LAST NVC0_QUERY_DRV_STAT(NVC0_QUERY_DRV_STAT_COUNT - 1)
209 #define NVC0_QUERY_DRV_STAT_TEX_OBJECT_CURRENT_COUNT 0
210 #define NVC0_QUERY_DRV_STAT_TEX_OBJECT_CURRENT_BYTES 1
211 #define NVC0_QUERY_DRV_STAT_BUF_OBJECT_CURRENT_COUNT 2
212 #define NVC0_QUERY_DRV_STAT_BUF_OBJECT_CURRENT_BYTES_VID 3
213 #define NVC0_QUERY_DRV_STAT_BUF_OBJECT_CURRENT_BYTES_SYS 4
214 #define NVC0_QUERY_DRV_STAT_TEX_TRANSFERS_READ 5
215 #define NVC0_QUERY_DRV_STAT_TEX_TRANSFERS_WRITE 6
216 #define NVC0_QUERY_DRV_STAT_TEX_COPY_COUNT 7
217 #define NVC0_QUERY_DRV_STAT_TEX_BLIT_COUNT 8
218 #define NVC0_QUERY_DRV_STAT_TEX_CACHE_FLUSH_COUNT 9
219 #define NVC0_QUERY_DRV_STAT_BUF_TRANSFERS_READ 10
220 #define NVC0_QUERY_DRV_STAT_BUF_TRANSFERS_WRITE 11
221 #define NVC0_QUERY_DRV_STAT_BUF_READ_BYTES_STAGING_VID 12
222 #define NVC0_QUERY_DRV_STAT_BUF_WRITE_BYTES_DIRECT 13
223 #define NVC0_QUERY_DRV_STAT_BUF_WRITE_BYTES_STAGING_VID 14
224 #define NVC0_QUERY_DRV_STAT_BUF_WRITE_BYTES_STAGING_SYS 15
225 #define NVC0_QUERY_DRV_STAT_BUF_COPY_BYTES 16
226 #define NVC0_QUERY_DRV_STAT_BUF_NON_KERNEL_FENCE_SYNC_COUNT 17
227 #define NVC0_QUERY_DRV_STAT_ANY_NON_KERNEL_FENCE_SYNC_COUNT 18
228 #define NVC0_QUERY_DRV_STAT_QUERY_SYNC_COUNT 19
229 #define NVC0_QUERY_DRV_STAT_GPU_SERIALIZE_COUNT 20
230 #define NVC0_QUERY_DRV_STAT_DRAW_CALLS_ARRAY 21
231 #define NVC0_QUERY_DRV_STAT_DRAW_CALLS_INDEXED 22
232 #define NVC0_QUERY_DRV_STAT_DRAW_CALLS_FALLBACK_COUNT 23
233 #define NVC0_QUERY_DRV_STAT_USER_BUFFER_UPLOAD_BYTES 24
234 #define NVC0_QUERY_DRV_STAT_CONSTBUF_UPLOAD_COUNT 25
235 #define NVC0_QUERY_DRV_STAT_CONSTBUF_UPLOAD_BYTES 26
236 #define NVC0_QUERY_DRV_STAT_PUSHBUF_COUNT 27
237 #define NVC0_QUERY_DRV_STAT_RESOURCE_VALIDATE_COUNT 28
238
239 #else
240
241 #define NVC0_QUERY_DRV_STAT_COUNT 0
242
243 #endif
244
245 int nvc0_screen_get_driver_query_info(struct pipe_screen *, unsigned,
246 struct pipe_driver_query_info *);
247
248 boolean nvc0_blitter_create(struct nvc0_screen *);
249 void nvc0_blitter_destroy(struct nvc0_screen *);
250
251 void nvc0_screen_make_buffers_resident(struct nvc0_screen *);
252
253 int nvc0_screen_tic_alloc(struct nvc0_screen *, void *);
254 int nvc0_screen_tsc_alloc(struct nvc0_screen *, void *);
255
256 int nve4_screen_compute_setup(struct nvc0_screen *, struct nouveau_pushbuf *);
257 int nvc0_screen_compute_setup(struct nvc0_screen *, struct nouveau_pushbuf *);
258
259 boolean nvc0_screen_resize_tls_area(struct nvc0_screen *, uint32_t lpos,
260 uint32_t lneg, uint32_t cstack);
261
262 static INLINE void
263 nvc0_resource_fence(struct nv04_resource *res, uint32_t flags)
264 {
265 struct nvc0_screen *screen = nvc0_screen(res->base.screen);
266
267 if (res->mm) {
268 nouveau_fence_ref(screen->base.fence.current, &res->fence);
269 if (flags & NOUVEAU_BO_WR)
270 nouveau_fence_ref(screen->base.fence.current, &res->fence_wr);
271 }
272 }
273
274 static INLINE void
275 nvc0_resource_validate(struct nv04_resource *res, uint32_t flags)
276 {
277 if (likely(res->bo)) {
278 if (flags & NOUVEAU_BO_WR)
279 res->status |= NOUVEAU_BUFFER_STATUS_GPU_WRITING |
280 NOUVEAU_BUFFER_STATUS_DIRTY;
281 if (flags & NOUVEAU_BO_RD)
282 res->status |= NOUVEAU_BUFFER_STATUS_GPU_READING;
283
284 nvc0_resource_fence(res, flags);
285 }
286 }
287
288 struct nvc0_format {
289 uint32_t rt;
290 uint32_t tic;
291 uint32_t vtx;
292 uint32_t usage;
293 };
294
295 extern const struct nvc0_format nvc0_format_table[];
296
297 static INLINE void
298 nvc0_screen_tic_unlock(struct nvc0_screen *screen, struct nv50_tic_entry *tic)
299 {
300 if (tic->id >= 0)
301 screen->tic.lock[tic->id / 32] &= ~(1 << (tic->id % 32));
302 }
303
304 static INLINE void
305 nvc0_screen_tsc_unlock(struct nvc0_screen *screen, struct nv50_tsc_entry *tsc)
306 {
307 if (tsc->id >= 0)
308 screen->tsc.lock[tsc->id / 32] &= ~(1 << (tsc->id % 32));
309 }
310
311 static INLINE void
312 nvc0_screen_tic_free(struct nvc0_screen *screen, struct nv50_tic_entry *tic)
313 {
314 if (tic->id >= 0) {
315 screen->tic.entries[tic->id] = NULL;
316 screen->tic.lock[tic->id / 32] &= ~(1 << (tic->id % 32));
317 }
318 }
319
320 static INLINE void
321 nvc0_screen_tsc_free(struct nvc0_screen *screen, struct nv50_tsc_entry *tsc)
322 {
323 if (tsc->id >= 0) {
324 screen->tsc.entries[tsc->id] = NULL;
325 screen->tsc.lock[tsc->id / 32] &= ~(1 << (tsc->id % 32));
326 }
327 }
328
329 #endif