2 * Copyright 2013 Advanced Micro Devices, Inc.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
25 * This file contains helpers for writing commands to commands streams.
31 #include "radeonsi/si_pipe.h"
32 #include "amd/common/sid.h"
35 * Return true if there is enough memory in VRAM and GTT for the buffers
38 * \param vram VRAM memory size not added to the buffer list yet
39 * \param gtt GTT memory size not added to the buffer list yet
42 radeon_cs_memory_below_limit(struct si_screen
*screen
,
43 struct radeon_winsys_cs
*cs
,
44 uint64_t vram
, uint64_t gtt
)
46 vram
+= cs
->used_vram
;
49 /* Anything that goes above the VRAM size should go to GTT. */
50 if (vram
> screen
->info
.vram_size
)
51 gtt
+= vram
- screen
->info
.vram_size
;
53 /* Now we just need to check if we have enough GTT. */
54 return gtt
< screen
->info
.gart_size
* 0.7;
58 * Add a buffer to the buffer list for the given command stream (CS).
60 * All buffers used by a CS must be added to the list. This tells the kernel
61 * driver which buffers are used by GPU commands. Other buffers can
62 * be swapped out (not accessible) during execution.
64 * The buffer list becomes empty after every context flush and must be
67 static inline void radeon_add_to_buffer_list(struct r600_common_context
*rctx
,
68 struct r600_ring
*ring
,
69 struct r600_resource
*rbo
,
70 enum radeon_bo_usage usage
,
71 enum radeon_bo_priority priority
)
74 rctx
->ws
->cs_add_buffer(
76 (enum radeon_bo_usage
)(usage
| RADEON_USAGE_SYNCHRONIZED
),
77 rbo
->domains
, priority
);
81 * Same as above, but also checks memory usage and flushes the context
84 * When this SHOULD NOT be used:
86 * - if r600_context_add_resource_size has been called for the buffer
87 * followed by *_need_cs_space for checking the memory usage
89 * - if r600_need_dma_space has been called for the buffer
91 * - when emitting state packets and draw packets (because preceding packets
92 * can't be re-emitted at that point)
94 * - if shader resource "enabled_mask" is not up-to-date or there is
95 * a different constraint disallowing a context flush
98 radeon_add_to_gfx_buffer_list_check_mem(struct si_context
*sctx
,
99 struct r600_resource
*rbo
,
100 enum radeon_bo_usage usage
,
101 enum radeon_bo_priority priority
,
105 !radeon_cs_memory_below_limit(sctx
->screen
, sctx
->b
.gfx
.cs
,
106 sctx
->b
.vram
+ rbo
->vram_usage
,
107 sctx
->b
.gtt
+ rbo
->gart_usage
))
108 si_flush_gfx_cs(&sctx
->b
, PIPE_FLUSH_ASYNC
, NULL
);
110 radeon_add_to_buffer_list(&sctx
->b
, &sctx
->b
.gfx
, rbo
, usage
, priority
);
113 static inline void radeon_set_config_reg_seq(struct radeon_winsys_cs
*cs
, unsigned reg
, unsigned num
)
115 assert(reg
< SI_CONTEXT_REG_OFFSET
);
116 assert(cs
->current
.cdw
+ 2 + num
<= cs
->current
.max_dw
);
117 radeon_emit(cs
, PKT3(PKT3_SET_CONFIG_REG
, num
, 0));
118 radeon_emit(cs
, (reg
- SI_CONFIG_REG_OFFSET
) >> 2);
121 static inline void radeon_set_config_reg(struct radeon_winsys_cs
*cs
, unsigned reg
, unsigned value
)
123 radeon_set_config_reg_seq(cs
, reg
, 1);
124 radeon_emit(cs
, value
);
127 static inline void radeon_set_context_reg_seq(struct radeon_winsys_cs
*cs
, unsigned reg
, unsigned num
)
129 assert(reg
>= SI_CONTEXT_REG_OFFSET
);
130 assert(cs
->current
.cdw
+ 2 + num
<= cs
->current
.max_dw
);
131 radeon_emit(cs
, PKT3(PKT3_SET_CONTEXT_REG
, num
, 0));
132 radeon_emit(cs
, (reg
- SI_CONTEXT_REG_OFFSET
) >> 2);
135 static inline void radeon_set_context_reg(struct radeon_winsys_cs
*cs
, unsigned reg
, unsigned value
)
137 radeon_set_context_reg_seq(cs
, reg
, 1);
138 radeon_emit(cs
, value
);
141 static inline void radeon_set_context_reg_idx(struct radeon_winsys_cs
*cs
,
142 unsigned reg
, unsigned idx
,
145 assert(reg
>= SI_CONTEXT_REG_OFFSET
);
146 assert(cs
->current
.cdw
+ 3 <= cs
->current
.max_dw
);
147 radeon_emit(cs
, PKT3(PKT3_SET_CONTEXT_REG
, 1, 0));
148 radeon_emit(cs
, (reg
- SI_CONTEXT_REG_OFFSET
) >> 2 | (idx
<< 28));
149 radeon_emit(cs
, value
);
152 static inline void radeon_set_sh_reg_seq(struct radeon_winsys_cs
*cs
, unsigned reg
, unsigned num
)
154 assert(reg
>= SI_SH_REG_OFFSET
&& reg
< SI_SH_REG_END
);
155 assert(cs
->current
.cdw
+ 2 + num
<= cs
->current
.max_dw
);
156 radeon_emit(cs
, PKT3(PKT3_SET_SH_REG
, num
, 0));
157 radeon_emit(cs
, (reg
- SI_SH_REG_OFFSET
) >> 2);
160 static inline void radeon_set_sh_reg(struct radeon_winsys_cs
*cs
, unsigned reg
, unsigned value
)
162 radeon_set_sh_reg_seq(cs
, reg
, 1);
163 radeon_emit(cs
, value
);
166 static inline void radeon_set_uconfig_reg_seq(struct radeon_winsys_cs
*cs
, unsigned reg
, unsigned num
)
168 assert(reg
>= CIK_UCONFIG_REG_OFFSET
&& reg
< CIK_UCONFIG_REG_END
);
169 assert(cs
->current
.cdw
+ 2 + num
<= cs
->current
.max_dw
);
170 radeon_emit(cs
, PKT3(PKT3_SET_UCONFIG_REG
, num
, 0));
171 radeon_emit(cs
, (reg
- CIK_UCONFIG_REG_OFFSET
) >> 2);
174 static inline void radeon_set_uconfig_reg(struct radeon_winsys_cs
*cs
, unsigned reg
, unsigned value
)
176 radeon_set_uconfig_reg_seq(cs
, reg
, 1);
177 radeon_emit(cs
, value
);
180 static inline void radeon_set_uconfig_reg_idx(struct radeon_winsys_cs
*cs
,
181 unsigned reg
, unsigned idx
,
184 assert(reg
>= CIK_UCONFIG_REG_OFFSET
&& reg
< CIK_UCONFIG_REG_END
);
185 assert(cs
->current
.cdw
+ 3 <= cs
->current
.max_dw
);
186 radeon_emit(cs
, PKT3(PKT3_SET_UCONFIG_REG
, 1, 0));
187 radeon_emit(cs
, (reg
- CIK_UCONFIG_REG_OFFSET
) >> 2 | (idx
<< 28));
188 radeon_emit(cs
, value
);