/*
 * Copyright 2013 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * on the rights to use, copy, modify, merge, publish, distribute, sub
 * license, and/or sell copies of the Software, and to permit persons to whom
 * the Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 */
/* This file contains helpers for writing commands to command streams. */
#include <stdbool.h>

#include "r600_pipe_common.h"
#include "amd/common/sid.h"
35 * Return true if there is enough memory in VRAM and GTT for the buffers
38 * \param vram VRAM memory size not added to the buffer list yet
39 * \param gtt GTT memory size not added to the buffer list yet
42 radeon_cs_memory_below_limit(struct r600_common_screen
*screen
,
43 struct radeon_winsys_cs
*cs
,
44 uint64_t vram
, uint64_t gtt
)
46 vram
+= cs
->used_vram
;
49 /* Anything that goes above the VRAM size should go to GTT. */
50 if (vram
> screen
->info
.vram_size
)
51 gtt
+= vram
- screen
->info
.vram_size
;
53 /* Now we just need to check if we have enough GTT. */
54 return gtt
< screen
->info
.gart_size
* 0.7;
58 * Add a buffer to the buffer list for the given command stream (CS).
60 * All buffers used by a CS must be added to the list. This tells the kernel
61 * driver which buffers are used by GPU commands. Other buffers can
62 * be swapped out (not accessible) during execution.
64 * The buffer list becomes empty after every context flush and must be
67 static inline unsigned radeon_add_to_buffer_list(struct r600_common_context
*rctx
,
68 struct r600_ring
*ring
,
69 struct r600_resource
*rbo
,
70 enum radeon_bo_usage usage
,
71 enum radeon_bo_priority priority
)
74 return rctx
->ws
->cs_add_buffer(
76 (enum radeon_bo_usage
)(usage
| RADEON_USAGE_SYNCHRONIZED
),
77 rbo
->domains
, priority
) * 4;
81 * Same as above, but also checks memory usage and flushes the context
84 * When this SHOULD NOT be used:
86 * - if r600_context_add_resource_size has been called for the buffer
87 * followed by *_need_cs_space for checking the memory usage
89 * - if r600_need_dma_space has been called for the buffer
91 * - when emitting state packets and draw packets (because preceding packets
92 * can't be re-emitted at that point)
94 * - if shader resource "enabled_mask" is not up-to-date or there is
95 * a different constraint disallowing a context flush
97 static inline unsigned
98 radeon_add_to_buffer_list_check_mem(struct r600_common_context
*rctx
,
99 struct r600_ring
*ring
,
100 struct r600_resource
*rbo
,
101 enum radeon_bo_usage usage
,
102 enum radeon_bo_priority priority
,
106 !radeon_cs_memory_below_limit(rctx
->screen
, ring
->cs
,
107 rctx
->vram
+ rbo
->vram_usage
,
108 rctx
->gtt
+ rbo
->gart_usage
))
109 ring
->flush(rctx
, RADEON_FLUSH_ASYNC
, NULL
);
111 return radeon_add_to_buffer_list(rctx
, ring
, rbo
, usage
, priority
);
114 static inline void radeon_set_config_reg_seq(struct radeon_winsys_cs
*cs
, unsigned reg
, unsigned num
)
116 assert(reg
< SI_CONTEXT_REG_OFFSET
);
117 assert(cs
->current
.cdw
+ 2 + num
<= cs
->current
.max_dw
);
118 radeon_emit(cs
, PKT3(PKT3_SET_CONFIG_REG
, num
, 0));
119 radeon_emit(cs
, (reg
- SI_CONFIG_REG_OFFSET
) >> 2);
/**
 * Write a single config register.
 *
 * \param cs     command stream to write to
 * \param reg    byte address of the register
 * \param value  dword written to the register
 */
static inline void radeon_set_config_reg(struct radeon_winsys_cs *cs, unsigned reg, unsigned value)
{
	/* One-register sequence followed by its single payload dword. */
	radeon_set_config_reg_seq(cs, reg, 1);
	radeon_emit(cs, value);
}
128 static inline void radeon_set_context_reg_seq(struct radeon_winsys_cs
*cs
, unsigned reg
, unsigned num
)
130 assert(reg
>= SI_CONTEXT_REG_OFFSET
);
131 assert(cs
->current
.cdw
+ 2 + num
<= cs
->current
.max_dw
);
132 radeon_emit(cs
, PKT3(PKT3_SET_CONTEXT_REG
, num
, 0));
133 radeon_emit(cs
, (reg
- SI_CONTEXT_REG_OFFSET
) >> 2);
/**
 * Write a single context register.
 *
 * \param cs     command stream to write to
 * \param reg    byte address of the register
 * \param value  dword written to the register
 */
static inline void radeon_set_context_reg(struct radeon_winsys_cs *cs, unsigned reg, unsigned value)
{
	/* One-register sequence followed by its single payload dword. */
	radeon_set_context_reg_seq(cs, reg, 1);
	radeon_emit(cs, value);
}
142 static inline void radeon_set_context_reg_idx(struct radeon_winsys_cs
*cs
,
143 unsigned reg
, unsigned idx
,
146 assert(reg
>= SI_CONTEXT_REG_OFFSET
);
147 assert(cs
->current
.cdw
+ 3 <= cs
->current
.max_dw
);
148 radeon_emit(cs
, PKT3(PKT3_SET_CONTEXT_REG
, 1, 0));
149 radeon_emit(cs
, (reg
- SI_CONTEXT_REG_OFFSET
) >> 2 | (idx
<< 28));
150 radeon_emit(cs
, value
);
153 static inline void radeon_set_sh_reg_seq(struct radeon_winsys_cs
*cs
, unsigned reg
, unsigned num
)
155 assert(reg
>= SI_SH_REG_OFFSET
&& reg
< SI_SH_REG_END
);
156 assert(cs
->current
.cdw
+ 2 + num
<= cs
->current
.max_dw
);
157 radeon_emit(cs
, PKT3(PKT3_SET_SH_REG
, num
, 0));
158 radeon_emit(cs
, (reg
- SI_SH_REG_OFFSET
) >> 2);
/**
 * Write a single SH register.
 *
 * \param cs     command stream to write to
 * \param reg    byte address of the register
 * \param value  dword written to the register
 */
static inline void radeon_set_sh_reg(struct radeon_winsys_cs *cs, unsigned reg, unsigned value)
{
	/* One-register sequence followed by its single payload dword. */
	radeon_set_sh_reg_seq(cs, reg, 1);
	radeon_emit(cs, value);
}
167 static inline void radeon_set_uconfig_reg_seq(struct radeon_winsys_cs
*cs
, unsigned reg
, unsigned num
)
169 assert(reg
>= CIK_UCONFIG_REG_OFFSET
&& reg
< CIK_UCONFIG_REG_END
);
170 assert(cs
->current
.cdw
+ 2 + num
<= cs
->current
.max_dw
);
171 radeon_emit(cs
, PKT3(PKT3_SET_UCONFIG_REG
, num
, 0));
172 radeon_emit(cs
, (reg
- CIK_UCONFIG_REG_OFFSET
) >> 2);
/**
 * Write a single uconfig register.
 *
 * \param cs     command stream to write to
 * \param reg    byte address of the register
 * \param value  dword written to the register
 */
static inline void radeon_set_uconfig_reg(struct radeon_winsys_cs *cs, unsigned reg, unsigned value)
{
	/* One-register sequence followed by its single payload dword. */
	radeon_set_uconfig_reg_seq(cs, reg, 1);
	radeon_emit(cs, value);
}
181 static inline void radeon_set_uconfig_reg_idx(struct radeon_winsys_cs
*cs
,
182 unsigned reg
, unsigned idx
,
185 assert(reg
>= CIK_UCONFIG_REG_OFFSET
&& reg
< CIK_UCONFIG_REG_END
);
186 assert(cs
->current
.cdw
+ 3 <= cs
->current
.max_dw
);
187 radeon_emit(cs
, PKT3(PKT3_SET_UCONFIG_REG
, 1, 0));
188 radeon_emit(cs
, (reg
- CIK_UCONFIG_REG_OFFSET
) >> 2 | (idx
<< 28));
189 radeon_emit(cs
, value
);