/**********************************************************
 * Copyright 2008-2009 VMware, Inc.  All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person
 * obtaining a copy of this software and associated documentation
 * files (the "Software"), to deal in the Software without
 * restriction, including without limitation the rights to use, copy,
 * modify, merge, publish, distribute, sublicense, and/or sell copies
 * of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be
 * included in all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 **********************************************************/

26 #include "util/u_math.h"
27 #include "util/u_memory.h"
28 #include "util/crc32.h"
30 #include "svga_debug.h"
31 #include "svga_format.h"
32 #include "svga_winsys.h"
33 #include "svga_screen.h"
34 #include "svga_screen_cache.h"
35 #include "svga_context.h"
38 #define SVGA_SURFACE_CACHE_ENABLED 1
42 * Return the size of the surface described by the key (in bytes).
45 surface_size(const struct svga_host_surface_cache_key
*key
)
47 unsigned bw
, bh
, bpb
, total_size
, i
;
49 assert(key
->numMipLevels
> 0);
50 assert(key
->numFaces
> 0);
51 assert(key
->arraySize
> 0);
53 if (key
->format
== SVGA3D_BUFFER
) {
54 /* Special case: we don't want to count vertex/index buffers
55 * against the cache size limit, so view them as zero-sized.
60 svga_format_size(key
->format
, &bw
, &bh
, &bpb
);
64 for (i
= 0; i
< key
->numMipLevels
; i
++) {
65 unsigned w
= u_minify(key
->size
.width
, i
);
66 unsigned h
= u_minify(key
->size
.height
, i
);
67 unsigned d
= u_minify(key
->size
.depth
, i
);
68 unsigned img_size
= ((w
+ bw
- 1) / bw
) * ((h
+ bh
- 1) / bh
) * d
* bpb
;
69 total_size
+= img_size
;
72 total_size
*= key
->numFaces
* key
->arraySize
* MAX2(1, key
->sampleCount
);
79 * Compute the bucket for this key.
81 static inline unsigned
82 svga_screen_cache_bucket(const struct svga_host_surface_cache_key
*key
)
84 return util_hash_crc32(key
, sizeof *key
) % SVGA_HOST_SURFACE_CACHE_BUCKETS
;
89 * Search the cache for a surface that matches the key. If a match is
90 * found, remove it from the cache and return the surface pointer.
91 * Return NULL otherwise.
93 static struct svga_winsys_surface
*
94 svga_screen_cache_lookup(struct svga_screen
*svgascreen
,
95 const struct svga_host_surface_cache_key
*key
)
97 struct svga_host_surface_cache
*cache
= &svgascreen
->cache
;
98 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
99 struct svga_host_surface_cache_entry
*entry
;
100 struct svga_winsys_surface
*handle
= NULL
;
101 struct list_head
*curr
, *next
;
105 assert(key
->cachable
);
107 bucket
= svga_screen_cache_bucket(key
);
109 mtx_lock(&cache
->mutex
);
111 curr
= cache
->bucket
[bucket
].next
;
113 while (curr
!= &cache
->bucket
[bucket
]) {
116 entry
= LIST_ENTRY(struct svga_host_surface_cache_entry
, curr
, bucket_head
);
118 assert(entry
->handle
);
120 /* If the key matches and the fence is signalled (the surface is no
121 * longer needed) the lookup was successful. We found a surface that
123 * We unlink the surface from the cache entry and we add the entry to
126 if (memcmp(&entry
->key
, key
, sizeof *key
) == 0 &&
127 sws
->fence_signalled(sws
, entry
->fence
, 0) == 0) {
130 assert(sws
->surface_is_flushed(sws
, entry
->handle
));
132 handle
= entry
->handle
; /* Reference is transfered here. */
133 entry
->handle
= NULL
;
135 /* Remove from hash table */
136 LIST_DEL(&entry
->bucket_head
);
138 /* remove from LRU list */
139 LIST_DEL(&entry
->head
);
141 /* Add the cache entry (but not the surface!) to the empty list */
142 LIST_ADD(&entry
->head
, &cache
->empty
);
144 /* update the cache size */
145 surf_size
= surface_size(&entry
->key
);
146 assert(surf_size
<= cache
->total_size
);
147 if (surf_size
> cache
->total_size
)
148 cache
->total_size
= 0; /* should never happen, but be safe */
150 cache
->total_size
-= surf_size
;
159 mtx_unlock(&cache
->mutex
);
161 if (SVGA_DEBUG
& DEBUG_DMA
)
162 debug_printf("%s: cache %s after %u tries (bucket %d)\n", __FUNCTION__
,
163 handle
? "hit" : "miss", tries
, bucket
);
170 * Free the least recently used entries in the surface cache until the
171 * cache size is <= the target size OR there are no unused entries left
172 * to discard. We don't do any flushing to try to free up additional
176 svga_screen_cache_shrink(struct svga_screen
*svgascreen
,
177 unsigned target_size
)
179 struct svga_host_surface_cache
*cache
= &svgascreen
->cache
;
180 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
181 struct svga_host_surface_cache_entry
*entry
= NULL
, *next_entry
;
183 /* Walk over the list of unused buffers in reverse order: from oldest
186 LIST_FOR_EACH_ENTRY_SAFE_REV(entry
, next_entry
, &cache
->unused
, head
) {
187 if (entry
->key
.format
!= SVGA3D_BUFFER
) {
188 /* we don't want to discard vertex/index buffers */
190 cache
->total_size
-= surface_size(&entry
->key
);
192 assert(entry
->handle
);
193 sws
->surface_reference(sws
, &entry
->handle
, NULL
);
195 LIST_DEL(&entry
->bucket_head
);
196 LIST_DEL(&entry
->head
);
197 LIST_ADD(&entry
->head
, &cache
->empty
);
199 if (cache
->total_size
<= target_size
) {
209 * Add a surface to the cache. This is done when the driver deletes
210 * the surface. Note: transfers a handle reference.
213 svga_screen_cache_add(struct svga_screen
*svgascreen
,
214 const struct svga_host_surface_cache_key
*key
,
215 struct svga_winsys_surface
**p_handle
)
217 struct svga_host_surface_cache
*cache
= &svgascreen
->cache
;
218 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
219 struct svga_host_surface_cache_entry
*entry
= NULL
;
220 struct svga_winsys_surface
*handle
= *p_handle
;
223 assert(key
->cachable
);
228 surf_size
= surface_size(key
);
231 mtx_lock(&cache
->mutex
);
233 if (surf_size
>= SVGA_HOST_SURFACE_CACHE_BYTES
) {
234 /* this surface is too large to cache, just free it */
235 sws
->surface_reference(sws
, &handle
, NULL
);
236 mtx_unlock(&cache
->mutex
);
240 if (cache
->total_size
+ surf_size
> SVGA_HOST_SURFACE_CACHE_BYTES
) {
241 /* Adding this surface would exceed the cache size.
242 * Try to discard least recently used entries until we hit the
243 * new target cache size.
245 unsigned target_size
= SVGA_HOST_SURFACE_CACHE_BYTES
- surf_size
;
247 svga_screen_cache_shrink(svgascreen
, target_size
);
249 if (cache
->total_size
> target_size
) {
250 /* we weren't able to shrink the cache as much as we wanted so
251 * just discard this surface.
253 sws
->surface_reference(sws
, &handle
, NULL
);
254 mtx_unlock(&cache
->mutex
);
259 if (!LIST_IS_EMPTY(&cache
->empty
)) {
260 /* An empty entry has no surface associated with it.
261 * Use the first empty entry.
263 entry
= LIST_ENTRY(struct svga_host_surface_cache_entry
,
264 cache
->empty
.next
, head
);
266 /* Remove from LRU list */
267 LIST_DEL(&entry
->head
);
269 else if (!LIST_IS_EMPTY(&cache
->unused
)) {
270 /* free the last used buffer and reuse its entry */
271 entry
= LIST_ENTRY(struct svga_host_surface_cache_entry
,
272 cache
->unused
.prev
, head
);
273 SVGA_DBG(DEBUG_CACHE
|DEBUG_DMA
,
274 "unref sid %p (make space)\n", entry
->handle
);
276 cache
->total_size
-= surface_size(&entry
->key
);
278 sws
->surface_reference(sws
, &entry
->handle
, NULL
);
280 /* Remove from hash table */
281 LIST_DEL(&entry
->bucket_head
);
283 /* Remove from LRU list */
284 LIST_DEL(&entry
->head
);
288 assert(entry
->handle
== NULL
);
289 entry
->handle
= handle
;
290 memcpy(&entry
->key
, key
, sizeof entry
->key
);
292 SVGA_DBG(DEBUG_CACHE
|DEBUG_DMA
,
293 "cache sid %p\n", entry
->handle
);
294 LIST_ADD(&entry
->head
, &cache
->validated
);
296 cache
->total_size
+= surf_size
;
299 /* Couldn't cache the buffer -- this really shouldn't happen */
300 SVGA_DBG(DEBUG_CACHE
|DEBUG_DMA
,
301 "unref sid %p (couldn't find space)\n", handle
);
302 sws
->surface_reference(sws
, &handle
, NULL
);
305 mtx_unlock(&cache
->mutex
);
310 * Called during the screen flush to move all buffers not in a validate list
311 * into the unused list.
314 svga_screen_cache_flush(struct svga_screen
*svgascreen
,
315 struct svga_context
*svga
,
316 struct pipe_fence_handle
*fence
)
318 struct svga_host_surface_cache
*cache
= &svgascreen
->cache
;
319 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
320 struct svga_host_surface_cache_entry
*entry
;
321 struct list_head
*curr
, *next
;
324 mtx_lock(&cache
->mutex
);
326 /* Loop over entries in the invalidated list */
327 curr
= cache
->invalidated
.next
;
329 while (curr
!= &cache
->invalidated
) {
330 entry
= LIST_ENTRY(struct svga_host_surface_cache_entry
, curr
, head
);
332 assert(entry
->handle
);
334 if (sws
->surface_is_flushed(sws
, entry
->handle
)) {
335 /* remove entry from the invalidated list */
336 LIST_DEL(&entry
->head
);
338 sws
->fence_reference(sws
, &entry
->fence
, fence
);
340 /* Add entry to the unused list */
341 LIST_ADD(&entry
->head
, &cache
->unused
);
343 /* Add entry to the hash table bucket */
344 bucket
= svga_screen_cache_bucket(&entry
->key
);
345 LIST_ADD(&entry
->bucket_head
, &cache
->bucket
[bucket
]);
352 curr
= cache
->validated
.next
;
354 while (curr
!= &cache
->validated
) {
355 entry
= LIST_ENTRY(struct svga_host_surface_cache_entry
, curr
, head
);
357 assert(entry
->handle
);
359 if (sws
->surface_is_flushed(sws
, entry
->handle
)) {
360 /* remove entry from the validated list */
361 LIST_DEL(&entry
->head
);
363 /* It is now safe to invalidate the surface content.
364 * It will be done using the current context.
366 if (svga
->swc
->surface_invalidate(svga
->swc
, entry
->handle
) != PIPE_OK
) {
367 MAYBE_UNUSED
enum pipe_error ret
;
369 /* Even though surface invalidation here is done after the command
370 * buffer is flushed, it is still possible that it will
371 * fail because there might be just enough of this command that is
372 * filling up the command buffer, so in this case we will call
373 * the winsys flush directly to flush the buffer.
374 * Note, we don't want to call svga_context_flush() here because
375 * this function itself is called inside svga_context_flush().
377 svga
->swc
->flush(svga
->swc
, NULL
);
378 ret
= svga
->swc
->surface_invalidate(svga
->swc
, entry
->handle
);
379 assert(ret
== PIPE_OK
);
382 /* add the entry to the invalidated list */
383 LIST_ADD(&entry
->head
, &cache
->invalidated
);
390 mtx_unlock(&cache
->mutex
);
395 * Free all the surfaces in the cache.
396 * Called when destroying the svga screen object.
399 svga_screen_cache_cleanup(struct svga_screen
*svgascreen
)
401 struct svga_host_surface_cache
*cache
= &svgascreen
->cache
;
402 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
405 for (i
= 0; i
< SVGA_HOST_SURFACE_CACHE_SIZE
; ++i
) {
406 if (cache
->entries
[i
].handle
) {
407 SVGA_DBG(DEBUG_CACHE
|DEBUG_DMA
,
408 "unref sid %p (shutdown)\n", cache
->entries
[i
].handle
);
409 sws
->surface_reference(sws
, &cache
->entries
[i
].handle
, NULL
);
411 cache
->total_size
-= surface_size(&cache
->entries
[i
].key
);
414 if (cache
->entries
[i
].fence
)
415 sws
->fence_reference(sws
, &cache
->entries
[i
].fence
, NULL
);
418 mtx_destroy(&cache
->mutex
);
423 svga_screen_cache_init(struct svga_screen
*svgascreen
)
425 struct svga_host_surface_cache
*cache
= &svgascreen
->cache
;
428 assert(cache
->total_size
== 0);
430 (void) mtx_init(&cache
->mutex
, mtx_plain
);
432 for (i
= 0; i
< SVGA_HOST_SURFACE_CACHE_BUCKETS
; ++i
)
433 LIST_INITHEAD(&cache
->bucket
[i
]);
435 LIST_INITHEAD(&cache
->unused
);
437 LIST_INITHEAD(&cache
->validated
);
439 LIST_INITHEAD(&cache
->invalidated
);
441 LIST_INITHEAD(&cache
->empty
);
442 for (i
= 0; i
< SVGA_HOST_SURFACE_CACHE_SIZE
; ++i
)
443 LIST_ADDTAIL(&cache
->entries
[i
].head
, &cache
->empty
);
450 * Allocate a new host-side surface. If the surface is marked as cachable,
451 * first try re-using a surface in the cache of freed surfaces. Otherwise,
452 * allocate a new surface.
453 * \param bind_flags bitmask of PIPE_BIND_x flags
454 * \param usage one of PIPE_USAGE_x values
455 * \param validated return True if the surface is a reused surface
457 struct svga_winsys_surface
*
458 svga_screen_surface_create(struct svga_screen
*svgascreen
,
459 unsigned bind_flags
, enum pipe_resource_usage usage
,
461 struct svga_host_surface_cache_key
*key
)
463 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
464 struct svga_winsys_surface
*handle
= NULL
;
465 boolean cachable
= SVGA_SURFACE_CACHE_ENABLED
&& key
->cachable
;
467 SVGA_DBG(DEBUG_CACHE
|DEBUG_DMA
,
468 "%s sz %dx%dx%d mips %d faces %d arraySize %d cachable %d\n",
479 /* Try to re-cycle a previously freed, cached surface */
480 if (key
->format
== SVGA3D_BUFFER
) {
481 SVGA3dSurfaceAllFlags hint_flag
;
483 /* For buffers, round the buffer size up to the nearest power
484 * of two to increase the probability of cache hits. Keep
485 * texture surface dimensions unchanged.
488 while (size
< key
->size
.width
)
490 key
->size
.width
= size
;
492 /* Determine whether the buffer is static or dynamic.
493 * This is a bit of a heuristic which can be tuned as needed.
495 if (usage
== PIPE_USAGE_DEFAULT
||
496 usage
== PIPE_USAGE_IMMUTABLE
) {
497 hint_flag
= SVGA3D_SURFACE_HINT_STATIC
;
499 else if (bind_flags
& PIPE_BIND_INDEX_BUFFER
) {
500 /* Index buffers don't change too often. Mark them as static.
502 hint_flag
= SVGA3D_SURFACE_HINT_STATIC
;
505 /* Since we're reusing buffers we're effectively transforming all
506 * of them into dynamic buffers.
508 * It would be nice to not cache long lived static buffers. But there
509 * is no way to detect the long lived from short lived ones yet. A
510 * good heuristic would be buffer size.
512 hint_flag
= SVGA3D_SURFACE_HINT_DYNAMIC
;
515 key
->flags
&= ~(SVGA3D_SURFACE_HINT_STATIC
|
516 SVGA3D_SURFACE_HINT_DYNAMIC
);
517 key
->flags
|= hint_flag
;
520 handle
= svga_screen_cache_lookup(svgascreen
, key
);
522 if (key
->format
== SVGA3D_BUFFER
)
523 SVGA_DBG(DEBUG_CACHE
|DEBUG_DMA
,
524 "reuse sid %p sz %d (buffer)\n", handle
,
527 SVGA_DBG(DEBUG_CACHE
|DEBUG_DMA
,
528 "reuse sid %p sz %dx%dx%d mips %d faces %d arraySize %d\n", handle
,
540 /* Unable to recycle surface, allocate a new one */
544 usage
|= SVGA_SURFACE_USAGE_SHARED
;
546 usage
|= SVGA_SURFACE_USAGE_SCANOUT
;
548 handle
= sws
->surface_create(sws
,
553 key
->numFaces
* key
->arraySize
,
557 SVGA_DBG(DEBUG_CACHE
|DEBUG_DMA
,
558 " CREATE sid %p sz %dx%dx%d\n",
572 * Release a surface. We don't actually free the surface- we put
573 * it into the cache of freed surfaces (if it's cachable).
576 svga_screen_surface_destroy(struct svga_screen
*svgascreen
,
577 const struct svga_host_surface_cache_key
*key
,
578 struct svga_winsys_surface
**p_handle
)
580 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
582 /* We only set the cachable flag for surfaces of which we are the
583 * exclusive owner. So just hold onto our existing reference in
586 if (SVGA_SURFACE_CACHE_ENABLED
&& key
->cachable
) {
587 svga_screen_cache_add(svgascreen
, key
, p_handle
);
591 "unref sid %p (uncachable)\n", *p_handle
);
592 sws
->surface_reference(sws
, p_handle
, NULL
);
598 * Print/dump the contents of the screen cache. For debugging.
601 svga_screen_cache_dump(const struct svga_screen
*svgascreen
)
603 const struct svga_host_surface_cache
*cache
= &svgascreen
->cache
;
607 debug_printf("svga3d surface cache:\n");
608 for (bucket
= 0; bucket
< SVGA_HOST_SURFACE_CACHE_BUCKETS
; bucket
++) {
609 struct list_head
*curr
;
610 curr
= cache
->bucket
[bucket
].next
;
611 while (curr
&& curr
!= &cache
->bucket
[bucket
]) {
612 struct svga_host_surface_cache_entry
*entry
=
613 LIST_ENTRY(struct svga_host_surface_cache_entry
,
615 if (entry
->key
.format
== SVGA3D_BUFFER
) {
616 debug_printf(" %p: buffer %u bytes\n",
618 entry
->key
.size
.width
);
621 debug_printf(" %p: %u x %u x %u format %u\n",
623 entry
->key
.size
.width
,
624 entry
->key
.size
.height
,
625 entry
->key
.size
.depth
,
633 debug_printf("%u surfaces, %u bytes\n", count
, cache
->total_size
);