2 * Copyright © 2014 Broadcom
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
24 #ifdef USE_VC4_SIMULATOR
26 #include "util/u_memory.h"
28 #include "vc4_screen.h"
29 #include "vc4_context.h"
30 #include "kernel/vc4_drv.h"
31 #include "vc4_simulator_validate.h"
32 #include "simpenrose/simpenrose.h"
34 #define OVERFLOW_SIZE (32 * 1024 * 1024)
/*
 * Wrap a vc4_bo in a newly allocated drm_gem_cma_object and assign it an
 * address range inside the simulator's memory block.
 *
 * The object's size is bo->size rounded up to 4096 bytes.  Its vaddr is
 * screen->simulator_mem_base plus the device's current simulator_mem_next
 * offset, and its paddr is whatever simpenrose_hw_addr() reports for that
 * vaddr.  dev->simulator_mem_next is then advanced past the new object.
 *
 * NOTE(review): this listing skips original lines 38, 43-44 and 52-55, so
 * the braces, any statement on 43-44 and the return statement are not
 * visible here.  No NULL check on the CALLOC_STRUCT() result is visible
 * either -- confirm against the full file.
 */
36 static struct drm_gem_cma_object
*
37 vc4_wrap_bo_with_cma(struct drm_device
*dev
, struct vc4_bo
*bo
)
39 struct vc4_context
*vc4
= dev
->vc4
;
40 struct vc4_screen
*screen
= vc4
->screen
;
41 struct drm_gem_cma_object
*obj
= CALLOC_STRUCT(drm_gem_cma_object
);
42 uint32_t size
= align(bo
->size
, 4096);
45 obj
->base
.size
= size
;
/* The object lives at the current allocation offset within the
 * screen's simulator memory.
 */
46 obj
->vaddr
= screen
->simulator_mem_base
+ dev
->simulator_mem_next
;
47 obj
->paddr
= simpenrose_hw_addr(obj
->vaddr
);
/* Move the allocation offset past this object and round it up to a
 * 4096-byte boundary for the next one.
 */
49 dev
->simulator_mem_next
+= size
;
50 dev
->simulator_mem_next
= align(dev
->simulator_mem_next
, 4096);
/* Range check against the simulator memory size.  It runs after
 * vaddr/paddr were already computed, and only in builds where assert()
 * is enabled.
 */
51 assert(dev
->simulator_mem_next
<= screen
->simulator_mem_size
);
56 struct drm_gem_cma_object
*
57 drm_gem_cma_create(struct drm_device
*dev
, size_t size
)
59 struct vc4_context
*vc4
= dev
->vc4
;
60 struct vc4_screen
*screen
= vc4
->screen
;
62 struct vc4_bo
*bo
= vc4_bo_alloc(screen
, size
, "simulator validate");
63 return vc4_wrap_bo_with_cma(dev
, bo
);
/*
 * Give every BO referenced by a submit an address in simulator memory and
 * copy its current contents there.
 *
 * exec->bo_count is taken from exec->args->bo_handle_count, and exec->bo
 * is allocated with calloc() as an array of that many vc4_bo_exec_state
 * entries.  For each index, the BO pointer is read from
 * vc4->bo_pointers.base, wrapped with vc4_wrap_bo_with_cma(), and bo->size
 * bytes are copied from bo->map to the wrapper's vaddr.
 *
 * NOTE(review): this listing skips original lines 66, 68, 72, 78-79,
 * 81-83 and 85-90.  The return type, the end of the loop body and the
 * return statement are therefore not visible; in particular the store of
 * `obj` into exec->bo[i] (which vc4_simulator_unpin_bos() reads back) is
 * presumably on one of the skipped lines -- confirm against the full file.
 * No NULL check on the calloc() result is visible.
 */
67 vc4_simulator_pin_bos(struct drm_device
*dev
, struct exec_info
*exec
)
69 struct drm_vc4_submit_cl
*args
= exec
->args
;
70 struct vc4_context
*vc4
= dev
->vc4
;
/* Assumes bo_pointers.base holds at least bo_handle_count entries --
 * TODO confirm against the code that fills it.
 */
71 struct vc4_bo
**bos
= vc4
->bo_pointers
.base
;
73 exec
->bo_count
= args
->bo_handle_count
;
74 exec
->bo
= calloc(exec
->bo_count
, sizeof(struct vc4_bo_exec_state
));
75 for (int i
= 0; i
< exec
->bo_count
; i
++) {
76 struct vc4_bo
*bo
= bos
[i
];
77 struct drm_gem_cma_object
*obj
= vc4_wrap_bo_with_cma(dev
, bo
);
/* Debug trace of the handle index and BO name.  The lines around it
 * (78-79, 81-83) are not visible here, so whether it is conditionally
 * compiled cannot be told from this listing.
 */
80 fprintf(stderr
, "bo hindex %d: %s\n", i
, bo
->name
);
/* Upload the BO's contents into its simulator-memory copy. */
84 memcpy(obj
->vaddr
, bo
->map
, bo
->size
);
/*
 * Copy the contents of every pinned BO back out of simulator memory.
 *
 * For each of the exec->bo_count entries, the drm_gem_cma_object is read
 * from exec->bo[i].bo, its vc4_bo from obj->bo, and bo->size bytes are
 * copied from the object's vaddr back to bo->map.
 *
 * NOTE(review): this listing skips original lines 91, 93, 97 and 99-107,
 * so the return type, the rest of the loop body, any freeing of the
 * wrapper objects or of exec->bo, and the return statement are not
 * visible here.  vc4_simulator_flush() assigns this function's result to
 * `ret`.
 */
92 vc4_simulator_unpin_bos(struct exec_info
*exec
)
94 for (int i
= 0; i
< exec
->bo_count
; i
++) {
95 struct drm_gem_cma_object
*obj
= exec
->bo
[i
].bo
;
96 struct vc4_bo
*bo
= obj
->bo
;
/* Download: simulator memory -> the BO's own mapping. */
98 memcpy(bo
->map
, obj
->vaddr
, bo
->size
);
/*
 * Run one submit through the simulator.
 *
 * Visible sequence:
 *  1. If the first color buffer's BO has a simulator_winsys_map, copy it
 *     row by row into bo->map, stepping the source by the winsys stride
 *     and the destination by the stride of slice 0.
 *  2. Pin the BOs (vc4_simulator_pin_bos), validate the command lists
 *     (vc4_cl_validate), then run simpenrose binning on ct0ca..ct0ea and
 *     rendering on ct1ca..ct1ea.
 *  3. Unpin the BOs (vc4_simulator_unpin_bos) and copy the color buffer
 *     rows back from bo->map to the winsys map.
 *
 * NOTE(review): this listing skips many original lines (108, 110, 118,
 * 120, 122-123, 125, 127, 130-134, 138-143, 145-147, 149-151, 154,
 * 156-160, 165-171).  The return type, the declaration of `ret`, the rest
 * of the local_dev initializer, the remaining fprintf() arguments, the
 * length argument of both memcpy() calls, any error handling after each
 * `ret = ...` and the return statement are not visible here.  `args` is
 * not referenced on any visible line.
 */
109 vc4_simulator_flush(struct vc4_context
*vc4
, struct drm_vc4_submit_cl
*args
)
111 struct vc4_surface
*csurf
= vc4_surface(vc4
->framebuffer
.cbufs
[0]);
112 struct vc4_resource
*ctex
= csurf
? vc4_resource(csurf
->base
.texture
) : NULL
;
113 uint32_t winsys_stride
= ctex
? ctex
->bo
->simulator_winsys_stride
: 0;
114 uint32_t sim_stride
= ctex
? ctex
->slices
[0].stride
: 0;
/* Smaller of the two strides; presumably the per-row copy length used
 * by the memcpy() calls below, whose length argument is not visible in
 * this listing -- confirm.
 */
115 uint32_t row_len
= MIN2(sim_stride
, winsys_stride
);
116 struct exec_info exec
;
/* Per-flush device state.  BO placement starts at offset OVERFLOW_SIZE,
 * presumably so BOs land above the low memory that vc4_simulator_init()
 * supplies to simpenrose as overflow memory.
 */
117 struct drm_device local_dev
= {
119 .simulator_mem_next
= OVERFLOW_SIZE
,
121 struct drm_device
*dev
= &local_dev
;
124 memset(&exec
, 0, sizeof(exec
));
/* Upload the window-system copy of the color buffer, if there is one. */
126 if (ctex
&& ctex
->bo
->simulator_winsys_map
) {
128 fprintf(stderr
, "%dx%d %d %d %d\n",
129 ctex
->base
.b
.width0
, ctex
->base
.b
.height0
,
135 for (int y
= 0; y
< ctex
->base
.b
.height0
; y
++) {
136 memcpy(ctex
->bo
->map
+ y
* sim_stride
,
137 ctex
->bo
->simulator_winsys_map
+ y
* winsys_stride
,
144 ret
= vc4_simulator_pin_bos(dev
, &exec
);
148 ret
= vc4_cl_validate(dev
, &exec
);
/* Execute the two control lists: binning first, then rendering. */
152 simpenrose_do_binning(exec
.ct0ca
, exec
.ct0ea
);
153 simpenrose_do_rendering(exec
.ct1ca
, exec
.ct1ea
);
155 ret
= vc4_simulator_unpin_bos(&exec
);
/* Download the rendered color buffer back into the window-system copy. */
161 if (ctex
&& ctex
->bo
->simulator_winsys_map
) {
162 for (int y
= 0; y
< ctex
->base
.b
.height0
; y
++) {
163 memcpy(ctex
->bo
->simulator_winsys_map
+ y
* winsys_stride
,
164 ctex
->bo
->map
+ y
* sim_stride
,
173 vc4_simulator_init(struct vc4_screen
*screen
)
175 screen
->simulator_mem_size
= 256 * 1024 * 1024;
176 screen
->simulator_mem_base
= malloc(screen
->simulator_mem_size
);
178 /* We supply our own memory so that we can have more aperture
179 * available (256MB instead of simpenrose's default 64MB).
181 simpenrose_init_hardware_supply_mem(screen
->simulator_mem_base
,
182 screen
->simulator_mem_size
);
184 /* Carve out low memory for tile allocation overflow. The kernel
185 * should be automatically handling overflow memory setup on real
186 * hardware, but for simulation we just get one shot to set up enough
187 * overflow memory before execution. This overflow mem will be used
188 * up over the whole lifetime of simpenrose (not reused on each
189 * flush), so it had better be big.
191 simpenrose_supply_overflow_mem(0, OVERFLOW_SIZE
);
194 #endif /* USE_VC4_SIMULATOR */