2 #include "pipe/p_context.h"
3 #include "pipe/p_inlines.h"
4 #include "util/u_math.h"
6 #include "nv50_context.h"
/* Members of the transfer object that the rest of this file accesses
 * through `struct nv50_transfer *tx`. */
/* Generic transfer state; pipe_transfer pointers are cast to
 * struct nv50_transfer pointers elsewhere in this file. */
9 struct pipe_transfer base
;
/* Buffer object created with nouveau_bo_new() in nv50_transfer_new() and
 * mapped/unmapped by the transfer_map/transfer_unmap hooks. */
10 struct nouveau_bo
*bo
;
/* Offset of the selected image, taken from lvl->image_offset[]; a z-slice
 * offset is added for PIPE_TEXTURE_3D. */
11 unsigned level_offset
;
/* Copy of the miptree level's tile_mode. */
12 unsigned level_tiling
;
/*
 * Emit M2MF (memory-to-memory format) commands on the screen's m2mf
 * channel to transfer a rectangle from src_bo to dst_bo.
 *
 * Each side is programmed according to its buffer's tile_flags. When the
 * flags are zero, a pitch is emitted and the start offset is advanced by
 * (y * pitch + x * cpp). The other visible command sequence emits the
 * tile mode (shifted left by 4) and the width multiplied by cpp.
 *
 * src_reloc / dst_reloc are relocation flags supplied by the caller;
 * NOUVEAU_BO_RD and NOUVEAU_BO_WR are OR-ed into them here. cpp scales x
 * coordinates and widths (callers in this file pass block.size).
 *
 * NOTE(review): the embedded line numbers in this listing skip values, so
 * some statements (braces, else/loop keywords, some OUT_RING calls) are
 * not visible; the comments below describe only what is shown.
 */
22 nv50_transfer_rect_m2mf(struct pipe_screen
*pscreen
,
23 struct nouveau_bo
*src_bo
, unsigned src_offset
,
24 int src_pitch
, unsigned src_tile_mode
,
25 int sx
, int sy
, int sw
, int sh
, int sd
,
26 struct nouveau_bo
*dst_bo
, unsigned dst_offset
,
27 int dst_pitch
, unsigned dst_tile_mode
,
28 int dx
, int dy
, int dw
, int dh
, int dd
,
29 int cpp
, int width
, int height
,
30 unsigned src_reloc
, unsigned dst_reloc
)
32 struct nv50_screen
*screen
= nv50_screen(pscreen
);
33 struct nouveau_channel
*chan
= screen
->m2mf
->channel
;
34 struct nouveau_grobj
*m2mf
= screen
->m2mf
;
/* Mark the source relocation as read and the destination as written. */
36 src_reloc
|= NOUVEAU_BO_RD
;
37 dst_reloc
|= NOUVEAU_BO_WR
;
/* Source side: tile_flags == 0 selects the pitch-based setup. */
41 if (!src_bo
->tile_flags
) {
42 BEGIN_RING(chan
, m2mf
,
43 NV50_MEMORY_TO_MEMORY_FORMAT_LINEAR_IN
, 1);
45 BEGIN_RING(chan
, m2mf
,
46 NV50_MEMORY_TO_MEMORY_FORMAT_PITCH_IN
, 1);
47 OUT_RING (chan
, src_pitch
);
/* Fold the start position into the offset. */
48 src_offset
+= (sy
* src_pitch
) + (sx
* cpp
);
/* Source setup that emits the tile mode and sw * cpp (the keyword that
 * separates it from the pitch-based setup is not visible here). */
50 BEGIN_RING(chan
, m2mf
,
51 NV50_MEMORY_TO_MEMORY_FORMAT_LINEAR_IN
, 6);
53 OUT_RING (chan
, src_tile_mode
<< 4);
54 OUT_RING (chan
, sw
* cpp
);
/* Destination side: mirrors the source setup above. */
60 if (!dst_bo
->tile_flags
) {
61 BEGIN_RING(chan
, m2mf
,
62 NV50_MEMORY_TO_MEMORY_FORMAT_LINEAR_OUT
, 1);
64 BEGIN_RING(chan
, m2mf
,
65 NV50_MEMORY_TO_MEMORY_FORMAT_PITCH_OUT
, 1);
66 OUT_RING (chan
, dst_pitch
);
67 dst_offset
+= (dy
* dst_pitch
) + (dx
* cpp
);
69 BEGIN_RING(chan
, m2mf
,
70 NV50_MEMORY_TO_MEMORY_FORMAT_LINEAR_OUT
, 6);
72 OUT_RING (chan
, dst_tile_mode
<< 4);
73 OUT_RING (chan
, dw
* cpp
);
/* One submission handles at most 2047 lines. */
80 int line_count
= height
> 2047 ? 2047 : height
;
/* Address words: source first, destination second, emitted for the
 * OFFSET_IN_HIGH method and then for the OFFSET_IN method. */
83 BEGIN_RING(chan
, m2mf
,
84 NV50_MEMORY_TO_MEMORY_FORMAT_OFFSET_IN_HIGH
, 2);
85 OUT_RELOCh(chan
, src_bo
, src_offset
, src_reloc
);
86 OUT_RELOCh(chan
, dst_bo
, dst_offset
, dst_reloc
);
87 BEGIN_RING(chan
, m2mf
,
88 NV50_MEMORY_TO_MEMORY_FORMAT_OFFSET_IN
, 2);
89 OUT_RELOCl(chan
, src_bo
, src_offset
, src_reloc
);
90 OUT_RELOCl(chan
, dst_bo
, dst_offset
, dst_reloc
);
/* Source with tile_flags set: program the start position, with sy in the
 * upper 16 bits and sx * cpp in the lower bits. */
91 if (src_bo
->tile_flags
) {
92 BEGIN_RING(chan
, m2mf
,
93 NV50_MEMORY_TO_MEMORY_FORMAT_TILING_POSITION_IN
, 1);
94 OUT_RING (chan
, (sy
<< 16) | (sx
* cpp
));
/* Advance the source offset by the lines handled in this piece. */
96 src_offset
+= (line_count
* src_pitch
);
/* Same handling for the destination. */
98 if (dst_bo
->tile_flags
) {
99 BEGIN_RING(chan
, m2mf
,
100 NV50_MEMORY_TO_MEMORY_FORMAT_TILING_POSITION_OUT
, 1);
101 OUT_RING (chan
, (dy
<< 16) | (dx
* cpp
));
103 dst_offset
+= (line_count
* dst_pitch
);
/* Line length (width * cpp) and line count for this piece. */
105 BEGIN_RING(chan
, m2mf
,
106 NV50_MEMORY_TO_MEMORY_FORMAT_LINE_LENGTH_IN
, 4);
107 OUT_RING (chan
, width
* cpp
);
108 OUT_RING (chan
, line_count
);
/* NOTE(review): meaning of the raw value 0x00000101 is not visible here. */
109 OUT_RING (chan
, 0x00000101);
/* Lines still to be handled. */
113 height
-= line_count
;
/*
 * Compute the offset of depth slice z for a level with the given tile mode.
 *
 * tile_mode: passed to get_tile_height() / get_tile_depth().
 * z:         slice index.
 * pitch:     multiplied into the stride between groups of tile_d slices.
 * ny:        row count, aligned up to the tile height before use.
 *
 * Returns (z % tile_d) * pitch_2d + (z / tile_d) * pitch_3d.
 * The caller in this file adds the result to a level offset.
 */
119 static INLINE
unsigned
120 get_zslice_offset(unsigned tile_mode
, unsigned z
, unsigned pitch
, unsigned ny
)
122 unsigned tile_h
= get_tile_height(tile_mode
);
123 unsigned tile_d
= get_tile_depth(tile_mode
);
125 /* pitch_2d == to next slice within this volume-tile */
126 /* pitch_3d == to next slice in next 2D array of blocks */
/* NOTE(review): the constant 64 is presumably the tile width in bytes --
 * confirm against the tiling layout. */
127 unsigned pitch_2d
= tile_h
* 64;
128 unsigned pitch_3d
= tile_d
* align(ny
, tile_h
) * pitch
;
/* Slice position inside its volume-tile plus whole volume-tiles skipped. */
130 return (z
% tile_d
) * pitch_2d
+ (z
/ tile_d
) * pitch_3d
;
/*
 * get_tex_transfer hook: create a transfer object for one image of
 * texture pt at the given mip level.
 *
 * Visible steps:
 *  - allocate an nv50_transfer with CALLOC_STRUCT and take a reference
 *    on pt;
 *  - copy format and block description, and compute the block counts and
 *    stride for the level;
 *  - record the level's pitch, minified dimensions, image offset, tile
 *    mode and the start position converted to blocks;
 *  - create a buffer object (NOUVEAU_BO_GART | NOUVEAU_BO_MAP) of size
 *    nblocksy * stride;
 *  - for PIPE_TEXTURE_3D, add the z-slice offset to level_offset;
 *  - for PIPE_TRANSFER_READ usage, call nv50_transfer_rect_m2mf() with
 *    the miptree's buffer object as the source.
 *
 * NOTE(review): the embedded line numbers in this listing skip values, so
 * several statements (error handling, some assignments and call
 * arguments, the return) are not visible; comments cover only what is
 * shown.
 */
133 static struct pipe_transfer
*
134 nv50_transfer_new(struct pipe_screen
*pscreen
, struct pipe_texture
*pt
,
135 unsigned face
, unsigned level
, unsigned zslice
,
136 enum pipe_transfer_usage usage
,
137 unsigned x
, unsigned y
, unsigned w
, unsigned h
)
139 struct nouveau_device
*dev
= nouveau_screen(pscreen
)->device
;
140 struct nv50_miptree
*mt
= nv50_miptree(pt
);
141 struct nv50_miptree_level
*lvl
= &mt
->level
[level
];
142 struct nv50_transfer
*tx
;
/* image indexes lvl->image_offset[] below and starts at 0. */
143 unsigned nx
, ny
, image
= 0;
/* Cube maps are special-cased (the guarded statement is not visible). */
146 if (pt
->target
== PIPE_TEXTURE_CUBE
)
149 tx
= CALLOC_STRUCT(nv50_transfer
);
/* The transfer holds a reference on the texture; nv50_transfer_del()
 * drops it. */
153 pipe_texture_reference(&tx
->base
.texture
, pt
);
154 tx
->base
.format
= pt
->format
;
157 tx
->base
.block
= pt
->block
;
/* Block counts: derived from the minified width/height when
 * pt->nblocksx[level] is zero. */
158 if (!pt
->nblocksx
[level
]) {
159 tx
->base
.nblocksx
= pf_get_nblocksx(&pt
->block
,
160 u_minify(pt
->width0
, level
));
161 tx
->base
.nblocksy
= pf_get_nblocksy(&pt
->block
,
162 u_minify(pt
->height0
, level
));
/* Block counts taken directly from the texture (the keyword separating
 * this from the computation above is not visible here). */
164 tx
->base
.nblocksx
= pt
->nblocksx
[level
];
165 tx
->base
.nblocksy
= pt
->nblocksy
[level
];
/* The stride covers one full row of blocks. */
167 tx
->base
.stride
= tx
->base
.nblocksx
* pt
->block
.size
;
168 tx
->base
.usage
= usage
;
/* Snapshot of the miptree level's layout. */
170 tx
->level_pitch
= lvl
->pitch
;
171 tx
->level_width
= u_minify(mt
->base
.base
.width0
, level
);
172 tx
->level_height
= u_minify(mt
->base
.base
.height0
, level
);
173 tx
->level_depth
= u_minify(mt
->base
.base
.depth0
, level
);
174 tx
->level_offset
= lvl
->image_offset
[image
];
175 tx
->level_tiling
= lvl
->tile_mode
;
/* Start position converted from x/y to block units. */
176 tx
->level_x
= pf_get_nblocksx(&tx
->base
.block
, x
);
177 tx
->level_y
= pf_get_nblocksy(&tx
->base
.block
, y
);
/* Buffer object sized for the whole level (nblocksy rows of stride). */
178 ret
= nouveau_bo_new(dev
, NOUVEAU_BO_GART
| NOUVEAU_BO_MAP
, 0,
179 tx
->base
.nblocksy
* tx
->base
.stride
, &tx
->bo
);
/* 3D textures: add the offset of the requested z slice. */
185 if (pt
->target
== PIPE_TEXTURE_3D
)
186 tx
->level_offset
+= get_zslice_offset(lvl
->tile_mode
, zslice
,
/* Read transfers call the M2MF helper with the miptree bo as source. */
190 if (usage
& PIPE_TRANSFER_READ
) {
/* Requested size in blocks. */
191 nx
= pf_get_nblocksx(&tx
->base
.block
, tx
->base
.width
);
192 ny
= pf_get_nblocksy(&tx
->base
.block
, tx
->base
.height
);
194 nv50_transfer_rect_m2mf(pscreen
, mt
->base
.bo
, tx
->level_offset
,
195 tx
->level_pitch
, tx
->level_tiling
,
197 tx
->base
.nblocksx
, tx
->base
.nblocksy
,
200 tx
->base
.stride
, tx
->bo
->tile_mode
,
202 tx
->base
.nblocksx
, tx
->base
.nblocksy
, 1,
203 tx
->base
.block
.size
, nx
, ny
,
204 NOUVEAU_BO_VRAM
| NOUVEAU_BO_GART
,
/*
 * tex_transfer_destroy hook: finish and release a transfer.
 *
 * For PIPE_TRANSFER_WRITE usage, nv50_transfer_rect_m2mf() is called with
 * tx->bo (offset 0) as the source and the miptree's buffer object at
 * level_offset / level_x / level_y as the destination. Afterwards tx->bo
 * is cleared through nouveau_bo_ref(NULL, ...) and the texture reference
 * taken in nv50_transfer_new() is dropped.
 *
 * NOTE(review): some call arguments and the final cleanup of tx are not
 * visible in this listing (the embedded line numbers skip values).
 */
212 nv50_transfer_del(struct pipe_transfer
*ptx
)
214 struct nv50_transfer
*tx
= (struct nv50_transfer
*)ptx
;
215 struct nv50_miptree
*mt
= nv50_miptree(ptx
->texture
);
/* Transfer size in blocks. */
217 unsigned nx
= pf_get_nblocksx(&tx
->base
.block
, tx
->base
.width
);
218 unsigned ny
= pf_get_nblocksy(&tx
->base
.block
, tx
->base
.height
);
/* Write transfers call the M2MF helper towards the miptree. */
220 if (ptx
->usage
& PIPE_TRANSFER_WRITE
) {
221 struct pipe_screen
*pscreen
= ptx
->texture
->screen
;
223 nv50_transfer_rect_m2mf(pscreen
, tx
->bo
, 0,
224 tx
->base
.stride
, tx
->bo
->tile_mode
,
226 tx
->base
.nblocksx
, tx
->base
.nblocksy
, 1,
227 mt
->base
.bo
, tx
->level_offset
,
228 tx
->level_pitch
, tx
->level_tiling
,
229 tx
->level_x
, tx
->level_y
,
230 tx
->base
.nblocksx
, tx
->base
.nblocksy
,
232 tx
->base
.block
.size
, nx
, ny
,
233 NOUVEAU_BO_GART
, NOUVEAU_BO_VRAM
|
/* Clear tx->bo and drop the texture reference. */
237 nouveau_bo_ref(NULL
, &tx
->bo
);
238 pipe_texture_reference(&ptx
->texture
, NULL
);
/*
 * transfer_map hook: map the transfer's buffer object.
 *
 * The transfer usage bits are translated to NOUVEAU_BO_WR / NOUVEAU_BO_RD
 * and passed to nouveau_bo_map() on tx->bo.
 *
 * NOTE(review): the declarations of `flags` and `ret`, the handling of
 * `ret` and the return statement are not visible in this listing.
 */
243 nv50_transfer_map(struct pipe_screen
*pscreen
, struct pipe_transfer
*ptx
)
245 struct nv50_transfer
*tx
= (struct nv50_transfer
*)ptx
;
/* Request write and/or read access according to the transfer usage. */
249 if (ptx
->usage
& PIPE_TRANSFER_WRITE
)
250 flags
|= NOUVEAU_BO_WR
;
251 if (ptx
->usage
& PIPE_TRANSFER_READ
)
252 flags
|= NOUVEAU_BO_RD
;
254 ret
= nouveau_bo_map(tx
->bo
, flags
);
/*
 * transfer_unmap hook: unmap the transfer's buffer object with
 * nouveau_bo_unmap(). pscreen is not used in the visible code.
 */
261 nv50_transfer_unmap(struct pipe_screen
*pscreen
, struct pipe_transfer
*ptx
)
263 struct nv50_transfer
*tx
= (struct nv50_transfer
*)ptx
;
265 nouveau_bo_unmap(tx
->bo
);
/*
 * Install this file's transfer functions into the pipe_screen function
 * table: creation, destruction, map and unmap.
 */
269 nv50_transfer_init_screen_functions(struct pipe_screen
*pscreen
)
271 pscreen
->get_tex_transfer
= nv50_transfer_new
;
272 pscreen
->tex_transfer_destroy
= nv50_transfer_del
;
273 pscreen
->transfer_map
= nv50_transfer_map
;
274 pscreen
->transfer_unmap
= nv50_transfer_unmap
;
/*
 * Push data from the CPU pointer `src` to buffer object `bo` through the
 * 2D engine's SIFC methods, writing the data words directly into the
 * command stream.
 *
 * The destination surface is described by dst_format, dst_w, dst_h and
 * dst_offset; dst_pitch is emitted only when bo->tile_flags is zero,
 * otherwise bo->tile_mode is emitted. reloc holds the caller's relocation
 * flags, with NOUVEAU_BO_WR OR-ed in here.
 *
 * Data is emitted in pieces of at most 1792 dwords; line_dwords is the
 * number of dwords needed for w * cpp bytes, rounded up.
 *
 * NOTE(review): the embedded line numbers in this listing skip values, so
 * loop keywords, several OUT_RING calls and possibly the end of the
 * function are not visible; comments cover only what is shown.
 */
278 nv50_upload_sifc(struct nv50_context
*nv50
,
279 struct nouveau_bo
*bo
, unsigned dst_offset
, unsigned reloc
,
280 unsigned dst_format
, int dst_w
, int dst_h
, int dst_pitch
,
281 void *src
, unsigned src_format
, int src_pitch
,
282 int x
, int y
, int w
, int h
, int cpp
)
284 struct nouveau_channel
*chan
= nv50
->screen
->base
.channel
;
285 struct nouveau_grobj
*eng2d
= nv50
->screen
->eng2d
;
286 struct nouveau_grobj
*tesla
= nv50
->screen
->tesla
;
/* Dwords per line, rounding w * cpp up to a multiple of 4 bytes. */
287 unsigned line_dwords
= (w
* cpp
+ 3) / 4;
289 reloc
|= NOUVEAU_BO_WR
;
/* NOTE(review): presumably reserves 32 dwords of push buffer space --
 * confirm against the WAIT_RING definition. */
291 WAIT_RING (chan
, 32);
/* Destination format: with tile_flags set, the tile mode is emitted. */
293 if (bo
->tile_flags
) {
294 BEGIN_RING(chan
, eng2d
, NV50_2D_DST_FORMAT
, 5);
295 OUT_RING (chan
, dst_format
);
297 OUT_RING (chan
, bo
->tile_mode
<< 4);
/* Destination format followed by an explicit pitch (the keyword that
 * separates this from the setup above is not visible here). */
301 BEGIN_RING(chan
, eng2d
, NV50_2D_DST_FORMAT
, 2);
302 OUT_RING (chan
, dst_format
);
304 BEGIN_RING(chan
, eng2d
, NV50_2D_DST_PITCH
, 1);
305 OUT_RING (chan
, dst_pitch
);
/* Destination size and address. */
308 BEGIN_RING(chan
, eng2d
, NV50_2D_DST_WIDTH
, 4);
309 OUT_RING (chan
, dst_w
);
310 OUT_RING (chan
, dst_h
);
311 OUT_RELOCh(chan
, bo
, dst_offset
, reloc
);
312 OUT_RELOCl(chan
, bo
, dst_offset
, reloc
);
314 /* NV50_2D_OPERATION_SRCCOPY assumed already set */
316 BEGIN_RING(chan
, eng2d
, NV50_2D_SIFC_UNK0800
, 2);
318 OUT_RING (chan
, src_format
);
319 BEGIN_RING(chan
, eng2d
, NV50_2D_SIFC_WIDTH
, 10);
/* Per-line state: data pointer and dwords left to emit. */
332 const uint32_t *p
= src
;
333 unsigned count
= line_dwords
;
/* Emit at most 1792 dwords per SIFC_DATA packet. */
336 unsigned nr
= MIN2(count
, 1792);
/* Not enough push buffer space left for this piece: the destination
 * address is emitted again (the statement preceding it is not visible in
 * this listing). */
338 if (chan
->pushbuf
->remaining
<= nr
) {
341 BEGIN_RING(chan
, eng2d
,
342 NV50_2D_DST_ADDRESS_HIGH
, 2);
343 OUT_RELOCh(chan
, bo
, dst_offset
, reloc
);
344 OUT_RELOCl(chan
, bo
, dst_offset
, reloc
);
346 assert(chan
->pushbuf
->remaining
> nr
);
/* NOTE(review): (2 << 29) presumably selects a non-incrementing method
 * so all nr dwords go to SIFC_DATA -- confirm. */
348 BEGIN_RING(chan
, eng2d
,
349 NV50_2D_SIFC_DATA
| (2 << 29), nr
);
350 OUT_RINGp (chan
, p
, nr
);
/* NOTE(review): raw method 0x1440 on the tesla object; its meaning and
 * the value written are not visible here. */
359 BEGIN_RING(chan
, tesla
, 0x1440, 1);