Merge branch 'mesa_7_5_branch' into mesa_7_6_branch
[mesa.git] / src / gallium / drivers / cell / spu / spu_vertex_fetch.c
1 /**************************************************************************
2 *
3 * Copyright 2007 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * (C) Copyright IBM Corporation 2008
5 * All Rights Reserved.
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining a
8 * copy of this software and associated documentation files (the
9 * "Software"), to deal in the Software without restriction, including
10 * without limitation the rights to use, copy, modify, merge, publish,
11 * distribute, sub license, and/or sell copies of the Software, and to
12 * permit persons to whom the Software is furnished to do so, subject to
13 * the following conditions:
14 *
15 * The above copyright notice and this permission notice (including the
16 * next paragraph) shall be included in all copies or substantial portions
17 * of the Software.
18 *
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
20 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
21 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
22 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
23 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
24 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
25 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 *
27 **************************************************************************/
28
29 /*
30 * Authors:
31 * Keith Whitwell <keith@tungstengraphics.com>
32 * Ian Romanick <idr@us.ibm.com>
33 */
34
35 #include "pipe/p_state.h"
36 #include "pipe/p_shader_tokens.h"
37 #include "spu_exec.h"
38 #include "spu_vertex_shader.h"
39 #include "spu_main.h"
40 #include "spu_dcache.h"
41
42 typedef void (*spu_fetch_func)(qword *out, const qword *in,
43 const qword *shuffle_data);
44
45
46 static const qword fetch_shuffle_data[5] ALIGN16_ATTRIB = {
47 /* Shuffle used by CVT_64_FLOAT
48 */
49 {
50 0x00, 0x01, 0x02, 0x03, 0x10, 0x11, 0x12, 0x13,
51 0x80, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80,
52 },
53
54 /* Shuffle used by CVT_8_USCALED and CVT_8_SSCALED
55 */
56 {
57 0x00, 0x80, 0x80, 0x80, 0x01, 0x80, 0x80, 0x80,
58 0x02, 0x80, 0x80, 0x80, 0x03, 0x80, 0x80, 0x80,
59 },
60
61 /* Shuffle used by CVT_16_USCALED and CVT_16_SSCALED
62 */
63 {
64 0x00, 0x01, 0x80, 0x80, 0x02, 0x03, 0x80, 0x80,
65 0x04, 0x05, 0x80, 0x80, 0x06, 0x07, 0x80, 0x80,
66 },
67
68 /* High value shuffle used by trans4x4.
69 */
70 {
71 0x00, 0x01, 0x02, 0x03, 0x10, 0x11, 0x12, 0x13,
72 0x04, 0x05, 0x06, 0x07, 0x14, 0x15, 0x16, 0x17
73 },
74
75 /* Low value shuffle used by trans4x4.
76 */
77 {
78 0x08, 0x09, 0x0A, 0x0B, 0x18, 0x19, 0x1A, 0x1B,
79 0x0C, 0x0D, 0x0E, 0x0F, 0x1C, 0x1D, 0x1E, 0x1F
80 }
81 };
82
83
84 /**
85 * Fetch vertex attributes for 'count' vertices.
86 */
87 static void generic_vertex_fetch(struct spu_vs_context *draw,
88 struct spu_exec_machine *machine,
89 const unsigned *elts,
90 unsigned count)
91 {
92 unsigned nr_attrs = draw->vertex_fetch.nr_attrs;
93 unsigned attr;
94
95 ASSERT(count <= 4);
96
97 #if DRAW_DBG
98 printf("SPU: %s count = %u, nr_attrs = %u\n",
99 __FUNCTION__, count, nr_attrs);
100 #endif
101
102 /* loop over vertex attributes (vertex shader inputs)
103 */
104 for (attr = 0; attr < nr_attrs; attr++) {
105 const unsigned pitch = draw->vertex_fetch.pitch[attr];
106 const uint64_t src = draw->vertex_fetch.src_ptr[attr];
107 const spu_fetch_func fetch = (spu_fetch_func)
108 (draw->vertex_fetch.code + draw->vertex_fetch.code_offset[attr]);
109 unsigned i;
110 unsigned idx;
111 const unsigned bytes_per_entry = draw->vertex_fetch.size[attr];
112 const unsigned quads_per_entry = (bytes_per_entry + 15) / 16;
113 qword in[2 * 4] ALIGN16_ATTRIB;
114
115
116 /* Fetch four attributes for four vertices.
117 */
118 idx = 0;
119 for (i = 0; i < count; i++) {
120 const uint64_t addr = src + (elts[i] * pitch);
121
122 #if DRAW_DBG
123 printf("SPU: fetching = 0x%llx\n", addr);
124 #endif
125
126 spu_dcache_fetch_unaligned(& in[idx], addr, bytes_per_entry);
127 idx += quads_per_entry;
128 }
129
130 /* Be nice and zero out any missing vertices.
131 */
132 (void) memset(& in[idx], 0, (8 - idx) * sizeof(qword));
133
134
135 /* Convert all 4 vertices to vectors of float.
136 */
137 (*fetch)(&machine->Inputs[attr].xyzw[0].q, in, fetch_shuffle_data);
138 }
139 }
140
141
142 void spu_update_vertex_fetch( struct spu_vs_context *draw )
143 {
144 draw->vertex_fetch.fetch_func = generic_vertex_fetch;
145 }