1 /* $Id: sse.c,v 1.1 2001/03/29 06:46:16 gareth Exp $ */
4 * Mesa 3-D graphics library
7 * Copyright (C) 1999-2001 Brian Paul All Rights Reserved.
9 * Permission is hereby granted, free of charge, to any person obtaining a
10 * copy of this software and associated documentation files (the "Software"),
11 * to deal in the Software without restriction, including without limitation
12 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
13 * and/or sell copies of the Software, and to permit persons to whom the
14 * Software is furnished to do so, subject to the following conditions:
16 * The above copyright notice and this permission notice shall be included
17 * in all copies or substantial portions of the Software.
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
20 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
21 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
22 * BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
23 * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
24 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
28 * PentiumIII-SIMD (SSE) optimizations contributed by
29 * Andre Werthmann <wertmann@cs.uni-potsdam.de>
37 #include "math/m_vertices.h"
38 #include "math/m_xform.h"
40 #include "tnl/t_context.h"
43 #include "math/m_debug.h"
/* Parameter list used by the transform-routine prototypes that
 * DECLARE_XFORM_GROUP generates.  The parameters visible here are a
 * destination GLvector4f, a 16-element GLfloat array m, a source GLvector4f
 * and a GLubyte mask pointer.
 * NOTE(review): the last visible line still ends in a continuation, so the
 * tail of this list is not shown in this view -- confirm against the full
 * file before relying on it.
 */
47 #define XFORM_ARGS GLvector4f *to_vec, \
48 const GLfloat m[16], \
49 const GLvector4f *from_vec, \
50 const GLubyte *mask, \
/*
 * Declare the seven external transform routines for one prefix/point-size
 * pair.  Each routine is named _mesa_<pfx>_transform_points<sz>_<kind> and
 * takes XFORM_ARGS.
 *
 *   pfx - routine-name prefix, pasted into the identifier
 *   sz  - point size, pasted into the identifier
 *
 * The expansion already ends in a semicolon, so it is used at file scope
 * without one.
 */
#define DECLARE_XFORM_GROUP( pfx, sz ) \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_points##sz##_general( XFORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_points##sz##_identity( XFORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_points##sz##_3d_no_rot( XFORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_points##sz##_perspective( XFORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_points##sz##_2d( XFORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_points##sz##_2d_no_rot( XFORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_points##sz##_3d( XFORM_ARGS );
/*
 * Store the seven _mesa_<pfx>_transform_points<sz>_<kind> routines into
 * _mesa_transform_tab[0][sz][...], one entry per MATRIX_* type.
 *
 *   pfx - routine-name prefix, pasted into the identifier
 *   sz  - point size; used both as the table index and in the identifier
 *
 * The assignments are wrapped in do { } while (0) so the whole group acts
 * as a single statement: under an unbraced if/else every assignment is
 * guarded, not just the first one.  Invoke it with a trailing semicolon.
 */
#define ASSIGN_XFORM_GROUP( pfx, sz ) \
do { \
   _mesa_transform_tab[0][sz][MATRIX_GENERAL] = \
      _mesa_##pfx##_transform_points##sz##_general; \
   _mesa_transform_tab[0][sz][MATRIX_IDENTITY] = \
      _mesa_##pfx##_transform_points##sz##_identity; \
   _mesa_transform_tab[0][sz][MATRIX_3D_NO_ROT] = \
      _mesa_##pfx##_transform_points##sz##_3d_no_rot; \
   _mesa_transform_tab[0][sz][MATRIX_PERSPECTIVE] = \
      _mesa_##pfx##_transform_points##sz##_perspective; \
   _mesa_transform_tab[0][sz][MATRIX_2D] = \
      _mesa_##pfx##_transform_points##sz##_2d; \
   _mesa_transform_tab[0][sz][MATRIX_2D_NO_ROT] = \
      _mesa_##pfx##_transform_points##sz##_2d_no_rot; \
   _mesa_transform_tab[0][sz][MATRIX_3D] = \
      _mesa_##pfx##_transform_points##sz##_3d; \
} while (0)
/* Parameter list used by the normal-transform prototypes that
 * DECLARE_NORM_GROUP generates.  The parameters visible here are a GLmatrix
 * pointer, an input GLvector3f, a GLfloat lengths pointer and a GLubyte mask
 * array.
 * NOTE(review): the last visible line still ends in a continuation and the
 * embedded line numbers skip values, so some parameters are not shown in
 * this view -- confirm against the full file before relying on it.
 */
82 #define NORM_ARGS const GLmatrix *mat, \
84 const GLvector3f *in, \
85 const GLfloat *lengths, \
86 const GLubyte mask[], \
/*
 * Declare the eight external normal-processing routines for one prefix.
 * Each routine is named _mesa_<pfx>_<operation>_normals[_no_rot] and takes
 * NORM_ARGS.
 *
 *   pfx - routine-name prefix, pasted into the identifier
 *
 * The expansion already ends in a semicolon, so it is used at file scope
 * without one.
 */
#define DECLARE_NORM_GROUP( pfx ) \
   extern void _ASMAPI \
   _mesa_##pfx##_rescale_normals( NORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_normalize_normals( NORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_normals( NORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_normals_no_rot( NORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_rescale_normals( NORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_rescale_normals_no_rot( NORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_normalize_normals( NORM_ARGS ); \
   extern void _ASMAPI \
   _mesa_##pfx##_transform_normalize_normals_no_rot( NORM_ARGS );
/*
 * Store the eight _mesa_<pfx>_*_normals routines into
 * _mesa_normal_tab[<NORM_* flags>][0], one entry per flag combination
 * listed below.
 *
 *   pfx - routine-name prefix, pasted into the identifier
 *
 * The assignments are wrapped in do { } while (0) so the whole group acts
 * as a single statement: under an unbraced if/else every assignment is
 * guarded, not just the first one.  Invoke it with a trailing semicolon.
 */
#define ASSIGN_NORM_GROUP( pfx ) \
do { \
   _mesa_normal_tab[NORM_RESCALE][0] = \
      _mesa_##pfx##_rescale_normals; \
   _mesa_normal_tab[NORM_NORMALIZE][0] = \
      _mesa_##pfx##_normalize_normals; \
   _mesa_normal_tab[NORM_TRANSFORM][0] = \
      _mesa_##pfx##_transform_normals; \
   _mesa_normal_tab[NORM_TRANSFORM_NO_ROT][0] = \
      _mesa_##pfx##_transform_normals_no_rot; \
   _mesa_normal_tab[NORM_TRANSFORM|NORM_RESCALE][0] = \
      _mesa_##pfx##_transform_rescale_normals; \
   _mesa_normal_tab[NORM_TRANSFORM_NO_ROT|NORM_RESCALE][0] = \
      _mesa_##pfx##_transform_rescale_normals_no_rot; \
   _mesa_normal_tab[NORM_TRANSFORM|NORM_NORMALIZE][0] = \
      _mesa_##pfx##_transform_normalize_normals; \
   _mesa_normal_tab[NORM_TRANSFORM_NO_ROT|NORM_NORMALIZE][0] = \
      _mesa_##pfx##_transform_normalize_normals_no_rot; \
} while (0)
/* External declarations for the SSE routines: the transform groups for
 * point sizes 2 and 3, six individually declared normal / points4 routines,
 * and the normal-transform group.
 * NOTE(review): the embedded line numbers skip values between these
 * declarations, so any preprocessor guards around them are not visible in
 * this view.
 */
121 DECLARE_XFORM_GROUP( sse
, 2 )
122 DECLARE_XFORM_GROUP( sse
, 3 )
125 /* Some functions are not written in SSE assembly because the FPU versions are faster. */
126 extern void _mesa_sse_transform_normals_no_rot( NORM_ARGS
);
127 extern void _mesa_sse_transform_rescale_normals( NORM_ARGS
);
128 extern void _mesa_sse_transform_rescale_normals_no_rot( NORM_ARGS
);
130 extern void _mesa_sse_transform_points4_general( XFORM_ARGS
);
131 extern void _mesa_sse_transform_points4_3d( XFORM_ARGS
);
132 extern void _mesa_sse_transform_points4_identity( XFORM_ARGS
);
134 DECLARE_NORM_GROUP( sse
)
/* Prototypes for the three SSE vertex routines that
 * _mesa_init_sse_vertex_asm() refers to: _mesa_v16_sse_general_xform,
 * _mesa_sse_project_vertices and _mesa_sse_project_clipped_vertices.
 * NOTE(review): only the first parameter of each (plus the trailing
 * clipmask of the last) is visible in this view; return types and the
 * remaining parameters must be taken from the full file.
 */
139 _mesa_v16_sse_general_xform( GLfloat
*first_vert
,
146 _mesa_sse_project_vertices( GLfloat
*first
,
152 _mesa_sse_project_clipped_vertices( GLfloat
*first
,
156 const GLubyte
*clipmask
);
/* Hook the SSE transform routines into the shared dispatch tables.
 *
 * Visible steps, in order: ASSIGN_XFORM_GROUP for point sizes 2 and 3;
 * a run of individual _mesa_normal_tab / _mesa_transform_tab assignments
 * that follows the "TODO: Finish these off" note; ASSIGN_NORM_GROUP( sse );
 * and finally calls to _math_test_all_transform_functions( "SSE" ) and
 * _math_test_all_normal_transform_functions( "SSE" ).
 *
 * NOTE(review): the function braces, the end of the TODO comment and any
 * preprocessor guards are not visible in this view, so which of these
 * statements are actually compiled in cannot be confirmed from here.
 */
160 void _mesa_init_sse_transform_asm( void )
163 ASSIGN_XFORM_GROUP( sse
, 2 );
164 ASSIGN_XFORM_GROUP( sse
, 3 );
167 /* TODO: Finish these off.
169 _mesa_normal_tab
[NORM_TRANSFORM_NO_ROT
][0] =
170 _mesa_sse_transform_normals_no_rot
;
171 _mesa_normal_tab
[NORM_TRANSFORM
|NORM_RESCALE
][0] =
172 _mesa_sse_transform_rescale_normals
;
173 _mesa_normal_tab
[NORM_TRANSFORM_NO_ROT
|NORM_RESCALE
][0] =
174 _mesa_sse_transform_rescale_normals_no_rot
;
176 _mesa_transform_tab
[0][4][MATRIX_GENERAL
] =
177 _mesa_sse_transform_points4_general
;
178 _mesa_transform_tab
[0][4][MATRIX_3D
] =
179 _mesa_sse_transform_points4_3d
;
180 _mesa_transform_tab
[0][4][MATRIX_IDENTITY
] =
181 _mesa_sse_transform_points4_identity
;
183 ASSIGN_NORM_GROUP( sse
);
187 _math_test_all_transform_functions( "SSE" );
188 _math_test_all_normal_transform_functions( "SSE" );
/* Hook the SSE vertex routines into the shared function pointers.
 *
 * Visible steps, in order: _mesa_xform_points3_v16_general is pointed at
 * _mesa_v16_sse_general_xform; assignments of _mesa_project_v16 and
 * _mesa_project_clipped_v16 follow the "GH: These are broken" note; and
 * finally _math_test_all_vertex_functions( "SSE" ) is called.
 *
 * NOTE(review): the function braces, the end of the GH comment and any
 * preprocessor guards are not visible in this view, so whether the two
 * projection assignments are active cannot be confirmed from here.
 */
193 void _mesa_init_sse_vertex_asm( void )
196 _mesa_xform_points3_v16_general
= _mesa_v16_sse_general_xform
;
198 /* GH: These are broken. I'm fixing them now.
200 _mesa_project_v16
= _mesa_sse_project_vertices
;
201 _mesa_project_clipped_v16
= _mesa_sse_project_clipped_vertices
;
205 _math_test_all_vertex_functions( "SSE" );