1 /**************************************************************************
3 * Copyright 2010 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
32 #include "util/u_pointer.h"
33 #include "gallivm/lp_bld.h"
34 #include "gallivm/lp_bld_init.h"
35 #include "gallivm/lp_bld_arit.h"
37 #include <llvm-c/Analysis.h>
38 #include <llvm-c/ExecutionEngine.h>
39 #include <llvm-c/Target.h>
40 #include <llvm-c/Transforms/Scalar.h>
/*
 * write_tsv_header: takes the output stream `fp`.
 *
 * NOTE(review): only the parameter list is visible in this excerpt; the
 * return type and body are not shown.  Presumably this writes a
 * tab-separated header row to `fp` -- confirm against the full file.
 */
46 write_tsv_header(FILE *fp
)
59 #include "sse_mathfun.h"
/*
 * Pointer to a function that takes one __m128 and returns a __m128.
 * test_round() casts the addresses it gets from LLVMGetPointerToGlobal()
 * for the generated "round"/"trunc"/"floor"/"ceil" functions to this type.
 */
61 typedef __m128 (*test_round_t
)(__m128
);
/*
 * Pointer to a code-building callback: given a struct lp_build_context *
 * and one LLVMValueRef operand, it returns an LLVMValueRef.  add_test()
 * calls it to produce the value its generated function returns;
 * test_round() passes lp_build_round, lp_build_trunc, lp_build_floor and
 * lp_build_ceil in this role.
 */
63 typedef LLVMValueRef (*lp_func_t
)(struct lp_build_context
*, LLVMValueRef
);
/*
 * add_test: adds a function called `name` to `module` and emits its body.
 *
 * The function takes one 4 x float vector and returns a 4 x float vector.
 * Its body is a single "entry" block that returns whatever `lp_func`
 * builds from the function's only parameter.
 *
 *   module   module that receives the new function
 *   name     name given to the new function
 *   lp_func  callback that builds the result value from the parameter
 *
 * NOTE(review): the declaration of `ret` and this function's return
 * statement are not visible in this excerpt.  Callers store the result in
 * an LLVMValueRef, presumably the created function -- confirm.
 */
67 add_test(LLVMModuleRef module
, const char *name
, lp_func_t lp_func
)
/* Vector type used for both the argument and the result. */
69 LLVMTypeRef v4sf
= LLVMVectorType(LLVMFloatType(), 4);
70 LLVMTypeRef args
[1] = { v4sf
};
/* Function type built from v4sf (result) and the one-element args array. */
71 LLVMValueRef func
= LLVMAddFunction(module
, name
, LLVMFunctionType(v4sf
, args
, 1, 0));
72 LLVMValueRef arg1
= LLVMGetParam(func
, 0);
73 LLVMBuilderRef builder
= LLVMCreateBuilder();
74 LLVMBasicBlockRef block
= LLVMAppendBasicBlock(func
, "entry");
76 struct lp_build_context bld
;
/* Build context for 4 x float32 vectors, emitting through `builder`. */
78 lp_build_context_init(&bld
, builder
, lp_float32_vec4_type());
/* C calling convention: test_round() later casts the address of the
 * compiled function to a plain C function pointer type (test_round_t). */
80 LLVMSetFunctionCallConv(func
, LLVMCCallConv
);
82 LLVMPositionBuilderAtEnd(builder
, block
);
/* Let the callback emit the computation on the parameter. */
84 ret
= lp_func(&bld
, arg1
);
86 LLVMBuildRet(builder
, ret
);
/* The builder was created above for this one function only. */
87 LLVMDisposeBuilder(builder
);
/*
 * printv: prints `string`, a colon, and four floats (each formatted with
 * %10f) followed by a newline to stdout.
 *
 * The four floats are read through a float pointer aimed at `v`.
 * NOTE(review): the declaration of `v` is not visible in this excerpt;
 * presumably it is a local copy of `value` -- confirm.
 */
92 printv(char* string
, v4sf value
)
95 float *f
= (float *)&v
;
96 printf("%s: %10f %10f %10f %10f\n", string
,
97 f
[0], f
[1], f
[2], f
[3]);
/*
 * compare: checks two v4sf values against each other, reading both
 * through float pointers (xp, yp), and prints an "Incorrect result!"
 * banner to stdout on the mismatch path.
 *
 * test_round() ANDs the value returned here into its own `success` flag.
 *
 * NOTE(review): only the first term of the condition (element 0) and the
 * printf are visible in this excerpt.  The remaining terms, any update of
 * `success`, and the return statement are not shown -- confirm against
 * the full file.
 */
101 compare(v4sf x
, v4sf y
)
103 boolean success
= TRUE
;
104 float *xp
= (float *) &x
;
105 float *yp
= (float *) &y
;
106 if (xp
[0] != yp
[0] ||
110 printf(" Incorrect result! ^^^^^^^^^^^^^^^^^^^^^^^^^^^^ \n");
/*
 * test_round (variant before the "#else !PIPE_ARCH_SSE" line): creates an
 * LLVM module named "test" holding four generated functions -- "round",
 * "trunc", "floor" and "ceil", built via lp_build_round, lp_build_trunc,
 * lp_build_floor and lp_build_ceil -- and checks vectors against
 * reference values computed with the C library's round(), trunc(),
 * floor() and ceil().
 *
 *   verbose, fp  supplied by test_all(); neither is referenced in the
 *                lines visible here.
 *
 * `success` starts as TRUE and is ANDed with each compare() result.
 *
 * NOTE(review): this excerpt omits lines of the original function.  The
 * declarations of `error`, `unpacked`, `i`, `x`, `y` and `ref`, the
 * statements that assign `y`, and the return statement are not visible --
 * confirm against the full file before relying on the comments below.
 */
120 test_round(unsigned verbose
, FILE *fp
)
122 LLVMModuleRef module
= NULL
;
/* Note: this local shadows the enclosing function's own name. */
123 LLVMValueRef test_round
= NULL
, test_trunc
, test_floor
, test_ceil
;
/* NOTE(review): `engine` is taken from the external name lp_build_engine
 * and is passed to LLVMDisposeExecutionEngine() at the end of this
 * function; confirm nothing else uses lp_build_engine afterwards. */
124 LLVMExecutionEngineRef engine
= lp_build_engine
;
125 LLVMPassManagerRef pass
= NULL
;
127 test_round_t round_func
, trunc_func
, floor_func
, ceil_func
;
130 boolean success
= TRUE
;
/* Create the module and add one generated function per operation. */
133 module
= LLVMModuleCreateWithName("test");
135 test_round
= add_test(module
, "round", lp_build_round
);
136 test_trunc
= add_test(module
, "trunc", lp_build_trunc
);
137 test_floor
= add_test(module
, "floor", lp_build_floor
);
138 test_ceil
= add_test(module
, "ceil", lp_build_ceil
);
/* Verify the module; when verification reports a problem the message is
 * printed and the module is dumped. */
140 if(LLVMVerifyModule(module
, LLVMPrintMessageAction
, &error
)) {
141 printf("LLVMVerifyModule: %s\n", error
);
142 LLVMDumpModule(module
);
145 LLVMDisposeMessage(error
);
/* Create a pass manager, register passes, and run it over the module.
 * NOTE(review): lines around this section are missing from the excerpt,
 * so it cannot be told from here whether it is conditionally compiled. */
148 pass
= LLVMCreatePassManager();
149 LLVMAddTargetData(LLVMGetExecutionEngineTargetData(engine
), pass
);
150 /* These are the passes currently listed in llvm-c/Transforms/Scalar.h,
151 * but there are more on SVN. */
152 LLVMAddConstantPropagationPass(pass
);
153 LLVMAddInstructionCombiningPass(pass
);
154 LLVMAddPromoteMemoryToRegisterPass(pass
);
155 LLVMAddGVNPass(pass
);
156 LLVMAddCFGSimplificationPass(pass
);
157 LLVMRunPassManager(pass
, module
);
/* Ask the execution engine for the address of each generated function
 * and cast it to the test_round_t function pointer type. */
162 round_func
= (test_round_t
) pointer_to_func(LLVMGetPointerToGlobal(engine
, test_round
));
163 trunc_func
= (test_round_t
) pointer_to_func(LLVMGetPointerToGlobal(engine
, test_trunc
));
164 floor_func
= (test_round_t
) pointer_to_func(LLVMGetPointerToGlobal(engine
, test_floor
));
165 ceil_func
= (test_round_t
) pointer_to_func(LLVMGetPointerToGlobal(engine
, test_ceil
));
167 memset(unpacked
, 0, sizeof unpacked
);
171 LLVMDumpModule(module
);
/* Three iterations over the three rows of test inputs listed below
 * (presumably one row per iteration -- the indexing is not visible here).
 * No listed input has a fractional part of exactly 0.5. */
173 for (i
= 0; i
< 3; i
++) {
175 {-10.0, -1, 0, 12.0},
176 {-1.5, -0.25, 1.25, 2.5},
177 {-0.99, -0.01, 0.01, 0.99}
/* Float views of the input vector and of the reference vector. */
181 float *xp
= (float *) &x
;
182 float *refp
= (float *) &ref
;
/* Reference for round(): computed element by element with the C library. */
187 refp
[0] = round(xp
[0]);
188 refp
[1] = round(xp
[1]);
189 refp
[2] = round(xp
[2]);
190 refp
[3] = round(xp
[3]);
192 printv("C round(x) ", ref
);
193 printv("LLVM round(x)", y
);
194 success
= success
&& compare(ref
, y
);
/* Reference for trunc(). */
196 refp
[0] = trunc(xp
[0]);
197 refp
[1] = trunc(xp
[1]);
198 refp
[2] = trunc(xp
[2]);
199 refp
[3] = trunc(xp
[3]);
201 printv("C trunc(x) ", ref
);
202 printv("LLVM trunc(x)", y
);
203 success
= success
&& compare(ref
, y
);
/* Reference for floor(). */
205 refp
[0] = floor(xp
[0]);
206 refp
[1] = floor(xp
[1]);
207 refp
[2] = floor(xp
[2]);
208 refp
[3] = floor(xp
[3]);
210 printv("C floor(x) ", ref
);
211 printv("LLVM floor(x)", y
);
212 success
= success
&& compare(ref
, y
);
/* Reference for ceil(). */
214 refp
[0] = ceil(xp
[0]);
215 refp
[1] = ceil(xp
[1]);
216 refp
[2] = ceil(xp
[2]);
217 refp
[3] = ceil(xp
[3]);
219 printv("C ceil(x) ", ref
);
220 printv("LLVM ceil(x) ", y
);
221 success
= success
&& compare(ref
, y
);
/* Free the machine code of the four functions, then the execution engine
 * and the pass manager. */
224 LLVMFreeMachineCodeForFunction(engine
, test_round
);
225 LLVMFreeMachineCodeForFunction(engine
, test_trunc
);
226 LLVMFreeMachineCodeForFunction(engine
, test_floor
);
227 LLVMFreeMachineCodeForFunction(engine
, test_ceil
);
229 LLVMDisposeExecutionEngine(engine
);
231 LLVMDisposePassManager(pass
);
236 #else /* !PIPE_ARCH_SSE */
/*
 * test_round, variant placed between "#else !PIPE_ARCH_SSE" and the
 * matching #endif.  Same parameter list as the variant above.
 *
 * NOTE(review): only the parameter list is visible in this excerpt; the
 * body and return value are not shown.
 */
239 test_round(unsigned verbose
, FILE *fp
)
244 #endif /* !PIPE_ARCH_SSE */
/*
 * test_all: forwards `verbose` and `fp` unchanged to test_round() and
 * returns its result.
 */
248 test_all(unsigned verbose
, FILE *fp
)
250 return test_round(verbose
, fp
);
/*
 * test_some: forwards `verbose` and `fp` to test_all() and returns its
 * result.  `n` is not used in the visible body.
 */
255 test_some(unsigned verbose
, FILE *fp
, unsigned long n
)
257 return test_all(verbose
, fp
);
/*
 * test_single: prints "no test_single()" to stdout (no trailing newline).
 * Neither `verbose` nor `fp` is referenced in the visible lines.
 *
 * NOTE(review): the return type and return statement are not visible in
 * this excerpt.
 */
261 test_single(unsigned verbose
, FILE *fp
)
263 printf("no test_single()");