75309dd5fcd4aea9299d9bc7598219d08a291b4e
[mesa.git] / src / gallium / drivers / llvmpipe / lp_bld_blend.c
1 /**************************************************************************
2 *
3 * Copyright 2012 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 #include "pipe/p_state.h"
29 #include "util/u_debug.h"
30
31 #include "gallivm/lp_bld_type.h"
32 #include "gallivm/lp_bld_arit.h"
33
34 #include "lp_bld_blend.h"
35
36 /**
37 * Is (a OP b) == (b OP a)?
38 */
39 boolean
40 lp_build_blend_func_commutative(unsigned func)
41 {
42 switch (func) {
43 case PIPE_BLEND_ADD:
44 case PIPE_BLEND_MIN:
45 case PIPE_BLEND_MAX:
46 return TRUE;
47 case PIPE_BLEND_SUBTRACT:
48 case PIPE_BLEND_REVERSE_SUBTRACT:
49 return FALSE;
50 default:
51 assert(0);
52 return TRUE;
53 }
54 }
55
56
57 /**
58 * Whether the blending functions are the reverse of each other.
59 */
60 boolean
61 lp_build_blend_func_reverse(unsigned rgb_func, unsigned alpha_func)
62 {
63 if(rgb_func == alpha_func)
64 return FALSE;
65 if(rgb_func == PIPE_BLEND_SUBTRACT && alpha_func == PIPE_BLEND_REVERSE_SUBTRACT)
66 return TRUE;
67 if(rgb_func == PIPE_BLEND_REVERSE_SUBTRACT && alpha_func == PIPE_BLEND_SUBTRACT)
68 return TRUE;
69 return FALSE;
70 }
71
72
73 /**
74 * Whether the blending factors are complementary of each other.
75 */
76 static INLINE boolean
77 lp_build_blend_factor_complementary(unsigned src_factor, unsigned dst_factor)
78 {
79 return dst_factor == (src_factor ^ 0x10);
80 }
81
82
83 /**
84 * @sa http://www.opengl.org/sdk/docs/man/xhtml/glBlendEquationSeparate.xml
85 */
86 LLVMValueRef
87 lp_build_blend_func(struct lp_build_context *bld,
88 unsigned func,
89 LLVMValueRef term1,
90 LLVMValueRef term2)
91 {
92 switch (func) {
93 case PIPE_BLEND_ADD:
94 return lp_build_add(bld, term1, term2);
95 case PIPE_BLEND_SUBTRACT:
96 return lp_build_sub(bld, term1, term2);
97 case PIPE_BLEND_REVERSE_SUBTRACT:
98 return lp_build_sub(bld, term2, term1);
99 case PIPE_BLEND_MIN:
100 return lp_build_min(bld, term1, term2);
101 case PIPE_BLEND_MAX:
102 return lp_build_max(bld, term1, term2);
103 default:
104 assert(0);
105 return bld->zero;
106 }
107 }
108
109
110 /**
111 * Performs optimisations and blending independent of SoA/AoS
112 *
113 * @param func the blend function
114 * @param factor_src PIPE_BLENDFACTOR_xxx
115 * @param factor_dst PIPE_BLENDFACTOR_xxx
116 * @param src source rgba
117 * @param dst dest rgba
118 * @param src_factor src factor computed value
119 * @param dst_factor dst factor computed value
120 * @param not_alpha_dependent same factors accross all channels of src/dst
121 *
122 * not_alpha_dependent should be:
123 * SoA: always true as it is only one channel at a time
124 * AoS: rgb_src_factor == alpha_src_factor && rgb_dst_factor == alpha_dst_factor
125 *
126 * Note that pretty much every possible optimisation can only be done on non-unorm targets
127 * due to unorm values not going above 1.0 meaning factorisation can change results.
128 * e.g. (0.9 * 0.9) + (0.9 * 0.9) != 0.9 * (0.9 + 0.9) as result of + is always <= 1.
129 */
130 LLVMValueRef
131 lp_build_blend(struct lp_build_context *bld,
132 unsigned func,
133 unsigned factor_src,
134 unsigned factor_dst,
135 LLVMValueRef src,
136 LLVMValueRef dst,
137 LLVMValueRef src_factor,
138 LLVMValueRef dst_factor,
139 boolean not_alpha_dependent,
140 boolean optimise_only)
141 {
142 LLVMValueRef result, src_term, dst_term;
143
144 /* If we are not alpha dependent we can mess with the src/dst factors */
145 if (not_alpha_dependent) {
146 if (lp_build_blend_factor_complementary(factor_src, factor_dst)) {
147 if (func == PIPE_BLEND_ADD) {
148 if (factor_src < factor_dst) {
149 return lp_build_lerp(bld, src_factor, dst, src);
150 } else {
151 return lp_build_lerp(bld, dst_factor, src, dst);
152 }
153 } else if(bld->type.floating && func == PIPE_BLEND_SUBTRACT) {
154 result = lp_build_add(bld, src, dst);
155
156 if (factor_src < factor_dst) {
157 result = lp_build_mul(bld, result, src_factor);
158 return lp_build_sub(bld, result, dst);
159 } else {
160 result = lp_build_mul(bld, result, dst_factor);
161 return lp_build_sub(bld, src, result);
162 }
163 } else if(bld->type.floating && func == PIPE_BLEND_REVERSE_SUBTRACT) {
164 result = lp_build_add(bld, src, dst);
165
166 if (factor_src < factor_dst) {
167 result = lp_build_mul(bld, result, src_factor);
168 return lp_build_sub(bld, dst, result);
169 } else {
170 result = lp_build_mul(bld, result, dst_factor);
171 return lp_build_sub(bld, result, src);
172 }
173 }
174 }
175
176 if (bld->type.floating && factor_src == factor_dst) {
177 if (func == PIPE_BLEND_ADD ||
178 func == PIPE_BLEND_SUBTRACT ||
179 func == PIPE_BLEND_REVERSE_SUBTRACT) {
180 LLVMValueRef result;
181 result = lp_build_blend_func(bld, func, src, dst);
182 return lp_build_mul(bld, result, src_factor);
183 }
184 }
185 }
186
187 if (optimise_only)
188 return NULL;
189
190 src_term = lp_build_mul(bld, src, src_factor);
191 dst_term = lp_build_mul(bld, dst, dst_factor);
192 return lp_build_blend_func(bld, func, src_term, dst_term);
193 }