Merge remote-tracking branch 'public/master' into vulkan
[mesa.git] / src / intel / vulkan / genX_state.c
1 /*
2 * Copyright © 2015 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 #include <assert.h>
25 #include <stdbool.h>
26 #include <string.h>
27 #include <unistd.h>
28 #include <fcntl.h>
29
30 #include "anv_private.h"
31
32 #include "genxml/gen_macros.h"
33 #include "genxml/genX_pack.h"
34
35 VkResult
36 genX(init_device_state)(struct anv_device *device)
37 {
38 GENX(MEMORY_OBJECT_CONTROL_STATE_pack)(NULL, &device->default_mocs,
39 &GENX(MOCS));
40
41 struct anv_batch batch;
42
43 uint32_t cmds[64];
44 batch.start = batch.next = cmds;
45 batch.end = (void *) cmds + sizeof(cmds);
46
47 anv_batch_emit(&batch, GENX(PIPELINE_SELECT),
48 #if GEN_GEN >= 9
49 .MaskBits = 3,
50 #endif
51 .PipelineSelection = _3D);
52
53 anv_batch_emit(&batch, GENX(3DSTATE_VF_STATISTICS),
54 .StatisticsEnable = true);
55 anv_batch_emit(&batch, GENX(3DSTATE_HS));
56 anv_batch_emit(&batch, GENX(3DSTATE_TE));
57 anv_batch_emit(&batch, GENX(3DSTATE_DS));
58
59 anv_batch_emit(&batch, GENX(3DSTATE_STREAMOUT), .SOFunctionEnable = false);
60 anv_batch_emit(&batch, GENX(3DSTATE_AA_LINE_PARAMETERS));
61
62 #if GEN_GEN >= 8
63 anv_batch_emit(&batch, GENX(3DSTATE_WM_CHROMAKEY),
64 .ChromaKeyKillEnable = false);
65
66 /* See the Vulkan 1.0 spec Table 24.1 "Standard sample locations" and
67 * VkPhysicalDeviceFeatures::standardSampleLocations.
68 */
69 anv_batch_emit(&batch, GENX(3DSTATE_SAMPLE_PATTERN),
70 ._1xSample0XOffset = 0.5,
71 ._1xSample0YOffset = 0.5,
72 ._2xSample0XOffset = 0.25,
73 ._2xSample0YOffset = 0.25,
74 ._2xSample1XOffset = 0.75,
75 ._2xSample1YOffset = 0.75,
76 ._4xSample0XOffset = 0.375,
77 ._4xSample0YOffset = 0.125,
78 ._4xSample1XOffset = 0.875,
79 ._4xSample1YOffset = 0.375,
80 ._4xSample2XOffset = 0.125,
81 ._4xSample2YOffset = 0.625,
82 ._4xSample3XOffset = 0.625,
83 ._4xSample3YOffset = 0.875,
84 ._8xSample0XOffset = 0.5625,
85 ._8xSample0YOffset = 0.3125,
86 ._8xSample1XOffset = 0.4375,
87 ._8xSample1YOffset = 0.6875,
88 ._8xSample2XOffset = 0.8125,
89 ._8xSample2YOffset = 0.5625,
90 ._8xSample3XOffset = 0.3125,
91 ._8xSample3YOffset = 0.1875,
92 ._8xSample4XOffset = 0.1875,
93 ._8xSample4YOffset = 0.8125,
94 ._8xSample5XOffset = 0.0625,
95 ._8xSample5YOffset = 0.4375,
96 ._8xSample6XOffset = 0.6875,
97 ._8xSample6YOffset = 0.9375,
98 ._8xSample7XOffset = 0.9375,
99 ._8xSample7YOffset = 0.0625,
100 #if GEN_GEN >= 9
101 ._16xSample0XOffset = 0.5625,
102 ._16xSample0YOffset = 0.5625,
103 ._16xSample1XOffset = 0.4375,
104 ._16xSample1YOffset = 0.3125,
105 ._16xSample2XOffset = 0.3125,
106 ._16xSample2YOffset = 0.6250,
107 ._16xSample3XOffset = 0.7500,
108 ._16xSample3YOffset = 0.4375,
109 ._16xSample4XOffset = 0.1875,
110 ._16xSample4YOffset = 0.3750,
111 ._16xSample5XOffset = 0.6250,
112 ._16xSample5YOffset = 0.8125,
113 ._16xSample6XOffset = 0.8125,
114 ._16xSample6YOffset = 0.6875,
115 ._16xSample7XOffset = 0.6875,
116 ._16xSample7YOffset = 0.1875,
117 ._16xSample8XOffset = 0.3750,
118 ._16xSample8YOffset = 0.8750,
119 ._16xSample9XOffset = 0.5000,
120 ._16xSample9YOffset = 0.0625,
121 ._16xSample10XOffset = 0.2500,
122 ._16xSample10YOffset = 0.1250,
123 ._16xSample11XOffset = 0.1250,
124 ._16xSample11YOffset = 0.7500,
125 ._16xSample12XOffset = 0.0000,
126 ._16xSample12YOffset = 0.5000,
127 ._16xSample13XOffset = 0.9375,
128 ._16xSample13YOffset = 0.2500,
129 ._16xSample14XOffset = 0.8750,
130 ._16xSample14YOffset = 0.9375,
131 ._16xSample15XOffset = 0.0625,
132 ._16xSample15YOffset = 0.0000,
133 #endif
134 );
135 #endif
136
137 anv_batch_emit(&batch, GENX(MI_BATCH_BUFFER_END));
138
139 assert(batch.next <= batch.end);
140
141 return anv_device_submit_simple_batch(device, &batch);
142 }
143
144 static inline uint32_t
145 vk_to_gen_tex_filter(VkFilter filter, bool anisotropyEnable)
146 {
147 switch (filter) {
148 default:
149 assert(!"Invalid filter");
150 case VK_FILTER_NEAREST:
151 return MAPFILTER_NEAREST;
152 case VK_FILTER_LINEAR:
153 return anisotropyEnable ? MAPFILTER_ANISOTROPIC : MAPFILTER_LINEAR;
154 }
155 }
156
/**
 * Convert a maximum-anisotropy ratio into the value stored in the
 * MaximumAnisotropy field of SAMPLER_STATE.
 *
 * The ratio is first limited to the range [2, 16] and then mapped with
 * (ratio - 2) / 2, so 2 yields 0 and 16 yields 7.  The floating-point
 * result is truncated by the conversion to the integer return type.
 */
static inline uint32_t
vk_to_gen_max_anisotropy(float ratio)
{
   const float clamped = anv_clamp_f(ratio, 2, 16);

   return (clamped - 2) / 2;
}
162
163 static const uint32_t vk_to_gen_mipmap_mode[] = {
164 [VK_SAMPLER_MIPMAP_MODE_NEAREST] = MIPFILTER_NEAREST,
165 [VK_SAMPLER_MIPMAP_MODE_LINEAR] = MIPFILTER_LINEAR
166 };
167
168 static const uint32_t vk_to_gen_tex_address[] = {
169 [VK_SAMPLER_ADDRESS_MODE_REPEAT] = TCM_WRAP,
170 [VK_SAMPLER_ADDRESS_MODE_MIRRORED_REPEAT] = TCM_MIRROR,
171 [VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_EDGE] = TCM_CLAMP,
172 [VK_SAMPLER_ADDRESS_MODE_MIRROR_CLAMP_TO_EDGE] = TCM_MIRROR_ONCE,
173 [VK_SAMPLER_ADDRESS_MODE_CLAMP_TO_BORDER] = TCM_CLAMP_BORDER,
174 };
175
176 /* Vulkan specifies the result of shadow comparisons as:
177 * 1 if ref <op> texel,
178 * 0 otherwise.
179 *
180 * The hardware does:
181 * 0 if texel <op> ref,
182 * 1 otherwise.
183 *
184 * So, these look a bit strange because there's both a negation
185 * and swapping of the arguments involved.
186 */
187 static const uint32_t vk_to_gen_shadow_compare_op[] = {
188 [VK_COMPARE_OP_NEVER] = PREFILTEROPALWAYS,
189 [VK_COMPARE_OP_LESS] = PREFILTEROPLEQUAL,
190 [VK_COMPARE_OP_EQUAL] = PREFILTEROPNOTEQUAL,
191 [VK_COMPARE_OP_LESS_OR_EQUAL] = PREFILTEROPLESS,
192 [VK_COMPARE_OP_GREATER] = PREFILTEROPGEQUAL,
193 [VK_COMPARE_OP_NOT_EQUAL] = PREFILTEROPEQUAL,
194 [VK_COMPARE_OP_GREATER_OR_EQUAL] = PREFILTEROPGREATER,
195 [VK_COMPARE_OP_ALWAYS] = PREFILTEROPNEVER,
196 };
197
198 VkResult genX(CreateSampler)(
199 VkDevice _device,
200 const VkSamplerCreateInfo* pCreateInfo,
201 const VkAllocationCallbacks* pAllocator,
202 VkSampler* pSampler)
203 {
204 ANV_FROM_HANDLE(anv_device, device, _device);
205 struct anv_sampler *sampler;
206
207 assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_SAMPLER_CREATE_INFO);
208
209 sampler = anv_alloc2(&device->alloc, pAllocator, sizeof(*sampler), 8,
210 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
211 if (!sampler)
212 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
213
214 uint32_t border_color_offset = device->border_colors.offset +
215 pCreateInfo->borderColor * 64;
216
217 struct GENX(SAMPLER_STATE) sampler_state = {
218 .SamplerDisable = false,
219 .TextureBorderColorMode = DX10OGL,
220
221 #if GEN_GEN >= 8
222 .LODPreClampMode = CLAMP_MODE_OGL,
223 #else
224 .LODPreClampEnable = CLAMP_ENABLE_OGL,
225 #endif
226
227 #if GEN_GEN == 8
228 .BaseMipLevel = 0.0,
229 #endif
230 .MipModeFilter = vk_to_gen_mipmap_mode[pCreateInfo->mipmapMode],
231 .MagModeFilter = vk_to_gen_tex_filter(pCreateInfo->magFilter,
232 pCreateInfo->anisotropyEnable),
233 .MinModeFilter = vk_to_gen_tex_filter(pCreateInfo->minFilter,
234 pCreateInfo->anisotropyEnable),
235 .TextureLODBias = anv_clamp_f(pCreateInfo->mipLodBias, -16, 15.996),
236 .AnisotropicAlgorithm = EWAApproximation,
237 .MinLOD = anv_clamp_f(pCreateInfo->minLod, 0, 14),
238 .MaxLOD = anv_clamp_f(pCreateInfo->maxLod, 0, 14),
239 .ChromaKeyEnable = 0,
240 .ChromaKeyIndex = 0,
241 .ChromaKeyMode = 0,
242 .ShadowFunction = vk_to_gen_shadow_compare_op[pCreateInfo->compareOp],
243 .CubeSurfaceControlMode = OVERRIDE,
244
245 .BorderColorPointer = border_color_offset,
246
247 #if GEN_GEN >= 8
248 .LODClampMagnificationMode = MIPNONE,
249 #endif
250
251 .MaximumAnisotropy = vk_to_gen_max_anisotropy(pCreateInfo->maxAnisotropy),
252 .RAddressMinFilterRoundingEnable = 0,
253 .RAddressMagFilterRoundingEnable = 0,
254 .VAddressMinFilterRoundingEnable = 0,
255 .VAddressMagFilterRoundingEnable = 0,
256 .UAddressMinFilterRoundingEnable = 0,
257 .UAddressMagFilterRoundingEnable = 0,
258 .TrilinearFilterQuality = 0,
259 .NonnormalizedCoordinateEnable = pCreateInfo->unnormalizedCoordinates,
260 .TCXAddressControlMode = vk_to_gen_tex_address[pCreateInfo->addressModeU],
261 .TCYAddressControlMode = vk_to_gen_tex_address[pCreateInfo->addressModeV],
262 .TCZAddressControlMode = vk_to_gen_tex_address[pCreateInfo->addressModeW],
263 };
264
265 GENX(SAMPLER_STATE_pack)(NULL, sampler->state, &sampler_state);
266
267 *pSampler = anv_sampler_to_handle(sampler);
268
269 return VK_SUCCESS;
270 }