--- /dev/null
+/*
+ * Copyright © 2016 Intel Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice (including the next
+ * paragraph) shall be included in all copies or substantial portions of the
+ * Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
+ * IN THE SOFTWARE.
+ */
+
+#include "anv_private.h"
+
+static bool
+lookup_blorp_shader(struct blorp_context *blorp,
+ const void *key, uint32_t key_size,
+ uint32_t *kernel_out, void *prog_data_out)
+{
+ struct anv_device *device = blorp->driver_ctx;
+
+ /* The blorp cache must be a real cache */
+ assert(device->blorp_shader_cache.cache);
+
+ struct anv_shader_bin *bin =
+ anv_pipeline_cache_search(&device->blorp_shader_cache, key, key_size);
+ if (!bin)
+ return false;
+
+ /* The cache already has a reference and it's not going anywhere so there
+ * is no need to hold a second reference.
+ */
+ anv_shader_bin_unref(device, bin);
+
+ *kernel_out = bin->kernel.offset;
+ *(const struct brw_stage_prog_data **)prog_data_out =
+ anv_shader_bin_get_prog_data(bin);
+
+ return true;
+}
+
+static void
+upload_blorp_shader(struct blorp_context *blorp,
+ const void *key, uint32_t key_size,
+ const void *kernel, uint32_t kernel_size,
+ const void *prog_data, uint32_t prog_data_size,
+ uint32_t *kernel_out, void *prog_data_out)
+{
+ struct anv_device *device = blorp->driver_ctx;
+
+ /* The blorp cache must be a real cache */
+ assert(device->blorp_shader_cache.cache);
+
+ struct anv_pipeline_bind_map bind_map = {
+ .surface_count = 0,
+ .sampler_count = 0,
+ };
+
+ struct anv_shader_bin *bin =
+ anv_pipeline_cache_upload_kernel(&device->blorp_shader_cache,
+ key, key_size, kernel, kernel_size,
+ prog_data, prog_data_size, &bind_map);
+
+ /* The cache already has a reference and it's not going anywhere so there
+ * is no need to hold a second reference.
+ */
+ anv_shader_bin_unref(device, bin);
+
+ *kernel_out = bin->kernel.offset;
+ *(const struct brw_stage_prog_data **)prog_data_out =
+ anv_shader_bin_get_prog_data(bin);
+}
+
+void
+anv_device_init_blorp(struct anv_device *device)
+{
+ anv_pipeline_cache_init(&device->blorp_shader_cache, device, true);
+ blorp_init(&device->blorp, device, &device->isl_dev);
+ device->blorp.compiler = device->instance->physicalDevice.compiler;
+ device->blorp.mocs.tex = device->default_mocs;
+ device->blorp.mocs.rb = device->default_mocs;
+ device->blorp.mocs.vb = device->default_mocs;
+ device->blorp.lookup_shader = lookup_blorp_shader;
+ device->blorp.upload_shader = upload_blorp_shader;
+ switch (device->info.gen) {
+ case 7:
+ if (device->info.is_haswell) {
+ device->blorp.exec = gen75_blorp_exec;
+ } else {
+ device->blorp.exec = gen7_blorp_exec;
+ }
+ break;
+ case 8:
+ device->blorp.exec = gen8_blorp_exec;
+ break;
+ case 9:
+ device->blorp.exec = gen9_blorp_exec;
+ break;
+ default:
+ unreachable("Unknown hardware generation");
+ }
+}
+
+void
+anv_device_finish_blorp(struct anv_device *device)
+{
+ blorp_finish(&device->blorp);
+ anv_pipeline_cache_finish(&device->blorp_shader_cache);
+}
--- /dev/null
+/*
+ * Copyright © 2016 Intel Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice (including the next
+ * paragraph) shall be included in all copies or substantial portions of the
+ * Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
+ * IN THE SOFTWARE.
+ */
+
+#include <assert.h>
+
+#include "anv_private.h"
+#include "genX_multisample.h"
+
+/* These are defined in anv_private.h and blorp_genX_exec.h */
+#undef __gen_address_type
+#undef __gen_user_data
+#undef __gen_combine_address
+
+#include "common/gen_l3_config.h"
+#include "blorp/blorp_genX_exec.h"
+
+static void *
+blorp_emit_dwords(struct blorp_batch *batch, unsigned n)
+{
+ struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
+ return anv_batch_emit_dwords(&cmd_buffer->batch, n);
+}
+
+static uint64_t
+blorp_emit_reloc(struct blorp_batch *batch,
+ void *location, struct blorp_address address, uint32_t delta)
+{
+ struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
+ assert(cmd_buffer->batch.start <= location &&
+ location < cmd_buffer->batch.end);
+ return anv_batch_emit_reloc(&cmd_buffer->batch, location,
+ address.buffer, address.offset + delta);
+}
+
+static void
+blorp_surface_reloc(struct blorp_batch *batch, uint32_t ss_offset,
+ struct blorp_address address, uint32_t delta)
+{
+ struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
+ anv_reloc_list_add(&cmd_buffer->surface_relocs, &cmd_buffer->pool->alloc,
+ ss_offset, address.buffer, address.offset + delta);
+}
+
+static void *
+blorp_alloc_dynamic_state(struct blorp_batch *batch,
+ enum aub_state_struct_type type,
+ uint32_t size,
+ uint32_t alignment,
+ uint32_t *offset)
+{
+ struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
+
+ struct anv_state state =
+ anv_cmd_buffer_alloc_dynamic_state(cmd_buffer, size, alignment);
+
+ *offset = state.offset;
+ return state.map;
+}
+
+static void
+blorp_alloc_binding_table(struct blorp_batch *batch, unsigned num_entries,
+ unsigned state_size, unsigned state_alignment,
+ uint32_t *bt_offset,
+ uint32_t *surface_offsets, void **surface_maps)
+{
+ struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
+
+ uint32_t state_offset;
+ struct anv_state bt_state =
+ anv_cmd_buffer_alloc_binding_table(cmd_buffer, num_entries,
+ &state_offset);
+ if (bt_state.map == NULL) {
+ /* We ran out of space. Grab a new binding table block. */
+ VkResult result = anv_cmd_buffer_new_binding_table_block(cmd_buffer);
+ assert(result == VK_SUCCESS);
+
+ /* Re-emit state base addresses so we get the new surface state base
+ * address before we start emitting binding tables etc.
+ */
+ anv_cmd_buffer_emit_state_base_address(cmd_buffer);
+
+ bt_state = anv_cmd_buffer_alloc_binding_table(cmd_buffer, num_entries,
+ &state_offset);
+ assert(bt_state.map != NULL);
+ }
+
+ uint32_t *bt_map = bt_state.map;
+ *bt_offset = bt_state.offset;
+
+ for (unsigned i = 0; i < num_entries; i++) {
+ struct anv_state surface_state =
+ anv_cmd_buffer_alloc_surface_state(cmd_buffer);
+ bt_map[i] = surface_state.offset + state_offset;
+ surface_offsets[i] = surface_state.offset;
+ surface_maps[i] = surface_state.map;
+ }
+}
+
+static void *
+blorp_alloc_vertex_buffer(struct blorp_batch *batch, uint32_t size,
+ struct blorp_address *addr)
+{
+ struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
+ struct anv_state vb_state =
+ anv_cmd_buffer_alloc_dynamic_state(cmd_buffer, size, 16);
+
+ *addr = (struct blorp_address) {
+ .buffer = &cmd_buffer->device->dynamic_state_block_pool.bo,
+ .offset = vb_state.offset,
+ };
+
+ return vb_state.map;
+}
+
+static void
+blorp_emit_urb_config(struct blorp_batch *batch, unsigned vs_entry_size)
+{
+ struct anv_device *device = batch->blorp->driver_ctx;
+ struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
+
+ genX(emit_urb_setup)(device, &cmd_buffer->batch,
+ VK_SHADER_STAGE_VERTEX_BIT |
+ VK_SHADER_STAGE_FRAGMENT_BIT,
+ vs_entry_size, 0,
+ cmd_buffer->state.current_l3_config);
+}
+
+static void
+blorp_emit_3dstate_multisample(struct blorp_batch *batch, unsigned samples)
+{
+ blorp_emit(batch, GENX(3DSTATE_MULTISAMPLE), ms) {
+ ms.NumberofMultisamples = __builtin_ffs(samples) - 1;
+
+#if GEN_GEN >= 8
+ /* The PRM says that this bit is valid only for DX9:
+ *
+ * SW can choose to set this bit only for DX9 API. DX10/OGL API's
+ * should not have any effect by setting or not setting this bit.
+ */
+ ms.PixelPositionOffsetEnable = false;
+ ms.PixelLocation = CENTER;
+#else
+ ms.PixelLocation = PIXLOC_CENTER;
+
+ switch (samples) {
+ case 1:
+ SAMPLE_POS_1X(ms.Sample);
+ break;
+ case 2:
+ SAMPLE_POS_2X(ms.Sample);
+ break;
+ case 4:
+ SAMPLE_POS_4X(ms.Sample);
+ break;
+ case 8:
+ SAMPLE_POS_8X(ms.Sample);
+ break;
+ default:
+ break;
+ }
+#endif
+ }
+}
+
+void genX(blorp_exec)(struct blorp_batch *batch,
+ const struct blorp_params *params);
+
+void
+genX(blorp_exec)(struct blorp_batch *batch,
+ const struct blorp_params *params)
+{
+ struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
+
+ if (!cmd_buffer->state.current_l3_config) {
+ const struct gen_l3_config *cfg =
+ gen_get_default_l3_config(&cmd_buffer->device->info);
+ genX(cmd_buffer_config_l3)(cmd_buffer, cfg);
+ }
+
+ genX(cmd_buffer_apply_pipe_flushes)(cmd_buffer);
+
+ if (cmd_buffer->state.current_pipeline != _3D) {
+#if GEN_GEN <= 7
+ /* From "BXML » GT » MI » vol1a GPU Overview » [Instruction]
+ * PIPELINE_SELECT [DevBWR+]":
+ *
+ * Project: DEVSNB+
+ *
+ * Software must ensure all the write caches are flushed through a
+ * stalling PIPE_CONTROL command followed by another PIPE_CONTROL
+ * command to invalidate read only caches prior to programming
+ * MI_PIPELINE_SELECT command to change the Pipeline Select Mode.
+ */
+ blorp_emit(batch, GENX(PIPE_CONTROL), pc) {
+ pc.RenderTargetCacheFlushEnable = true;
+ pc.DepthCacheFlushEnable = true;
+ pc.DCFlushEnable = true;
+ pc.PostSyncOperation = NoWrite;
+ pc.CommandStreamerStallEnable = true;
+ }
+
+ blorp_emit(batch, GENX(PIPE_CONTROL), pc) {
+ pc.TextureCacheInvalidationEnable = true;
+ pc.ConstantCacheInvalidationEnable = true;
+ pc.StateCacheInvalidationEnable = true;
+ pc.InstructionCacheInvalidateEnable = true;
+ pc.PostSyncOperation = NoWrite;
+ }
+#endif
+
+ blorp_emit(batch, GENX(PIPELINE_SELECT), ps) {
+#if GEN_GEN >= 9
+ ps.MaskBits = 3;
+#endif
+ ps.PipelineSelection = _3D;
+ }
+
+ cmd_buffer->state.current_pipeline = _3D;
+ }
+
+ blorp_exec(batch, params);
+
+ /* BLORP sets DRAWING_RECTANGLE but we always want it set to the maximum.
+ * Since we set it once at driver init and never again, we have to set it
+ * back after invoking blorp.
+ *
+ * TODO: BLORP should assume a max drawing rectangle
+ */
+ blorp_emit(batch, GENX(3DSTATE_DRAWING_RECTANGLE), rect) {
+ rect.ClippedDrawingRectangleYMin = 0;
+ rect.ClippedDrawingRectangleXMin = 0;
+ rect.ClippedDrawingRectangleYMax = UINT16_MAX;
+ rect.ClippedDrawingRectangleXMax = UINT16_MAX;
+ rect.DrawingRectangleOriginY = 0;
+ rect.DrawingRectangleOriginX = 0;
+ }
+
+ cmd_buffer->state.vb_dirty = ~0;
+ cmd_buffer->state.dirty = ~0;
+ cmd_buffer->state.push_constants_dirty = ~0;
+}