src/gallium/drivers/iris/iris_batch.c

   1 /*
   2  * Copyright © 2017 Intel Corporation
   3  *
   4  * Permission is hereby granted, free of charge, to any person obtaining a
   5  * copy of this software and associated documentation files (the
   6  * "Software"), to deal in the Software without restriction, including
   7  * without limitation the rights to use, copy, modify, merge, publish,
   8  * distribute, sublicense, and/or sell copies of the Software, and to
   9  * permit persons to whom the Software is furnished to do so, subject to
  10  * the following conditions:
  11  *
  12  * The above copyright notice and this permission notice (including the
  13  * next paragraph) shall be included in all copies or substantial portions
  14  * of the Software.
  15  *
  16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
  17  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  18  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
  19  * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
  20  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
  21  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
  22  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  23  */
  24
  25 #include "iris_batch.h"
  26 #include "iris_bufmgr.h"
  27 #include "iris_context.h"
  28 #include "common/gen_decoder.h"
  29
  30 #include "drm-uapi/i915_drm.h"
  31
  32 #include "util/hash_table.h"
  33 #include "main/macros.h"
  34
  35 #include <errno.h>
  36 #include <xf86drm.h>
  37
  38 #define FILE_DEBUG_FLAG DEBUG_BUFMGR
  39
  40 /**
  41  * Target sizes of the batch and state buffers.  We create the initial
  42  * buffers at these sizes, and flush when they're nearly full.  If we
  43  * underestimate how close we are to the end, and suddenly need more space
  44  * in the middle of a draw, we can grow the buffers, and finish the draw.
  45  * At that point, we'll be over our target size, so the next operation
  46  * should flush.  Each time we flush the batch, we recreate both buffers
  47  * at the original target size, so it doesn't grow without bound.
  48  */
  49 #define BATCH_SZ (20 * 1024)
  50 #define STATE_SZ (18 * 1024)
  51
  52 static void decode_batch(struct iris_batch *batch);
  53
  54 static void
  55 iris_batch_reset(struct iris_batch *batch);
  56
  57 UNUSED static void
  58 dump_validation_list(struct iris_batch *batch)
  59 {
  60    fprintf(stderr, "Validation list (length %d):\n", batch->exec_count);
  61
  62    for (int i = 0; i < batch->exec_count; i++) {
  63       assert(batch->validation_list[i].handle ==
  64              batch->exec_bos[i]->gem_handle);
  65       fprintf(stderr, "[%d] = %d %s %p\n", i,
  66               batch->validation_list[i].handle,
  67               batch->exec_bos[i]->name,
  68               batch->exec_bos[i]);
  69    }
  70 }
  71
  72 static bool
  73 uint_key_compare(const void *a, const void *b)
  74 {
  75    return a == b;
  76 }
  77
  78 static uint32_t
  79 uint_key_hash(const void *key)
  80 {
  81    return (uintptr_t) key;
  82 }
  83
  84 static void
  85 init_reloc_list(struct iris_reloc_list *rlist, int count)
  86 {
  87    rlist->reloc_count = 0;
  88    rlist->reloc_array_size = count;
  89    rlist->relocs = malloc(rlist->reloc_array_size *
  90                           sizeof(struct drm_i915_gem_relocation_entry));
  91 }
  92
  93 static void
  94 create_batch_buffer(struct iris_bufmgr *bufmgr,
  95                     struct iris_batch_buffer *buf,
  96                     const char *name, unsigned size)
  97 {
  98    buf->bo = iris_bo_alloc(bufmgr, name, size, 4096);
  99    buf->bo->kflags |= EXEC_OBJECT_CAPTURE;
 100    buf->map = iris_bo_map(NULL, buf->bo, MAP_READ | MAP_WRITE);
 101    buf->map_next = buf->map;
 102 }
 103
 104 void
 105 iris_init_batch(struct iris_batch *batch,
 106                 struct iris_screen *screen,
 107                 struct pipe_debug_callback *dbg,
 108                 uint8_t ring)
 109 {
 110    batch->screen = screen;
 111    batch->dbg = dbg;
 112
 113    /* ring should be one of I915_EXEC_RENDER, I915_EXEC_BLT, etc. */
 114    assert((ring & ~I915_EXEC_RING_MASK) == 0);
 115    assert(util_bitcount(ring) == 1);
 116    batch->ring = ring;
 117
 118    init_reloc_list(&batch->cmdbuf.relocs, 256);
 119    init_reloc_list(&batch->statebuf.relocs, 256);
 120
 121    batch->exec_count = 0;
 122    batch->exec_array_size = 100;
 123    batch->exec_bos =
 124       malloc(batch->exec_array_size * sizeof(batch->exec_bos[0]));
 125    batch->validation_list =
 126       malloc(batch->exec_array_size * sizeof(batch->validation_list[0]));
 127
 128    if (unlikely(INTEL_DEBUG)) {
 129       batch->state_sizes =
 130          _mesa_hash_table_create(NULL, uint_key_hash, uint_key_compare);
 131    }
 132
 133    iris_batch_reset(batch);
 134 }
 135
 136 #define READ_ONCE(x) (*(volatile __typeof__(x) *)&(x))
 137
 138 static unsigned
 139 add_exec_bo(struct iris_batch *batch, struct iris_bo *bo)
 140 {
 141    unsigned index = READ_ONCE(bo->index);
 142
 143    if (index < batch->exec_count && batch->exec_bos[index] == bo)
 144       return index;
 145
 146    /* May have been shared between multiple active batches */
 147    for (index = 0; index < batch->exec_count; index++) {
 148       if (batch->exec_bos[index] == bo)
 149          return index;
 150    }
 151
 152    iris_bo_reference(bo);
 153
 154    if (batch->exec_count == batch->exec_array_size) {
 155       batch->exec_array_size *= 2;
 156       batch->exec_bos =
 157          realloc(batch->exec_bos,
 158                  batch->exec_array_size * sizeof(batch->exec_bos[0]));
 159       batch->validation_list =
 160          realloc(batch->validation_list,
 161                  batch->exec_array_size * sizeof(batch->validation_list[0]));
 162    }
 163
 164    batch->validation_list[batch->exec_count] =
 165       (struct drm_i915_gem_exec_object2) {
 166          .handle = bo->gem_handle,
 167          .alignment = bo->align,
 168          .offset = bo->gtt_offset,
 169          .flags = bo->kflags,
 170       };
 171
 172    bo->index = batch->exec_count;
 173    batch->exec_bos[batch->exec_count] = bo;
 174    batch->aperture_space += bo->size;
 175
 176    return batch->exec_count++;
 177 }
 178
 179 static void
 180 iris_batch_reset(struct iris_batch *batch)
 181 {
 182    struct iris_screen *screen = batch->screen;
 183    struct iris_bufmgr *bufmgr = screen->bufmgr;
 184
 185    if (batch->last_cmd_bo != NULL) {
 186       iris_bo_unreference(batch->last_cmd_bo);
 187       batch->last_cmd_bo = NULL;
 188    }
 189    batch->last_cmd_bo = batch->cmdbuf.bo;
 190
 191    create_batch_buffer(bufmgr, &batch->cmdbuf, "command buffer", BATCH_SZ);
 192    create_batch_buffer(bufmgr, &batch->statebuf, "state buffer", STATE_SZ);
 193
 194    /* Avoid making 0 a valid state offset - otherwise the decoder will try
 195     * and decode data when we use offset 0 as a null pointer.
 196     */
 197    batch->statebuf.map_next += 1;
 198
 199    add_exec_bo(batch, batch->cmdbuf.bo);
 200    assert(batch->cmdbuf.bo->index == 0);
 201
 202    if (batch->state_sizes)
 203       _mesa_hash_table_clear(batch->state_sizes, NULL);
 204 }
 205
 206 static void
 207 iris_batch_reset_and_clear_render_cache(struct iris_batch *batch)
 208 {
 209    iris_batch_reset(batch);
 210    // XXX: iris_render_cache_set_clear(batch);
 211 }
 212
 213 static void
 214 free_batch_buffer(struct iris_batch_buffer *buf)
 215 {
 216    iris_bo_unreference(buf->bo);
 217    buf->bo = NULL;
 218    buf->map = NULL;
 219    buf->map_next = NULL;
 220
 221    free(buf->relocs.relocs);
 222    buf->relocs.relocs = NULL;
 223    buf->relocs.reloc_array_size = 0;
 224 }
 225
 226 void
 227 iris_batch_free(struct iris_batch *batch)
 228 {
 229    for (int i = 0; i < batch->exec_count; i++) {
 230       iris_bo_unreference(batch->exec_bos[i]);
 231    }
 232    free(batch->exec_bos);
 233    free(batch->validation_list);
 234    free_batch_buffer(&batch->cmdbuf);
 235    free_batch_buffer(&batch->statebuf);
 236
 237    iris_bo_unreference(batch->last_cmd_bo);
 238
 239    if (batch->state_sizes)
 240       _mesa_hash_table_destroy(batch->state_sizes, NULL);
 241 }
 242
 243 /**
 244  * Finish copying the old batch/state buffer's contents to the new one
 245  * after we tried to "grow" the buffer in an earlier operation.
 246  */
 247 static void
 248 finish_growing_bos(struct iris_batch_buffer *buf)
 249 {
 250    struct iris_bo *old_bo = buf->partial_bo;
 251    if (!old_bo)
 252       return;
 253
 254    void *old_map = old_bo->map_cpu ? old_bo->map_cpu : old_bo->map_wc;
 255    memcpy(buf->map, old_map, buf->partial_bytes);
 256
 257    buf->partial_bo = NULL;
 258    buf->partial_bytes = 0;
 259
 260    iris_bo_unreference(old_bo);
 261 }
 262
 263 static unsigned
 264 buffer_bytes_used(struct iris_batch_buffer *buf)
 265 {
 266    return buf->map_next - buf->map;
 267 }
 268
 269 /**
 270  * Grow either the batch or state buffer to a new larger size.
 271  *
 272  * We can't actually grow buffers, so we allocate a new one, copy over
 273  * the existing contents, and update our lists to refer to the new one.
 274  *
 275  * Note that this is only temporary - each new batch recreates the buffers
 276  * at their original target size (BATCH_SZ or STATE_SZ).
 277  */
 278 static void
 279 grow_buffer(struct iris_batch *batch,
 280             struct iris_batch_buffer *buf,
 281             unsigned new_size)
 282 {
 283    struct iris_bufmgr *bufmgr = batch->screen->bufmgr;
 284    struct iris_bo *bo = buf->bo;
 285
 286    perf_debug(batch->dbg, "Growing %s - ran out of space\n", bo->name);
 287
 288    if (buf->partial_bo) {
 289       /* We've already grown once, and now we need to do it again.
 290        * Finish our last grow operation so we can start a new one.
 291        * This should basically never happen.
 292        */
 293       perf_debug(batch->dbg, "Had to grow multiple times");
 294       finish_growing_bos(buf);
 295    }
 296
 297    const unsigned existing_bytes = buffer_bytes_used(buf);
 298
 299    struct iris_bo *new_bo =
 300       iris_bo_alloc(bufmgr, bo->name, new_size, bo->align);
 301
 302    buf->map = iris_bo_map(NULL, new_bo, MAP_READ | MAP_WRITE);
 303    buf->map_next = buf->map + existing_bytes;
 304
 305    /* Try to put the new BO at the same GTT offset as the old BO (which
 306     * we're throwing away, so it doesn't need to be there).
 307     *
 308     * This guarantees that our relocations continue to work: values we've
 309     * already written into the buffer, values we're going to write into the
 310     * buffer, and the validation/relocation lists all will match.
 311     *
 312     * Also preserve kflags for EXEC_OBJECT_CAPTURE.
 313     */
 314    new_bo->gtt_offset = bo->gtt_offset;
 315    new_bo->index = bo->index;
 316    new_bo->kflags = bo->kflags;
 317
 318    /* Batch/state buffers are per-context, and if we've run out of space,
 319     * we must have actually used them before, so...they will be in the list.
 320     */
 321    assert(bo->index < batch->exec_count);
 322    assert(batch->exec_bos[bo->index] == bo);
 323
 324    /* Update the validation list to use the new BO. */
 325    batch->exec_bos[bo->index] = new_bo;
 326    batch->validation_list[bo->index].handle = new_bo->gem_handle;
 327
 328    /* Exchange the two BOs...without breaking pointers to the old BO.
 329     *
 330     * Consider this scenario:
 331     *
 332     * 1. Somebody calls iris_state_batch() to get a region of memory, and
 333     *    and then creates a iris_address pointing to iris->batch.state.bo.
 334     * 2. They then call iris_state_batch() a second time, which happens to
 335     *    grow and replace the state buffer.  They then try to emit a
 336     *    relocation to their first section of memory.
 337     *
 338     * If we replace the iris->batch.state.bo pointer at step 2, we would
 339     * break the address created in step 1.  They'd have a pointer to the
 340     * old destroyed BO.  Emitting a relocation would add this dead BO to
 341     * the validation list...causing /both/ statebuffers to be in the list,
 342     * and all kinds of disasters.
 343     *
 344     * This is not a contrived case - BLORP vertex data upload hits this.
 345     *
 346     * There are worse scenarios too.  Fences for GL sync objects reference
 347     * iris->batch.batch.bo.  If we replaced the batch pointer when growing,
 348     * we'd need to chase down every fence and update it to point to the
 349     * new BO.  Otherwise, it would refer to a "batch" that never actually
 350     * gets submitted, and would fail to trigger.
 351     *
 352     * To work around both of these issues, we transmutate the buffers in
 353     * place, making the existing struct iris_bo represent the new buffer,
 354     * and "new_bo" represent the old BO.  This is highly unusual, but it
 355     * seems like a necessary evil.
 356     *
 357     * We also defer the memcpy of the existing batch's contents.  Callers
 358     * may make multiple iris_state_batch calls, and retain pointers to the
 359     * old BO's map.  We'll perform the memcpy in finish_growing_bo() when
 360     * we finally submit the batch, at which point we've finished uploading
 361     * state, and nobody should have any old references anymore.
 362     *
 363     * To do that, we keep a reference to the old BO in grow->partial_bo,
 364     * and store the number of bytes to copy in grow->partial_bytes.  We
 365     * can monkey with the refcounts directly without atomics because these
 366     * are per-context BOs and they can only be touched by this thread.
 367     */
 368    assert(new_bo->refcount == 1);
 369    new_bo->refcount = bo->refcount;
 370    bo->refcount = 1;
 371
 372    struct iris_bo tmp;
 373    memcpy(&tmp, bo, sizeof(struct iris_bo));
 374    memcpy(bo, new_bo, sizeof(struct iris_bo));
 375    memcpy(new_bo, &tmp, sizeof(struct iris_bo));
 376
 377    buf->partial_bo = new_bo; /* the one reference of the OLD bo */
 378    buf->partial_bytes = existing_bytes;
 379 }
 380
 381 static void
 382 require_buffer_space(struct iris_batch *batch,
 383                      struct iris_batch_buffer *buf,
 384                      unsigned size,
 385                      unsigned flush_threshold,
 386                      unsigned max_buffer_size)
 387 {
 388    const unsigned required_bytes = buffer_bytes_used(buf) + size;
 389
 390    if (!batch->no_wrap && required_bytes >= flush_threshold) {
 391       iris_batch_flush(batch);
 392    } else if (required_bytes >= buf->bo->size) {
 393       grow_buffer(batch, buf,
 394                   MIN2(buf->bo->size + buf->bo->size / 2, max_buffer_size));
 395       assert(required_bytes < buf->bo->size);
 396    }
 397 }
 398
 399
 400 void
 401 iris_require_command_space(struct iris_batch *batch, unsigned size)
 402 {
 403    require_buffer_space(batch, &batch->cmdbuf, size, BATCH_SZ, MAX_BATCH_SIZE);
 404 }
 405
 406 /**
 407  * Reserve some space in the statebuffer, or flush.
 408  *
 409  * This is used to estimate when we're near the end of the batch,
 410  * so we can flush early.
 411  */
 412 void
 413 iris_require_state_space(struct iris_batch *batch, unsigned size)
 414 {
 415    require_buffer_space(batch, &batch->statebuf, size, STATE_SZ,
 416                         MAX_STATE_SIZE);
 417 }
 418
 419 void
 420 iris_batch_emit(struct iris_batch *batch, const void *data, unsigned size)
 421 {
 422    iris_require_command_space(batch, size);
 423    memcpy(batch->cmdbuf.map_next, data, size);
 424    batch->cmdbuf.map_next += size;
 425 }
 426
 427 /**
 428  * Called from iris_batch_flush before emitting MI_BATCHBUFFER_END and
 429  * sending it off.
 430  *
 431  * This function can emit state (say, to preserve registers that aren't saved
 432  * between batches).
 433  */
 434 static void
 435 iris_finish_batch(struct iris_batch *batch)
 436 {
 437    batch->no_wrap = true;
 438
 439    /* Mark the end of the buffer. */
 440    const uint32_t MI_BATCH_BUFFER_END = (0xA << 23);
 441    iris_batch_emit(batch, &MI_BATCH_BUFFER_END, sizeof(uint32_t));
 442
 443    batch->no_wrap = false;
 444 }
 445
 446 static int
 447 submit_batch(struct iris_batch *batch, int in_fence_fd, int *out_fence_fd)
 448 {
 449    iris_bo_unmap(batch->cmdbuf.bo);
 450    iris_bo_unmap(batch->statebuf.bo);
 451
 452    /* The requirement for using I915_EXEC_NO_RELOC are:
 453     *
 454     *   The addresses written in the objects must match the corresponding
 455     *   reloc.gtt_offset which in turn must match the corresponding
 456     *   execobject.offset.
 457     *
 458     *   Any render targets written to in the batch must be flagged with
 459     *   EXEC_OBJECT_WRITE.
 460     *
 461     *   To avoid stalling, execobject.offset should match the current
 462     *   address of that object within the active context.
 463     */
 464    /* Set statebuffer relocations */
 465    const unsigned state_index = batch->statebuf.bo->index;
 466    if (state_index < batch->exec_count &&
 467        batch->exec_bos[state_index] == batch->statebuf.bo) {
 468       struct drm_i915_gem_exec_object2 *entry =
 469          &batch->validation_list[state_index];
 470       assert(entry->handle == batch->statebuf.bo->gem_handle);
 471       entry->relocation_count = batch->statebuf.relocs.reloc_count;
 472       entry->relocs_ptr = (uintptr_t) batch->statebuf.relocs.relocs;
 473    }
 474
 475    /* Set batchbuffer relocations */
 476    struct drm_i915_gem_exec_object2 *entry = &batch->validation_list[0];
 477    assert(entry->handle == batch->cmdbuf.bo->gem_handle);
 478    entry->relocation_count = batch->cmdbuf.relocs.reloc_count;
 479    entry->relocs_ptr = (uintptr_t) batch->cmdbuf.relocs.relocs;
 480
 481    struct drm_i915_gem_execbuffer2 execbuf = {
 482       .buffers_ptr = (uintptr_t) batch->validation_list,
 483       .buffer_count = batch->exec_count,
 484       .batch_start_offset = 0,
 485       .batch_len = buffer_bytes_used(&batch->cmdbuf),
 486       .flags = batch->ring |
 487                I915_EXEC_NO_RELOC |
 488                I915_EXEC_BATCH_FIRST |
 489                I915_EXEC_HANDLE_LUT,
 490       .rsvd1 = batch->hw_ctx_id, /* rsvd1 is actually the context ID */
 491    };
 492
 493    unsigned long cmd = DRM_IOCTL_I915_GEM_EXECBUFFER2;
 494
 495    if (in_fence_fd != -1) {
 496       execbuf.rsvd2 = in_fence_fd;
 497       execbuf.flags |= I915_EXEC_FENCE_IN;
 498    }
 499
 500    if (out_fence_fd != NULL) {
 501       cmd = DRM_IOCTL_I915_GEM_EXECBUFFER2_WR;
 502       *out_fence_fd = -1;
 503       execbuf.flags |= I915_EXEC_FENCE_OUT;
 504    }
 505
 506 #if 0
 507    int ret = drm_ioctl(batch->screen->fd, cmd, &execbuf);
 508    if (ret != 0)
 509       ret = -errno;
 510 #else
 511    int ret = 0;
 512    fprintf(stderr, "execbuf disabled for now\n");
 513 #endif
 514
 515    for (int i = 0; i < batch->exec_count; i++) {
 516       struct iris_bo *bo = batch->exec_bos[i];
 517
 518       bo->idle = false;
 519       bo->index = -1;
 520
 521       /* Update iris_bo::gtt_offset */
 522       if (batch->validation_list[i].offset != bo->gtt_offset) {
 523          DBG("BO %d migrated: 0x%" PRIx64 " -> 0x%llx\n",
 524              bo->gem_handle, bo->gtt_offset,
 525              batch->validation_list[i].offset);
 526          bo->gtt_offset = batch->validation_list[i].offset;
 527       }
 528    }
 529
 530    if (ret == 0 && out_fence_fd != NULL)
 531       *out_fence_fd = execbuf.rsvd2 >> 32;
 532
 533    return ret;
 534 }
 535
 536 /**
 537  * The in_fence_fd is ignored if -1.  Otherwise this function takes ownership
 538  * of the fd.
 539  *
 540  * The out_fence_fd is ignored if NULL. Otherwise, the caller takes ownership
 541  * of the returned fd.
 542  */
 543 int
 544 _iris_batch_flush_fence(struct iris_batch *batch,
 545                         int in_fence_fd, int *out_fence_fd,
 546                         const char *file, int line)
 547 {
 548    if (buffer_bytes_used(&batch->cmdbuf) == 0)
 549       return 0;
 550
 551    /* Check that we didn't just wrap our batchbuffer at a bad time. */
 552    assert(!batch->no_wrap);
 553
 554    iris_finish_batch(batch);
 555
 556    if (unlikely(INTEL_DEBUG & (DEBUG_BATCH | DEBUG_SUBMIT))) {
 557       int bytes_for_commands = buffer_bytes_used(&batch->cmdbuf);
 558       int bytes_for_state = buffer_bytes_used(&batch->statebuf);
 559       fprintf(stderr, "%19s:%-3d: Batchbuffer flush with %5db (%0.1f%%) (pkt),"
 560               " %5db (%0.1f%%) (state), %4d BOs (%0.1fMb aperture),"
 561               " %4d batch relocs, %4d state relocs\n", file, line,
 562               bytes_for_commands, 100.0f * bytes_for_commands / BATCH_SZ,
 563               bytes_for_state, 100.0f * bytes_for_state / STATE_SZ,
 564               batch->exec_count,
 565               (float) batch->aperture_space / (1024 * 1024),
 566               batch->cmdbuf.relocs.reloc_count,
 567               batch->statebuf.relocs.reloc_count);
 568    }
 569
 570    int ret = submit_batch(batch, in_fence_fd, out_fence_fd);
 571    if (ret < 0)
 572       return ret;
 573
 574    //throttle(iris);
 575
 576    if (unlikely(INTEL_DEBUG & DEBUG_BATCH))
 577       decode_batch(batch);
 578
 579    //if (iris->ctx.Const.ResetStrategy == GL_LOSE_CONTEXT_ON_RESET_ARB)
 580       //iris_check_for_reset(ice);
 581
 582    if (unlikely(INTEL_DEBUG & DEBUG_SYNC)) {
 583       dbg_printf("waiting for idle\n");
 584       iris_bo_wait_rendering(batch->cmdbuf.bo);
 585    }
 586
 587    /* Clean up after the batch we submitted and prepare for a new one. */
 588    for (int i = 0; i < batch->exec_count; i++) {
 589       iris_bo_unreference(batch->exec_bos[i]);
 590       batch->exec_bos[i] = NULL;
 591    }
 592    batch->cmdbuf.relocs.reloc_count = 0;
 593    batch->statebuf.relocs.reloc_count = 0;
 594    batch->exec_count = 0;
 595    batch->aperture_space = 0;
 596
 597    iris_bo_unreference(batch->statebuf.bo);
 598
 599    /* Start a new batch buffer. */
 600    iris_batch_reset_and_clear_render_cache(batch);
 601
 602    return 0;
 603 }
 604
 605 bool
 606 iris_batch_references(struct iris_batch *batch, struct iris_bo *bo)
 607 {
 608    unsigned index = READ_ONCE(bo->index);
 609    if (index < batch->exec_count && batch->exec_bos[index] == bo)
 610       return true;
 611
 612    for (int i = 0; i < batch->exec_count; i++) {
 613       if (batch->exec_bos[i] == bo)
 614          return true;
 615    }
 616    return false;
 617 }
 618
 619 /*  This is the only way buffers get added to the validate list.
 620  */
 621 static uint64_t
 622 emit_reloc(struct iris_batch *batch,
 623            struct iris_reloc_list *rlist, uint32_t offset,
 624            struct iris_bo *target, uint32_t target_offset,
 625            unsigned int reloc_flags)
 626 {
 627    assert(target != NULL);
 628
 629    if (rlist->reloc_count == rlist->reloc_array_size) {
 630       rlist->reloc_array_size *= 2;
 631       rlist->relocs = realloc(rlist->relocs,
 632                               rlist->reloc_array_size *
 633                               sizeof(struct drm_i915_gem_relocation_entry));
 634    }
 635
 636    unsigned int index = add_exec_bo(batch, target);
 637    struct drm_i915_gem_exec_object2 *entry = &batch->validation_list[index];
 638
 639    rlist->relocs[rlist->reloc_count++] =
 640       (struct drm_i915_gem_relocation_entry) {
 641          .offset = offset,
 642          .delta = target_offset,
 643          .target_handle = index,
 644          .presumed_offset = entry->offset,
 645       };
 646
 647    /* Using the old buffer offset, write in what the right data would be, in
 648     * case the buffer doesn't move and we can short-circuit the relocation
 649     * processing in the kernel
 650     */
 651    return entry->offset + target_offset;
 652 }
 653
 654 uint64_t
 655 iris_batch_reloc(struct iris_batch *batch, uint32_t batch_offset,
 656                  struct iris_bo *target, uint32_t target_offset,
 657                  unsigned int reloc_flags)
 658 {
 659    assert(batch_offset <= batch->cmdbuf.bo->size - sizeof(uint32_t));
 660
 661    return emit_reloc(batch, &batch->cmdbuf.relocs, batch_offset,
 662                      target, target_offset, reloc_flags);
 663 }
 664
 665 uint64_t
 666 iris_state_reloc(struct iris_batch *batch, uint32_t state_offset,
 667                  struct iris_bo *target, uint32_t target_offset,
 668                  unsigned int reloc_flags)
 669 {
 670    assert(state_offset <= batch->statebuf.bo->size - sizeof(uint32_t));
 671
 672    return emit_reloc(batch, &batch->statebuf.relocs, state_offset,
 673                      target, target_offset, reloc_flags);
 674 }
 675
 676
 677 static uint32_t
 678 iris_state_entry_size(struct iris_batch *batch, uint32_t offset)
 679 {
 680    struct hash_entry *entry =
 681       _mesa_hash_table_search(batch->state_sizes, (void *)(uintptr_t) offset);
 682    return entry ? (uintptr_t) entry->data : 0;
 683 }
 684
 685 /**
 686  * Allocates a block of space in the batchbuffer for indirect state.
 687  */
 688 void *
 689 iris_alloc_state(struct iris_batch *batch,
 690                  int size, int alignment,
 691                  uint32_t *out_offset)
 692 {
 693    assert(size < batch->statebuf.bo->size);
 694
 695    const unsigned existing_bytes = buffer_bytes_used(&batch->statebuf);
 696    unsigned aligned_size =
 697       ALIGN(existing_bytes, alignment) - existing_bytes + size;
 698
 699    require_buffer_space(batch, &batch->statebuf, aligned_size,
 700                         STATE_SZ, MAX_STATE_SIZE);
 701
 702    unsigned offset = ALIGN(buffer_bytes_used(&batch->statebuf), alignment);
 703
 704    if (unlikely(batch->state_sizes)) {
 705       _mesa_hash_table_insert(batch->state_sizes,
 706                               (void *) (uintptr_t) offset,
 707                               (void *) (uintptr_t) size);
 708    }
 709
 710    batch->statebuf.map_next += aligned_size;
 711
 712    *out_offset = offset;
 713    return batch->statebuf.map_next;
 714 }
 715
 716 uint32_t
 717 iris_emit_state(struct iris_batch *batch,
 718                 const void *data,
 719                 int size, int alignment)
 720 {
 721    uint32_t out_offset;
 722    void *dest = iris_alloc_state(batch, size, alignment, &out_offset);
 723    memcpy(dest, data, size);
 724    return out_offset;
 725 }
 726
 727 static void
 728 decode_batch(struct iris_batch *batch)
 729 {
 730    // XXX: decode the batch
 731 }