src/panfrost/lib/pan_device.h

   1 /**************************************************************************
   2  *
   3  * Copyright 2018-2019 Alyssa Rosenzweig
   4  * Copyright 2018-2019 Collabora, Ltd.
   5  * Copyright © 2015 Intel Corporation
   6  * All Rights Reserved.
   7  *
   8  * Permission is hereby granted, free of charge, to any person obtaining a
   9  * copy of this software and associated documentation files (the
  10  * "Software"), to deal in the Software without restriction, including
  11  * without limitation the rights to use, copy, modify, merge, publish,
  12  * distribute, sub license, and/or sell copies of the Software, and to
  13  * permit persons to whom the Software is furnished to do so, subject to
  14  * the following conditions:
  15  *
  16  * The above copyright notice and this permission notice (including the
  17  * next paragraph) shall be included in all copies or substantial portions
  18  * of the Software.
  19  *
  20  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
  21  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  22  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
  23  * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
  24  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
  25  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
  26  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  27  *
  28  **************************************************************************/
  29
  30 #ifndef PAN_DEVICE_H
  31 #define PAN_DEVICE_H
  32
  33 #include <xf86drm.h>
  34 #include "renderonly/renderonly.h"
  35 #include "util/u_dynarray.h"
  36 #include "util/bitset.h"
  37 #include "util/list.h"
  38 #include "util/sparse_array.h"
  39
  40 #include <midgard_pack.h>
  41
  42 /* Driver limits */
  43 #define PAN_MAX_CONST_BUFFERS 16
  44
  45 /* Transient slab size. This is a balance between fragmentation against cache
  46  * locality and ease of bookkeeping */
  47
  48 #define TRANSIENT_SLAB_PAGES (16) /* 64kb */
  49 #define TRANSIENT_SLAB_SIZE (4096 * TRANSIENT_SLAB_PAGES)
  50
  51 /* Maximum number of transient slabs so we don't need dynamic arrays. Most
  52  * interesting Mali boards are 4GB RAM max, so if the entire RAM was filled
  53  * with transient slabs, you could never exceed (4GB / TRANSIENT_SLAB_SIZE)
  54  * allocations anyway. By capping, we can use a fixed-size bitset for tracking
  55  * free slabs, eliminating quite a bit of complexity. We can pack the free
  56  * state of 8 slabs into a single byte, so for 128kb transient slabs the bitset
  57  * occupies a cheap 4kb of memory */
  58
  59 #define MAX_TRANSIENT_SLABS (1024*1024 / TRANSIENT_SLAB_PAGES)
  60
  61 /* How many power-of-two levels in the BO cache do we want? 2^12
  62  * minimum chosen as it is the page size that all allocations are
  63  * rounded to */
  64
  65 #define MIN_BO_CACHE_BUCKET (12) /* 2^12 = 4KB */
  66 #define MAX_BO_CACHE_BUCKET (22) /* 2^22 = 4MB */
  67
  68 /* Fencepost problem, hence the off-by-one */
  69 #define NR_BO_CACHE_BUCKETS (MAX_BO_CACHE_BUCKET - MIN_BO_CACHE_BUCKET + 1)
  70
  71 /* Cache for blit shaders. Defined here so they can be cached with the device */
  72
  73 enum pan_blit_type {
  74         PAN_BLIT_FLOAT = 0,
  75         PAN_BLIT_UINT,
  76         PAN_BLIT_INT,
  77         PAN_BLIT_NUM_TYPES,
  78 };
  79
  80 #define PAN_BLIT_NUM_TARGETS (12)
  81
  82 struct pan_blit_shaders {
  83         struct panfrost_bo *bo;
  84         mali_ptr loads[PAN_BLIT_NUM_TARGETS][PAN_BLIT_NUM_TYPES][2];
  85 };
  86
  87 struct panfrost_device {
  88         /* For ralloc */
  89         void *memctx;
  90
  91         int fd;
  92
  93         /* Properties of the GPU in use */
  94         unsigned gpu_id;
  95         unsigned core_count;
  96         unsigned thread_tls_alloc;
  97         unsigned quirks;
  98
  99         /* Bitmask of supported compressed texture formats */
 100         uint32_t compressed_formats;
 101
 102         /* debug flags, see pan_util.h how to interpret */
 103         unsigned debug;
 104
 105         drmVersionPtr kernel_version;
 106
 107         struct renderonly *ro;
 108
 109         pthread_mutex_t bo_map_lock;
 110         struct util_sparse_array bo_map;
 111
 112         struct {
 113                 pthread_mutex_t lock;
 114
 115                 /* List containing all cached BOs sorted in LRU (Least
 116                  * Recently Used) order. This allows us to quickly evict BOs
 117                  * that are more than 1 second old.
 118                  */
 119                 struct list_head lru;
 120
 121                 /* The BO cache is a set of buckets with power-of-two sizes
 122                  * ranging from 2^12 (4096, the page size) to
 123                  * 2^(12 + MAX_BO_CACHE_BUCKETS).
 124                  * Each bucket is a linked list of free panfrost_bo objects. */
 125
 126                 struct list_head buckets[NR_BO_CACHE_BUCKETS];
 127         } bo_cache;
 128
 129         struct pan_blit_shaders blit_shaders;
 130
 131         /* Tiler heap shared across all tiler jobs, allocated against the
 132          * device since there's only a single tiler. Since this is invisible to
 133          * the CPU, it's okay for multiple contexts to reference it
 134          * simultaneously; by keeping on the device struct, we eliminate a
 135          * costly per-context allocation. */
 136
 137         struct panfrost_bo *tiler_heap;
 138 };
 139
 140 void
 141 panfrost_open_device(void *memctx, int fd, struct panfrost_device *dev);
 142
 143 void
 144 panfrost_close_device(struct panfrost_device *dev);
 145
 146 bool
 147 panfrost_supports_compressed_format(struct panfrost_device *dev, unsigned fmt);
 148
 149 static inline struct panfrost_bo *
 150 pan_lookup_bo(struct panfrost_device *dev, uint32_t gem_handle)
 151 {
 152         return util_sparse_array_get(&dev->bo_map, gem_handle);
 153 }
 154
 155 #endif