nvc0: add support for GL_EXT_demote_to_helper_invocation
[mesa.git] / src / amd / common / ac_llvm_util.h
1 /*
2 * Copyright 2016 Bas Nieuwenhuizen
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the
6 * "Software"), to deal in the Software without restriction, including
7 * without limitation the rights to use, copy, modify, merge, publish,
8 * distribute, sub license, and/or sell copies of the Software, and to
9 * permit persons to whom the Software is furnished to do so, subject to
10 * the following conditions:
11 *
12 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
13 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
14 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
15 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
16 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
17 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
18 * USE OR OTHER DEALINGS IN THE SOFTWARE.
19 *
20 * The above copyright notice and this permission notice (including the
21 * next paragraph) shall be included in all copies or substantial portions
22 * of the Software.
23 *
24 */
25
26 #ifndef AC_LLVM_UTIL_H
27 #define AC_LLVM_UTIL_H
28
29 #include <stdbool.h>
30 #include <llvm-c/TargetMachine.h>
31 #include <llvm/Config/llvm-config.h>
32
33 #include "amd_family.h"
34
35 #ifdef __cplusplus
36 extern "C" {
37 #endif
38
39 struct ac_compiler_passes;
40
/* Function attribute flags.
 *
 * Every enumerator owns a distinct bit. Bit 1 is not assigned to any
 * enumerator in this list.
 */
enum ac_func_attr {
   AC_FUNC_ATTR_ALWAYSINLINE          = 0x001, /* bit 0 */
   AC_FUNC_ATTR_INREG                 = 0x004, /* bit 2 */
   AC_FUNC_ATTR_NOALIAS               = 0x008, /* bit 3 */
   AC_FUNC_ATTR_NOUNWIND              = 0x010, /* bit 4 */
   AC_FUNC_ATTR_READNONE              = 0x020, /* bit 5 */
   AC_FUNC_ATTR_READONLY              = 0x040, /* bit 6 */
   AC_FUNC_ATTR_WRITEONLY             = 0x080, /* bit 7 */
   AC_FUNC_ATTR_INACCESSIBLE_MEM_ONLY = 0x100, /* bit 8 */
   AC_FUNC_ATTR_CONVERGENT            = 0x200, /* bit 9 */

   /* Marks a legacy intrinsic: its attributes have to be placed on the
    * function declaration and must match LLVM's internal definition
    * exactly, otherwise intrinsic selection fails.
    */
   AC_FUNC_ATTR_LEGACY                = 0x80000000u, /* bit 31 */
};
58
/* Target machine option flags; every enumerator owns a distinct bit. */
enum ac_target_machine_options {
   AC_TM_SUPPORTS_SPILL            = 0x001, /* bit 0 */
   AC_TM_SISCHED                   = 0x002, /* bit 1 */
   AC_TM_FORCE_ENABLE_XNACK        = 0x004, /* bit 2 */
   AC_TM_FORCE_DISABLE_XNACK       = 0x008, /* bit 3 */
   AC_TM_PROMOTE_ALLOCA_TO_SCRATCH = 0x010, /* bit 4 */
   AC_TM_CHECK_IR                  = 0x020, /* bit 5 */
   AC_TM_ENABLE_GLOBAL_ISEL        = 0x040, /* bit 6 */
   AC_TM_CREATE_LOW_OPT            = 0x080, /* bit 7 */
   AC_TM_NO_LOAD_STORE_OPT         = 0x100, /* bit 8 */
   AC_TM_WAVE32                    = 0x200, /* bit 9 */
};
71
/* Floating-point mode selector (passed to ac_create_builder). The values
 * are consecutive, starting at zero.
 */
enum ac_float_mode {
   AC_FLOAT_MODE_DEFAULT                 = 0,
   AC_FLOAT_MODE_NO_SIGNED_ZEROS_FP_MATH = 1,
   AC_FLOAT_MODE_UNSAFE_FP_MATH          = 2,
};
77
78 /* Per-thread persistent LLVM objects. */
79 struct ac_llvm_compiler {
80 LLVMTargetLibraryInfoRef target_library_info;
81 LLVMPassManagerRef passmgr;
82
83 /* Default compiler. */
84 LLVMTargetMachineRef tm;
85 struct ac_compiler_passes *passes;
86
87 /* Wave32 compiler for GFX10. */
88 LLVMTargetMachineRef tm_wave32;
89 struct ac_compiler_passes *passes_wave32;
90
91 /* Optional compiler for faster compilation with fewer optimizations.
92 * LLVM modules can be created with "tm" too. There is no difference.
93 */
94 LLVMTargetMachineRef low_opt_tm; /* uses -O1 instead of -O2 */
95 struct ac_compiler_passes *low_opt_passes;
96 };
97
98 const char *ac_get_llvm_processor_name(enum radeon_family family);
99 void ac_add_attr_dereferenceable(LLVMValueRef val, uint64_t bytes);
100 bool ac_is_sgpr_param(LLVMValueRef param);
101 void ac_add_function_attr(LLVMContextRef ctx, LLVMValueRef function,
102 int attr_idx, enum ac_func_attr attr);
103 void ac_add_func_attributes(LLVMContextRef ctx, LLVMValueRef function,
104 unsigned attrib_mask);
105 void ac_dump_module(LLVMModuleRef module);
106
107 LLVMValueRef ac_llvm_get_called_value(LLVMValueRef call);
108 bool ac_llvm_is_function(LLVMValueRef v);
109 LLVMModuleRef ac_create_module(LLVMTargetMachineRef tm, LLVMContextRef ctx);
110
111 LLVMBuilderRef ac_create_builder(LLVMContextRef ctx,
112 enum ac_float_mode float_mode);
113
114 void
115 ac_llvm_add_target_dep_function_attr(LLVMValueRef F,
116 const char *name, unsigned value);
117 void ac_llvm_set_workgroup_size(LLVMValueRef F, unsigned size);
118
119 static inline unsigned
120 ac_get_load_intr_attribs(bool can_speculate)
121 {
122 /* READNONE means writes can't affect it, while READONLY means that
123 * writes can affect it. */
124 return can_speculate ? AC_FUNC_ATTR_READNONE :
125 AC_FUNC_ATTR_READONLY;
126 }
127
128 unsigned
129 ac_count_scratch_private_memory(LLVMValueRef function);
130
131 LLVMTargetLibraryInfoRef ac_create_target_library_info(const char *triple);
132 void ac_dispose_target_library_info(LLVMTargetLibraryInfoRef library_info);
133 void ac_init_llvm_once(void);
134
135
136 bool ac_init_llvm_compiler(struct ac_llvm_compiler *compiler,
137 enum radeon_family family,
138 enum ac_target_machine_options tm_options);
139 void ac_destroy_llvm_compiler(struct ac_llvm_compiler *compiler);
140
141 struct ac_compiler_passes *ac_create_llvm_passes(LLVMTargetMachineRef tm);
142 void ac_destroy_llvm_passes(struct ac_compiler_passes *p);
143 bool ac_compile_module_to_elf(struct ac_compiler_passes *p, LLVMModuleRef module,
144 char **pelf_buffer, size_t *pelf_size);
145 void ac_llvm_add_barrier_noop_pass(LLVMPassManagerRef passmgr);
146 void ac_enable_global_isel(LLVMTargetMachineRef tm);
147
148 static inline bool
149 ac_has_vec3_support(enum chip_class chip, bool use_format)
150 {
151 if (chip == GFX6 && !use_format) {
152 /* GFX6 only supports vec3 with load/store format. */
153 return false;
154 }
155
156 return LLVM_VERSION_MAJOR >= 9;
157 }
158
159 #ifdef __cplusplus
160 }
161 #endif
162
163 #endif /* AC_LLVM_UTIL_H */