2 * Copyright 2014 Advanced Micro Devices, Inc.
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the
6 * "Software"), to deal in the Software without restriction, including
7 * without limitation the rights to use, copy, modify, merge, publish,
8 * distribute, sub license, and/or sell copies of the Software, and to
9 * permit persons to whom the Software is furnished to do so, subject to
10 * the following conditions:
12 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
13 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
14 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
15 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
16 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
17 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
18 * USE OR OTHER DEALINGS IN THE SOFTWARE.
20 * The above copyright notice and this permission notice (including the
21 * next paragraph) shall be included in all copies or substantial portions
26 /* based on Marek's patch to lp_bld_misc.cpp */
28 // Workaround http://llvm.org/PR23628
29 #pragma push_macro("DEBUG")
32 #include "ac_binary.h"
33 #include "ac_llvm_util.h"
34 #include "ac_llvm_build.h"
36 #include <llvm-c/Core.h>
37 #include <llvm/Target/TargetMachine.h>
38 #include <llvm/IR/IRBuilder.h>
39 #include <llvm/Analysis/TargetLibraryInfo.h>
40 #include <llvm/Transforms/IPO.h>
42 #include <llvm/IR/LegacyPassManager.h>
44 void ac_add_attr_dereferenceable(LLVMValueRef val
, uint64_t bytes
)
46 llvm::Argument
*A
= llvm::unwrap
<llvm::Argument
>(val
);
47 A
->addAttr(llvm::Attribute::getWithDereferenceableBytes(A
->getContext(), bytes
));
50 bool ac_is_sgpr_param(LLVMValueRef arg
)
52 llvm::Argument
*A
= llvm::unwrap
<llvm::Argument
>(arg
);
53 llvm::AttributeList AS
= A
->getParent()->getAttributes();
54 unsigned ArgNo
= A
->getArgNo();
55 return AS
.hasAttribute(ArgNo
+ 1, llvm::Attribute::InReg
);
58 LLVMValueRef
ac_llvm_get_called_value(LLVMValueRef call
)
60 return LLVMGetCalledValue(call
);
63 bool ac_llvm_is_function(LLVMValueRef v
)
65 return LLVMGetValueKind(v
) == LLVMFunctionValueKind
;
68 LLVMModuleRef
ac_create_module(LLVMTargetMachineRef tm
, LLVMContextRef ctx
)
70 llvm::TargetMachine
*TM
= reinterpret_cast<llvm::TargetMachine
*>(tm
);
71 LLVMModuleRef module
= LLVMModuleCreateWithNameInContext("mesa-shader", ctx
);
73 llvm::unwrap(module
)->setTargetTriple(TM
->getTargetTriple().getTriple());
74 llvm::unwrap(module
)->setDataLayout(TM
->createDataLayout());
/* Create an LLVM IR builder in ctx and, for some float modes, install
 * fast-math flags on it.
 *
 * ctx:        context passed to LLVMCreateBuilderInContext.
 * float_mode: selects one of the AC_FLOAT_MODE_* cases below.
 *
 * NOTE(review): the embedded line numbers in this listing skip 84-85, 87,
 * 91, 93 and everything from 95 to 100. The switch header, the statements
 * that end each case, one statement in the UNSAFE_FP_MATH case and the
 * function's return are therefore not visible here - confirm against the
 * complete file before changing this function.
 */
78 LLVMBuilderRef
ac_create_builder(LLVMContextRef ctx
,
79 enum ac_float_mode float_mode
)
81 LLVMBuilderRef builder
= LLVMCreateBuilderInContext(ctx
);
83 llvm::FastMathFlags flags
;
/* No visible statement touches the builder's flags for the default mode. */
86 case AC_FLOAT_MODE_DEFAULT
:
/* Only the no-signed-zeros flag is set before the flags are installed. */
88 case AC_FLOAT_MODE_NO_SIGNED_ZEROS_FP_MATH
:
89 flags
.setNoSignedZeros();
90 llvm::unwrap(builder
)->setFastMathFlags(flags
);
/* NOTE(review): the statement that configures 'flags' for this mode
 * (original line 93) is missing from this listing.
 */
92 case AC_FLOAT_MODE_UNSAFE_FP_MATH
:
94 llvm::unwrap(builder
)->setFastMathFlags(flags
);
101 LLVMTargetLibraryInfoRef
102 ac_create_target_library_info(const char *triple
)
104 return reinterpret_cast<LLVMTargetLibraryInfoRef
>(new llvm::TargetLibraryInfoImpl(llvm::Triple(triple
)));
/* Free a library-info object: the handle is cast to
 * llvm::TargetLibraryInfoImpl* and deleted.
 *
 * library_info: handle to destroy; the cast assumes it points to an
 *               llvm::TargetLibraryInfoImpl allocated with new.
 *
 * NOTE(review): the line carrying the return type (original line 107) and
 * the braces are not part of this listing - confirm against the full file.
 */
108 ac_dispose_target_library_info(LLVMTargetLibraryInfoRef library_info
)
110 delete reinterpret_cast<llvm::TargetLibraryInfoImpl
*>(library_info
);
/* The LLVM compiler is represented as a pass manager containing passes for
 * optimizations, instruction selection, and code generation.
 */
116 struct ac_compiler_passes
{
117 ac_compiler_passes(): ostream(code_string
) {}
119 llvm::SmallString
<0> code_string
; /* ELF shader binary */
120 llvm::raw_svector_ostream ostream
; /* stream for appending data to the binary */
121 llvm::legacy::PassManager passmgr
; /* list of passes */
/* Allocate an ac_compiler_passes object and ask the target machine to add
 * the passes that emit an object file into p->ostream.
 *
 * tm: target machine handle; reinterpreted as an llvm::TargetMachine.
 *
 * NOTE(review): the embedded line numbers skip 127-129, 131, 133 and
 * 136-141, so any check on the allocation, one argument of
 * addPassesToEmitFile, the rest of the error path and the return
 * statements are not visible here - confirm against the full file.
 */
124 struct ac_compiler_passes
*ac_create_llvm_passes(LLVMTargetMachineRef tm
)
126 struct ac_compiler_passes
*p
= new ac_compiler_passes();
130 llvm::TargetMachine
*TM
= reinterpret_cast<llvm::TargetMachine
*>(tm
);
/* The error message is printed when addPassesToEmitFile returns true. */
132 if (TM
->addPassesToEmitFile(p
->passmgr
, p
->ostream
,
134 llvm::TargetMachine::CGFT_ObjectFile
)) {
135 fprintf(stderr
, "amd: TargetMachine can't emit a file of this type!\n");
/* Destroy a compiler-passes object.
 *
 * p: object to destroy; ac_create_llvm_passes in this file allocates such
 *    objects with new.
 *
 * NOTE(review): the body (original lines 143-146) is not part of this
 * listing; presumably it releases p - verify against the full file.
 */
142 void ac_destroy_llvm_passes(struct ac_compiler_passes
*p
)
147 /* This returns false on failure. */
/* Run the pass manager in p over module, then parse the bytes collected in
 * p->ostream with ac_elf_read into binary.
 *
 * p:      compiler state holding the pass manager and the output stream.
 * module: LLVM module handed to the pass manager.
 * binary: destination passed to ac_elf_read.
 *
 * NOTE(review): the embedded line numbers skip 150, 152, 156-157 and
 * everything after 158, so the condition guarding the error message and
 * the return statement are not visible here. Presumably the message is
 * printed only when 'success' is false and 'success' is returned - verify.
 */
148 bool ac_compile_module_to_binary(struct ac_compiler_passes
*p
, LLVMModuleRef module
,
149 struct ac_shader_binary
*binary
)
151 p
->passmgr
.run(*llvm::unwrap(module
));
/* 'data' refers to the stream's buffer; it is consumed by ac_elf_read before
 * code_string is reset below.
 */
153 llvm::StringRef data
= p
->ostream
.str();
154 bool success
= ac_elf_read(data
.data(), data
.size(), binary
);
155 p
->code_string
= ""; /* release the ELF shader binary */
158 fprintf(stderr
, "amd: cannot read an ELF shader binary\n");
162 void ac_llvm_add_barrier_noop_pass(LLVMPassManagerRef passmgr
)
164 llvm::unwrap(passmgr
)->add(llvm::createBarrierNoopPass());
167 void ac_enable_global_isel(LLVMTargetMachineRef tm
)
169 reinterpret_cast<llvm::TargetMachine
*>(tm
)->setGlobalISel(true);
/* Build an atomicrmw instruction with sequentially consistent ordering in
 * the named synchronization scope.
 *
 * ctx:        supplies the LLVM context (for the sync-scope ID) and the
 *             builder that creates the instruction.
 * op:         C-API operation; each case below assigns the matching
 *             llvm::AtomicRMWInst::BinOp value to 'binop'.
 * ptr, val:   operands, unwrapped and passed to CreateAtomicRMW.
 * sync_scope: scope name passed to getOrInsertSyncScopeID.
 *
 * Returns the created instruction wrapped as an LLVMValueRef.
 *
 * NOTE(review): the embedded line numbers skip 176, one line after every
 * case body (179, 182, ...), 209-210 and 212-213. The switch header, the
 * statements ending each case and the label in front of unreachable() are
 * therefore not visible here - confirm against the full file.
 */
172 LLVMValueRef
ac_build_atomic_rmw(struct ac_llvm_context
*ctx
, LLVMAtomicRMWBinOp op
,
173 LLVMValueRef ptr
, LLVMValueRef val
,
174 const char *sync_scope
) {
175 llvm::AtomicRMWInst::BinOp binop
;
/* One-to-one translation from the C enum to the C++ enum. */
177 case LLVMAtomicRMWBinOpXchg
:
178 binop
= llvm::AtomicRMWInst::Xchg
;
180 case LLVMAtomicRMWBinOpAdd
:
181 binop
= llvm::AtomicRMWInst::Add
;
183 case LLVMAtomicRMWBinOpSub
:
184 binop
= llvm::AtomicRMWInst::Sub
;
186 case LLVMAtomicRMWBinOpAnd
:
187 binop
= llvm::AtomicRMWInst::And
;
189 case LLVMAtomicRMWBinOpNand
:
190 binop
= llvm::AtomicRMWInst::Nand
;
192 case LLVMAtomicRMWBinOpOr
:
193 binop
= llvm::AtomicRMWInst::Or
;
195 case LLVMAtomicRMWBinOpXor
:
196 binop
= llvm::AtomicRMWInst::Xor
;
198 case LLVMAtomicRMWBinOpMax
:
199 binop
= llvm::AtomicRMWInst::Max
;
201 case LLVMAtomicRMWBinOpMin
:
202 binop
= llvm::AtomicRMWInst::Min
;
204 case LLVMAtomicRMWBinOpUMax
:
205 binop
= llvm::AtomicRMWInst::UMax
;
207 case LLVMAtomicRMWBinOpUMin
:
208 binop
= llvm::AtomicRMWInst::UMin
;
/* Presumably reached only for values not handled above - verify. */
211 unreachable(!"invalid LLVMAtomicRMWBinOp");
/* Look up (or register) the ID of the named sync scope in the context. */
214 unsigned SSID
= llvm::unwrap(ctx
->context
)->getOrInsertSyncScopeID(sync_scope
);
215 return llvm::wrap(llvm::unwrap(ctx
->builder
)->CreateAtomicRMW(
216 binop
, llvm::unwrap(ptr
), llvm::unwrap(val
),
217 llvm::AtomicOrdering::SequentiallyConsistent
, SSID
));
220 LLVMValueRef
ac_build_atomic_cmp_xchg(struct ac_llvm_context
*ctx
, LLVMValueRef ptr
,
221 LLVMValueRef cmp
, LLVMValueRef val
,
222 const char *sync_scope
) {
223 unsigned SSID
= llvm::unwrap(ctx
->context
)->getOrInsertSyncScopeID(sync_scope
);
224 return llvm::wrap(llvm::unwrap(ctx
->builder
)->CreateAtomicCmpXchg(
225 llvm::unwrap(ptr
), llvm::unwrap(cmp
), llvm::unwrap(val
),
226 llvm::AtomicOrdering::SequentiallyConsistent
,
227 llvm::AtomicOrdering::SequentiallyConsistent
, SSID
));