1 //===-- AMDGPUTargetMachine.cpp - TargetMachine for hw codegen targets-----===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // The AMDGPU target machine contains all of the hardware specific information
11 // needed to emit code for R600 and SI GPUs.
13 //===----------------------------------------------------------------------===//
15 #include "AMDGPUTargetMachine.h"
17 #include "R600ISelLowering.h"
18 #include "R600InstrInfo.h"
19 #include "SIISelLowering.h"
20 #include "SIInstrInfo.h"
21 #include "llvm/Analysis/Passes.h"
22 #include "llvm/Analysis/Verifier.h"
23 #include "llvm/CodeGen/MachineFunctionAnalysis.h"
24 #include "llvm/CodeGen/MachineModuleInfo.h"
25 #include "llvm/CodeGen/Passes.h"
26 #include "llvm/MC/MCAsmInfo.h"
27 #include "llvm/PassManager.h"
28 #include "llvm/Support/TargetRegistry.h"
29 #include "llvm/Support/raw_os_ostream.h"
30 #include "llvm/Transforms/IPO.h"
31 #include "llvm/Transforms/Scalar.h"
35 extern "C" void LLVMInitializeAMDGPUTarget() {
36 // Register the target
37 RegisterTargetMachine
<AMDGPUTargetMachine
> X(TheAMDGPUTarget
);
40 AMDGPUTargetMachine::AMDGPUTargetMachine(const Target
&T
, StringRef TT
,
41 StringRef CPU
, StringRef FS
,
42 TargetOptions Options
,
43 Reloc::Model RM
, CodeModel::Model CM
,
44 CodeGenOpt::Level OptLevel
47 LLVMTargetMachine(T
, TT
, CPU
, FS
, Options
, RM
, CM
, OptLevel
),
48 Subtarget(TT
, CPU
, FS
),
49 DataLayout(Subtarget
.getDataLayout()),
50 FrameLowering(TargetFrameLowering::StackGrowsUp
,
51 Subtarget
.device()->getStackAlignment(), 0),
53 InstrItins(&Subtarget
.getInstrItineraryData()),
57 // TLInfo uses InstrInfo so it must be initialized after.
58 if (Subtarget
.device()->getGeneration() <= AMDILDeviceInfo::HD6XXX
) {
59 InstrInfo
= new R600InstrInfo(*this);
60 TLInfo
= new R600TargetLowering(*this);
62 InstrInfo
= new SIInstrInfo(*this);
63 TLInfo
= new SITargetLowering(*this);
67 AMDGPUTargetMachine::~AMDGPUTargetMachine()
71 bool AMDGPUTargetMachine::addPassesToEmitFile(PassManagerBase
&PM
,
72 formatted_raw_ostream
&Out
,
73 CodeGenFileType FileType
,
75 // XXX: Hack here addPassesToEmitFile will fail, but this is Ok since we are
76 // only using it to access addPassesToGenerateCode()
77 bool fail
= LLVMTargetMachine::addPassesToEmitFile(PM
, Out
, FileType
,
81 const AMDILSubtarget
&STM
= getSubtarget
<AMDILSubtarget
>();
82 std::string gpu
= STM
.getDeviceName();
84 PM
.add(createSICodeEmitterPass(Out
));
85 } else if (Subtarget
.device()->getGeneration() <= AMDILDeviceInfo::HD6XXX
) {
86 PM
.add(createR600CodeEmitterPass(Out
));
91 PM
.add(createGCInfoDeleter());
97 class AMDGPUPassConfig
: public TargetPassConfig
{
99 AMDGPUPassConfig(AMDGPUTargetMachine
*TM
, PassManagerBase
&PM
)
100 : TargetPassConfig(TM
, PM
) {}
102 AMDGPUTargetMachine
&getAMDGPUTargetMachine() const {
103 return getTM
<AMDGPUTargetMachine
>();
106 virtual bool addPreISel();
107 virtual bool addInstSelector();
108 virtual bool addPreRegAlloc();
109 virtual bool addPostRegAlloc();
110 virtual bool addPreSched2();
111 virtual bool addPreEmitPass();
113 } // End of anonymous namespace
115 TargetPassConfig
*AMDGPUTargetMachine::createPassConfig(PassManagerBase
&PM
) {
116 return new AMDGPUPassConfig(this, PM
);
120 AMDGPUPassConfig::addPreISel()
122 const AMDILSubtarget
&ST
= TM
->getSubtarget
<AMDILSubtarget
>();
123 if (ST
.device()->getGeneration() <= AMDILDeviceInfo::HD6XXX
) {
124 PM
->add(createR600KernelParametersPass(
125 getAMDGPUTargetMachine().getTargetData()));
130 bool AMDGPUPassConfig::addInstSelector() {
131 PM
->add(createAMDILPeepholeOpt(*TM
));
132 PM
->add(createAMDILISelDag(getAMDGPUTargetMachine()));
136 bool AMDGPUPassConfig::addPreRegAlloc() {
137 const AMDILSubtarget
&ST
= TM
->getSubtarget
<AMDILSubtarget
>();
139 if (ST
.device()->getGeneration() > AMDILDeviceInfo::HD6XXX
) {
140 PM
->add(createSIAssignInterpRegsPass(*TM
));
142 PM
->add(createAMDGPUConvertToISAPass(*TM
));
146 bool AMDGPUPassConfig::addPostRegAlloc() {
150 bool AMDGPUPassConfig::addPreSched2() {
154 bool AMDGPUPassConfig::addPreEmitPass() {
155 PM
->add(createAMDILCFGPreparationPass(*TM
));
156 PM
->add(createAMDILCFGStructurizerPass(*TM
));