9fc4aab136e0fb813b4bb51997f532321d6ee5dd
1 //===-- SICodeEmitter.cpp - SI Code Emitter -------------------------------===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // The SI code emitter produces machine code that can be executed directly on
13 //===----------------------------------------------------------------------===//
17 #include "AMDGPUCodeEmitter.h"
18 #include "AMDGPUUtil.h"
19 #include "SIInstrInfo.h"
20 #include "SIMachineFunctionInfo.h"
21 #include "llvm/CodeGen/MachineFunctionPass.h"
22 #include "llvm/CodeGen/MachineInstr.h"
23 #include "llvm/CodeGen/MachineInstrBuilder.h"
24 #include "llvm/Support/FormattedStream.h"
25 #include "llvm/Target/TargetMachine.h"
30 #define LITERAL_REG 255
31 #define VGPR_BIT(src_idx) (1ULL << (9 * src_idx - 1))
36 class SICodeEmitter
: public MachineFunctionPass
, public AMDGPUCodeEmitter
{
40 formatted_raw_ostream
&_OS
;
41 const TargetMachine
*TM
;
46 unsigned CurrentInstrIndex
;
47 std::map
<int, unsigned> BBIndexes
;
49 void InitProgramInfo(MachineFunction
&MF
);
50 void EmitState(MachineFunction
& MF
);
51 void emitInstr(MachineInstr
&MI
);
53 void outputBytes(uint64_t value
, unsigned bytes
);
54 unsigned GPRAlign(const MachineInstr
&MI
, unsigned OpNo
, unsigned shift
)
58 SICodeEmitter(formatted_raw_ostream
&OS
) : MachineFunctionPass(ID
),
59 _OS(OS
), TM(NULL
), MaxSGPR(0), MaxVGPR(0), CurrentInstrIndex(0) { }
60 const char *getPassName() const { return "SI Code Emitter"; }
61 bool runOnMachineFunction(MachineFunction
&MF
);
63 /// getMachineOpValue - Return the encoding for MO
64 virtual uint64_t getMachineOpValue(const MachineInstr
&MI
,
65 const MachineOperand
&MO
) const;
67 /// GPR4AlignEncode - Encoding for when 4 consectuive registers are used
68 virtual unsigned GPR4AlignEncode(const MachineInstr
&MI
, unsigned OpNo
)
71 /// GPR2AlignEncode - Encoding for when 2 consecutive registers are used
72 virtual unsigned GPR2AlignEncode(const MachineInstr
&MI
, unsigned OpNo
)
74 /// i32LiteralEncode - Encode an i32 literal this is used as an operand
75 /// for an instruction in place of a register.
76 virtual uint64_t i32LiteralEncode(const MachineInstr
&MI
, unsigned OpNo
)
78 /// SMRDmemriEncode - Encoding for SMRD indexed loads
79 virtual uint32_t SMRDmemriEncode(const MachineInstr
&MI
, unsigned OpNo
)
82 /// VOPPostEncode - Post-Encoder method for VOP instructions
83 virtual uint64_t VOPPostEncode(const MachineInstr
&MI
,
84 uint64_t Value
) const;
88 char SICodeEmitter::ID
= 0;
90 FunctionPass
*llvm::createSICodeEmitterPass(formatted_raw_ostream
&OS
) {
91 return new SICodeEmitter(OS
);
94 void SICodeEmitter::EmitState(MachineFunction
& MF
) {
95 SIMachineFunctionInfo
* MFI
= MF
.getInfo
<SIMachineFunctionInfo
>();
96 outputBytes(MaxSGPR
+ 1, 4);
97 outputBytes(MaxVGPR
+ 1, 4);
98 outputBytes(MFI
->spi_ps_input_addr
, 4);
101 void SICodeEmitter::InitProgramInfo(MachineFunction
&MF
) {
102 unsigned InstrIndex
= 0;
103 bool VCCUsed
= false;
104 const SIRegisterInfo
* RI
=
105 static_cast<const SIRegisterInfo
*>(TM
->getRegisterInfo());
107 for (MachineFunction::iterator BB
= MF
.begin(), BB_E
= MF
.end();
109 MachineBasicBlock
&MBB
= *BB
;
110 BBIndexes
[MBB
.getNumber()] = InstrIndex
;
111 InstrIndex
+= MBB
.size();
112 for (MachineBasicBlock::iterator I
= MBB
.begin(), E
= MBB
.end();
114 MachineInstr
&MI
= *I
;
116 unsigned numOperands
= MI
.getNumOperands();
117 for (unsigned op_idx
= 0; op_idx
< numOperands
; op_idx
++) {
118 MachineOperand
& MO
= MI
.getOperand(op_idx
);
128 if (reg
== AMDGPU::VCC
) {
132 if (AMDGPU::SReg_32RegClass
.contains(reg
)) {
135 } else if (AMDGPU::VReg_32RegClass
.contains(reg
)) {
138 } else if (AMDGPU::SReg_64RegClass
.contains(reg
)) {
141 } else if (AMDGPU::VReg_64RegClass
.contains(reg
)) {
144 } else if (AMDGPU::SReg_128RegClass
.contains(reg
)) {
147 } else if (AMDGPU::VReg_128RegClass
.contains(reg
)) {
150 } else if (AMDGPU::SReg_256RegClass
.contains(reg
)) {
154 assert("!Unknown register class");
156 hwReg
= RI
->getHWRegNum(reg
);
157 maxUsed
= hwReg
+ width
- 1;
159 MaxSGPR
= maxUsed
> MaxSGPR
? maxUsed
: MaxSGPR
;
161 MaxVGPR
= maxUsed
> MaxVGPR
? maxUsed
: MaxVGPR
;
171 bool SICodeEmitter::runOnMachineFunction(MachineFunction
&MF
)
173 TM
= &MF
.getTarget();
174 const AMDGPUSubtarget
&STM
= TM
->getSubtarget
<AMDGPUSubtarget
>();
176 if (STM
.dumpCode()) {
184 for (MachineFunction::iterator BB
= MF
.begin(), BB_E
= MF
.end();
186 MachineBasicBlock
&MBB
= *BB
;
187 for (MachineBasicBlock::iterator I
= MBB
.begin(), E
= MBB
.end();
189 MachineInstr
&MI
= *I
;
190 if (MI
.getOpcode() != AMDGPU::KILL
&& MI
.getOpcode() != AMDGPU::RETURN
) {
197 MachineInstr
* End
= BuildMI(MF
, DebugLoc(),
198 TM
->getInstrInfo()->get(AMDGPU::S_ENDPGM
));
203 void SICodeEmitter::emitInstr(MachineInstr
&MI
)
205 const SIInstrInfo
* SII
= static_cast<const SIInstrInfo
*>(TM
->getInstrInfo());
207 uint64_t hwInst
= getBinaryCodeForInstr(MI
);
209 if ((hwInst
& 0xffffffff) == 0xffffffff) {
210 fprintf(stderr
, "Unsupported Instruction: \n");
215 unsigned bytes
= SII
->getEncodingBytes(MI
);
216 outputBytes(hwInst
, bytes
);
219 uint64_t SICodeEmitter::getMachineOpValue(const MachineInstr
&MI
,
220 const MachineOperand
&MO
) const
222 const SIRegisterInfo
* RI
=
223 static_cast<const SIRegisterInfo
*>(TM
->getRegisterInfo());
225 switch(MO
.getType()) {
226 case MachineOperand::MO_Register
:
227 return RI
->getBinaryCode(MO
.getReg());
229 case MachineOperand::MO_Immediate
:
232 case MachineOperand::MO_FPImmediate
:
233 // XXX: Not all instructions can use inline literals
234 // XXX: We should make sure this is a 32-bit constant
235 return LITERAL_REG
| (MO
.getFPImm()->getValueAPF().bitcastToAPInt().getZExtValue() << 32);
237 case MachineOperand::MO_MachineBasicBlock
:
238 return (*BBIndexes
.find(MI
.getParent()->getNumber())).second
-
239 CurrentInstrIndex
- 1;
241 llvm_unreachable("Encoding of this operand type is not supported yet.");
246 unsigned SICodeEmitter::GPRAlign(const MachineInstr
&MI
, unsigned OpNo
,
247 unsigned shift
) const
249 const SIRegisterInfo
* RI
=
250 static_cast<const SIRegisterInfo
*>(TM
->getRegisterInfo());
251 unsigned regCode
= RI
->getHWRegNum(MI
.getOperand(OpNo
).getReg());
252 return regCode
>> shift
;
255 unsigned SICodeEmitter::GPR4AlignEncode(const MachineInstr
&MI
,
258 return GPRAlign(MI
, OpNo
, 2);
261 unsigned SICodeEmitter::GPR2AlignEncode(const MachineInstr
&MI
,
264 return GPRAlign(MI
, OpNo
, 1);
267 uint64_t SICodeEmitter::i32LiteralEncode(const MachineInstr
&MI
,
270 return LITERAL_REG
| (MI
.getOperand(OpNo
).getImm() << 32);
273 #define SMRD_OFFSET_MASK 0xff
274 #define SMRD_IMM_SHIFT 8
275 #define SMRD_SBASE_MASK 0x3f
276 #define SMRD_SBASE_SHIFT 9
277 /// SMRDmemriEncode - This function is responsibe for encoding the offset
278 /// and the base ptr for SMRD instructions it should return a bit string in
281 /// OFFSET = bits{7-0}
283 /// SBASE = bits{14-9}
285 uint32_t SICodeEmitter::SMRDmemriEncode(const MachineInstr
&MI
,
290 const MachineOperand
&OffsetOp
= MI
.getOperand(OpNo
+ 1);
292 //XXX: Use this function for SMRD loads with register offsets
293 assert(OffsetOp
.isImm());
296 (getMachineOpValue(MI
, OffsetOp
) & SMRD_OFFSET_MASK
)
297 | (1 << SMRD_IMM_SHIFT
) //XXX If the Offset is a register we shouldn't set this bit
298 | ((GPR2AlignEncode(MI
, OpNo
) & SMRD_SBASE_MASK
) << SMRD_SBASE_SHIFT
)
304 /// Set the "VGPR" bit for VOP args that can take either a VGPR or a SGPR.
305 /// XXX: It would be nice if we could handle this without a PostEncode function.
306 uint64_t SICodeEmitter::VOPPostEncode(const MachineInstr
&MI
,
307 uint64_t Value
) const
309 const SIInstrInfo
* SII
= static_cast<const SIInstrInfo
*>(TM
->getInstrInfo());
310 unsigned encodingType
= SII
->getEncodingType(MI
);
312 unsigned vgprBitOffset
;
314 if (encodingType
== SIInstrEncodingType::VOP3
) {
322 // Add one to skip over the destination reg operand.
323 for (unsigned opIdx
= 1; opIdx
< numSrcOps
+ 1; opIdx
++) {
324 if (!MI
.getOperand(opIdx
).isReg()) {
327 unsigned reg
= MI
.getOperand(opIdx
).getReg();
328 if (AMDGPU::VReg_32RegClass
.contains(reg
)
329 || AMDGPU::VReg_64RegClass
.contains(reg
)) {
330 Value
|= (VGPR_BIT(opIdx
)) << vgprBitOffset
;
337 void SICodeEmitter::outputBytes(uint64_t value
, unsigned bytes
)
339 for (unsigned i
= 0; i
< bytes
; i
++) {
340 _OS
.write((uint8_t) ((value
>> (8 * i
)) & 0xff));