R600MCCodeEmitter.cpp revision d6055262d23b1a8f2b5c74ab94fc6c143aca1c45
1f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//===- R600MCCodeEmitter.cpp - Code Emitter for R600->Cayman GPU families -===//
2f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//
3f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//                     The LLVM Compiler Infrastructure
4f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//
5f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard// This file is distributed under the University of Illinois Open Source
6f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard// License. See LICENSE.TXT for details.
7f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//
8f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//===----------------------------------------------------------------------===//
9f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//
10f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard/// \file
11f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard///
124f3d8a644043f85063ef7aac1ff87bfd4d83ca4cTom Stellard/// \brief The R600 code emitter produces machine code that can be executed
134f3d8a644043f85063ef7aac1ff87bfd4d83ca4cTom Stellard/// directly on the GPU device.
14f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//
15f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard//===----------------------------------------------------------------------===//
16f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
17f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "R600Defines.h"
18f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "MCTargetDesc/AMDGPUMCCodeEmitter.h"
1958a2cbef4aac9ee7d530dfb690c78d6fc11a2371Chandler Carruth#include "MCTargetDesc/AMDGPUMCTargetDesc.h"
20f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "llvm/MC/MCCodeEmitter.h"
21f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "llvm/MC/MCContext.h"
22f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "llvm/MC/MCInst.h"
23f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "llvm/MC/MCInstrInfo.h"
24f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "llvm/MC/MCRegisterInfo.h"
25f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "llvm/MC/MCSubtargetInfo.h"
26f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "llvm/Support/raw_ostream.h"
27f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include <stdio.h>
28f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
29f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardusing namespace llvm;
30f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
31f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardnamespace {
32f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
33f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardclass R600MCCodeEmitter : public AMDGPUMCCodeEmitter {
34a39058aaed4540fc37681cad728b99546595b2e8David Blaikie  R600MCCodeEmitter(const R600MCCodeEmitter &) LLVM_DELETED_FUNCTION;
35a39058aaed4540fc37681cad728b99546595b2e8David Blaikie  void operator=(const R600MCCodeEmitter &) LLVM_DELETED_FUNCTION;
36f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  const MCInstrInfo &MCII;
37f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  const MCRegisterInfo &MRI;
3834f533a6c351d8b255810c9b4b8713700e66ee88Tom Stellard  const MCSubtargetInfo &STI;
39f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
40f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardpublic:
41f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
4234f533a6c351d8b255810c9b4b8713700e66ee88Tom Stellard  R600MCCodeEmitter(const MCInstrInfo &mcii, const MCRegisterInfo &mri,
4334f533a6c351d8b255810c9b4b8713700e66ee88Tom Stellard                    const MCSubtargetInfo &sti)
4434f533a6c351d8b255810c9b4b8713700e66ee88Tom Stellard    : MCII(mcii), MRI(mri), STI(sti) { }
45f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
46f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  /// \brief Encode the instruction and write it to the OS.
47f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  virtual void EncodeInstruction(const MCInst &MI, raw_ostream &OS,
48f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                         SmallVectorImpl<MCFixup> &Fixups) const;
49f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
50f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  /// \returns the encoding for an MCOperand.
51f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  virtual uint64_t getMachineOpValue(const MCInst &MI, const MCOperand &MO,
52f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                     SmallVectorImpl<MCFixup> &Fixups) const;
53f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardprivate:
54f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
55f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  void EmitByte(unsigned int byte, raw_ostream &OS) const;
56f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
57f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  void Emit(uint32_t value, raw_ostream &OS) const;
58f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  void Emit(uint64_t value, raw_ostream &OS) const;
59f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
60f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  unsigned getHWRegChan(unsigned reg) const;
61f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  unsigned getHWReg(unsigned regNo) const;
62f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
63f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard};
64f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
65f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard} // End anonymous namespace
66f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
67f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardenum RegElement {
68f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  ELEMENT_X = 0,
69f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  ELEMENT_Y,
70f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  ELEMENT_Z,
71f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  ELEMENT_W
72f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard};
73f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
74f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardenum FCInstr {
75f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  FC_IF_PREDICATE = 0,
76f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  FC_ELSE,
77f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  FC_ENDIF,
78f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  FC_BGNLOOP,
79f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  FC_ENDLOOP,
80f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  FC_BREAK_PREDICATE,
81f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  FC_CONTINUE
82f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard};
83f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
84f98f2ce29e6e2996fa58f38979143eceaa818335Tom StellardMCCodeEmitter *llvm::createR600MCCodeEmitter(const MCInstrInfo &MCII,
8534f533a6c351d8b255810c9b4b8713700e66ee88Tom Stellard                                           const MCRegisterInfo &MRI,
8634f533a6c351d8b255810c9b4b8713700e66ee88Tom Stellard                                           const MCSubtargetInfo &STI) {
8734f533a6c351d8b255810c9b4b8713700e66ee88Tom Stellard  return new R600MCCodeEmitter(MCII, MRI, STI);
88f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
89f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
90f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardvoid R600MCCodeEmitter::EncodeInstruction(const MCInst &MI, raw_ostream &OS,
91f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                       SmallVectorImpl<MCFixup> &Fixups) const {
9232c76107d029c1cad5935d08cdcde6139cf874bbTom Stellard  const MCInstrDesc &Desc = MCII.get(MI.getOpcode());
9332c76107d029c1cad5935d08cdcde6139cf874bbTom Stellard  if (MI.getOpcode() == AMDGPU::RETURN ||
94b6379de427c009284d47c5fc764f11bbd2bf2484Vincent Lejeune    MI.getOpcode() == AMDGPU::FETCH_CLAUSE ||
952c836f84dba99e7b041909160c739db779760b79Vincent Lejeune    MI.getOpcode() == AMDGPU::ALU_CLAUSE ||
96f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    MI.getOpcode() == AMDGPU::BUNDLE ||
97f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    MI.getOpcode() == AMDGPU::KILL) {
98f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    return;
9932c76107d029c1cad5935d08cdcde6139cf874bbTom Stellard  } else if (IS_VTX(Desc)) {
10032c76107d029c1cad5935d08cdcde6139cf874bbTom Stellard    uint64_t InstWord01 = getBinaryCodeForInstr(MI, Fixups);
10132c76107d029c1cad5935d08cdcde6139cf874bbTom Stellard    uint32_t InstWord2 = MI.getOperand(2).getImm(); // Offset
102d6055262d23b1a8f2b5c74ab94fc6c143aca1c45Tom Stellard    if (!(STI.getFeatureBits() & AMDGPU::FeatureCaymanISA)) {
103d6055262d23b1a8f2b5c74ab94fc6c143aca1c45Tom Stellard      InstWord2 |= 1 << 19; // Mega-Fetch bit
104d6055262d23b1a8f2b5c74ab94fc6c143aca1c45Tom Stellard    }
10532c76107d029c1cad5935d08cdcde6139cf874bbTom Stellard
10632c76107d029c1cad5935d08cdcde6139cf874bbTom Stellard    Emit(InstWord01, OS);
10732c76107d029c1cad5935d08cdcde6139cf874bbTom Stellard    Emit(InstWord2, OS);
1082134219b654641a7e813d593f4491ad18133963cRafael Espindola    Emit((uint32_t) 0, OS);
10932c76107d029c1cad5935d08cdcde6139cf874bbTom Stellard  } else if (IS_TEX(Desc)) {
110d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune      int64_t Sampler = MI.getOperand(14).getImm();
111d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune
112eee6cdd7819b66e0d95a7a18337569b981374937Rafael Espindola      int64_t SrcSelect[4] = {
113d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune        MI.getOperand(2).getImm(),
114d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune        MI.getOperand(3).getImm(),
115d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune        MI.getOperand(4).getImm(),
116d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune        MI.getOperand(5).getImm()
117d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune      };
1187eac03220344d1b558ea6690cf73d2b76c7e551eRafael Espindola      int64_t Offsets[3] = {
119d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune        MI.getOperand(6).getImm() & 0x1F,
120d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune        MI.getOperand(7).getImm() & 0x1F,
121d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune        MI.getOperand(8).getImm() & 0x1F
122d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune      };
123d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune
124d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune      uint64_t Word01 = getBinaryCodeForInstr(MI, Fixups);
125d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune      uint32_t Word2 = Sampler << 15 | SrcSelect[ELEMENT_X] << 20 |
126d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune          SrcSelect[ELEMENT_Y] << 23 | SrcSelect[ELEMENT_Z] << 26 |
127d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune          SrcSelect[ELEMENT_W] << 29 | Offsets[0] << 0 | Offsets[1] << 5 |
128d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune          Offsets[2] << 10;
129d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune
130d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune      Emit(Word01, OS);
131d3293b49f9c7af741d2edd3062499fb50db0e89bVincent Lejeune      Emit(Word2, OS);
1322134219b654641a7e813d593f4491ad18133963cRafael Espindola      Emit((uint32_t) 0, OS);
133f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  } else {
13432c76107d029c1cad5935d08cdcde6139cf874bbTom Stellard    uint64_t Inst = getBinaryCodeForInstr(MI, Fixups);
1350976e3c6d9b1bfaea1267188e6a20dc41318832aTom Stellard    if ((STI.getFeatureBits() & AMDGPU::FeatureR600ALUInst) &&
1360976e3c6d9b1bfaea1267188e6a20dc41318832aTom Stellard       ((Desc.TSFlags & R600_InstFlag::OP1) ||
1370976e3c6d9b1bfaea1267188e6a20dc41318832aTom Stellard         Desc.TSFlags & R600_InstFlag::OP2)) {
1380976e3c6d9b1bfaea1267188e6a20dc41318832aTom Stellard      uint64_t ISAOpCode = Inst & (0x3FFULL << 39);
1390976e3c6d9b1bfaea1267188e6a20dc41318832aTom Stellard      Inst &= ~(0x3FFULL << 39);
1400976e3c6d9b1bfaea1267188e6a20dc41318832aTom Stellard      Inst |= ISAOpCode << 1;
1410976e3c6d9b1bfaea1267188e6a20dc41318832aTom Stellard    }
14232c76107d029c1cad5935d08cdcde6139cf874bbTom Stellard    Emit(Inst, OS);
143f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
144f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
145f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
146f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardvoid R600MCCodeEmitter::EmitByte(unsigned int Byte, raw_ostream &OS) const {
147f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  OS.write((uint8_t) Byte & 0xff);
148f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
149f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
150f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardvoid R600MCCodeEmitter::Emit(uint32_t Value, raw_ostream &OS) const {
151f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  for (unsigned i = 0; i < 4; i++) {
152f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    OS.write((uint8_t) ((Value >> (8 * i)) & 0xff));
153f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
154f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
155f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
156f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardvoid R600MCCodeEmitter::Emit(uint64_t Value, raw_ostream &OS) const {
157f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  for (unsigned i = 0; i < 8; i++) {
158f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    EmitByte((Value >> (8 * i)) & 0xff, OS);
159f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
160f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
161f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
162f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardunsigned R600MCCodeEmitter::getHWRegChan(unsigned reg) const {
163f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  return MRI.getEncodingValue(reg) >> HW_CHAN_SHIFT;
164f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
165f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
166f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellardunsigned R600MCCodeEmitter::getHWReg(unsigned RegNo) const {
167f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  return MRI.getEncodingValue(RegNo) & HW_REG_MASK;
168f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
169f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
170f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellarduint64_t R600MCCodeEmitter::getMachineOpValue(const MCInst &MI,
171f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                              const MCOperand &MO,
172f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard                                        SmallVectorImpl<MCFixup> &Fixup) const {
173f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  if (MO.isReg()) {
174f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    if (HAS_NATIVE_OPERANDS(MCII.get(MI.getOpcode()).TSFlags)) {
175f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return MRI.getEncodingValue(MO.getReg());
176f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    } else {
177f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard      return getHWReg(MO.getReg());
178f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    }
179f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  } else if (MO.isImm()) {
180f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    return MO.getImm();
181f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  } else {
182f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    assert(0);
183f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard    return 0;
184f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard  }
185f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard}
186f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard
187f98f2ce29e6e2996fa58f38979143eceaa818335Tom Stellard#include "AMDGPUGenMCCodeEmitter.inc"
188