182 lines
		
	
	
		
			5.8 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			182 lines
		
	
	
		
			5.8 KiB
		
	
	
	
		
			C++
		
	
	
	
//===- R600MCCodeEmitter.cpp - Code Emitter for R600->Cayman GPU families -===//
 | 
						|
//
 | 
						|
//                     The LLVM Compiler Infrastructure
 | 
						|
//
 | 
						|
// This file is distributed under the University of Illinois Open Source
 | 
						|
// License. See LICENSE.TXT for details.
 | 
						|
//
 | 
						|
//===----------------------------------------------------------------------===//
 | 
						|
//
 | 
						|
/// \file
 | 
						|
///
 | 
						|
/// \brief The R600 code emitter produces machine code that can be executed
 | 
						|
/// directly on the GPU device.
 | 
						|
//
 | 
						|
//===----------------------------------------------------------------------===//
 | 
						|
 | 
						|
#include "R600Defines.h"
 | 
						|
#include "MCTargetDesc/AMDGPUFixupKinds.h"
 | 
						|
#include "MCTargetDesc/AMDGPUMCCodeEmitter.h"
 | 
						|
#include "MCTargetDesc/AMDGPUMCTargetDesc.h"
 | 
						|
#include "llvm/MC/MCCodeEmitter.h"
 | 
						|
#include "llvm/MC/MCContext.h"
 | 
						|
#include "llvm/MC/MCInst.h"
 | 
						|
#include "llvm/MC/MCInstrInfo.h"
 | 
						|
#include "llvm/MC/MCRegisterInfo.h"
 | 
						|
#include "llvm/MC/MCSubtargetInfo.h"
 | 
						|
#include "llvm/Support/EndianStream.h"
 | 
						|
#include "llvm/Support/raw_ostream.h"
 | 
						|
 | 
						|
using namespace llvm;
 | 
						|
 | 
						|
namespace {
 | 
						|
 | 
						|
class R600MCCodeEmitter : public AMDGPUMCCodeEmitter {
 | 
						|
  R600MCCodeEmitter(const R600MCCodeEmitter &) = delete;
 | 
						|
  void operator=(const R600MCCodeEmitter &) = delete;
 | 
						|
  const MCInstrInfo &MCII;
 | 
						|
  const MCRegisterInfo &MRI;
 | 
						|
 | 
						|
public:
 | 
						|
  R600MCCodeEmitter(const MCInstrInfo &mcii, const MCRegisterInfo &mri)
 | 
						|
    : MCII(mcii), MRI(mri) { }
 | 
						|
 | 
						|
  /// \brief Encode the instruction and write it to the OS.
 | 
						|
  void encodeInstruction(const MCInst &MI, raw_ostream &OS,
 | 
						|
                         SmallVectorImpl<MCFixup> &Fixups,
 | 
						|
                         const MCSubtargetInfo &STI) const override;
 | 
						|
 | 
						|
  /// \returns the encoding for an MCOperand.
 | 
						|
  uint64_t getMachineOpValue(const MCInst &MI, const MCOperand &MO,
 | 
						|
                             SmallVectorImpl<MCFixup> &Fixups,
 | 
						|
                             const MCSubtargetInfo &STI) const override;
 | 
						|
 | 
						|
private:
 | 
						|
  void Emit(uint32_t value, raw_ostream &OS) const;
 | 
						|
  void Emit(uint64_t value, raw_ostream &OS) const;
 | 
						|
 | 
						|
  unsigned getHWReg(unsigned regNo) const;
 | 
						|
};
 | 
						|
 | 
						|
} // End anonymous namespace
 | 
						|
 | 
						|
enum RegElement {
 | 
						|
  ELEMENT_X = 0,
 | 
						|
  ELEMENT_Y,
 | 
						|
  ELEMENT_Z,
 | 
						|
  ELEMENT_W
 | 
						|
};
 | 
						|
 | 
						|
enum FCInstr {
 | 
						|
  FC_IF_PREDICATE = 0,
 | 
						|
  FC_ELSE,
 | 
						|
  FC_ENDIF,
 | 
						|
  FC_BGNLOOP,
 | 
						|
  FC_ENDLOOP,
 | 
						|
  FC_BREAK_PREDICATE,
 | 
						|
  FC_CONTINUE
 | 
						|
};
 | 
						|
 | 
						|
MCCodeEmitter *llvm::createR600MCCodeEmitter(const MCInstrInfo &MCII,
 | 
						|
                                             const MCRegisterInfo &MRI,
 | 
						|
                                             MCContext &Ctx) {
 | 
						|
  return new R600MCCodeEmitter(MCII, MRI);
 | 
						|
}
 | 
						|
 | 
						|
void R600MCCodeEmitter::encodeInstruction(const MCInst &MI, raw_ostream &OS,
 | 
						|
                                       SmallVectorImpl<MCFixup> &Fixups,
 | 
						|
                                       const MCSubtargetInfo &STI) const {
 | 
						|
  const MCInstrDesc &Desc = MCII.get(MI.getOpcode());
 | 
						|
  if (MI.getOpcode() == AMDGPU::RETURN ||
 | 
						|
    MI.getOpcode() == AMDGPU::FETCH_CLAUSE ||
 | 
						|
    MI.getOpcode() == AMDGPU::ALU_CLAUSE ||
 | 
						|
    MI.getOpcode() == AMDGPU::BUNDLE ||
 | 
						|
    MI.getOpcode() == AMDGPU::KILL) {
 | 
						|
    return;
 | 
						|
  } else if (IS_VTX(Desc)) {
 | 
						|
    uint64_t InstWord01 = getBinaryCodeForInstr(MI, Fixups, STI);
 | 
						|
    uint32_t InstWord2 = MI.getOperand(2).getImm(); // Offset
 | 
						|
    if (!(STI.getFeatureBits()[AMDGPU::FeatureCaymanISA])) {
 | 
						|
      InstWord2 |= 1 << 19; // Mega-Fetch bit
 | 
						|
    }
 | 
						|
 | 
						|
    Emit(InstWord01, OS);
 | 
						|
    Emit(InstWord2, OS);
 | 
						|
    Emit((uint32_t) 0, OS);
 | 
						|
  } else if (IS_TEX(Desc)) {
 | 
						|
      int64_t Sampler = MI.getOperand(14).getImm();
 | 
						|
 | 
						|
      int64_t SrcSelect[4] = {
 | 
						|
        MI.getOperand(2).getImm(),
 | 
						|
        MI.getOperand(3).getImm(),
 | 
						|
        MI.getOperand(4).getImm(),
 | 
						|
        MI.getOperand(5).getImm()
 | 
						|
      };
 | 
						|
      int64_t Offsets[3] = {
 | 
						|
        MI.getOperand(6).getImm() & 0x1F,
 | 
						|
        MI.getOperand(7).getImm() & 0x1F,
 | 
						|
        MI.getOperand(8).getImm() & 0x1F
 | 
						|
      };
 | 
						|
 | 
						|
      uint64_t Word01 = getBinaryCodeForInstr(MI, Fixups, STI);
 | 
						|
      uint32_t Word2 = Sampler << 15 | SrcSelect[ELEMENT_X] << 20 |
 | 
						|
          SrcSelect[ELEMENT_Y] << 23 | SrcSelect[ELEMENT_Z] << 26 |
 | 
						|
          SrcSelect[ELEMENT_W] << 29 | Offsets[0] << 0 | Offsets[1] << 5 |
 | 
						|
          Offsets[2] << 10;
 | 
						|
 | 
						|
      Emit(Word01, OS);
 | 
						|
      Emit(Word2, OS);
 | 
						|
      Emit((uint32_t) 0, OS);
 | 
						|
  } else {
 | 
						|
    uint64_t Inst = getBinaryCodeForInstr(MI, Fixups, STI);
 | 
						|
    if ((STI.getFeatureBits()[AMDGPU::FeatureR600ALUInst]) &&
 | 
						|
       ((Desc.TSFlags & R600_InstFlag::OP1) ||
 | 
						|
         Desc.TSFlags & R600_InstFlag::OP2)) {
 | 
						|
      uint64_t ISAOpCode = Inst & (0x3FFULL << 39);
 | 
						|
      Inst &= ~(0x3FFULL << 39);
 | 
						|
      Inst |= ISAOpCode << 1;
 | 
						|
    }
 | 
						|
    Emit(Inst, OS);
 | 
						|
  }
 | 
						|
}
 | 
						|
 | 
						|
void R600MCCodeEmitter::Emit(uint32_t Value, raw_ostream &OS) const {
 | 
						|
  support::endian::Writer<support::little>(OS).write(Value);
 | 
						|
}
 | 
						|
 | 
						|
void R600MCCodeEmitter::Emit(uint64_t Value, raw_ostream &OS) const {
 | 
						|
  support::endian::Writer<support::little>(OS).write(Value);
 | 
						|
}
 | 
						|
 | 
						|
unsigned R600MCCodeEmitter::getHWReg(unsigned RegNo) const {
 | 
						|
  return MRI.getEncodingValue(RegNo) & HW_REG_MASK;
 | 
						|
}
 | 
						|
 | 
						|
uint64_t R600MCCodeEmitter::getMachineOpValue(const MCInst &MI,
 | 
						|
                                              const MCOperand &MO,
 | 
						|
                                        SmallVectorImpl<MCFixup> &Fixups,
 | 
						|
                                        const MCSubtargetInfo &STI) const {
 | 
						|
  if (MO.isReg()) {
 | 
						|
    if (HAS_NATIVE_OPERANDS(MCII.get(MI.getOpcode()).TSFlags))
 | 
						|
      return MRI.getEncodingValue(MO.getReg());
 | 
						|
    return getHWReg(MO.getReg());
 | 
						|
  }
 | 
						|
 | 
						|
  if (MO.isExpr()) {
 | 
						|
    // We put rodata at the end of code section, then map the entire
 | 
						|
    // code secetion as vtx buf. Thus the section relative address is the
 | 
						|
    // correct one.
 | 
						|
    // Each R600 literal instruction has two operands
 | 
						|
    // We can't easily get the order of the current one, so compare against
 | 
						|
    // the first one and adjust offset.
 | 
						|
    const unsigned offset = (&MO == &MI.getOperand(0)) ? 0 : 4;
 | 
						|
    Fixups.push_back(MCFixup::create(offset, MO.getExpr(), FK_SecRel_4, MI.getLoc()));
 | 
						|
    return 0;
 | 
						|
  }
 | 
						|
 | 
						|
  assert(MO.isImm());
 | 
						|
  return MO.getImm();
 | 
						|
}
 | 
						|
 | 
						|
#include "AMDGPUGenMCCodeEmitter.inc"
 |