v811_spc009/external/llvm/lib/Target/AMDGPU/AMDGPUTargetTransformInfo.h

//===-- AMDGPUTargetTransformInfo.h - AMDGPU specific TTI -------*- C++ -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
/// \file
/// This file a TargetTransformInfo::Concept conforming object specific to the
/// AMDGPU target machine. It uses the target's detailed information to
/// provide more precise answers to certain TTI queries, while letting the
/// target independent and default TTI implementations handle the rest.
///
//===----------------------------------------------------------------------===//

#ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETTRANSFORMINFO_H
#define LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETTRANSFORMINFO_H

#include "AMDGPU.h"
#include "AMDGPUTargetMachine.h"
#include "llvm/Analysis/TargetTransformInfo.h"
#include "llvm/CodeGen/BasicTTIImpl.h"

namespace llvm {
class AMDGPUTargetLowering;

class AMDGPUTTIImpl final : public BasicTTIImplBase<AMDGPUTTIImpl> {
  typedef BasicTTIImplBase<AMDGPUTTIImpl> BaseT;
  typedef TargetTransformInfo TTI;
  friend BaseT;

  const AMDGPUSubtarget *ST;
  const AMDGPUTargetLowering *TLI;

  const AMDGPUSubtarget *getST() const { return ST; }
  const AMDGPUTargetLowering *getTLI() const { return TLI; }


  static inline int getFullRateInstrCost() {
    return TargetTransformInfo::TCC_Basic;
  }

  static inline int getHalfRateInstrCost() {
    return 2 * TargetTransformInfo::TCC_Basic;
  }

  // TODO: The size is usually 8 bytes, but takes 4x as many cycles. Maybe
  // should be 2 or 4.
  static inline int getQuarterRateInstrCost() {
    return 3 * TargetTransformInfo::TCC_Basic;
  }

   // On some parts, normal fp64 operations are half rate, and others
   // quarter. This also applies to some integer operations.
  inline int get64BitInstrCost() const {
    return ST->hasHalfRate64Ops() ?
      getHalfRateInstrCost() : getQuarterRateInstrCost();
  }

public:
  explicit AMDGPUTTIImpl(const AMDGPUTargetMachine *TM, const Function &F)
    : BaseT(TM, F.getParent()->getDataLayout()),
      ST(TM->getSubtargetImpl(F)),
      TLI(ST->getTargetLowering()) {}

  // Provide value semantics. MSVC requires that we spell all of these out.
  AMDGPUTTIImpl(const AMDGPUTTIImpl &Arg)
      : BaseT(static_cast<const BaseT &>(Arg)), ST(Arg.ST), TLI(Arg.TLI) {}
  AMDGPUTTIImpl(AMDGPUTTIImpl &&Arg)
      : BaseT(std::move(static_cast<BaseT &>(Arg))), ST(std::move(Arg.ST)),
        TLI(std::move(Arg.TLI)) {}

  bool hasBranchDivergence() { return true; }

  void getUnrollingPreferences(Loop *L, TTI::UnrollingPreferences &UP);

  TTI::PopcntSupportKind getPopcntSupport(unsigned TyWidth) {
    assert(isPowerOf2_32(TyWidth) && "Ty width must be power of 2");
    return TTI::PSK_FastHardware;
  }

  unsigned getNumberOfRegisters(bool Vector);
  unsigned getRegisterBitWidth(bool Vector);
  unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace);
  unsigned getMaxInterleaveFactor(unsigned VF);

  int getArithmeticInstrCost(
    unsigned Opcode, Type *Ty,
    TTI::OperandValueKind Opd1Info = TTI::OK_AnyValue,
    TTI::OperandValueKind Opd2Info = TTI::OK_AnyValue,
    TTI::OperandValueProperties Opd1PropInfo = TTI::OP_None,
    TTI::OperandValueProperties Opd2PropInfo = TTI::OP_None);

  unsigned getCFInstrCost(unsigned Opcode);

  int getVectorInstrCost(unsigned Opcode, Type *ValTy, unsigned Index);
  bool isSourceOfDivergence(const Value *V) const;

  unsigned getVectorSplitCost() { return 0; }
};

} // end namespace llvm

#endif
v811_spc009_project 4 months ago			`//===-- AMDGPUTargetTransformInfo.h - AMDGPU specific TTI -------- C++ --===//`
			`//`
			`// The LLVM Compiler Infrastructure`
			`//`
			`// This file is distributed under the University of Illinois Open Source`
			`// License. See LICENSE.TXT for details.`
			`//`
			`//===----------------------------------------------------------------------===//`
			`/// \file`
			`/// This file a TargetTransformInfo::Concept conforming object specific to the`
			`/// AMDGPU target machine. It uses the target's detailed information to`
			`/// provide more precise answers to certain TTI queries, while letting the`
			`/// target independent and default TTI implementations handle the rest.`
			`///`
			`//===----------------------------------------------------------------------===//`

			`#ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETTRANSFORMINFO_H`
			`#define LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETTRANSFORMINFO_H`

			`#include "AMDGPU.h"`
			`#include "AMDGPUTargetMachine.h"`
			`#include "llvm/Analysis/TargetTransformInfo.h"`
			`#include "llvm/CodeGen/BasicTTIImpl.h"`

			`namespace llvm {`
			`class AMDGPUTargetLowering;`

			`class AMDGPUTTIImpl final : public BasicTTIImplBase<AMDGPUTTIImpl> {`
			`typedef BasicTTIImplBase<AMDGPUTTIImpl> BaseT;`
			`typedef TargetTransformInfo TTI;`
			`friend BaseT;`

			`const AMDGPUSubtarget *ST;`
			`const AMDGPUTargetLowering *TLI;`

			`const AMDGPUSubtarget *getST() const { return ST; }`
			`const AMDGPUTargetLowering *getTLI() const { return TLI; }`


			`static inline int getFullRateInstrCost() {`
			`return TargetTransformInfo::TCC_Basic;`
			`}`

			`static inline int getHalfRateInstrCost() {`
			`return 2 * TargetTransformInfo::TCC_Basic;`
			`}`

			`// TODO: The size is usually 8 bytes, but takes 4x as many cycles. Maybe`
			`// should be 2 or 4.`
			`static inline int getQuarterRateInstrCost() {`
			`return 3 * TargetTransformInfo::TCC_Basic;`
			`}`

			`// On some parts, normal fp64 operations are half rate, and others`
			`// quarter. This also applies to some integer operations.`
			`inline int get64BitInstrCost() const {`
			`return ST->hasHalfRate64Ops() ?`
			`getHalfRateInstrCost() : getQuarterRateInstrCost();`
			`}`

			`public:`
			`explicit AMDGPUTTIImpl(const AMDGPUTargetMachine *TM, const Function &F)`
			`: BaseT(TM, F.getParent()->getDataLayout()),`
			`ST(TM->getSubtargetImpl(F)),`
			`TLI(ST->getTargetLowering()) {}`

			`// Provide value semantics. MSVC requires that we spell all of these out.`
			`AMDGPUTTIImpl(const AMDGPUTTIImpl &Arg)`
			`: BaseT(static_cast<const BaseT &>(Arg)), ST(Arg.ST), TLI(Arg.TLI) {}`
			`AMDGPUTTIImpl(AMDGPUTTIImpl &&Arg)`
			`: BaseT(std::move(static_cast<BaseT &>(Arg))), ST(std::move(Arg.ST)),`
			`TLI(std::move(Arg.TLI)) {}`

			`bool hasBranchDivergence() { return true; }`

			`void getUnrollingPreferences(Loop *L, TTI::UnrollingPreferences &UP);`

			`TTI::PopcntSupportKind getPopcntSupport(unsigned TyWidth) {`
			`assert(isPowerOf2_32(TyWidth) && "Ty width must be power of 2");`
			`return TTI::PSK_FastHardware;`
			`}`

			`unsigned getNumberOfRegisters(bool Vector);`
			`unsigned getRegisterBitWidth(bool Vector);`
			`unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace);`
			`unsigned getMaxInterleaveFactor(unsigned VF);`

			`int getArithmeticInstrCost(`
			`unsigned Opcode, Type *Ty,`
			`TTI::OperandValueKind Opd1Info = TTI::OK_AnyValue,`
			`TTI::OperandValueKind Opd2Info = TTI::OK_AnyValue,`
			`TTI::OperandValueProperties Opd1PropInfo = TTI::OP_None,`
			`TTI::OperandValueProperties Opd2PropInfo = TTI::OP_None);`

			`unsigned getCFInstrCost(unsigned Opcode);`

			`int getVectorInstrCost(unsigned Opcode, Type *ValTy, unsigned Index);`
			`bool isSourceOfDivergence(const Value *V) const;`

			`unsigned getVectorSplitCost() { return 0; }`
			`};`

			`} // end namespace llvm`

			`#endif`