/src/llvm-project/llvm/lib/Target/NVPTX/NVPTXSubtarget.h

Source (jump to first uncovered line)
//=====-- NVPTXSubtarget.h - Define Subtarget for the NVPTX ---*- C++ -*--====//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file declares the NVPTX specific subclass of TargetSubtarget.
//
//===----------------------------------------------------------------------===//

#ifndef LLVM_LIB_TARGET_NVPTX_NVPTXSUBTARGET_H
#define LLVM_LIB_TARGET_NVPTX_NVPTXSUBTARGET_H

#include "NVPTX.h"
#include "NVPTXFrameLowering.h"
#include "NVPTXISelLowering.h"
#include "NVPTXInstrInfo.h"
#include "NVPTXRegisterInfo.h"
#include "llvm/CodeGen/SelectionDAGTargetInfo.h"
#include "llvm/CodeGen/TargetSubtargetInfo.h"
#include "llvm/IR/DataLayout.h"
#include <string>

#define GET_SUBTARGETINFO_HEADER
#include "NVPTXGenSubtargetInfo.inc"

namespace llvm {

/// NVPTX-specific subtarget description.
///
/// Extends the generated NVPTXGenSubtargetInfo (pulled in from
/// NVPTXGenSubtargetInfo.inc) with the PTX ISA version and the SM architecture
/// version, and owns the instruction-info, target-lowering, SelectionDAG-info
/// and frame-lowering objects handed out by the accessors below.
class NVPTXSubtarget : public NVPTXGenSubtargetInfo {
  // Declared here, defined out of line. NOTE(review): presumably the usual
  // LLVM "anchor" used to pin the vtable to one translation unit -- confirm
  // against the .cpp file.
  virtual void anchor();

  // Name of the selected target; returned by getTargetName().
  std::string TargetName;

  // PTX version x.y is represented as 10*x+y, e.g. 3.1 == 31
  unsigned PTXVersion;

  // Full SM version x.y is represented as 100*x+10*y+feature, e.g. 3.1 == 310
  // sm_90a == 901
  unsigned int FullSmVersion;

  // SM version x.y is represented as 10*x+y, e.g. 3.1 == 31. Derived from
  // FullSmVersion.
  unsigned int SmVersion;

  // NOTE: the members below are declared in a deliberate order; C++
  // initializes data members in declaration order, so do not reorder them
  // without checking the constructor.
  const NVPTXTargetMachine &TM;
  NVPTXInstrInfo InstrInfo;
  NVPTXTargetLowering TLInfo;
  SelectionDAGTargetInfo TSInfo;

  // NVPTX does not have any call stack frame, but need a NVPTX specific
  // FrameLowering class because TargetFrameLowering is abstract.
  NVPTXFrameLowering FrameLowering;

public:
  /// This constructor initializes the data members to match that
  /// of the specified module.
  ///
  NVPTXSubtarget(const Triple &TT, const std::string &CPU,
                 const std::string &FS, const NVPTXTargetMachine &TM);

  /// \returns the frame-lowering object owned by this subtarget.
  const TargetFrameLowering *getFrameLowering() const override {
    return &FrameLowering;
  }

  /// \returns the instruction-info object owned by this subtarget.
  const NVPTXInstrInfo *getInstrInfo() const override { return &InstrInfo; }

  /// \returns the register info, which is held by the instruction info.
  const NVPTXRegisterInfo *getRegisterInfo() const override {
    return &InstrInfo.getRegisterInfo();
  }

  /// \returns the target-lowering object owned by this subtarget.
  const NVPTXTargetLowering *getTargetLowering() const override {
    return &TLInfo;
  }

  /// \returns the SelectionDAG target-info object owned by this subtarget.
  const SelectionDAGTargetInfo *getSelectionDAGInfo() const override {
    return &TSInfo;
  }

  // Feature predicates. Each one is a pure threshold test on the SM version
  // (10*x+y encoding) and/or the PTX version (10*x+y encoding).

  /// True for SM 6.0 and newer.
  bool hasAtomAddF64() const { return SmVersion >= 60; }
  /// True for SM 6.0 and newer.
  bool hasAtomScope() const { return SmVersion >= 60; }
  /// True for SM 3.2 and newer.
  bool hasAtomBitwise64() const { return SmVersion >= 32; }
  /// True for SM 3.2 and newer.
  bool hasAtomMinMax64() const { return SmVersion >= 32; }
  /// True for SM 3.2 and newer.
  bool hasLDG() const { return SmVersion >= 32; }
  /// True for SM 3.2 and newer.
  bool hasHWROT32() const { return SmVersion >= 32; }
  /// Defined out of line.
  bool hasImageHandles() const;
  /// True for SM 5.3 and newer.
  bool hasFP16Math() const { return SmVersion >= 53; }
  /// True for SM 8.0 and newer.
  bool hasBF16Math() const { return SmVersion >= 80; }
  /// Defined out of line.
  bool allowFP16Math() const;
  /// True for PTX 7.1 and newer (independent of the SM version).
  bool hasMaskOperator() const { return PTXVersion >= 71; }
  /// True only when both SM is 3.0 or newer and PTX is 6.4 or newer.
  bool hasNoReturn() const { return SmVersion >= 30 && PTXVersion >= 64; }

  /// \returns the full SM version, encoded as 100*x+10*y+feature.
  unsigned int getFullSmVersion() const { return FullSmVersion; }

  /// \returns the SM version encoded as 10*x+y, i.e. the full SM version with
  /// its trailing feature digit dropped.
  unsigned int getSmVersion() const { return getFullSmVersion() / 10; }

  // GPUs with "a" suffix include architecture-accelerated features that are
  // supported on the specified architecture only, hence such targets do not
  // follow the onion layer model. hasAAFeatures() allows distinguishing such
  // GPU variants from the base GPU architecture. It inspects the feature
  // digit (the last decimal digit) of the full SM version:
  // - 0 represents base GPU model, and yields false,
  // - a non-zero digit identifies an architecture-accelerated variant, and
  //   yields true.
  bool hasAAFeatures() const { return getFullSmVersion() % 10 != 0; }

  /// \returns a copy of the target name.
  std::string getTargetName() const { return TargetName; }

  // Get maximum value of required alignments among the supported data types.
  // From the PTX ISA doc, section 8.2.3:
  //  The memory consistency model relates operations executed on memory
  //  locations with scalar data-types, which have a maximum size and alignment
  //  of 64 bits. Memory operations with a vector data-type are modelled as a
  //  set of equivalent memory operations with a scalar data-type, executed in
  //  an unspecified order on the elements in the vector.
  // The value is expressed in bytes (64 bits == 8 bytes).
  unsigned getMaxRequiredAlignment() const { return 8; }

  /// \returns the PTX version, encoded as 10*x+y.
  unsigned getPTXVersion() const { return PTXVersion; }

  /// Defined out of line; returns a reference to an NVPTXSubtarget.
  /// NOTE(review): presumably parses \p CPU / \p FS and returns *this so it
  /// can be used inside the constructor's initializer list -- confirm against
  /// the .cpp file.
  NVPTXSubtarget &initializeSubtargetDependencies(StringRef CPU, StringRef FS);

  /// Declared here; the definition is not in this header.
  /// NOTE(review): presumably supplied by the generated subtarget info
  /// (NVPTXGenSubtargetInfo.inc) -- confirm.
  void ParseSubtargetFeatures(StringRef CPU, StringRef TuneCPU, StringRef FS);
};

} // End llvm namespace

#endif

Line	Count	Source (jump to first uncovered line)
1		//=====-- NVPTXSubtarget.h - Define Subtarget for the NVPTX ---*- C++ -*--====//
2		//
3		// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4		// See https://llvm.org/LICENSE.txt for license information.
5		// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6		//
7		//===----------------------------------------------------------------------===//
8		//
9		// This file declares the NVPTX specific subclass of TargetSubtarget.
10		//
11		//===----------------------------------------------------------------------===//
12
13		#ifndef LLVM_LIB_TARGET_NVPTX_NVPTXSUBTARGET_H
14		#define LLVM_LIB_TARGET_NVPTX_NVPTXSUBTARGET_H
15
16		#include "NVPTX.h"
17		#include "NVPTXFrameLowering.h"
18		#include "NVPTXISelLowering.h"
19		#include "NVPTXInstrInfo.h"
20		#include "NVPTXRegisterInfo.h"
21		#include "llvm/CodeGen/SelectionDAGTargetInfo.h"
22		#include "llvm/CodeGen/TargetSubtargetInfo.h"
23		#include "llvm/IR/DataLayout.h"
24		#include <string>
25
26		#define GET_SUBTARGETINFO_HEADER
27		#include "NVPTXGenSubtargetInfo.inc"
28
29		namespace llvm {
30
31		class NVPTXSubtarget : public NVPTXGenSubtargetInfo {
32		virtual void anchor();
33		std::string TargetName;
34
35		// PTX version x.y is represented as 10*x+y, e.g. 3.1 == 31
36		unsigned PTXVersion;
37
38		// Full SM version x.y is represented as 100*x+10*y+feature, e.g. 3.1 == 310
39		// sm_90a == 901
40		unsigned int FullSmVersion;
41
42		// SM version x.y is represented as 10*x+y, e.g. 3.1 == 31. Derived from
43		// FullSmVersion.
44		unsigned int SmVersion;
45
46		const NVPTXTargetMachine &TM;
47		NVPTXInstrInfo InstrInfo;
48		NVPTXTargetLowering TLInfo;
49		SelectionDAGTargetInfo TSInfo;
50
51		// NVPTX does not have any call stack frame, but need a NVPTX specific
52		// FrameLowering class because TargetFrameLowering is abstract.
53		NVPTXFrameLowering FrameLowering;
54
55		public:
56		/// This constructor initializes the data members to match that
57		/// of the specified module.
58		///
59		NVPTXSubtarget(const Triple &TT, const std::string &CPU,
60		const std::string &FS, const NVPTXTargetMachine &TM);
61
62	4.42k	const TargetFrameLowering *getFrameLowering() const override {
63	4.42k	return &FrameLowering;
64	4.42k	}
65	16.8k	const NVPTXInstrInfo *getInstrInfo() const override { return &InstrInfo; }
66	55.3k	const NVPTXRegisterInfo *getRegisterInfo() const override {
67	55.3k	return &InstrInfo.getRegisterInfo();
68	55.3k	}
69	28.2k	const NVPTXTargetLowering *getTargetLowering() const override {
70	28.2k	return &TLInfo;
71	28.2k	}
72	2.95k	const SelectionDAGTargetInfo *getSelectionDAGInfo() const override {
73	2.95k	return &TSInfo;
74	2.95k	}
75
76	0	bool hasAtomAddF64() const { return SmVersion >= 60; }
77	0	bool hasAtomScope() const { return SmVersion >= 60; }
78	0	bool hasAtomBitwise64() const { return SmVersion >= 32; }
79	0	bool hasAtomMinMax64() const { return SmVersion >= 32; }
80	3.88k	bool hasLDG() const { return SmVersion >= 32; }
81	0	inline bool hasHWROT32() const { return SmVersion >= 32; }
82		bool hasImageHandles() const;
83	42	bool hasFP16Math() const { return SmVersion >= 53; }
84	56	bool hasBF16Math() const { return SmVersion >= 80; }
85		bool allowFP16Math() const;
86	0	bool hasMaskOperator() const { return PTXVersion >= 71; }
87	738	bool hasNoReturn() const { return SmVersion >= 30 && PTXVersion >= 64; }
88	3.75k	unsigned int getFullSmVersion() const { return FullSmVersion; }
89	3.75k	unsigned int getSmVersion() const { return getFullSmVersion() / 10; }
90		// GPUs with "a" suffix have include architecture-accelerated features that
91		// are supported on the specified architecture only, hence such targets do not
92		// follow the onion layer model. hasAAFeatures() allows distinguishing such
93		// GPU variants from the base GPU architecture.
94		// - 0 represents base GPU model,
95		// - non-zero value identifies particular architecture-accelerated variant.
96	0	bool hasAAFeatures() const { return getFullSmVersion() % 10; }
97	740	std::string getTargetName() const { return TargetName; }
98
99		// Get maximum value of required alignments among the supported data types.
100		// From the PTX ISA doc, section 8.2.3:
101		// The memory consistency model relates operations executed on memory
102		// locations with scalar data-types, which have a maximum size and alignment
103		// of 64 bits. Memory operations with a vector data-type are modelled as a
104		// set of equivalent memory operations with a scalar data-type, executed in
105		// an unspecified order on the elements in the vector.
106	0	unsigned getMaxRequiredAlignment() const { return 8; }
107
108	742	unsigned getPTXVersion() const { return PTXVersion; }
109
110		NVPTXSubtarget &initializeSubtargetDependencies(StringRef CPU, StringRef FS);
111		void ParseSubtargetFeatures(StringRef CPU, StringRef TuneCPU, StringRef FS);
112		};
113
114		} // End llvm namespace
115
116		#endif

Coverage Report

Created: 2024-01-17 10:31