1 //===- NVPTXSubtarget.cpp - NVPTX Subtarget Information -------------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 // This file implements the NVPTX specific subclass of TargetSubtarget.
11 //===----------------------------------------------------------------------===//
13 #include "NVPTXSubtarget.h"
14 #include "NVPTXTargetMachine.h"
18 #define DEBUG_TYPE "nvptx-subtarget"
20 #define GET_SUBTARGETINFO_ENUM
21 #define GET_SUBTARGETINFO_TARGET_DESC
22 #define GET_SUBTARGETINFO_CTOR
23 #include "NVPTXGenSubtargetInfo.inc"
26 NoF16Math("nvptx-no-f16-math", cl::Hidden
,
27 cl::desc("NVPTX Specific: Disable generation of f16 math ops."),
29 // Pin the vtable to this file.
30 void NVPTXSubtarget::anchor() {}
32 NVPTXSubtarget
&NVPTXSubtarget::initializeSubtargetDependencies(StringRef CPU
,
34 // Provide the default CPU if we don't have one.
35 TargetName
= std::string(CPU
.empty() ? "sm_30" : CPU
);
37 ParseSubtargetFeatures(TargetName
, /*TuneCPU*/ TargetName
, FS
);
39 // Re-map SM version numbers, SmVersion carries the regular SMs which do
40 // have relative order, while FullSmVersion allows distinguishing sm_90 from
41 // sm_90a, which would *not* be a subset of sm_91.
42 SmVersion
= getSmVersion();
44 // Set default to PTX 6.0 (CUDA 9.0)
45 if (PTXVersion
== 0) {
52 NVPTXSubtarget::NVPTXSubtarget(const Triple
&TT
, const std::string
&CPU
,
53 const std::string
&FS
,
54 const NVPTXTargetMachine
&TM
)
55 : NVPTXGenSubtargetInfo(TT
, CPU
, /*TuneCPU*/ CPU
, FS
), PTXVersion(0),
56 FullSmVersion(200), SmVersion(getSmVersion()), TM(TM
),
57 TLInfo(TM
, initializeSubtargetDependencies(CPU
, FS
)) {}
59 bool NVPTXSubtarget::hasImageHandles() const {
60 // Enable handles for Kepler+, where CUDA supports indirect surfaces and
62 if (TM
.getDrvInterface() == NVPTX::CUDA
)
63 return (SmVersion
>= 30);
65 // Disabled, otherwise
69 bool NVPTXSubtarget::allowFP16Math() const {
70 return hasFP16Math() && NoF16Math
== false;