Skip to content

Commit

Permalink
SWDEV-233718 update to final change in trunk
Browse files Browse the repository at this point in the history
[CUDA][HIP] Fix constexpr variables for C++17

constexpr variables are compile time constants and implicitly const, therefore
they are safe to emit on both device and host side. Besides, in many cases
they are intended for both device and host, therefore it makes sense
to emit them on both device and host sides if necessary.

In most cases constexpr variables are used as rvalue and the variables
themselves do not need to be emitted. However if their address is taken,
then they need to be emitted.

For C++14, clang is able to handle that since clang emits them with
available_externally linkage together with the initializer.

However for C++17, the constexpr static data member of a class or template class
become inline variables implicitly. Therefore they become definitions with
linkonce_odr or weak_odr linkages. As such, they can not have available_externally
linkage.

This patch fixes that by adding implicit constant attribute to
file scope constexpr variables and constexpr static data members
in device compilation.

Differential Revision: https://reviews.llvm.org/D79237

Change-Id: I7960fac9511daf4d966264c19fcedac25d84590a
  • Loading branch information
yxsamliu committed Jun 5, 2020
1 parent a8cf844 commit e22a0f0
Show file tree
Hide file tree
Showing 7 changed files with 121 additions and 14 deletions.
4 changes: 4 additions & 0 deletions clang/include/clang/Sema/Sema.h
Original file line number Diff line number Diff line change
Expand Up @@ -11656,6 +11656,10 @@ class Sema final {
void maybeAddCUDAHostDeviceAttrs(FunctionDecl *FD,
const LookupResult &Previous);

/// May add implicit CUDAConstantAttr attribute to VD, depending on VD
/// and current compilation settings.
void MaybeAddCUDAConstantAttr(VarDecl *VD);

public:
/// Check whether we're allowed to call Callee from the current context.
///
Expand Down
6 changes: 1 addition & 5 deletions clang/lib/CodeGen/CodeGenModule.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -2516,16 +2516,12 @@ void CodeGenModule::EmitGlobal(GlobalDecl GD) {
// If this is CUDA, be selective about which declarations we emit.
if (LangOpts.CUDA) {
if (LangOpts.CUDAIsDevice) {
bool IsConstexprVar = false;
if (auto *VD = dyn_cast<VarDecl>(Global))
IsConstexprVar = VD->isConstexpr();
if (!Global->hasAttr<CUDADeviceAttr>() &&
!Global->hasAttr<CUDAGlobalAttr>() &&
!Global->hasAttr<CUDAConstantAttr>() &&
!Global->hasAttr<CUDASharedAttr>() &&
!Global->getType()->isCUDADeviceBuiltinSurfaceType() &&
!Global->getType()->isCUDADeviceBuiltinTextureType() &&
!IsConstexprVar)
!Global->getType()->isCUDADeviceBuiltinTextureType())
return;
} else {
// We need to emit host-side 'shadows' for all global
Expand Down
18 changes: 15 additions & 3 deletions clang/lib/Sema/SemaCUDA.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -528,9 +528,14 @@ void Sema::checkAllowedCUDAInitializer(VarDecl *VD) {
// constructor according to CUDA rules. This deviates from NVCC,
// but allows us to handle things like constexpr constructors.
if (!AllowedInit &&
(VD->hasAttr<CUDADeviceAttr>() || VD->hasAttr<CUDAConstantAttr>()))
AllowedInit = VD->getInit()->isConstantInitializer(
Context, VD->getType()->isReferenceType());
(VD->hasAttr<CUDADeviceAttr>() || VD->hasAttr<CUDAConstantAttr>())) {
auto *Init = VD->getInit();
AllowedInit =
((VD->getType()->isDependentType() || Init->isValueDependent()) &&
VD->isConstexpr()) ||
Init->isConstantInitializer(Context,
VD->getType()->isReferenceType());
}

// Also make sure that destructor, if there is one, is empty.
if (AllowedInit)
Expand Down Expand Up @@ -627,6 +632,13 @@ void Sema::maybeAddCUDAHostDeviceAttrs(FunctionDecl *NewD,
NewD->addAttr(CUDADeviceAttr::CreateImplicit(Context));
}

void Sema::MaybeAddCUDAConstantAttr(VarDecl *VD) {
if (getLangOpts().CUDAIsDevice && VD->isConstexpr() &&
(VD->isFileVarDecl() || VD->isStaticDataMember())) {
VD->addAttr(CUDAConstantAttr::CreateImplicit(getASTContext()));
}
}

Sema::DeviceDiagBuilder Sema::CUDADiagIfDeviceCode(SourceLocation Loc,
unsigned DiagID) {
assert(getLangOpts().CUDA && "Should only be called during CUDA compilation");
Expand Down
1 change: 1 addition & 0 deletions clang/lib/Sema/SemaDecl.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -7081,6 +7081,7 @@ NamedDecl *Sema::ActOnVariableDeclarator(

case CSK_constexpr:
NewVD->setConstexpr(true);
MaybeAddCUDAConstantAttr(NewVD);
// C++1z [dcl.spec.constexpr]p1:
// A static data member declared with the constexpr specifier is
// implicitly an inline variable.
Expand Down
1 change: 1 addition & 0 deletions clang/lib/Sema/SemaTemplateInstantiateDecl.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -4836,6 +4836,7 @@ void Sema::BuildVariableInstantiation(
NewVar->setCXXForRangeDecl(OldVar->isCXXForRangeDecl());
NewVar->setObjCForDecl(OldVar->isObjCForDecl());
NewVar->setConstexpr(OldVar->isConstexpr());
MaybeAddCUDAConstantAttr(NewVar);
NewVar->setInitCapture(OldVar->isInitCapture());
NewVar->setPreviousDeclInSameBlockScope(
OldVar->isPreviousDeclInSameBlockScope());
Expand Down
25 changes: 19 additions & 6 deletions clang/test/CodeGenCUDA/constexpr-variables.cu
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
// RUN: %clang_cc1 -std=c++14 %s -emit-llvm -o - -triple nvptx \
// RUN: -fcuda-is-device | FileCheck --check-prefixes=COM,CXX14 %s
// RUN: -fcuda-is-device | FileCheck --check-prefixes=CXX14 %s
// RUN: %clang_cc1 -std=c++17 %s -emit-llvm -o - -triple nvptx \
// RUN: -fcuda-is-device | FileCheck --check-prefixes=COM,CXX17 %s
// RUN: -fcuda-is-device | FileCheck --check-prefixes=CXX17 %s

#include "Inputs/cuda.h"

Expand All @@ -16,15 +16,28 @@ namespace B {
__constant__ const int &use_B_b = B::b;

struct Q {
// CXX14: @_ZN1Q1kE = available_externally {{.*}}constant i32 5
// CXX17: @_ZN1Q1kE = linkonce_odr {{.*}}constant i32 5
static constexpr int k = 5;
// CXX14: @_ZN1Q2k2E = {{.*}}externally_initialized constant i32 6
// CXX17: @_ZN1Q2k2E = internal {{.*}}constant i32 6
// CXX14: @_ZN1Q2k1E = available_externally {{.*}}constant i32 5
// CXX17: @_ZN1Q2k1E = linkonce_odr {{.*}}constant i32 5
static constexpr int k1 = 5;
static constexpr int k2 = 6;
};
__constant__ const int &use_Q_k = Q::k;
constexpr int Q::k2;

__constant__ const int &use_Q_k1 = Q::k1;
__constant__ const int &use_Q_k2 = Q::k2;

template<typename T> struct X {
// CXX14: @_ZN1XIiE1aE = available_externally {{.*}}constant i32 123
// CXX17: @_ZN1XIiE1aE = linkonce_odr {{.*}}constant i32 123
static constexpr int a = 123;
};
__constant__ const int &use_X_a = X<int>::a;

template <typename T, T a, T b> struct A {
// CXX14: @_ZN1AIiLi1ELi2EE1xE = available_externally {{.*}}constant i32 2
// CXX17: @_ZN1AIiLi1ELi2EE1xE = linkonce_odr {{.*}}constant i32 2
constexpr static T x = a * b;
};
__constant__ const int &y = A<int, 1, 2>::x;
80 changes: 80 additions & 0 deletions clang/test/SemaCUDA/constexpr-variables.cu
Original file line number Diff line number Diff line change
@@ -0,0 +1,80 @@
// RUN: %clang_cc1 -std=c++14 %s -emit-llvm -o - -triple nvptx64-nvidia-cuda \
// RUN: -fcuda-is-device -verify -fsyntax-only
// RUN: %clang_cc1 -std=c++17 %s -emit-llvm -o - -triple nvptx64-nvidia-cuda \
// RUN: -fcuda-is-device -verify -fsyntax-only
// RUN: %clang_cc1 -std=c++14 %s -emit-llvm -o - \
// RUN: -triple x86_64-unknown-linux-gnu -verify -fsyntax-only
// RUN: %clang_cc1 -std=c++17 %s -emit-llvm -o - \
// RUN: -triple x86_64-unknown-linux-gnu -verify -fsyntax-only
#include "Inputs/cuda.h"

template<typename T>
__host__ __device__ void foo(const T **a) {
// expected-note@-1 {{declared here}}
static const T b = sizeof(a);
static constexpr T c = sizeof(a);
const T d = sizeof(a);
constexpr T e = sizeof(a);
constexpr T f = **a;
// expected-error@-1 {{constexpr variable 'f' must be initialized by a constant expression}}
// expected-note@-2 {{read of non-constexpr variable 'a' is not allowed in a constant expression}}
a[0] = &b;
a[1] = &c;
a[2] = &d;
a[3] = &e;
}

__device__ void device_fun(const int **a) {
// expected-note@-1 {{declared here}}
constexpr int b = sizeof(a);
static constexpr int c = sizeof(a);
constexpr int d = **a;
// expected-error@-1 {{constexpr variable 'd' must be initialized by a constant expression}}
// expected-note@-2 {{read of non-constexpr variable 'a' is not allowed in a constant expression}}
a[0] = &b;
a[1] = &c;
foo(a);
// expected-note@-1 {{in instantiation of function template specialization 'foo<int>' requested here}}
}

void host_fun(const int **a) {
// expected-note@-1 {{declared here}}
constexpr int b = sizeof(a);
static constexpr int c = sizeof(a);
constexpr int d = **a;
// expected-error@-1 {{constexpr variable 'd' must be initialized by a constant expression}}
// expected-note@-2 {{read of non-constexpr variable 'a' is not allowed in a constant expression}}
a[0] = &b;
a[1] = &c;
foo(a);
}

__host__ __device__ void host_device_fun(const int **a) {
// expected-note@-1 {{declared here}}
constexpr int b = sizeof(a);
static constexpr int c = sizeof(a);
constexpr int d = **a;
// expected-error@-1 {{constexpr variable 'd' must be initialized by a constant expression}}
// expected-note@-2 {{read of non-constexpr variable 'a' is not allowed in a constant expression}}
a[0] = &b;
a[1] = &c;
foo(a);
}

template <class T>
struct A {
explicit A() = default;
};
template <class T>
constexpr A<T> a{};

struct B {
static constexpr bool value = true;
};

template<typename T>
struct C {
static constexpr bool value = T::value;
};

__constant__ const bool &x = C<B>::value;

0 comments on commit e22a0f0

Please sign in to comment.