llvm-project/clang/test/AST/ast-dump-atomic-options.hip
Yaxun (Sam) Liu 240f2269ff
Add clang atomic control options and attribute (#114841)
Add option and statement attribute for controlling emitting of
target-specific
metadata to atomicrmw instructions in IR.

The RFC for this attribute and option is

https://discourse.llvm.org/t/rfc-add-clang-atomic-control-options-and-pragmas/80641,
Originally a pragma was proposed, then it was changed to clang
attribute.

This attribute allows users to specify one, two, or all three options
and must be applied
to a compound statement. The attribute can also be nested, with inner
attributes
overriding the options specified by outer attributes or the target's
default
options. These options will then determine the target-specific metadata
added to atomic
instructions in the IR.

In addition to the attribute, three new compiler options are introduced:
`-f[no-]atomic-remote-memory`, `-f[no-]atomic-fine-grained-memory`,
 `-f[no-]atomic-ignore-denormal-mode`.
These compiler options allow users to override the default options
through the
Clang driver and front end. `-m[no-]unsafe-fp-atomics` is aliased to
`-f[no-]ignore-denormal-mode`.

In terms of implementation, the atomic attribute is represented in the
AST by the
existing AttributedStmt, with minimal changes to AST and Sema.

During code generation in Clang, the CodeGenModule maintains the current
atomic options,
which are used to emit the relevant metadata for atomic instructions.
RAII is used
to manage the saving and restoring of atomic options when entering
and exiting nested AttributedStmt.
2025-02-27 10:41:04 -05:00

137 lines
5.1 KiB
Plaintext

// RUN: %clang_cc1 -ast-dump %s | FileCheck %s
// RUN: %clang_cc1 -ast-dump -fcuda-is-device %s | FileCheck %s
// RUN: %clang_cc1 -ast-dump -fcuda-is-device %s \
// RUN: -fatomic-fine-grained-memory -fatomic-ignore-denormal-mode \
// RUN: | FileCheck %s
#include "Inputs/cuda.h"
// CHECK-LABEL: FunctionDecl {{.*}} test_default
// CHECK-NOT: AttributedStmt
// CHECK-NOT: AtomicAttr
// CHECK: CompoundStmt
// CHECK-NEXT: `-AtomicExpr
__device__ __host__ void test_default(float *a) {
__scoped_atomic_fetch_add(a, 1, __ATOMIC_RELAXED, __MEMORY_SCOPE_SYSTEM);
}
// CHECK-LABEL: FunctionDecl {{.*}} test_one
// CHECK: `-AttributedStmt
// CHECK-NEXT: |-AtomicAttr {{.*}} no_remote_memory{{$}}
// CHECK-NEXT: `-CompoundStmt
// CHECK-NEXT: `-AtomicExpr
__device__ __host__ void test_one(float *a) {
[[clang::atomic(no_remote_memory)]] {
__scoped_atomic_fetch_add(a, 1, __ATOMIC_RELAXED, __MEMORY_SCOPE_SYSTEM);
}
}
// CHECK-LABEL: FunctionDecl {{.*}} test_two
// CHECK: `-AttributedStmt
// CHECK-NEXT: |-AtomicAttr {{.*}} remote_memory ignore_denormal_mode{{$}}
// CHECK-NEXT: `-CompoundStmt
// CHECK-NEXT: `-AtomicExpr
__device__ __host__ void test_two(float *a) {
[[clang::atomic(remote_memory, ignore_denormal_mode)]] {
__scoped_atomic_fetch_add(a, 1, __ATOMIC_RELAXED, __MEMORY_SCOPE_SYSTEM);
}
}
// CHECK-LABEL: FunctionDecl {{.*}} test_three
// CHECK: `-AttributedStmt
// CHECK-NEXT: |-AtomicAttr {{.*}} no_remote_memory fine_grained_memory no_ignore_denormal_mode{{$}}
// CHECK-NEXT: `-CompoundStmt
// CHECK-NEXT: `-AtomicExpr
__device__ __host__ void test_three(float *a) {
[[clang::atomic(no_remote_memory, fine_grained_memory, no_ignore_denormal_mode)]] {
__scoped_atomic_fetch_add(a, 1, __ATOMIC_RELAXED, __MEMORY_SCOPE_SYSTEM);
}
}
// CHECK-LABEL: FunctionDecl {{.*}} test_duplicate
// CHECK: `-AttributedStmt
// CHECK-NEXT: |-AtomicAttr {{.*}} no_remote_memory{{$}}
// CHECK-NEXT: `-CompoundStmt
// CHECK-NEXT: `-AtomicExpr
__device__ __host__ void test_duplicate(float *a) {
[[clang::atomic(no_remote_memory, no_remote_memory)]] {
__scoped_atomic_fetch_add(a, 1, __ATOMIC_RELAXED, __MEMORY_SCOPE_SYSTEM);
}
}
// CHECK-LABEL: FunctionDecl {{.*}} test_conflict
// CHECK: `-AttributedStmt
// CHECK-NEXT: |-AtomicAttr {{.*}} remote_memory{{$}}
// CHECK-NEXT: `-CompoundStmt
// CHECK-NEXT: `-AtomicExpr
__device__ __host__ void test_conflict(float *a) {
[[clang::atomic(no_remote_memory, remote_memory)]] {
__scoped_atomic_fetch_add(a, 1, __ATOMIC_RELAXED, __MEMORY_SCOPE_SYSTEM);
}
}
// CHECK-LABEL: FunctionDecl {{.*}} test_multiple_attrs
// CHECK: `-AttributedStmt
// CHECK-NEXT: |-AtomicAttr {{.*}} no_remote_memory{{$}}
// CHECK-NEXT: |-AtomicAttr {{.*}} remote_memory{{$}}
// CHECK-NEXT: `-CompoundStmt
// CHECK-NEXT: `-AtomicExpr
__device__ __host__ void test_multiple_attrs(float *a) {
[[clang::atomic(no_remote_memory)]] [[clang::atomic(remote_memory)]] {
__scoped_atomic_fetch_add(a, 1, __ATOMIC_RELAXED, __MEMORY_SCOPE_SYSTEM);
}
}
// CHECK-LABEL: FunctionDecl {{.*}} test_nested
// CHECK: CompoundStmt
// CHECK: |-AtomicExpr
// CHECK: `-AttributedStmt
// CHECK-NEXT: |-AtomicAttr {{.*}} remote_memory fine_grained_memory no_ignore_denormal_mode{{$}}
// CHECK-NEXT: `-CompoundStmt
// CHECK: |-AtomicExpr
// CHECK: |-AttributedStmt
// CHECK-NEXT: |-AtomicAttr {{.*}} no_remote_memory{{$}}
// CHECK-NEXT: `-CompoundStmt
// CHECK-NEXT: `-AtomicExpr
// CHECK: `-AttributedStmt
// CHECK-NEXT: |-AtomicAttr {{.*}} no_fine_grained_memory{{$}}
// CHECK-NEXT: `-CompoundStmt
// CHECK-NEXT: `-AtomicExpr
__device__ __host__ void test_nested(float *a) {
__scoped_atomic_fetch_add(a, 1, __ATOMIC_RELAXED, __MEMORY_SCOPE_SYSTEM);
[[clang::atomic(remote_memory, fine_grained_memory, no_ignore_denormal_mode)]] {
__scoped_atomic_fetch_max(a, 2, __ATOMIC_SEQ_CST, __MEMORY_SCOPE_DEVICE);
[[clang::atomic(no_remote_memory)]] {
__scoped_atomic_fetch_min(a, 3, __ATOMIC_ACQUIRE, __MEMORY_SCOPE_WRKGRP);
}
[[clang::atomic(no_fine_grained_memory)]] {
__scoped_atomic_fetch_sub(a, 4, __ATOMIC_RELEASE, __MEMORY_SCOPE_WVFRNT);
}
}
}
// CHECK-LABEL: FunctionTemplateDecl {{.*}} test_template
// CHECK: |-FunctionDecl {{.*}} test_template 'void (T *)'
// CHECK: | |-CompoundStmt
// CHECK: | | `-AttributedStmt
// CHECK: | | |-AtomicAttr {{.*}} no_remote_memory fine_grained_memory no_ignore_denormal_mode{{$}}
// CHECK: | | `-CompoundStmt
// CHECK: | | `-CallExpr {{.*}} '<dependent type>'
// CHECK: `-FunctionDecl {{.*}} used test_template 'void (float *)' implicit_instantiation
// CHECK: |-CompoundStmt
// CHECK: | `-AttributedStmt
// CHECK: | |-AtomicAttr {{.*}} no_remote_memory fine_grained_memory no_ignore_denormal_mode{{$}}
// CHECK: | `-CompoundStmt
// CHECK: | `-AtomicExpr {{.*}} 'float'
template<typename T>
__device__ __host__ void test_template(T *a) {
[[clang::atomic(no_remote_memory, fine_grained_memory, no_ignore_denormal_mode)]] {
__scoped_atomic_fetch_add(a, 1, __ATOMIC_RELAXED, __MEMORY_SCOPE_SYSTEM);
}
}
__device__ __host__ void test_template_caller() {
float *p;
test_template(p);
}