mirror of
https://github.com/llvm/llvm-project.git
synced 2025-04-27 02:56:05 +00:00

'reduction' has a few restrictions over normal 'var-list' clauses: 1- On parallel, a num_gangs can only have 1 argument when combined with reduction. These two aren't able to be combined on any other of the compute constructs however. 2- The vars all must be 'numerical data types' types of some sort, or a 'composite of numerical data types'. A list of types is given in the standard as a minimum, so we choose 'isScalar', which covers all of these types and keeps types that are actually numeric. Other compilers don't seem to implement the 'composite of numerical data types', though we do. 3- Because of the above restrictions, member-of-composite is not allowed, so any access via a memberexpr is disallowed. Array-element and sub-arrays (aka array sections) are both permitted, so long as they meet the requirements of #2. This patch implements all of these for compute constructs.
163 lines
5.4 KiB
C++
163 lines
5.4 KiB
C++
// RUN: %clang_cc1 -fopenacc -Wno-openacc-deprecated-clause-alias -ast-print %s -o - | FileCheck %s
|
|
|
|
void foo() {
|
|
int i;
|
|
int *iPtr;
|
|
float array[5];
|
|
float *arrayPtr[5];
|
|
// CHECK: #pragma acc parallel default(none)
|
|
// CHECK-NEXT: while (true)
|
|
#pragma acc parallel default(none)
|
|
while(true);
|
|
// CHECK: #pragma acc serial default(present)
|
|
// CHECK-NEXT: while (true)
|
|
#pragma acc serial default(present)
|
|
while(true);
|
|
// CHECK: #pragma acc kernels if(i == array[1])
|
|
// CHECK-NEXT: while (true)
|
|
#pragma acc kernels if(i == array[1])
|
|
while(true);
|
|
// CHECK: #pragma acc parallel self(i == 3)
|
|
// CHECK-NEXT: while (true)
|
|
#pragma acc parallel self(i == 3)
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel num_gangs(i, (int)array[2])
|
|
// CHECK-NEXT: while (true)
|
|
#pragma acc parallel num_gangs(i, (int)array[2])
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel num_workers(i)
|
|
// CHECK-NEXT: while (true)
|
|
#pragma acc parallel num_workers(i)
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel vector_length((int)array[1])
|
|
// CHECK-NEXT: while (true)
|
|
#pragma acc parallel vector_length((int)array[1])
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel private(i, array[1], array, array[1:2])
|
|
#pragma acc parallel private(i, array[1], array, array[1:2])
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel firstprivate(i, array[1], array, array[1:2])
|
|
#pragma acc parallel firstprivate(i, array[1], array, array[1:2])
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel no_create(i, array[1], array, array[1:2])
|
|
#pragma acc parallel no_create(i, array[1], array, array[1:2])
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel present(i, array[1], array, array[1:2])
|
|
#pragma acc parallel present(i, array[1], array, array[1:2])
|
|
while(true);
|
|
// CHECK: #pragma acc parallel no_create(i, array[1], array, array[1:2]) present(i, array[1], array, array[1:2])
|
|
#pragma acc parallel no_create(i, array[1], array, array[1:2]) present(i, array[1], array, array[1:2])
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel copyin(i, array[1], array, array[1:2]) pcopyin(readonly: i, array[1], array, array[1:2]) present_or_copyin(i, array[1], array, array[1:2])
|
|
#pragma acc parallel copyin(i, array[1], array, array[1:2]) pcopyin(readonly:i, array[1], array, array[1:2]) present_or_copyin(i, array[1], array, array[1:2])
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel copyout(i, array[1], array, array[1:2]) pcopyout(zero: i, array[1], array, array[1:2]) present_or_copyout(i, array[1], array, array[1:2])
|
|
#pragma acc parallel copyout(i, array[1], array, array[1:2]) pcopyout(zero: i, array[1], array, array[1:2]) present_or_copyout(i, array[1], array, array[1:2])
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel create(i, array[1], array, array[1:2]) pcreate(zero: i, array[1], array, array[1:2]) present_or_create(i, array[1], array, array[1:2])
|
|
#pragma acc parallel create(i, array[1], array, array[1:2]) pcreate(zero: i, array[1], array, array[1:2]) present_or_create(i, array[1], array, array[1:2])
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc serial attach(iPtr, arrayPtr[0])
|
|
#pragma acc serial attach(iPtr, arrayPtr[0])
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc kernels deviceptr(iPtr, arrayPtr[0])
|
|
#pragma acc kernels deviceptr(iPtr, arrayPtr[0])
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc kernels async(*iPtr)
|
|
#pragma acc kernels async(*iPtr)
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc kernels async
|
|
#pragma acc kernels async
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel wait
|
|
#pragma acc parallel wait
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel wait()
|
|
#pragma acc parallel wait()
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel wait(*iPtr, i)
|
|
#pragma acc parallel wait(*iPtr, i)
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel wait(queues: *iPtr, i)
|
|
#pragma acc parallel wait(queues:*iPtr, i)
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel wait(devnum: i : *iPtr, i)
|
|
#pragma acc parallel wait(devnum:i:*iPtr, i)
|
|
while(true);
|
|
|
|
// CHECK: #pragma acc parallel wait(devnum: i : queues: *iPtr, i)
|
|
#pragma acc parallel wait(devnum:i:queues:*iPtr, i)
|
|
while(true);
|
|
|
|
bool SomeB;
|
|
struct SomeStruct{} SomeStructImpl;
|
|
|
|
//CHECK: #pragma acc parallel dtype(SomeB)
|
|
#pragma acc parallel dtype(SomeB)
|
|
while(true);
|
|
|
|
//CHECK: #pragma acc parallel device_type(SomeStruct)
|
|
#pragma acc parallel device_type(SomeStruct)
|
|
while(true);
|
|
|
|
//CHECK: #pragma acc parallel device_type(int)
|
|
#pragma acc parallel device_type(int)
|
|
while(true);
|
|
|
|
//CHECK: #pragma acc parallel dtype(bool)
|
|
#pragma acc parallel dtype(bool)
|
|
while(true);
|
|
|
|
//CHECK: #pragma acc parallel device_type(SomeStructImpl)
|
|
#pragma acc parallel device_type (SomeStructImpl)
|
|
while(true);
|
|
|
|
//CHECK: #pragma acc parallel reduction(+: iPtr)
|
|
#pragma acc parallel reduction(+: iPtr)
|
|
while(true);
|
|
//CHECK: #pragma acc parallel reduction(*: i)
|
|
#pragma acc parallel reduction(*: i)
|
|
while(true);
|
|
//CHECK: #pragma acc parallel reduction(max: SomeB)
|
|
#pragma acc parallel reduction(max: SomeB)
|
|
while(true);
|
|
//CHECK: #pragma acc parallel reduction(min: iPtr)
|
|
#pragma acc parallel reduction(min: iPtr)
|
|
while(true);
|
|
//CHECK: #pragma acc parallel reduction(&: i)
|
|
#pragma acc parallel reduction(&: i)
|
|
while(true);
|
|
//CHECK: #pragma acc parallel reduction(|: SomeB)
|
|
#pragma acc parallel reduction(|: SomeB)
|
|
while(true);
|
|
//CHECK: #pragma acc parallel reduction(^: iPtr)
|
|
#pragma acc parallel reduction(^: iPtr)
|
|
while(true);
|
|
//CHECK: #pragma acc parallel reduction(&&: i)
|
|
#pragma acc parallel reduction(&&: i)
|
|
while(true);
|
|
//CHECK: #pragma acc parallel reduction(||: SomeB)
|
|
#pragma acc parallel reduction(||: SomeB)
|
|
while(true);
|
|
}
|
|
|