[Clang][OpenMP] Support expression semantics in target update fields with non-contiguous array sections (#176708)

### Issue: Variable stride not recognized as non-contiguous
`CGOpenMPRuntime.cpp` failed to detect `DeclRefExpr`, `MemberExpr`,
`ArraySubscriptExpr` as non-contiguous.

**Fixes**:

`clang/lib/CodeGen/CGOpenMPRuntime.cpp` - Variable stride detection +
dimension count logic
Detect variable stride expressions
(`DeclRefExpr/MemberExpr/ArraySubscriptExpr`) as non-contiguous

Added testcases to cover stack arrays, heap pointers, struct members,
etc., for expression semantics in non-contiguous update.
This commit is contained in:
Amit Tiwari 2026-03-10 19:26:17 +05:30 committed by GitHub
parent 3548ec9517
commit 14de1bb711
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
10 changed files with 1025 additions and 1 deletions

View File

@ -8054,11 +8054,17 @@ private:
if (!StrideExpr)
return false;
assert(StrideExpr->getType()->isIntegerType() &&
"Stride expression must be of integer type");
// If stride is not evaluatable as a constant, treat as
// non-contiguous.
const auto Constant =
StrideExpr->getIntegerConstantExpr(CGF.getContext());
if (!Constant)
return false;
return true;
// Treat non-unitary strides as non-contiguous.
return !Constant->isOne();
});

View File

@ -0,0 +1,135 @@
// NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py UTC_ARGS: --check-globals --include-generated-funcs --replace-value-regex "__omp_offloading_[0-9a-z]+_[0-9a-z]+" "reduction_size[.].+[.]" "pl_cond[.].+[.|,]" --prefix-filecheck-ir-name _ --global-value-regex "\.offload_.*" --global-hex-value-regex ".offload_maptypes.*" --version 3
// RUN: %clang_cc1 -fopenmp -x c -triple x86_64-unknown-unknown -fopenmp-targets=amdgcn-amd-amdhsa -emit-llvm %s -o - \
// RUN: | FileCheck %s
// Check same results after serialization round-trip
// RUN: %clang_cc1 -fopenmp -x c -triple x86_64-unknown-unknown -fopenmp-targets=amdgcn-amd-amdhsa -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp -x c -triple x86_64-unknown-unknown -fopenmp-targets=amdgcn-amd-amdhsa -include-pch %t -emit-llvm %s -o - \
// RUN: | FileCheck %s
// expected-no-diagnostics
#ifndef HEADER
#define HEADER
// Test that variable stride expressions in target update directives correctly
// set the OMP_MAP_NON_CONTIG flag. For NON_CONTIG entries, offload_sizes contains
// dimension count (2 for 1D array section). For non-NON_CONTIG entries,
// offload_sizes contains byte size (5 elements * 4 bytes = 20).
int data[10];
int stride;
void test_variable_stride_to() {
#pragma omp target update to(data[0:5:stride])
}
void test_variable_stride_from() {
#pragma omp target update from(data[0:5:stride])
}
void test_constant_stride_one() {
#pragma omp target update to(data[0:5:1])
}
#endif // HEADER
//.
// CHECK: @.offload_sizes = private unnamed_addr constant [1 x i64] [i64 2]
// CHECK: @.offload_maptypes = private unnamed_addr constant [1 x i64] [i64 [[#0x100000000001]]]
// CHECK: @.offload_sizes.1 = private unnamed_addr constant [1 x i64] [i64 2]
// CHECK: @.offload_maptypes.2 = private unnamed_addr constant [1 x i64] [i64 [[#0x100000000002]]]
// CHECK: @.offload_sizes.3 = private unnamed_addr constant [1 x i64] [i64 20]
// CHECK: @.offload_maptypes.4 = private unnamed_addr constant [1 x i64] [i64 [[#0x1]]]
//.
// CHECK-LABEL: define dso_local void @test_variable_stride_to(
// CHECK-SAME: ) #[[ATTR0:[0-9]+]] {
// CHECK-NEXT: entry:
// CHECK-NEXT: [[DOTOFFLOAD_BASEPTRS:%.*]] = alloca [1 x ptr], align 8
// CHECK-NEXT: [[DOTOFFLOAD_PTRS:%.*]] = alloca [1 x ptr], align 8
// CHECK-NEXT: [[DOTOFFLOAD_MAPPERS:%.*]] = alloca [1 x ptr], align 8
// CHECK-NEXT: [[DIMS:%.*]] = alloca [2 x [[STRUCT_DESCRIPTOR_DIM:%.*]]], align 8
// CHECK-NEXT: [[TMP0:%.*]] = load i32, ptr @stride, align 4
// CHECK-NEXT: [[TMP1:%.*]] = zext i32 [[TMP0]] to i64
// CHECK-NEXT: [[TMP2:%.*]] = mul nuw i64 4, [[TMP1]]
// CHECK-NEXT: [[TMP3:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0
// CHECK-NEXT: store ptr @data, ptr [[TMP3]], align 8
// CHECK-NEXT: [[TMP4:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_PTRS]], i32 0, i32 0
// CHECK-NEXT: store ptr @data, ptr [[TMP4]], align 8
// CHECK-NEXT: [[TMP5:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_MAPPERS]], i64 0, i64 0
// CHECK-NEXT: store ptr null, ptr [[TMP5]], align 8
// CHECK-NEXT: [[TMP6:%.*]] = getelementptr inbounds [2 x [[STRUCT_DESCRIPTOR_DIM]]], ptr [[DIMS]], i64 0, i64 0
// CHECK-NEXT: [[TMP7:%.*]] = getelementptr inbounds nuw [[STRUCT_DESCRIPTOR_DIM]], ptr [[TMP6]], i32 0, i32 0
// CHECK-NEXT: store i64 0, ptr [[TMP7]], align 8
// CHECK-NEXT: [[TMP8:%.*]] = getelementptr inbounds nuw [[STRUCT_DESCRIPTOR_DIM]], ptr [[TMP6]], i32 0, i32 1
// CHECK-NEXT: store i64 5, ptr [[TMP8]], align 8
// CHECK-NEXT: [[TMP9:%.*]] = getelementptr inbounds nuw [[STRUCT_DESCRIPTOR_DIM]], ptr [[TMP6]], i32 0, i32 2
// CHECK-NEXT: store i64 [[TMP2]], ptr [[TMP9]], align 8
// CHECK-NEXT: [[TMP10:%.*]] = getelementptr inbounds [2 x [[STRUCT_DESCRIPTOR_DIM]]], ptr [[DIMS]], i64 0, i64 1
// CHECK-NEXT: [[TMP11:%.*]] = getelementptr inbounds nuw [[STRUCT_DESCRIPTOR_DIM]], ptr [[TMP10]], i32 0, i32 0
// CHECK-NEXT: store i64 0, ptr [[TMP11]], align 8
// CHECK-NEXT: [[TMP12:%.*]] = getelementptr inbounds nuw [[STRUCT_DESCRIPTOR_DIM]], ptr [[TMP10]], i32 0, i32 1
// CHECK-NEXT: store i64 1, ptr [[TMP12]], align 8
// CHECK-NEXT: [[TMP13:%.*]] = getelementptr inbounds nuw [[STRUCT_DESCRIPTOR_DIM]], ptr [[TMP10]], i32 0, i32 2
// CHECK-NEXT: store i64 4, ptr [[TMP13]], align 8
// CHECK-NEXT: [[TMP14:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_PTRS]], i32 0, i32 0
// CHECK-NEXT: store ptr [[DIMS]], ptr [[TMP14]], align 8
// CHECK-NEXT: [[TMP15:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0
// CHECK-NEXT: [[TMP16:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_PTRS]], i32 0, i32 0
// CHECK-NEXT: call void @__tgt_target_data_update_mapper(ptr @[[GLOB1:[0-9]+]], i64 -1, i32 1, ptr [[TMP15]], ptr [[TMP16]], ptr @.offload_sizes, ptr @.offload_maptypes, ptr null, ptr null)
// CHECK-NEXT: ret void
//
//
// CHECK-LABEL: define dso_local void @test_variable_stride_from(
// CHECK-SAME: ) #[[ATTR0]] {
// CHECK-NEXT: entry:
// CHECK-NEXT: [[DOTOFFLOAD_BASEPTRS:%.*]] = alloca [1 x ptr], align 8
// CHECK-NEXT: [[DOTOFFLOAD_PTRS:%.*]] = alloca [1 x ptr], align 8
// CHECK-NEXT: [[DOTOFFLOAD_MAPPERS:%.*]] = alloca [1 x ptr], align 8
// CHECK-NEXT: [[DIMS:%.*]] = alloca [2 x [[STRUCT_DESCRIPTOR_DIM_0:%.*]]], align 8
// CHECK-NEXT: [[TMP0:%.*]] = load i32, ptr @stride, align 4
// CHECK-NEXT: [[TMP1:%.*]] = zext i32 [[TMP0]] to i64
// CHECK-NEXT: [[TMP2:%.*]] = mul nuw i64 4, [[TMP1]]
// CHECK-NEXT: [[TMP3:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0
// CHECK-NEXT: store ptr @data, ptr [[TMP3]], align 8
// CHECK-NEXT: [[TMP4:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_PTRS]], i32 0, i32 0
// CHECK-NEXT: store ptr @data, ptr [[TMP4]], align 8
// CHECK-NEXT: [[TMP5:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_MAPPERS]], i64 0, i64 0
// CHECK-NEXT: store ptr null, ptr [[TMP5]], align 8
// CHECK-NEXT: [[TMP6:%.*]] = getelementptr inbounds [2 x [[STRUCT_DESCRIPTOR_DIM_0]]], ptr [[DIMS]], i64 0, i64 0
// CHECK-NEXT: [[TMP7:%.*]] = getelementptr inbounds nuw [[STRUCT_DESCRIPTOR_DIM_0]], ptr [[TMP6]], i32 0, i32 0
// CHECK-NEXT: store i64 0, ptr [[TMP7]], align 8
// CHECK-NEXT: [[TMP8:%.*]] = getelementptr inbounds nuw [[STRUCT_DESCRIPTOR_DIM_0]], ptr [[TMP6]], i32 0, i32 1
// CHECK-NEXT: store i64 5, ptr [[TMP8]], align 8
// CHECK-NEXT: [[TMP9:%.*]] = getelementptr inbounds nuw [[STRUCT_DESCRIPTOR_DIM_0]], ptr [[TMP6]], i32 0, i32 2
// CHECK-NEXT: store i64 [[TMP2]], ptr [[TMP9]], align 8
// CHECK-NEXT: [[TMP10:%.*]] = getelementptr inbounds [2 x [[STRUCT_DESCRIPTOR_DIM_0]]], ptr [[DIMS]], i64 0, i64 1
// CHECK-NEXT: [[TMP11:%.*]] = getelementptr inbounds nuw [[STRUCT_DESCRIPTOR_DIM_0]], ptr [[TMP10]], i32 0, i32 0
// CHECK-NEXT: store i64 0, ptr [[TMP11]], align 8
// CHECK-NEXT: [[TMP12:%.*]] = getelementptr inbounds nuw [[STRUCT_DESCRIPTOR_DIM_0]], ptr [[TMP10]], i32 0, i32 1
// CHECK-NEXT: store i64 1, ptr [[TMP12]], align 8
// CHECK-NEXT: [[TMP13:%.*]] = getelementptr inbounds nuw [[STRUCT_DESCRIPTOR_DIM_0]], ptr [[TMP10]], i32 0, i32 2
// CHECK-NEXT: store i64 4, ptr [[TMP13]], align 8
// CHECK-NEXT: [[TMP14:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_PTRS]], i32 0, i32 0
// CHECK-NEXT: store ptr [[DIMS]], ptr [[TMP14]], align 8
// CHECK-NEXT: [[TMP15:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0
// CHECK-NEXT: [[TMP16:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_PTRS]], i32 0, i32 0
// CHECK-NEXT: call void @__tgt_target_data_update_mapper(ptr @[[GLOB1]], i64 -1, i32 1, ptr [[TMP15]], ptr [[TMP16]], ptr @.offload_sizes.1, ptr @.offload_maptypes.2, ptr null, ptr null)
// CHECK-NEXT: ret void
//
//
// CHECK-LABEL: define dso_local void @test_constant_stride_one(
// CHECK-SAME: ) #[[ATTR0]] {
// CHECK-NEXT: entry:
// CHECK-NEXT: [[DOTOFFLOAD_BASEPTRS:%.*]] = alloca [1 x ptr], align 8
// CHECK-NEXT: [[DOTOFFLOAD_PTRS:%.*]] = alloca [1 x ptr], align 8
// CHECK-NEXT: [[DOTOFFLOAD_MAPPERS:%.*]] = alloca [1 x ptr], align 8
// CHECK-NEXT: [[TMP0:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0
// CHECK-NEXT: store ptr @data, ptr [[TMP0]], align 8
// CHECK-NEXT: [[TMP1:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_PTRS]], i32 0, i32 0
// CHECK-NEXT: store ptr @data, ptr [[TMP1]], align 8
// CHECK-NEXT: [[TMP2:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_MAPPERS]], i64 0, i64 0
// CHECK-NEXT: store ptr null, ptr [[TMP2]], align 8
// CHECK-NEXT: [[TMP3:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_BASEPTRS]], i32 0, i32 0
// CHECK-NEXT: [[TMP4:%.*]] = getelementptr inbounds [1 x ptr], ptr [[DOTOFFLOAD_PTRS]], i32 0, i32 0
// CHECK-NEXT: call void @__tgt_target_data_update_mapper(ptr @[[GLOB1]], i64 -1, i32 1, ptr [[TMP3]], ptr [[TMP4]], ptr @.offload_sizes.3, ptr @.offload_maptypes.4, ptr null, ptr null)
// CHECK-NEXT: ret void
//

View File

@ -0,0 +1,145 @@
// RUN: %libomptarget-compile-run-and-check-generic
// Tests multiple arrays with different variable strides in single update
// clause.
#include <omp.h>
#include <stdio.h>
void test_1_update_from_multiple() {
int stride1 = 2;
int stride2 = 2;
double data1[10], data2[10];
// Initialize data on host
for (int i = 0; i < 10; i++) {
data1[i] = i;
data2[i] = i * 10;
}
printf("Test 1: Update FROM - Multiple arrays\n");
#pragma omp target data map(to : stride1, stride2, data1[0 : 10], data2[0 : 10])
{
#pragma omp target
{
for (int i = 0; i < 10; i++) {
data1[i] += i;
data2[i] += 100;
}
}
#pragma omp target update from(data1[0 : 5 : stride1], data2[0 : 5 : stride2])
}
printf("from target data1:\n");
for (int i = 0; i < 10; i++)
printf("%f\n", data1[i]);
printf("\nfrom target data2:\n");
for (int i = 0; i < 10; i++)
printf("%f\n", data2[i]);
}
void test_2_update_to_multiple() {
int stride1 = 2;
int stride2 = 2;
double data1[10], data2[10];
for (int i = 0; i < 10; i++) {
data1[i] = i;
data2[i] = i * 10;
}
printf("\nTest 2: Update TO - Multiple arrays\n");
#pragma omp target data map(tofrom : stride1, stride2, data1[0 : 10], \
data2[0 : 10])
{
#pragma omp target
{
for (int i = 0; i < 10; i++) {
data1[i] = 100.0;
data2[i] = 20.0;
}
}
for (int i = 0; i < 10; i += 2) {
data1[i] = 10.0;
data2[i] = 5.0;
}
#pragma omp target update to(data1[0 : 5 : stride1], data2[0 : 5 : stride2])
#pragma omp target
{
for (int i = 0; i < 10; i++) {
data1[i] += 2.0;
data2[i] += 2.0;
}
}
}
printf("device data1 after update to:\n");
for (int i = 0; i < 10; i++)
printf("%f\n", data1[i]);
printf("\ndevice data2 after update to:\n");
for (int i = 0; i < 10; i++)
printf("%f\n", data2[i]);
}
int main() {
test_1_update_from_multiple();
test_2_update_to_multiple();
return 0;
}
// CHECK: Test 1: Update FROM - Multiple arrays
// CHECK: from target data1:
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 1.000000
// CHECK-NEXT: 4.000000
// CHECK-NEXT: 3.000000
// CHECK-NEXT: 8.000000
// CHECK-NEXT: 5.000000
// CHECK-NEXT: 12.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 16.000000
// CHECK-NEXT: 9.000000
// CHECK: from target data2:
// CHECK-NEXT: 100.000000
// CHECK-NEXT: 10.000000
// CHECK-NEXT: 120.000000
// CHECK-NEXT: 30.000000
// CHECK-NEXT: 140.000000
// CHECK-NEXT: 50.000000
// CHECK-NEXT: 160.000000
// CHECK-NEXT: 70.000000
// CHECK-NEXT: 180.000000
// CHECK-NEXT: 90.000000
// CHECK: Test 2: Update TO - Multiple arrays
// CHECK: device data1 after update to:
// CHECK-NEXT: 12.000000
// CHECK-NEXT: 102.000000
// CHECK-NEXT: 12.000000
// CHECK-NEXT: 102.000000
// CHECK-NEXT: 12.000000
// CHECK-NEXT: 102.000000
// CHECK-NEXT: 12.000000
// CHECK-NEXT: 102.000000
// CHECK-NEXT: 12.000000
// CHECK-NEXT: 102.000000
// CHECK: device data2 after update to:
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 22.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 22.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 22.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 22.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 22.000000

View File

@ -0,0 +1,136 @@
// RUN: %libomptarget-compile-run-and-check-generic
// Tests combining variable count expression AND variable stride in array
// sections.
#include <omp.h>
#include <stdio.h>
void test_1_update_from() {
int len = 10;
int stride = 2;
double data[len];
// Initialize data on host
for (int i = 0; i < len; i++) {
data[i] = i;
}
printf("Test 1: Update FROM - Variable count and stride\n");
printf("original values:\n");
for (int i = 0; i < len; i++)
printf("%f\n", data[i]);
#pragma omp target data map(to : len, stride, data[0 : len])
{
#pragma omp target
{
for (int i = 0; i < len; i++) {
data[i] += i;
}
}
#pragma omp target update from(data[0 : len / 2 : stride])
}
printf("from target results:\n");
for (int i = 0; i < len; i++)
printf("%f\n", data[i]);
}
void test_2_update_to() {
int len = 10;
int stride = 2;
double data[len];
for (int i = 0; i < len; i++) {
data[i] = i;
}
printf("\nTest 2: Update TO - Variable count and stride\n");
printf("original values:\n");
for (int i = 0; i < len; i++)
printf("%f\n", data[i]);
#pragma omp target data map(tofrom : len, stride, data[0 : len])
{
#pragma omp target
{
for (int i = 0; i < len; i++) {
data[i] = 50.0;
}
}
for (int i = 0; i < len / 2; i++) {
data[i * stride] = 10.0;
}
#pragma omp target update to(data[0 : len / 2 : stride])
#pragma omp target
{
for (int i = 0; i < len; i++) {
data[i] += 5.0;
}
}
}
printf("device values after update to:\n");
for (int i = 0; i < len; i++)
printf("%f\n", data[i]);
}
int main() {
test_1_update_from();
test_2_update_to();
return 0;
}
// CHECK: Test 1: Update FROM - Variable count and stride
// CHECK: original values:
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 1.000000
// CHECK-NEXT: 2.000000
// CHECK-NEXT: 3.000000
// CHECK-NEXT: 4.000000
// CHECK-NEXT: 5.000000
// CHECK-NEXT: 6.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 8.000000
// CHECK-NEXT: 9.000000
// CHECK: from target results:
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 1.000000
// CHECK-NEXT: 4.000000
// CHECK-NEXT: 3.000000
// CHECK-NEXT: 8.000000
// CHECK-NEXT: 5.000000
// CHECK-NEXT: 12.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 16.000000
// CHECK-NEXT: 9.000000
// CHECK: Test 2: Update TO - Variable count and stride
// CHECK: original values:
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 1.000000
// CHECK-NEXT: 2.000000
// CHECK-NEXT: 3.000000
// CHECK-NEXT: 4.000000
// CHECK-NEXT: 5.000000
// CHECK-NEXT: 6.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 8.000000
// CHECK-NEXT: 9.000000
// CHECK: device values after update to:
// CHECK-NEXT: 15.000000
// CHECK-NEXT: 55.000000
// CHECK-NEXT: 15.000000
// CHECK-NEXT: 55.000000
// CHECK-NEXT: 15.000000
// CHECK-NEXT: 55.000000
// CHECK-NEXT: 15.000000
// CHECK-NEXT: 55.000000
// CHECK-NEXT: 15.000000
// CHECK-NEXT: 55.000000

View File

@ -0,0 +1,134 @@
// This test checks "update from" and "update to" with variable stride.
// Tests data[0:5:stride] where stride is a variable, making it non-contiguous.
// RUN: %libomptarget-compile-run-and-check-generic
#include <omp.h>
#include <stdio.h>
void test_1_update_from() {
int stride = 2;
double data[10];
// Initialize data on host
for (int i = 0; i < 10; i++) {
data[i] = i;
}
printf("Test 1: Update FROM device\n");
printf("original values:\n");
for (int i = 0; i < 10; i++)
printf("%f\n", data[i]);
#pragma omp target data map(to : stride, data[0 : 10])
{
#pragma omp target
{
for (int i = 0; i < 10; i++) {
data[i] += i;
}
}
#pragma omp target update from(data[0 : 5 : stride])
}
printf("from target results:\n");
for (int i = 0; i < 10; i++)
printf("%f\n", data[i]);
}
void test_2_update_to() {
int stride = 2;
double data[10];
for (int i = 0; i < 10; i++) {
data[i] = i;
}
printf("\nTest 2: Update TO device\n");
printf("original values:\n");
for (int i = 0; i < 10; i++)
printf("%f\n", data[i]);
#pragma omp target data map(tofrom : stride, data[0 : 10])
{
#pragma omp target
{
for (int i = 0; i < 10; i++) {
data[i] = 50.0;
}
}
for (int i = 0; i < 10; i += 2) {
data[i] = 10.0;
}
#pragma omp target update to(data[0 : 5 : stride])
#pragma omp target
{
for (int i = 0; i < 10; i++) {
data[i] += 5.0;
}
}
}
printf("device values after update to:\n");
for (int i = 0; i < 10; i++)
printf("%f\n", data[i]);
}
int main() {
test_1_update_from();
test_2_update_to();
return 0;
}
// CHECK: Test 1: Update FROM device
// CHECK: original values:
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 1.000000
// CHECK-NEXT: 2.000000
// CHECK-NEXT: 3.000000
// CHECK-NEXT: 4.000000
// CHECK-NEXT: 5.000000
// CHECK-NEXT: 6.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 8.000000
// CHECK-NEXT: 9.000000
// CHECK: from target results:
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 1.000000
// CHECK-NEXT: 4.000000
// CHECK-NEXT: 3.000000
// CHECK-NEXT: 8.000000
// CHECK-NEXT: 5.000000
// CHECK-NEXT: 12.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 16.000000
// CHECK-NEXT: 9.000000
// CHECK: Test 2: Update TO device
// CHECK: original values:
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 1.000000
// CHECK-NEXT: 2.000000
// CHECK-NEXT: 3.000000
// CHECK-NEXT: 4.000000
// CHECK-NEXT: 5.000000
// CHECK-NEXT: 6.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 8.000000
// CHECK-NEXT: 9.000000
// CHECK: device values after update to:
// CHECK-NEXT: 15.000000
// CHECK-NEXT: 55.000000
// CHECK-NEXT: 15.000000
// CHECK-NEXT: 55.000000
// CHECK-NEXT: 15.000000
// CHECK-NEXT: 55.000000
// CHECK-NEXT: 15.000000
// CHECK-NEXT: 55.000000
// CHECK-NEXT: 15.000000
// CHECK-NEXT: 55.000000

View File

@ -0,0 +1,88 @@
// RUN: %libomptarget-compile-run-and-check-generic
// Miscellaneous variable stride tests: stride=1, stride=array_size, stride from
// array subscript.
#include <omp.h>
#include <stdio.h>
void test_1_variable_stride_one() {
int stride_one = 1;
double data1[10];
// Initialize data on host
for (int i = 0; i < 10; i++) {
data1[i] = i;
}
#pragma omp target data map(to : stride_one, data1[0 : 10])
{
#pragma omp target
{
for (int i = 0; i < 10; i++) {
data1[i] += i;
}
}
#pragma omp target update from(data1[0 : 10 : stride_one])
}
printf("Test 1: Variable stride = 1\n");
for (int i = 0; i < 10; i++)
printf("%f\n", data1[i]);
}
void test_2_variable_stride_large() {
int stride_large = 5;
double data2[10];
// Initialize data on host
for (int i = 0; i < 10; i++) {
data2[i] = i;
}
#pragma omp target data map(to : stride_large, data2[0 : 10])
{
#pragma omp target
{
for (int i = 0; i < 10; i++) {
data2[i] += i;
}
}
#pragma omp target update from(data2[0 : 2 : stride_large])
}
printf("\nTest 2: Variable stride = 5\n");
for (int i = 0; i < 10; i++)
printf("%f\n", data2[i]);
}
int main() {
test_1_variable_stride_one();
test_2_variable_stride_large();
return 0;
}
// CHECK: Test 1: Variable stride = 1
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 1.000000
// CHECK-NEXT: 2.000000
// CHECK-NEXT: 3.000000
// CHECK-NEXT: 4.000000
// CHECK-NEXT: 5.000000
// CHECK-NEXT: 6.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 8.000000
// CHECK-NEXT: 9.000000
// CHECK: Test 2: Variable stride = 5
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 1.000000
// CHECK-NEXT: 2.000000
// CHECK-NEXT: 3.000000
// CHECK-NEXT: 4.000000
// CHECK-NEXT: 10.000000
// CHECK-NEXT: 6.000000
// CHECK-NEXT: 7.000000
// CHECK-NEXT: 8.000000
// CHECK-NEXT: 9.000000

View File

@ -0,0 +1,94 @@
// RUN: %libomptarget-compile-run-and-check-generic
// Tests heap-allocated pointers with both variable count expression and
// variable stride.
#include <omp.h>
#include <stdio.h>
#include <stdlib.h>
int main() {
int len = 10;
int stride = 2;
double *result = (double *)malloc(len * sizeof(double));
for (int i = 0; i < len; i++) {
result[i] = 0;
}
#pragma omp target enter data map(to : len, stride, result[0 : len])
#pragma omp target map(alloc : result[0 : len])
{
for (int i = 0; i < len; i++) {
result[i] = i;
}
}
// Test FROM: Variable count and stride
#pragma omp target map(alloc : result[0 : len])
{
for (int i = 0; i < len; i++) {
result[i] += i * 10;
}
}
#pragma omp target update from(result[0 : len / 2 : stride])
printf("heap ptr variable count and stride (from):\n");
for (int i = 0; i < len; i++)
printf("%f\n", result[i]);
// Test TO: Reset, modify host, update to device
#pragma omp target map(alloc : result[0 : len])
{
for (int i = 0; i < len; i++) {
result[i] = i * 2;
}
}
for (int i = 0; i < len / 2; i++) {
result[i * stride] = i + 100;
}
#pragma omp target update to(result[0 : len / 2 : stride])
#pragma omp target map(alloc : result[0 : len])
{
for (int i = 0; i < len; i++) {
result[i] += 100;
}
}
#pragma omp target update from(result[0 : len])
printf("heap ptr variable count and stride (to):\n");
for (int i = 0; i < len; i++)
printf("%f\n", result[i]);
#pragma omp target exit data map(delete : len, stride, result[0 : len])
free(result);
return 0;
}
// CHECK: heap ptr variable count and stride (from):
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 22.000000
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 44.000000
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 66.000000
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 88.000000
// CHECK-NEXT: 0.000000
// CHECK: heap ptr variable count and stride (to):
// CHECK-NEXT: 200.000000
// CHECK-NEXT: 102.000000
// CHECK-NEXT: 201.000000
// CHECK-NEXT: 106.000000
// CHECK-NEXT: 202.000000
// CHECK-NEXT: 110.000000
// CHECK-NEXT: 203.000000
// CHECK-NEXT: 114.000000
// CHECK-NEXT: 204.000000
// CHECK-NEXT: 118.000000

View File

@ -0,0 +1,95 @@
// RUN: %libomptarget-compile-run-and-check-generic
// Tests non-contiguous array sections with variable stride on heap-allocated
// pointers.
#include <omp.h>
#include <stdio.h>
#include <stdlib.h>
int main() {
int stride = 2;
int len = 10;
double *result = (double *)malloc(len * sizeof(double));
// Initialize
for (int i = 0; i < len; i++) {
result[i] = 0;
}
#pragma omp target enter data map(to : stride, len, result[0 : len])
#pragma omp target map(alloc : result[0 : len])
{
for (int i = 0; i < len; i++) {
result[i] = i;
}
}
// Test FROM
#pragma omp target map(alloc : result[0 : len])
{
for (int i = 0; i < len; i++) {
result[i] += i * 10;
}
}
#pragma omp target update from(result[0 : 5 : stride])
printf("heap ptr variable stride (from):\n");
for (int i = 0; i < len; i++)
printf("%f\n", result[i]);
// Test TO: Reset, modify host, update to device
#pragma omp target map(alloc : result[0 : len])
{
for (int i = 0; i < len; i++) {
result[i] = i * 2;
}
}
for (int i = 0; i < 5; i++) {
result[i * stride] = i + 100;
}
#pragma omp target update to(result[0 : 5 : stride])
#pragma omp target map(alloc : result[0 : len])
{
for (int i = 0; i < len; i++) {
result[i] += 100;
}
}
#pragma omp target update from(result[0 : len])
printf("heap ptr variable stride (to):\n");
for (int i = 0; i < len; i++)
printf("%f\n", result[i]);
#pragma omp target exit data map(delete : stride, len, result[0 : len])
free(result);
return 0;
}
// CHECK: heap ptr variable stride (from):
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 22.000000
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 44.000000
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 66.000000
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 88.000000
// CHECK-NEXT: 0.000000
// CHECK: heap ptr variable stride (to):
// CHECK-NEXT: 200.000000
// CHECK-NEXT: 102.000000
// CHECK-NEXT: 201.000000
// CHECK-NEXT: 106.000000
// CHECK-NEXT: 202.000000
// CHECK-NEXT: 110.000000
// CHECK-NEXT: 203.000000
// CHECK-NEXT: 114.000000
// CHECK-NEXT: 204.000000
// CHECK-NEXT: 118.000000

View File

@ -0,0 +1,96 @@
// RUN: %libomptarget-compile-run-and-check-generic
// Tests struct member arrays with both variable count expression and variable
// stride.
#include <omp.h>
#include <stdio.h>
struct S {
int len;
int stride;
double data[20];
};
int main() {
struct S s;
s.len = 10;
s.stride = 2;
// Initialize
#pragma omp target map(tofrom : s)
{
for (int i = 0; i < s.len; i++) {
s.data[i] = i;
}
}
// Test FROM: Variable count and stride
#pragma omp target data map(to : s)
{
#pragma omp target
{
for (int i = 0; i < s.len; i++) {
s.data[i] += i * 10;
}
}
#pragma omp target update from(s.data[0 : s.len / 2 : s.stride])
}
printf("struct variable count and stride (from):\n");
for (int i = 0; i < s.len; i++)
printf("%f\n", s.data[i]);
// Test TO: Reset, modify host, update to device
#pragma omp target map(tofrom : s)
{
for (int i = 0; i < s.len; i++) {
s.data[i] = i * 2;
}
}
for (int i = 0; i < s.len / 2; i++) {
s.data[i * s.stride] = i + 100;
}
#pragma omp target data map(to : s)
{
#pragma omp target update to(s.data[0 : s.len / 2 : s.stride])
#pragma omp target
{
for (int i = 0; i < s.len; i++) {
s.data[i] += 100;
}
}
}
printf("struct variable count and stride (to):\n");
for (int i = 0; i < s.len; i++)
printf("%f\n", s.data[i]);
return 0;
}
// CHECK: struct variable count and stride (from):
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 11.000000
// CHECK-NEXT: 2.000000
// CHECK-NEXT: 33.000000
// CHECK-NEXT: 4.000000
// CHECK-NEXT: 55.000000
// CHECK-NEXT: 6.000000
// CHECK-NEXT: 77.000000
// CHECK-NEXT: 8.000000
// CHECK-NEXT: 9.000000
// CHECK: struct variable count and stride (to):
// CHECK-NEXT: 100.000000
// CHECK-NEXT: 2.000000
// CHECK-NEXT: 101.000000
// CHECK-NEXT: 6.000000
// CHECK-NEXT: 102.000000
// CHECK-NEXT: 10.000000
// CHECK-NEXT: 103.000000
// CHECK-NEXT: 14.000000
// CHECK-NEXT: 104.000000
// CHECK-NEXT: 18.000000

View File

@ -0,0 +1,95 @@
// RUN: %libomptarget-compile-run-and-check-generic
// Tests non-contiguous array sections with variable stride on struct member
// arrays.
#include <omp.h>
#include <stdio.h>
struct S {
int stride;
double data[20];
};
int main() {
struct S s;
s.stride = 2;
int len = 10;
// Initialize
#pragma omp target map(tofrom : s, len)
{
for (int i = 0; i < len; i++) {
s.data[i] = i;
}
}
// Test FROM
#pragma omp target data map(to : s, len)
{
#pragma omp target
{
for (int i = 0; i < len; i++) {
s.data[i] += i * 10;
}
}
#pragma omp target update from(s.data[0 : 5 : s.stride])
}
printf("struct variable stride (from):\n");
for (int i = 0; i < len; i++)
printf("%f\n", s.data[i]);
// Test TO: Reset, modify host, update to device
#pragma omp target map(tofrom : s)
{
for (int i = 0; i < len; i++) {
s.data[i] = i * 2;
}
}
for (int i = 0; i < 5; i++) {
s.data[i * s.stride] = i + 100;
}
#pragma omp target data map(to : s)
{
#pragma omp target update to(s.data[0 : 5 : s.stride])
#pragma omp target
{
for (int i = 0; i < len; i++) {
s.data[i] += 100;
}
}
}
printf("struct variable stride (to):\n");
for (int i = 0; i < len; i++)
printf("%f\n", s.data[i]);
return 0;
}
// CHECK: struct variable stride (from):
// CHECK-NEXT: 0.000000
// CHECK-NEXT: 11.000000
// CHECK-NEXT: 2.000000
// CHECK-NEXT: 33.000000
// CHECK-NEXT: 4.000000
// CHECK-NEXT: 55.000000
// CHECK-NEXT: 6.000000
// CHECK-NEXT: 77.000000
// CHECK-NEXT: 8.000000
// CHECK-NEXT: 9.000000
// CHECK: struct variable stride (to):
// CHECK-NEXT: 100.000000
// CHECK-NEXT: 2.000000
// CHECK-NEXT: 101.000000
// CHECK-NEXT: 6.000000
// CHECK-NEXT: 102.000000
// CHECK-NEXT: 10.000000
// CHECK-NEXT: 103.000000
// CHECK-NEXT: 14.000000
// CHECK-NEXT: 104.000000
// CHECK-NEXT: 18.000000