summary | refs | log | tree | commit | diff
path: root/libgomp
diff options
context:
space:
mode:
author: tschwinge <tschwinge@138bc75d-0d04-0410-961f-82ee72b054a4> 2016-04-12 11:02:32 +0000
committer: tschwinge <tschwinge@138bc75d-0d04-0410-961f-82ee72b054a4> 2016-04-12 11:02:32 +0000
commit: 40495bd0847a05aa76cc37e05292cf937449f9dd (patch)
tree: 3393e08ba599fadedb1ac88fc1156c593ed6591f /libgomp
parent: f87ba9cde3958ccbb1f2c8b9efec997a458efc16 (diff)
download: gcc-40495bd0847a05aa76cc37e05292cf937449f9dd.tar.gz
Merge libgomp.oacc-c-c++-common/loop-reduction-*.c into libgomp.oacc-c-c++-common/reduction-7.c
libgomp/
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gang-np-1.c:
  Merge this file, and...
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gv-np-1.c:
  ... this file, and...
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gw-np-1.c:
  ... this file, and...
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-1.c:
  ... this file, and...
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-2.c:
  ... this file, and...
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-3.c:
  ... this file, and...
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-4.c:
  ... this file, and...
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-1.c:
  ... this file, and...
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-2.c:
  ... this file, and...
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-worker-p-1.c:
  ... this file, and...
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-1.c:
  ... this file, and...
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-2.c:
  ... this file, and...
  * testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-3.c:
  ... this file into...
  * testsuite/libgomp.oacc-c-c++-common/reduction-7.c: ... this file.

git-svn-id: svn+ssh://gcc.gnu.org/svn/gcc/trunk@234899 138bc75d-0d04-0410-961f-82ee72b054a4
Diffstat (limited to 'libgomp')
-rw-r--r-- libgomp/ChangeLog | 29
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gang-np-1.c | 45
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gv-np-1.c | 30
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gw-np-1.c | 30
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-1.c | 28
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-2.c | 34
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-3.c | 33
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-4.c | 55
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-1.c | 43
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-2.c | 41
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-worker-p-1.c | 43
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-1.c | 41
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-2.c | 45
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-3.c | 38
-rw-r--r-- libgomp/testsuite/libgomp.oacc-c-c++-common/reduction-7.c | 351
15 files changed, 380 insertions, 506 deletions
diff --git a/libgomp/ChangeLog b/libgomp/ChangeLog
index 6071b239f1f..1716ba071d5 100644
--- a/libgomp/ChangeLog
+++ b/libgomp/ChangeLog
@@ -1,5 +1,34 @@
2016-04-12 Thomas Schwinge <thomas@codesourcery.com>
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gang-np-1.c:
+ Merge this file, and...
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gv-np-1.c:
+ ... this file, and...
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gw-np-1.c:
+ ... this file, and...
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-1.c:
+ ... this file, and...
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-2.c:
+ ... this file, and...
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-3.c:
+ ... this file, and...
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-4.c:
+ ... this file, and...
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-1.c:
+ ... this file, and...
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-2.c:
+ ... this file, and...
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-worker-p-1.c:
+ ... this file, and...
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-1.c:
+ ... this file, and...
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-2.c:
+ ... this file, and...
+ * testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-3.c:
+ ... this file into...
+ * testsuite/libgomp.oacc-c-c++-common/reduction-7.c: ... this
+ file.
+
* testsuite/libgomp.oacc-c-c++-common/par-loop-comb-reduction-2.c:
Make failure observable.
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gang-np-1.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gang-np-1.c
deleted file mode 100644
index 55ab3c96334..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gang-np-1.c
+++ /dev/null
@@ -1,45 +0,0 @@
-/* { dg-additional-options "-w" } */
-
-#include <assert.h>
-
-/* Test of reduction on loop directive (gangs, non-private reduction
- variable). */
-
-int
-main (int argc, char *argv[])
-{
- int i, arr[1024], res = 0, hres = 0;
-
- for (i = 0; i < 1024; i++)
- arr[i] = i;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- copy(res)
- {
- #pragma acc loop gang reduction(+:res)
- for (i = 0; i < 1024; i++)
- res += arr[i];
- }
-
- for (i = 0; i < 1024; i++)
- hres += arr[i];
-
- assert (res == hres);
-
- res = hres = 1;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- copy(res)
- {
- #pragma acc loop gang reduction(*:res)
- for (i = 0; i < 12; i++)
- res *= arr[i];
- }
-
- for (i = 0; i < 12; i++)
- hres *= arr[i];
-
- assert (res == hres);
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gv-np-1.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gv-np-1.c
deleted file mode 100644
index d4341e9c2cf..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gv-np-1.c
+++ /dev/null
@@ -1,30 +0,0 @@
-/* { dg-additional-options "-w" } */
-
-#include <assert.h>
-
-/* Test of reduction on loop directive (gangs and vectors, non-private
- reduction variable). */
-
-int
-main (int argc, char *argv[])
-{
- int i, arr[1024], res = 0, hres = 0;
-
- for (i = 0; i < 1024; i++)
- arr[i] = i;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- copy(res)
- {
- #pragma acc loop gang vector reduction(+:res)
- for (i = 0; i < 1024; i++)
- res += arr[i];
- }
-
- for (i = 0; i < 1024; i++)
- hres += arr[i];
-
- assert (res == hres);
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gw-np-1.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gw-np-1.c
deleted file mode 100644
index 2e5668b134e..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gw-np-1.c
+++ /dev/null
@@ -1,30 +0,0 @@
-/* { dg-additional-options "-w" } */
-
-#include <assert.h>
-
-/* Test of reduction on loop directive (gangs and workers, non-private
- reduction variable). */
-
-int
-main (int argc, char *argv[])
-{
- int i, arr[1024], res = 0, hres = 0;
-
- for (i = 0; i < 1024; i++)
- arr[i] = i;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- copy(res)
- {
- #pragma acc loop gang worker reduction(+:res)
- for (i = 0; i < 1024; i++)
- res += arr[i];
- }
-
- for (i = 0; i < 1024; i++)
- hres += arr[i];
-
- assert (res == hres);
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-1.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-1.c
deleted file mode 100644
index d6103738813..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-1.c
+++ /dev/null
@@ -1,28 +0,0 @@
-#include <assert.h>
-
-/* Test of reduction on loop directive (gangs, workers and vectors, non-private
- reduction variable). */
-
-int
-main (int argc, char *argv[])
-{
- int i, arr[1024], res = 0, hres = 0;
-
- for (i = 0; i < 1024; i++)
- arr[i] = i;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- copy(res)
- {
- #pragma acc loop gang worker vector reduction(+:res)
- for (i = 0; i < 1024; i++)
- res += arr[i];
- }
-
- for (i = 0; i < 1024; i++)
- hres += arr[i];
-
- assert (res == hres);
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-2.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-2.c
deleted file mode 100644
index ea5c151af3c..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-2.c
+++ /dev/null
@@ -1,34 +0,0 @@
-#include <assert.h>
-
-/* Test of reduction on loop directive (gangs, workers and vectors, non-private
- reduction variable: separate gang and worker/vector loops). */
-
-int
-main (int argc, char *argv[])
-{
- int i, j, arr[32768], res = 0, hres = 0;
-
- for (i = 0; i < 32768; i++)
- arr[i] = i;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- copy(res)
- {
- #pragma acc loop gang reduction(+:res)
- for (j = 0; j < 32; j++)
- {
- #pragma acc loop worker vector reduction(+:res)
- for (i = 0; i < 1024; i++)
- res += arr[j * 1024 + i];
- }
- /* "res" is non-private, and is not available until after the parallel
- region. */
- }
-
- for (i = 0; i < 32768; i++)
- hres += arr[i];
-
- assert (res == hres);
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-3.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-3.c
deleted file mode 100644
index 0056f3ce10e..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-3.c
+++ /dev/null
@@ -1,33 +0,0 @@
-#include <assert.h>
-
-/* Test of reduction on loop directive (gangs, workers and vectors, non-private
- reduction variable: separate gang and worker/vector loops). */
-
-int
-main (int argc, char *argv[])
-{
- int i, j;
- double arr[32768], res = 0, hres = 0;
-
- for (i = 0; i < 32768; i++)
- arr[i] = i;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- copyin(arr) copy(res)
- {
- #pragma acc loop gang reduction(+:res)
- for (j = 0; j < 32; j++)
- {
- #pragma acc loop worker vector reduction(+:res)
- for (i = 0; i < 1024; i++)
- res += arr[j * 1024 + i];
- }
- }
-
- for (i = 0; i < 32768; i++)
- hres += arr[i];
-
- assert (res == hres);
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-4.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-4.c
deleted file mode 100644
index e69d0ec04c7..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-gwv-np-4.c
+++ /dev/null
@@ -1,55 +0,0 @@
-#include <assert.h>
-
-/* Test of reduction on loop directive (gangs, workers and vectors, multiple
- non-private reduction variables, float type). */
-
-int
-main (int argc, char *argv[])
-{
- int i, j;
- float arr[32768];
- float res = 0, mres = 0, hres = 0, hmres = 0;
-
- for (i = 0; i < 32768; i++)
- arr[i] = i;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- copy(res, mres)
- {
- #pragma acc loop gang reduction(+:res) reduction(max:mres)
- for (j = 0; j < 32; j++)
- {
- #pragma acc loop worker vector reduction(+:res) reduction(max:mres)
- for (i = 0; i < 1024; i++)
- {
- res += arr[j * 1024 + i];
- if (arr[j * 1024 + i] > mres)
- mres = arr[j * 1024 + i];
- }
-
- #pragma acc loop worker vector reduction(+:res) reduction(max:mres)
- for (i = 0; i < 1024; i++)
- {
- res += arr[j * 1024 + (1023 - i)];
- if (arr[j * 1024 + (1023 - i)] > mres)
- mres = arr[j * 1024 + (1023 - i)];
- }
- }
- }
-
- for (j = 0; j < 32; j++)
- for (i = 0; i < 1024; i++)
- {
- hres += arr[j * 1024 + i];
- hres += arr[j * 1024 + (1023 - i)];
- if (arr[j * 1024 + i] > hmres)
- hmres = arr[j * 1024 + i];
- if (arr[j * 1024 + (1023 - i)] > hmres)
- hmres = arr[j * 1024 + (1023 - i)];
- }
-
- assert (res == hres);
- assert (mres == hmres);
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-1.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-1.c
deleted file mode 100644
index 31e4366f88b..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-1.c
+++ /dev/null
@@ -1,43 +0,0 @@
-/* { dg-additional-options "-w" } */
-
-#include <assert.h>
-
-/* Test of reduction on loop directive (vectors, private reduction
- variable). */
-
-int
-main (int argc, char *argv[])
-{
- int i, j, arr[1024], out[32], res = 0, hres = 0;
-
- for (i = 0; i < 1024; i++)
- arr[i] = i;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- private(res) copyout(out)
- {
- #pragma acc loop gang
- for (j = 0; j < 32; j++)
- {
- res = 0;
-
- #pragma acc loop vector reduction(+:res)
- for (i = 0; i < 32; i++)
- res += arr[j * 32 + i];
-
- out[j] = res;
- }
- }
-
- for (j = 0; j < 32; j++)
- {
- hres = 0;
-
- for (i = 0; i < 32; i++)
- hres += arr[j * 32 + i];
-
- assert (out[j] == hres);
- }
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-2.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-2.c
deleted file mode 100644
index 15f0053e5bc..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-vector-p-2.c
+++ /dev/null
@@ -1,41 +0,0 @@
-#include <assert.h>
-
-/* Test of reduction on loop directive (vector reduction in
- gang-partitioned/worker-partitioned mode, private reduction variable). */
-
-int
-main (int argc, char *argv[])
-{
- int i, j, k;
- double ina[1024], inb[1024], out[1024], acc;
-
- for (j = 0; j < 32; j++)
- for (i = 0; i < 32; i++)
- {
- ina[j * 32 + i] = (i == j) ? 2.0 : 0.0;
- inb[j * 32 + i] = (double) (i + j);
- }
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- private(acc) copyin(ina, inb) copyout(out)
- {
- #pragma acc loop gang worker
- for (k = 0; k < 32; k++)
- for (j = 0; j < 32; j++)
- {
- acc = 0;
-
- #pragma acc loop vector reduction(+:acc)
- for (i = 0; i < 32; i++)
- acc += ina[k * 32 + i] * inb[i * 32 + j];
-
- out[k * 32 + j] = acc;
- }
- }
-
- for (j = 0; j < 32; j++)
- for (i = 0; i < 32; i++)
- assert (out[j * 32 + i] == (i + j) * 2);
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-worker-p-1.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-worker-p-1.c
deleted file mode 100644
index 4a925036a5b..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-worker-p-1.c
+++ /dev/null
@@ -1,43 +0,0 @@
-/* { dg-additional-options "-w" } */
-
-#include <assert.h>
-
-/* Test of reduction on loop directive (workers, private reduction
- variable). */
-
-int
-main (int argc, char *argv[])
-{
- int i, j, arr[1024], out[32], res = 0, hres = 0;
-
- for (i = 0; i < 1024; i++)
- arr[i] = i;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- private(res) copyout(out)
- {
- #pragma acc loop gang
- for (j = 0; j < 32; j++)
- {
- res = 0;
-
- #pragma acc loop worker reduction(+:res)
- for (i = 0; i < 32; i++)
- res += arr[j * 32 + i];
-
- out[j] = res;
- }
- }
-
- for (j = 0; j < 32; j++)
- {
- hres = 0;
-
- for (i = 0; i < 32; i++)
- hres += arr[j * 32 + i];
-
- assert (out[j] == hres);
- }
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-1.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-1.c
deleted file mode 100644
index 1bfb284cb3b..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-1.c
+++ /dev/null
@@ -1,41 +0,0 @@
-#include <assert.h>
-
-/* Test of reduction on loop directive (workers and vectors, private reduction
- variable). */
-
-int
-main (int argc, char *argv[])
-{
- int i, j, arr[1024], out[32], res = 0, hres = 0;
-
- for (i = 0; i < 1024; i++)
- arr[i] = i;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- private(res) copyout(out)
- {
- #pragma acc loop gang
- for (j = 0; j < 32; j++)
- {
- res = 0;
-
- #pragma acc loop worker vector reduction(+:res)
- for (i = 0; i < 32; i++)
- res += arr[j * 32 + i];
-
- out[j] = res;
- }
- }
-
- for (j = 0; j < 32; j++)
- {
- hres = 0;
-
- for (i = 0; i < 32; i++)
- hres += arr[j * 32 + i];
-
- assert (out[j] == hres);
- }
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-2.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-2.c
deleted file mode 100644
index 93ab78f106a..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-2.c
+++ /dev/null
@@ -1,45 +0,0 @@
-#include <assert.h>
-
-/* Test of reduction on loop directive (workers and vectors, private reduction
- variable). */
-
-int
-main (int argc, char *argv[])
-{
- int i, j, arr[32768], out[32], res = 0, hres = 0;
-
- for (i = 0; i < 32768; i++)
- arr[i] = i;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- private(res) copyout(out)
- {
- #pragma acc loop gang
- for (j = 0; j < 32; j++)
- {
- res = j;
-
- #pragma acc loop worker reduction(+:res)
- for (i = 0; i < 1024; i++)
- res += arr[j * 1024 + i];
-
- #pragma acc loop vector reduction(+:res)
- for (i = 1023; i >= 0; i--)
- res += arr[j * 1024 + i];
-
- out[j] = res;
- }
- }
-
- for (j = 0; j < 32; j++)
- {
- hres = j;
-
- for (i = 0; i < 1024; i++)
- hres += arr[j * 1024 + i] * 2;
-
- assert (out[j] == hres);
- }
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-3.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-3.c
deleted file mode 100644
index 298e25c87d2..00000000000
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-reduction-wv-p-3.c
+++ /dev/null
@@ -1,38 +0,0 @@
-#include <assert.h>
-
-/* Test of reduction on loop directive (workers and vectors, private reduction
- variable: gang-redundant mode). */
-
-int
-main (int argc, char *argv[])
-{
- int i, arr[1024], out[32], res = 0, hres = 0;
-
- for (i = 0; i < 1024; i++)
- arr[i] = i ^ 33;
-
- #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
- private(res) copyin(arr) copyout(out)
- {
- /* Private variables aren't initialized by default in openacc. */
- res = 0;
-
- /* "res" should be available at the end of the following loop (and should
- have the same value redundantly in each gang). */
- #pragma acc loop worker vector reduction(+:res)
- for (i = 0; i < 1024; i++)
- res += arr[i];
-
- #pragma acc loop gang (static: 1)
- for (i = 0; i < 32; i++)
- out[i] = res;
- }
-
- for (i = 0; i < 1024; i++)
- hres += arr[i];
-
- for (i = 0; i < 32; i++)
- assert (out[i] == hres);
-
- return 0;
-}
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/reduction-7.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/reduction-7.c
index b23c75877f8..76c33e4470d 100644
--- a/libgomp/testsuite/libgomp.oacc-c-c++-common/reduction-7.c
+++ b/libgomp/testsuite/libgomp.oacc-c-c++-common/reduction-7.c
@@ -118,12 +118,363 @@ void gwv_np_1()
}
+/* Test of reduction on loop directive (gangs, workers and vectors, non-private
+ reduction variable: separate gang and worker/vector loops). */
+
+void gwv_np_2()
+{
+ int i, j, arr[32768], res = 0, hres = 0;
+
+ for (i = 0; i < 32768; i++)
+ arr[i] = i;
+
+ #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
+ copy(res)
+ {
+ #pragma acc loop gang reduction(+:res)
+ for (j = 0; j < 32; j++)
+ {
+ #pragma acc loop worker vector reduction(+:res)
+ for (i = 0; i < 1024; i++)
+ res += arr[j * 1024 + i];
+ }
+ /* "res" is non-private, and is not available until after the parallel
+ region. */
+ }
+
+ for (i = 0; i < 32768; i++)
+ hres += arr[i];
+
+ assert (res == hres);
+}
+
+
+/* Test of reduction on loop directive (gangs, workers and vectors, non-private
+ reduction variable: separate gang and worker/vector loops). */
+
+void gwv_np_3()
+{
+ int i, j;
+ double arr[32768], res = 0, hres = 0;
+
+ for (i = 0; i < 32768; i++)
+ arr[i] = i;
+
+ #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
+ copyin(arr) copy(res)
+ {
+ #pragma acc loop gang reduction(+:res)
+ for (j = 0; j < 32; j++)
+ {
+ #pragma acc loop worker vector reduction(+:res)
+ for (i = 0; i < 1024; i++)
+ res += arr[j * 1024 + i];
+ }
+ }
+
+ for (i = 0; i < 32768; i++)
+ hres += arr[i];
+
+ assert (res == hres);
+}
+
+
+/* Test of reduction on loop directive (gangs, workers and vectors, multiple
+ non-private reduction variables, float type). */
+
+void gwv_np_4()
+{
+ int i, j;
+ float arr[32768];
+ float res = 0, mres = 0, hres = 0, hmres = 0;
+
+ for (i = 0; i < 32768; i++)
+ arr[i] = i;
+
+ #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
+ copy(res, mres)
+ {
+ #pragma acc loop gang reduction(+:res) reduction(max:mres)
+ for (j = 0; j < 32; j++)
+ {
+ #pragma acc loop worker vector reduction(+:res) reduction(max:mres)
+ for (i = 0; i < 1024; i++)
+ {
+ res += arr[j * 1024 + i];
+ if (arr[j * 1024 + i] > mres)
+ mres = arr[j * 1024 + i];
+ }
+
+ #pragma acc loop worker vector reduction(+:res) reduction(max:mres)
+ for (i = 0; i < 1024; i++)
+ {
+ res += arr[j * 1024 + (1023 - i)];
+ if (arr[j * 1024 + (1023 - i)] > mres)
+ mres = arr[j * 1024 + (1023 - i)];
+ }
+ }
+ }
+
+ for (j = 0; j < 32; j++)
+ for (i = 0; i < 1024; i++)
+ {
+ hres += arr[j * 1024 + i];
+ hres += arr[j * 1024 + (1023 - i)];
+ if (arr[j * 1024 + i] > hmres)
+ hmres = arr[j * 1024 + i];
+ if (arr[j * 1024 + (1023 - i)] > hmres)
+ hmres = arr[j * 1024 + (1023 - i)];
+ }
+
+ assert (res == hres);
+ assert (mres == hmres);
+}
+
+
+/* Test of reduction on loop directive (vectors, private reduction
+ variable). */
+
+void v_p_1()
+{
+ int i, j, arr[1024], out[32], res = 0, hres = 0;
+
+ for (i = 0; i < 1024; i++)
+ arr[i] = i;
+
+ #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
+ private(res) copyout(out)
+ {
+ #pragma acc loop gang
+ for (j = 0; j < 32; j++)
+ {
+ res = 0;
+
+ #pragma acc loop vector reduction(+:res)
+ for (i = 0; i < 32; i++)
+ res += arr[j * 32 + i];
+
+ out[j] = res;
+ }
+ }
+
+ for (j = 0; j < 32; j++)
+ {
+ hres = 0;
+
+ for (i = 0; i < 32; i++)
+ hres += arr[j * 32 + i];
+
+ assert (out[j] == hres);
+ }
+}
+
+
+/* Test of reduction on loop directive (vector reduction in
+ gang-partitioned/worker-partitioned mode, private reduction variable). */
+
+void v_p_2()
+{
+ int i, j, k;
+ double ina[1024], inb[1024], out[1024], acc;
+
+ for (j = 0; j < 32; j++)
+ for (i = 0; i < 32; i++)
+ {
+ ina[j * 32 + i] = (i == j) ? 2.0 : 0.0;
+ inb[j * 32 + i] = (double) (i + j);
+ }
+
+ #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
+ private(acc) copyin(ina, inb) copyout(out)
+ {
+ #pragma acc loop gang worker
+ for (k = 0; k < 32; k++)
+ for (j = 0; j < 32; j++)
+ {
+ acc = 0;
+
+ #pragma acc loop vector reduction(+:acc)
+ for (i = 0; i < 32; i++)
+ acc += ina[k * 32 + i] * inb[i * 32 + j];
+
+ out[k * 32 + j] = acc;
+ }
+ }
+
+ for (j = 0; j < 32; j++)
+ for (i = 0; i < 32; i++)
+ assert (out[j * 32 + i] == (i + j) * 2);
+}
+
+
+/* Test of reduction on loop directive (workers, private reduction
+ variable). */
+
+void w_p_1()
+{
+ int i, j, arr[1024], out[32], res = 0, hres = 0;
+
+ for (i = 0; i < 1024; i++)
+ arr[i] = i;
+
+ #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
+ private(res) copyout(out)
+ {
+ #pragma acc loop gang
+ for (j = 0; j < 32; j++)
+ {
+ res = 0;
+
+ #pragma acc loop worker reduction(+:res)
+ for (i = 0; i < 32; i++)
+ res += arr[j * 32 + i];
+
+ out[j] = res;
+ }
+ }
+
+ for (j = 0; j < 32; j++)
+ {
+ hres = 0;
+
+ for (i = 0; i < 32; i++)
+ hres += arr[j * 32 + i];
+
+ assert (out[j] == hres);
+ }
+}
+
+
+/* Test of reduction on loop directive (workers and vectors, private reduction
+ variable). */
+
+void wv_p_1()
+{
+ int i, j, arr[1024], out[32], res = 0, hres = 0;
+
+ for (i = 0; i < 1024; i++)
+ arr[i] = i;
+
+ #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
+ private(res) copyout(out)
+ {
+ #pragma acc loop gang
+ for (j = 0; j < 32; j++)
+ {
+ res = 0;
+
+ #pragma acc loop worker vector reduction(+:res)
+ for (i = 0; i < 32; i++)
+ res += arr[j * 32 + i];
+
+ out[j] = res;
+ }
+ }
+
+ for (j = 0; j < 32; j++)
+ {
+ hres = 0;
+
+ for (i = 0; i < 32; i++)
+ hres += arr[j * 32 + i];
+
+ assert (out[j] == hres);
+ }
+}
+
+
+/* Test of reduction on loop directive (workers and vectors, private reduction
+ variable). */
+
+void wv_p_2()
+{
+ int i, j, arr[32768], out[32], res = 0, hres = 0;
+
+ for (i = 0; i < 32768; i++)
+ arr[i] = i;
+
+ #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
+ private(res) copyout(out)
+ {
+ #pragma acc loop gang
+ for (j = 0; j < 32; j++)
+ {
+ res = j;
+
+ #pragma acc loop worker reduction(+:res)
+ for (i = 0; i < 1024; i++)
+ res += arr[j * 1024 + i];
+
+ #pragma acc loop vector reduction(+:res)
+ for (i = 1023; i >= 0; i--)
+ res += arr[j * 1024 + i];
+
+ out[j] = res;
+ }
+ }
+
+ for (j = 0; j < 32; j++)
+ {
+ hres = j;
+
+ for (i = 0; i < 1024; i++)
+ hres += arr[j * 1024 + i] * 2;
+
+ assert (out[j] == hres);
+ }
+}
+
+
+/* Test of reduction on loop directive (workers and vectors, private reduction
+ variable: gang-redundant mode). */
+
+void wv_p_3()
+{
+ int i, arr[1024], out[32], res = 0, hres = 0;
+
+ for (i = 0; i < 1024; i++)
+ arr[i] = i ^ 33;
+
+ #pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
+ private(res) copyin(arr) copyout(out)
+ {
+ /* Private variables aren't initialized by default in openacc. */
+ res = 0;
+
+ /* "res" should be available at the end of the following loop (and should
+ have the same value redundantly in each gang). */
+ #pragma acc loop worker vector reduction(+:res)
+ for (i = 0; i < 1024; i++)
+ res += arr[i];
+
+ #pragma acc loop gang (static: 1)
+ for (i = 0; i < 32; i++)
+ out[i] = res;
+ }
+
+ for (i = 0; i < 1024; i++)
+ hres += arr[i];
+
+ for (i = 0; i < 32; i++)
+ assert (out[i] == hres);
+}
+
+
int main()
{
g_np_1();
gv_np_1();
gw_np_1();
gwv_np_1();
+ gwv_np_2();
+ gwv_np_3();
+ gwv_np_4();
+ v_p_1();
+ v_p_2();
+ w_p_1();
+ wv_p_1();
+ wv_p_2();
+ wv_p_3();
return 0;
}