1 /* { dg-do run { target openacc_nvidia_accel_selected } } */
2 /* { dg-additional-options "-foffload=-fdump-tree-oaccdevlow" } */
3 /* { dg-set-target-env-var "GOMP_DEBUG" "1" } */
/* Loop over indices 0 .. n-1.  The loop body is not part of this excerpt;
   NOTE(review): presumably it fills the input arrays a and b -- confirm
   against the full file.  */
17 for (unsigned int i
= 0; i
< n
; ++i
)
/* OpenACC parallel construct: explicitly requests 2 workers and a vector
   length of 128.  Arrays a and b are listed as copyin, c as copyout.  No
   num_gangs clause is given.  */
23 #pragma acc parallel num_workers (2) vector_length (128) copyin (a,b) copyout (c)
/* Outer loop: 4 iterations, marked for worker partitioning.  Each
   iteration i handles the index range starting at i * N / 4.  */
25 #pragma acc loop worker
26 for (unsigned int i
= 0; i
< 4; i
++)
/* Inner loop: n / 4 iterations, marked for vector partitioning.  Stores
   the element-wise sum a[k] + b[k] into c[k], with k = (i * N / 4) + j.
   NOTE(review): the bound uses n while the index uses N; presumably both
   denote the same array length -- their definitions are not visible
   here, confirm.  */
27 #pragma acc loop vector
28 for (unsigned int j
= 0; j
< n
/ 4; j
++)
29 c
[(i
* N
/ 4) + j
] = a
[(i
* N
/ 4) + j
] + b
[(i
* N
/ 4) + j
];
/* Result check: for every index i in 0 .. n-1, compare c[i] against
   (i % 3) + (i % 5).  The statement executed when the values differ is
   not part of this excerpt.
   NOTE(review): the expected value implies a[i] == i % 3 and
   b[i] == i % 5 -- confirm against the initialisation code.  */
32 for (unsigned int i
= 0; i
< n
; ++i
)
33 if (c
[i
] != (i
% 3) + (i
% 5))
39 /* { dg-final { scan-offload-tree-dump "__attribute__\\(\\(oacc function \\(1, 2, 128\\)" "oaccdevlow" } } */
40 /* { dg-output "nvptx_exec: kernel main\\\$_omp_fn\\\$0: launch gangs=1, workers=2, vectors=128" } */