Skip to content

Commit 4ffa2ab

Browse files
authored
Update shallow_swap.acc.c
collapse T100 and T200 loops
1 parent 87e95b2 commit 4ffa2ab

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

shallow_swap.acc.c

+3 -3
Original file line number | Diff line number | Diff line change
@@ -250,7 +250,7 @@ int main(int argc, char **argv) {
250250

251251
// Compute capital u, capital v, z and h
252252
c1 = wtime();
253-
#pragma acc parallel loop independent present(p[:SIZE],u[:SIZE],v[:SIZE]) deviceptr(cu,cv,z,h)
253+
#pragma acc parallel loop collapse(2) present(p[:SIZE],u[:SIZE],v[:SIZE]) deviceptr(cu,cv,z,h)
254254
for (i=0;i<M;i++) {
255255
for (j=0;j<N;j++) {
256256
int idx00 = (i*N_LEN) + j;
@@ -296,7 +296,7 @@ int main(int argc, char **argv) {
296296
}
297297
c1 = wtime();
298298

299-
#pragma acc parallel loop independent present(unew[:SIZE],vnew[:SIZE],pnew[:SIZE]) deviceptr(cu,cv,z,h,uold,vold,pold)
299+
#pragma acc parallel loop collapse(2) present(unew[:SIZE],vnew[:SIZE],pnew[:SIZE]) deviceptr(cu,cv,z,h,uold,vold,pold)
300300
for (i=0;i<M;i++) {
301301
for (j=0;j<N;j++) {
302302
int idx00 = (i*N_LEN) + j;
@@ -315,7 +315,7 @@ int main(int argc, char **argv) {
315315
// Periodic continuation
316316
#pragma acc parallel loop independent present(unew[:SIZE],vnew[:SIZE],pnew[:SIZE])
317317
for (j=0;j<N;j++) {
318-
#pragma acc cache(unew[M*N_LEN:N_LEN],vnew[:N_LEN],pnew[:N_LEN])
318+
//#pragma acc cache(unew[M*N_LEN:N_LEN],vnew[:N_LEN],pnew[:N_LEN])
319319
//printf("N loop unew %d -> %d, vnew %d -> %d , pnew %d -> %d\n",M*N_LEN+j,j,j+1,M*N_LEN +j + 1,j,M*N_LEN +j);
320320
unew[j] = unew[M*N_LEN+j];
321321
vnew[M*N_LEN +j + 1] = vnew[j + 1];

0 commit comments

Comments
 (0)