OpenACC Tutorial - Adding directives: Difference between revisions

No edit summary
No edit summary
No edit summary
Line 260: Line 260:
</translate>
</translate>
{{Command
{{Command
|pgc++ -fast -Minfo{{=}}accel -ta{{=}}tesla:managed main.cpp -o challenge
|nvc++ -fast -Minfo{{=}}accel -ta{{=}}tesla:managed main.cpp -o challenge
|result=
|result=
matvec(const matrix &, const vector &, const vector &):
matvec(const matrix &, const vector &, const vector &):
     23, include "matrix_functions.h"
     23, include "matrix_functions.h"
           27, Generating copyout(ycoefs[:num_rows])
           27, Generating implicit copyout(ycoefs[:num_rows]) [if not already present]
               Generating copyin(xcoefs[:],Acoefs[:],cols[:],row_offsets[:num_rows+1])
               Generating implicit copyin(xcoefs[:],row_offsets[:num_rows+1],Acoefs[:],cols[:]) [if not already present]
           29, Loop is parallelizable
           30, Loop is parallelizable
              Accelerator kernel generated
               Generating Tesla code
               Generating Tesla code
               29, #pragma acc loop gang, vector(128) /* blockIdx.x threadIdx.x */
               30, #pragma acc loop gang /* blockIdx.x */
           33, Loop is parallelizable
              34, #pragma acc loop vector(128) /* threadIdx.x */
                  Generating implicit reduction(+:sum)
           34, Loop is parallelizable
}}
}}
<translate>
<translate>
Bureaucrats, cc_docs_admin, cc_staff, rsnt_translations
2,837 edits