Bureaucrats, cc_docs_admin, cc_staff, rsnt_translations
2,837
edits
No edit summary |
No edit summary |
||
Line 260: | Line 260: | ||
</translate> | </translate> | ||
{{Command | {{Command | ||
| | |nvc++ -fast -Minfo{{=}}accel -ta{{=}}tesla:managed main.cpp -o challenge | ||
|result= | |result= | ||
matvec(const matrix &, const vector &, const vector &): | matvec(const matrix &, const vector &, const vector &): | ||
23, include "matrix_functions.h" | 23, include "matrix_functions.h" | ||
27, Generating copyout(ycoefs[:num_rows]) | 27, Generating implicit copyout(ycoefs[:num_rows]) [if not already present] | ||
Generating copyin(xcoefs[:],row_offsets[:num_rows+1],Acoefs[:],cols[:]) | Generating implicit copyin(xcoefs[:],row_offsets[:num_rows+1],Acoefs[:],cols[:]) [if not already present] | ||
30, Loop is parallelizable | |||
Generating Tesla code | Generating Tesla code | ||
30, #pragma acc loop gang /* blockIdx.x */ | |||
34, #pragma acc loop vector(128) /* threadIdx.x */ | |||
Generating implicit reduction(+:sum) | |||
34, Loop is parallelizable | |||
}} | }} | ||
<translate> | <translate> |