Skip to content
Snippets Groups Projects
Commit e893cacf authored by gkusoglu's avatar gkusoglu
Browse files

Trying to optimize doitgen

parent 397ad5c2
Branches
No related merge requests found
......@@ -70,21 +70,18 @@ void kernel_doitgen(int nr, int nq, int np,
int r, q, p, s;
#pragma scop
#pragma omp parallel for ordered schedule(static)
for (q = 0; q < _PB_NQ; q++)
#pragma omp ordered
for (r = 0; r < _PB_NR; r++){
#pragma omp parallel for
#pragma omp parallel for schedule(static)
for (p = 0; p < _PB_NP; p++)
sum[p] = SCALAR_VAL(0.0);
#pragma omp parallel for
for (s = 0; s < _PB_NP; s++)
for (p = 0; p < _PB_NP; p++)
sum[p] += A[r][q][s] * C4[s][p];
#pragma omp parallel for
#pragma omp parallel for schedule(static)
for (p = 0; p < _PB_NP; p++)
A[r][q][p] = sum[p];
}
......
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment