Skip to content
Snippets Groups Projects
Commit ba1cb161 authored by gkusoglu
Browse files

symm

parent 37d4b070
Branches
No related merge requests found
......@@ -90,22 +90,20 @@ void kernel_symm(int m, int n,
// C is MxN
// Note: because of the Fortran array layout, the code below more closely resembles the upper-triangular case in BLAS.
#pragma scop
for (i = 0; i < _PB_M; i++){
#pragma omp parallel for
for (i = 0; i < _PB_M; i++){
#pragma omp parallel for
for (k = 0; k < i; k++)
for (j = 0; j < _PB_N; j++ )
for (k = 0; k < i; k++)
C[k][j] += alpha*B[i][j] * A[i][k];
for (j = 0; j < _PB_N; j++ ){
temp2 = 0;
for (k = 0; k < i; k++) {
temp2 += B[k][j] * A[i][k];
}
C[i][j] = beta * C[i][j] + alpha*B[i][j] * A[i][i] + alpha * temp2;
}
}
C[k][j] += alpha*B[i][j] * A[i][k];
for (j = 0; j < _PB_N; j++ ){
temp2 = 0;
for (k = 0; k < i; k++) {
temp2 += B[k][j] * A[i][k];
}
C[i][j] = beta * C[i][j] + alpha*B[i][j] * A[i][i] + alpha * temp2;
}
}
#pragma endscop
}
......
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment