From 312391def5e2656e63c91f34b3eb5fe2843cee03 Mon Sep 17 00:00:00 2001 From: Mathieu Faverge <mathieu.faverge@inria.fr> Date: Wed, 7 Feb 2018 13:54:17 +0100 Subject: [PATCH] Silent bug issue related to a = a in hetra1 kernels --- coreblas/compute/core_ztsmlq_hetra1.c | 6 ++++-- coreblas/compute/core_ztsmqr_hetra1.c | 6 ++++-- 2 files changed, 8 insertions(+), 4 deletions(-) diff --git a/coreblas/compute/core_ztsmlq_hetra1.c b/coreblas/compute/core_ztsmlq_hetra1.c index e7edbe4be..e7903c4e0 100644 --- a/coreblas/compute/core_ztsmlq_hetra1.c +++ b/coreblas/compute/core_ztsmlq_hetra1.c @@ -143,8 +143,9 @@ int CORE_ztsmlq_hetra1( MORSE_enum side, MORSE_enum trans, /* in-place transposition of A1 */ for (j = 0; j < n1; j++){ +#if defined(PRECISION_z) || defined(PRECISION_c) A1[j + j*lda1] = conj(A1[j + j*lda1]); - +#endif for (i = j+1; i < m1; i++){ *WORK = *(A1 + i + j*lda1); *(A1 + i + j*lda1) = conj(*(A1 + j + i*lda1)); @@ -159,8 +160,9 @@ int CORE_ztsmlq_hetra1( MORSE_enum side, MORSE_enum trans, /* in-place transposition of A1 */ for (j = 0; j < n1; j++){ +#if defined(PRECISION_z) || defined(PRECISION_c) A1[j + j*lda1] = conj(A1[j + j*lda1]); - +#endif for (i = j+1; i < m1; i++){ *WORK = *(A1 + i + j*lda1); *(A1 + i + j*lda1) = conj(*(A1 + j + i*lda1)); diff --git a/coreblas/compute/core_ztsmqr_hetra1.c b/coreblas/compute/core_ztsmqr_hetra1.c index e0675ddff..f66c27f11 100644 --- a/coreblas/compute/core_ztsmqr_hetra1.c +++ b/coreblas/compute/core_ztsmqr_hetra1.c @@ -145,8 +145,9 @@ int CORE_ztsmqr_hetra1( MORSE_enum side, MORSE_enum trans, /* in-place transposition of A1 */ for (j = 0; j < n1; j++){ +#if defined(PRECISION_z) || defined(PRECISION_c) A1[j + j*lda1] = conj(A1[j + j*lda1]); - +#endif for (i = j+1; i < m1; i++){ *WORK = *(A1 + i + j*lda1); *(A1 + i + j*lda1) = conj(*(A1 + j + i*lda1)); @@ -158,8 +159,9 @@ int CORE_ztsmqr_hetra1( MORSE_enum side, MORSE_enum trans, /* in-place transposition of A1 */ for (j = 0; j < n1; j++){ +#if defined(PRECISION_z) || 
defined(PRECISION_c) A1[j + j*lda1] = conj(A1[j + j*lda1]); - +#endif for (i = j+1; i < m1; i++){ *WORK = *(A1 + i + j*lda1); *(A1 + i + j*lda1) = conj(*(A1 + j + i*lda1)); -- GitLab