Mentions légales du service

Skip to content
Snippets Groups Projects
Commit 521fe1d6 authored by Mathieu Faverge
Browse files

gepdf_qdwh: enforce the use of the original lacpy

parent 036be0d1
No related branches found
No related tags found
1 merge request: !307 "GETRF NOPIV: Use explicit workspaces to control the communication flow"
...@@ -15,7 +15,7 @@ ...@@ -15,7 +15,7 @@
* @author Mathieu Faverge * @author Mathieu Faverge
* @author Hatem Ltaief * @author Hatem Ltaief
* @author Lionel Eyraud-Dubois * @author Lionel Eyraud-Dubois
* @date 2023-07-05 * @date 2024-10-17
* @precisions normal z -> s d c * @precisions normal z -> s d c
* *
*/ */
...@@ -35,8 +35,8 @@ static int _zgepdf_qdwh_opt_genD = 1; ...@@ -35,8 +35,8 @@ static int _zgepdf_qdwh_opt_genD = 1;
static int _zgepdf_qdwh_opt_genD = 0; static int _zgepdf_qdwh_opt_genD = 0;
#endif #endif
static int _zgepdf_qdwh_opt_qr = 1; static int _zgepdf_qdwh_opt_qr = 1;
static int _zgepdf_qdwh_opt_id = 1; // There is a numerical issue when combining this optimization and the StarPU lacpy static int _zgepdf_qdwh_opt_id = 1;
static int _zgepdf_qdwh_verbose = 0; static int _zgepdf_qdwh_verbose = 0;
/** /**
...@@ -603,6 +603,7 @@ chameleon_pzgepdf_qdwh( cham_mtxtype_t mtxtype, CHAM_desc_t *descU, CHAM_desc_t ...@@ -603,6 +603,7 @@ chameleon_pzgepdf_qdwh( cham_mtxtype_t mtxtype, CHAM_desc_t *descU, CHAM_desc_t
double conv = 100.; double conv = 100.;
double normest, Unorm; double normest, Unorm;
int it, itconv, facto = -1; int it, itconv, facto = -1;
cham_bool_t optlacpy_backup;
double eps = CHAMELEON_dlamch(); double eps = CHAMELEON_dlamch();
double tol1 = 5. * eps; double tol1 = 5. * eps;
...@@ -615,6 +616,10 @@ chameleon_pzgepdf_qdwh( cham_mtxtype_t mtxtype, CHAM_desc_t *descU, CHAM_desc_t ...@@ -615,6 +616,10 @@ chameleon_pzgepdf_qdwh( cham_mtxtype_t mtxtype, CHAM_desc_t *descU, CHAM_desc_t
} }
assert( chamctxt->scheduler != RUNTIME_SCHED_PARSEC ); assert( chamctxt->scheduler != RUNTIME_SCHED_PARSEC );
/* Force unoptimized lacpy */
optlacpy_backup = chamctxt->optlacpy_enabled;
chamctxt->optlacpy_enabled = CHAMELEON_FALSE;
if ( info ) { if ( info ) {
info->itQR = 0; info->itQR = 0;
info->itPO = 0; info->itPO = 0;
...@@ -848,5 +853,8 @@ chameleon_pzgepdf_qdwh( cham_mtxtype_t mtxtype, CHAM_desc_t *descU, CHAM_desc_t ...@@ -848,5 +853,8 @@ chameleon_pzgepdf_qdwh( cham_mtxtype_t mtxtype, CHAM_desc_t *descU, CHAM_desc_t
&descB2, &descTS2, &descTT2, &descQ2, &descD2 ); &descB2, &descTS2, &descTT2, &descQ2, &descD2 );
CHAMELEON_zgemm_WS_Free( gemm_ws ); CHAMELEON_zgemm_WS_Free( gemm_ws );
/* Restore optimized lacpy value */
chamctxt->optlacpy_enabled = optlacpy_backup;
return; return;
} }
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment