/**
 *
 * @file time_zpotrf_tile.c
 *
 * @copyright 2009-2014 The University of Tennessee and The University of
 *                      Tennessee Research Foundation. All rights reserved.
 * @copyright 2012-2018 Bordeaux INP, CNRS (LaBRI UMR 5800), Inria,
 *                      Univ. Bordeaux. All rights reserved.
 *
 ***
 *
 * @version 1.0.0
 * @precisions normal z -> c d s
 *
 */
/*
 * Per-routine settings defined before the shared driver is textually included.
 * Presumably read by timing.c -- TODO confirm against that file.
 * NOTE(review): identifiers of the form _Uppercase are reserved by the C
 * standard; the names are kept unchanged because the included driver is
 * expected to reference them.
 */
#define _TYPE  CHAMELEON_Complex64_t
#define _PREC  double
#define _LAMCH LAPACKE_dlamch_work

#define _NAME  "CHAMELEON_zpotrf_Tile"
/* See Lawn 41 page 120 */
#define _FMULS FMULS_POTRF( N )
#define _FADDS FADDS_POTRF( N )

#include "./timing.c"

static int
28
RunTest( int *iparam, double *dparam, chameleon_time_t *t_ )
29 30
{
    PASTE_CODE_IPARAM_LOCALS( iparam );
31
    cham_uplo_t uplo = ChamUpper;
32

33
    LDA = chameleon_max( LDA, N );
34 35

    /* Allocate Data */
36 37 38 39
    PASTE_CODE_ALLOCATE_MATRIX_TILE( descA,  1,     CHAMELEON_Complex64_t, ChamComplexDouble, LDA, N, N    );
    PASTE_CODE_ALLOCATE_MATRIX_TILE( descB,  check, CHAMELEON_Complex64_t, ChamComplexDouble, LDB, N, NRHS );
    PASTE_CODE_ALLOCATE_MATRIX_TILE( descAC, check, CHAMELEON_Complex64_t, ChamComplexDouble, LDA, N, N    );
    PASTE_CODE_ALLOCATE_MATRIX_TILE( descX,  check, CHAMELEON_Complex64_t, ChamComplexDouble, LDB, N, NRHS );
40

41 42 43 44 45 46 47
    /* Initialize data and save A if check */
    if ( check ) {
        CHAMELEON_zplghe_Tile( (double)N, ChamUpperLower, descAC, 51 );
        CHAMELEON_zlacpy_Tile( uplo, descAC, descA );
    }
    else {
        CHAMELEON_zplghe_Tile( (double)N, uplo, descA, 51 );
48 49 50
    }
    //RUNTIME_zlocality_allrestrict( STARPU_CUDA );

51
    /* CHAMELEON ZPOTRF */
52
    START_TIMING();
53
    CHAMELEON_zpotrf_Tile( uplo, descA );
54 55 56 57 58
    STOP_TIMING();

    /* Check the solution */
    if ( check )
    {
59
        /* Initialize and save B */
60
        CHAMELEON_zplrnt_Tile( descB, 7672 );
61
        CHAMELEON_zlacpy_Tile( ChamUpperLower, descB, descX );
62 63

        /* Compute the solution */
64
        CHAMELEON_zpotrs_Tile( uplo, descA, descX );
65 66

        /* Check solution */
67 68 69
        dparam[IPARAM_ANORM] = CHAMELEON_zlange_Tile( ChamInfNorm, descAC );
        dparam[IPARAM_BNORM] = CHAMELEON_zlange_Tile( ChamInfNorm, descB  );
        dparam[IPARAM_XNORM] = CHAMELEON_zlange_Tile( ChamInfNorm, descX  );
70
        CHAMELEON_zgemm_Tile( ChamNoTrans, ChamNoTrans, 1.0, descAC, descX, -1.0, descB );
71
        dparam[IPARAM_RES] = CHAMELEON_zlange_Tile( ChamInfNorm, descB );
72 73 74 75 76 77 78 79 80 81

        PASTE_CODE_FREE_MATRIX( descB  );
        PASTE_CODE_FREE_MATRIX( descAC );
        PASTE_CODE_FREE_MATRIX( descX  );

    }
    PASTE_CODE_FREE_MATRIX( descA );

    return 0;
}