/**
 *
 * @file pzlacpy.c
 *
 * @copyright 2009-2014 The University of Tennessee and The University of
 *                      Tennessee Research Foundation. All rights reserved.
 * @copyright 2012-2018 Bordeaux INP, CNRS (LaBRI UMR 5800), Inria,
 *                      Univ. Bordeaux. All rights reserved.
 *
 ***
 *
 * @brief Chameleon zlacpy parallel algorithm
 *
 * @version 1.0.0
 * @comment This file has been automatically generated
 *          from Plasma 2.5.0 for CHAMELEON 1.0.0
 * @author Mathieu Faverge
 * @author Emmanuel Agullo
 * @author Cedric Castagnede
 * @date 2010-11-15
 * @precisions normal z -> s d c
 *
 */
#include "control/common.h"
/* Expand a tile coordinate into the three arguments "descriptor, row, column",
 * where the descriptor is whatever identifier named A (resp. B) is in scope
 * at the point of use. */
#define A(row, col) A, row, col
#define B(row, col) B, row, col
/**
29
 *
30 31
 */
/**
32
 *
33
 */
Mathieu Faverge's avatar
Mathieu Faverge committed
34
void chameleon_pzlacpy(cham_uplo_t uplo, CHAM_desc_t *A, CHAM_desc_t *B,
35
                          RUNTIME_sequence_t *sequence, RUNTIME_request_t *request)
36
{
Mathieu Faverge's avatar
Mathieu Faverge committed
37
    CHAM_context_t *chamctxt;
38
    RUNTIME_option_t options;
39 40 41 42 43

    int X, Y;
    int m, n;
    int ldam, ldbm;

Mathieu Faverge's avatar
Mathieu Faverge committed
44
    chamctxt = chameleon_context_self();
Mathieu Faverge's avatar
Mathieu Faverge committed
45
    if (sequence->status != CHAMELEON_SUCCESS) {
46
        return;
Mathieu Faverge's avatar
Mathieu Faverge committed
47
    }
Mathieu Faverge's avatar
Mathieu Faverge committed
48
    RUNTIME_options_init(&options, chamctxt, sequence, request);
49 50 51

    switch (uplo) {
    /*
52
     *  ChamUpper
53
     */
54
    case ChamUpper:
55 56 57 58 59 60
        for (m = 0; m < A->mt; m++) {
            X = m == A->mt-1 ? A->m-m*A->mb : A->mb;
            ldam = BLKLDD(A, m);
            ldbm = BLKLDD(B, m);
            if (m < A->nt) {
                Y = m == A->nt-1 ? A->n-m*A->nb : A->nb;
61
                INSERT_TASK_zlacpy(
62
                    &options,
63
                    ChamUpper,
64 65 66 67 68 69
                    X, Y, A->mb,
                    A(m, m), ldam,
                    B(m, m), ldbm);
            }
            for (n = m+1; n < A->nt; n++) {
                Y = n == A->nt-1 ? A->n-n*A->nb : A->nb;
70
                INSERT_TASK_zlacpy(
71
                    &options,
72
                    ChamUpperLower,
73 74 75 76 77 78 79
                    X, Y, A->mb,
                    A(m, n), ldam,
                    B(m, n), ldbm);
            }
        }
        break;
    /*
80
     *  ChamLower
81
     */
82
    case ChamLower:
83 84 85 86 87 88
        for (m = 0; m < A->mt; m++) {
            X = m == A->mt-1 ? A->m-m*A->mb : A->mb;
            ldam = BLKLDD(A, m);
            ldbm = BLKLDD(B, m);
            if (m < A->nt) {
                Y = m == A->nt-1 ? A->n-m*A->nb : A->nb;
89
                INSERT_TASK_zlacpy(
90
                    &options,
91
                    ChamLower,
92 93 94 95
                    X, Y, A->mb,
                    A(m, m), ldam,
                    B(m, m), ldbm);
            }
96
            for (n = 0; n < chameleon_min(m, A->nt); n++) {
97
                Y = n == A->nt-1 ? A->n-n*A->nb : A->nb;
98
                INSERT_TASK_zlacpy(
99
                    &options,
100
                    ChamUpperLower,
101 102 103 104 105 106 107
                    X, Y, A->mb,
                    A(m, n), ldam,
                    B(m, n), ldbm);
            }
        }
        break;
    /*
108
     *  ChamUpperLower
109
     */
110
    case ChamUpperLower:
111 112 113 114 115 116 117
    default:
        for (m = 0; m < A->mt; m++) {
            X = m == A->mt-1 ? A->m-m*A->mb : A->mb;
            ldam = BLKLDD(A, m);
            ldbm = BLKLDD(B, m);
            for (n = 0; n < A->nt; n++) {
                Y = n == A->nt-1 ? A->n-n*A->nb : A->nb;
118
                INSERT_TASK_zlacpy(
119
                    &options,
120
                    ChamUpperLower,
121 122 123 124 125 126
                    X, Y, A->mb,
                    A(m, n), ldam,
                    B(m, n), ldbm);
            }
        }
    }
Mathieu Faverge's avatar
Mathieu Faverge committed
127
    RUNTIME_options_finalize(&options, chamctxt);
128
}