-
Mathieu Faverge authoredMathieu Faverge authored
codelet_ztpqrt.c 2.79 KiB
/**
*
* @file starpu/codelet_ztpqrt.c
*
* @copyright 2009-2016 The University of Tennessee and The University of
* Tennessee Research Foundation. All rights reserved.
* @copyright 2012-2023 Bordeaux INP, CNRS (LaBRI UMR 5800), Inria,
* Univ. Bordeaux. All rights reserved.
*
***
*
* @brief Chameleon ztpqrt StarPU codelet
*
* @version 1.2.0
* @author Mathieu Faverge
* @author Florent Pruvost
* @author Lucas Barros de Assis
* @author Samuel Thibault
* @date 2022-02-22
* @precisions normal z -> s d c
*
*/
#include "chameleon_starpu.h"
#include "runtime_codelet_z.h"
#if !defined(CHAMELEON_SIMULATION)
static void cl_ztpqrt_cpu_func(void *descr[], void *cl_arg)
{
int M;
int N;
int L;
int ib;
CHAM_tile_t *tileA;
CHAM_tile_t *tileB;
CHAM_tile_t *tileT;
CHAM_tile_t *tileWORK;
tileA = cti_interface_get(descr[0]);
tileB = cti_interface_get(descr[1]);
tileT = cti_interface_get(descr[2]);
tileWORK = cti_interface_get(descr[3]); /* ib * nb */
starpu_codelet_unpack_args( cl_arg, &M, &N, &L, &ib );
TCORE_zlaset( ChamUpperLower, ib, N, 0., 0., tileT );
TCORE_ztpqrt( M, N, L, ib,
tileA, tileB, tileT, tileWORK->mat );
}
#endif /* !defined(CHAMELEON_SIMULATION) */
/*
* Codelet definition
*/
CODELETS_CPU(ztpqrt, cl_ztpqrt_cpu_func)
void INSERT_TASK_ztpqrt( const RUNTIME_option_t *options,
int M, int N, int L, int ib, int nb,
const CHAM_desc_t *A, int Am, int An,
const CHAM_desc_t *B, int Bm, int Bn,
const CHAM_desc_t *T, int Tm, int Tn )
{
struct starpu_codelet *codelet = &cl_ztpqrt;
void (*callback)(void*) = options->profiling ? cl_ztpqrt_callback : NULL;
CHAMELEON_BEGIN_ACCESS_DECLARATION;
CHAMELEON_ACCESS_RW(A, Am, An);
CHAMELEON_ACCESS_RW(B, Bm, Bn);
CHAMELEON_ACCESS_W(T, Tm, Tn);
CHAMELEON_END_ACCESS_DECLARATION;
rt_starpu_insert_task(