Commit 54816087 authored by PRUVOST Florent

add eztrace chameleon_cuda module - not checked yet

parent ca3d1e6f
###
#
# @copyright (c) 2009-2014 The University of Tennessee and The University
# of Tennessee Research Foundation.
# All rights reserved.
# @copyright (c) 2012-2015 Inria. All rights reserved.
# @copyright (c) 2012-2014 Bordeaux INP, CNRS (LaBRI UMR 5800), Inria, Univ. Bordeaux. All rights reserved.
#
###
#
# @file CMakeLists.txt
#
# @project MORSE
# MORSE is a software package provided by:
# Inria Bordeaux - Sud-Ouest,
# Univ. of Tennessee,
# King Abdullah University of Science and Technology,
# Univ. of California Berkeley,
# Univ. of Colorado Denver.
#
# @version 0.9.0
# @author Florent Pruvost
# @date 16-09-2015
#
###
# Generate, build and install the EZTrace plugin described by the
# cudablas_eztrace_module template.
#
# Steps:
#   1. locate the eztrace_create_plugin tool inside the EZTrace installation;
#   2. run it on the template, which produces the "output" directory in the
#      current binary directory;
#   3. run make inside that directory to build the plugin libraries;
#   4. install the resulting libraries next to the EZTrace ones.
#
# Nothing is configured when EZTrace or eztrace_create_plugin is not found.
if(NOT EZTRACE_FOUND)
  find_package(EZTRACE)
endif()

if(EZTRACE_FOUND AND EZTRACE_DIR_FOUND)

  # Start from a NOTFOUND value before searching.
  # NOTE(review): presumably meant to force a fresh search on every
  # configure run instead of reusing a stale result - confirm.
  set(EZTRACE_eztrace_create_plugin_DIR "EZTRACE_eztrace_create_plugin_DIR-NOTFOUND")
  find_path(EZTRACE_eztrace_create_plugin_DIR
    NAMES eztrace_create_plugin
    HINTS ${EZTRACE_DIR_FOUND}/bin)

  if(EZTRACE_eztrace_create_plugin_DIR)

    set(EZTRACE_CREATE_PLUGIN "${EZTRACE_eztrace_create_plugin_DIR}/eztrace_create_plugin")

    # Directory created by eztrace_create_plugin and the libraries that the
    # make step is expected to leave in it (these are the files installed
    # below).
    set(chameleon_cuda_plugin_dir "${CMAKE_CURRENT_BINARY_DIR}/output")
    set(chameleon_cuda_plugin_libs
      "${chameleon_cuda_plugin_dir}/libeztrace-autostart-chameleon_cuda.so"
      "${chameleon_cuda_plugin_dir}/libeztrace-chameleon_cuda.so"
      "${chameleon_cuda_plugin_dir}/libeztrace-convert-chameleon_cuda.so")

    # Step 2: generate the plugin sources from the template.
    add_custom_command(
      OUTPUT "${chameleon_cuda_plugin_dir}"
      COMMAND "${EZTRACE_CREATE_PLUGIN}"
              "${CMAKE_CURRENT_SOURCE_DIR}/cudablas_eztrace_module"
      DEPENDS "${CMAKE_CURRENT_SOURCE_DIR}/cudablas_eztrace_module"
      WORKING_DIRECTORY "${CMAKE_CURRENT_BINARY_DIR}"
      VERBATIM
    )
    add_custom_target(
      eztrace-module-chameleon_cuda-dir ALL
      DEPENDS "${chameleon_cuda_plugin_dir}"
    )

    # Step 3: build the plugin libraries.
    # The outputs are given with their full path inside the "output"
    # directory: a relative OUTPUT is resolved against the current binary
    # directory, where make never writes, so the rule would be considered
    # out of date (and re-run) on every build.
    add_custom_command(
      OUTPUT ${chameleon_cuda_plugin_libs}
      COMMAND make
      WORKING_DIRECTORY "${chameleon_cuda_plugin_dir}"
      DEPENDS "${chameleon_cuda_plugin_dir}"
      VERBATIM
    )
    add_custom_target(
      eztrace-module-chameleon_cuda-libs ALL
      DEPENDS ${chameleon_cuda_plugin_libs}
    )
    # Both targets reach the rule that generates the "output" directory.
    # Ordering them prevents a parallel build from running the generator
    # twice at the same time.
    add_dependencies(
      eztrace-module-chameleon_cuda-libs
      eztrace-module-chameleon_cuda-dir
    )

    # installation
    # ------------
    install(
      FILES ${chameleon_cuda_plugin_libs}
      DESTINATION ${EZTRACE_LIBRARY_DIRS}
    )

  endif()

endif()
###
### END CMakeLists.txt
###
BEGIN_MODULE
NAME chameleon_cuda
DESC "Module for Chameleon CUDA functions"
ID 7771
int CUDA_cgelqt(
void* m, void* n, void* nb,
void *da, void* ldda,
void *v, void* ldv,
void *dt, void* lddt,
void *t, void* ldt,
void *dd,
void *d, void* ldd,
void *tau,
void *hwork,
void *dwork,
void* stream);
int CUDA_cgemerge(
void* side, void* diag,
void* M, void* N,
void *A, void* LDA,
void *B, void* LDB,
void* stream);
int CUDA_cgemm_V2(
void* transa, void* transb,
int m, int n, int k,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_cgemm(
void* transa, void* transb,
int m, int n, int k,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_cgeqrt(
void* m, void* n, void* nb,
void *da, void* ldda,
void *v, void* ldv,
void *dt, void* lddt,
void *t, void* ldt,
void *dd,
void *d, void* ldd,
void *tau,
void *hwork,
void *dwork,
void* stream);
int CUDA_cgessm(
char storev, void* m, void* n, void* k, void* ib,
void* *ipiv,
void *dL1, void* lddl1,
void *dL, void* lddl,
void *dA, void* ldda,
void* info);
int CUDA_cgetrf_incpiv(
char storev, void* m, void* n, void* ib,
void *hA, void* ldha, void *dA, void* ldda,
void *hL, void* ldhl, void *dL, void* lddl,
void* *ipiv,
void *dwork, void* lddwork,
void* info);
int CUDA_cgetrf_nopiv(
void* m, void* n,
void *dA, void* ldda,
void* info);
int CUDA_chemm_V2(
void* side, void* uplo,
int m, int n,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_chemm(
void* side, void* uplo,
int m, int n,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_cher2k_V2(
void* uplo, void* trans,
int n, int k,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
float *beta,
void *C, int ldc,
void* stream);
int CUDA_cher2k(
void* uplo, void* trans,
int n, int k,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
float *beta,
void *C, int ldc,
void* stream);
int CUDA_cherk_V2(
void* uplo, void* trans,
int n, int k,
float *alpha,
const void *A, int lda,
float *beta,
void *B, int ldb,
void* stream);
int CUDA_cherk(
void* uplo, void* trans,
int n, int k,
float *alpha,
const void *A, int lda,
float *beta,
void *B, int ldb,
void* stream);
int CUDA_clauum(
char uplo, void* n,
void *dA, void* ldda, void* info);
int CUDA_cparfb(
void* side, void* trans,
void* direct, void* storev,
void* M1, void* N1,
void* M2, void* N2,
void* K, void* L,
void *A1, void* LDA1,
void *A2, void* LDA2,
void *V, void* LDV,
void *T, void* LDT,
void *WORK, void* LDWORK,
void *WORKC, void* LDWORKC,
void* stream);
int CUDA_cpotrf(
void* uplo, void* n,
void *dA, void* ldda, void* info);
int CUDA_cssssm(
void* storev, void* m1, void* n1,
void* m2, void* n2, void* k, void* ib,
void *dA1, void* ldda1,
void *dA2, void* ldda2,
void *dL1, void* lddl1,
void *dL2, void* lddl2,
void* *IPIV, void* info);
int CUDA_csymm_V2(
void* side, void* uplo,
int m, int n,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_csymm(
void* side, void* uplo,
int m, int n,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_csyr2k_V2(
void* uplo, void* trans,
int n, int k,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_csyr2k(
void* uplo, void* trans,
int n, int k,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_csyrk_V2(
void* uplo, void* trans,
int n, int k,
void *alpha,
const void *A, int lda,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_csyrk(
void* uplo, void* trans,
int n, int k,
void *alpha,
const void *A, int lda,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_ctrmm_V2(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *C, int ldc,
void* stream);
int CUDA_ctrmm(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
void *alpha,
const void *A, int lda,
void *B, int ldb,
void* stream);
int CUDA_ctrsm_V2(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
const void *alpha,
const void *A, int lda,
void *B, int ldb,
void* stream);
int CUDA_ctrsm(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
void *alpha,
const void *A, int lda,
void *B, int ldb,
void* stream);
int CUDA_ctrtri(
void* uplo, void* diag, void* n,
void *dA, void* ldda, void* info);
int CUDA_ctslqt(
void* m, void* n, void* nb,
void *da1, void* ldda1,
void *da2, void* ldda2,
void *a2, void* lda2,
void *dt, void* lddt,
void *t, void* ldt,
void *dd,
void *d, void* ldd,
void *tau,
void *hwork,
void *dwork,
void* stream);
int CUDA_ctsmlq(
void* side, void* trans,
void* M1, void* N1,
void* M2, void* N2,
void* K, void* IB,
void *A1, void* LDA1,
void *A2, void* LDA2,
void *V, void* LDV,
void *T, void* LDT,
void *WORK, void* LDWORK,
void *WORKC, void* LDWORKC,
void* stream);
int CUDA_ctsmqr(
void* side, void* trans,
void* M1, void* N1,
void* M2, void* N2,
void* K, void* IB,
void *A1, void* LDA1,
void *A2, void* LDA2,
void *V, void* LDV,
void *T, void* LDT,
void *WORK, void* LDWORK,
void *WORKC, void* LDWORKC,
void* stream);
int CUDA_ctsqrt(
void* m, void* n, void* nb,
void *da1, void* ldda1,
void *da2, void* ldda2,
void *a2, void* lda2,
void *dt, void* lddt,
void *t, void* ldt,
void *dd,
void *d, void* ldd,
void *tau,
void *hwork,
void *dwork,
void* stream);
int CUDA_ctstrf(
char storev, void* m, void* n, void* ib, void* nb,
void *hU, void* ldhu, void *dU, void* lddu,
void *hA, void* ldha, void *dA, void* ldda,
void *hL, void* ldhl, void *dL, void* lddl,
void* *ipiv,
void *hwork, void* ldhwork,
void *dwork, void* lddwork,
void* info);
int CUDA_cunmlqt(
void* side, void* trans,
void* M, void* N, void* K, void* IB,
void *A, void* LDA,
void *T, void* LDT,
void *C, void* LDC,
void *WORK, void* LDWORK );
int CUDA_cunmqrt(
void* side, void* trans,
void* M, void* N, void* K, void* IB,
void *A, void* LDA,
void *T, void* LDT,
void *C, void* LDC,
void *WORK, void* LDWORK );
int CUDA_dgelqt(
void* m, void* n, void* nb,
double *da, void* ldda,
double *v, void* ldv,
double *dt, void* lddt,
double *t, void* ldt,
double *dd,
double *d, void* ldd,
double *tau,
double *hwork,
double *dwork,
void* stream);
int CUDA_dgemerge(
void* side, void* diag,
void* M, void* N,
double *A, void* LDA,
double *B, void* LDB,
void* stream);
int CUDA_dgemm_V2(
void* transa, void* transb,
int m, int n, int k,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dgemm(
void* transa, void* transb,
int m, int n, int k,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dgeqrt(
void* m, void* n, void* nb,
double *da, void* ldda,
double *v, void* ldv,
double *dt, void* lddt,
double *t, void* ldt,
double *dd,
double *d, void* ldd,
double *tau,
double *hwork,
double *dwork,
void* stream);
int CUDA_dgessm(
char storev, void* m, void* n, void* k, void* ib,
void* *ipiv,
double *dL1, void* lddl1,
double *dL, void* lddl,
double *dA, void* ldda,
void* info);
int CUDA_dgetrf_incpiv(
char storev, void* m, void* n, void* ib,
double *hA, void* ldha, double *dA, void* ldda,
double *hL, void* ldhl, double *dL, void* lddl,
void* *ipiv,
double *dwork, void* lddwork,
void* info);
int CUDA_dgetrf_nopiv(
void* m, void* n,
double *dA, void* ldda,
void* info);
int CUDA_dlauum(
char uplo, void* n,
double *dA, void* ldda, void* info);
int CUDA_dparfb(
void* side, void* trans,
void* direct, void* storev,
void* M1, void* N1,
void* M2, void* N2,
void* K, void* L,
double *A1, void* LDA1,
double *A2, void* LDA2,
const double *V, void* LDV,
const double *T, void* LDT,
double *WORK, void* LDWORK,
double *WORKC, void* LDWORKC,
void* stream);
int CUDA_dpotrf(
void* uplo, void* n,
double *dA, void* ldda, void* info);
int CUDA_dssssm(
void* storev, void* m1, void* n1,
void* m2, void* n2, void* k, void* ib,
double *dA1, void* ldda1,
double *dA2, void* ldda2,
double *dL1, void* lddl1,
double *dL2, void* lddl2,
void* *IPIV, void* info);
int CUDA_dsymm_V2(
void* side, void* uplo,
int m, int n,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dsymm(
void* side, void* uplo,
int m, int n,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dsyr2k_V2(
void* uplo, void* trans,
int n, int k,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dsyr2k(
void* uplo, void* trans,
int n, int k,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dsyrk_V2(
void* uplo, void* trans,
int n, int k,
double *alpha,
const double *A, int lda,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dsyrk(
void* uplo, void* trans,
int n, int k,
double *alpha,
const double *A, int lda,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dtrmm_V2(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *C, int ldc,
void* stream);
int CUDA_dtrmm(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
double *alpha,
const double *A, int lda,
double *B, int ldb,
void* stream);
int CUDA_dtrsm_V2(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
const double *alpha,
const double *A, int lda,
double *B, int ldb,
void* stream);
int CUDA_dtrsm(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
double *alpha,
const double *A, int lda,
double *B, int ldb,
void* stream);
int CUDA_dtrtri(
void* uplo, void* diag, void* n,
double *dA, void* ldda, void* info);
int CUDA_dtslqt(
void* m, void* n, void* nb,
double *da1, void* ldda1,
double *da2, void* ldda2,
double *a2, void* lda2,
double *dt, void* lddt,
double *t, void* ldt,
double *dd,
double *d, void* ldd,
double *tau,
double *hwork,
double *dwork,
void* stream);
int CUDA_dtsmlq(
void* side, void* trans,