Skip to content
GitLab
Projects
Groups
Snippets
Help
Loading...
Help
What's new
7
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Open sidebar
AGULLO Emmanuel
Chameleon
Commits
54816087
Commit
54816087
authored
Sep 17, 2015
by
PRUVOST Florent
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
add eztrace chameleon_cuda module - not checked yet
parent
ca3d1e6f
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
1312 additions
and
0 deletions
+1312
-0
cudablas/eztrace_module/CMakeLists.txt
cudablas/eztrace_module/CMakeLists.txt
+78
-0
cudablas/eztrace_module/cudablas_eztrace_module
cudablas/eztrace_module/cudablas_eztrace_module
+1234
-0
No files found.
cudablas/eztrace_module/CMakeLists.txt
0 → 100644
View file @
54816087
###
#
# @copyright (c) 2009-2014 The University of Tennessee and The University
# of Tennessee Research Foundation.
# All rights reserved.
# @copyright (c) 2012-2015 Inria. All rights reserved.
# @copyright (c) 2012-2014 Bordeaux INP, CNRS (LaBRI UMR 5800), Inria, Univ. Bordeaux. All rights reserved.
#
###
#
# @file CMakeLists.txt
#
# @project MORSE
# MORSE is a software package provided by:
# Inria Bordeaux - Sud-Ouest,
# Univ. of Tennessee,
# King Abdullah University of Science and Technology,
# Univ. of California Berkeley,
# Univ. of Colorado Denver.
#
# @version 0.9.0
# @author Florent Pruvost
# @date 16-09-2015
#
###
# Build and install the EZTrace plugin for the Chameleon CUDA kernels.
#
# The plugin is produced in two steps:
#   1. eztrace_create_plugin turns the module description
#      (cudablas_eztrace_module) into a source tree under
#      ${CMAKE_CURRENT_BINARY_DIR}/output;
#   2. "make" is run inside that tree to build the libeztrace-*.so libraries.

# Look for EZTrace only if it has not been found already.
if (NOT EZTRACE_FOUND)
    find_package(EZTRACE)
endif()

if (EZTRACE_FOUND AND EZTRACE_DIR_FOUND)

    # Start from a NOTFOUND value before searching for the plugin generator
    # (presumably to force a fresh lookup on every configure -- TODO confirm).
    set(EZTRACE_eztrace_create_plugin_DIR "EZTRACE_eztrace_create_plugin_DIR-NOTFOUND")
    find_path(EZTRACE_eztrace_create_plugin_DIR
        NAMES eztrace_create_plugin
        HINTS ${EZTRACE_DIR_FOUND}/bin)

    if (EZTRACE_eztrace_create_plugin_DIR)

        set(EZTRACE_CREATE_PLUGIN "${EZTRACE_eztrace_create_plugin_DIR}/eztrace_create_plugin")

        # Step 1: generate the plugin sources from the module description.
        add_custom_command(
            OUTPUT  ${CMAKE_CURRENT_BINARY_DIR}/output
            COMMAND ${EZTRACE_CREATE_PLUGIN} ${CMAKE_CURRENT_SOURCE_DIR}/cudablas_eztrace_module
            DEPENDS ${CMAKE_CURRENT_SOURCE_DIR}/cudablas_eztrace_module)
        add_custom_target(eztrace-module-chameleon_cuda-dir ALL
            DEPENDS ${CMAKE_CURRENT_BINARY_DIR}/output)

        # Step 2: build the generated plugin.
        # The declared OUTPUT is the path the library is installed from (see
        # the install() rule below), so the build system can tell when this
        # step is up to date.
        add_custom_command(
            OUTPUT  ${CMAKE_CURRENT_BINARY_DIR}/output/libeztrace-convert-chameleon_cuda.so
            COMMAND make
            WORKING_DIRECTORY ${CMAKE_CURRENT_BINARY_DIR}/output
            DEPENDS ${CMAKE_CURRENT_BINARY_DIR}/output)
        add_custom_target(eztrace-module-chameleon_cuda-libs ALL
            DEPENDS ${CMAKE_CURRENT_BINARY_DIR}/output/libeztrace-convert-chameleon_cuda.so)

        # Both targets reference the rule generating "output"; order them
        # explicitly so a parallel build cannot run that rule twice at once.
        add_dependencies(eztrace-module-chameleon_cuda-libs
                         eztrace-module-chameleon_cuda-dir)

        # installation
        # ------------
        # NOTE(review): DESTINATION expects a single directory; confirm that
        # EZTRACE_LIBRARY_DIRS never holds more than one entry.
        install(
            FILES
                ${CMAKE_CURRENT_BINARY_DIR}/output/libeztrace-autostart-chameleon_cuda.so
                ${CMAKE_CURRENT_BINARY_DIR}/output/libeztrace-chameleon_cuda.so
                ${CMAKE_CURRENT_BINARY_DIR}/output/libeztrace-convert-chameleon_cuda.so
            DESTINATION ${EZTRACE_LIBRARY_DIRS})

    endif()

endif()
###
### END CMakeLists.txt
###
cudablas/eztrace_module/cudablas_eztrace_module
0 → 100644
View file @
54816087
BEGIN_MODULE
NAME chameleon_cuda
DESC "Module for Chameleon CUDA functions"
ID 7771
int CUDA_cgelqt(
void* m, void* n, void* nb,
void *da, void* ldda,
void *v, void* ldv,
void *dt, void* lddt,
void *t, void* ldt,
void *dd,
void *d, void* ldd,
void *tau,
void *hwork,
void *dwork,
void* stream);
int CUDA_cgemerge(
void* side, void* diag,
void* M, void* N,
void *A, void* LDA,
void *B, void* LDB,
void* stream);
int CUDA_cgemm_V2(
void* transa, void* transb,
int m, int n, int k,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_cgemm(
void* transa, void* transb,
int m, int n, int k,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_cgeqrt(
void* m, void* n, void* nb,
void *da, void* ldda,
void *v, void* ldv,
void *dt, void* lddt,
void *t, void* ldt,
void *dd,
void *d, void* ldd,
void *tau,
void *hwork,
void *dwork,
void* stream);
int CUDA_cgessm(
char storev, void* m, void* n, void* k, void* ib,
void* *ipiv,
void *dL1, void* lddl1,
void *dL, void* lddl,
void *dA, void* ldda,
void* info);
int CUDA_cgetrf_incpiv(
char storev, void* m, void* n, void* ib,
void *hA, void* ldha, void *dA, void* ldda,
void *hL, void* ldhl, void *dL, void* lddl,
void* *ipiv,
void *dwork, void* lddwork,
void* info);
int CUDA_cgetrf_nopiv(
void* m, void* n,
void *dA, void* ldda,
void* info);
int CUDA_chemm_V2(
void* side, void* uplo,
int m, int n,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_chemm(
void* side, void* uplo,
int m, int n,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_cher2k_V2(
void* uplo, void* trans,
int n, int k,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
float *beta,
void *C, int ldc,
void* stream);
int CUDA_cher2k(
void* uplo, void* trans,
int n, int k,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
float *beta,
void *C, int ldc,
void* stream);
int CUDA_cherk_V2(
void* uplo, void* trans,
int n, int k,
float *alpha,
const void *A, int lda,
float *beta,
void *B, int ldb,
void* stream);
int CUDA_cherk(
void* uplo, void* trans,
int n, int k,
float *alpha,
const void *A, int lda,
float *beta,
void *B, int ldb,
void* stream);
int CUDA_clauum(
char uplo, void* n,
void *dA, void* ldda, void* info);
int CUDA_cparfb(
void* side, void* trans,
void* direct, void* storev,
void* M1, void* N1,
void* M2, void* N2,
void* K, void* L,
void *A1, void* LDA1,
void *A2, void* LDA2,
void *V, void* LDV,
void *T, void* LDT,
void *WORK, void* LDWORK,
void *WORKC, void* LDWORKC,
void* stream);
int CUDA_cpotrf(
void* uplo, void* n,
void *dA, void* ldda, void* info);
int CUDA_cssssm(
void* storev, void* m1, void* n1,
void* m2, void* n2, void* k, void* ib,
void *dA1, void* ldda1,
void *dA2, void* ldda2,
void *dL1, void* lddl1,
void *dL2, void* lddl2,
void* *IPIV, void* info);
int CUDA_csymm_V2(
void* side, void* uplo,
int m, int n,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_csymm(
void* side, void* uplo,
int m, int n,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_csyr2k_V2(
void* uplo, void* trans,
int n, int k,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_csyr2k(
void* uplo, void* trans,
int n, int k,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_csyrk_V2(
void* uplo, void* trans,
int n, int k,
void *alpha,
const void *A, int lda,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_csyrk(
void* uplo, void* trans,
int n, int k,
void *alpha,
const void *A, int lda,
void *beta,
void *C, int ldc,
void* stream);
int CUDA_ctrmm_V2(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
void *alpha,
const void *A, int lda,
const void *B, int ldb,
void *C, int ldc,
void* stream);
int CUDA_ctrmm(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
void *alpha,
const void *A, int lda,
void *B, int ldb,
void* stream);
int CUDA_ctrsm_V2(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
const void *alpha,
const void *A, int lda,
void *B, int ldb,
void* stream);
int CUDA_ctrsm(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
void *alpha,
const void *A, int lda,
void *B, int ldb,
void* stream);
int CUDA_ctrtri(
void* uplo, void* diag, void* n,
void *dA, void* ldda, void* info);
int CUDA_ctslqt(
void* m, void* n, void* nb,
void *da1, void* ldda1,
void *da2, void* ldda2,
void *a2, void* lda2,
void *dt, void* lddt,
void *t, void* ldt,
void *dd,
void *d, void* ldd,
void *tau,
void *hwork,
void *dwork,
void* stream);
int CUDA_ctsmlq(
void* side, void* trans,
void* M1, void* N1,
void* M2, void* N2,
void* K, void* IB,
void *A1, void* LDA1,
void *A2, void* LDA2,
void *V, void* LDV,
void *T, void* LDT,
void *WORK, void* LDWORK,
void *WORKC, void* LDWORKC,
void* stream);
int CUDA_ctsmqr(
void* side, void* trans,
void* M1, void* N1,
void* M2, void* N2,
void* K, void* IB,
void *A1, void* LDA1,
void *A2, void* LDA2,
void *V, void* LDV,
void *T, void* LDT,
void *WORK, void* LDWORK,
void *WORKC, void* LDWORKC,
void* stream);
int CUDA_ctsqrt(
void* m, void* n, void* nb,
void *da1, void* ldda1,
void *da2, void* ldda2,
void *a2, void* lda2,
void *dt, void* lddt,
void *t, void* ldt,
void *dd,
void *d, void* ldd,
void *tau,
void *hwork,
void *dwork,
void* stream);
int CUDA_ctstrf(
char storev, void* m, void* n, void* ib, void* nb,
void *hU, void* ldhu, void *dU, void* lddu,
void *hA, void* ldha, void *dA, void* ldda,
void *hL, void* ldhl, void *dL, void* lddl,
void* *ipiv,
void *hwork, void* ldhwork,
void *dwork, void* lddwork,
void* info);
int CUDA_cunmlqt(
void* side, void* trans,
void* M, void* N, void* K, void* IB,
void *A, void* LDA,
void *T, void* LDT,
void *C, void* LDC,
void *WORK, void* LDWORK );
int CUDA_cunmqrt(
void* side, void* trans,
void* M, void* N, void* K, void* IB,
void *A, void* LDA,
void *T, void* LDT,
void *C, void* LDC,
void *WORK, void* LDWORK );
int CUDA_dgelqt(
void* m, void* n, void* nb,
double *da, void* ldda,
double *v, void* ldv,
double *dt, void* lddt,
double *t, void* ldt,
double *dd,
double *d, void* ldd,
double *tau,
double *hwork,
double *dwork,
void* stream);
int CUDA_dgemerge(
void* side, void* diag,
void* M, void* N,
double *A, void* LDA,
double *B, void* LDB,
void* stream);
int CUDA_dgemm_V2(
void* transa, void* transb,
int m, int n, int k,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dgemm(
void* transa, void* transb,
int m, int n, int k,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dgeqrt(
void* m, void* n, void* nb,
double *da, void* ldda,
double *v, void* ldv,
double *dt, void* lddt,
double *t, void* ldt,
double *dd,
double *d, void* ldd,
double *tau,
double *hwork,
double *dwork,
void* stream);
int CUDA_dgessm(
char storev, void* m, void* n, void* k, void* ib,
void* *ipiv,
double *dL1, void* lddl1,
double *dL, void* lddl,
double *dA, void* ldda,
void* info);
int CUDA_dgetrf_incpiv(
char storev, void* m, void* n, void* ib,
double *hA, void* ldha, double *dA, void* ldda,
double *hL, void* ldhl, double *dL, void* lddl,
void* *ipiv,
double *dwork, void* lddwork,
void* info);
int CUDA_dgetrf_nopiv(
    void* m, void* n,
    double *dA, void* ldda,
    void* info);
int CUDA_dlauum(
char uplo, void* n,
double *dA, void* ldda, void* info);
int CUDA_dparfb(
void* side, void* trans,
void* direct, void* storev,
void* M1, void* N1,
void* M2, void* N2,
void* K, void* L,
double *A1, void* LDA1,
double *A2, void* LDA2,
const double *V, void* LDV,
const double *T, void* LDT,
double *WORK, void* LDWORK,
double *WORKC, void* LDWORKC,
void* stream);
int CUDA_dpotrf(
void* uplo, void* n,
double *dA, void* ldda, void* info);
int CUDA_dssssm(
void* storev, void* m1, void* n1,
void* m2, void* n2, void* k, void* ib,
double *dA1, void* ldda1,
double *dA2, void* ldda2,
double *dL1, void* lddl1,
double *dL2, void* lddl2,
void* *IPIV, void* info);
int CUDA_dsymm_V2(
void* side, void* uplo,
int m, int n,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dsymm(
void* side, void* uplo,
int m, int n,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dsyr2k_V2(
void* uplo, void* trans,
int n, int k,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dsyr2k(
void* uplo, void* trans,
int n, int k,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dsyrk_V2(
void* uplo, void* trans,
int n, int k,
double *alpha,
const double *A, int lda,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dsyrk(
void* uplo, void* trans,
int n, int k,
double *alpha,
const double *A, int lda,
double *beta,
double *C, int ldc,
void* stream);
int CUDA_dtrmm_V2(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
double *alpha,
const double *A, int lda,
const double *B, int ldb,
double *C, int ldc,
void* stream);
int CUDA_dtrmm(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
double *alpha,
const double *A, int lda,
double *B, int ldb,
void* stream);
int CUDA_dtrsm_V2(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
const double *alpha,
const double *A, int lda,
double *B, int ldb,
void* stream);
int CUDA_dtrsm(
void* side, void* uplo,
void* transa, void* diag,
int m, int n,
double *alpha,
const double *A, int lda,
double *B, int ldb,
void* stream);
int CUDA_dtrtri(
void* uplo, void* diag, void* n,
double *dA, void* ldda, void* info);
int CUDA_dtslqt(
void* m, void* n, void* nb,
double *da1, void* ldda1,
double *da2, void* ldda2,
double *a2, void* lda2,
double *dt, void* lddt,
double *t, void* ldt,
double *dd,
double *d, void* ldd,
double *tau,
double *hwork,
double *dwork,
void* stream);
int CUDA_dtsmlq(
void* side, void* trans,