diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml index d8b822d39283599f02292a1638d73d43109d7e0f..38622491e3585c9187e61402fea384adbc27c9ef 100644 --- a/.gitlab-ci.yml +++ b/.gitlab-ci.yml @@ -1,5 +1,6 @@ --- stages: + - pre - build - test - analyse diff --git a/.gitlab/build.yml b/.gitlab/build.yml index d6e8941f31159555c30b7e22ebdbfc1c6d39219e..22931bfc7b4f074dacc39af50eed9a80437c504e 100644 --- a/.gitlab/build.yml +++ b/.gitlab/build.yml @@ -51,7 +51,7 @@ build_starpu_simgrid: VERSION: starpu_simgrid build_starpu_macosx: - extends: .only-branches + extends: .only-merge-request stage: build tags: ['macosx'] variables: diff --git a/.gitlab/common.yml b/.gitlab/common.yml index f55aeb523a0a82330ad33ed72ed8dd3fa3c488f7..50833083b31d9622d9f6bbb89c95abd7bba02a43 100644 --- a/.gitlab/common.yml +++ b/.gitlab/common.yml @@ -6,24 +6,26 @@ default: image: registry.gitlab.inria.fr/solverstack/docker/distrib tags: ['ci.inria.fr', 'linux', 'large'] +# push event: executed only if the source branch name is master or starts with ci- +# merge request event: not executed +# schedule event: not executed .only-master: - except: ['schedule'] interruptible: true - only: - - master@solverstack/chameleon - - /^ci-.*$/ + rules: + - if: ($CI_COMMIT_BRANCH == $CI_DEFAULT_BRANCH || $CI_COMMIT_BRANCH =~ /^ci-.*$/) && $CI_PIPELINE_SOURCE != "schedule" -.only-branches: - except: ['schedule'] +# push event: executed only if the source branch name is master or starts with ci- +# merge request event: executed if the source branch name does not start with notest- +# schedule event: not executed +.only-merge-request: interruptible: true - only: - - merge_requests - - master@solverstack/chameleon - - /^ci-.*$/ + rules: + - if: ($CI_COMMIT_BRANCH == $CI_DEFAULT_BRANCH || $CI_COMMIT_BRANCH =~ /^ci-.*$/) && $CI_PIPELINE_SOURCE != "schedule" + - if: ($CI_MERGE_REQUEST_IID && $CI_MERGE_REQUEST_SOURCE_BRANCH_NAME !~ /^notest-.*$/) && $CI_PIPELINE_SOURCE != "schedule" .build_script_template: stage: build - extends: .only-branches + extends: .only-merge-request script: - ./.gitlab/build.sh artifacts: @@ -49,7 +51,8 @@ default: junit: junit.xml .bench_plafrim_common: - only: ['schedule'] + rules: + - if: $CI_PIPELINE_SOURCE == "schedule" stage: test tags: ['plafrim'] timeout: 1 week diff --git a/.gitlab/coverage.yml b/.gitlab/coverage.yml index 44d5576aece499b46004ebac402b6014542d16e5..d2393faac21fdd530c43f30a3fc71d2b1332445e 100644 --- a/.gitlab/coverage.yml +++ b/.gitlab/coverage.yml @@ -6,8 +6,7 @@ # --- coverage: - only: - - merge_requests + extends: .only-merge-request interruptible: true stage: analyse script: diff --git a/.gitlab/pages.yml b/.gitlab/pages.yml index 41aec70ac0decefb48477bff53e4fde8743b899a..8ae81ed8b24dac4580b1f3d9a64cd176f851d6d6 100644 --- a/.gitlab/pages.yml +++ b/.gitlab/pages.yml @@ -1,6 +1,7 @@ --- pages: stage: deploy + extends: .only-master dependencies: [] artifacts: name: "$CI_JOB_NAME-$CI_COMMIT_REF_SLUG" @@ -11,7 +12,3 @@ pages: VERSION: pages script: - ./tools/pages.sh - only: - - master@solverstack/chameleon - - /^ci.*$/ - interruptible: true diff --git a/.gitlab/preliminary.yml b/.gitlab/preliminary.yml index a1e137cb5c50729c3bc685baf10004c8ebc28b19..8c1a66437c5adaa75cad9539a45683cdc82c435b 100644 --- a/.gitlab/preliminary.yml +++ b/.gitlab/preliminary.yml @@ -3,13 +3,14 @@ # --- preliminary_checks: - stage: .pre + stage: pre + interruptible: true + rules: + - if: ($CI_COMMIT_BRANCH == $CI_DEFAULT_BRANCH || $CI_COMMIT_BRANCH =~ /^ci-.*$/) && $CI_PIPELINE_SOURCE != "schedule" + - if: $CI_MERGE_REQUEST_IID && $CI_PIPELINE_SOURCE != "schedule" parallel: matrix: - TEST: [rebase, draft, header] script: - .gitlab/check_ci.sh $TEST - only: - - merge_requests - interruptible: true diff --git a/.gitlab/release.yml b/.gitlab/release.yml index 5ed711f56a328f09fcc63b16806ac43925cad2ab..eade839d37879f0245921eba17df7055770e611d 100644 --- a/.gitlab/release.yml +++ b/.gitlab/release.yml @@ -1,6 +1,8 @@ --- release: stage: deploy + rules: + - if: $CI_COMMIT_BRANCH =~ /^release-.*$/ && $CI_PIPELINE_SOURCE != "schedule" dependencies: [] artifacts: name: "$CI_JOB_NAME-$CI_COMMIT_REF_SLUG" @@ -11,7 +13,3 @@ release: VERSION: release script: - ./tools/release.sh - only: - - /^release-.*$/ - except: - - schedules diff --git a/.gitlab/test_hmat.yml b/.gitlab/test_hmat.yml index 894dc50f1bf2fee033023d2503625ee38421102b..23cc8a5ccafb89740441997f21c4b62b98b0dccb 100644 --- a/.gitlab/test_hmat.yml +++ b/.gitlab/test_hmat.yml @@ -12,7 +12,7 @@ .test_hmat_template_branches: &test_hmat_branches extends: - .test_hmat_template - - .only-branches + - .only-merge-request test_hmat: <<: *test_hmat_branches diff --git a/.gitlab/test_openmp.yml b/.gitlab/test_openmp.yml index b026ae4517879090e8b69e599ba256200d20f49e..dbb9271bc368a565ca4682de47707e4082706820 100644 --- a/.gitlab/test_openmp.yml +++ b/.gitlab/test_openmp.yml @@ -12,7 +12,7 @@ .test_openmp_template_branches: &test_openmp_branches extends: - .test_openmp_template - - .only-branches + - .only-merge-request test_openmp_shm_s: <<: *test_openmp_master diff --git a/.gitlab/test_parsec.yml b/.gitlab/test_parsec.yml index ae137fafe09f5cdb72f8aef0252943e6439a0fba..842c7f13fbf3f6793774e238c6fd3c62632dab69 100644 --- a/.gitlab/test_parsec.yml +++ b/.gitlab/test_parsec.yml @@ -12,7 +12,7 @@ .test_parsec_template_branches: &test_parsec_branches extends: - .test_parsec_template - - .only-branches + - .only-merge-request test_parsec_shm_s: <<: *test_parsec_master diff --git a/.gitlab/test_quark.yml b/.gitlab/test_quark.yml index 98d27b947e4352e0b127ee480c8a349e621cb5f1..29421613ea23a9a4aa879e91337c41c91e2cecbe 100644 --- a/.gitlab/test_quark.yml +++ b/.gitlab/test_quark.yml @@ -12,7 +12,7 @@ .test_quark_template_branches: &test_quark_branches extends: - .test_quark_template - - .only-branches + - .only-merge-request test_quark_shm_s: <<: *test_quark_branches diff --git a/.gitlab/test_starpu.yml b/.gitlab/test_starpu.yml index 2574cdc8a80a980549619f0f0e1dd773a509df17..251204f0b8e91c962afdb0d2efd7ebde11b3d29d 100644 --- a/.gitlab/test_starpu.yml +++ b/.gitlab/test_starpu.yml @@ -12,7 +12,7 @@ .test_starpu_template_branches: &test_starpu_branches extends: - .test_starpu_template - - .only-branches + - .only-merge-request test_starpu_shm_s: <<: *test_starpu_master @@ -79,7 +79,7 @@ test_starpu_mpi_z: TESTS_RESTRICTION: "-R \"_${CATEGORY}_${PRECISION}\"" test_starpu_shm_s_macosx: - extends: .only-branches + extends: .only-merge-request stage: test tags: ['macosx'] needs: [build_starpu_macosx] diff --git a/.gitlab/test_starpu_simgrid.yml b/.gitlab/test_starpu_simgrid.yml index 0cd7b9ff3cbc40739592a7ee3694fc2a465a0daf..17ae0afb6c2458e52f96eb5188f451c16e4829f7 100644 --- a/.gitlab/test_starpu_simgrid.yml +++ b/.gitlab/test_starpu_simgrid.yml @@ -12,7 +12,7 @@ .test_starpu_simgrid_template_branches: &test_starpu_simgrid_branches extends: - .test_starpu_simgrid_template - - .only-branches + - .only-merge-request test_starpu_simgrid_simu_all: <<: *test_starpu_simgrid_branches diff --git a/distrib/debian/install_dependencies.sh b/distrib/debian/install_dependencies.sh index 1256a7c1c83dd834df7971149e78810df5c0eb63..795b4c2df32dd51359af5d8633409f2577ab3f90 100755 --- a/distrib/debian/install_dependencies.sh +++ b/distrib/debian/install_dependencies.sh @@ -2,7 +2,7 @@ # whatis: standard development environment to use the chameleon library sudo apt-get update -y -sudo apt-get install build-essential git gfortran cmake doxygen python pkg-config libopenblas-dev liblapacke-dev libstarpu-dev libopenmpi-dev libhwloc-dev -y +sudo apt-get install build-essential git gfortran cmake doxygen python-is-python3 pkg-config libopenblas-dev liblapacke-dev libstarpu-dev libopenmpi-dev libhwloc-dev -y # libopenblas-dev can be replaced by libmkl-dev or liblapack-dev # install chameleon with cmake diff --git a/doc/user/chapters/installing.org b/doc/user/chapters/installing.org index a8ed8454e2314556c1632f0f3cc8cbcfce246d1e..eeedfe097db6ebb82fac55fa208b7c7d216fdcb8 100644 --- a/doc/user/chapters/installing.org +++ b/doc/user/chapters/installing.org @@ -48,6 +48,7 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and Optional libraries: - cuda: [[https://developer.nvidia.com/cuda-downloads][cuda]], [[http://docs.nvidia.com/cuda/cublas/][cublas]] (comes with cuda) - mpi: [[http://www.open-mpi.org/][openmpi]], [[https://www.mpich.org/][mpich]], [[https://software.intel.com/en-us/mpi-library][intelmpi]] + - rocm: [[https://github.com/ROCm-Developer-Tools/HIP][HIP]] and [[https://github.com/ROCmSoftwarePlatform/hipBLAS][hipBLAS]] These packages must be installed on the system before trying to configure/build chameleon. Please look at the distrib/ directory @@ -78,14 +79,20 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and sudo apt-get install -y libfxt-dev # Install cuda and cuBLAS: only if you have a GPU cuda compatible sudo apt-get install -y nvidia-cuda-toolkit nvidia-cuda-dev + # Install HIP and hipBLAS: only if you have a GPU AMD compatible + curl -fsSL https://repo.radeon.com/rocm/rocm.gpg.key | sudo gpg --dearmor -o /etc/apt/trusted.gpg.d/rocm-keyring.gpg + echo 'deb [arch=amd64 signed-by=/etc/apt/trusted.gpg.d/rocm-keyring.gpg] https://repo.radeon.com/rocm/apt/5.4.2 jammy main' | sudo tee /etc/apt/sources.list.d/rocm.list + echo -e 'Package: *\nPin: release o=repo.radeon.com\nPin-Priority: 600' | sudo tee /etc/apt/preferences.d/rocm-pin-600 + sudo apt-get update + sudo apt-get install -y rocm-hip-sdk # If you prefer a specific version of StarPU, install it yourself, e.g. # Install StarPU (with MPI and FxT enabled) mkdir -p $HOME/install cd $HOME/install - wget https://files.inria.fr/starpu/starpu-1.3.7/starpu-1.3.7.tar.gz - tar xvzf starpu-1.3.7.tar.gz - cd starpu-1.3.7/ + wget https://files.inria.fr/starpu/starpu-1.3.10/starpu-1.3.10.tar.gz + tar xvzf starpu-1.3.10.tar.gz + cd starpu-1.3.10/ ./configure --prefix=/usr/local --with-fxt=/usr/lib/x86_64-linux-gnu/ make -j5 sudo make install @@ -261,6 +268,11 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and *Caution about the compatibility:* your compiler must be compatible with CUDA. +***** HIP + [[https://github.com/ROCm-Developer-Tools/HIP][HIP]] is a C++ Runtime + API and Kernel Language that allows developers to create portable + applications for AMD and NVIDIA GPUs from single source code. + *** Build and install Chameleon with CMake :PROPERTIES: :CUSTOM_ID: doc-install-cmake @@ -309,8 +321,7 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and -DCMAKE_INSTALL_PREFIX=/home/jdoe/install/ \ -DCHAMELEON_USE_CUDA=ON \ -DCHAMELEON_USE_MPI=ON \ - -DBLA_VENDOR=Intel10_64lp \ - -DCHAMELEON_ENABLE_TRACING=ON + -DBLA_VENDOR=Intel10_64lp_seq #+end_src You can get the full list of options with *-L[A][H]* options of cmake command @@ -322,13 +333,13 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and ***** Native CMake options (non-exhaustive list) * *CMAKE_BUILD_TYPE=Debug|Release|RelWithDebInfo|MinSizeRel*: - level of compiler optimization, enable/disable debug - information - * *CMAKE_INSTALL_PREFIX=path/to/your/install/dir*: where headers, - libraries, executables, etc, will be copied when invoking make - install - * *BUILD_SHARED_LIBS=ON|OFF*: indicates whether or not CMake has to - build Chameleon static (~OFF~) or shared (~ON~) libraries. + level of compiler optimization, enable/disable debug information. + * *CMAKE_PREFIX_PATH="path1;path2"*: + where paths denotes root to dependencies that may be installed with CMake. + * *CMAKE_INSTALL_PREFIX=path/to/your/install/dir*: + where headers, libraries, executables, etc, will be copied when invoking make install. + * *BUILD_SHARED_LIBS=ON|OFF*: + indicates whether or not CMake has to build Chameleon static (~OFF~) or shared (~ON~) libraries. * *CMAKE_C_COMPILER=gcc|icc|...*: to choose the C compilers if several exist in the environment * *CMAKE_Fortran_COMPILER=gfortran|ifort|...*: to choose the @@ -336,8 +347,8 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and ***** Related to specific modules (find_package) to find external libraries * *BLA_VENDOR=All|OpenBLAS|Generic|Intel10_64lp|Intel10_64lp_seq|FLAME*: - to use intel mkl for example, see the list of BLA_VENDOR in - FindBLAS.cmake in cmake_modules/morse_cmake/modules/find + to use intel mkl for example, see the list of + [[https://cmake.org/cmake/help/latest/module/FindBLAS.html][BLA_VENDOR]]. Libraries detected with an official cmake module (see module files in CMAKE_ROOT/Modules/): BLAS - LAPACK - CUDA - MPI - @@ -357,9 +368,17 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and nodes with distributed memory), can only be used with StarPU and PaRSEC * *CHAMELEON_USE_CUDA=ON|OFF* (default OFF): to link with CUDA - runtime (implementation paradigm for accelerated codes on GPUs) - and cuBLAS library (optimized BLAS kernels on GPUs), can only + runtime (implementation paradigm for accelerated codes on Nvidia GPUs) + and cuBLAS library (optimized BLAS kernels on Nvidia GPUs), can only be used with StarPU and PaRSEC + * *CHAMELEON_USE_HIP_ROC=ON|OFF* (default OFF): to link with HIP + runtime (implementation paradigm for accelerated codes on AMD GPUs) + and hipBLAS library (optimized BLAS kernels on AMD GPUs), can only + be used with StarPU + * *CHAMELEON_USE_HIP_CUDA=ON|OFF* (default OFF): to link with HIP + runtime (implementation paradigm for accelerated codes on Nvidia GPUs) + and hipBLAS library (optimized BLAS kernels on Nvidia GPUs), can only + be used with StarPU * *CHAMELEON_ENABLE_DOC=ON|OFF* (default OFF): to control build of the documentation contained in doc/ sub-directory * *CHAMELEON_ENABLE_EXAMPLE=ON|OFF* (default ON): to control build @@ -373,12 +392,22 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and simulation mode, means Chameleon will not really execute tasks, see details in section [[sec:simu][Use simulation mode with StarPU-SimGrid]]. This option must be used with StarPU compiled - with [[http://simgrid.gforge.inria.fr/][SimGrid]] allowing to guess the execution time on any + with [[https://framagit.org/simgrid/simgrid][SimGrid]] allowing to guess the execution time on any architecture. This feature should be used to make experiments on the scheduler behaviors and performances not to produce solutions of linear systems. - * *CHAMELEON_USE_MIGRATE=ON|OFF* (default OFF): enables the data - migration in QR algorithms + * *CHAMELEON_USE_MIGRATE=ON|OFF* (default OFF): + enables the data migration in QR algorithms. + * *CHAMELEON_USE_MPI_DATATYPES* (default OFF): + enables MPI datatypes whenever supported by the runtime. + * *CHAMELEON_USE_HMAT=ON|OFF* (default OFF): + enables Hmat-OSS kernels. + * *CHAMELEON_RUNTIME_SYNC* (default OFF): + enables synchronous task submission when available to debug the code without parallelism. + * *CHAMELEON_KERNELS_TRACE* (default OFF): + enables kernel traces to debug the task execution order. + * *CHAMELEON_KERNELS_MT* (default OFF): + Use multithreaded kernels (e.g. intel MKL MT) **** Dependencies detection <<sec:depdet>> @@ -386,7 +415,10 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and You have different choices to detect dependencies on your system, either by setting some environment variables containing paths to the libs and headers or by specifying them directly at cmake - configure. Different cases: + configure. In any case, if the dependencies are installed in non + standard directories, do not forget to use the ~PKG_CONFIG_PATH~ + environment variable and the ~CMAKE_PREFIX_PATH~ environment (or CMake) + variable. Different cases: 1) detection of dependencies through environment variables: - LD_LIBRARY_PATH (DYLD_LIBRARY_PATH on Mac OSX) should contain @@ -423,6 +455,8 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and - update your *PKG_CONFIG_PATH* to the paths where to find .pc files of installed external libraries like hwloc, starpu, some blas/lapack, etc + 5) using [[https://cmake.org/cmake/help/latest/variable/CMAKE_PREFIX_PATH.html#variable:CMAKE_PREFIX_PATH][CMAKE_PREFIX_PATH]] + for libraries that provide some CMake config files containing targets definitions (e.g. fooConfig.cmake). Note that PaRSEC and StarPU are only detected with pkg-config mechanism because it is always provided and this avoids errors. @@ -474,15 +508,21 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and Docker/Singularity images with Guix. **** Installing Guix - Guix requires a running GNU/Linux system, GNU tar and Xz. - #+begin_src sh - gpg --keyserver pgp.mit.edu --recv-keys 3CE464558A84FDC69DB40CFB090B11993D9AEBB5 + [[https://guix.gnu.org/][Guix]] requires a running GNU/Linux system, GNU tar and Xz. + Follow the [[https://guix.gnu.org/manual/en/html_node/Binary-Installation.html#Binary-Installation][installation instructions]] + #+begin_src sh :eval never-export + cd /tmp wget https://git.savannah.gnu.org/cgit/guix.git/plain/etc/guix-install.sh chmod +x guix-install.sh sudo ./guix-install.sh #+end_src + or on Debian + #+begin_src sh :eval never-export + sudo apt install guix + #+end_src + The Chameleon packages are not official Guix packages. It is then necessary to add a channel to get additional packages. Create a ~/.config/guix/channels.scm file with the following snippet: @@ -523,25 +563,29 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and Standard Chameleon, last release #+begin_src sh guix install chameleon + # or use guix shell to get a new shell (isolated from the native environment) with chameleon available in the PATH + guix shell --pure chameleon -- /bin/bash --norc #+end_src Notice that there exist several build variants - chameleon (default) : with starpu - with mpi - with OpenBlas - chameleon-mkl-mt : default version but with Intel MKL multithreaded to replace OpenBlas + - chameleon-mkl-mt-wompi : with Intel MKL multithreaded and without mpi - chameleon-cuda : with starpu - with mpi - with cuda + - chameleon-cuda-wompi : with starpu - without mpi - with cuda - chameleon-cuda-mkl-mt : with starpu - with mpi - with cuda - with Intel MKL multithreaded to replace OpenBlas + - chameleon-cuda-mkl-mt-wompi : with starpu - without mpi - with cuda - with Intel MKL multithreaded to replace OpenBlas - chameleon-simgrid : with starpu - with mpi - with simgrid - chameleon-openmp : with openmp - without mpi - chameleon-parsec : with parsec - without mpi - chameleon-quark : with quark - without mpi - Change the version #+begin_src sh guix install chameleon --with-branch=chameleon=master guix install chameleon --with-commit=chameleon=b31d7575fb7d9c0e1ba2d8ec633e16cb83778e8b guix install chameleon --with-git-url=chameleon=https://gitlab.inria.fr/fpruvost/chameleon.git - guix install chameleon --with-git-url=chameleon=$HOME/git/chameleon + guix install chameleon --with-source=chameleon=$HOME/git/chameleon #+end_src Notice also that default mpi is OpenMPI and default blas/lapack is @@ -605,17 +649,50 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and To package Chameleon and its dependencies within a singularity image (OpenMPI stack) #+begin_src sh - singularity_chameleon=`guix pack -f squashfs chameleon --with-branch=chameleon=master --with-input=openblas=mkl mkl starpu hwloc openmpi openssh slurm hdf5 zlib bash coreutils inetutils util-linux procps git grep tar sed gzip which gawk perl emacs-minimal vim gcc-toolchain make cmake pkg-config -S /bin=bin --entry-point=/bin/bash` - cp $singularity_chameleon chameleon-pack.gz.squashfs + # define reproducible guix environment + guix describe -f channels > guix-channels.scm + guix shell --export-manifest chameleon-cuda --with-branch=chameleon=master --with-input=openblas=mkl bash coreutils emacs gawk grep inetutils openmpi openssh procps sed time util-linux vim which > guix-manifests.scm + SINGULARITY_IMAGE=`guix time-machine -C guix-channels.scm -- pack -f squashfs -m guix-manifests.scm -S /bin=bin --entry-point=/bin/bash` + cp $SINGULARITY_IMAGE chameleon-cuda.gz.sif + # copy the singularity image on the supercomputer, e.g. 'supercomputer' - scp chameleon-pack.gz.squashfs supercomputer: + scp chameleon-cuda.gz.sif supercomputer: #+end_src On a machine where Singularity is installed Chameleon can then be called as follows #+begin_src sh # at least openmpi and singularity are required here, e.g. module add openmpi singularity - mpiexec -np 2 singularity exec chameleon-pack.gz.squashfs /bin/chameleon_stesting -H -o gemm -P 2 -t 2 -m 2000 -n 2000 -k 2000 + module add openmpi singularity + export SINGULARITY_CMD=`which singularity` + export SINGULARITY_IMAGE=$HOME/chameleon-cuda.gz.sif + # use LD_PRELOAD to give the location of the CUDA driver installed on the supercomputer + export LD_PRELOAD=/usr/lib/x86_64-linux-gnu/libcuda.so + # then in your allocation with Slurm or OAR, for example + mpirun $MPI_OPTIONS -x LD_PRELOAD $SINGULARITY_CMD exec --bind /usr/lib/x86_64-linux-gnu/:/usr/lib/x86_64-linux-gnu/ $SINGULARITY_IMAGE chameleon_stesting -o gemm -n 96000 -b 1600 --nowarmup -g 2 + #+end_src + +**** Generate a tar.gz package of Chameleon with Guix + + One can generate a tar.gz archive the same way as the singularity image + #+begin_src sh + guix describe -f channels > guix-channels.scm + guix shell --export-manifest chameleon-cuda --with-branch=chameleon=master --with-input=openblas=mkl bash coreutils emacs gawk grep inetutils openmpi openssh procps sed time util-linux vim which > guix-manifests.scm + PACKRR=`guix time-machine --channels=guix-channels.scm -- pack -RR --manifest=guix-manifests.scm -S /bin=bin` + cp $PACKRR chameleon-cuda.tar.gz + # copy the archive on the supercomputer, e.g. 'supercomputer' + scp chameleon-cuda.tar.gz supercomputer: + #+end_src + + Then on the supercomputer that has neither Guix nor Singularity one can do the following + #+begin_src sh + mkdir guixrr/ + cd guixrr/ + tar xvf $HOME/chameleon-cuda.tar.gz + chmod +w . + export GUIX_ROOT=$PWD + # then in your allocation with Slurm or OAR, for example + ${GUIX_ROOT}/bin/mpirun --launch-agent ${GUIX_ROOT}/bin/orted -x GUIX_EXECUTION_ENGINE=performance -x LD_PRELOAD="/usr/lib64/libcuda.so" -x STARPU_SILENT=1 ${GUIX_ROOT}/bin/chameleon_stesting -o gemm -n 16000,32000,64000,96000,128000 -b 2000 -g 4 -P 2 #+end_src *** Distribution of Chameleon using Spack @@ -626,18 +703,15 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and **** Installing Spack - To get support to install a full distribution on Linux or MacOS X, - Chameleon plus dependencies, we encourage users to use - [[https://spack.io/][Spack]]. Please refer to our [[https://gitlab.inria.fr/solverstack/spack-repo/blob/master/README.org][Spack Repository]]. + We provide a Chameleon [[https://github.com/spack/spack][Spack]] package (with StarPU) for Linux or macOS. + Please refer to the [[https://spack.readthedocs.io/en/latest/][documentation]] for installation instructions. #+begin_src sh - git clone https://github.com/llnl/spack.git - export SPACK_ROOT=$PWD/spack - cd spack/ - git checkout v0.16.0 - . $SPACK_ROOT/share/spack/setup-env.sh - git clone https://gitlab.inria.fr/solverstack/spack-repo.git ./var/spack/repos/solverstack - spack repo add ./var/spack/repos/solverstack + # please read https://spack.readthedocs.io/en/latest/getting_started.html + git clone https://github.com/spack/spack.git + . spack/share/spack/setup-env.sh + cd spack + git checkout v0.19.1 #+end_src Chameleon is then available @@ -646,8 +720,9 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and spack spec chameleon #+end_src - Refer to te [[https://spack.readthedocs.io/en/latest/basic_usage.html][official documentation of Spack]] to learn the basic - commands. + Refer to the [[https://spack.readthedocs.io/en/latest/getting_started.html][getting started guide]] + and [[https://spack.readthedocs.io/en/latest/basic_usage.html][basic usage guide]] + to learn how to use Spack properly. **** Installing Chameleon with Spack @@ -658,7 +733,7 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and spack location -i chameleon #+end_src - Notice that there exist several build variants + Notice that there exist several build variants (see ~spack info chameleon~) - chameleon (default) : with starpu - with mpi - tune the build type (CMake) with build_type=RelWithDebInfo|Debug|Release - enable/disable shared libraries with +/- shared @@ -666,12 +741,11 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and - enable/disable cuda with +/- cuda - enable/disable fxt with +/- fxt - enable/disable simgrid with +/- simgrid - - +openmp~starpu : with openmp - without starpu - - +quark~starpu : with quark - without starpu + - runtime=openmp : with openmp - without starpu Change the version #+begin_src sh - spack install -v chameleon@1.0.0 + spack install -v chameleon@master #+end_src Notice also that default mpi is OpenMPI and default blas/lapack is @@ -685,10 +759,9 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and # see mpi providers spack providers mpi # install chameleon with intel mkl to replace openblas - spack install -v chameleon ^intel-mkl - # install chameleon with nmad to replace openmpi - spack install -v chameleon ^nmad + spack install -v chameleon ^intel-mkl # or ^intel-oneapi-mkl #+end_src + *** Distribution Brew for Mac OS X :PROPERTIES: :CUSTOM_ID: doc-install-macos @@ -726,7 +799,7 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and # installed under <prefix>/lib/cmake/chameleon/ by setting your # CMAKE_PREFIX_PATH with the path of installation. In your cmake project, use # find_package(CHAMELEON) and link your libraries and/or executables with the - # library target MORSE::CHAMELEON + # library target CHAMELEON::chameleon cmake . -DCMAKE_PREFIX_PATH=$CHAMELEON_ROOT #+end_src **** For non CMake projects @@ -769,11 +842,11 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and /home/yourname/install/chameleon/lib/libchameleon.a \ /home/yourname/install/chameleon/lib/libchameleon_starpu.a \ /home/yourname/install/chameleon/lib/libcoreblas.a \ - -lstarpu-1.2 -Wl,--no-as-needed -lmkl_intel_lp64 \ + -lstarpu-1.3 -Wl,--no-as-needed -lmkl_intel_lp64 \ -lmkl_sequential -lmkl_core -lpthread -lm -lrt #+end_src As you can see in this example, we also link with some dynamic - libraries *starpu-1.2*, *Intel MKL* libraries (for + libraries *starpu-1.3*, *Intel MKL* libraries (for BLAS/LAPACK/CBLAS/LAPACKE), *pthread*, *m* (math) and *rt*. These libraries will depend on the configuration of your Chameleon build. You can find these dependencies in .pc files we generate @@ -798,7 +871,7 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and gcc main.o -o main \ -L/home/yourname/install/chameleon/lib \ -lchameleon -lchameleon_starpu -lcoreblas \ - -lstarpu-1.2 -Wl,--no-as-needed -lmkl_intel_lp64 \ + -lstarpu-1.3 -Wl,--no-as-needed -lmkl_intel_lp64 \ -lmkl_sequential -lmkl_core -lpthread -lm -lrt #+end_src Note that an update of your environment variable LD_LIBRARY_PATH @@ -829,7 +902,7 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and # # /home/yourname/install/chameleon/lib/libchameleon.a \ # # /home/yourname/install/chameleon/lib/libchameleon_starpu.a \ # # /home/yourname/install/chameleon/lib/libcoreblas.a \ - # # -lstarpu-1.2 -Wl,--no-as-needed -lmkl_intel_lp64 \ + # # -lstarpu-1.3 -Wl,--no-as-needed -lmkl_intel_lp64 \ # # -lmkl_sequential -lmkl_core -lpthread -lm -lrt # # #+end_src # # @@ -838,6 +911,6 @@ Finally some packages or also available for [[sec:ug:debian][Debian/Ubuntu]] and # # gfortran main.o -o main \ # # -L/home/yourname/install/chameleon/lib \ # # -lchameleon -lchameleon_starpu -lcoreblas \ - # # -lstarpu-1.2 -Wl,--no-as-needed -lmkl_intel_lp64 \ + # # -lstarpu-1.3 -Wl,--no-as-needed -lmkl_intel_lp64 \ # # -lmkl_sequential -lmkl_core -lpthread -lm -lrt # # #+end_src diff --git a/doc/user/homepage.org b/doc/user/homepage.org index c96129d3795e451d1c2c290d57207f61601c1ee3..d6692404ed9ed87b1f83db8eb1670226a83b86d2 100644 --- a/doc/user/homepage.org +++ b/doc/user/homepage.org @@ -138,7 +138,7 @@ wget https://gitlab.inria.fr/solverstack/chameleon/uploads/b299d6037d7636c6be16108c89bc2aab/chameleon-1.1.0.tar.gz tar xvf chameleon-1.1.0.tar.gz cd chameleon-1.1.0 - # or clone from git repository + # or clone the master branch from the git repository to get the last version # git clone --recursive https://gitlab.inria.fr/solverstack/chameleon.git && cd chameleon mkdir build && cd build cmake .. -DCHAMELEON_USE_MPI=ON -DBUILD_SHARED_LIBS=ON -DCMAKE_INSTALL_PREFIX=$PWD/install @@ -175,9 +175,9 @@ #+begin_src sh :eval never-export # install last starpu release cd $HOME - wget https://files.inria.fr/starpu/starpu-1.3.8/starpu-1.3.8.tar.gz - tar xvf starpu-1.3.8.tar.gz - cd starpu-1.3.8 + wget https://files.inria.fr/starpu/starpu-1.3.10/starpu-1.3.10.tar.gz + tar xvf starpu-1.3.10.tar.gz + cd starpu-1.3.10 ./configure make -j5 sudo make install @@ -201,9 +201,10 @@ Visit the [[https://gitlab.inria.fr/solverstack/chameleon/-/packages][packages]] page and download the appropriate file for your system. Then in a shell terminal #+begin_src sh :eval never-export - # to install one of our non offical package, for example on Ubuntu 20.04 - curl https://gitlab.inria.fr/solverstack/chameleon/-/package_files/15259/download -o chameleon_1.1.0-1_amd64.deb + # to install one of our non offical package, for example on Ubuntu 22.04 + wget https://gitlab.inria.fr/api/v4/projects/616/packages/generic/ubuntu_22.04/1.1.0/chameleon_1.1.0-1_amd64.deb sudo apt-get install -y ./chameleon_1.1.0-1_amd64.deb + mpiexec -n 2 chameleon_dtesting -o potrf -t 2 -n 3200 --nowarmup #+end_src If there are no package available for your Debian/Ubuntu distribution please [[sec:contact][contact us]] and we will try to provide one. @@ -229,13 +230,19 @@ :CUSTOM_ID: quickstart-install-guix :END: [[https://guix.gnu.org/][Guix]] requires a running GNU/Linux system, GNU tar and Xz. + Follow the [[https://guix.gnu.org/manual/en/html_node/Binary-Installation.html#Binary-Installation][installation instructions]] #+begin_src sh :eval never-export - gpg --keyserver pgp.mit.edu --recv-keys 3CE464558A84FDC69DB40CFB090B11993D9AEBB5 + cd /tmp wget https://git.savannah.gnu.org/cgit/guix.git/plain/etc/guix-install.sh chmod +x guix-install.sh sudo ./guix-install.sh #+end_src + or on Debian + #+begin_src sh :eval never-export + sudo apt install guix + #+end_src + Guix packages are stored in our [[https://gitlab.inria.fr/guix-hpc/guix-hpc][guix-hpc]], and [[https://gitlab.inria.fr/guix-hpc/guix-hpc-non-free][guix-hpc-non-free]] (for versions with Intel MKL and/or CUDA) git repositories. Please refer to the README to see how to add our package to the list of @@ -268,9 +275,8 @@ :PROPERTIES: :CUSTOM_ID: quickstart-install-spack :END: - Spack packages for Linux or macOS are stored in our [[https://gitlab.inria.fr/solverstack/spack-repo][spack-repo]] git - repository. Please refer to the [[https://gitlab.inria.fr/solverstack/spack-repo/-/blob/master/README.org][README]] for installation - instructions. + We provide a Chameleon [[https://github.com/spack/spack][Spack]] package (with StarPU) for Linux or macOS. + Please refer to the [[https://spack.readthedocs.io/en/latest/][documentation]] for installation instructions. Examples: #+begin_src sh :eval never-export diff --git a/example/link_chameleon/CMakeLists.txt b/example/link_chameleon/CMakeLists.txt index d56368d31d1bb9744e95e7a27a534ff4686d4674..dc282bc3b2f3db3a1369a0e560d203f133a82735 100644 --- a/example/link_chameleon/CMakeLists.txt +++ b/example/link_chameleon/CMakeLists.txt @@ -28,10 +28,10 @@ project(LINK_CHAMELEON Fortran C CXX) find_package(CHAMELEON) add_executable(link_chameleon_c link_chameleon.c) -target_link_libraries(link_chameleon_c PRIVATE MORSE::CHAMELEON) +target_link_libraries(link_chameleon_c PRIVATE CHAMELEON::chameleon) add_executable(link_chameleon_f link_chameleon.f90) -target_link_libraries(link_chameleon_f PRIVATE MORSE::CHAMELEON) +target_link_libraries(link_chameleon_f PRIVATE CHAMELEON::chameleon) ### ### END CMakeLists.txt ### diff --git a/example/link_chameleon/README.org b/example/link_chameleon/README.org index 0ce8ba13b100e82865b393646444555fe67c2a78..743f378df791a83fc5d9ab8d42bab42f9ec8853b 100644 --- a/example/link_chameleon/README.org +++ b/example/link_chameleon/README.org @@ -18,7 +18,7 @@ cmake .. -DCMAKE_INSTALL_PREFIX=$CHAMELEON_ROOT && make -j5 install # installed under <prefix>/lib/cmake/chameleon/ by setting your # CMAKE_PREFIX_PATH with the path of installation. In your cmake project, use # find_package(CHAMELEON) and link your libraries and/or executables with the -# library target MORSE::CHAMELEON +# library target CHAMELEON::chameleon cmake . -DCMAKE_PREFIX_PATH=$CHAMELEON_ROOT # if your work outside of cmake you can use the pkg-config file provided export PKG_CONFIG_PATH=$CHAMELEON_ROOT/lib/pkgconfig:$PKG_CONFIG_PATH diff --git a/tools/bench/plafrim/parameters/bora/parameters.xml b/tools/bench/plafrim/parameters/bora/parameters.xml index 8ad5c261e341a365b3903592bf37d89a07fbfb35..67e444eb8352ca62246ebfc04bb4c2ea6399475f 100644 --- a/tools/bench/plafrim/parameters/bora/parameters.xml +++ b/tools/bench/plafrim/parameters/bora/parameters.xml @@ -15,7 +15,7 @@ <parameter name="m" mode="python" type="int" >[${nmpi}*${b}, ${nmpi}*2*${b}, ${nmpi}*4*${b}, ${nmpi}*8*${b}, ${nmpi}*16*${b}, ${nmpi}*32*${b}, ${nmpi}*48*${b}][$i_mn]</parameter> <parameter name="k" mode="python" type="int" >${m}</parameter> <parameter name="n" mode="python" type="int" >${m}</parameter> - <parameter name="command" type="string">mpiexec $MPI_OPTIONS -np $nmpi $CHAMELEON_BUILD/testing/chameleon_${precision}testing -o ${algorithm} -P $p -t $nthr -g $ngpu -m $m -n $n -k $k -b $b</parameter> + <parameter name="command" type="string">mpiexec -np $nmpi $MPI_OPTIONS $CHAMELEON_BUILD/testing/chameleon_${precision}testing -o ${algorithm} -P $p -t $nthr -g $ngpu -m $m -n $n -k $k -b $b</parameter> </parameterset> <parameterset name="param_potrf"> <parameter name="hostname" type="string">bora</parameter> @@ -32,7 +32,7 @@ <parameter name="m" mode="python" type="int" >[${nmpi}*${b}, ${nmpi}*2*${b}, ${nmpi}*4*${b}, ${nmpi}*8*${b}, ${nmpi}*16*${b}, ${nmpi}*32*${b}, ${nmpi}*48*${b}][$i_mn]</parameter> <parameter name="n" mode="python" type="int" >${m}</parameter> <parameter name="k" type="int" >1</parameter> - <parameter name="command" type="string">mpiexec $MPI_OPTIONS -np $nmpi $CHAMELEON_BUILD/testing/chameleon_${precision}testing -o ${algorithm} -P $p -t $nthr -g $ngpu -m $m -n $n -k $k -b $b</parameter> + <parameter name="command" type="string">mpiexec -np $nmpi $MPI_OPTIONS $CHAMELEON_BUILD/testing/chameleon_${precision}testing -o ${algorithm} -P $p -t $nthr -g $ngpu -m $m -n $n -k $k -b $b</parameter> </parameterset> <parameterset name="param_geqrf"> <parameter name="hostname" type="string">bora</parameter> @@ -49,6 +49,6 @@ <parameter name="m" mode="python" type="int" >[${nmpi}*${b}, ${nmpi}*2*${b}, ${nmpi}*4*${b}, ${nmpi}*8*${b}, ${nmpi}*16*${b}, ${nmpi}*32*${b}, ${nmpi}*48*${b}][$i_mn]</parameter> <parameter name="n" mode="python" type="int" >${m}</parameter> <parameter name="k" type="int" >1</parameter> - <parameter name="command" type="string">mpiexec $MPI_OPTIONS -np $nmpi $CHAMELEON_BUILD/testing/chameleon_${precision}testing -o ${algorithm} -P $p -t $nthr -g $ngpu -m $m -n $n -k $k -b $b</parameter> + <parameter name="command" type="string">mpiexec -np $nmpi $MPI_OPTIONS $CHAMELEON_BUILD/testing/chameleon_${precision}testing -o ${algorithm} -P $p -t $nthr -g $ngpu -m $m -n $n -k $k -b $b</parameter> </parameterset> </jube> diff --git a/tools/bench/plafrim/parameters/sirocco/parameters.xml b/tools/bench/plafrim/parameters/sirocco/parameters.xml index 3f04ebc617f0a3fd73114f38fcc9caf1efa00d0c..23d63e53cf6f7170d49b038e79a8fc1f67f6da36 100644 --- a/tools/bench/plafrim/parameters/sirocco/parameters.xml +++ b/tools/bench/plafrim/parameters/sirocco/parameters.xml @@ -15,7 +15,7 @@ <parameter name="m" mode="python" type="int" >[${nmpi}*${b}, ${nmpi}*2*${b}, ${nmpi}*4*${b}, ${nmpi}*8*${b}, ${nmpi}*16*${b}, ${nmpi}*32*${b}][$i_mn]</parameter> <parameter name="k" mode="python" type="int" >[${nmpi}*${b}, ${nmpi}*2*${b}, ${nmpi}*4*${b}, ${nmpi}*8*${b}, ${nmpi}*16*${b}, ${nmpi}*32*${b}][$i_mn]</parameter> <parameter name="n" mode="python" type="int" >[${nmpi}*${b}, ${nmpi}*2*${b}, ${nmpi}*4*${b}, ${nmpi}*8*${b}, ${nmpi}*16*${b}, ${nmpi}*32*${b}][$i_mn]</parameter> - <parameter name="command" type="string">mpiexec $MPI_OPTIONS -np $nmpi $CHAMELEON_BUILD/testing/chameleon_${precision}testing -o ${algorithm} -P $p -t $nthr -g $ngpu -m $m -n $n -k $k -b $b</parameter> + <parameter name="command" type="string">mpiexec -np $nmpi $MPI_OPTIONS $CHAMELEON_BUILD/testing/chameleon_${precision}testing -o ${algorithm} -P $p -t $nthr -g $ngpu -m $m -n $n -k $k -b $b</parameter> </parameterset> <parameterset name="param_potrf"> <parameter name="hostname" type="string">sirocco</parameter> @@ -32,7 +32,7 @@ <parameter name="m" mode="python" type="int" >[${nmpi}*${b}, ${nmpi}*2*${b}, ${nmpi}*4*${b}, ${nmpi}*8*${b}, ${nmpi}*16*${b}, ${nmpi}*32*${b}][$i_mn]</parameter> <parameter name="n" mode="python" type="int" >${m}</parameter> <parameter name="k" type="int" >1</parameter> - <parameter name="command" type="string">mpiexec $MPI_OPTIONS -np $nmpi $CHAMELEON_BUILD/testing/chameleon_${precision}testing -o ${algorithm} -P $p -t $nthr -g $ngpu -m $m -n $n -k $k -b $b</parameter> + <parameter name="command" type="string">mpiexec -np $nmpi $MPI_OPTIONS $CHAMELEON_BUILD/testing/chameleon_${precision}testing -o ${algorithm} -P $p -t $nthr -g $ngpu -m $m -n $n -k $k -b $b</parameter> </parameterset> <parameterset name="param_geqrf"> <parameter name="hostname" type="string">sirocco</parameter> @@ -49,6 +49,6 @@ <parameter name="m" mode="python" type="int" >[${nmpi}*${b}, ${nmpi}*2*${b}, ${nmpi}*4*${b}, ${nmpi}*8*${b}, ${nmpi}*16*${b}, ${nmpi}*32*${b}][$i_mn]</parameter> <parameter name="n" mode="python" type="int" >${m}</parameter> <parameter name="k" type="int" >1</parameter> - <parameter name="command" type="string">mpiexec $MPI_OPTIONS -np $nmpi $CHAMELEON_BUILD/testing/chameleon_${precision}testing -o ${algorithm} -P $p -t $nthr -g $ngpu -m $m -n $n -k $k -b $b</parameter> + <parameter name="command" type="string">mpiexec -np $nmpi $MPI_OPTIONS $CHAMELEON_BUILD/testing/chameleon_${precision}testing -o ${algorithm} -P $p -t $nthr -g $ngpu -m $m -n $n -k $k -b $b</parameter> </parameterset> </jube> diff --git a/tools/bench/plafrim/run.sh b/tools/bench/plafrim/run.sh index 567a8cfad36cb03b7be7e118be44d713c2f98eb7..55ca0278540885f5434ecb0c62634dbdc3bbb1b6 100755 --- a/tools/bench/plafrim/run.sh +++ b/tools/bench/plafrim/run.sh @@ -34,7 +34,7 @@ then export SLURM_CONSTRAINTS="sirocco,omnipath,v100" export CHAMELEON_BUILD_OPTIONS="-DCHAMELEON_USE_MPI=ON -DCHAMELEON_USE_CUDA=ON -DCMAKE_BUILD_TYPE=Release" export STARPU_HOSTNAME="sirocco" - export LD_PRELOAD="/usr/lib64/libcuda.so /usr/lib64/libnvidia-fatbinaryloader.so.440.33.01" + export LD_PRELOAD="/usr/lib64/libcuda.so" else echo "$0: Please set the NODE environnement variable to bora or sirocco." exit -1 @@ -49,22 +49,19 @@ fi export MPI_OPTIONS="" if [ $MPI = "openmpi" ] then - if [ $NODE = "bora" ] - then - export MPI_OPTIONS="--map-by ppr:1:node:pe=36" - fi + export MPI_OPTIONS="--bind-to board" GUIX_ENV_MPI="" GUIX_ADHOC_MPI="openssh openmpi" elif [ $MPI = "nmad" ] then - export MPI_OPTIONS="-DPIOM_DEDICATED=1 -DPIOM_DEDICATED_WAIT=1" - GUIX_ENV_MPI="--with-input=openmpi=nmad --with-branch=starpu=starpu-1.3" + export MPI_OPTIONS="-DPIOM_DEDICATED=1 -DPIOM_DEDICATED_WAIT=1 hwloc-bind --cpubind machine:0" + GUIX_ENV_MPI="--with-input=openmpi=nmad" GUIX_ADHOC_MPI="which gzip zlib tar inetutils util-linux procps openssh nmad" else echo "$0: Please set the MPI environnement variable to openmpi or nmad." exit -1 fi -GUIX_ADHOC="coreutils gawk grep jube perl python python-click python-certifi python-elasticsearch python-gitpython python-matplotlib python-pandas python-seaborn r-ggplot2 r-plyr r-reshape2 sed slurm mkl" +GUIX_ADHOC="coreutils gawk grep hwloc jube perl python python-click python-certifi python-elasticsearch python-gitpython python-matplotlib python-pandas python-seaborn r-ggplot2 r-plyr r-reshape2 sed slurm mkl@2019.1.144" GUIX_RULE="-D $GUIX_ENV $GUIX_ENV_MPI $GUIX_ADHOC $GUIX_ADHOC_MPI" # Submit jobs