From 15d3d3c7e1506bc0332ab87aced86a8690372cc6 Mon Sep 17 00:00:00 2001
From: Mathieu Faverge <mathieu.faverge@inria.fr>
Date: Tue, 13 Oct 2020 18:52:44 +0200
Subject: [PATCH] Add the forcegpu option to enforce possible kernels on the
 GPU

---
 include/chameleon/runtime_struct.h |  6 ++++++
 testing/chameleon_ztesting.c       | 15 ++++++++++++++-
 2 files changed, 20 insertions(+), 1 deletion(-)

diff --git a/include/chameleon/runtime_struct.h b/include/chameleon/runtime_struct.h
index 96a8c5cb7..fa3fc31f5 100644
--- a/include/chameleon/runtime_struct.h
+++ b/include/chameleon/runtime_struct.h
@@ -33,6 +33,12 @@ typedef enum runtime_id_e {
     RUNTIME_SCHED_OPENMP, /**< OpenMP runtime */
 } RUNTIME_id_t;
 
+/**
+ * @brief Ids of the worker type
+ */
+#define RUNTIME_CPU  ((1ULL)<<1)
+#define RUNTIME_CUDA ((1ULL)<<3)
+
 /**
  * @brief RUNTIME request structure
  *
diff --git a/testing/chameleon_ztesting.c b/testing/chameleon_ztesting.c
index e535b6ff7..2ae0e946d 100644
--- a/testing/chameleon_ztesting.c
+++ b/testing/chameleon_ztesting.c
@@ -42,6 +42,7 @@ static parameter_t parameters[] = {
     { "nowarmup", "Disable the warmup run to load libraries", -31, PARAM_OPTION, 0, 0, TestValInt, {0}, NULL, pread_int, sprint_int },
     { "mtxfmt",   "Change the way the matrix is stored (0: global, 1: tiles, 2: OOC)", -32, PARAM_OPTION | PARAM_INPUT | PARAM_OUTPUT, 1, 6, TestValInt, {0}, NULL, pread_int, sprint_int },
     { "profile",  "Display the kernel profiling",             -33, PARAM_OPTION, 0, 0, TestValInt, {0}, NULL, pread_int, sprint_int },
+    { "forcegpu", "Force kernels on GPU",                     -34, PARAM_OPTION, 0, 0, TestValInt, {0}, NULL, pread_int, sprint_int },
 
     { NULL, "Machine parameters", 0, PARAM_OPTION, 0, 0, 0, {0}, NULL, NULL, NULL },
     { "threads", "Number of CPU workers per node",      't', PARAM_OPTION | PARAM_OUTPUT, 1, 7, TestValInt, {-1}, NULL, pread_int, sprint_int },
@@ -490,7 +491,7 @@ parameters_destroy()
 int main (int argc, char **argv) {
 
     int ncores, ngpus, human, check, i, niter;
-    int trace, nowarmup, profile;
+    int trace, nowarmup, profile, forcegpu;
     int rc, info = 0;
     int run_id = 0;
     char *func_name;
@@ -515,6 +516,7 @@ int main (int argc, char **argv) {
     trace     = parameters_getvalue_int( "trace"    );
     nowarmup  = parameters_getvalue_int( "nowarmup" );
     profile   = parameters_getvalue_int( "profile" );
+    forcegpu  = parameters_getvalue_int( "forcegpu" );
 
     CHAMELEON_Init( ncores, ngpus );
 
@@ -536,6 +538,17 @@ int main (int argc, char **argv) {
     run_print_header( test, check, human );
     run = runlist->head;
 
+    /* Force all possible kernels on GPU */
+    if ( forcegpu ) {
+        if ( ngpus == 0 ) {
+            fprintf( stderr,
+                     "--forcegpu can't be enable without GPU (-g 0).\n"
+                     "  Please specify a larger number of GPU or disable this option\n" );
+            return EXIT_FAILURE;
+        }
+        RUNTIME_zlocality_allrestrict( RUNTIME_CUDA );
+    }
+
     /* Warmup */
     if ( !nowarmup ) {
         run_arg_list_t copy = run_arg_list_copy( &(run->args) );
-- 
GitLab