Mentions légales du service

Skip to content
Snippets Groups Projects
runtime_profiling.c 4.21 KiB
/**
 *
 * @file starpu/runtime_profiling.c
 *
 * @copyright 2009-2014 The University of Tennessee and The University of
 *                      Tennessee Research Foundation. All rights reserved.
 * @copyright 2012-2023 Bordeaux INP, CNRS (LaBRI UMR 5800), Inria,
 *                      Univ. Bordeaux. All rights reserved.
 *
 ***
 *
 * @brief Chameleon StarPU profiling routines
 *
 * @version 1.2.0
 * @author Cedric Augonnet
 * @author Mathieu Faverge
 * @author Cedric Castagnede
 * @author Florent Pruvost
 * @author Samuel Thibault
 * @date 2022-02-22
 *
 */
#include "chameleon_starpu.h"
#include <math.h>
#if defined(STARPU_USE_FXT)
#include <starpu_fxt.h>
#endif

#ifdef CHAMELEON_ENABLE_PRUNING_STATS
unsigned long RUNTIME_total_tasks   = 0;
unsigned long RUNTIME_exec_tasks    = 0;
unsigned long RUNTIME_comm_tasks    = 0;
unsigned long RUNTIME_changed_tasks = 0;
#endif

double RUNTIME_get_time(){
    return starpu_timing_now()*1e-6;
}

/**
 *  Set iteration numbers for traces
 */
void RUNTIME_iteration_push( CHAM_context_t *chamctxt, unsigned long iteration )
{
    (void)chamctxt;
#if defined(HAVE_STARPU_ITERATION_PUSH)
    starpu_iteration_push(iteration);
#endif
    (void)iteration;
}

void RUNTIME_iteration_pop( CHAM_context_t *chamctxt )
{
    (void)chamctxt;
#if defined(HAVE_STARPU_ITERATION_PUSH)
    starpu_iteration_pop();
#endif
}

void RUNTIME_start_profiling(){
#if defined(STARPU_USE_FXT)
    starpu_fxt_start_profiling();
#endif
}

void RUNTIME_stop_profiling(){
#if defined(STARPU_USE_FXT)
    starpu_fxt_stop_profiling();
#endif
}

void RUNTIME_start_stats(){
#ifdef CHAMELEON_ENABLE_PRUNING_STATS
    RUNTIME_total_tasks = 0;
    RUNTIME_exec_tasks = 0;
    RUNTIME_comm_tasks = 0;
    RUNTIME_changed_tasks = 0;
#endif
}

void RUNTIME_stop_stats(){
#ifdef CHAMELEON_ENABLE_PRUNING_STATS
    fprintf( stderr, "\ntasks: %lu = exec: %lu + comm: %lu + changed: %lu\n",
             RUNTIME_total_tasks, RUNTIME_exec_tasks, RUNTIME_comm_tasks, RUNTIME_changed_tasks );
#endif
}

void RUNTIME_profiling_display_info(const char *kernel_name, measure_t perf[STARPU_NMAXWORKERS])
{
    int header = 1;
    unsigned worker;
    for (worker = 0; worker < starpu_worker_get_count(); worker++)
    {
        if (perf[worker].n > 0)
        {
            if ( header ) {
                fprintf(stderr, "Performance for kernel %s\n", kernel_name);
                header = 0;
            }
            char workername[128];
            starpu_worker_get_name(worker, workername, 128);

            long   n    = perf[worker].n;
            double sum  = perf[worker].sum;
            double sum2 = perf[worker].sum2;

            double avg = sum / n;
            double sd  = sqrt((sum2 - (sum*sum)/n)/n);

            fprintf(stderr, "\t%s\t%.2lf\t%.2lf\t%ld\n", workername, avg, sd, n);
        }
    }
}

void RUNTIME_profiling_display_efficiency(void)
{
    fprintf(stderr, "Efficiency\n");

    double max_total_time = 0.0;
    unsigned worker;

    for (worker = 0; worker < starpu_worker_get_count(); worker++)
    {
        char workername[128];
        starpu_worker_get_name(worker, workername, 128);

        struct starpu_profiling_worker_info info;
        starpu_profiling_worker_get_info(worker, &info);

        double executing_time = starpu_timing_timespec_to_us(&info.executing_time);
        double total_time = starpu_timing_timespec_to_us(&info.total_time);

        max_total_time = (total_time > max_total_time)?total_time:max_total_time;

        float overhead = 100.0 - (100.0*executing_time/total_time);
        fprintf(stderr, "\t%s\ttotal %.2lf s\texec %.2lf s\toverhead %.2lf%%\n",
                workername, total_time*1e-6, executing_time*1e-6, overhead);
    }

    fprintf(stderr, "Total execution time: %.2lf us\n", max_total_time);
}

void RUNTIME_schedprofile_display(void)
{
    fprintf(stderr, "\n");
    RUNTIME_profiling_display_efficiency();

    /* Display bus consumption */
    starpu_profiling_bus_helper_display_summary();
}

void RUNTIME_kernelprofile_display(void)
{
#if defined(PRECISION_z)
    RUNTIME_zdisplay_allprofile();
#endif
#if defined(PRECISION_c)
    RUNTIME_cdisplay_allprofile();
#endif
#if defined(PRECISION_d)
    RUNTIME_ddisplay_allprofile();
#endif
#if defined(PRECISION_s)
    RUNTIME_sdisplay_allprofile();
#endif
}