Mentions légales du service

Skip to content
Snippets Groups Projects
Commit a1b13c50 authored by Mathieu Faverge's avatar Mathieu Faverge
Browse files

Merge branch 'calibration' into 'master'

Recalibrate potrf with magma support enabled

See merge request !26
parents 98b2191f 929cffd7
No related branches found
No related tags found
1 merge request!26Recalibrate potrf with magma support enabled
Pipeline #
...@@ -5,7 +5,143 @@ ...@@ -5,7 +5,143 @@
#################### ####################
# COMBs # COMBs
# number of combinations # number of combinations
5
####################
# COMB_1
# number of types devices
1
####################
# DEV_0
# device type (CPU - 0, CUDA - 1, OPENCL - 2, MIC - 3, SCC - 4)
1
####################
# DEV_0
# device id
0
####################
# DEV_0
# number of cores
1
##########
# number of implementations
1
#####
# Model for cuda0_impl0 (Comb1)
# number of entries
5
# sumlnx sumlnx2 sumlny sumlnxlny alpha beta n minx maxx
0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 nan nan 0 0 0
# a b c
nan nan nan
# hash size flops mean (us) dev (us) sum sum2 n
25ebb669 16588800 0.000000e+00 1.927652e+04 3.502107e+03 9.059964e+05 1.804090e+10 47
617e5fe6 7372800 0.000000e+00 1.229853e+04 1.768810e+03 6.149267e+05 7.719131e+09 50
ad30af9b 51200 0.000000e+00 2.101636e+03 2.756395e+02 1.303014e+05 2.785568e+08 62
982013a8 1548800 0.000000e+00 4.903930e+03 3.193701e+02 2.550044e+05 1.255828e+09 52
5104f3b7 29491200 0.000000e+00 2.463348e+04 2.985247e+03 1.576542e+06 3.940607e+10 64
####################
# COMB_2
# number of types devices
1
####################
# DEV_0
# device type (CPU - 0, CUDA - 1, OPENCL - 2, MIC - 3, SCC - 4)
1
####################
# DEV_0
# device id
2
####################
# DEV_0
# number of cores
1
##########
# number of implementations
1
#####
# Model for cuda2_impl0 (Comb2)
# number of entries
5
# sumlnx sumlnx2 sumlny sumlnxlny alpha beta n minx maxx
0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 nan nan 0 0 0
# a b c
nan nan nan
# hash size flops mean (us) dev (us) sum sum2 n
25ebb669 16588800 0.000000e+00 1.940135e+04 4.068762e+03 6.984485e+05 1.414682e+10 36
617e5fe6 7372800 0.000000e+00 1.194505e+04 1.978674e+03 3.822416e+05 4.691180e+09 32
ad30af9b 51200 0.000000e+00 2.114340e+03 2.957222e+02 1.268604e+05 2.734732e+08 60
982013a8 1548800 0.000000e+00 5.046035e+03 5.465455e+02 1.766112e+05 9.016412e+08 35
5104f3b7 29491200 0.000000e+00 2.329330e+04 2.356823e+03 1.094785e+06 2.576222e+10 47
####################
# COMB_3
# number of types devices
1
####################
# DEV_0
# device type (CPU - 0, CUDA - 1, OPENCL - 2, MIC - 3, SCC - 4)
1
####################
# DEV_0
# device id
3
####################
# DEV_0
# number of cores
1 1
##########
# number of implementations
1
#####
# Model for cuda3_impl0 (Comb3)
# number of entries
5
# sumlnx sumlnx2 sumlny sumlnxlny alpha beta n minx maxx
0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 nan nan 0 0 0
# a b c
nan nan nan
# hash size flops mean (us) dev (us) sum sum2 n
25ebb669 16588800 0.000000e+00 1.848606e+04 2.220768e+03 5.545817e+05 1.039998e+10 30
617e5fe6 7372800 0.000000e+00 1.174012e+04 1.793250e+03 3.991641e+05 4.795570e+09 34
ad30af9b 51200 0.000000e+00 2.130842e+03 3.337398e+02 1.576823e+05 3.442383e+08 74
982013a8 1548800 0.000000e+00 5.078755e+03 5.140761e+02 2.437802e+05 1.250785e+09 48
5104f3b7 29491200 0.000000e+00 2.451908e+04 3.131104e+03 5.884580e+05 1.466374e+10 24
####################
# COMB_0
# number of types devices
1
####################
# DEV_0
# device type (CPU - 0, CUDA - 1, OPENCL - 2, MIC - 3, SCC - 4)
1
####################
# DEV_0
# device id
1
####################
# DEV_0
# number of cores
1
##########
# number of implementations
1
#####
# Model for cuda1_impl0 (Comb0)
# number of entries
5
# sumlnx sumlnx2 sumlny sumlnxlny alpha beta n minx maxx
0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 nan nan 0 0 0
# a b c
nan nan nan
# hash size flops mean (us) dev (us) sum sum2 n
25ebb669 16588800 0.000000e+00 1.807832e+04 2.125912e+03 7.412111e+05 1.358515e+10 41
ad30af9b 51200 0.000000e+00 2.127387e+03 2.904710e+02 1.404075e+05 3.042697e+08 66
617e5fe6 7372800 0.000000e+00 1.177248e+04 1.259016e+03 4.002642e+05 4.765995e+09 34
982013a8 1548800 0.000000e+00 4.993474e+03 5.010162e+02 2.546672e+05 1.284476e+09 51
5104f3b7 29491200 0.000000e+00 2.412058e+04 2.891586e+03 1.206029e+06 2.950819e+10 50
#################### ####################
# COMB_4 # COMB_4
# number of types devices # number of types devices
...@@ -34,9 +170,9 @@ ...@@ -34,9 +170,9 @@
# a b c # a b c
nan nan nan nan nan nan
# hash size flops mean (us) dev (us) sum sum2 n # hash size flops mean (us) dev (us) sum sum2 n
617e5fe6 7372800 0.000000e+00 1.199994e+04 1.417119e+03 2.051989e+06 2.496714e+10 171 25ebb669 16588800 0.000000e+00 3.521786e+04 3.719259e+03 2.183508e+06 7.775611e+10 62
ad30af9b 51200 0.000000e+00 4.029498e+01 7.344934e+00 1.938188e+04 8.069416e+05 481 982013a8 1548800 0.000000e+00 1.965233e+03 3.623952e+02 7.271360e+04 1.477584e+08 37
982013a8 1548800 0.000000e+00 1.778398e+03 2.306933e+02 5.015082e+05 9.068890e+08 282 617e5fe6 7372800 0.000000e+00 1.125962e+04 1.634952e+03 5.855000e+05 6.731505e+09 52
25ebb669 16588800 0.000000e+00 3.651073e+04 5.293321e+03 4.308266e+06 1.606042e+11 118 ad30af9b 51200 0.000000e+00 4.077398e+01 4.776338e+00 2.487213e+03 1.028052e+05 61
5104f3b7 29491200 0.000000e+00 8.248482e+04 9.428391e+03 9.403269e+06 7.857610e+11 114 5104f3b7 29491200 0.000000e+00 7.956441e+04 8.548094e+03 5.410380e+06 4.354424e+11 68
...@@ -5,7 +5,143 @@ ...@@ -5,7 +5,143 @@
#################### ####################
# COMBs # COMBs
# number of combinations # number of combinations
5
####################
# COMB_0
# number of types devices
1
####################
# DEV_0
# device type (CPU - 0, CUDA - 1, OPENCL - 2, MIC - 3, SCC - 4)
1
####################
# DEV_0
# device id
0
####################
# DEV_0
# number of cores
1
##########
# number of implementations
1
#####
# Model for cuda0_impl0 (Comb0)
# number of entries
5
# sumlnx sumlnx2 sumlny sumlnxlny alpha beta n minx maxx
0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 nan nan 0 0 0
# a b c
nan nan nan
# hash size flops mean (us) dev (us) sum sum2 n
5104f3b7 14745600 0.000000e+00 1.725922e+04 2.264939e+03 1.052812e+06 1.848364e+10 61
25ebb669 8294400 0.000000e+00 1.618055e+04 2.196987e+03 7.766664e+05 1.279857e+10 48
982013a8 774400 0.000000e+00 3.928085e+03 4.967651e+02 1.414111e+05 5.643587e+08 36
ad30af9b 25600 0.000000e+00 2.070017e+03 2.556262e+02 1.283410e+05 2.697195e+08 62
617e5fe6 3686400 0.000000e+00 9.570246e+03 1.453408e+03 5.263635e+05 5.153611e+09 55
####################
# COMB_2
# number of types devices
1
####################
# DEV_0
# device type (CPU - 0, CUDA - 1, OPENCL - 2, MIC - 3, SCC - 4)
1
####################
# DEV_0
# device id
1
####################
# DEV_0
# number of cores
1
##########
# number of implementations
1
#####
# Model for cuda1_impl0 (Comb2)
# number of entries
5
# sumlnx sumlnx2 sumlny sumlnxlny alpha beta n minx maxx
0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 nan nan 0 0 0
# a b c
nan nan nan
# hash size flops mean (us) dev (us) sum sum2 n
5104f3b7 14745600 0.000000e+00 1.689494e+04 1.439976e+03 1.081276e+06 1.840081e+10 64
25ebb669 8294400 0.000000e+00 1.549399e+04 1.742327e+03 8.211813e+05 1.288426e+10 53
982013a8 774400 0.000000e+00 3.925510e+03 5.372277e+02 1.334673e+05 5.337401e+08 34
ad30af9b 25600 0.000000e+00 2.102179e+03 3.123586e+02 1.303351e+05 2.800370e+08 62
617e5fe6 3686400 0.000000e+00 9.539420e+03 1.257811e+03 4.292739e+05 4.166218e+09 45
####################
# COMB_3
# number of types devices
1
####################
# DEV_0
# device type (CPU - 0, CUDA - 1, OPENCL - 2, MIC - 3, SCC - 4)
1 1
####################
# DEV_0
# device id
3
####################
# DEV_0
# number of cores
1
##########
# number of implementations
1
#####
# Model for cuda3_impl0 (Comb3)
# number of entries
5
# sumlnx sumlnx2 sumlny sumlnxlny alpha beta n minx maxx
0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 nan nan 0 0 0
# a b c
nan nan nan
# hash size flops mean (us) dev (us) sum sum2 n
5104f3b7 14745600 0.000000e+00 1.679050e+04 1.864821e+03 5.037149e+05 8.561949e+09 30
25ebb669 8294400 0.000000e+00 1.650986e+04 2.615948e+03 4.457661e+05 7.544300e+09 27
982013a8 774400 0.000000e+00 4.072426e+03 6.492225e+02 1.384625e+05 5.782087e+08 34
ad30af9b 25600 0.000000e+00 2.106632e+03 2.976700e+02 1.390377e+05 2.987493e+08 66
617e5fe6 3686400 0.000000e+00 9.596093e+03 1.252122e+03 2.686906e+05 2.622279e+09 28
####################
# COMB_1
# number of types devices
1
####################
# DEV_0
# device type (CPU - 0, CUDA - 1, OPENCL - 2, MIC - 3, SCC - 4)
1
####################
# DEV_0
# device id
2
####################
# DEV_0
# number of cores
1
##########
# number of implementations
1
#####
# Model for cuda2_impl0 (Comb1)
# number of entries
5
# sumlnx sumlnx2 sumlny sumlnxlny alpha beta n minx maxx
0.000000e+00 0.000000e+00 0.000000e+00 0.000000e+00 nan nan 0 0 0
# a b c
nan nan nan
# hash size flops mean (us) dev (us) sum sum2 n
5104f3b7 14745600 0.000000e+00 1.640619e+04 1.490045e+03 6.398413e+05 1.058394e+10 39
25ebb669 8294400 0.000000e+00 1.538862e+04 2.385658e+03 6.155449e+05 9.700043e+09 40
982013a8 774400 0.000000e+00 4.069845e+03 5.836273e+02 1.627938e+05 6.761704e+08 40
ad30af9b 25600 0.000000e+00 2.134159e+03 2.682985e+02 1.323178e+05 2.868503e+08 62
617e5fe6 3686400 0.000000e+00 9.181625e+03 8.594056e+02 3.580834e+05 3.316592e+09 39
#################### ####################
# COMB_4 # COMB_4
# number of types devices # number of types devices
...@@ -34,9 +170,9 @@ ...@@ -34,9 +170,9 @@
# a b c # a b c
nan nan nan nan nan nan
# hash size flops mean (us) dev (us) sum sum2 n # hash size flops mean (us) dev (us) sum sum2 n
5104f3b7 14745600 0.000000e+00 4.483079e+04 5.635100e+03 1.026625e+07 4.675159e+11 229 5104f3b7 14745600 0.000000e+00 4.292375e+04 3.070461e+03 2.704196e+06 1.166682e+11 63
25ebb669 8294400 0.000000e+00 1.993450e+04 2.800795e+03 3.109782e+06 6.321569e+10 156 25ebb669 8294400 0.000000e+00 1.889580e+04 1.888554e+03 1.473872e+06 2.812818e+10 78
617e5fe6 3686400 0.000000e+00 7.511506e+03 7.944975e+02 2.291009e+06 1.740145e+10 305 982013a8 774400 0.000000e+00 1.554382e+03 1.710542e+02 5.595775e+04 8.803307e+07 36
982013a8 774400 0.000000e+00 1.048226e+03 1.196694e+02 2.452850e+05 2.604652e+08 234 ad30af9b 25600 0.000000e+00 7.450665e+01 4.146608e+00 4.097866e+03 3.062640e+05 55
ad30af9b 25600 0.000000e+00 7.425993e+01 7.891218e+00 2.784747e+04 2.091303e+06 375 617e5fe6 3686400 0.000000e+00 6.920145e+03 2.464678e+02 2.214446e+05 1.534373e+09 32
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment