Sfoglia il codice sorgente

Add more measurements

Samuel Thibault 10 anni fa
parent
commit
4b28886ba9

+ 13 - 4
tools/perfmodels/.starpu/sampling/codelets/44/chol_model_11.mirage

@@ -28,13 +28,15 @@
 #####
 # Model for cpu0_impl0 (Comb0)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+cea37d6d	409600         	1.097392e+07   	9.221097e+02   	4.521529e+01   	7.930143e+04   	7.330044e+07   	86
 617e5fe6	3686400        	2.953730e+08   	1.884969e+04   	7.370619e+02   	2.111165e+06   	3.985565e+10   	112
+afdd228b	1638400        	8.758624e+07   	5.940712e+03   	2.434960e+02   	2.376285e+05   	1.414054e+09   	40
 
 ####################
 # COMB_1
@@ -58,13 +60,15 @@ nan            	nan            	nan
 #####
 # Model for cuda0_impl0 (Comb1)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+cea37d6d	409600         	1.097392e+07   	2.918360e+03   	1.924750e+02   	2.918360e+04   	8.553869e+07   	10
 617e5fe6	3686400        	2.953730e+08   	1.239445e+04   	1.620572e+03   	1.363389e+05   	1.718735e+09   	11
+afdd228b	1638400        	8.758624e+07   	5.044027e+03   	9.860073e+02   	6.052832e+04   	3.169730e+08   	12
 
 ####################
 # COMB_2
@@ -88,13 +92,15 @@ nan            	nan            	nan
 #####
 # Model for cuda1_impl0 (Comb2)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+cea37d6d	409600         	1.097392e+07   	3.820396e+03   	6.009552e+02   	3.820396e+04   	1.495658e+08   	10
 617e5fe6	3686400        	2.953730e+08   	4.056348e+04   	1.353308e+03   	4.056348e+05   	1.647228e+10   	10
+afdd228b	1638400        	8.758624e+07   	1.146929e+04   	1.466472e+03   	1.146929e+05   	1.336952e+09   	10
 
 ####################
 # COMB_3
@@ -118,10 +124,13 @@ nan            	nan            	nan
 #####
 # Model for cuda2_impl0 (Comb3)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+cea37d6d	409600         	1.097392e+07   	2.847962e+03   	2.297293e+02   	2.847962e+04   	8.163663e+07   	10
 617e5fe6	3686400        	2.953730e+08   	3.799962e+04   	4.946563e+03   	3.799962e+05   	1.468440e+10   	10
+afdd228b	1638400        	8.758624e+07   	1.204317e+04   	9.253606e+02   	1.204317e+05   	1.458942e+09   	10
+

+ 13 - 5
tools/perfmodels/.starpu/sampling/codelets/44/chol_model_21.mirage

@@ -6,7 +6,6 @@
 # COMBs
 # number of combinations
 4
-
 ####################
 # COMB_0
 # number of types devices
@@ -29,13 +28,15 @@
 #####
 # Model for cpu0_impl0 (Comb0)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+2c1922b7	819200         	3.287040e+07   	1.868713e+03   	9.872163e+01   	2.535843e+06   	4.751987e+09   	1357
 ff82dda0	7372800        	8.856576e+08   	4.564676e+04   	7.031596e+02   	5.687586e+07   	2.596815e+12   	1246
+d39bff17	3276800        	2.625536e+08   	1.417018e+04   	5.255501e+02   	8.232874e+06   	1.168218e+11   	581
 
 ####################
 # COMB_1
@@ -59,13 +60,15 @@ ff82dda0	7372800        	8.856576e+08   	4.564676e+04   	7.031596e+02   	5.68758
 #####
 # Model for cuda0_impl0 (Comb1)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+2c1922b7	819200         	3.287040e+07   	6.829247e+02   	7.632991e+01   	1.420483e+05   	9.822018e+07   	208
 ff82dda0	7372800        	8.856576e+08   	6.393638e+03   	3.362739e+02   	3.650767e+06   	2.340625e+10   	571
+d39bff17	3276800        	2.625536e+08   	2.602204e+03   	1.876810e+02   	6.895839e+05   	1.803772e+09   	265
 
 ####################
 # COMB_2
@@ -89,13 +92,15 @@ ff82dda0	7372800        	8.856576e+08   	6.393638e+03   	3.362739e+02   	3.65076
 #####
 # Model for cuda1_impl0 (Comb2)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+2c1922b7	819200         	3.287040e+07   	6.842707e+02   	6.860830e+01   	1.211159e+05   	8.370922e+07   	177
 ff82dda0	7372800        	8.856576e+08   	6.416842e+03   	2.746569e+02   	2.951747e+06   	1.897560e+10   	460
+d39bff17	3276800        	2.625536e+08   	2.601751e+03   	2.008905e+02   	6.114115e+05   	1.600224e+09   	235
 
 ####################
 # COMB_3
@@ -119,10 +124,13 @@ ff82dda0	7372800        	8.856576e+08   	6.416842e+03   	2.746569e+02   	2.95174
 #####
 # Model for cuda2_impl0 (Comb3)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+2c1922b7	819200         	3.287040e+07   	6.827700e+02   	7.214633e+01   	1.297263e+05   	8.956219e+07   	190
 ff82dda0	7372800        	8.856576e+08   	6.409443e+03   	3.434222e+02   	3.243178e+06   	2.084664e+10   	506
+d39bff17	3276800        	2.625536e+08   	2.604891e+03   	2.068197e+02   	6.069396e+05   	1.590978e+09   	233
+

+ 13 - 5
tools/perfmodels/.starpu/sampling/codelets/44/chol_model_22.mirage

@@ -6,7 +6,6 @@
 # COMBs
 # number of combinations
 4
-
 ####################
 # COMB_0
 # number of types devices
@@ -29,13 +28,15 @@
 #####
 # Model for cpu0_impl0 (Comb0)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d46431bb	1228800        	6.553600e+07   	3.262643e+03   	7.810468e+01   	1.532463e+07   	5.002746e+10   	4697
 24c84a50	11059200       	1.769472e+09   	8.778020e+04   	9.598441e+02   	2.889724e+08   	2.536909e+13   	3292
+f0ac7beb	4915200        	5.242880e+08   	2.647095e+04   	4.073263e+02   	4.762124e+07   	1.260878e+12   	1799
 
 ####################
 # COMB_1
@@ -59,13 +60,15 @@ nan            	nan            	nan
 #####
 # Model for cuda0_impl0 (Comb1)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d46431bb	1228800        	6.553600e+07   	2.011248e+02   	1.498037e+01   	1.633334e+06   	3.303264e+08   	8121
 24c84a50	11059200       	1.769472e+09   	2.805491e+03   	6.931361e+01   	3.683329e+07   	1.033985e+11   	13129
+f0ac7beb	4915200        	5.242880e+08   	8.944354e+02   	3.828761e+01   	5.687714e+06   	5.096615e+09   	6359
 
 ####################
 # COMB_2
@@ -89,13 +92,15 @@ nan            	nan            	nan
 #####
 # Model for cuda1_impl0 (Comb2)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d46431bb	1228800        	6.553600e+07   	2.004836e+02   	1.337883e+01   	1.620709e+06   	3.263726e+08   	8084
 24c84a50	11059200       	1.769472e+09   	2.828590e+03   	6.702999e+01   	3.650578e+07   	1.033178e+11   	12906
+f0ac7beb	4915200        	5.242880e+08   	9.090465e+02   	3.898196e+01   	5.691540e+06   	5.183389e+09   	6261
 
 ####################
 # COMB_3
@@ -119,10 +124,13 @@ nan            	nan            	nan
 #####
 # Model for cuda2_impl0 (Comb3)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d46431bb	1228800        	6.553600e+07   	1.603761e+02   	1.178063e+01   	1.522450e+06   	2.454821e+08   	9493
 24c84a50	11059200       	1.769472e+09   	2.828209e+03   	7.003112e+01   	3.675541e+07   	1.040157e+11   	12996
+f0ac7beb	4915200        	5.242880e+08   	8.858930e+02   	3.323656e+01   	5.675030e+06   	5.034546e+09   	6406
+

+ 18 - 10
tools/perfmodels/.starpu/sampling/codelets/44/starpu_dlu_lu_model_11.mirage

@@ -28,16 +28,18 @@
 #####
 # Model for cpu0_impl0 (Comb3)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+afdd228b	3276800        	0.000000e+00   	7.065042e+04   	7.118479e+03   	1.271707e+06   	9.075877e+10   	18
 617e5fe6	7372800        	0.000000e+00   	2.321971e+05   	3.386520e+04   	2.554168e+06   	6.056858e+11   	11
+cea37d6d	819200         	0.000000e+00   	8.644872e+03   	1.175676e+03   	4.581782e+05   	4.034149e+09   	53
 
 ####################
-# COMB_0
+# COMB_2
 # number of types devices
 1
 ####################
@@ -56,18 +58,20 @@ nan            	nan            	nan
 # number of implementations
 1
 #####
-# Model for cuda0_impl0 (Comb0)
+# Model for cuda0_impl0 (Comb2)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+afdd228b	3276800        	0.000000e+00   	3.469534e+04   	1.243993e+03   	9.714695e+05   	3.374879e+10   	28
 617e5fe6	7372800        	0.000000e+00   	8.533007e+04   	9.757927e+03   	1.194621e+06   	1.032701e+11   	14
+cea37d6d	819200         	0.000000e+00   	1.145973e+04   	6.017234e+02   	1.145973e+05   	1.316874e+09   	10
 
 ####################
-# COMB_1
+# COMB_0
 # number of types devices
 1
 ####################
@@ -86,18 +90,20 @@ nan            	nan            	nan
 # number of implementations
 1
 #####
-# Model for cuda1_impl0 (Comb1)
+# Model for cuda1_impl0 (Comb0)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+afdd228b	3276800        	0.000000e+00   	3.498011e+04   	2.179531e+03   	6.996022e+05   	2.456717e+10   	20
 617e5fe6	7372800        	0.000000e+00   	8.442764e+04   	6.770170e+03   	1.350842e+06   	1.147818e+11   	16
+cea37d6d	819200         	0.000000e+00   	1.080764e+04   	2.151492e+02   	1.188840e+05   	1.285365e+09   	11
 
 ####################
-# COMB_2
+# COMB_1
 # number of types devices
 1
 ####################
@@ -116,13 +122,15 @@ nan            	nan            	nan
 # number of implementations
 1
 #####
-# Model for cuda2_impl0 (Comb2)
+# Model for cuda2_impl0 (Comb1)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+afdd228b	3276800        	0.000000e+00   	3.506064e+04   	2.956747e+03   	6.310915e+05   	2.228383e+10   	18
 617e5fe6	7372800        	0.000000e+00   	8.151052e+04   	4.250155e+02   	1.059637e+06   	8.637388e+10   	13
+cea37d6d	819200         	0.000000e+00   	1.153062e+04   	1.200141e+03   	1.153062e+05   	1.343956e+09   	10
 

+ 18 - 11
tools/perfmodels/.starpu/sampling/codelets/44/starpu_dlu_lu_model_12.mirage

@@ -6,7 +6,6 @@
 # COMBs
 # number of combinations
 4
-
 ####################
 # COMB_3
 # number of types devices
@@ -29,16 +28,18 @@
 #####
 # Model for cpu0_impl0 (Comb3)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	6553600        	0.000000e+00   	2.758103e+04   	7.024890e+02   	7.033162e+06   	1.941076e+11   	255
 ff82dda0	14745600       	0.000000e+00   	9.143755e+04   	1.725750e+03   	1.234407e+07   	1.129114e+12   	135
+2c1922b7	1638400        	0.000000e+00   	3.516018e+03   	1.528455e+02   	1.613852e+06   	5.685057e+09   	459
 
 ####################
-# COMB_0
+# COMB_2
 # number of types devices
 1
 ####################
@@ -57,18 +58,20 @@ ff82dda0	14745600       	0.000000e+00   	9.143755e+04   	1.725750e+03   	1.23440
 # number of implementations
 1
 #####
-# Model for cuda0_impl0 (Comb0)
+# Model for cuda0_impl0 (Comb2)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	6553600        	0.000000e+00   	2.131008e+03   	3.294125e+02   	6.755295e+05   	1.473957e+09   	317
 ff82dda0	14745600       	0.000000e+00   	7.209283e+03   	1.090675e+03   	1.564414e+06   	1.153644e+10   	217
+2c1922b7	1638400        	0.000000e+00   	6.237527e+02   	1.148972e+02   	1.210080e+05   	7.804013e+07   	194
 
 ####################
-# COMB_1
+# COMB_0
 # number of types devices
 1
 ####################
@@ -87,18 +90,20 @@ ff82dda0	14745600       	0.000000e+00   	7.209283e+03   	1.090675e+03   	1.56441
 # number of implementations
 1
 #####
-# Model for cuda1_impl0 (Comb1)
+# Model for cuda1_impl0 (Comb0)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	6553600        	0.000000e+00   	2.163459e+03   	3.374464e+02   	5.538454e+05   	1.227372e+09   	256
 ff82dda0	14745600       	0.000000e+00   	6.895326e+03   	1.111793e+03   	1.234263e+06   	8.731908e+09   	179
+2c1922b7	1638400        	0.000000e+00   	6.290993e+02   	1.019490e+02   	1.333690e+05   	8.610581e+07   	212
 
 ####################
-# COMB_2
+# COMB_1
 # number of types devices
 1
 ####################
@@ -117,13 +122,15 @@ ff82dda0	14745600       	0.000000e+00   	6.895326e+03   	1.111793e+03   	1.23426
 # number of implementations
 1
 #####
-# Model for cuda2_impl0 (Comb2)
+# Model for cuda2_impl0 (Comb1)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	6553600        	0.000000e+00   	2.119354e+03   	3.243594e+02   	5.912998e+05   	1.282527e+09   	279
 ff82dda0	14745600       	0.000000e+00   	6.998019e+03   	1.239620e+03   	1.070697e+06   	7.727865e+09   	153
+2c1922b7	1638400        	0.000000e+00   	6.140937e+02   	1.075567e+02   	1.430838e+05   	9.056234e+07   	233
 

+ 18 - 11
tools/perfmodels/.starpu/sampling/codelets/44/starpu_dlu_lu_model_21.mirage

@@ -6,7 +6,6 @@
 # COMBs
 # number of combinations
 4
-
 ####################
 # COMB_3
 # number of types devices
@@ -29,16 +28,18 @@
 #####
 # Model for cpu0_impl0 (Comb3)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	6553600        	0.000000e+00   	2.762618e+04   	9.983022e+02   	6.575032e+06   	1.818802e+11   	238
 ff82dda0	14745600       	0.000000e+00   	9.068591e+04   	1.985325e+03   	1.324014e+07   	1.201270e+12   	146
+2c1922b7	1638400        	0.000000e+00   	3.579286e+03   	2.361748e+02   	1.449611e+06   	5.211162e+09   	405
 
 ####################
-# COMB_0
+# COMB_2
 # number of types devices
 1
 ####################
@@ -57,18 +58,20 @@ ff82dda0	14745600       	0.000000e+00   	9.068591e+04   	1.985325e+03   	1.32401
 # number of implementations
 1
 #####
-# Model for cuda0_impl0 (Comb0)
+# Model for cuda0_impl0 (Comb2)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	6553600        	0.000000e+00   	2.106536e+03   	3.670134e+02   	5.856171e+05   	1.271070e+09   	278
 ff82dda0	14745600       	0.000000e+00   	7.299043e+03   	1.073594e+03   	1.284632e+06   	9.579441e+09   	176
+2c1922b7	1638400        	0.000000e+00   	6.166979e+02   	1.186269e+02   	1.362902e+05   	8.715990e+07   	221
 
 ####################
-# COMB_1
+# COMB_0
 # number of types devices
 1
 ####################
@@ -87,18 +90,20 @@ ff82dda0	14745600       	0.000000e+00   	7.299043e+03   	1.073594e+03   	1.28463
 # number of implementations
 1
 #####
-# Model for cuda1_impl0 (Comb1)
+# Model for cuda1_impl0 (Comb0)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	6553600        	0.000000e+00   	2.072463e+03   	3.421274e+02   	6.590431e+05   	1.403064e+09   	318
 ff82dda0	14745600       	0.000000e+00   	6.791353e+03   	1.183637e+03   	1.195278e+06   	8.364131e+09   	176
+2c1922b7	1638400        	0.000000e+00   	6.128580e+02   	1.104622e+02   	1.378931e+05   	8.725430e+07   	225
 
 ####################
-# COMB_2
+# COMB_1
 # number of types devices
 1
 ####################
@@ -117,13 +122,15 @@ ff82dda0	14745600       	0.000000e+00   	6.791353e+03   	1.183637e+03   	1.19527
 # number of implementations
 1
 #####
-# Model for cuda2_impl0 (Comb2)
+# Model for cuda2_impl0 (Comb1)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	6553600        	0.000000e+00   	2.129169e+03   	3.327197e+02   	5.024838e+05   	1.095999e+09   	236
 ff82dda0	14745600       	0.000000e+00   	6.700018e+03   	1.125184e+03   	1.139003e+06   	7.846568e+09   	170
+2c1922b7	1638400        	0.000000e+00   	6.207819e+02   	1.142635e+02   	1.440214e+05   	9.243491e+07   	232
 

+ 18 - 11
tools/perfmodels/.starpu/sampling/codelets/44/starpu_dlu_lu_model_22.mirage

@@ -6,7 +6,6 @@
 # COMBs
 # number of combinations
 4
-
 ####################
 # COMB_3
 # number of types devices
@@ -29,16 +28,18 @@
 #####
 # Model for cpu0_impl0 (Comb3)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+f0ac7beb	9830400        	0.000000e+00   	5.319005e+04   	1.072845e+03   	1.074439e+08   	5.717271e+12   	2020
 24c84a50	22118400       	0.000000e+00   	1.747556e+05   	3.288616e+03   	2.457064e+08   	4.295378e+13   	1406
+d46431bb	2457600        	0.000000e+00   	6.731248e+03   	2.017842e+02   	1.758875e+07   	1.185006e+11   	2613
 
 ####################
-# COMB_0
+# COMB_2
 # number of types devices
 1
 ####################
@@ -57,18 +58,20 @@ nan            	nan            	nan
 # number of implementations
 1
 #####
-# Model for cuda0_impl0 (Comb0)
+# Model for cuda0_impl0 (Comb2)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+f0ac7beb	9830400        	0.000000e+00   	1.857771e+03   	5.953793e+01   	1.442559e+07   	2.682697e+10   	7765
 24c84a50	22118400       	0.000000e+00   	5.825821e+03   	1.536397e+02   	3.023019e+07   	1.762382e+11   	5189
+d46431bb	2457600        	0.000000e+00   	2.626388e+02   	2.130047e+01   	1.891262e+06   	4.999858e+08   	7201
 
 ####################
-# COMB_1
+# COMB_0
 # number of types devices
 1
 ####################
@@ -87,18 +90,20 @@ nan            	nan            	nan
 # number of implementations
 1
 #####
-# Model for cuda1_impl0 (Comb1)
+# Model for cuda1_impl0 (Comb0)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+f0ac7beb	9830400        	0.000000e+00   	1.841710e+03   	6.898710e+01   	1.448873e+07   	2.672149e+10   	7867
 24c84a50	22118400       	0.000000e+00   	5.866678e+03   	1.842980e+02   	2.977339e+07   	1.748433e+11   	5075
+d46431bb	2457600        	0.000000e+00   	2.614108e+02   	2.029949e+01   	1.936531e+06   	5.092829e+08   	7408
 
 ####################
-# COMB_2
+# COMB_1
 # number of types devices
 1
 ####################
@@ -117,13 +122,15 @@ nan            	nan            	nan
 # number of implementations
 1
 #####
-# Model for cuda2_impl0 (Comb2)
+# Model for cuda2_impl0 (Comb1)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+f0ac7beb	9830400        	0.000000e+00   	1.853277e+03   	6.983878e+01   	1.439996e+07   	2.672502e+10   	7770
 24c84a50	22118400       	0.000000e+00   	5.858635e+03   	1.761006e+02   	3.008995e+07   	1.764453e+11   	5136
+d46431bb	2457600        	0.000000e+00   	2.701366e+02   	1.779276e+01   	1.899060e+06   	5.152311e+08   	7030
 

+ 17 - 9
tools/perfmodels/.starpu/sampling/codelets/44/starpu_slu_lu_model_11.mirage

@@ -6,7 +6,6 @@
 # COMBs
 # number of combinations
 4
-
 ####################
 # COMB_3
 # number of types devices
@@ -29,13 +28,15 @@
 #####
 # Model for cpu0_impl0 (Comb3)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+afdd228b	1638400        	0.000000e+00   	3.789658e+04   	4.182352e+03   	1.250587e+06   	4.797021e+10   	33
 617e5fe6	3686400        	0.000000e+00   	1.286436e+05   	1.271269e+04   	2.958803e+06   	3.843483e+11   	23
+cea37d6d	409600         	0.000000e+00   	4.236597e+03   	2.366692e+02   	2.372495e+05   	1.008267e+09   	56
 
 ####################
 # COMB_0
@@ -59,16 +60,18 @@ nan            	nan            	nan
 #####
 # Model for cuda0_impl0 (Comb0)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+afdd228b	1638400        	0.000000e+00   	2.864580e+04   	3.233071e+03   	5.156243e+05   	1.495862e+10   	18
 617e5fe6	3686400        	0.000000e+00   	5.948740e+04   	4.910517e+03   	1.070773e+06   	6.413154e+10   	18
+cea37d6d	409600         	0.000000e+00   	1.060245e+04   	4.247968e+02   	1.060245e+05   	1.125924e+09   	10
 
 ####################
-# COMB_1
+# COMB_2
 # number of types devices
 1
 ####################
@@ -87,18 +90,20 @@ nan            	nan            	nan
 # number of implementations
 1
 #####
-# Model for cuda1_impl0 (Comb1)
+# Model for cuda1_impl0 (Comb2)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+afdd228b	1638400        	0.000000e+00   	3.046163e+04   	4.754796e+03   	5.483094e+05   	1.710934e+10   	18
 617e5fe6	3686400        	0.000000e+00   	5.865963e+04   	4.672589e+03   	1.349171e+06   	7.964405e+10   	23
+cea37d6d	409600         	0.000000e+00   	1.042618e+04   	1.817032e+02   	1.042618e+05   	1.087383e+09   	10
 
 ####################
-# COMB_2
+# COMB_1
 # number of types devices
 1
 ####################
@@ -117,12 +122,15 @@ nan            	nan            	nan
 # number of implementations
 1
 #####
-# Model for cuda2_impl0 (Comb2)
+# Model for cuda2_impl0 (Comb1)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+afdd228b	1638400        	0.000000e+00   	2.939722e+04   	4.040622e+03   	4.409582e+05   	1.320784e+10   	15
 617e5fe6	3686400        	0.000000e+00   	5.704610e+04   	3.429433e+03   	1.255014e+06   	7.185241e+10   	22
+cea37d6d	409600         	0.000000e+00   	1.049902e+04   	4.776188e+02   	1.049902e+05   	1.104575e+09   	10
+

+ 17 - 9
tools/perfmodels/.starpu/sampling/codelets/44/starpu_slu_lu_model_12.mirage

@@ -6,7 +6,6 @@
 # COMBs
 # number of combinations
 4
-
 ####################
 # COMB_3
 # number of types devices
@@ -29,13 +28,15 @@
 #####
 # Model for cpu0_impl0 (Comb3)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	3276800        	0.000000e+00   	1.615269e+04   	4.099119e+02   	4.748890e+06   	7.675673e+10   	294
 ff82dda0	7372800        	0.000000e+00   	5.118532e+04   	6.422962e+02   	1.530441e+07   	7.834845e+11   	299
+2c1922b7	819200         	0.000000e+00   	2.296074e+03   	7.445272e+01   	1.021753e+06   	2.348487e+09   	445
 
 ####################
 # COMB_0
@@ -59,16 +60,18 @@ ff82dda0	7372800        	0.000000e+00   	5.118532e+04   	6.422962e+02   	1.53044
 #####
 # Model for cuda0_impl0 (Comb0)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	3276800        	0.000000e+00   	2.740712e+03   	2.663471e+02   	5.755494e+05   	1.592313e+09   	210
 ff82dda0	7372800        	0.000000e+00   	6.504044e+03   	4.912781e+02   	1.385361e+06   	9.061859e+09   	213
+2c1922b7	819200         	0.000000e+00   	6.801212e+02   	1.149855e+02   	1.129001e+05   	7.898057e+07   	166
 
 ####################
-# COMB_1
+# COMB_2
 # number of types devices
 1
 ####################
@@ -87,18 +90,20 @@ ff82dda0	7372800        	0.000000e+00   	6.504044e+03   	4.912781e+02   	1.38536
 # number of implementations
 1
 #####
-# Model for cuda1_impl0 (Comb1)
+# Model for cuda1_impl0 (Comb2)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	3276800        	0.000000e+00   	2.716114e+03   	2.688407e+02   	4.237138e+05   	1.162130e+09   	156
 ff82dda0	7372800        	0.000000e+00   	6.512491e+03   	5.367987e+02   	8.270864e+05   	5.422988e+09   	127
+2c1922b7	819200         	0.000000e+00   	7.284912e+02   	1.021807e+02   	1.049027e+05   	7.792421e+07   	144
 
 ####################
-# COMB_2
+# COMB_1
 # number of types devices
 1
 ####################
@@ -117,12 +122,15 @@ ff82dda0	7372800        	0.000000e+00   	6.512491e+03   	5.367987e+02   	8.27086
 # number of implementations
 1
 #####
-# Model for cuda2_impl0 (Comb2)
+# Model for cuda2_impl0 (Comb1)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	3276800        	0.000000e+00   	2.294336e+03   	5.071880e+02   	4.909878e+05   	1.181540e+09   	214
 ff82dda0	7372800        	0.000000e+00   	6.469485e+03   	5.370376e+02   	7.698688e+05   	5.014976e+09   	119
+2c1922b7	819200         	0.000000e+00   	7.112055e+02   	1.136474e+02   	1.002800e+05   	7.314078e+07   	141
+

+ 17 - 9
tools/perfmodels/.starpu/sampling/codelets/44/starpu_slu_lu_model_21.mirage

@@ -6,7 +6,6 @@
 # COMBs
 # number of combinations
 4
-
 ####################
 # COMB_3
 # number of types devices
@@ -29,13 +28,15 @@
 #####
 # Model for cpu0_impl0 (Comb3)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	3276800        	0.000000e+00   	1.373117e+04   	2.756172e+02   	7.167670e+06   	9.846014e+10   	522
 ff82dda0	7372800        	0.000000e+00   	4.545501e+04   	7.462378e+02   	1.750018e+07   	7.956851e+11   	385
+2c1922b7	819200         	0.000000e+00   	1.798916e+03   	8.480081e+01   	1.219665e+06   	2.198952e+09   	678
 
 ####################
 # COMB_0
@@ -59,16 +60,18 @@ ff82dda0	7372800        	0.000000e+00   	4.545501e+04   	7.462378e+02   	1.75001
 #####
 # Model for cuda0_impl0 (Comb0)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	3276800        	0.000000e+00   	2.883473e+03   	4.679640e+02   	2.537456e+05   	7.509396e+08   	88
 ff82dda0	7372800        	0.000000e+00   	6.462089e+03   	4.136967e+02   	5.751259e+05   	3.731746e+09   	89
+2c1922b7	819200         	0.000000e+00   	4.040830e+02   	6.411732e+01   	3.717564e+04   	1.540026e+07   	92
 
 ####################
-# COMB_1
+# COMB_2
 # number of types devices
 1
 ####################
@@ -87,18 +90,20 @@ ff82dda0	7372800        	0.000000e+00   	6.462089e+03   	4.136967e+02   	5.75125
 # number of implementations
 1
 #####
-# Model for cuda1_impl0 (Comb1)
+# Model for cuda1_impl0 (Comb2)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	3276800        	0.000000e+00   	2.231007e+03   	5.378925e+02   	3.234960e+05   	7.636746e+08   	145
 ff82dda0	7372800        	0.000000e+00   	3.904524e+03   	2.515208e+02   	4.021660e+05   	1.576783e+09   	103
+2c1922b7	819200         	0.000000e+00   	5.307827e+02   	1.276617e+02   	5.467062e+04   	3.069686e+07   	103
 
 ####################
-# COMB_2
+# COMB_1
 # number of types devices
 1
 ####################
@@ -117,12 +122,15 @@ ff82dda0	7372800        	0.000000e+00   	3.904524e+03   	2.515208e+02   	4.02166
 # number of implementations
 1
 #####
-# Model for cuda2_impl0 (Comb2)
+# Model for cuda2_impl0 (Comb1)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+d39bff17	3276800        	0.000000e+00   	1.665736e+03   	1.392688e+02   	2.881723e+05   	4.833744e+08   	173
 ff82dda0	7372800        	0.000000e+00   	3.891632e+03   	2.259287e+02   	7.199519e+05   	2.811230e+09   	185
+2c1922b7	819200         	0.000000e+00   	5.125766e+02   	1.240167e+02   	5.587085e+04   	3.031453e+07   	109
+

+ 17 - 9
tools/perfmodels/.starpu/sampling/codelets/44/starpu_slu_lu_model_22.mirage

@@ -6,7 +6,6 @@
 # COMBs
 # number of combinations
 4
-
 ####################
 # COMB_3
 # number of types devices
@@ -29,13 +28,15 @@
 #####
 # Model for cpu0_impl0 (Comb3)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+f0ac7beb	4915200        	0.000000e+00   	2.645658e+04   	4.968429e+02   	5.820449e+07   	1.540435e+12   	2200
 24c84a50	11059200       	0.000000e+00   	8.756135e+04   	9.752924e+02   	1.866808e+08   	1.634805e+13   	2132
+d46431bb	1228800        	0.000000e+00   	3.234444e+03   	8.877025e+01   	1.325799e+07   	4.291452e+10   	4099
 
 ####################
 # COMB_0
@@ -59,16 +60,18 @@ nan            	nan            	nan
 #####
 # Model for cuda0_impl0 (Comb0)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+f0ac7beb	4915200        	0.000000e+00   	8.760921e+02   	3.574580e+01   	7.074444e+06   	6.208182e+09   	8075
 24c84a50	11059200       	0.000000e+00   	2.988744e+03   	8.136061e+01   	2.363499e+07   	7.069126e+10   	7908
+d46431bb	1228800        	0.000000e+00   	1.911930e+02   	1.434147e+01   	1.248108e+06   	2.399722e+08   	6528
 
 ####################
-# COMB_1
+# COMB_2
 # number of types devices
 1
 ####################
@@ -87,18 +90,20 @@ nan            	nan            	nan
 # number of implementations
 1
 #####
-# Model for cuda1_impl0 (Comb1)
+# Model for cuda1_impl0 (Comb2)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+f0ac7beb	4915200        	0.000000e+00   	9.198175e+02   	4.677043e+01   	6.931745e+06   	6.392425e+09   	7536
 24c84a50	11059200       	0.000000e+00   	3.016176e+03   	6.737054e+01   	2.311597e+07   	6.975663e+10   	7664
+d46431bb	1228800        	0.000000e+00   	1.910500e+02   	1.400155e+01   	1.317099e+06   	2.529832e+08   	6894
 
 ####################
-# COMB_2
+# COMB_1
 # number of types devices
 1
 ####################
@@ -117,12 +122,15 @@ nan            	nan            	nan
 # number of implementations
 1
 #####
-# Model for cuda2_impl0 (Comb2)
+# Model for cuda2_impl0 (Comb1)
 # number of entries
-1
+3
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
 nan            	nan            	nan            
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
+f0ac7beb	4915200        	0.000000e+00   	9.143628e+02   	4.685332e+01   	6.720566e+06   	6.161171e+09   	7350
 24c84a50	11059200       	0.000000e+00   	3.002393e+03   	6.861698e+01   	2.339765e+07   	7.028562e+10   	7793
+d46431bb	1228800        	0.000000e+00   	1.898967e+02   	1.421585e+01   	1.327568e+06   	2.535136e+08   	6991
+