Переглянути джерело

Add sgemm perfmodels for 960*960*960*2

Samuel Thibault 4 роки тому
батько
коміт
509e930b67

+ 16 - 4
tools/perfmodels/sampling/codelets/45/starpu_sgemm_gemm.attila

@@ -29,7 +29,7 @@
 #####
 # Model for cpu0_impl0 (Comb3)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -38,6 +38,9 @@ nan            	nan            	nan
 0
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 492beed5	33177600       	7.077888e+09   	3.328725e+05   	1.185902e+04   	2.563119e+07   	8.542747e+12   	77
+9c6670ef	29491200       	7.077888e+09   	3.328725e+05   	1.185902e+04   	2.563119e+07   	8.542747e+12   	77
+c00cf6b7	29491200       	7.077888e+09   	3.328725e+05   	1.185902e+04   	2.563119e+07   	8.542747e+12   	77
+78a2cc08	29491200       	7.077888e+09   	3.328725e+05   	1.185902e+04   	2.563119e+07   	8.542747e+12   	77
 24c84a50	11059200       	1.769472e+09   	8.321812e+04   	2.964755e+03   	6.407798e+06   	5.339217e+11   	77
 0b0b0ce8	3686400        	2.621440e+08   	1.421718e+04   	3.409134e+02   	9.098993e+05   	1.294364e+10   	64
 4220e23d	14745600       	2.097152e+09   	1.008105e+05   	2.361630e+03   	8.064841e+06   	8.134670e+11   	80
@@ -64,7 +67,7 @@ nan            	nan            	nan
 #####
 # Model for cuda0_impl0 (Comb0)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -73,6 +76,9 @@ nan            	nan            	nan
 0
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 492beed5	33177600       	7.077888e+09   	1.123499e+04   	6.785566e+01   	1.190909e+06   	1.338033e+10   	106
+9c6670ef	29491200       	7.077888e+09   	1.123499e+04   	6.785566e+01   	1.190909e+06   	1.338033e+10   	106
+c00cf6b7	29491200       	7.077888e+09   	1.123499e+04   	6.785566e+01   	1.190909e+06   	1.338033e+10   	106
+78a2cc08	29491200       	7.077888e+09   	1.123499e+04   	6.785566e+01   	1.190909e+06   	1.338033e+10   	106
 24c84a50	11059200       	1.769472e+09   	2.808747e+03   	1.696392e+01   	2.977272e+05   	8.362706e+08   	106
 0b0b0ce8	3686400        	2.621440e+08   	6.738679e+02   	4.393713e+01   	6.873452e+04   	4.651489e+07   	102
 4220e23d	14745600       	2.097152e+09   	5.557425e+03   	3.241733e+02   	5.835297e+05   	3.253957e+09   	105
@@ -99,7 +105,7 @@ nan            	nan            	nan
 #####
 # Model for cuda1_impl0 (Comb2)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -108,6 +114,9 @@ nan            	nan            	nan
 0
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 492beed5	33177600       	7.077888e+09   	1.123077e+04   	9.504466e+01   	1.179231e+06   	1.324463e+10   	105
+9c6670ef	29491200       	7.077888e+09   	1.123077e+04   	9.504466e+01   	1.179231e+06   	1.324463e+10   	105
+c00cf6b7	29491200       	7.077888e+09   	1.123077e+04   	9.504466e+01   	1.179231e+06   	1.324463e+10   	105
+78a2cc08	29491200       	7.077888e+09   	1.123077e+04   	9.504466e+01   	1.179231e+06   	1.324463e+10   	105
 24c84a50	11059200       	1.769472e+09   	2.807693e+03   	2.376116e+01   	2.948078e+05   	8.277894e+08   	105
 0b0b0ce8	3686400        	2.621440e+08   	6.672056e+02   	3.376608e+01   	6.805497e+04   	4.552295e+07   	102
 4220e23d	14745600       	2.097152e+09   	5.553764e+03   	3.500896e+02   	5.831453e+05   	3.251521e+09   	105
@@ -134,7 +143,7 @@ nan            	nan            	nan
 #####
 # Model for cuda2_impl0 (Comb1)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -143,6 +152,9 @@ nan            	nan            	nan
 0
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 492beed5	33177600       	7.077888e+09   	1.124174e+04   	2.629960e+01   	1.180383e+06   	1.326963e+10   	105
+9c6670ef	29491200       	7.077888e+09   	1.124174e+04   	2.629960e+01   	1.180383e+06   	1.326963e+10   	105
+c00cf6b7	29491200       	7.077888e+09   	1.124174e+04   	2.629960e+01   	1.180383e+06   	1.326963e+10   	105
+78a2cc08	29491200       	7.077888e+09   	1.124174e+04   	2.629960e+01   	1.180383e+06   	1.326963e+10   	105
 24c84a50	11059200       	1.769472e+09   	2.810435e+03   	6.574900e+00   	2.950958e+05   	8.293519e+08   	105
 0b0b0ce8	3686400        	2.621440e+08   	6.002221e+02   	2.259043e+01   	6.242310e+04   	3.752080e+07   	104
 4220e23d	14745600       	2.097152e+09   	5.577722e+03   	1.615194e+02   	5.912385e+05   	3.300529e+09   	106

+ 36 - 9
tools/perfmodels/sampling/codelets/45/starpu_sgemm_gemm.idgraf

@@ -28,7 +28,7 @@
 #####
 # Model for cuda0_impl0 (Comb2)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -39,6 +39,9 @@ nan            	nan            	nan
 0b0b0ce8	3686400        	2.621440e+08   	6.801013e+02   	7.013561e+01   	4.760709e+04   	3.272198e+07   	70
 4220e23d	14745600       	2.097152e+09   	5.623635e+03   	5.419920e+02   	4.442672e+05   	2.521603e+09   	79
 492beed5	33177600       	7.077888e+09   	1.150361e+04   	5.884814e+02   	1.000814e+06   	1.154310e+10   	87
+9c6670ef	29491200       	7.077888e+09   	1.150361e+04   	5.884814e+02   	1.000814e+06   	1.154310e+10   	87
+c00cf6b7	29491200       	7.077888e+09   	1.150361e+04   	5.884814e+02   	1.000814e+06   	1.154310e+10   	87
+78a2cc08	29491200       	7.077888e+09   	1.150361e+04   	5.884814e+02   	1.000814e+06   	1.154310e+10   	87
 24c84a50	11059200       	1.769472e+09   	2.875903e+03   	1.471204e+02   	2.502035e+05   	7.214438e+08   	87
 
 ####################
@@ -63,7 +66,7 @@ nan            	nan            	nan
 #####
 # Model for cuda1_impl0 (Comb4)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -74,6 +77,9 @@ nan            	nan            	nan
 0b0b0ce8	3686400        	2.621440e+08   	6.717051e+02   	6.137607e+01   	4.500424e+04   	3.048197e+07   	67
 4220e23d	14745600       	2.097152e+09   	5.648275e+03   	4.677390e+02   	4.575103e+05   	2.601865e+09   	81
 492beed5	33177600       	7.077888e+09   	1.157020e+04   	6.521027e+02   	1.018178e+06   	1.181795e+10   	88
+9c6670ef	29491200       	7.077888e+09   	1.157020e+04   	6.521027e+02   	1.018178e+06   	1.181795e+10   	88
+c00cf6b7	29491200       	7.077888e+09   	1.157020e+04   	6.521027e+02   	1.018178e+06   	1.181795e+10   	88
+78a2cc08	29491200       	7.077888e+09   	1.157020e+04   	6.521027e+02   	1.018178e+06   	1.181795e+10   	88
 24c84a50	11059200       	1.769472e+09   	2.892550e+03   	1.630257e+02   	2.545445e+05   	7.386219e+08   	88
 
 ####################
@@ -98,7 +104,7 @@ nan            	nan            	nan
 #####
 # Model for cuda2_impl0 (Comb6)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -109,6 +115,9 @@ nan            	nan            	nan
 0b0b0ce8	3686400        	2.621440e+08   	6.265559e+02   	5.536840e+01   	4.824481e+04   	3.046412e+07   	77
 4220e23d	14745600       	2.097152e+09   	5.631203e+03   	4.767455e+02   	4.561275e+05   	2.586957e+09   	81
 492beed5	33177600       	7.077888e+09   	1.162826e+04   	6.757302e+02   	1.023286e+06   	1.193922e+10   	88
+9c6670ef	29491200       	7.077888e+09   	1.162826e+04   	6.757302e+02   	1.023286e+06   	1.193922e+10   	88
+c00cf6b7	29491200       	7.077888e+09   	1.162826e+04   	6.757302e+02   	1.023286e+06   	1.193922e+10   	88
+78a2cc08	29491200       	7.077888e+09   	1.162826e+04   	6.757302e+02   	1.023286e+06   	1.193922e+10   	88
 24c84a50	11059200       	1.769472e+09   	2.907065e+03   	1.689325e+02   	2.558215e+05   	7.462012e+08   	88
 
 ####################
@@ -133,7 +142,7 @@ nan            	nan            	nan
 #####
 # Model for cuda3_impl0 (Comb7)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -144,6 +153,9 @@ nan            	nan            	nan
 0b0b0ce8	3686400        	2.621440e+08   	6.780899e+02   	4.241206e+01   	4.543202e+04   	3.092751e+07   	67
 4220e23d	14745600       	2.097152e+09   	5.857201e+03   	8.346836e+02   	4.744333e+05   	2.835284e+09   	81
 492beed5	33177600       	7.077888e+09   	1.150498e+04   	4.254093e+02   	9.894285e+05   	1.139892e+10   	86
+9c6670ef	29491200       	7.077888e+09   	1.150498e+04   	4.254093e+02   	9.894285e+05   	1.139892e+10   	86
+c00cf6b7	29491200       	7.077888e+09   	1.150498e+04   	4.254093e+02   	9.894285e+05   	1.139892e+10   	86
+78a2cc08	29491200       	7.077888e+09   	1.150498e+04   	4.254093e+02   	9.894285e+05   	1.139892e+10   	86
 24c84a50	11059200       	1.769472e+09   	2.876245e+03   	1.063523e+02   	2.473571e+05   	7.124325e+08   	86
 
 ####################
@@ -168,7 +180,7 @@ nan            	nan            	nan
 #####
 # Model for cuda4_impl0 (Comb0)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -179,6 +191,9 @@ nan            	nan            	nan
 0b0b0ce8	3686400        	2.621440e+08   	6.759139e+02   	4.092799e+01   	4.190666e+04   	2.842915e+07   	62
 4220e23d	14745600       	2.097152e+09   	5.527477e+03   	2.733928e+02   	4.421982e+05   	2.450220e+09   	80
 492beed5	33177600       	7.077888e+09   	1.146770e+04   	1.768909e+02   	1.100899e+06   	1.262778e+10   	96
+9c6670ef	29491200       	7.077888e+09   	1.146770e+04   	1.768909e+02   	1.100899e+06   	1.262778e+10   	96
+c00cf6b7	29491200       	7.077888e+09   	1.146770e+04   	1.768909e+02   	1.100899e+06   	1.262778e+10   	96
+78a2cc08	29491200       	7.077888e+09   	1.146770e+04   	1.768909e+02   	1.100899e+06   	1.262778e+10   	96
 24c84a50	11059200       	1.769472e+09   	2.866925e+03   	4.422272e+01   	2.752248e+05   	7.892362e+08   	96
 
 ####################
@@ -203,7 +218,7 @@ nan            	nan            	nan
 #####
 # Model for cuda5_impl0 (Comb1)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -214,6 +229,9 @@ nan            	nan            	nan
 0b0b0ce8	3686400        	2.621440e+08   	6.339465e+02   	7.125158e+01   	4.184047e+04   	2.685969e+07   	66
 4220e23d	14745600       	2.097152e+09   	5.624130e+03   	4.755864e+02   	4.668028e+05   	2.644133e+09   	83
 492beed5	33177600       	7.077888e+09   	1.149102e+04   	5.375188e+02   	1.114629e+06   	1.283625e+10   	97
+9c6670ef	29491200       	7.077888e+09   	1.149102e+04   	5.375188e+02   	1.114629e+06   	1.283625e+10   	97
+c00cf6b7	29491200       	7.077888e+09   	1.149102e+04   	5.375188e+02   	1.114629e+06   	1.283625e+10   	97
+78a2cc08	29491200       	7.077888e+09   	1.149102e+04   	5.375188e+02   	1.114629e+06   	1.283625e+10   	97
 24c84a50	11059200       	1.769472e+09   	2.872755e+03   	1.343797e+02   	2.786572e+05   	8.022656e+08   	97
 
 ####################
@@ -238,7 +256,7 @@ nan            	nan            	nan
 #####
 # Model for cuda6_impl0 (Comb3)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -249,6 +267,9 @@ nan            	nan            	nan
 0b0b0ce8	3686400        	2.621440e+08   	6.389750e+02   	8.615382e+01   	4.728415e+04   	3.076266e+07   	74
 4220e23d	14745600       	2.097152e+09   	5.648331e+03   	5.220897e+02   	4.631632e+05   	2.638450e+09   	82
 492beed5	33177600       	7.077888e+09   	1.155069e+04   	5.660846e+02   	1.108866e+06   	1.283893e+10   	96
+9c6670ef	29491200       	7.077888e+09   	1.155069e+04   	5.660846e+02   	1.108866e+06   	1.283893e+10   	96
+c00cf6b7	29491200       	7.077888e+09   	1.155069e+04   	5.660846e+02   	1.108866e+06   	1.283893e+10   	96
+78a2cc08	29491200       	7.077888e+09   	1.155069e+04   	5.660846e+02   	1.108866e+06   	1.283893e+10   	96
 24c84a50	11059200       	1.769472e+09   	2.887673e+03   	1.415212e+02   	2.772165e+05   	8.024331e+08   	96
 
 ####################
@@ -273,7 +294,7 @@ nan            	nan            	nan
 #####
 # Model for cuda7_impl0 (Comb5)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -284,6 +305,9 @@ nan            	nan            	nan
 0b0b0ce8	3686400        	2.621440e+08   	6.386625e+02   	8.094896e+01   	4.342905e+04   	2.818209e+07   	68
 4220e23d	14745600       	2.097152e+09   	5.638657e+03   	3.709019e+02   	4.454539e+05   	2.522630e+09   	79
 492beed5	33177600       	7.077888e+09   	1.144012e+04   	2.531108e+02   	1.109691e+06   	1.270122e+10   	97
+9c6670ef	29491200       	7.077888e+09   	1.144012e+04   	2.531108e+02   	1.109691e+06   	1.270122e+10   	97
+c00cf6b7	29491200       	7.077888e+09   	1.144012e+04   	2.531108e+02   	1.109691e+06   	1.270122e+10   	97
+78a2cc08	29491200       	7.077888e+09   	1.144012e+04   	2.531108e+02   	1.109691e+06   	1.270122e+10   	97
 24c84a50	11059200       	1.769472e+09   	2.860030e+03   	6.327770e+01   	2.774228e+05   	7.938262e+08   	97
 
 ####################
@@ -308,7 +332,7 @@ nan            	nan            	nan
 #####
 # Model for cpu0_impl0 (Comb8)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -319,5 +343,8 @@ nan            	nan            	nan
 0b0b0ce8	3686400        	2.621440e+08   	1.414338e+04   	6.441210e+02   	3.535844e+05   	5.011251e+09   	25
 4220e23d	14745600       	2.097152e+09   	1.091117e+05   	2.701159e+03   	3.382462e+06   	3.692924e+11   	31
 492beed5	33177600       	7.077888e+09   	3.621356e+05   	7.764608e+03   	8.329119e+06   	3.017657e+12   	23
+9c6670ef	29491200       	7.077888e+09   	3.621356e+05   	7.764608e+03   	8.329119e+06   	3.017657e+12   	23
+c00cf6b7	29491200       	7.077888e+09   	3.621356e+05   	7.764608e+03   	8.329119e+06   	3.017657e+12   	23
+78a2cc08	29491200       	7.077888e+09   	3.621356e+05   	7.764608e+03   	8.329119e+06   	3.017657e+12   	23
 24c84a50	11059200       	1.769472e+09   	9.053390e+04   	1.941152e+03   	2.082280e+06   	1.886036e+11   	23
 

+ 16 - 4
tools/perfmodels/sampling/codelets/45/starpu_sgemm_gemm.mirage

@@ -29,7 +29,7 @@
 #####
 # Model for cpu0_impl0 (Comb3)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -39,6 +39,9 @@ nan            	nan            	nan
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 0b0b0ce8	3686400        	2.621440e+08   	1.352609e+04   	3.616534e+02   	1.082087e+06   	1.464687e+10   	80
 492beed5	33177600       	7.077888e+09   	3.550396e+05   	8.949994e+03   	2.840317e+07   	1.009066e+13   	80
+9c6670ef	29491200       	7.077888e+09   	3.550396e+05   	8.949994e+03   	2.840317e+07   	1.009066e+13   	80
+c00cf6b7	29491200       	7.077888e+09   	3.550396e+05   	8.949994e+03   	2.840317e+07   	1.009066e+13   	80
+78a2cc08	29491200       	7.077888e+09   	3.550396e+05   	8.949994e+03   	2.840317e+07   	1.009066e+13   	80
 24c84a50	11059200       	1.769472e+09   	8.875990e+04   	2.237499e+03   	7.100792e+06   	6.306662e+11   	80
 4220e23d	14745600       	2.097152e+09   	1.078112e+05   	1.983800e+03   	8.624897e+06   	9.301755e+11   	80
 
@@ -64,7 +67,7 @@ nan            	nan            	nan
 #####
 # Model for cuda0_impl0 (Comb1)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -74,6 +77,9 @@ nan            	nan            	nan
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 0b0b0ce8	3686400        	2.621440e+08   	6.589631e+02   	8.406511e+00   	6.787320e+04   	4.473321e+07   	103
 492beed5	33177600       	7.077888e+09   	1.151398e+04   	9.050114e+01   	1.220482e+06   	1.405348e+10   	106
+9c6670ef	29491200       	7.077888e+09   	1.151398e+04   	9.050114e+01   	1.220482e+06   	1.405348e+10   	106
+c00cf6b7	29491200       	7.077888e+09   	1.151398e+04   	9.050114e+01   	1.220482e+06   	1.405348e+10   	106
+78a2cc08	29491200       	7.077888e+09   	1.151398e+04   	9.050114e+01   	1.220482e+06   	1.405348e+10   	106
 24c84a50	11059200       	1.769472e+09   	2.878495e+03   	2.262529e+01   	3.051205e+05   	8.783425e+08   	106
 4220e23d	14745600       	2.097152e+09   	5.574713e+03   	3.353004e+02   	5.909196e+05   	3.306125e+09   	106
 
@@ -99,7 +105,7 @@ nan            	nan            	nan
 #####
 # Model for cuda1_impl0 (Comb0)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -109,6 +115,9 @@ nan            	nan            	nan
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 0b0b0ce8	3686400        	2.621440e+08   	6.663664e+02   	8.616537e+01   	6.796937e+04   	4.604980e+07   	102
 492beed5	33177600       	7.077888e+09   	1.150036e+04   	8.404527e+01   	1.207538e+06   	1.388786e+10   	105
+9c6670ef	29491200       	7.077888e+09   	1.150036e+04   	8.404527e+01   	1.207538e+06   	1.388786e+10   	105
+c00cf6b7	29491200       	7.077888e+09   	1.150036e+04   	8.404527e+01   	1.207538e+06   	1.388786e+10   	105
+78a2cc08	29491200       	7.077888e+09   	1.150036e+04   	8.404527e+01   	1.207538e+06   	1.388786e+10   	105
 24c84a50	11059200       	1.769472e+09   	2.875090e+03   	2.101132e+01   	3.018845e+05   	8.679912e+08   	105
 4220e23d	14745600       	2.097152e+09   	5.579034e+03   	3.672012e+02   	5.857985e+05   	3.282348e+09   	105
 
@@ -134,7 +143,7 @@ nan            	nan            	nan
 #####
 # Model for cuda2_impl0 (Comb2)
 # number of entries
-4
+7
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -144,6 +153,9 @@ nan            	nan            	nan
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 0b0b0ce8	3686400        	2.621440e+08   	6.181769e+02   	5.174143e+01   	6.181769e+04   	3.848198e+07   	100
 492beed5	33177600       	7.077888e+09   	1.148096e+04   	7.289415e+01   	1.205501e+06   	1.384086e+10   	105
+9c6670ef	29491200       	7.077888e+09   	1.148096e+04   	7.289415e+01   	1.205501e+06   	1.384086e+10   	105
+c00cf6b7	29491200       	7.077888e+09   	1.148096e+04   	7.289415e+01   	1.205501e+06   	1.384086e+10   	105
+78a2cc08	29491200       	7.077888e+09   	1.148096e+04   	7.289415e+01   	1.205501e+06   	1.384086e+10   	105
 24c84a50	11059200       	1.769472e+09   	2.870240e+03   	1.822354e+01   	3.013752e+05   	8.650538e+08   	105
 4220e23d	14745600       	2.097152e+09   	5.580581e+03   	3.970717e+02   	5.859610e+05   	3.286558e+09   	105
 

+ 20 - 5
tools/perfmodels/sampling/codelets/45/starpu_sgemm_gemm.sirocco

@@ -28,7 +28,7 @@
 #####
 # Model for cuda0_impl0 (Comb2)
 # number of entries
-5
+8
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -37,6 +37,9 @@ nan            	nan            	nan
 0
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 492beed5	33177600       	7.077888e+09   	2.745578e+03   	3.064191e+02   	6.616844e+05   	1.839335e+09   	241
+9c6670ef	29491200       	7.077888e+09   	2.745578e+03   	3.064191e+02   	6.616844e+05   	1.839335e+09   	241
+c00cf6b7	29491200       	7.077888e+09   	2.745578e+03   	3.064191e+02   	6.616844e+05   	1.839335e+09   	241
+78a2cc08	29491200       	7.077888e+09   	2.745578e+03   	3.064191e+02   	6.616844e+05   	1.839335e+09   	241
 24c84a50	11059200       	1.769472e+09   	6.863945e+02   	7.660478e+01   	1.654211e+05   	1.149584e+08   	241
 0b0b0ce8	3686400        	2.621440e+08   	1.582927e+02   	3.333442e+01   	3.434951e+04   	5.678402e+06   	217
 4220e23d	14745600       	2.097152e+09   	8.206871e+02   	1.017181e+02   	1.148962e+05   	9.574235e+07   	140
@@ -64,7 +67,7 @@ nan            	nan            	nan
 #####
 # Model for cuda3_impl0 (Comb1)
 # number of entries
-5
+8
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -73,6 +76,9 @@ nan            	nan            	nan
 0
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 492beed5	33177600       	7.077888e+09   	2.686428e+03   	2.002215e+02   	6.716071e+05   	1.814247e+09   	250
+9c6670ef	29491200       	7.077888e+09   	2.686428e+03   	2.002215e+02   	6.716071e+05   	1.814247e+09   	250
+c00cf6b7	29491200       	7.077888e+09   	2.686428e+03   	2.002215e+02   	6.716071e+05   	1.814247e+09   	250
+78a2cc08	29491200       	7.077888e+09   	2.686428e+03   	2.002215e+02   	6.716071e+05   	1.814247e+09   	250
 24c84a50	11059200       	1.769472e+09   	6.716070e+02   	5.005537e+01   	1.679018e+05   	1.133904e+08   	250
 0b0b0ce8	3686400        	2.621440e+08   	1.630480e+02   	3.438768e+01   	3.097912e+04   	5.275762e+06   	190
 4220e23d	14745600       	2.097152e+09   	8.448030e+02   	7.773742e+01   	2.433033e+05   	2.072837e+08   	288
@@ -100,7 +106,7 @@ nan            	nan            	nan
 #####
 # Model for cuda1_impl0 (Comb0)
 # number of entries
-5
+8
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -109,6 +115,9 @@ nan            	nan            	nan
 0
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 492beed5	33177600       	7.077888e+09   	2.791098e+03   	3.147711e+02   	6.503258e+05   	1.838209e+09   	233
+9c6670ef	29491200       	7.077888e+09   	2.791098e+03   	3.147711e+02   	6.503258e+05   	1.838209e+09   	233
+c00cf6b7	29491200       	7.077888e+09   	2.791098e+03   	3.147711e+02   	6.503258e+05   	1.838209e+09   	233
+78a2cc08	29491200       	7.077888e+09   	2.791098e+03   	3.147711e+02   	6.503258e+05   	1.838209e+09   	233
 24c84a50	11059200       	1.769472e+09   	6.977745e+02   	7.869277e+01   	1.625815e+05   	1.148881e+08   	233
 0b0b0ce8	3686400        	2.621440e+08   	1.624855e+02   	3.298013e+01   	2.940987e+04   	4.975550e+06   	181
 4220e23d	14745600       	2.097152e+09   	8.152506e+02   	1.017614e+02   	1.173961e+05   	9.719839e+07   	144
@@ -136,7 +145,7 @@ nan            	nan            	nan
 #####
 # Model for cuda2_impl0 (Comb3)
 # number of entries
-5
+8
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -145,6 +154,9 @@ nan            	nan            	nan
 0
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 492beed5	33177600       	7.077888e+09   	2.754203e+03   	2.682327e+02   	6.830422e+05   	1.899080e+09   	248
+9c6670ef	29491200       	7.077888e+09   	2.754203e+03   	2.682327e+02   	6.830422e+05   	1.899080e+09   	248
+c00cf6b7	29491200       	7.077888e+09   	2.754203e+03   	2.682327e+02   	6.830422e+05   	1.899080e+09   	248
+78a2cc08	29491200       	7.077888e+09   	2.754203e+03   	2.682327e+02   	6.830422e+05   	1.899080e+09   	248
 24c84a50	11059200       	1.769472e+09   	6.885507e+02   	6.705818e+01   	1.707605e+05   	1.186925e+08   	248
 0b0b0ce8	3686400        	2.621440e+08   	1.622246e+02   	3.553894e+01   	3.714942e+04   	6.315779e+06   	229
 4220e23d	14745600       	2.097152e+09   	8.611626e+02   	9.290485e+01   	2.411255e+05   	2.100651e+08   	280
@@ -172,7 +184,7 @@ nan            	nan            	nan
 #####
 # Model for cpu0_impl0 (Comb4)
 # number of entries
-5
+8
 # sumlnx	sumlnx2		sumlny		sumlnxlny	alpha		beta		n	minx		maxx
 0.000000e+00   	0.000000e+00   	0.000000e+00   	0.000000e+00   	nan            	nan            	0	0              	0              
 # a		b		c
@@ -181,6 +193,9 @@ nan            	nan            	nan
 0
 # hash		size		flops		mean (us)	dev (us)	sum		sum2		n
 492beed5	33177600       	7.077888e+09   	1.712078e+05   	4.163047e+04   	2.773567e+07   	5.029326e+12   	162
+9c6670ef	29491200       	7.077888e+09   	1.712078e+05   	4.163047e+04   	2.773567e+07   	5.029326e+12   	162
+c00cf6b7	29491200       	7.077888e+09   	1.712078e+05   	4.163047e+04   	2.773567e+07   	5.029326e+12   	162
+78a2cc08	29491200       	7.077888e+09   	1.712078e+05   	4.163047e+04   	2.773567e+07   	5.029326e+12   	162
 24c84a50	11059200       	1.769472e+09   	4.280195e+04   	1.040762e+04   	6.933918e+06   	3.143329e+11   	162
 0b0b0ce8	3686400        	2.621440e+08   	6.441655e+03   	1.152866e+03   	3.220827e+05   	2.141201e+09   	50
 4220e23d	14745600       	2.097152e+09   	4.927734e+04   	1.166029e+04   	5.913281e+06   	3.077063e+11   	120