Browse Source

update the number of fft tasks per worker

Samuel Thibault 15 years ago
parent
commit
714846e008
2 changed files with 16 additions and 0 deletions
  1. 8 0
      examples/starpufft/starpufftx1d.c
  2. 8 0
      examples/starpufft/starpufftx2d.c

+ 8 - 0
examples/starpufft/starpufftx1d.c

@@ -94,6 +94,8 @@ STARPUFFT(fft1_1d_kernel_gpu)(void *descr[], void *_args)
 
 	int workerid = starpu_worker_get_id();
 
+	task_per_worker[workerid]++;
+
 	cudaStream_t stream;
 
 	if (!plan->plans[workerid].initialized1) {
@@ -134,6 +136,8 @@ STARPUFFT(fft2_1d_kernel_gpu)(void *descr[], void *_args)
 
 	int workerid = starpu_worker_get_id();
 
+	task_per_worker[workerid]++;
+
 	if (!plan->plans[workerid].initialized2) {
 		cures = cufftPlan1d(&plan->plans[workerid].plan2_cuda, n1, _CUFFT_C2C, n3);
 
@@ -189,6 +193,8 @@ STARPUFFT(fft1_1d_kernel_cpu)(void *descr[], void *_args)
 	int n2 = plan->n2[0];
 	int workerid = starpu_worker_get_id();
 
+	task_per_worker[workerid]++;
+
 	const STARPUFFT(complex) * restrict twisted1 = (STARPUFFT(complex) *)STARPU_GET_VECTOR_PTR(descr[0]);
 	STARPUFFT(complex) * restrict fft1 = (STARPUFFT(complex) *)STARPU_GET_VECTOR_PTR(descr[1]);
 
@@ -245,6 +251,8 @@ STARPUFFT(fft2_1d_kernel_cpu)(void *descr[], void *_args)
 	//int jj = args->jj;
 	int workerid = starpu_worker_get_id();
 
+	task_per_worker[workerid]++;
+
 	const STARPUFFT(complex) * restrict twisted2 = (STARPUFFT(complex) *)STARPU_GET_VECTOR_PTR(descr[0]);
 	STARPUFFT(complex) * restrict fft2 = (STARPUFFT(complex) *)STARPU_GET_VECTOR_PTR(descr[1]);
 

+ 8 - 0
examples/starpufft/starpufftx2d.c

@@ -64,6 +64,8 @@ STARPUFFT(fft1_2d_kernel_gpu)(void *descr[], void *_args)
 
 	int workerid = starpu_worker_get_id();
 
+	task_per_worker[workerid]++;
+
 	cudaStream_t stream;
 
 	if (!plan->plans[workerid].initialized1) {
@@ -106,6 +108,8 @@ STARPUFFT(fft2_2d_kernel_gpu)(void *descr[], void *_args)
 
 	int workerid = starpu_worker_get_id();
 
+	task_per_worker[workerid]++;
+
 	if (!plan->plans[workerid].initialized2) {
 		cures = cufftPlan2d(&plan->plans[workerid].plan2_cuda, n1, m1, _CUFFT_C2C);
 
@@ -164,6 +168,8 @@ STARPUFFT(fft1_2d_kernel_cpu)(void *descr[], void *_args)
 	int m2 = plan->n2[1];
 	int workerid = starpu_worker_get_id();
 
+	task_per_worker[workerid]++;
+
 	const STARPUFFT(complex) *twisted1 = (STARPUFFT(complex) *)STARPU_GET_VECTOR_PTR(descr[0]);
 	STARPUFFT(complex) *fft1 = (STARPUFFT(complex) *)STARPU_GET_VECTOR_PTR(descr[1]);
 
@@ -223,6 +229,8 @@ STARPUFFT(fft2_2d_kernel_cpu)(void *descr[], void *_args)
 	//int ll = args->ll;
 	int workerid = starpu_worker_get_id();
 
+	task_per_worker[workerid]++;
+
 	const STARPUFFT(complex) *twisted2 = (STARPUFFT(complex) *)STARPU_GET_VECTOR_PTR(descr[0]);
 	STARPUFFT(complex) *fft2 = (STARPUFFT(complex) *)STARPU_GET_VECTOR_PTR(descr[1]);