black_scholes.c 6.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2020 Université de Bordeaux, CNRS (LaBRI UMR 5800), Inria
  4. * Copyright (C) 2019 Mael Keryell
  5. *
  6. * StarPU is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU Lesser General Public License as published by
  8. * the Free Software Foundation; either version 2.1 of the License, or (at
  9. * your option) any later version.
  10. *
  11. * StarPU is distributed in the hope that it will be useful, but
  12. * WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  14. *
  15. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  16. */
  #include <errno.h>
  #include <limits.h>
  #include <math.h>
  #include <stdio.h>
  #include <stdlib.h>
  #include <time.h>

  #include <starpu.h>

  #include "../includes/sorting.h"
  22. void cpu_black_scholes(void **, void *);
  23. void gpu_black_scholes(void **, void *);
  24. static struct starpu_codelet cl =
  25. {
  26. .cpu_funcs = {cpu_black_scholes},
  27. .cuda_funcs = {gpu_black_scholes},
  28. .nbuffers = 7,
  29. .modes = {STARPU_R, STARPU_R, STARPU_R, STARPU_R, STARPU_R, STARPU_W, STARPU_W}
  30. };
  31. void black_scholes_with_starpu(double *S, double *K, double *R, double *T, double *sig, double *call_res, double *put_res, unsigned nbr_data, unsigned nslices)
  32. {
  33. starpu_data_handle_t S_handle, K_handle, R_handle, T_handle, SIG_handle, CRES_handle, PRES_handle;
  34. starpu_vector_data_register(&S_handle, STARPU_MAIN_RAM, (uintptr_t)S, nbr_data, sizeof(double));
  35. starpu_vector_data_register(&K_handle, STARPU_MAIN_RAM, (uintptr_t)K, nbr_data, sizeof(double));
  36. starpu_vector_data_register(&R_handle, STARPU_MAIN_RAM, (uintptr_t)R, nbr_data, sizeof(double));
  37. starpu_vector_data_register(&T_handle, STARPU_MAIN_RAM, (uintptr_t)T, nbr_data, sizeof(double));
  38. starpu_vector_data_register(&SIG_handle, STARPU_MAIN_RAM, (uintptr_t)sig, nbr_data, sizeof(double));
  39. starpu_vector_data_register(&CRES_handle, STARPU_MAIN_RAM, (uintptr_t)call_res, nbr_data, sizeof(double));
  40. starpu_vector_data_register(&PRES_handle, STARPU_MAIN_RAM, (uintptr_t)put_res, nbr_data, sizeof(double));
  41. struct starpu_data_filter f =
  42. {
  43. .filter_func = starpu_vector_filter_block,
  44. .nchildren = nslices
  45. };
  46. /* printf("%f %f\n", nslices, nbr_data); */
  47. starpu_data_partition(S_handle, &f);
  48. starpu_data_partition(K_handle, &f);
  49. starpu_data_partition(R_handle, &f);
  50. starpu_data_partition(T_handle, &f);
  51. starpu_data_partition(SIG_handle, &f);
  52. starpu_data_partition(CRES_handle, &f);
  53. starpu_data_partition(PRES_handle, &f);
  54. unsigned taskid;
  55. for (taskid = 0; taskid < nslices; taskid++){
  56. struct starpu_task *task = starpu_task_create();
  57. task->cl = &cl;
  58. task->handles[0] = starpu_data_get_sub_data(S_handle, 1, taskid);
  59. task->handles[1] = starpu_data_get_sub_data(K_handle, 1, taskid);
  60. task->handles[2] = starpu_data_get_sub_data(R_handle, 1, taskid);
  61. task->handles[3] = starpu_data_get_sub_data(T_handle, 1, taskid);
  62. task->handles[4] = starpu_data_get_sub_data(SIG_handle, 1, taskid);
  63. task->handles[5] = starpu_data_get_sub_data(CRES_handle, 1, taskid);
  64. task->handles[6] = starpu_data_get_sub_data(PRES_handle, 1, taskid);
  65. starpu_task_submit(task);
  66. }
  67. starpu_task_wait_for_all();
  68. starpu_data_unpartition(S_handle, STARPU_MAIN_RAM);
  69. starpu_data_unpartition(K_handle, STARPU_MAIN_RAM);
  70. starpu_data_unpartition(R_handle, STARPU_MAIN_RAM);
  71. starpu_data_unpartition(T_handle, STARPU_MAIN_RAM);
  72. starpu_data_unpartition(SIG_handle, STARPU_MAIN_RAM);
  73. starpu_data_unpartition(CRES_handle, STARPU_MAIN_RAM);
  74. starpu_data_unpartition(PRES_handle, STARPU_MAIN_RAM);
  75. starpu_data_unregister(S_handle);
  76. starpu_data_unregister(K_handle);
  77. starpu_data_unregister(R_handle);
  78. starpu_data_unregister(T_handle);
  79. starpu_data_unregister(SIG_handle);
  80. starpu_data_unregister(CRES_handle);
  81. starpu_data_unregister(PRES_handle);
  82. }
  /*
   * Fill S[0..nbr_data-1] with pseudo-random values in [0, 100],
   * consuming one rand() draw per element, in index order.
   */
  static void init_S(double *S, unsigned nbr_data)
  {
      for (unsigned idx = 0; idx != nbr_data; ++idx) {
          const int draw = rand();

          S[idx] = 100. * draw / (double) RAND_MAX;
      }
  }
  /*
   * Fill K[0..nbr_data-1] with pseudo-random values in [0, 100],
   * consuming one rand() draw per element, in index order.
   */
  static void init_K(double *K, unsigned nbr_data)
  {
      unsigned pos = 0;

      while (pos < nbr_data) {
          const double draw = rand();

          K[pos] = 100. * draw / (double) RAND_MAX;
          pos++;
      }
  }
  /*
   * Fill R[0..nbr_data-1] with pseudo-random values in [0, 1],
   * consuming one rand() draw per element, in index order.
   */
  static void init_R(double *R, unsigned nbr_data)
  {
      const double rand_max = (double) RAND_MAX;

      for (unsigned idx = 0; idx < nbr_data; idx++) {
          const int draw = rand();

          R[idx] = draw / rand_max;
      }
  }
  /*
   * Fill T[0..nbr_data-1] with pseudo-random values in [0, 10],
   * consuming one rand() draw per element, in index order.
   */
  static void init_T(double *T, unsigned nbr_data)
  {
      unsigned filled;

      for (filled = 0; filled < nbr_data; ++filled) {
          const int draw = rand();

          T[filled] = 10. * draw / (double) RAND_MAX;
      }
  }
  /*
   * Fill sig[0..nbr_data-1] with pseudo-random values in [0, 10],
   * consuming one rand() draw per element, in index order.
   */
  static void init_sig(double *sig, unsigned nbr_data)
  {
      unsigned pos = 0;

      while (pos != nbr_data) {
          const int draw = rand();

          sig[pos] = 10. * draw / (double) RAND_MAX;
          ++pos;
      }
  }
  /*
   * Measure black_scholes_with_starpu() nbr_tests times and return the median
   * duration.
   *
   * Before every run the five input vectors are refilled with fresh random
   * values; only the call to black_scholes_with_starpu() is timed. The
   * difference of two starpu_timing_now() readings is divided by 1e6
   * (presumably converting microseconds to seconds -- see the StarPU
   * documentation of starpu_timing_now).
   *
   * nbr_data   number of elements in each vector
   * nslices    number of blocks each vector is split into
   * nbr_tests  number of timed repetitions
   *
   * Returns the element at index nbr_tests/2 of the sorted measurements, or
   * -1.0 (after printing a message on stderr) when nbr_tests is 0 or when a
   * buffer cannot be allocated.
   */
  double median_time(unsigned nbr_data, unsigned nslices, unsigned nbr_tests)
  {
      double median = -1.0;
      double *exec_times = NULL;
      double *S = NULL;
      double *K = NULL;
      double *R = NULL;
      double *T = NULL;
      double *sig = NULL;
      double *call_res = NULL;
      double *put_res = NULL;
      unsigned i;

      if (nbr_tests == 0) {
          /* No sample to take a median of; also keeps nbr_tests - 1 from wrapping. */
          fprintf(stderr, "median_time: nbr_tests must be at least 1\n");
          return median;
      }

      /* Heap storage: the number of tests comes from the command line. */
      exec_times = calloc(nbr_tests, sizeof *exec_times);
      S = calloc(nbr_data, sizeof *S);
      K = calloc(nbr_data, sizeof *K);
      R = calloc(nbr_data, sizeof *R);
      T = calloc(nbr_data, sizeof *T);
      sig = calloc(nbr_data, sizeof *sig);
      call_res = calloc(nbr_data, sizeof *call_res);
      put_res = calloc(nbr_data, sizeof *put_res);

      /* A NULL result is legitimate for a zero-sized request. */
      if (!exec_times
          || (nbr_data != 0 && (!S || !K || !R || !T || !sig || !call_res || !put_res))) {
          fprintf(stderr, "median_time: out of memory\n");
          goto out;
      }

      for (i = 0; i < nbr_tests; i++) {
          double start, stop;

          init_S(S, nbr_data);
          init_K(K, nbr_data);
          init_R(R, nbr_data);
          init_T(T, nbr_data);
          init_sig(sig, nbr_data);

          start = starpu_timing_now();
          black_scholes_with_starpu(S, K, R, T, sig, call_res, put_res, nbr_data, nslices);
          stop = starpu_timing_now();

          exec_times[i] = (stop - start) / 1.e6;
      }

      quicksort(exec_times, 0, nbr_tests - 1);
      median = exec_times[nbr_tests / 2];

  out:
      free(S);
      free(K);
      free(R);
      free(T);
      free(sig);
      free(call_res);
      free(put_res);
      free(exec_times);
      return median;
  }
  /*
   * Benchmark a range of problem sizes and record the median times.
   *
   * For nbr_data = start_nbr, start_nbr + step_nbr, ... up to and including
   * stop_nbr, the median time returned by median_time() is printed on stdout
   * together with nbr_data, and appended as one line to
   * "DAT/black_scholes_c_times.dat" (the file is truncated first).
   *
   * start_nbr, step_nbr, stop_nbr  first size, increment, last size allowed
   * nslices                        forwarded to median_time()
   * nbr_tests                      forwarded to median_time()
   *
   * Errors (step_nbr == 0, output file cannot be opened or closed) are
   * reported on stderr; in the first two cases nothing is measured.
   */
  void display_times(unsigned start_nbr, unsigned step_nbr, unsigned stop_nbr, unsigned nslices, unsigned nbr_tests)
  {
      static const char out_path[] = "DAT/black_scholes_c_times.dat";
      FILE *myfile;
      unsigned nbr_data;

      if (step_nbr == 0) {
          /* A zero increment would never reach stop_nbr. */
          fprintf(stderr, "display_times: step_nbr must be at least 1\n");
          return;
      }

      myfile = fopen(out_path, "w");
      if (myfile == NULL) {
          perror(out_path);
          return;
      }

      for (nbr_data = start_nbr; nbr_data <= stop_nbr; nbr_data += step_nbr) {
          double t = median_time(nbr_data, nslices, nbr_tests);

          printf("nbr_data:\n%u\nTime:\n%f\n", nbr_data, t);
          fprintf(myfile, "%f\n", t);

          /*
           * Stop here when the next size would exceed stop_nbr; this also
           * prevents the unsigned addition from wrapping around.
           */
          if (step_nbr > stop_nbr - nbr_data) {
              break;
          }
      }

      /* fclose flushes buffered output, so a failure here means lost data. */
      if (fclose(myfile) != 0) {
          perror(out_path);
      }
  }
  /*
   * Parse text as a non-negative decimal integer that fits in an unsigned.
   *
   * The string must start with a digit and consist of digits only, so signs,
   * leading blanks and trailing garbage are all rejected.
   *
   * Returns 0 and stores the result in *value on success, -1 otherwise
   * (*value is then left untouched).
   */
  static int parse_unsigned_arg(const char *text, unsigned *value)
  {
      char *end = NULL;
      unsigned long parsed;

      /* strtoul would accept "-1" and silently wrap it around. */
      if (text[0] < '0' || text[0] > '9') {
          return -1;
      }

      errno = 0;
      parsed = strtoul(text, &end, 10);
      if (errno == ERANGE || *end != '\0' || parsed > UINT_MAX) {
          return -1;
      }

      *value = (unsigned) parsed;
      return 0;
  }

  /*
   * Entry point: start_nbr step_nbr stop_nbr nslices nbr_tests.
   *
   * Validates the five arguments, initialises StarPU, seeds rand() from the
   * current time, runs display_times() and shuts StarPU down.
   *
   * Returns 0 on success, 1 on a usage error and 77 when StarPU cannot be
   * initialised.
   */
  int main(int argc, char *argv[])
  {
      unsigned start_nbr, step_nbr, stop_nbr, nslices, nbr_tests;

      if (argc != 6) {
          fprintf(stderr, "Usage: %s start_nbr step_nbr stop_nbr nslices nbr_tests\n", argv[0]);
          return 1;
      }

      /* Validate before touching StarPU so that bad input needs no shutdown. */
      if (parse_unsigned_arg(argv[1], &start_nbr) != 0
          || parse_unsigned_arg(argv[2], &step_nbr) != 0
          || parse_unsigned_arg(argv[3], &stop_nbr) != 0
          || parse_unsigned_arg(argv[4], &nslices) != 0
          || parse_unsigned_arg(argv[5], &nbr_tests) != 0) {
          fprintf(stderr, "%s: every argument must be a non-negative decimal integer\n", argv[0]);
          return 1;
      }

      if (step_nbr == 0 || nslices == 0 || nbr_tests == 0) {
          fprintf(stderr, "%s: step_nbr, nslices and nbr_tests must be at least 1\n", argv[0]);
          return 1;
      }

      if (starpu_init(NULL) != 0) {
          fprintf(stderr, "ERROR\n");
          return 77;
      }

      srand((unsigned) time(NULL));

      display_times(start_nbr, step_nbr, stop_nbr, nslices, nbr_tests);

      starpu_shutdown();
      return 0;
  }