common_node.c 48 KB

(viewer line-number gutter: lines 1-1181)
  1. #include "common_node.h"
  // File-scope state used by common_node_actions(). Names marked extern are
  // only declared here; their definitions are not visible in this part of the
  // file. Names without extern are defined here.
  2. //extern int *pid_num;
  // node_id selects this node's log file and grid position. my_idag is reset
  // to -1 by common_node_actions(), which then polls until it changes.
  3. extern int num_idags, node_id ,my_idag;//, fd_log;
  // Per-node log stream, assigned from create_log_file(node_id, scen_num).
  4. extern FILE *log_file;
  // state drives the big if/else-if dispatch loop in common_node_actions().
  5. extern core_states state;
  // State to switch to once the current activity completes; it is copied into
  // state and then reset to NO_PENDING_STATE when consumed.
  6. core_states pending_state=NO_PENDING_STATE;
  // Per-core singly linked queues of pending interactions, indexed by the
  // target core id. New entries are appended at the tail; a signal is sent
  // with scc_kill() only when the new entry is the sole element of its queue.
  7. extern inter_list **core_inter_head,**core_inter_tail;
  // init_app is the application being placed while this node is init manager;
  // it is copied into my_app when this node itself is chosen as the agent.
  8. extern app my_app;
  9. extern app init_app;
  10. extern app far_req_app;
  // Statistics counters (msg_count, message_size, distance, app_turnaround,
  // comp_effort, cores_utilized, times_accessed); all are zeroed on entry to
  // common_node_actions().
  11. extern metrics my_stats;
  12. extern int far_req_or_sender;
  13. extern int *idag_mask, *idag_id_arr;
  14. extern int *Cl_x_max_arr, *Cl_y_max_arr;
  // DDS_count/my_cores_count are reset to 0 and DDS/my_cores to NULL on entry
  // to common_node_actions().
  15. extern int DDS_count, my_cores_count;
  16. extern DDS_list *DDS, *DDS_tail;
  // Cores belonging to the application this node is agent for; the node's own
  // id is inserted first, then the other offered cores are appended.
  17. extern core_list *my_cores, *my_cores_tail;
  // init_man_offers: offers received while acting as init manager. The list is
  // freed node by node once every offer has been answered.
  18. extern offer_list *init_man_offers, *selfopt_man_offers;
  19. extern offer_list *far_man_offers, *far_man_offers_tail;
  20. extern int far_list_count, far_man_agent_count;
  // my_agent is compared against -1 and reset to -1 when this node becomes an
  // agent itself. time_worked is subtracted from upper_work_bound to report
  // the remaining work time to the previous agent.
  21. extern int my_agent, time_worked;
  22. extern int debug_global;
  // Scratch values refreshed with time()/localtime() before each timestamped
  // log line.
  23. extern time_t cur_time;
  24. extern struct tm *cur_t;
  // POSIX timer plumbing: sev and timerid are passed to timer_create(), its is
  // the value handed to timer_settime(), chk_timer receives timer_gettime().
  25. extern struct sigevent sev;
  26. extern struct itimerspec its, chk_timer;
  27. extern timer_t timerid;
  // NOTE(review): this is assigned both chk_timer.it_value.tv_nsec values and
  // the unscaled selfopt_interval (which is multiplied by MS before going into
  // its.it_value.tv_nsec) -- the units look inconsistent; confirm.
  28. extern long int selfopt_time_rem;//-1 means it is not set
  29. extern long int upper_work_bound;
  30. extern int time_for_farman;
  // Shadowed inside common_node_actions() by its parameter of the same name.
  31. extern char scen_num[4];
  32. extern int chk_rem_count, chk_rem_num, sum_rem_time;
  33. extern float old_Speedup, my_Speedup;
  34. extern int nodes_ended_cnt;//, app_terminated;
  // my_x/my_y are computed as node_id % X_max and node_id / X_max.
  35. int my_x, my_y, init_areas_num;
  // Counters reset at the start of each INIT_MANAGER_SEND_OFFERS round
  // (init_idags_areas_replies, init_DDS_idags, init_DDS_replies).
  // selfopt_interval is multiplied by MS to form the timer's tv_nsec value.
  // max_cores_count is filled from get_max_cores_count(my_app).
  36. int init_DDS_replies, selfopt_DDS_replies, init_DDS_idags, selfopt_DDS_idags, selfopt_interval=200, init_idags_areas_replies, max_cores_count;
  // Target lists; init_targets_head is emptied (nodes freed) at the start of
  // each INIT_MANAGER_SEND_OFFERS round.
  37. target_list *init_targets_head=NULL, *init_targets_tail;
  38. target_list *selfopt_targets_head=NULL, *selfopt_targets_tail;
  // Per-application log, opened for writing in AGENT_INIT_STATE at
  // /shared/herc/scenaria/<scen_num>/app_logs/<my_app.id>.txt.
  39. FILE *app_log_file;
  // Set to RUNNING in AGENT_INIT_STATE and tested against APP_TERMINATED.
  40. application_states app_state;
  // Hour/min/sec stamps. Index 0 is logged as "Came into init_agent at" and
  // index 1 as "New agent found at". init_app_times is copied into
  // my_app_times and then cleared when this node becomes the agent.
  41. my_time_stamp init_app_times[2], my_app_times[2];
  42. extern int *sig_array, *data_array, NUES;
  // flag_signals_enabled is set via RCCE_flag_write() for this node once
  // initialisation is complete.
  43. extern RCCE_FLAG flag_signals_enabled,flag_data_written;
  44. void common_node_actions(char scen_num[4]){
  45. offer_list *tmp_offer_list;
  46. int one_core, i, old_cores_cnt;
  47. core_list *tmp_cores_list;
  48. target_list *tmp_target_list;
  49. inter_list *tmp_inter_list, *tmp_inter_prev;
  50. FILE *init_areas_file;//, *selfopt_areas_file;
  51. char init_areas_file_name[64], app_log_file_name[64];//selfopt_areas_file_name[32],
  52. int C,r,init_areas_cnt, init_areas_sent;//area_cnt,selfopt_areas=0,
  53. int time_per_node, time_left, time_to_work, init_core_found=0;
  54. int new_agent, min_dist=-1, tmp_int, j;
  55. //int new_x, new_y;//, selfopt_areas_sent;
  56. int selfopt_r;
  57. DDS_count=0;
  58. my_cores_count=0;
  59. my_stats.msg_count=0;
  60. my_stats.message_size=0;
  61. my_stats.distance=0;
  62. my_stats.app_turnaround=0;
  63. my_stats.comp_effort=0;
  64. my_stats.cores_utilized=0;
  65. my_stats.times_accessed=0;
  66. init_app_times[0].tm_sec = 0;
  67. init_app_times[0].tm_min = 0;
  68. init_app_times[0].tm_hour = 0;
  69. init_app_times[1].tm_sec = 0;
  70. init_app_times[1].tm_min = 0;
  71. init_app_times[1].tm_hour = 0;
  72. my_app_times[0].tm_sec = 0;
  73. my_app_times[0].tm_min = 0;
  74. my_app_times[0].tm_hour = 0;
  75. my_app_times[1].tm_sec = 0;
  76. my_app_times[1].tm_min = 0;
  77. my_app_times[1].tm_hour = 0;
  78. //printf("I Am %d\n",node_id);
  79. DDS=NULL;
  80. my_cores=NULL;
  81. selfopt_r = (int) (1.5 * (X_max / num_idags_x));
  82. install_signal_handlers();
  83. //sig_SEGV_enable();
  84. sev.sigev_notify = SIGEV_SIGNAL;
  85. sev.sigev_signo = SIG_TIMER;
  86. sev.sigev_value.sival_ptr = &timerid;
  87. if (timer_create(CLOCK_REALTIME, &sev, &timerid) == -1) printf("timer_create error\n");
  88. its.it_value.tv_sec = 0;
  89. its.it_interval.tv_sec = 0;//its.it_value.tv_sec;
  90. its.it_interval.tv_nsec = 0;
  91. log_file = create_log_file(node_id,scen_num);
  92. cur_time = time(NULL);
  93. cur_t = localtime(&cur_time);
  94. fprintf(log_file, "[%d:%d:%d]: Initialisation complete\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  95. fflush(log_file);
  96. RCCE_barrier(&RCCE_COMM_WORLD);
  97. my_x = node_id % X_max;
  98. my_y = node_id / X_max;
  99. state = IDLE_CORE;
  100. RCCE_flag_write(&flag_signals_enabled, RCCE_FLAG_SET, node_id);
  101. my_idag = -1;
  102. int dummy=0;
  103. while (my_idag==-1) {//pause();
  104. for (i=0; i<1000; i++)
  105. for(j=0; j<1000; j++)
  106. dummy++;
  107. scc_signals_check();
  108. }
  109. while (state != TERMINATED)
  110. if (state == IDLE_CORE) {
  111. pending_state = NO_PENDING_STATE;
  112. //pause();
  113. dummy=0;
  114. for (i=0; i<1000; i++)
  115. for(j=0; j<1000; j++)
  116. dummy++;
  117. scc_signals_check();
  118. } else if (state == IDLE_INIT_MAN) {// || state == IDLE_FAR_MAN || state == IDLE_INIT_MAN_SELFOPT_PENDING || state == IDLE_INIT_MAN_WORK_PENDING) {
  119. //pause();
  120. dummy=0;
  121. for (i=0; i<1000; i++)
  122. for(j=0; j<1000; j++)
  123. dummy++;
  124. scc_signals_check();
  125. } else if (state == IDLE_AGENT) {
  126. if (app_state != APP_TERMINATED) {
  127. //pause();//!app_terminated
  128. dummy=0;
  129. for (i=0; i<1000; i++)
  130. for(j=0; j<1000; j++)
  131. dummy++;
  132. scc_signals_check();
  133. } else {
  134. if (timer_gettime(timerid, &chk_timer) == -1) printf("timer_gettime error 2\n");
  135. else selfopt_time_rem = chk_timer.it_value.tv_nsec;
  136. if (selfopt_time_rem > 0) {
  137. its.it_value.tv_nsec = 0;
  138. if (timer_settime(timerid, 0, &its, NULL) == -1) printf("timer_settime error42\n");
  139. }
  140. state = AGENT_ENDING;
  141. }
  142. } else if (state == AGENT_REWIND_FILE) {
  143. printf("I am %d and i have to rewind my selfopt_areas_file for app with id %d\n",node_id,init_app.id);
  144. fprintf(log_file,"I have to rewind my selfopt_areas_file for app with id %d\n",init_app.id);
  145. selfopt_interval = 200;
  146. its.it_value.tv_nsec = selfopt_interval * MS;
  147. selfopt_time_rem = selfopt_interval;
  148. if (timer_settime(timerid, 0, &its, NULL) == -1) perror("timer_settime error823\n");
  149. state = IDLE_AGENT;
  150. } else if (state == IDLE_AGENT_WAITING_OFF) {
  151. //pause();
  152. if (app_state != APP_TERMINATED) {
  153. //pause();//!app_terminated
  154. dummy=0;
  155. for (i=0; i<1000; i++)
  156. for(j=0; j<1000; j++)
  157. dummy++;
  158. scc_signals_check();
  159. } else {
  160. signals_disable();
  161. if (timer_gettime(timerid, &chk_timer) == -1) printf("timer_gettime error 2\n");
  162. else selfopt_time_rem = chk_timer.it_value.tv_nsec;
  163. //den stamataw edw thn diadikasia tou selfopt gia na mhn meinoun oi mexri twra prosfores kai oxi mono anapanthtes
  164. if (selfopt_time_rem == 0) state = AGENT_SELF_CHK_OFFERS;
  165. signals_enable();
  166. }
  167. } else if (state == INIT_MANAGER) {
  168. signals_disable();
  169. printf("Initialising app node_id = %d\n",node_id);
  170. cur_time = time(NULL);
  171. cur_t = localtime(&cur_time);
  172. fprintf(log_file, "[%d:%d:%d]: Initialising app\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  173. fflush(log_file);
  174. strcpy(init_areas_file_name,"/shared/herc/scenaria/");
  175. strcat(init_areas_file_name,scen_num);
  176. strcat(init_areas_file_name,"/");
  177. strcat(init_areas_file_name, itoa(init_app.id));
  178. strcat(init_areas_file_name, ".txt");
  179. //printf("area file path = %s\n",areas_file_name);
  180. if ((init_areas_file = fopen(init_areas_file_name, "r")) == NULL){
  181. printf("Cannot open input file with file path = %s ",init_areas_file_name);
  182. perror("open init_areas_file_name");
  183. }
  184. init_areas_sent = 0;
  185. fscanf(init_areas_file,"%d",&init_areas_cnt);
  186. state = INIT_MANAGER_SEND_OFFERS;
  187. signals_enable();
  188. scc_signals_check();
  189. } else if (state == INIT_MANAGER_SEND_OFFERS) {// || state == INIT_MANAGER_SEND_OFFERS_SELFOPT_PENDING || state == INIT_MANAGER_SEND_OFFERS_WORK_PENDING) {
  190. signals_disable();
  191. init_idags_areas_replies=0;
  192. init_DDS_idags = 0;
  193. init_DDS_replies = 0;
  194. init_areas_num = 1;
  195. if (init_targets_head != NULL)
  196. while (init_targets_head != NULL){
  197. tmp_target_list = init_targets_head;
  198. init_targets_head = init_targets_head->next;
  199. free(tmp_target_list);
  200. }
  201. if (init_man_offers != NULL)
  202. while (init_man_offers != NULL) {
  203. tmp_offer_list = init_man_offers;
  204. init_man_offers = init_man_offers->next;
  205. free(tmp_offer_list);
  206. }
  207. fprintf(log_file, "near init area (%d,%d)\n",node_id,selfopt_r);
  208. fflush(log_file);
  209. if (core_inter_head[my_idag] == NULL){
  210. core_inter_head[my_idag] = (inter_list *) malloc(sizeof(inter_list));
  211. core_inter_tail[my_idag] = core_inter_head[my_idag];
  212. } else {
  213. core_inter_tail[my_idag]->next = (inter_list *) malloc(sizeof(inter_list));
  214. core_inter_tail[my_idag] = core_inter_tail[my_idag]->next;
  215. }
  216. core_inter_tail[my_idag]->type = IDAG_FIND_IDAGS_PENDING;
  217. core_inter_tail[my_idag]->data.reg.C = node_id;
  218. core_inter_tail[my_idag]->data.reg.r = selfopt_r;
  219. core_inter_tail[my_idag]->next = NULL;
  220. if (core_inter_head[my_idag]->next == NULL) {
  221. //kill(pid_num[my_idag],SIG_IDAG_FIND_IDAGS);
  222. scc_kill(my_idag,SIG_IDAG_FIND_IDAGS);
  223. my_stats.msg_count++;
  224. my_stats.distance += distance(node_id,my_idag);
  225. }
  226. for (i=0; i<init_areas_cnt && i<INIT_FAR_AREAS_NUM; i++) {
  227. fscanf(init_areas_file,"%d",&C);
  228. fscanf(init_areas_file,"%d",&r);
  229. fprintf(log_file, "init area (%d,%d)\n",C,r);
  230. fflush(log_file);
  231. printf("I am %d and i am sending a far offer in region (%d,%d)\n",node_id,C,r);
  232. one_core = C;
  233. if (core_inter_head[one_core] == NULL){
  234. core_inter_head[one_core] = (inter_list *) malloc(sizeof(inter_list));
  235. core_inter_tail[one_core] = core_inter_head[one_core];
  236. } else {
  237. core_inter_tail[one_core]->next = (inter_list *) malloc(sizeof(inter_list));
  238. core_inter_tail[one_core] = core_inter_tail[one_core]->next;
  239. }
  240. core_inter_tail[one_core]->type = FAR_INIT_REQ;
  241. core_inter_tail[one_core]->data.reg.C = C;
  242. core_inter_tail[one_core]->data.reg.r = r;
  243. core_inter_tail[one_core]->next = NULL;
  244. if (core_inter_head[one_core]->next == NULL) {
  245. //kill(pid_num[one_core],SIG_INIT_FAR_REQ);
  246. scc_kill(one_core,SIG_INIT_FAR_REQ);
  247. my_stats.msg_count++;
  248. my_stats.distance += distance(node_id,one_core);
  249. }
  250. //init_areas_num++;
  251. }
  252. init_areas_sent += i;
  253. //fclose(areas);
  254. if (selfopt_time_rem != -1){
  255. if (timer_gettime(timerid, &chk_timer) == -1) printf("timer_gettime error\n");
  256. else selfopt_time_rem = chk_timer.it_value.tv_nsec;
  257. if (selfopt_time_rem > 0) {
  258. its.it_value.tv_nsec = 0;//750000000;// * MS;
  259. if (timer_settime(timerid, 0, &its, NULL) == -1) printf("timer_settime error4123\n");
  260. }
  261. }
  262. state = IDLE_INIT_MAN;
  263. signals_enable();
  264. scc_signals_check();
  265. } else if (state == INIT_MAN_CHK_OFFERS) {// || state == INIT_MAN_CHK_OFFERS_SELFOPT_PENDING || state == INIT_MAN_CHK_OFFERS_WORK_PENDING){
  266. signals_disable();
  267. printf("init check alarm went off node_id=%d init_DDS_idags = %d init_DDS_replies = %d state=%d!\n",node_id,init_DDS_idags,init_DDS_replies,state);
  268. cur_time = time(NULL);
  269. cur_t = localtime(&cur_time);
  270. fprintf(log_file, "[%d:%d:%d]: init check alarm went off init_DDS_idags = %d init_DDS_replies = %d state=%d\n",
  271. cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,init_DDS_idags,init_DDS_replies,state);
  272. fflush(log_file);
  273. init_core_found = 0;
  274. if (init_man_offers == NULL) {
  275. printf("I don't have offers\n");
  276. fprintf(log_file, "I don't have init man offers\n");
  277. fflush(log_file);
  278. printf("I am %d and didn't manage to find my core in this round of search for app with id %d\n",node_id,init_app.id);
  279. //state = IDLE_CORE;
  280. if (init_areas_sent == init_areas_cnt){
  281. printf("I am %d and i have to rewind my init_areas_file for app with id %d\n",node_id,init_app.id);
  282. rewind(init_areas_file);
  283. init_areas_sent = 0;
  284. fscanf(init_areas_file,"%d",&init_areas_cnt);
  285. }
  286. state = INIT_MANAGER_SEND_OFFERS;
  287. } else {
  288. tmp_offer_list = init_man_offers;
  289. while (tmp_offer_list != NULL){
  290. fprintf(log_file,"Offer by %d for %d cores with spd_loss %0.4f :",tmp_offer_list->sender,tmp_offer_list->off.num_of_cores,tmp_offer_list->off.spd_loss);
  291. for (i=0; i<tmp_offer_list->off.num_of_cores; i++)
  292. fprintf(log_file," %d,",tmp_offer_list->off.offered_cores[i]);
  293. fprintf(log_file,"\n");
  294. //printf("Offer by %d for %d cores\n",tmp_offer_list->sender,tmp_offer_list->off.num_of_cores);
  295. tmp_offer_list = tmp_offer_list->next;
  296. }
  297. fflush(log_file);
  298. *init_man_offers->answer = 1;
  299. //decide which will be the agent. Will be the one tha minimizes distance between cores
  300. min_dist = -1;
  301. for (i=0; i<init_man_offers->off.num_of_cores; i++){
  302. tmp_int = 0;
  303. for (j=0; j<init_man_offers->off.num_of_cores; j++){
  304. if (i == j) continue;
  305. tmp_int += distance(init_man_offers->off.offered_cores[i],init_man_offers->off.offered_cores[j]);
  306. }
  307. if (min_dist == -1 || tmp_int < min_dist) {
  308. min_dist = tmp_int;
  309. new_agent = init_man_offers->off.offered_cores[i];
  310. }
  311. }
  312. cur_time = time(NULL);
  313. cur_t = localtime(&cur_time);
  314. init_app_times[1].tm_sec = cur_t->tm_sec;
  315. init_app_times[1].tm_min = cur_t->tm_min;
  316. init_app_times[1].tm_hour = cur_t->tm_hour;
  317. printf("New agent is %d\n",new_agent);
  318. cur_time = time(NULL);
  319. cur_t = localtime(&cur_time);
  320. fprintf(log_file, "[%d:%d:%d]: New agent is %d\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,new_agent);
  321. fflush(log_file);
  322. if (new_agent != node_id) {
  323. if (core_inter_head[new_agent] == NULL){
  324. core_inter_head[new_agent] = (inter_list *) malloc(sizeof(inter_list));
  325. core_inter_tail[new_agent] = core_inter_head[new_agent];
  326. } else {
  327. printf("Starting this app is not high priority. Should we change that?\n");
  328. core_inter_tail[new_agent]->next = (inter_list *) malloc(sizeof(inter_list));
  329. core_inter_tail[new_agent] = core_inter_tail[new_agent]->next;
  330. }
  331. core_inter_tail[new_agent]->type = INIT_AGENT;
  332. core_inter_tail[new_agent]->data.app_cores = (int *)malloc((init_man_offers->off.num_of_cores+1)*sizeof(int));
  333. core_inter_tail[new_agent]->data.app_cores[0] = init_man_offers->off.num_of_cores;
  334. for(i=1; i<=init_man_offers->off.num_of_cores; i++)
  335. core_inter_tail[new_agent]->data.app_cores[i] = init_man_offers->off.offered_cores[i-1];
  336. core_inter_tail[new_agent]->next = NULL;
  337. init_app.num_of_cores = init_man_offers->off.num_of_cores;
  338. if (core_inter_head[new_agent]->next == NULL) {
  339. //kill(pid_num[new_agent], SIG_INIT_AGENT);
  340. scc_kill(new_agent, SIG_INIT_AGENT);
  341. my_stats.msg_count++;
  342. my_stats.distance += distance(node_id,new_agent);
  343. } else printf("I am init manager and i am doing smth else with init agent interaction=%d\n",core_inter_head[new_agent]->type);
  344. } else {
  345. my_app = init_app;
  346. my_cores_count = init_man_offers->off.num_of_cores;
  347. my_app.num_of_cores = my_cores_count;//+1;
  348. if (my_cores == NULL) {
  349. my_cores = (core_list *) malloc(sizeof(core_list));
  350. my_cores_tail = my_cores;
  351. } else {
  352. printf("My cores still not fucking null!!\n");
  353. my_cores_tail->next = (core_list *) malloc(sizeof(core_list));
  354. my_cores_tail = my_cores_tail->next;
  355. }
  356. my_cores_tail->core_id = node_id;
  357. my_cores_tail->offered_to = -1;
  358. my_cores_tail->next = NULL;
  359. if (core_inter_head[my_idag] == NULL){
  360. core_inter_head[my_idag] = (inter_list *) malloc(sizeof(inter_list));
  361. core_inter_tail[my_idag] = core_inter_head[my_idag];
  362. } else {
  363. core_inter_tail[my_idag]->next = (inter_list *) malloc(sizeof(inter_list));
  364. core_inter_tail[my_idag] = core_inter_tail[my_idag]->next;
  365. }
  366. core_inter_tail[my_idag]->type = IDAG_ADD_CORES_DDS;
  367. core_inter_tail[my_idag]->data.app_cores = (int *)malloc((my_cores_count+1)*sizeof(int));
  368. core_inter_tail[my_idag]->data.app_cores[0] = my_cores_count;
  369. core_inter_tail[my_idag]->next = NULL;
  370. //I want myself to be first in my_cores list
  371. for(i=0; i<init_man_offers->off.num_of_cores; i++) {
  372. one_core = init_man_offers->off.offered_cores[i];
  373. //core_inter_tail[my_idag]->data.app_cores[i+1] = one_core;
  374. if (one_core != node_id){
  375. my_cores_tail->next = (core_list *) malloc(sizeof(core_list));
  376. my_cores_tail = my_cores_tail->next;
  377. my_cores_tail->core_id = one_core;
  378. my_cores_tail->offered_to = -1;
  379. my_cores_tail->next = NULL;
  380. }
  381. }
  382. my_app_times[0].tm_sec = init_app_times[0].tm_sec;
  383. my_app_times[0].tm_min = init_app_times[0].tm_min;
  384. my_app_times[0].tm_hour = init_app_times[0].tm_hour;
  385. my_app_times[1].tm_sec = init_app_times[1].tm_sec;
  386. my_app_times[1].tm_min = init_app_times[1].tm_min;
  387. my_app_times[1].tm_hour = init_app_times[1].tm_hour;
  388. init_app_times[0].tm_sec = 0;
  389. init_app_times[0].tm_min = 0;
  390. init_app_times[0].tm_hour = 0;
  391. init_app_times[1].tm_sec = 0;
  392. init_app_times[1].tm_min = 0;
  393. init_app_times[1].tm_hour = 0;
  394. /*kill(pid_num[0], SIG_INIT_APP);
  395. my_stats.msg_count++;
  396. my_stats.distance += distance(node_id,0);*/
  397. printf("I am new agent with id %d and app with A=%.2f, var=%.2f and %d my_cores_count = %d cores: \n"
  398. ,node_id,my_app.A,my_app.var,my_app.num_of_cores,my_cores_count);
  399. my_Speedup = Speedup(my_app, my_app.num_of_cores);
  400. if (core_inter_head[my_idag]->next == NULL) {
  401. //kill(pid_num[my_idag], SIG_ADD_CORES_DDS);
  402. scc_kill(my_idag, SIG_ADD_CORES_DDS);
  403. my_stats.msg_count++;
  404. my_stats.distance += distance(node_id,my_idag);
  405. } else printf("I am %d and i didn't call add!! with interaction %d\n",node_id,core_inter_head[my_idag]->type);
  406. if (my_agent != -1) {
  407. printf("I am %d and i do this agent switch in common node with pending_state=%d\n",node_id,pending_state);
  408. fprintf(log_file,"I do this agent switch in common node with pending_state=%d\n",pending_state);
  409. if (pending_state == WORKING_NODE) {
  410. if (core_inter_head[my_agent] == NULL){
  411. core_inter_head[my_agent] = (inter_list *) malloc(sizeof(inter_list));
  412. core_inter_tail[my_agent] = core_inter_head[my_agent];
  413. } else {
  414. core_inter_tail[my_agent]->next = (inter_list *) malloc(sizeof(inter_list));
  415. core_inter_tail[my_agent] = core_inter_tail[my_agent]->next;
  416. }
  417. core_inter_tail[my_agent]->type = REP_CHK_REM_TIME;
  418. core_inter_tail[my_agent]->data.work_time = upper_work_bound - time_worked;
  419. core_inter_tail[my_agent]->next = NULL;
  420. }
  421. upper_work_bound = 0;
  422. my_agent = -1;
  423. }
  424. state = AGENT_INIT_STATE;
  425. cur_time = time(NULL);
  426. cur_t = localtime(&cur_time);
  427. fprintf(log_file, "[%d:%d:%d]: Init ok!! my_cores_count = %d app_id=%d\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,my_cores_count,my_app.id);
  428. fprintf(log_file, "my cores are:");
  429. for (tmp_cores_list=my_cores; tmp_cores_list!=NULL; tmp_cores_list=tmp_cores_list->next) fprintf(log_file, " %d", tmp_cores_list->core_id);
  430. fprintf(log_file, "\n");
  431. fflush(log_file);
  432. }
  433. tmp_offer_list = init_man_offers->next;
  434. while (tmp_offer_list != NULL){
  435. fflush(log_file);
  436. *tmp_offer_list->answer = 0;
  437. tmp_offer_list = tmp_offer_list->next;
  438. }
  439. while (init_man_offers != NULL){
  440. if (core_inter_head[init_man_offers->sender] != NULL) {
  441. if (core_inter_head[init_man_offers->sender]->type == REP_AGENT_OFFER_PENDING){
  442. core_inter_head[init_man_offers->sender]->type = REP_AGENT_OFFER_SENT;
  443. //kill(pid_num[init_man_offers->sender], SIG_REP_OFFERS);
  444. scc_kill(init_man_offers->sender, SIG_REP_OFFERS);
  445. my_stats.msg_count++;
  446. my_stats.distance += distance(node_id,init_man_offers->sender);
  447. } else if (core_inter_head[init_man_offers->sender]->type == REP_FAR_REQ_OFFER_PENDING){
  448. core_inter_head[init_man_offers->sender]->type = REP_FAR_REQ_OFFER_SENT;
  449. //kill(pid_num[init_man_offers->sender], SIG_REP_OFFERS);
  450. scc_kill(init_man_offers->sender, SIG_REP_OFFERS);
  451. my_stats.msg_count++;
  452. my_stats.distance += distance(node_id,init_man_offers->sender);
  453. } else if (core_inter_head[init_man_offers->sender]->type != REP_FAR_REQ_OFFER_SENT && core_inter_head[init_man_offers->sender]->type != REP_AGENT_OFFER_SENT)
  454. printf("We have aasdfa problem!\n");
  455. } else {
  456. printf("gamietai b = %d",init_man_offers->sender);
  457. fprintf(log_file,"gamietai b = %d",init_man_offers->sender);
  458. fflush(log_file);
  459. }
  460. tmp_offer_list = init_man_offers;
  461. init_man_offers = init_man_offers->next;
  462. free(tmp_offer_list);
  463. }
  464. fclose(init_areas_file);
  465. fprintf(log_file,"selfopt_time_rem = %ld app_state = %d state = %d pending_state = %d\n",selfopt_time_rem,app_state,state,pending_state);
  466. fflush(log_file);
  467. if (selfopt_time_rem != -1 && app_state != APP_TERMINATED){ //a selfopt is pending !app_terminated
  468. selfopt_time_rem -= 500000000;
  469. if (selfopt_time_rem > 0){
  470. its.it_value.tv_nsec = selfopt_time_rem;
  471. if (timer_settime(timerid, 0, &its, NULL) == -1) printf("timer_settime error5\n");
  472. state = IDLE_AGENT;
  473. } else {
  474. selfopt_time_rem = -1;
  475. state = AGENT_SELF_OPT;
  476. }
  477. } else if (state != AGENT_INIT_STATE) {
  478. if (pending_state == IDLE_AGENT) {
  479. printf("I am %d and i entered this realm of whores\n",node_id);
  480. fprintf(log_file,"I finished my init selfopt_interval=%d, selfopt_time_rem=%ld my_cores_count=%d, old_cores_cnt=%d\n"
  481. ,selfopt_interval,selfopt_time_rem,my_cores_count,old_cores_cnt);
  482. fflush(log_file);
  483. fprintf(app_log_file,"I finished my init selfopt_interval=%d, selfopt_time_rem=%ld my_cores_count=%d, old_cores_cnt=%d\n"
  484. ,selfopt_interval,selfopt_time_rem,my_cores_count,old_cores_cnt);
  485. fflush(app_log_file);
  486. if (selfopt_interval > 0) { // && !app_terminated
  487. its.it_value.tv_nsec = selfopt_interval * MS;
  488. selfopt_time_rem = selfopt_interval;
  489. if (old_cores_cnt == 1 || old_cores_cnt == my_cores_count) {
  490. if (my_cores_count == max_cores_count) {
  491. fprintf(app_log_file, "I have maximum cores count. I don't initiate selfopt process in here anyway.\n");
  492. fflush(app_log_file);
  493. selfopt_time_rem = -1;
  494. } else if (time_per_node <= (selfopt_interval / 2) && my_cores_count > 1) {
  495. fprintf(app_log_file, "I have little working time left time_per_node=%d selfopt_interval=%d in here anyway.\n",time_per_node,selfopt_interval);
  496. fflush(app_log_file);
  497. selfopt_time_rem = -1;
  498. } else if (timer_settime(timerid, 0, &its, NULL) == -1) printf("timer_settime error8\n");
  499. }
  500. } else if (my_cores_count == 1) {
  501. printf("I am %d and i have to rewind my selfopt_areas_file after init for app with id %d\n",node_id,init_app.id);
  502. fprintf(log_file,"I have to rewind my selfopt_areas_file after init for app with id %d\n",init_app.id);
  503. selfopt_interval = 200;
  504. its.it_value.tv_nsec = selfopt_interval * MS;
  505. selfopt_time_rem = selfopt_interval;
  506. if (timer_settime(timerid, 0, &its, NULL) == -1) perror("timer_settime error823\n");
  507. } else selfopt_time_rem = -1;
  508. state = IDLE_AGENT;
  509. pending_state = NO_PENDING_STATE;
  510. } else if (pending_state == AGENT_SELF_OPT || pending_state == WORKING_NODE || pending_state == AGENT_REWIND_FILE) {
  511. state = pending_state;//IDLE_AGENT;
  512. pending_state = NO_PENDING_STATE;
  513. } else state = IDLE_CORE;
  514. } else if (app_state != APP_TERMINATED && new_agent != node_id) state = IDLE_AGENT;//!app_terminated
  515. }
  516. signals_enable();
  517. scc_signals_check();
  518. } else if (state == AGENT_INIT_STATE) {//|| state == AGENT_INIT_STATE_INIT_INTERRUPTED
  519. signals_disable();
  520. selfopt_interval=200;
  521. nodes_ended_cnt = 0;
  522. app_state = RUNNING;
  523. max_cores_count = get_max_cores_count(my_app);
  524. //app_terminated = 0;
  525. //pending_state = NO_PENDING_STATE;
  526. if (my_cores_count > 1){
  527. time_to_work = (int) roundf(my_app.workld / my_Speedup);
  528. time_per_node = time_to_work / (my_cores_count-1);
  529. time_left = time_to_work % (my_cores_count-1);
  530. if (time_to_work == 0) time_left++;
  531. }
  532. printf("i am init agent %d. speedup = %0.2f time_to_work = %d time_per_node = %d, workld=%0.2f\n",node_id,my_Speedup,time_to_work,time_per_node,my_app.workld);
  533. strcpy(app_log_file_name,"/shared/herc/scenaria/");
  534. strcat(app_log_file_name,scen_num);
  535. strcat(app_log_file_name,"/app_logs/");
  536. strcat(app_log_file_name, itoa(my_app.id));
  537. strcat(app_log_file_name, ".txt");
  538. //printf("area file path self opt = %s\n",areas_file_name);
  539. if ((app_log_file = fopen(app_log_file_name, "w")) == NULL){
  540. printf("Cannot open input file with file path = %s ",app_log_file_name);
  541. perror("open selfopt_areas_file_name");
  542. }
  543. fprintf(app_log_file, "Came into init_agent at [%d:%d:%d]\n",my_app_times[0].tm_hour,my_app_times[0].tm_min,my_app_times[0].tm_sec);
  544. fprintf(app_log_file, "New agent found at [%d:%d:%d]\n",my_app_times[1].tm_hour,my_app_times[1].tm_min,my_app_times[1].tm_sec);
  545. cur_time = time(NULL);
  546. cur_t = localtime(&cur_time);
  547. fprintf(app_log_file, "[%d:%d:%d]: I am agent %d . Init ok!! my_cores_count = %d app_id=%d\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,node_id,my_cores_count,my_app.id);
  548. fprintf(app_log_file, "my cores are:");
  549. for (tmp_cores_list=my_cores; tmp_cores_list!=NULL; tmp_cores_list=tmp_cores_list->next) fprintf(app_log_file, " %d", tmp_cores_list->core_id);
  550. fprintf(app_log_file, "\n");
  551. fprintf(app_log_file,"speedup = %0.2f time_to_work = %d time_per_node = %d, time_left = %d, workld=%0.2f\n",my_Speedup,time_to_work,time_per_node,time_left,my_app.workld);
  552. fflush(app_log_file);
  553. tmp_cores_list = my_cores->next;
  554. while (tmp_cores_list != NULL){
  555. one_core = tmp_cores_list->core_id;
  556. if (core_inter_head[one_core] == NULL){
  557. core_inter_head[one_core] = (inter_list *) malloc(sizeof(inter_list));
  558. core_inter_tail[one_core] = core_inter_head[one_core];
  559. } else {
  560. core_inter_tail[one_core]->next = (inter_list *) malloc(sizeof(inter_list));
  561. core_inter_tail[one_core] = core_inter_tail[one_core]->next;
  562. }
  563. core_inter_tail[one_core]->type = INIT_WORK_NODE;
  564. core_inter_tail[one_core]->data.work_time = time_per_node;
  565. if (time_left > 0) {
  566. core_inter_tail[one_core]->data.work_time++;
  567. time_left--;
  568. }
  569. core_inter_tail[one_core]->next = NULL;
  570. my_stats.app_turnaround += core_inter_tail[one_core]->data.work_time;
  571. if (core_inter_head[one_core]->next == NULL) {
  572. //kill(pid_num[one_core], SIG_APPOINT_WORK);
  573. scc_kill(one_core, SIG_APPOINT_WORK);
  574. my_stats.msg_count++;
  575. my_stats.distance += distance(node_id,one_core);
  576. } else printf("I am %d and i am doing smth else with my working node %d in init inter1 = %d inter2 = %d\n",
  577. node_id,one_core,core_inter_head[one_core]->type,core_inter_head[one_core]->next->type);
  578. tmp_cores_list = tmp_cores_list->next;
  579. } //else printf("i have only one fucking core\n");
  580. if (my_cores_count == max_cores_count) {
  581. fprintf(app_log_file, "I have maximum cores count. I don't initiate selfopt process ini init_agent.\n");
  582. fflush(app_log_file);
  583. selfopt_time_rem = -1;
  584. if (pending_state == IDLE_INIT_MAN || pending_state == INIT_MANAGER || pending_state == INIT_MANAGER_SEND_OFFERS
  585. || pending_state == INIT_MAN_CHK_OFFERS || pending_state == WORKING_NODE_IDLE_INIT) {
  586. state = pending_state;
  587. pending_state = IDLE_AGENT;
  588. } else state = IDLE_AGENT;
  589. } else if (time_per_node <= (selfopt_interval / 2) && my_cores_count > 1) {
  590. fprintf(app_log_file, "I have little working time left time_per_node=%d selfopt_interval=%d in init_agent.\n",time_per_node,selfopt_interval);
  591. fflush(app_log_file);
  592. if (pending_state == IDLE_INIT_MAN || pending_state == INIT_MANAGER || pending_state == INIT_MANAGER_SEND_OFFERS
  593. || pending_state == INIT_MAN_CHK_OFFERS || pending_state == WORKING_NODE_IDLE_INIT) {
  594. state = pending_state;
  595. pending_state = IDLE_AGENT;
  596. } else state = IDLE_AGENT;
  597. selfopt_time_rem = -1;
  598. } else {
  599. if (pending_state == IDLE_INIT_MAN || pending_state == INIT_MANAGER || pending_state == INIT_MANAGER_SEND_OFFERS
  600. || pending_state == INIT_MAN_CHK_OFFERS || pending_state == WORKING_NODE_IDLE_INIT) {
  601. state = pending_state;//IDLE_INIT_MAN;//IDLE_INIT_MAN_SELFOPT_PENDING;
  602. pending_state = AGENT_SELF_OPT;
  603. //printf("I am %d o fountas einai poustara pou zwgrafizei k ton fuckaroun oi gkomenes tou!\n",node_id);
  604. } else state = AGENT_SELF_OPT;
  605. }
  606. signals_enable();
  607. scc_signals_check();
  608. } else if (state == AGENT_SELF_OPT) {
  609. signals_disable();
  610. printf("Initialising self opt node_id = %d\n",node_id);
  611. cur_time = time(NULL);
  612. cur_t = localtime(&cur_time);
  613. fprintf(log_file, "[%d:%d:%d]: Initialising self opt!\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  614. fflush(log_file);
  615. fprintf(app_log_file, "[%d:%d:%d]: Initialising self opt!\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  616. fflush(app_log_file);
  617. pending_state = NO_PENDING_STATE;
  618. if (app_state != APP_TERMINATED) {//!app_terminated
  619. selfopt_DDS_idags = 0;
  620. selfopt_DDS_replies = 0;
  621. //selfopt_areas_sent = 0;
  622. //if (selfopt_man_offers != NULL) printf("selfopt offers list is not NULL\n");
  623. if (selfopt_targets_head != NULL) {
  624. //printf("selfopt targets list is not NULL\n");
  625. while (selfopt_targets_head != NULL){
  626. tmp_target_list = selfopt_targets_head;
  627. selfopt_targets_head = selfopt_targets_head->next;
  628. free(tmp_target_list);
  629. }
  630. }
  631. if (core_inter_head[my_idag] == NULL){
  632. core_inter_head[my_idag] = (inter_list *) malloc(sizeof(inter_list));
  633. core_inter_tail[my_idag] = core_inter_head[my_idag];
  634. } else {
  635. core_inter_tail[my_idag]->next = (inter_list *) malloc(sizeof(inter_list));
  636. core_inter_tail[my_idag] = core_inter_tail[my_idag]->next;
  637. }
  638. core_inter_tail[my_idag]->type = SELFOPT_IDAG_FIND_IDAGS_PENDING;
  639. core_inter_tail[my_idag]->data.reg.C = node_id;
  640. core_inter_tail[my_idag]->data.reg.r = selfopt_r;
  641. core_inter_tail[my_idag]->next = NULL;
  642. if (core_inter_head[my_idag]->next == NULL) {
  643. //kill(pid_num[my_idag],SIG_IDAG_FIND_IDAGS);
  644. scc_kill(my_idag,SIG_IDAG_FIND_IDAGS);
  645. my_stats.msg_count++;
  646. my_stats.distance += distance(node_id,my_idag);
  647. }
  648. if (selfopt_interval != 800) selfopt_interval = 2 * selfopt_interval;
  649. else selfopt_interval = -1;
  650. state = IDLE_AGENT_WAITING_OFF;
  651. } else state = AGENT_ENDING;
  652. signals_enable();
  653. scc_signals_check();
  654. } else if (state == AGENT_SELF_CHK_OFFERS) {
  655. signals_disable();
  656. printf("alarm went off for self opt node_id=%d selfopt_DDS_idags = %d selfopt_DDS_replies = %d! app_state=%d\n",node_id,selfopt_DDS_idags,selfopt_DDS_replies,app_state);
  657. cur_time = time(NULL);
  658. cur_t = localtime(&cur_time);
  659. fprintf(log_file, "[%d:%d:%d]: alarm went off for self opt selfopt_DDS_idags = %d selfopt_DDS_replies = %d app_state=%d pending_state = %d\n",
  660. cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,selfopt_DDS_idags,selfopt_DDS_replies,app_state,pending_state);
  661. fflush(log_file);
  662. fprintf(app_log_file, "[%d:%d:%d]: alarm went off for self opt selfopt_DDS_idags = %d selfopt_DDS_replies = %d app_state=%d pending_state = %d\n",
  663. cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,selfopt_DDS_idags,selfopt_DDS_replies,app_state,pending_state);
  664. fflush(app_log_file);
  665. old_cores_cnt = my_cores_count;
  666. if (selfopt_man_offers == NULL) {
  667. printf("I don't have self opt offers app_state=%d\n",app_state);
  668. fprintf(log_file,"I don't have self opt offers app_state=%d\n",app_state);
  669. fflush(log_file);
  670. fprintf(app_log_file,"I don't have self opt offers app_state=%d\n",app_state);
  671. fflush(app_log_file);
  672. //state = IDLE_AGENT;
  673. } else {
  674. tmp_offer_list = selfopt_man_offers;
  675. while (tmp_offer_list != NULL){
  676. //printf("Offer by %d for %d cores\n",tmp_offer_list->sender,tmp_offer_list->off.num_of_cores);
  677. fprintf(log_file,"Offer by %d for %d cores\n",tmp_offer_list->sender,tmp_offer_list->off.num_of_cores);
  678. fflush(log_file);
  679. tmp_offer_list = tmp_offer_list->next;
  680. }
  681. if (app_state != APP_TERMINATED) {
  682. *selfopt_man_offers->answer = 1;
  683. if (core_inter_head[my_idag] == NULL){
  684. core_inter_head[my_idag] = (inter_list *) malloc(sizeof(inter_list));
  685. core_inter_tail[my_idag] = core_inter_head[my_idag];
  686. } else {
  687. core_inter_tail[my_idag]->next = (inter_list *) malloc(sizeof(inter_list));
  688. core_inter_tail[my_idag] = core_inter_tail[my_idag]->next;
  689. }
  690. core_inter_tail[my_idag]->type = IDAG_ADD_CORES_DDS;
  691. core_inter_tail[my_idag]->data.app_cores = (int *)malloc((selfopt_man_offers->off.num_of_cores+1)*sizeof(int));
  692. core_inter_tail[my_idag]->data.app_cores[0] = selfopt_man_offers->off.num_of_cores;
  693. core_inter_tail[my_idag]->next = NULL;
  694. //
  695. if (app_state != RESIZING) {
  696. old_Speedup = my_Speedup;
  697. chk_rem_num = my_cores_count-1;
  698. fprintf(app_log_file,"Initialising resize with check_rem = %d\n",chk_rem_num);
  699. fflush(app_log_file);
  700. chk_rem_count = 0;
  701. sum_rem_time = 0;
  702. app_state = RESIZING;
  703. my_cores_count += selfopt_man_offers->off.num_of_cores;
  704. my_app.num_of_cores = my_cores_count;
  705. my_Speedup = Speedup(my_app, my_cores_count);
  706. if (old_cores_cnt > 1)
  707. for(tmp_cores_list=my_cores->next; tmp_cores_list!=NULL; tmp_cores_list=tmp_cores_list->next) {//first is myself
  708. one_core = tmp_cores_list->core_id;
  709. if (core_inter_head[one_core] == NULL){
  710. core_inter_head[one_core] = (inter_list *) malloc(sizeof(inter_list));
  711. core_inter_tail[one_core] = core_inter_head[one_core];
  712. } else {
  713. core_inter_tail[one_core]->next = (inter_list *) malloc(sizeof(inter_list));
  714. core_inter_tail[one_core] = core_inter_tail[one_core]->next;
  715. }
  716. core_inter_tail[one_core]->type = APPOINT_WORK_NODE_PENDING;//CHK_REM_TIME;
  717. core_inter_tail[one_core]->next = NULL;
  718. if (core_inter_head[one_core]->next == NULL) {
  719. //kill(pid_num[one_core], SIG_CHECK_REM_TIME);
  720. scc_kill(my_idag, SIG_ADD_CORES_DDS);
  721. my_stats.msg_count++;
  722. my_stats.distance += distance(node_id,one_core);
  723. } else printf("I am %d and i am doing smth else with my working node %d in send SIG_CHECK_REM_TIME interaction = %d\n",node_id,one_core,core_inter_head[one_core]->type);
  724. }
  725. } else {
  726. fprintf(app_log_file,"Allready resizing with chk_rem_num = %d chk_rem_count=%d\n",chk_rem_num,chk_rem_count);
  727. fflush(app_log_file);
  728. my_cores_count += selfopt_man_offers->off.num_of_cores;
  729. my_app.num_of_cores = my_cores_count;
  730. my_Speedup = Speedup(my_app, my_cores_count);
  731. }
  732. for (i=0; i<selfopt_man_offers->off.num_of_cores; i++){
  733. my_cores_tail->next = (core_list *) malloc(sizeof(core_list));
  734. my_cores_tail = my_cores_tail->next;
  735. my_cores_tail->core_id = selfopt_man_offers->off.offered_cores[i];
  736. my_cores_tail->offered_to = -1;
  737. my_cores_tail->next = NULL;
  738. core_inter_tail[my_idag]->data.app_cores[i+1] = selfopt_man_offers->off.offered_cores[i];
  739. one_core = my_cores_tail->core_id;
  740. //printf("I am %d and i put in appoint work %d\n",node_id,one_core);
  741. if (core_inter_head[one_core] == NULL){
  742. core_inter_head[one_core] = (inter_list *) malloc(sizeof(inter_list));
  743. core_inter_tail[one_core] = core_inter_head[one_core];
  744. } else {
  745. printf("I am %d and I am doing sth with my new core %d interaction is %d\n",node_id,one_core,core_inter_head[one_core]->type);
  746. core_inter_tail[one_core]->next = (inter_list *) malloc(sizeof(inter_list));
  747. core_inter_tail[one_core] = core_inter_tail[one_core]->next;
  748. }
  749. core_inter_tail[one_core]->type = INIT_WORK_NODE_PENDING;
  750. core_inter_tail[one_core]->next = NULL;
  751. }
  752. } else *selfopt_man_offers->answer = 0;
  753. tmp_offer_list = selfopt_man_offers->next;
  754. while (tmp_offer_list != NULL){
  755. *tmp_offer_list->answer = 0;
  756. tmp_offer_list = tmp_offer_list->next;
  757. }
  758. if (app_state != APP_TERMINATED) {
  759. //my idag may have offered smth
  760. if (core_inter_head[my_idag]->next == NULL) {
  761. //kill(pid_num[my_idag], SIG_ADD_CORES_DDS);
  762. scc_kill(my_idag, SIG_ADD_CORES_DDS);
  763. my_stats.msg_count++;
  764. my_stats.distance += distance(node_id,my_idag);
  765. } else printf("I am %d i didn't call add inside selfopt with interaction %d\n",node_id,core_inter_head[my_idag]->type);
  766. if (old_cores_cnt == 1) {
  767. nodes_ended_cnt = 0;
  768. time_to_work = (int) roundf(my_app.workld / my_Speedup);
  769. time_per_node = time_to_work / (my_cores_count-1);
  770. time_left = time_to_work % (my_cores_count-1);
  771. if (time_to_work == 0) time_left++;
  772. fprintf(app_log_file,"in one core speedup = %0.2f time_to_work = %d time_per_node = %d, workld=%0.2f\n",my_Speedup,time_to_work,time_per_node,my_app.workld);
  773. fflush(app_log_file);
  774. tmp_cores_list = my_cores->next;
  775. while (tmp_cores_list != NULL){
  776. //printf("I am inside core listing node=%d\n",node_id);
  777. one_core = tmp_cores_list->core_id;
  778. for (tmp_inter_list = core_inter_head[one_core]; tmp_inter_list != NULL; tmp_inter_list = tmp_inter_list->next)
  779. if (tmp_inter_list->type == INIT_WORK_NODE_PENDING) break;
  780. if (tmp_inter_list != NULL) {
  781. tmp_inter_list->type = INIT_WORK_NODE;
  782. tmp_inter_list->data.work_time = time_per_node;
  783. if (time_left > 0) {
  784. tmp_inter_list->data.work_time++;
  785. time_left--;
  786. }
  787. my_stats.app_turnaround += tmp_inter_list->data.work_time;
  788. } else printf("i am %d kai sto common_node ta hpiame one core = %d\n",node_id,one_core);
  789. if (core_inter_head[one_core]->next == NULL) {
  790. //kill(pid_num[one_core], SIG_APPOINT_WORK);
  791. scc_kill(one_core, SIG_APPOINT_WORK);
  792. my_stats.msg_count++;
  793. my_stats.distance += distance(node_id,one_core);
  794. } else printf("I am doing smth else with my working node? interaction=%d interaction2=%d\n",core_inter_head[one_core]->type,core_inter_head[one_core]->next->type);
  795. tmp_cores_list = tmp_cores_list->next;
  796. }
  797. app_state = RUNNING;
  798. }
  799. }
  800. while (selfopt_man_offers != NULL) {
  801. if (core_inter_head[selfopt_man_offers->sender]->type == REP_AGENT_OFFER_PENDING){
  802. core_inter_head[selfopt_man_offers->sender]->type = REP_AGENT_OFFER_SENT;
  803. //kill(pid_num[selfopt_man_offers->sender], SIG_REP_OFFERS);
  804. scc_kill(selfopt_man_offers->sender, SIG_REP_OFFERS);
  805. my_stats.msg_count++;
  806. my_stats.distance += distance(node_id,selfopt_man_offers->sender);
  807. } else if (core_inter_head[selfopt_man_offers->sender]->type != REP_AGENT_OFFER_SENT) printf("We have zxcvzxc problem!\n");
  808. tmp_offer_list = selfopt_man_offers;
  809. selfopt_man_offers = selfopt_man_offers->next;
  810. free(tmp_offer_list);
  811. }
  812. printf("Self opt seems to be ok cores count = %d\n",my_cores_count);
  813. cur_time = time(NULL);
  814. cur_t = localtime(&cur_time);
  815. fprintf(log_file, "[%d:%d:%d]: Self opt ok. my_cores_count = %d\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,my_cores_count);
  816. fprintf(log_file, "my cores are:");
  817. fprintf(app_log_file, "[%d:%d:%d]: Self opt ok. my_cores_count = %d\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,my_cores_count);
  818. fprintf(app_log_file, "my cores are:");
  819. printf("I am %d and my cores are:",node_id);
  820. for (tmp_cores_list=my_cores; tmp_cores_list!=NULL; tmp_cores_list=tmp_cores_list->next) {
  821. fprintf(log_file, " %d", tmp_cores_list->core_id);
  822. fprintf(app_log_file, " %d", tmp_cores_list->core_id);
  823. printf(" %d",tmp_cores_list->core_id);
  824. }
  825. printf("\n");
  826. fprintf(log_file, "\n");
  827. fflush(log_file);
  828. fprintf(app_log_file, "\n");
  829. fflush(app_log_file);
  830. }
  831. if (app_state == APP_TERMINATED) state = AGENT_ENDING;//app_terminated
  832. else {
  833. if (pending_state == INIT_MANAGER) {
  834. state = INIT_MANAGER;
  835. pending_state = IDLE_AGENT;
  836. } else {
  837. printf("I am %d in chk_offers and pending_state=%d\n",node_id,pending_state);
  838. if (selfopt_interval > 0) { // && !app_terminated
  839. its.it_value.tv_nsec = selfopt_interval * MS;
  840. selfopt_time_rem = selfopt_interval;
  841. if (old_cores_cnt == 1 || old_cores_cnt == my_cores_count) {
  842. if (my_cores_count == max_cores_count) {
  843. fprintf(app_log_file, "I have maximum cores count. I don't initiate selfopt process in selfopt.\n");
  844. fflush(app_log_file);
  845. selfopt_time_rem = -1;
  846. } else if (time_per_node <= (selfopt_interval / 2) && my_cores_count > 1) {
  847. fprintf(app_log_file, "I have little working time left time_per_node=%d selfopt_interval=%d in selfopt.\n",time_per_node,selfopt_interval);
  848. fflush(app_log_file);
  849. selfopt_time_rem = -1;
  850. } else if (timer_settime(timerid, 0, &its, NULL) == -1) printf("timer_settime error8\n");
  851. }
  852. } else if (my_cores_count == 1) {
  853. printf("I am %d and i have to rewind my selfopt_areas_file for app with id %d\n",node_id,init_app.id);
  854. fprintf(log_file,"I have to rewind my selfopt_areas_file for app with id %d\n",my_app.id);
  855. fflush(log_file);
  856. fprintf(app_log_file,"I have to rewind my selfopt_areas_file for app with id %d\n",my_app.id);
  857. fflush(app_log_file);
  858. selfopt_interval = 200;
  859. its.it_value.tv_nsec = selfopt_interval * MS;
  860. selfopt_time_rem = selfopt_interval;
  861. if (timer_settime(timerid, 0, &its, NULL) == -1) perror("timer_settime error82\n");
  862. } else selfopt_time_rem = -1;
  863. state = IDLE_AGENT;
  864. }
  865. }
  866. signals_enable();
  867. scc_signals_check();
  868. } else if (state == WORKING_NODE || state == WORKING_NODE_IDLE_INIT){
  869. int j,dummy=0;
  870. signals_disable();
  871. while (time_worked <= upper_work_bound){
  872. scc_signals_check();
  873. signals_enable();
  874. //the following code should be one ms long
  875. for (i=0; i<1000; i++)
  876. for(j=0; j<1000; j++)
  877. dummy++;
  878. signals_disable();
  879. time_worked++;
  880. }
  881. printf("I am node %d with agent = %d and I finished my work upper_work_bound = %ld time_passed=%d\n",node_id,my_agent,upper_work_bound,time_worked);
  882. if (upper_work_bound > 0) {
  883. //kill(pid_num[my_agent],SIG_FINISH);
  884. scc_kill(my_agent,SIG_FINISH);
  885. my_stats.msg_count++;
  886. my_stats.distance += distance(node_id,my_agent);
  887. }
  888. if (state == WORKING_NODE) state = IDLE_CORE;
  889. else if (state == WORKING_NODE_IDLE_INIT) state = IDLE_INIT_MAN;
  890. else if (pending_state == WORKING_NODE) pending_state = NO_PENDING_STATE; //just finished on return
  891. signals_enable();
  892. scc_signals_check();
  893. } else if (state == AGENT_ZOMBIE) {
  894. //pause();
  895. dummy=0;
  896. for (i=0; i<1000; i++)
  897. for(j=0; j<1000; j++)
  898. dummy++;
  899. scc_signals_check();
  900. } else if (state == AGENT_ENDING) {
  901. signals_disable();
  902. cur_time = time(NULL);
  903. cur_t = localtime(&cur_time);
  904. fprintf(log_file, "[%d:%d:%d]: I entered agent_ending\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  905. fflush(log_file);
  906. fprintf(app_log_file, "[%d:%d:%d]: I entered agent_ending\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  907. fflush(app_log_file);
  908. for (tmp_cores_list = my_cores->next; tmp_cores_list != NULL; tmp_cores_list = tmp_cores_list->next)
  909. fprintf(app_log_file,"Core %d is offered to %d\n",tmp_cores_list->core_id,tmp_cores_list->offered_to);
  910. fflush(app_log_file);
  911. for (tmp_cores_list = my_cores->next; tmp_cores_list != NULL; tmp_cores_list = tmp_cores_list->next)
  912. if (tmp_cores_list->offered_to != -1) break;
  913. if (tmp_cores_list != NULL) {
  914. state = AGENT_ZOMBIE;
  915. for (tmp_cores_list = my_cores->next; tmp_cores_list != NULL; tmp_cores_list = tmp_cores_list->next) {
  916. one_core = tmp_cores_list->core_id;
  917. tmp_inter_prev = NULL;
  918. tmp_inter_list = core_inter_head[one_core];
  919. //for (tmp_inter_list = core_inter_head[one_core]; tmp_inter_list != NULL; tmp_inter_list=tmp_inter_list->next)
  920. while (tmp_inter_list != NULL)
  921. if (tmp_inter_list->type == INIT_WORK_NODE || tmp_inter_list->type == APPOINT_WORK_NODE || tmp_inter_list->type == INIT_WORK_NODE_PENDING
  922. || tmp_inter_list->type == APPOINT_WORK_NODE_PENDING || tmp_inter_list->type == REMOVED_NODE_REM_TIME) {
  923. //|| (tmp_inter_list->type == APPOINT_WORK_NODE_PENDING && tmp_inter_prev != NULL)) {
  924. fprintf(log_file, "Removing in zombie one node of %d with inter = %d\n",one_core,tmp_inter_list->type);
  925. fflush(log_file);
  926. if (tmp_inter_prev == NULL) {
  927. core_inter_head[one_core] = core_inter_head[one_core]->next;
  928. free(tmp_inter_list);
  929. tmp_inter_list = core_inter_head[one_core];
  930. } else {
  931. tmp_inter_prev->next = tmp_inter_list->next;
  932. if (tmp_inter_prev->next == NULL) core_inter_tail[one_core] = tmp_inter_prev;
  933. free(tmp_inter_list);
  934. tmp_inter_list = tmp_inter_prev->next;
  935. }
  936. } else {
  937. tmp_inter_prev = tmp_inter_list;
  938. tmp_inter_list = tmp_inter_list->next;
  939. }
  940. }
  941. } else {
  942. if (core_inter_head[my_idag] == NULL){
  943. core_inter_head[my_idag] = (inter_list *) malloc(sizeof(inter_list));
  944. core_inter_tail[my_idag] = core_inter_head[my_idag];
  945. } else {
  946. core_inter_tail[my_idag]->next = (inter_list *) malloc(sizeof(inter_list));
  947. core_inter_tail[my_idag] = core_inter_tail[my_idag]->next;
  948. }
  949. core_inter_tail[my_idag]->type = REMOVE_APP;
  950. core_inter_tail[my_idag]->data.app_cores = (int *)malloc((my_cores_count+1)*sizeof(int));
  951. core_inter_tail[my_idag]->data.app_cores[0] = my_cores_count;
  952. core_inter_tail[my_idag]->next = NULL;
  953. i=1;
  954. core_inter_tail[my_idag]->data.app_cores[i++] = my_cores->core_id;
  955. tmp_cores_list = my_cores;
  956. my_cores=my_cores->next;
  957. free(tmp_cores_list);
  958. //for(my_cores=my_cores->next; my_cores!=NULL; my_cores = my_cores->next) {
  959. //free(tmp_cores_list);
  960. while (my_cores != NULL) {
  961. tmp_cores_list = my_cores;
  962. one_core = tmp_cores_list->core_id;
  963. core_inter_tail[my_idag]->data.app_cores[i++] = one_core;
  964. tmp_inter_prev = NULL;
  965. tmp_inter_list = core_inter_head[one_core];
  966. //for (tmp_inter_list = core_inter_head[one_core]; tmp_inter_list != NULL; tmp_inter_list=tmp_inter_list->next)
  967. while (tmp_inter_list != NULL)
  968. if (tmp_inter_list->type == INIT_WORK_NODE || tmp_inter_list->type == APPOINT_WORK_NODE || tmp_inter_list->type == INIT_WORK_NODE_PENDING
  969. || tmp_inter_list->type == APPOINT_WORK_NODE_PENDING || tmp_inter_list->type == REMOVED_NODE_REM_TIME) {
  970. fprintf(log_file, "Removing one node of %d with inter = %d\n",one_core,tmp_inter_list->type);
  971. fflush(log_file);
  972. if (tmp_inter_prev == NULL) {
  973. core_inter_head[one_core] = core_inter_head[one_core]->next;
  974. free(tmp_inter_list);
  975. tmp_inter_list = core_inter_head[one_core];
  976. } else {
  977. tmp_inter_prev->next = tmp_inter_list->next;
  978. if (tmp_inter_prev->next == NULL) core_inter_tail[one_core] = tmp_inter_prev;
  979. free(tmp_inter_list);
  980. tmp_inter_list = tmp_inter_prev->next;
  981. }
  982. } else {
  983. tmp_inter_prev = tmp_inter_list;
  984. tmp_inter_list = tmp_inter_list->next;
  985. }
  986. if (core_inter_head[one_core] == NULL) {
  987. //kill(pid_num[one_core],SIG_FINISH);
  988. scc_kill(one_core,SIG_FINISH);
  989. my_stats.msg_count++;
  990. my_stats.distance += distance(node_id,one_core);
  991. } else printf("I am %d and I still still have smth to do with my work node %d before finish which is %d\n",node_id,one_core,core_inter_head[one_core]->type);
  992. my_cores=my_cores->next;
  993. free(tmp_cores_list);
  994. }
  995. if (core_inter_head[my_idag]->next == NULL) {
  996. //kill(pid_num[my_idag],SIG_FINISH);
  997. scc_kill(my_idag,SIG_FINISH);
  998. my_stats.msg_count++;
  999. my_stats.distance += distance(node_id,my_idag);
  1000. } else printf("I am %d and i am doing smth else with my idag app_remove interaction=%d\n",node_id,core_inter_head[my_idag]->type);
  1001. my_app.A = 0.0;
  1002. my_app.var = 0.0;
  1003. my_app.num_of_cores = -1;
  1004. selfopt_time_rem = -1;
  1005. //app_terminated = 0;
  1006. app_state = NO_APP;
  1007. printf("I am %d My app ended app_id = %d pending_state=%d\n",node_id,my_app.id,pending_state);
  1008. cur_time = time(NULL);
  1009. cur_t = localtime(&cur_time);
  1010. fprintf(app_log_file, "[%d:%d:%d]: App ended app_id = %d pending_state=%d",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,my_app.id,pending_state);
  1011. //fprintf(app_log_file,"App ended app_id = %d pending_state=%d\n",my_app.id,pending_state);
  1012. fclose(app_log_file);
  1013. if (pending_state == INIT_MANAGER) {
  1014. state = INIT_MANAGER;
  1015. pending_state = IDLE_CORE;
  1016. } else if (pending_state == NO_PENDING_STATE) state = IDLE_CORE;
  1017. else {
  1018. printf("I am %d in agent_ending and pending_state = %d\n",node_id,pending_state);
  1019. state = IDLE_CORE;
  1020. }
  1021. }
  1022. scc_kill(0, SIG_APP_TERMINATED);
  1023. signals_enable();
  1024. scc_signals_check();
  1025. } else {
  1026. printf("Unknown state node_id = %d state = %d\n",node_id,state);
  1027. state = IDLE_CORE;
  1028. }
  1029. cur_time = time(NULL);
  1030. cur_t = localtime(&cur_time);
  1031. fprintf(log_file, "[%d:%d:%d]: I ended well\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  1032. fclose(log_file);
  1033. exit(0);
  1034. }