common_node.c~ 48 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184
  1. #include "common_node.h"
  2. //extern int *pid_num; -- disabled: the kill(pid_num[...]) calls in this file are commented out and scc_kill() is used instead
  3. extern int num_idags, node_id ,my_idag;//, fd_log; -- node_id: this core's id (my_x/my_y are derived from it). my_idag: set to -1 in common_node_actions, which then spins until it changes (presumably assigned while scc_signals_check() runs -- confirm)
  4. extern FILE *log_file; // per-node log; assigned from create_log_file(node_id, scen_num) in common_node_actions
  5. extern core_states state; // current state of this core; common_node_actions dispatches on it until it becomes TERMINATED
  6. core_states pending_state=NO_PENDING_STATE; // state to resume once the current activity completes (copied back into `state`); NO_PENDING_STATE when there is none
  7. extern inter_list **core_inter_head,**core_inter_tail; // per-core interaction queues: singly linked lists indexed by core id, appended at the tail; a signal is sent only when the new entry is the only one queued
  8. extern app my_app; // application this node handles as agent; copied from init_app when this node picks itself as the new agent
  9. extern app init_app; // application being initialised by this node; its id names the init areas file that is opened
  10. extern app far_req_app;
  11. extern metrics my_stats; // counters zeroed at the start of common_node_actions; msg_count and distance are bumped after each scc_kill()
  12. extern int far_req_or_sender;
  13. extern int *idag_mask, *idag_id_arr;
  14. extern int *Cl_x_max_arr, *Cl_y_max_arr;
  15. extern int DDS_count, my_cores_count; // both reset to 0 at the start of common_node_actions; my_cores_count is taken from the accepted offer's num_of_cores
  16. extern DDS_list *DDS, *DDS_tail; // DDS is reset to NULL at the start of common_node_actions
  17. extern core_list *my_cores, *my_cores_tail; // linked list of the cores held for my_app; this node's own id is inserted first
  18. extern offer_list *init_man_offers, *selfopt_man_offers; // init_man_offers: offers collected as init manager; in INIT_MAN_CHK_OFFERS the head offer is answered 1, every other offer 0, and the list is freed
  19. extern offer_list *far_man_offers, *far_man_offers_tail;
  20. extern int far_list_count, far_man_agent_count;
  21. extern int my_agent, time_worked; // my_agent: -1 when this node has no agent; time_worked is subtracted from upper_work_bound to report remaining work time
  22. extern int debug_global;
  23. extern time_t cur_time; // scratch for time(NULL) when timestamping log lines
  24. extern struct tm *cur_t; // scratch for localtime(&cur_time) when timestamping log lines
  25. extern struct sigevent sev; // notification settings handed to timer_create(): SIGEV_SIGNAL with SIG_TIMER
  26. extern struct itimerspec its, chk_timer; // its: value passed to timer_settime(); chk_timer: receives timer_gettime() results
  27. extern timer_t timerid; // timer created with timer_create(CLOCK_REALTIME, ...) in common_node_actions
  28. extern long int selfopt_time_rem;//-1 means it is not set. NOTE(review): common_node_actions stores both tv_nsec readings and plain selfopt_interval values here, so the units look mixed -- confirm
  29. extern long int upper_work_bound; // reset to 0 when this node switches from working for an agent to being an agent itself
  30. extern int time_for_farman;
  31. extern char scen_num[4]; // scenario id, used as a directory name under /shared/herc/scenaria/; shadowed by the parameter of common_node_actions
  32. extern int chk_rem_count, chk_rem_num, sum_rem_time;
  33. extern float old_Speedup, my_Speedup; // my_Speedup is computed as Speedup(my_app, my_app.num_of_cores) when this node becomes agent
  34. extern int nodes_ended_cnt;//, app_terminated; -- reset to 0 in the AGENT_INIT_STATE branch
  35. int my_x, my_y, init_areas_num; // my_x = node_id % X_max, my_y = node_id / X_max; init_areas_num is set to 1 every time init offers are (re)sent
  36. int init_DDS_replies, selfopt_DDS_replies, init_DDS_idags, selfopt_DDS_idags, selfopt_interval=200, init_idags_areas_replies, max_cores_count; // init_* counters are zeroed in INIT_MANAGER_SEND_OFFERS; selfopt_interval is multiplied by MS to fill tv_nsec (presumably milliseconds -- confirm); max_cores_count comes from get_max_cores_count(my_app)
  37. target_list *init_targets_head=NULL, *init_targets_tail; // list emptied (nodes freed) at the start of INIT_MANAGER_SEND_OFFERS
  38. target_list *selfopt_targets_head=NULL, *selfopt_targets_tail;
  39. FILE *app_log_file; // per-application log, opened in AGENT_INIT_STATE as /shared/herc/scenaria/<scen_num>/app_logs/<app id>.txt
  40. application_states app_state; // set to RUNNING in AGENT_INIT_STATE; compared against APP_TERMINATED elsewhere in the loop
  41. my_time_stamp init_app_times[2], my_app_times[2]; // [0] is logged as "Came into init_agent at", [1] as "New agent found at"; init_app_times is copied into my_app_times when this node becomes the agent
  42. extern int *sig_array, *data_array, NUES;
  43. extern RCCE_FLAG flag_signals_enabled,flag_data_written; // flag_signals_enabled is written with RCCE_FLAG_SET for this node just before the main loop
  44. void common_node_actions(char scen_num[4]){
  45. offer_list *tmp_offer_list;
  46. int one_core, i, old_cores_cnt;
  47. core_list *tmp_cores_list;
  48. target_list *tmp_target_list;
  49. inter_list *tmp_inter_list, *tmp_inter_prev;
  50. FILE *init_areas_file;//, *selfopt_areas_file;
  51. char init_areas_file_name[64], app_log_file_name[64];//selfopt_areas_file_name[32],
  52. int C,r,init_areas_cnt, init_areas_sent;//area_cnt,selfopt_areas=0,
  53. int time_per_node, time_left, time_to_work, init_core_found=0;
  54. int new_agent, min_dist=-1, tmp_int, j;
  55. //int new_x, new_y;//, selfopt_areas_sent;
  56. int selfopt_r;
  57. DDS_count=0;
  58. my_cores_count=0;
  59. my_stats.msg_count=0;
  60. my_stats.message_size=0;
  61. my_stats.distance=0;
  62. my_stats.app_turnaround=0;
  63. my_stats.comp_effort=0;
  64. my_stats.cores_utilized=0;
  65. my_stats.times_accessed=0;
  66. init_app_times[0].tm_sec = 0;
  67. init_app_times[0].tm_min = 0;
  68. init_app_times[0].tm_hour = 0;
  69. init_app_times[1].tm_sec = 0;
  70. init_app_times[1].tm_min = 0;
  71. init_app_times[1].tm_hour = 0;
  72. my_app_times[0].tm_sec = 0;
  73. my_app_times[0].tm_min = 0;
  74. my_app_times[0].tm_hour = 0;
  75. my_app_times[1].tm_sec = 0;
  76. my_app_times[1].tm_min = 0;
  77. my_app_times[1].tm_hour = 0;
  78. //printf("I Am %d\n",node_id);
  79. DDS=NULL;
  80. my_cores=NULL;
  81. selfopt_r = (int) (1.5 * (X_max / num_idags_x));
  82. install_signal_handlers();
  83. //sig_SEGV_enable();
  84. sev.sigev_notify = SIGEV_SIGNAL;
  85. sev.sigev_signo = SIG_TIMER;
  86. sev.sigev_value.sival_ptr = &timerid;
  87. if (timer_create(CLOCK_REALTIME, &sev, &timerid) == -1) printf("timer_create error\n");
  88. its.it_value.tv_sec = 0;
  89. its.it_interval.tv_sec = 0;//its.it_value.tv_sec;
  90. its.it_interval.tv_nsec = 0;
  91. log_file = create_log_file(node_id,scen_num);
  92. cur_time = time(NULL);
  93. cur_t = localtime(&cur_time);
  94. fprintf(log_file, "[%d:%d:%d]: Initialisation complete\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  95. fflush(log_file);
  96. RCCE_barrier(&RCCE_COMM_WORLD);
  97. my_x = node_id % X_max;
  98. my_y = node_id / X_max;
  99. state = IDLE_CORE;
  100. RCCE_flag_write(&flag_signals_enabled, RCCE_FLAG_SET, node_id);
  101. my_idag = -1;
  102. int dummy=0;
  103. while (my_idag==-1) {//pause();
  104. for (i=0; i<1000; i++)
  105. for(j=0; j<1000; j++)
  106. dummy++;
  107. scc_signals_check();
  108. }
  109. while (state != TERMINATED)
  110. if (state == IDLE_CORE) {
  111. pending_state = NO_PENDING_STATE;
  112. //pause();
  113. dummy=0;
  114. for (i=0; i<1000; i++)
  115. for(j=0; j<1000; j++)
  116. dummy++;
  117. scc_signals_check();
  118. } else if (state == IDLE_INIT_MAN) {// || state == IDLE_FAR_MAN || state == IDLE_INIT_MAN_SELFOPT_PENDING || state == IDLE_INIT_MAN_WORK_PENDING) {
  119. //pause();
  120. dummy=0;
  121. for (i=0; i<1000; i++)
  122. for(j=0; j<1000; j++)
  123. dummy++;
  124. scc_signals_check();
  125. } else if (state == IDLE_AGENT) {
  126. if (app_state != APP_TERMINATED) {
  127. //pause();//!app_terminated
  128. dummy=0;
  129. for (i=0; i<1000; i++)
  130. for(j=0; j<1000; j++)
  131. dummy++;
  132. scc_signals_check();
  133. } else {
  134. if (timer_gettime(timerid, &chk_timer) == -1) printf("timer_gettime error 2\n");
  135. else selfopt_time_rem = chk_timer.it_value.tv_nsec;
  136. if (selfopt_time_rem > 0) {
  137. its.it_value.tv_nsec = 0;
  138. if (timer_settime(timerid, 0, &its, NULL) == -1) printf("timer_settime error42\n");
  139. }
  140. state = AGENT_ENDING;
  141. }
  142. } else if (state == AGENT_REWIND_FILE) {
  143. printf("I am %d and i have to rewind my selfopt_areas_file for app with id %d\n",node_id,init_app.id);
  144. fprintf(log_file,"I have to rewind my selfopt_areas_file for app with id %d\n",init_app.id);
  145. selfopt_interval = 200;
  146. its.it_value.tv_nsec = selfopt_interval * MS;
  147. selfopt_time_rem = selfopt_interval;
  148. if (timer_settime(timerid, 0, &its, NULL) == -1) perror("timer_settime error823\n");
  149. state = IDLE_AGENT;
  150. } else if (state == IDLE_AGENT_WAITING_OFF) {
  151. //pause();
  152. if (app_state != APP_TERMINATED) {
  153. //pause();//!app_terminated
  154. dummy=0;
  155. for (i=0; i<1000; i++)
  156. for(j=0; j<1000; j++)
  157. dummy++;
  158. scc_signals_check();
  159. } else {
  160. signals_disable();
  161. if (timer_gettime(timerid, &chk_timer) == -1) printf("timer_gettime error 2\n");
  162. else selfopt_time_rem = chk_timer.it_value.tv_nsec;
  163. //den stamataw edw thn diadikasia tou selfopt gia na mhn meinoun oi mexri twra prosfores kai oxi mono anapanthtes
  164. if (selfopt_time_rem == 0) state = AGENT_SELF_CHK_OFFERS;
  165. signals_enable();
  166. }
  167. } else if (state == INIT_MANAGER) {
  168. signals_disable();
  169. printf("Initialising app node_id = %d\n",node_id);
  170. cur_time = time(NULL);
  171. cur_t = localtime(&cur_time);
  172. fprintf(log_file, "[%d:%d:%d]: Initialising app\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  173. fflush(log_file);
  174. strcpy(init_areas_file_name,"/shared/herc/scenaria/");
  175. strcat(init_areas_file_name,scen_num);
  176. strcat(init_areas_file_name,"/");
  177. strcat(init_areas_file_name, itoa(init_app.id));
  178. strcat(init_areas_file_name, ".txt");
  179. //printf("area file path = %s\n",areas_file_name);
  180. if ((init_areas_file = fopen(init_areas_file_name, "r")) == NULL){
  181. printf("Cannot open input file with file path = %s ",init_areas_file_name);
  182. perror("open init_areas_file_name");
  183. }
  184. init_areas_sent = 0;
  185. fscanf(init_areas_file,"%d",&init_areas_cnt);
  186. state = INIT_MANAGER_SEND_OFFERS;
  187. signals_enable();
  188. scc_signals_check();
  189. } else if (state == INIT_MANAGER_SEND_OFFERS) {// || state == INIT_MANAGER_SEND_OFFERS_SELFOPT_PENDING || state == INIT_MANAGER_SEND_OFFERS_WORK_PENDING) {
  190. signals_disable();
  191. init_idags_areas_replies=0;
  192. init_DDS_idags = 0;
  193. init_DDS_replies = 0;
  194. init_areas_num = 1;
  195. if (init_targets_head != NULL)
  196. while (init_targets_head != NULL){
  197. tmp_target_list = init_targets_head;
  198. init_targets_head = init_targets_head->next;
  199. free(tmp_target_list);
  200. }
  201. if (init_man_offers != NULL)
  202. while (init_man_offers != NULL) {
  203. tmp_offer_list = init_man_offers;
  204. init_man_offers = init_man_offers->next;
  205. free(tmp_offer_list);
  206. }
  207. fprintf(log_file, "near init area (%d,%d)\n",node_id,selfopt_r);
  208. fflush(log_file);
  209. if (core_inter_head[my_idag] == NULL){
  210. core_inter_head[my_idag] = (inter_list *) malloc(sizeof(inter_list));
  211. core_inter_tail[my_idag] = core_inter_head[my_idag];
  212. } else {
  213. core_inter_tail[my_idag]->next = (inter_list *) malloc(sizeof(inter_list));
  214. core_inter_tail[my_idag] = core_inter_tail[my_idag]->next;
  215. }
  216. core_inter_tail[my_idag]->type = IDAG_FIND_IDAGS_PENDING;
  217. core_inter_tail[my_idag]->data.reg.C = node_id;
  218. core_inter_tail[my_idag]->data.reg.r = selfopt_r;
  219. core_inter_tail[my_idag]->next = NULL;
  220. if (core_inter_head[my_idag]->next == NULL) {
  221. //kill(pid_num[my_idag],SIG_IDAG_FIND_IDAGS);
  222. scc_kill(my_idag,SIG_IDAG_FIND_IDAGS);
  223. my_stats.msg_count++;
  224. my_stats.distance += distance(node_id,my_idag);
  225. }
  226. for (i=0; i<init_areas_cnt && i<INIT_FAR_AREAS_NUM; i++) {
  227. fscanf(init_areas_file,"%d",&C);
  228. fscanf(init_areas_file,"%d",&r);
  229. fprintf(log_file, "init area (%d,%d)\n",C,r);
  230. fflush(log_file);
  231. printf("I am %d and i am sending a far offer in region (%d,%d)\n",node_id,C,r);
  232. one_core = C;
  233. if (core_inter_head[one_core] == NULL){
  234. core_inter_head[one_core] = (inter_list *) malloc(sizeof(inter_list));
  235. core_inter_tail[one_core] = core_inter_head[one_core];
  236. } else {
  237. core_inter_tail[one_core]->next = (inter_list *) malloc(sizeof(inter_list));
  238. core_inter_tail[one_core] = core_inter_tail[one_core]->next;
  239. }
  240. core_inter_tail[one_core]->type = FAR_INIT_REQ;
  241. core_inter_tail[one_core]->data.reg.C = C;
  242. core_inter_tail[one_core]->data.reg.r = r;
  243. core_inter_tail[one_core]->next = NULL;
  244. if (core_inter_head[one_core]->next == NULL) {
  245. //kill(pid_num[one_core],SIG_INIT_FAR_REQ);
  246. scc_kill(one_core,SIG_INIT_FAR_REQ);
  247. my_stats.msg_count++;
  248. my_stats.distance += distance(node_id,one_core);
  249. }
  250. //init_areas_num++;
  251. }
  252. init_areas_sent += i;
  253. //fclose(areas);
  254. if (selfopt_time_rem != -1){
  255. if (timer_gettime(timerid, &chk_timer) == -1) printf("timer_gettime error\n");
  256. else selfopt_time_rem = chk_timer.it_value.tv_nsec;
  257. if (selfopt_time_rem > 0) {
  258. its.it_value.tv_nsec = 0;//750000000;// * MS;
  259. if (timer_settime(timerid, 0, &its, NULL) == -1) printf("timer_settime error4123\n");
  260. }
  261. }
  262. state = IDLE_INIT_MAN;
  263. signals_enable();
  264. scc_signals_check();
  265. } else if (state == INIT_MAN_CHK_OFFERS) {// || state == INIT_MAN_CHK_OFFERS_SELFOPT_PENDING || state == INIT_MAN_CHK_OFFERS_WORK_PENDING){
  266. signals_disable();
  267. printf("init check alarm went off node_id=%d init_DDS_idags = %d init_DDS_replies = %d state=%d!\n",node_id,init_DDS_idags,init_DDS_replies,state);
  268. cur_time = time(NULL);
  269. cur_t = localtime(&cur_time);
  270. fprintf(log_file, "[%d:%d:%d]: init check alarm went off init_DDS_idags = %d init_DDS_replies = %d state=%d\n",
  271. cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,init_DDS_idags,init_DDS_replies,state);
  272. fflush(log_file);
  273. init_core_found = 0;
  274. if (init_man_offers == NULL) {
  275. printf("I don't have offers\n");
  276. fprintf(log_file, "I don't have init man offers\n");
  277. fflush(log_file);
  278. printf("I am %d and didn't manage to find my core in this round of search for app with id %d\n",node_id,init_app.id);
  279. //state = IDLE_CORE;
  280. if (init_areas_sent == init_areas_cnt){
  281. printf("I am %d and i have to rewind my init_areas_file for app with id %d\n",node_id,init_app.id);
  282. rewind(init_areas_file);
  283. init_areas_sent = 0;
  284. fscanf(init_areas_file,"%d",&init_areas_cnt);
  285. }
  286. state = INIT_MANAGER_SEND_OFFERS;
  287. } else {
  288. tmp_offer_list = init_man_offers;
  289. while (tmp_offer_list != NULL){
  290. fprintf(log_file,"Offer by %d for %d cores with spd_loss %0.4f :",tmp_offer_list->sender,tmp_offer_list->off.num_of_cores,tmp_offer_list->off.spd_loss);
  291. for (i=0; i<tmp_offer_list->off.num_of_cores; i++)
  292. fprintf(log_file," %d,",tmp_offer_list->off.offered_cores[i]);
  293. fprintf(log_file,"\n");
  294. //printf("Offer by %d for %d cores\n",tmp_offer_list->sender,tmp_offer_list->off.num_of_cores);
  295. tmp_offer_list = tmp_offer_list->next;
  296. }
  297. fflush(log_file);
  298. *init_man_offers->answer = 1;
  299. //decide which will be the agent. Will be the one tha minimizes distance between cores
  300. min_dist = -1;
  301. for (i=0; i<init_man_offers->off.num_of_cores; i++){
  302. tmp_int = 0;
  303. for (j=0; j<init_man_offers->off.num_of_cores; j++){
  304. if (i == j) continue;
  305. tmp_int += distance(init_man_offers->off.offered_cores[i],init_man_offers->off.offered_cores[j]);
  306. }
  307. if (min_dist == -1 || tmp_int < min_dist) {
  308. min_dist = tmp_int;
  309. new_agent = init_man_offers->off.offered_cores[i];
  310. }
  311. }
  312. cur_time = time(NULL);
  313. cur_t = localtime(&cur_time);
  314. init_app_times[1].tm_sec = cur_t->tm_sec;
  315. init_app_times[1].tm_min = cur_t->tm_min;
  316. init_app_times[1].tm_hour = cur_t->tm_hour;
  317. printf("New agent is %d\n",new_agent);
  318. cur_time = time(NULL);
  319. cur_t = localtime(&cur_time);
  320. fprintf(log_file, "[%d:%d:%d]: New agent is %d\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,new_agent);
  321. fflush(log_file);
  322. if (new_agent != node_id) {
  323. if (core_inter_head[new_agent] == NULL){
  324. core_inter_head[new_agent] = (inter_list *) malloc(sizeof(inter_list));
  325. core_inter_tail[new_agent] = core_inter_head[new_agent];
  326. } else {
  327. printf("Starting this app is not high priority. Should we change that?\n");
  328. core_inter_tail[new_agent]->next = (inter_list *) malloc(sizeof(inter_list));
  329. core_inter_tail[new_agent] = core_inter_tail[new_agent]->next;
  330. }
  331. core_inter_tail[new_agent]->type = INIT_AGENT;
  332. core_inter_tail[new_agent]->data.app_cores = (int *)malloc((init_man_offers->off.num_of_cores+1)*sizeof(int));
  333. core_inter_tail[new_agent]->data.app_cores[0] = init_man_offers->off.num_of_cores;
  334. for(i=1; i<=init_man_offers->off.num_of_cores; i++)
  335. core_inter_tail[new_agent]->data.app_cores[i] = init_man_offers->off.offered_cores[i-1];
  336. core_inter_tail[new_agent]->next = NULL;
  337. init_app.num_of_cores = init_man_offers->off.num_of_cores;
  338. if (core_inter_head[new_agent]->next == NULL) {
  339. //kill(pid_num[new_agent], SIG_INIT_AGENT);
  340. scc_kill(new_agent, SIG_INIT_AGENT);
  341. my_stats.msg_count++;
  342. my_stats.distance += distance(node_id,new_agent);
  343. } else {
  344. fprintf(log_file,"I am init manager and i am doing smth else with init agent interaction=%d\n",core_inter_head[new_agent]->type);
  345. fflush(log_file);
  346. }
  347. } else {
  348. my_app = init_app;
  349. my_cores_count = init_man_offers->off.num_of_cores;
  350. my_app.num_of_cores = my_cores_count;//+1;
  351. if (my_cores == NULL) {
  352. my_cores = (core_list *) malloc(sizeof(core_list));
  353. my_cores_tail = my_cores;
  354. } else {
  355. printf("My cores still not fucking null!!\n");
  356. my_cores_tail->next = (core_list *) malloc(sizeof(core_list));
  357. my_cores_tail = my_cores_tail->next;
  358. }
  359. my_cores_tail->core_id = node_id;
  360. my_cores_tail->offered_to = -1;
  361. my_cores_tail->next = NULL;
  362. if (core_inter_head[my_idag] == NULL){
  363. core_inter_head[my_idag] = (inter_list *) malloc(sizeof(inter_list));
  364. core_inter_tail[my_idag] = core_inter_head[my_idag];
  365. } else {
  366. core_inter_tail[my_idag]->next = (inter_list *) malloc(sizeof(inter_list));
  367. core_inter_tail[my_idag] = core_inter_tail[my_idag]->next;
  368. }
  369. core_inter_tail[my_idag]->type = IDAG_ADD_CORES_DDS;
  370. core_inter_tail[my_idag]->data.app_cores = (int *)malloc((my_cores_count+1)*sizeof(int));
  371. core_inter_tail[my_idag]->data.app_cores[0] = my_cores_count;
  372. core_inter_tail[my_idag]->next = NULL;
  373. //I want myself to be first in my_cores list
  374. for(i=0; i<init_man_offers->off.num_of_cores; i++) {
  375. one_core = init_man_offers->off.offered_cores[i];
  376. core_inter_tail[my_idag]->data.app_cores[i+1] = one_core;
  377. if (one_core != node_id){
  378. my_cores_tail->next = (core_list *) malloc(sizeof(core_list));
  379. my_cores_tail = my_cores_tail->next;
  380. my_cores_tail->core_id = one_core;
  381. my_cores_tail->offered_to = -1;
  382. my_cores_tail->next = NULL;
  383. }
  384. }
  385. my_app_times[0].tm_sec = init_app_times[0].tm_sec;
  386. my_app_times[0].tm_min = init_app_times[0].tm_min;
  387. my_app_times[0].tm_hour = init_app_times[0].tm_hour;
  388. my_app_times[1].tm_sec = init_app_times[1].tm_sec;
  389. my_app_times[1].tm_min = init_app_times[1].tm_min;
  390. my_app_times[1].tm_hour = init_app_times[1].tm_hour;
  391. init_app_times[0].tm_sec = 0;
  392. init_app_times[0].tm_min = 0;
  393. init_app_times[0].tm_hour = 0;
  394. init_app_times[1].tm_sec = 0;
  395. init_app_times[1].tm_min = 0;
  396. init_app_times[1].tm_hour = 0;
  397. /*kill(pid_num[0], SIG_INIT_APP);
  398. my_stats.msg_count++;
  399. my_stats.distance += distance(node_id,0);*/
  400. printf("I am new agent with id %d and app with A=%.2f, var=%.2f and %d my_cores_count = %d cores: \n"
  401. ,node_id,my_app.A,my_app.var,my_app.num_of_cores,my_cores_count);
  402. my_Speedup = Speedup(my_app, my_app.num_of_cores);
  403. if (core_inter_head[my_idag]->next == NULL) {
  404. //kill(pid_num[my_idag], SIG_ADD_CORES_DDS);
  405. scc_kill(my_idag, SIG_ADD_CORES_DDS);
  406. my_stats.msg_count++;
  407. my_stats.distance += distance(node_id,my_idag);
  408. } else printf("I am %d and i didn't call add!! with interaction %d\n",node_id,core_inter_head[my_idag]->type);
  409. if (my_agent != -1) {
  410. printf("I am %d and i do this agent switch in common node with pending_state=%d\n",node_id,pending_state);
  411. fprintf(log_file,"I do this agent switch in common node with pending_state=%d\n",pending_state);
  412. if (pending_state == WORKING_NODE) {
  413. if (core_inter_head[my_agent] == NULL){
  414. core_inter_head[my_agent] = (inter_list *) malloc(sizeof(inter_list));
  415. core_inter_tail[my_agent] = core_inter_head[my_agent];
  416. } else {
  417. core_inter_tail[my_agent]->next = (inter_list *) malloc(sizeof(inter_list));
  418. core_inter_tail[my_agent] = core_inter_tail[my_agent]->next;
  419. }
  420. core_inter_tail[my_agent]->type = REP_CHK_REM_TIME;
  421. core_inter_tail[my_agent]->data.work_time = upper_work_bound - time_worked;
  422. core_inter_tail[my_agent]->next = NULL;
  423. }
  424. upper_work_bound = 0;
  425. my_agent = -1;
  426. }
  427. state = AGENT_INIT_STATE;
  428. cur_time = time(NULL);
  429. cur_t = localtime(&cur_time);
  430. fprintf(log_file, "[%d:%d:%d]: Init ok!! my_cores_count = %d app_id=%d\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,my_cores_count,my_app.id);
  431. fprintf(log_file, "my cores are:");
  432. for (tmp_cores_list=my_cores; tmp_cores_list!=NULL; tmp_cores_list=tmp_cores_list->next) fprintf(log_file, " %d", tmp_cores_list->core_id);
  433. fprintf(log_file, "\n");
  434. fflush(log_file);
  435. }
  436. tmp_offer_list = init_man_offers->next;
  437. while (tmp_offer_list != NULL){
  438. fflush(log_file);
  439. *tmp_offer_list->answer = 0;
  440. tmp_offer_list = tmp_offer_list->next;
  441. }
  442. while (init_man_offers != NULL){
  443. if (core_inter_head[init_man_offers->sender] != NULL) {
  444. if (core_inter_head[init_man_offers->sender]->type == REP_AGENT_OFFER_PENDING){
  445. core_inter_head[init_man_offers->sender]->type = REP_AGENT_OFFER_SENT;
  446. //kill(pid_num[init_man_offers->sender], SIG_REP_OFFERS);
  447. scc_kill(init_man_offers->sender, SIG_REP_OFFERS);
  448. my_stats.msg_count++;
  449. my_stats.distance += distance(node_id,init_man_offers->sender);
  450. } else if (core_inter_head[init_man_offers->sender]->type == REP_FAR_REQ_OFFER_PENDING){
  451. core_inter_head[init_man_offers->sender]->type = REP_FAR_REQ_OFFER_SENT;
  452. //kill(pid_num[init_man_offers->sender], SIG_REP_OFFERS);
  453. scc_kill(init_man_offers->sender, SIG_REP_OFFERS);
  454. my_stats.msg_count++;
  455. my_stats.distance += distance(node_id,init_man_offers->sender);
  456. } else if (core_inter_head[init_man_offers->sender]->type != REP_FAR_REQ_OFFER_SENT && core_inter_head[init_man_offers->sender]->type != REP_AGENT_OFFER_SENT)
  457. printf("We have aasdfa problem!\n");
  458. } else {
  459. printf("gamietai b = %d",init_man_offers->sender);
  460. fprintf(log_file,"gamietai b = %d",init_man_offers->sender);
  461. fflush(log_file);
  462. }
  463. tmp_offer_list = init_man_offers;
  464. init_man_offers = init_man_offers->next;
  465. free(tmp_offer_list);
  466. }
  467. fclose(init_areas_file);
  468. fprintf(log_file,"selfopt_time_rem = %ld app_state = %d state = %d pending_state = %d\n",selfopt_time_rem,app_state,state,pending_state);
  469. fflush(log_file);
  470. if (selfopt_time_rem != -1 && app_state != APP_TERMINATED){ //a selfopt is pending !app_terminated
  471. selfopt_time_rem -= 500000000;
  472. if (selfopt_time_rem > 0){
  473. its.it_value.tv_nsec = selfopt_time_rem;
  474. if (timer_settime(timerid, 0, &its, NULL) == -1) printf("timer_settime error5\n");
  475. state = IDLE_AGENT;
  476. } else {
  477. selfopt_time_rem = -1;
  478. state = AGENT_SELF_OPT;
  479. }
  480. } else if (state != AGENT_INIT_STATE) {
  481. if (pending_state == IDLE_AGENT) {
  482. printf("I am %d and i entered this realm of whores\n",node_id);
  483. fprintf(log_file,"I finished my init selfopt_interval=%d, selfopt_time_rem=%ld my_cores_count=%d, old_cores_cnt=%d\n"
  484. ,selfopt_interval,selfopt_time_rem,my_cores_count,old_cores_cnt);
  485. fflush(log_file);
  486. fprintf(app_log_file,"I finished my init selfopt_interval=%d, selfopt_time_rem=%ld my_cores_count=%d, old_cores_cnt=%d\n"
  487. ,selfopt_interval,selfopt_time_rem,my_cores_count,old_cores_cnt);
  488. fflush(app_log_file);
  489. if (selfopt_interval > 0) { // && !app_terminated
  490. its.it_value.tv_nsec = selfopt_interval * MS;
  491. selfopt_time_rem = selfopt_interval;
  492. if (old_cores_cnt == 1 || old_cores_cnt == my_cores_count) {
  493. if (my_cores_count == max_cores_count) {
  494. fprintf(app_log_file, "I have maximum cores count. I don't initiate selfopt process in here anyway.\n");
  495. fflush(app_log_file);
  496. selfopt_time_rem = -1;
  497. } else if (time_per_node <= (selfopt_interval / 2) && my_cores_count > 1) {
  498. fprintf(app_log_file, "I have little working time left time_per_node=%d selfopt_interval=%d in here anyway.\n",time_per_node,selfopt_interval);
  499. fflush(app_log_file);
  500. selfopt_time_rem = -1;
  501. } else if (timer_settime(timerid, 0, &its, NULL) == -1) printf("timer_settime error8\n");
  502. }
  503. } else if (my_cores_count == 1) {
  504. printf("I am %d and i have to rewind my selfopt_areas_file after init for app with id %d\n",node_id,init_app.id);
  505. fprintf(log_file,"I have to rewind my selfopt_areas_file after init for app with id %d\n",init_app.id);
  506. selfopt_interval = 200;
  507. its.it_value.tv_nsec = selfopt_interval * MS;
  508. selfopt_time_rem = selfopt_interval;
  509. if (timer_settime(timerid, 0, &its, NULL) == -1) perror("timer_settime error823\n");
  510. } else selfopt_time_rem = -1;
  511. state = IDLE_AGENT;
  512. pending_state = NO_PENDING_STATE;
  513. } else if (pending_state == AGENT_SELF_OPT || pending_state == WORKING_NODE || pending_state == AGENT_REWIND_FILE) {
  514. state = pending_state;//IDLE_AGENT;
  515. pending_state = NO_PENDING_STATE;
  516. } else state = IDLE_CORE;
  517. } else if (app_state != APP_TERMINATED && new_agent != node_id) state = IDLE_AGENT;//!app_terminated
  518. }
  519. signals_enable();
  520. scc_signals_check();
  521. } else if (state == AGENT_INIT_STATE) {//|| state == AGENT_INIT_STATE_INIT_INTERRUPTED
  522. signals_disable();
  523. selfopt_interval=200;
  524. nodes_ended_cnt = 0;
  525. app_state = RUNNING;
  526. max_cores_count = get_max_cores_count(my_app);
  527. //app_terminated = 0;
  528. //pending_state = NO_PENDING_STATE;
  529. if (my_cores_count > 1){
  530. time_to_work = (int) roundf(my_app.workld / my_Speedup);
  531. time_per_node = time_to_work / (my_cores_count-1);
  532. time_left = time_to_work % (my_cores_count-1);
  533. if (time_to_work == 0) time_left++;
  534. }
  535. printf("i am init agent %d. speedup = %0.2f time_to_work = %d time_per_node = %d, workld=%0.2f\n",node_id,my_Speedup,time_to_work,time_per_node,my_app.workld);
  536. strcpy(app_log_file_name,"/shared/herc/scenaria/");
  537. strcat(app_log_file_name,scen_num);
  538. strcat(app_log_file_name,"/app_logs/");
  539. strcat(app_log_file_name, itoa(my_app.id));
  540. strcat(app_log_file_name, ".txt");
  541. //printf("area file path self opt = %s\n",areas_file_name);
  542. if ((app_log_file = fopen(app_log_file_name, "w")) == NULL){
  543. printf("Cannot open input file with file path = %s ",app_log_file_name);
  544. perror("open selfopt_areas_file_name");
  545. }
  546. fprintf(app_log_file, "Came into init_agent at [%d:%d:%d]\n",my_app_times[0].tm_hour,my_app_times[0].tm_min,my_app_times[0].tm_sec);
  547. fprintf(app_log_file, "New agent found at [%d:%d:%d]\n",my_app_times[1].tm_hour,my_app_times[1].tm_min,my_app_times[1].tm_sec);
  548. cur_time = time(NULL);
  549. cur_t = localtime(&cur_time);
  550. fprintf(app_log_file, "[%d:%d:%d]: I am agent %d . Init ok!! my_cores_count = %d app_id=%d\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,node_id,my_cores_count,my_app.id);
  551. fprintf(app_log_file, "my cores are:");
  552. for (tmp_cores_list=my_cores; tmp_cores_list!=NULL; tmp_cores_list=tmp_cores_list->next) fprintf(app_log_file, " %d", tmp_cores_list->core_id);
  553. fprintf(app_log_file, "\n");
  554. fprintf(app_log_file,"speedup = %0.2f time_to_work = %d time_per_node = %d, time_left = %d, workld=%0.2f\n",my_Speedup,time_to_work,time_per_node,time_left,my_app.workld);
  555. fflush(app_log_file);
  556. tmp_cores_list = my_cores->next;
  557. while (tmp_cores_list != NULL){
  558. one_core = tmp_cores_list->core_id;
  559. if (core_inter_head[one_core] == NULL){
  560. core_inter_head[one_core] = (inter_list *) malloc(sizeof(inter_list));
  561. core_inter_tail[one_core] = core_inter_head[one_core];
  562. } else {
  563. core_inter_tail[one_core]->next = (inter_list *) malloc(sizeof(inter_list));
  564. core_inter_tail[one_core] = core_inter_tail[one_core]->next;
  565. }
  566. core_inter_tail[one_core]->type = INIT_WORK_NODE;
  567. core_inter_tail[one_core]->data.work_time = time_per_node;
  568. if (time_left > 0) {
  569. core_inter_tail[one_core]->data.work_time++;
  570. time_left--;
  571. }
  572. core_inter_tail[one_core]->next = NULL;
  573. my_stats.app_turnaround += core_inter_tail[one_core]->data.work_time;
  574. if (core_inter_head[one_core]->next == NULL) {
  575. //kill(pid_num[one_core], SIG_APPOINT_WORK);
  576. scc_kill(one_core, SIG_APPOINT_WORK);
  577. my_stats.msg_count++;
  578. my_stats.distance += distance(node_id,one_core);
  579. } else printf("I am %d and i am doing smth else with my working node %d in init inter1 = %d inter2 = %d\n",
  580. node_id,one_core,core_inter_head[one_core]->type,core_inter_head[one_core]->next->type);
  581. tmp_cores_list = tmp_cores_list->next;
  582. } //else printf("i have only one fucking core\n");
  583. if (my_cores_count == max_cores_count) {
  584. fprintf(app_log_file, "I have maximum cores count. I don't initiate selfopt process ini init_agent.\n");
  585. fflush(app_log_file);
  586. selfopt_time_rem = -1;
  587. if (pending_state == IDLE_INIT_MAN || pending_state == INIT_MANAGER || pending_state == INIT_MANAGER_SEND_OFFERS
  588. || pending_state == INIT_MAN_CHK_OFFERS || pending_state == WORKING_NODE_IDLE_INIT) {
  589. state = pending_state;
  590. pending_state = IDLE_AGENT;
  591. } else state = IDLE_AGENT;
  592. } else if (time_per_node <= (selfopt_interval / 2) && my_cores_count > 1) {
  593. fprintf(app_log_file, "I have little working time left time_per_node=%d selfopt_interval=%d in init_agent.\n",time_per_node,selfopt_interval);
  594. fflush(app_log_file);
  595. if (pending_state == IDLE_INIT_MAN || pending_state == INIT_MANAGER || pending_state == INIT_MANAGER_SEND_OFFERS
  596. || pending_state == INIT_MAN_CHK_OFFERS || pending_state == WORKING_NODE_IDLE_INIT) {
  597. state = pending_state;
  598. pending_state = IDLE_AGENT;
  599. } else state = IDLE_AGENT;
  600. selfopt_time_rem = -1;
  601. } else {
  602. if (pending_state == IDLE_INIT_MAN || pending_state == INIT_MANAGER || pending_state == INIT_MANAGER_SEND_OFFERS
  603. || pending_state == INIT_MAN_CHK_OFFERS || pending_state == WORKING_NODE_IDLE_INIT) {
  604. state = pending_state;//IDLE_INIT_MAN;//IDLE_INIT_MAN_SELFOPT_PENDING;
  605. pending_state = AGENT_SELF_OPT;
  606. //printf("I am %d o fountas einai poustara pou zwgrafizei k ton fuckaroun oi gkomenes tou!\n",node_id);
  607. } else state = AGENT_SELF_OPT;
  608. }
  609. signals_enable();
  610. scc_signals_check();
  611. } else if (state == AGENT_SELF_OPT) {
  612. signals_disable();
  613. printf("Initialising self opt node_id = %d\n",node_id);
  614. cur_time = time(NULL);
  615. cur_t = localtime(&cur_time);
  616. fprintf(log_file, "[%d:%d:%d]: Initialising self opt!\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  617. fflush(log_file);
  618. fprintf(app_log_file, "[%d:%d:%d]: Initialising self opt!\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  619. fflush(app_log_file);
  620. pending_state = NO_PENDING_STATE;
  621. if (app_state != APP_TERMINATED) {//!app_terminated
  622. selfopt_DDS_idags = 0;
  623. selfopt_DDS_replies = 0;
  624. //selfopt_areas_sent = 0;
  625. //if (selfopt_man_offers != NULL) printf("selfopt offers list is not NULL\n");
  626. if (selfopt_targets_head != NULL) {
  627. //printf("selfopt targets list is not NULL\n");
  628. while (selfopt_targets_head != NULL){
  629. tmp_target_list = selfopt_targets_head;
  630. selfopt_targets_head = selfopt_targets_head->next;
  631. free(tmp_target_list);
  632. }
  633. }
  634. if (core_inter_head[my_idag] == NULL){
  635. core_inter_head[my_idag] = (inter_list *) malloc(sizeof(inter_list));
  636. core_inter_tail[my_idag] = core_inter_head[my_idag];
  637. } else {
  638. core_inter_tail[my_idag]->next = (inter_list *) malloc(sizeof(inter_list));
  639. core_inter_tail[my_idag] = core_inter_tail[my_idag]->next;
  640. }
  641. core_inter_tail[my_idag]->type = SELFOPT_IDAG_FIND_IDAGS_PENDING;
  642. core_inter_tail[my_idag]->data.reg.C = node_id;
  643. core_inter_tail[my_idag]->data.reg.r = selfopt_r;
  644. core_inter_tail[my_idag]->next = NULL;
  645. if (core_inter_head[my_idag]->next == NULL) {
  646. //kill(pid_num[my_idag],SIG_IDAG_FIND_IDAGS);
  647. scc_kill(my_idag,SIG_IDAG_FIND_IDAGS);
  648. my_stats.msg_count++;
  649. my_stats.distance += distance(node_id,my_idag);
  650. }
  651. if (selfopt_interval != 800) selfopt_interval = 2 * selfopt_interval;
  652. else selfopt_interval = -1;
  653. state = IDLE_AGENT_WAITING_OFF;
  654. } else state = AGENT_ENDING;
  655. signals_enable();
  656. scc_signals_check();
  657. } else if (state == AGENT_SELF_CHK_OFFERS) {
  658. signals_disable();
  659. printf("alarm went off for self opt node_id=%d selfopt_DDS_idags = %d selfopt_DDS_replies = %d! app_state=%d\n",node_id,selfopt_DDS_idags,selfopt_DDS_replies,app_state);
  660. cur_time = time(NULL);
  661. cur_t = localtime(&cur_time);
  662. fprintf(log_file, "[%d:%d:%d]: alarm went off for self opt selfopt_DDS_idags = %d selfopt_DDS_replies = %d app_state=%d pending_state = %d\n",
  663. cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,selfopt_DDS_idags,selfopt_DDS_replies,app_state,pending_state);
  664. fflush(log_file);
  665. fprintf(app_log_file, "[%d:%d:%d]: alarm went off for self opt selfopt_DDS_idags = %d selfopt_DDS_replies = %d app_state=%d pending_state = %d\n",
  666. cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,selfopt_DDS_idags,selfopt_DDS_replies,app_state,pending_state);
  667. fflush(app_log_file);
  668. old_cores_cnt = my_cores_count;
  669. if (selfopt_man_offers == NULL) {
  670. printf("I don't have self opt offers app_state=%d\n",app_state);
  671. fprintf(log_file,"I don't have self opt offers app_state=%d\n",app_state);
  672. fflush(log_file);
  673. fprintf(app_log_file,"I don't have self opt offers app_state=%d\n",app_state);
  674. fflush(app_log_file);
  675. //state = IDLE_AGENT;
  676. } else {
  677. tmp_offer_list = selfopt_man_offers;
  678. while (tmp_offer_list != NULL){
  679. //printf("Offer by %d for %d cores\n",tmp_offer_list->sender,tmp_offer_list->off.num_of_cores);
  680. fprintf(log_file,"Offer by %d for %d cores\n",tmp_offer_list->sender,tmp_offer_list->off.num_of_cores);
  681. fflush(log_file);
  682. tmp_offer_list = tmp_offer_list->next;
  683. }
  684. if (app_state != APP_TERMINATED) {
  685. *selfopt_man_offers->answer = 1;
  686. if (core_inter_head[my_idag] == NULL){
  687. core_inter_head[my_idag] = (inter_list *) malloc(sizeof(inter_list));
  688. core_inter_tail[my_idag] = core_inter_head[my_idag];
  689. } else {
  690. core_inter_tail[my_idag]->next = (inter_list *) malloc(sizeof(inter_list));
  691. core_inter_tail[my_idag] = core_inter_tail[my_idag]->next;
  692. }
  693. core_inter_tail[my_idag]->type = IDAG_ADD_CORES_DDS;
  694. core_inter_tail[my_idag]->data.app_cores = (int *)malloc((selfopt_man_offers->off.num_of_cores+1)*sizeof(int));
  695. core_inter_tail[my_idag]->data.app_cores[0] = selfopt_man_offers->off.num_of_cores;
  696. core_inter_tail[my_idag]->next = NULL;
  697. //
  698. if (app_state != RESIZING) {
  699. old_Speedup = my_Speedup;
  700. chk_rem_num = my_cores_count-1;
  701. fprintf(app_log_file,"Initialising resize with check_rem = %d\n",chk_rem_num);
  702. fflush(app_log_file);
  703. chk_rem_count = 0;
  704. sum_rem_time = 0;
  705. app_state = RESIZING;
  706. my_cores_count += selfopt_man_offers->off.num_of_cores;
  707. my_app.num_of_cores = my_cores_count;
  708. my_Speedup = Speedup(my_app, my_cores_count);
  709. if (old_cores_cnt > 1)
  710. for(tmp_cores_list=my_cores->next; tmp_cores_list!=NULL; tmp_cores_list=tmp_cores_list->next) {//first is myself
  711. one_core = tmp_cores_list->core_id;
  712. if (core_inter_head[one_core] == NULL){
  713. core_inter_head[one_core] = (inter_list *) malloc(sizeof(inter_list));
  714. core_inter_tail[one_core] = core_inter_head[one_core];
  715. } else {
  716. core_inter_tail[one_core]->next = (inter_list *) malloc(sizeof(inter_list));
  717. core_inter_tail[one_core] = core_inter_tail[one_core]->next;
  718. }
  719. core_inter_tail[one_core]->type = APPOINT_WORK_NODE_PENDING;//CHK_REM_TIME;
  720. core_inter_tail[one_core]->next = NULL;
  721. if (core_inter_head[one_core]->next == NULL) {
  722. //kill(pid_num[one_core], SIG_CHECK_REM_TIME);
  723. scc_kill(my_idag, SIG_ADD_CORES_DDS);
  724. my_stats.msg_count++;
  725. my_stats.distance += distance(node_id,one_core);
  726. } else printf("I am %d and i am doing smth else with my working node %d in send SIG_CHECK_REM_TIME interaction = %d\n",node_id,one_core,core_inter_head[one_core]->type);
  727. }
  728. } else {
  729. fprintf(app_log_file,"Allready resizing with chk_rem_num = %d chk_rem_count=%d\n",chk_rem_num,chk_rem_count);
  730. fflush(app_log_file);
  731. my_cores_count += selfopt_man_offers->off.num_of_cores;
  732. my_app.num_of_cores = my_cores_count;
  733. my_Speedup = Speedup(my_app, my_cores_count);
  734. }
  735. for (i=0; i<selfopt_man_offers->off.num_of_cores; i++){
  736. my_cores_tail->next = (core_list *) malloc(sizeof(core_list));
  737. my_cores_tail = my_cores_tail->next;
  738. my_cores_tail->core_id = selfopt_man_offers->off.offered_cores[i];
  739. my_cores_tail->offered_to = -1;
  740. my_cores_tail->next = NULL;
  741. core_inter_tail[my_idag]->data.app_cores[i+1] = selfopt_man_offers->off.offered_cores[i];
  742. one_core = my_cores_tail->core_id;
  743. //printf("I am %d and i put in appoint work %d\n",node_id,one_core);
  744. if (core_inter_head[one_core] == NULL){
  745. core_inter_head[one_core] = (inter_list *) malloc(sizeof(inter_list));
  746. core_inter_tail[one_core] = core_inter_head[one_core];
  747. } else {
  748. printf("I am %d and I am doing sth with my new core %d interaction is %d\n",node_id,one_core,core_inter_head[one_core]->type);
  749. core_inter_tail[one_core]->next = (inter_list *) malloc(sizeof(inter_list));
  750. core_inter_tail[one_core] = core_inter_tail[one_core]->next;
  751. }
  752. core_inter_tail[one_core]->type = INIT_WORK_NODE_PENDING;
  753. core_inter_tail[one_core]->next = NULL;
  754. }
  755. } else *selfopt_man_offers->answer = 0;
  756. tmp_offer_list = selfopt_man_offers->next;
  757. while (tmp_offer_list != NULL){
  758. *tmp_offer_list->answer = 0;
  759. tmp_offer_list = tmp_offer_list->next;
  760. }
  761. if (app_state != APP_TERMINATED) {
  762. //my idag may have offered smth
  763. if (core_inter_head[my_idag]->next == NULL) {
  764. //kill(pid_num[my_idag], SIG_ADD_CORES_DDS);
  765. scc_kill(my_idag, SIG_ADD_CORES_DDS);
  766. my_stats.msg_count++;
  767. my_stats.distance += distance(node_id,my_idag);
  768. } else printf("I am %d i didn't call add inside selfopt with interaction %d\n",node_id,core_inter_head[my_idag]->type);
  769. if (old_cores_cnt == 1) {
  770. nodes_ended_cnt = 0;
  771. time_to_work = (int) roundf(my_app.workld / my_Speedup);
  772. time_per_node = time_to_work / (my_cores_count-1);
  773. time_left = time_to_work % (my_cores_count-1);
  774. if (time_to_work == 0) time_left++;
  775. fprintf(app_log_file,"in one core speedup = %0.2f time_to_work = %d time_per_node = %d, workld=%0.2f\n",my_Speedup,time_to_work,time_per_node,my_app.workld);
  776. fflush(app_log_file);
  777. tmp_cores_list = my_cores->next;
  778. while (tmp_cores_list != NULL){
  779. //printf("I am inside core listing node=%d\n",node_id);
  780. one_core = tmp_cores_list->core_id;
  781. for (tmp_inter_list = core_inter_head[one_core]; tmp_inter_list != NULL; tmp_inter_list = tmp_inter_list->next)
  782. if (tmp_inter_list->type == INIT_WORK_NODE_PENDING) break;
  783. if (tmp_inter_list != NULL) {
  784. tmp_inter_list->type = INIT_WORK_NODE;
  785. tmp_inter_list->data.work_time = time_per_node;
  786. if (time_left > 0) {
  787. tmp_inter_list->data.work_time++;
  788. time_left--;
  789. }
  790. my_stats.app_turnaround += tmp_inter_list->data.work_time;
  791. } else printf("i am %d kai sto common_node ta hpiame one core = %d\n",node_id,one_core);
  792. if (core_inter_head[one_core]->next == NULL) {
  793. //kill(pid_num[one_core], SIG_APPOINT_WORK);
  794. scc_kill(one_core, SIG_APPOINT_WORK);
  795. my_stats.msg_count++;
  796. my_stats.distance += distance(node_id,one_core);
  797. } else printf("I am doing smth else with my working node? interaction=%d interaction2=%d\n",core_inter_head[one_core]->type,core_inter_head[one_core]->next->type);
  798. tmp_cores_list = tmp_cores_list->next;
  799. }
  800. app_state = RUNNING;
  801. }
  802. }
  803. while (selfopt_man_offers != NULL) {
  804. if (core_inter_head[selfopt_man_offers->sender]->type == REP_AGENT_OFFER_PENDING){
  805. core_inter_head[selfopt_man_offers->sender]->type = REP_AGENT_OFFER_SENT;
  806. //kill(pid_num[selfopt_man_offers->sender], SIG_REP_OFFERS);
  807. scc_kill(selfopt_man_offers->sender, SIG_REP_OFFERS);
  808. my_stats.msg_count++;
  809. my_stats.distance += distance(node_id,selfopt_man_offers->sender);
  810. } else if (core_inter_head[selfopt_man_offers->sender]->type != REP_AGENT_OFFER_SENT) printf("We have zxcvzxc problem!\n");
  811. tmp_offer_list = selfopt_man_offers;
  812. selfopt_man_offers = selfopt_man_offers->next;
  813. free(tmp_offer_list);
  814. }
  815. printf("Self opt seems to be ok cores count = %d\n",my_cores_count);
  816. cur_time = time(NULL);
  817. cur_t = localtime(&cur_time);
  818. fprintf(log_file, "[%d:%d:%d]: Self opt ok. my_cores_count = %d\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,my_cores_count);
  819. fprintf(log_file, "my cores are:");
  820. fprintf(app_log_file, "[%d:%d:%d]: Self opt ok. my_cores_count = %d\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,my_cores_count);
  821. fprintf(app_log_file, "my cores are:");
  822. printf("I am %d and my cores are:",node_id);
  823. for (tmp_cores_list=my_cores; tmp_cores_list!=NULL; tmp_cores_list=tmp_cores_list->next) {
  824. fprintf(log_file, " %d", tmp_cores_list->core_id);
  825. fprintf(app_log_file, " %d", tmp_cores_list->core_id);
  826. printf(" %d",tmp_cores_list->core_id);
  827. }
  828. printf("\n");
  829. fprintf(log_file, "\n");
  830. fflush(log_file);
  831. fprintf(app_log_file, "\n");
  832. fflush(app_log_file);
  833. }
  834. if (app_state == APP_TERMINATED) state = AGENT_ENDING;//app_terminated
  835. else {
  836. if (pending_state == INIT_MANAGER) {
  837. state = INIT_MANAGER;
  838. pending_state = IDLE_AGENT;
  839. } else {
  840. printf("I am %d in chk_offers and pending_state=%d\n",node_id,pending_state);
  841. if (selfopt_interval > 0) { // && !app_terminated
  842. its.it_value.tv_nsec = selfopt_interval * MS;
  843. selfopt_time_rem = selfopt_interval;
  844. if (old_cores_cnt == 1 || old_cores_cnt == my_cores_count) {
  845. if (my_cores_count == max_cores_count) {
  846. fprintf(app_log_file, "I have maximum cores count. I don't initiate selfopt process in selfopt.\n");
  847. fflush(app_log_file);
  848. selfopt_time_rem = -1;
  849. } else if (time_per_node <= (selfopt_interval / 2) && my_cores_count > 1) {
  850. fprintf(app_log_file, "I have little working time left time_per_node=%d selfopt_interval=%d in selfopt.\n",time_per_node,selfopt_interval);
  851. fflush(app_log_file);
  852. selfopt_time_rem = -1;
  853. } else if (timer_settime(timerid, 0, &its, NULL) == -1) printf("timer_settime error8\n");
  854. }
  855. } else if (my_cores_count == 1) {
  856. printf("I am %d and i have to rewind my selfopt_areas_file for app with id %d\n",node_id,init_app.id);
  857. fprintf(log_file,"I have to rewind my selfopt_areas_file for app with id %d\n",my_app.id);
  858. fflush(log_file);
  859. fprintf(app_log_file,"I have to rewind my selfopt_areas_file for app with id %d\n",my_app.id);
  860. fflush(app_log_file);
  861. selfopt_interval = 200;
  862. its.it_value.tv_nsec = selfopt_interval * MS;
  863. selfopt_time_rem = selfopt_interval;
  864. if (timer_settime(timerid, 0, &its, NULL) == -1) perror("timer_settime error82\n");
  865. } else selfopt_time_rem = -1;
  866. state = IDLE_AGENT;
  867. }
  868. }
  869. signals_enable();
  870. scc_signals_check();
  871. } else if (state == WORKING_NODE || state == WORKING_NODE_IDLE_INIT){
  872. int j,dummy=0;
  873. signals_disable();
  874. while (time_worked <= upper_work_bound){
  875. scc_signals_check();
  876. signals_enable();
  877. //the following code should be one ms long
  878. for (i=0; i<1000; i++)
  879. for(j=0; j<1000; j++)
  880. dummy++;
  881. signals_disable();
  882. time_worked++;
  883. }
  884. printf("I am node %d with agent = %d and I finished my work upper_work_bound = %ld time_passed=%d\n",node_id,my_agent,upper_work_bound,time_worked);
  885. if (upper_work_bound > 0) {
  886. //kill(pid_num[my_agent],SIG_FINISH);
  887. scc_kill(my_agent,SIG_FINISH);
  888. my_stats.msg_count++;
  889. my_stats.distance += distance(node_id,my_agent);
  890. }
  891. if (state == WORKING_NODE) state = IDLE_CORE;
  892. else if (state == WORKING_NODE_IDLE_INIT) state = IDLE_INIT_MAN;
  893. else if (pending_state == WORKING_NODE) pending_state = NO_PENDING_STATE; //just finished on return
  894. signals_enable();
  895. scc_signals_check();
  896. } else if (state == AGENT_ZOMBIE) {
  897. //pause();
  898. dummy=0;
  899. for (i=0; i<1000; i++)
  900. for(j=0; j<1000; j++)
  901. dummy++;
  902. scc_signals_check();
  903. } else if (state == AGENT_ENDING) {
  904. signals_disable();
  905. cur_time = time(NULL);
  906. cur_t = localtime(&cur_time);
  907. fprintf(log_file, "[%d:%d:%d]: I entered agent_ending\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  908. fflush(log_file);
  909. fprintf(app_log_file, "[%d:%d:%d]: I entered agent_ending\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  910. fflush(app_log_file);
  911. for (tmp_cores_list = my_cores->next; tmp_cores_list != NULL; tmp_cores_list = tmp_cores_list->next)
  912. fprintf(app_log_file,"Core %d is offered to %d\n",tmp_cores_list->core_id,tmp_cores_list->offered_to);
  913. fflush(app_log_file);
  914. for (tmp_cores_list = my_cores->next; tmp_cores_list != NULL; tmp_cores_list = tmp_cores_list->next)
  915. if (tmp_cores_list->offered_to != -1) break;
  916. if (tmp_cores_list != NULL) {
  917. state = AGENT_ZOMBIE;
  918. for (tmp_cores_list = my_cores->next; tmp_cores_list != NULL; tmp_cores_list = tmp_cores_list->next) {
  919. one_core = tmp_cores_list->core_id;
  920. tmp_inter_prev = NULL;
  921. tmp_inter_list = core_inter_head[one_core];
  922. //for (tmp_inter_list = core_inter_head[one_core]; tmp_inter_list != NULL; tmp_inter_list=tmp_inter_list->next)
  923. while (tmp_inter_list != NULL)
  924. if (tmp_inter_list->type == INIT_WORK_NODE || tmp_inter_list->type == APPOINT_WORK_NODE || tmp_inter_list->type == INIT_WORK_NODE_PENDING
  925. || tmp_inter_list->type == APPOINT_WORK_NODE_PENDING || tmp_inter_list->type == REMOVED_NODE_REM_TIME) {
  926. //|| (tmp_inter_list->type == APPOINT_WORK_NODE_PENDING && tmp_inter_prev != NULL)) {
  927. fprintf(log_file, "Removing in zombie one node of %d with inter = %d\n",one_core,tmp_inter_list->type);
  928. fflush(log_file);
  929. if (tmp_inter_prev == NULL) {
  930. core_inter_head[one_core] = core_inter_head[one_core]->next;
  931. free(tmp_inter_list);
  932. tmp_inter_list = core_inter_head[one_core];
  933. } else {
  934. tmp_inter_prev->next = tmp_inter_list->next;
  935. if (tmp_inter_prev->next == NULL) core_inter_tail[one_core] = tmp_inter_prev;
  936. free(tmp_inter_list);
  937. tmp_inter_list = tmp_inter_prev->next;
  938. }
  939. } else {
  940. tmp_inter_prev = tmp_inter_list;
  941. tmp_inter_list = tmp_inter_list->next;
  942. }
  943. }
  944. } else {
  945. if (core_inter_head[my_idag] == NULL){
  946. core_inter_head[my_idag] = (inter_list *) malloc(sizeof(inter_list));
  947. core_inter_tail[my_idag] = core_inter_head[my_idag];
  948. } else {
  949. core_inter_tail[my_idag]->next = (inter_list *) malloc(sizeof(inter_list));
  950. core_inter_tail[my_idag] = core_inter_tail[my_idag]->next;
  951. }
  952. core_inter_tail[my_idag]->type = REMOVE_APP;
  953. core_inter_tail[my_idag]->data.app_cores = (int *)malloc((my_cores_count+1)*sizeof(int));
  954. core_inter_tail[my_idag]->data.app_cores[0] = my_cores_count;
  955. core_inter_tail[my_idag]->next = NULL;
  956. i=1;
  957. core_inter_tail[my_idag]->data.app_cores[i++] = my_cores->core_id;
  958. tmp_cores_list = my_cores;
  959. my_cores=my_cores->next;
  960. free(tmp_cores_list);
  961. //for(my_cores=my_cores->next; my_cores!=NULL; my_cores = my_cores->next) {
  962. //free(tmp_cores_list);
  963. while (my_cores != NULL) {
  964. tmp_cores_list = my_cores;
  965. one_core = tmp_cores_list->core_id;
  966. core_inter_tail[my_idag]->data.app_cores[i++] = one_core;
  967. tmp_inter_prev = NULL;
  968. tmp_inter_list = core_inter_head[one_core];
  969. //for (tmp_inter_list = core_inter_head[one_core]; tmp_inter_list != NULL; tmp_inter_list=tmp_inter_list->next)
  970. while (tmp_inter_list != NULL)
  971. if (tmp_inter_list->type == INIT_WORK_NODE || tmp_inter_list->type == APPOINT_WORK_NODE || tmp_inter_list->type == INIT_WORK_NODE_PENDING
  972. || tmp_inter_list->type == APPOINT_WORK_NODE_PENDING || tmp_inter_list->type == REMOVED_NODE_REM_TIME) {
  973. fprintf(log_file, "Removing one node of %d with inter = %d\n",one_core,tmp_inter_list->type);
  974. fflush(log_file);
  975. if (tmp_inter_prev == NULL) {
  976. core_inter_head[one_core] = core_inter_head[one_core]->next;
  977. free(tmp_inter_list);
  978. tmp_inter_list = core_inter_head[one_core];
  979. } else {
  980. tmp_inter_prev->next = tmp_inter_list->next;
  981. if (tmp_inter_prev->next == NULL) core_inter_tail[one_core] = tmp_inter_prev;
  982. free(tmp_inter_list);
  983. tmp_inter_list = tmp_inter_prev->next;
  984. }
  985. } else {
  986. tmp_inter_prev = tmp_inter_list;
  987. tmp_inter_list = tmp_inter_list->next;
  988. }
  989. if (core_inter_head[one_core] == NULL) {
  990. //kill(pid_num[one_core],SIG_FINISH);
  991. scc_kill(one_core,SIG_FINISH);
  992. my_stats.msg_count++;
  993. my_stats.distance += distance(node_id,one_core);
  994. } else printf("I am %d and I still still have smth to do with my work node %d before finish which is %d\n",node_id,one_core,core_inter_head[one_core]->type);
  995. my_cores=my_cores->next;
  996. free(tmp_cores_list);
  997. }
  998. if (core_inter_head[my_idag]->next == NULL) {
  999. //kill(pid_num[my_idag],SIG_FINISH);
  1000. scc_kill(my_idag,SIG_FINISH);
  1001. my_stats.msg_count++;
  1002. my_stats.distance += distance(node_id,my_idag);
  1003. } else printf("I am %d and i am doing smth else with my idag app_remove interaction=%d\n",node_id,core_inter_head[my_idag]->type);
  1004. my_app.A = 0.0;
  1005. my_app.var = 0.0;
  1006. my_app.num_of_cores = -1;
  1007. selfopt_time_rem = -1;
  1008. //app_terminated = 0;
  1009. app_state = NO_APP;
  1010. printf("I am %d My app ended app_id = %d pending_state=%d\n",node_id,my_app.id,pending_state);
  1011. cur_time = time(NULL);
  1012. cur_t = localtime(&cur_time);
  1013. fprintf(app_log_file, "[%d:%d:%d]: App ended app_id = %d pending_state=%d",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec,my_app.id,pending_state);
  1014. //fprintf(app_log_file,"App ended app_id = %d pending_state=%d\n",my_app.id,pending_state);
  1015. fclose(app_log_file);
  1016. if (pending_state == INIT_MANAGER) {
  1017. state = INIT_MANAGER;
  1018. pending_state = IDLE_CORE;
  1019. } else if (pending_state == NO_PENDING_STATE) state = IDLE_CORE;
  1020. else {
  1021. printf("I am %d in agent_ending and pending_state = %d\n",node_id,pending_state);
  1022. state = IDLE_CORE;
  1023. }
  1024. }
  1025. scc_kill(0, SIG_APP_TERMINATED);
  1026. signals_enable();
  1027. scc_signals_check();
  1028. } else {
  1029. printf("Unknown state node_id = %d state = %d\n",node_id,state);
  1030. state = IDLE_CORE;
  1031. }
  1032. cur_time = time(NULL);
  1033. cur_t = localtime(&cur_time);
  1034. fprintf(log_file, "[%d:%d:%d]: I ended well\n",cur_t->tm_hour,cur_t->tm_min,cur_t->tm_sec);
  1035. fclose(log_file);
  1036. exit(0);
  1037. }