#include <sys/stat.h>
#include <fcntl.h>
#include <unistd.h>
+#include <signal.h>
#include "nlsop.h"
#include "dfbapi.h"
#include "event.h"
#include "list.h"
-#define NLSOP_GUI 'g'
-#define NLSOP_CLIENT 'c'
-#define NLSOP_NJOB 'N'
-#define NLSOP_CJOB 'C'
+#include "nlsop_general.h"
-typedef struct s_client {
- int channel;
- unsigned char status;
-#define IDLE (1<<0)
-#define WORK (1<<1)
-} t_client;
+typedef struct s_priv {
+ t_event event;
+ t_net net;
+ t_list client;
+ t_list gui;
+ t_list job;
+} t_priv;
-typedef struct s_job {
- int channel;
- unsigned char status;
-#define IN_QUEUE (1<<0)
-#define IN_WORK (1<<1)
- int progress;
- unsigned char *ac;
- int *cc;
- int x,y,z;
- info info;
- int step;
-} t_job;
+/* global */
+int alert;
+int gi;
+t_priv priv;
+
+/*
+ * server specific stuff
+ */
int usage(char *prog)
{
return 1;
}
-/*
- * server specific stuff
- */
-
-int add_node(t_net *net,t_event *event,t_list *c_list,t_list *g_list) {
+int add_node(void) {
int channel;
unsigned char data;
t_client client;
- t_job job;
int gui_chan;
- channel=network_manage_incoming(net);
+ channel=network_manage_incoming(&(priv.net));
if(channel==N_E_ACCEPT) {
printf("accept failed!\n");
return -1;
printf("maximum connections reached!\n");
return -1;
}
- printf("connection from %s port %d (ch: %d)\n",net->connection[channel].ip,
- net->connection[channel].port,
- channel);
+ printf("connection from %s port %d (ch: %d)\n",
+ priv.net.connection[channel].ip,priv.net.connection[channel].port,
+ channel);
/* are you client or gui? */
- network_receive_chan(net,chanel,&data,1);
+ network_receive_chan(&(priv.net),channel,&data,1);
if(data==NLSOP_GUI) {
gui_chan=channel;
- list_add_element(g_list,&gui_chan,sizeof(int));
+ list_add_element(&(priv.gui),&gui_chan,sizeof(int));
+ printf("node is a gui\n");
}
else if(data==NLSOP_CLIENT) {
client.status=IDLE;
client.channel=channel;
- list_add_element(c_list,&client,sizeof(t_client));
+ list_add_element(&(priv.client),&client,sizeof(t_client));
+ printf("node is a client\n");
}
else {
printf("not a client or gui - lets kick that ass out of here!\n");
- network_close(net,channel);
+ network_close(&(priv.net),channel);
return -1;
}
/* if we have a new node - care for it! */
- event_math(net->connection[channel].fd,event,READ,ADD);
+ event_math(priv.net.connection[channel].fd,&(priv.event),READ,ADD);
+
+ printf("\n");
return 1;
}
-int save_job(t_net *net,int channel,t_job *job,unsigned char dc) {
+int save_job(unsigned char dc,unsigned char *ack) {
char filename[128];
- inf fd;
+ int fd;
int ret;
+ d3_lattice d3l;
+ info info;
+ t_job *j;
- ret=network_receive_chan(net,channel,job->ac,job->size*sizeof(unsigned char));
- if(ret==N_ERROR) printf("FATAL: getting ac status failed\n");
- ret=network_receice_chan(net,channel,job->cc,job->size*sizeof(int));
- if(ret==N_ERROR) printf("FATAL: getting cc failed\n");
- ret=network_receive_chan(net,channel,&(job->step),sizeof(int));
- if(ret==N_ERROR) printf("FATAL: getting step number failed\n");
+ j=(t_job *)priv.job.current->data;
+
+ printf("receiving data from client (#cells=%d)\n",j->size);
+
+ network_receive_chan(&(priv.net),gi,(unsigned char *)&d3l,
+ sizeof(d3_lattice));
+ network_receive_chan(&(priv.net),gi,(unsigned char *)&info,sizeof(info));
+ network_receive_chan(&(priv.net),gi,j->ac,j->size*sizeof(unsigned char));
+ network_receive_chan(&(priv.net),gi,(unsigned char *)j->cc,
+ j->size*sizeof(int));
+ network_receive_chan(&(priv.net),gi,(unsigned char *)&(j->step),sizeof(int));
+ network_receive_chan(&(priv.net),gi,ack,sizeof(unsigned char));
if(dc!=DC_QUIT) {
- snprintf(filename,"nlsop_b%f_c%f_s%f_ds%d_dr%f_Z%c__%d_of_%d.save",
- job->info->b,job->info->c,job->info->s,
- job->info->diff_rate,job->info->dr_ac,
- job->info->z_diff?'y':'n',
- job->step,job->info->steps);
+ if(*ack==DATA_OK)
+ snprintf(filename,128,
+ "./data/nlsop_b%f_c%f_s%f_ds%d_dr%f_-_%d_of_%d.save",
+ j->info.b,j->info.c,j->info.s,
+ j->info.diff_rate,j->info.dr_ac,
+ j->step,j->info.steps);
+ else
+ snprintf(filename,128,
+ "./data/nlsop_b%f_c%f_s%f_ds%d_dr%f_-_%d_of_%d.corrupt",
+ j->info.b,j->info.c,j->info.s,
+ j->info.diff_rate,j->info.dr_ac,
+ j->step,j->info.steps);
if((fd=open(filename,O_WRONLY|O_CREAT))<0) {
printf("FATAL: unable to open file %s\n",filename);
return -1;
}
+ if(write(fd,&d3l,sizeof(d3_lattice))<sizeof(d3_lattice)) {
+ printf("FATAL: write of d3_lattice failed\n");
+ return -1;
+ }
+
+ if(write(fd,&info,sizeof(info))<sizeof(info)) {
+ printf("FATAL: write of info failed\n");
+ return -1;
+ }
+
+ ret=write(fd,j->ac,j->size*sizeof(unsigned char));
+ if(ret<j->size*sizeof(unsigned char)) {
+ printf("FATAL: write of a/c states failed\n");
+ return -1;
+ }
+
+ ret=write(fd,j->cc,j->size*sizeof(int));
+ if(ret<j->size*sizeof(int)) {
+ printf("FATAL: write of c.-conc. failed\n");
+ return -1;
+ }
+ close(fd);
}
return 1;
}
-int handle_node(net,event,c_list,g_list,job) {
+int add_job(void) {
+
+ t_job job;
+
+ job.channel=-1;
+ job.status=IN_QUEUE;
+ job.progress=0;
+
+ network_receive_chan(&(priv.net),gi,(unsigned char *)&(job.x),sizeof(int));
+ network_receive_chan(&(priv.net),gi,(unsigned char *)&(job.y),sizeof(int));
+ network_receive_chan(&(priv.net),gi,(unsigned char *)&(job.z),sizeof(int));
+ network_receive_chan(&(priv.net),gi,(unsigned char *)&(job.info),
+ sizeof(info));
+
+ job.size=job.x*job.y*job.z;
+
+ job.ac=(unsigned char *)malloc(job.size*sizeof(unsigned char));
+ if(job.ac==NULL) {
+ printf("unable to malloc a/c memory\n");
+ return -1;
+ }
+
+ job.cc=(int *)malloc(job.size*sizeof(int));
+ if(job.cc==NULL) {
+ printf("unable to malloc cc memory\n");
+ return -1;
+ }
+
+ job.step=0;
+
+ list_add_element(&(priv.job),&job,sizeof(t_job));
+
+ printf("job added: b=%f | c=%f | s=%f ...\n",
+ job.info.b,job.info.c,job.info.s);
+
+ return 1;
+}
+
+int send_status(void) {
+ unsigned char data;
+ int count;
int i;
+
+ data=GUI_INFO;
+
+ network_send_chan(&(priv.net),gi,&data,sizeof(unsigned char));
+ printf("sending job + client list ...\n");
+
+ count=list_count(&(priv.job));
+ network_send_chan(&(priv.net),gi,(unsigned char *)&count,sizeof(int));
+ list_reset(&(priv.job));
+ for(i=0;i<count;i++) {
+ network_send_chan(&(priv.net),gi,priv.job.current->data,sizeof(t_job));
+ list_next(&(priv.job));
+ }
+
+ count=list_count(&(priv.client));
+ network_send_chan(&(priv.net),gi,(unsigned char *)&count,sizeof(int));
+ list_reset(&(priv.client));
+ for(i=0;i<count;i++) {
+ network_send_chan(&(priv.net),gi,priv.client.current->data,
+ sizeof(t_client));
+ list_next(&(priv.client));
+ }
+
+ return 1;
+}
+
+int handle_node(void) {
+
unsigned char data;
t_client *c;
t_job *j;
+ unsigned char ack;
- for(i=0;i<MAX_CONNECTIONS;i++) {
- if(FD_ISSET(net->connection[i].fd,&(event->rfds))) {
+ for(gi=0;gi<MAX_CONNECTIONS;gi++) {
+ if(FD_ISSET(priv.net.connection[gi].fd,&(priv.event.rfds))) {
- if(network_receive_chan(net,i,&data,1)==N_ERROR) {
- printf("connection to client (ch %d) fucked up!\n",i);
- event_math(net->connection[i].fd,event,READ,REMOVE);
- network_close(net,i);
- list_del_current(c_list);
- return -1;
- }
+ alert=0;
+ alarm(1);
+ network_receive_chan(&(priv.net),gi,&data,1);
+ alarm(0);
+
+ if(alert==1) return -1;
- if(list_search_data(c_list,&i,sizeof(int))==L_SUCCESS) {
+ if(list_search_data(&(priv.client),&gi,sizeof(int))==L_SUCCESS) {
/* it's a client */
- list_search_data(job,&i,sizeof(int));
- j=(t_job *)job->current->data;
- c=(t_client *)c_list->current-data;
+ list_search_data(&(priv.job),&gi,sizeof(int));
+ j=(t_job *)priv.job.current->data;
+ c=(t_client *)priv.client.current->data;
if(data==DC_END) {
- save_job(net,i,j,DC_END);
+ save_job(DC_END,&ack);
/* reset client */
- c->channel=i;
c->status=IDLE;
+ /* free job memory */
+ free(j->ac);
+ free(j->cc);
/* delete job entry */
- list_del_current(job);
+ list_del_current(&(priv.job));
+ printf("job ended, saved and removed from list.\n");
}
if(data==DC_OK) {
- save_job(net,i,j,DC_OK);
+ save_job(DC_OK,&ack);
/* inc progress state */
j->progress+=1;
+ printf("job at next level, saved.\n");
}
if(data==DC_QUIT) {
- save_job(net,i,j,DC_QUIT);
+ ack=0;
+ save_job(DC_QUIT,&ack);
/* network disconnect */
- event_math(net->connection[i].fd,event,READ,REMOVE);
- network_close(net,i);
+ event_math(priv.net.connection[gi].fd,&(priv.event),READ,REMOVE);
+ network_close(&(priv.net),gi);
/* del from client list */
- list_del_current(c_list);
- /* change job state */
- j->status=IN_QUEUE;
+ list_del_current(&(priv.client));
+ /* change job state (or reset it if corrupted) */
+ if(ack==DATA_OK) {
+ j->status=IN_QUEUE;
+ printf("client terminating, job queued, client removed.\n");
+ }
+ else {
+ j->channel=-1;
+ j->status=IN_QUEUE;
+ j->progress=0;
+ j->step=0;
+ printf("client terminating, corr. job cleared , client removed.\n");
+ }
}
}
- else if(list_search_data(g_list,&i,sizeof(int))==L_SUCCESS) {
+ else if(list_search_data(&(priv.gui),&gi,sizeof(int))==L_SUCCESS) {
/* its a gui */
-
+ if(data==GUI_ADDJOB) add_job();
+
+ else if(data==GUI_INFO) send_status();
+
+ else if(data==GUI_QUIT) {
+ printf("disconnecting gui on channel %d\n",gi);
+ event_math(priv.net.connection[gi].fd,&(priv.event),READ,REMOVE);
+ network_close(&(priv.net),gi);
+ list_del_current(&(priv.gui));
+ }
+
+ else {
+ printf("unknown gui command\n");
+ return -1;
+ }
}
else {
printf("this chan is not in client or gui list! i disconnect now!\n");
- event_math(net->connection[i].fd,event,READ,REMOVE);
- network_close(net,i);
+ event_math(priv.net.connection[gi].fd,&(priv.event),READ,REMOVE);
+ network_close(&(priv.net),gi);
}
}
}
+
+ printf("\n");
return 1;
}
-int parse_incoming(t_event *event,void *allineed) {
+int distribute_jobs(t_event *event,void *allineed) {
- t_net *net;
- t_list *c_list,*g_list,*job;
+ int count_j,count_c,min;
+ t_job *j;
+ t_client *c;
+ unsigned char data;
+ d3_lattice d3l;
+
+ list_reset(&(priv.job));
+ list_reset(&(priv.client));
+
+ count_j=0;
+ count_c=0;
+
+ if((priv.client.current==NULL)||(priv.job.current==NULL)) return 2;
+
+ j=(t_job *)priv.job.current->data;
+ c=(t_client *)priv.client.current->data;
+ if(j->status==IN_QUEUE) count_j++;
+ if(c->status==IDLE) count_c++;
- net=(t_net *)allineed;
- c_list=(t_list *)(allineed+sizeof(t_net));
- g_list=(t_list *)(allineed+sizeof(t_net)+sizeof(t_list));
- job=(t_list *)(allineed+sizeof(t_net)+2*sizeof(t_list));
+ while(list_next(&(priv.job))!=L_NO_NEXT_ELEMENT) {
+ j=(t_job *)priv.job.current->data;
+ if(j->status==IN_QUEUE) count_j++;
+ }
+ while(list_next(&(priv.client))!=L_NO_NEXT_ELEMENT) {
+ c=(t_client *)priv.client.current->data;
+ if(c->status==IDLE) count_c++;
+ }
+
+ min=(count_c<count_j)?count_c:count_j;
+
+ if(min!=0) {
+ printf("d: distributing jobs ...\n");
+ printf("%d queued jobs, %d idle clients\n\n",count_j,count_c);
+ }
+
+ list_reset(&(priv.job));
+ list_reset(&(priv.client));
+
+ while(min) {
+ j=(t_job *)priv.job.current->data;
+ c=(t_client *)priv.client.current->data;
+ while(c->status!=IDLE) {
+ list_next(&(priv.client));
+ c=(t_client *)priv.client.current->data;
+ }
+ while(j->status!=IN_QUEUE) {
+ list_next(&(priv.job));
+ j=(t_job *)priv.job.current->data;
+ }
+
+ /* direct current job to current client */
+ if(j->step==0) data=NLSOP_NJOB;
+ else data=NLSOP_CJOB;
+
+ c->status=WORK;
+ j->channel=c->channel;
+ j->status=IN_WORK;
+
+ d3l.max_x=j->x;
+ d3l.max_y=j->y;
+ d3l.max_z=j->z;
+
+ network_send_chan(&(priv.net),c->channel,&data,sizeof(unsigned char));
+ network_send_chan(&(priv.net),c->channel,(unsigned char *)&d3l,
+ sizeof(d3_lattice));
+ network_send_chan(&(priv.net),c->channel,(unsigned char *)&(j->info),
+ sizeof(info));
+
+ if(data==NLSOP_CJOB) {
+ network_send_chan(&(priv.net),c->channel,j->ac,
+ j->size*sizeof(unsigned char));
+ network_receive_chan(&(priv.net),c->channel,&data,sizeof(unsigned char));
+ network_send_chan(&(priv.net),c->channel,(unsigned char *)&(j->cc),
+ j->size*sizeof(int));
+ network_receive_chan(&(priv.net),c->channel,&data,sizeof(unsigned char));
+ network_send_chan(&(priv.net),c->channel,(unsigned char *)&(j->step),
+ sizeof(int));
+ network_receive_chan(&(priv.net),c->channel,&data,sizeof(unsigned char));
+ }
+
+ --min;
+ list_next(&(priv.client));
+ list_next(&(priv.job));
+ }
+
+ return 1;
+}
+
+int parse_incoming(t_event *event,void *allineed) {
/* decide what to do */
- if(FD_ISSET(net->l.fd,&(event->rfds))) {
+ if(FD_ISSET(priv.net.l_fd,&(priv.event.rfds))) {
/* new node */
printf("new node ...\n");
- add_node(net,event,c_list,g_list);
+ add_node();
}
else {
/* client/gui interaction */
printf("node interaction ...\n");
- handle_node(net,event,c_list,g_list,job);
+ handle_node();
}
return 1;
}
+void destroy_it(int signum) {
+
+ t_job *j;
+
+ printf("connection to client (ch %d) fucked up!\n",gi);
+ event_math(priv.net.connection[gi].fd,&(priv.event),READ,REMOVE);
+ network_close(&(priv.net),gi);
+ if(list_search_data(&(priv.client),&gi,sizeof(int))==L_SUCCESS) {
+ list_del_current(&(priv.client));
+ printf("removed client from list\n");
+ }
+ if(list_search_data(&(priv.job),&gi,sizeof(int))==L_SUCCESS) {
+ printf("associated job found. resetting & queueing job.\n");
+ j=(t_job *)priv.job.current->data;
+ j->channel=-1;
+ j->status=IN_QUEUE;
+ j->progress=0;
+ j->step=0;
+ }
+ if(list_search_data(&(priv.gui),&gi,sizeof(int))==L_SUCCESS) {
+ list_del_current(&(priv.gui));
+ printf("removed gui from list\n");
+ }
+
+ alert=1;
+ alarm(0);
+
+}
+
/*
* main program
*/
{
int port;
- t_net net;
- t_event event;
- t_list c_list;
- t_list g_list;
- t_list job;
- void *allyouneed;
-
- /* tzzz ... */
- allyouneed=malloc(sizeof(t_net)+3*sizeof(t_list));
- memcpy(allyouneed,&net,sizeof(t_net));
- memcpy(allyouneed+sizeof(t_net),&c_list,sizeof(list));
- memcpy(allyouneed+sizeof(t_net)+sizeof(t_list),&g_list,sizeof(list));
- memcpy(allyouneed+sizeof(t_net)+2*sizeof(t_list),&job,sizeof(list));
-
+
/* default values */
port=1025;
if(argc==2) port=atoi(argv[1]);
/* event init */
- event_init(&event,1);
- event_set_timeout(&event,0,0);
+ event_init(&(priv.event),1);
+ /* 10 sec event timeout - distributing jobs */
+ event_set_timeout(&(priv.event),10,0);
+
+ /* list init */
+ list_init(&(priv.client),1);
+ list_init(&(priv.gui),1);
+ list_init(&(priv.job),1);
/* connect to server */
- network_init(&net,1);
- network_set_listen_port(&net,port);
- if(network_listen(&net)!=N_SUCCESS) {
+ network_init(&(priv.net),1);
+ network_set_listen_port(&(priv.net),port);
+ if(network_listen(&(priv.net))!=N_SUCCESS) {
printf("unable to listen on port %d, aborting!\n",port);
return -1;
}
+ /* install sighandler */
+ signal(SIGALRM,destroy_it);
+
/* wait for events :) */
- event_math(net.l_fd,&event,READ,ADD);
- event_start(&event,allyouneed,parse_incoming,NULL);
+ event_math(priv.net.l_fd,&(priv.event),READ,ADD);
+ printf("\nNLSOP_SERVER started!\n\n");
+ event_start(&(priv.event),NULL,parse_incoming,distribute_jobs);
return 1;
}