+typo git-svn-id: https://www4.informatik.uni-erlangen.de/i4svn/danceos/trunk/devel/fail@1121 8c4709b5-6ec9-48aa-a5cd-a96041d1645a
122 lines
3.4 KiB
C++
122 lines
3.4 KiB
C++
#include "JobClient.hpp"
|
|
|
|
|
|
namespace fi {
|
|
|
|
JobClient::JobClient(std::string server, int port)
|
|
{
|
|
m_server_port = port;
|
|
m_server = server;
|
|
m_server_ent = gethostbyname(m_server.c_str());
|
|
if(m_server_ent == NULL) {
|
|
perror("[Client@gethostbyname()]");
|
|
exit(1);
|
|
}
|
|
srand(time(NULL)); // needed for random backoff (see connectToServer)
|
|
}
|
|
|
|
bool JobClient::connectToServer()
|
|
{
|
|
// Connect to server
|
|
struct sockaddr_in serv_addr;
|
|
m_sockfd = socket(AF_INET, SOCK_STREAM, 0);
|
|
if(m_sockfd < 0) {
|
|
perror("[Client@socket()]");
|
|
exit(0);
|
|
}
|
|
|
|
/* Enable address reuse */
|
|
int on = 1;
|
|
setsockopt( m_sockfd, SOL_SOCKET, SO_REUSEADDR, &on, sizeof(on) );
|
|
|
|
memset(&serv_addr, 0, sizeof(serv_addr));
|
|
serv_addr.sin_family = AF_INET;
|
|
memcpy(&serv_addr.sin_addr.s_addr, m_server_ent->h_addr, m_server_ent->h_length);
|
|
serv_addr.sin_port = htons(m_server_port);
|
|
|
|
int retries = RETRY_COUNT;
|
|
while(true) {
|
|
if(connect(m_sockfd, (sockaddr *)&serv_addr, sizeof(serv_addr)) < 0) {
|
|
perror("[Client@connect()]");
|
|
if(retries > 0) {
|
|
// Wait RAND_BACKOFF_TSTART to RAND_BACKOFF_TEND seconds:
|
|
int delay = rand() % (RAND_BACKOFF_TEND-RAND_BACKOFF_TSTART) + RAND_BACKOFF_TSTART;
|
|
cout << "[Client] Retrying to connect to server in ~" << delay << "s..." << endl;
|
|
sleep(delay);
|
|
usleep(rand() % 1000000);
|
|
--retries;
|
|
continue;
|
|
}
|
|
cout << "[Client] Unable to reconnect (tried " << RETRY_COUNT << " times); "
|
|
<< "I'll give it up!" << endl;
|
|
return false; // finally: unable to connect, give it up :-(
|
|
}
|
|
break; // connected! :-)
|
|
}
|
|
cout << "[Client] Connection established!" << endl;
|
|
|
|
return true;
|
|
}
|
|
|
|
bool JobClient::getParam(ExperimentData& exp){
|
|
while(1) { // Here we try to acquire a parameter set
|
|
switch(tryToGetExperimentData(exp)){
|
|
// Jobserver will sent workload, params are set in \c exp
|
|
case FailControlMessage_Command_WORK_FOLLOWS: return true;
|
|
// Nothing to do right now, but maybe later
|
|
case FailControlMessage_Command_COME_AGAIN:
|
|
sleep(1);
|
|
continue;
|
|
default:
|
|
return false;
|
|
}
|
|
}
|
|
}
|
|
FailControlMessage_Command JobClient::tryToGetExperimentData(ExperimentData& exp)
|
|
{
|
|
// Connection failed, minion can die
|
|
if( !connectToServer() ) return FailControlMessage_Command_DIE;
|
|
|
|
// Retrieve ExperimentData
|
|
FailControlMessage ctrlmsg;
|
|
ctrlmsg.set_command(FailControlMessage_Command_NEED_WORK);
|
|
ctrlmsg.set_build_id(42);
|
|
|
|
SocketComm::send_msg(m_sockfd, ctrlmsg);
|
|
ctrlmsg.Clear();
|
|
SocketComm::rcv_msg(m_sockfd, ctrlmsg);
|
|
|
|
switch(ctrlmsg.command()){
|
|
case FailControlMessage_Command_WORK_FOLLOWS:
|
|
SocketComm::rcv_msg(m_sockfd, exp.getMessage());
|
|
exp.setWorkloadID(ctrlmsg.workloadid()); // Store workload id of experiment data
|
|
break;
|
|
case FailControlMessage_Command_COME_AGAIN:
|
|
break;
|
|
|
|
default:
|
|
break;
|
|
}
|
|
close(m_sockfd);
|
|
return ctrlmsg.command();
|
|
}
|
|
|
|
bool JobClient::sendResult(ExperimentData& result)
|
|
{
|
|
if (!connectToServer() ) return false;
|
|
// Send back results
|
|
FailControlMessage ctrlmsg;
|
|
ctrlmsg.set_command(FailControlMessage_Command_RESULT_FOLLOWS);
|
|
ctrlmsg.set_build_id(42);
|
|
ctrlmsg.set_workloadid(result.getWorkloadID());
|
|
cout << "[Client] Sending back result [" << std::dec << result.getWorkloadID() << "]..." << endl;
|
|
SocketComm::send_msg(m_sockfd, ctrlmsg);
|
|
SocketComm::send_msg(m_sockfd, result.getMessage());
|
|
// close connection.
|
|
close(m_sockfd);
|
|
return true;
|
|
}
|
|
|
|
|
|
}
|