source: src/Fragmentation/Automation/FragmentScheduler.cpp@ 5adb84

Action_Thermostats Add_AtomRandomPerturbation Add_FitFragmentPartialChargesAction Add_RotateAroundBondAction Add_SelectAtomByNameAction Added_ParseSaveFragmentResults AddingActions_SaveParseParticleParameters Adding_Graph_to_ChangeBondActions Adding_MD_integration_tests Adding_ParticleName_to_Atom Adding_StructOpt_integration_tests AtomFragments Automaking_mpqc_open AutomationFragmentation_failures Candidate_v1.5.4 Candidate_v1.6.0 Candidate_v1.6.1 Candidate_v1.7.0 ChangeBugEmailaddress ChangingTestPorts ChemicalSpaceEvaluator CombiningParticlePotentialParsing Combining_Subpackages Debian_Package_split Debian_package_split_molecuildergui_only Disabling_MemDebug Docu_Python_wait EmpiricalPotential_contain_HomologyGraph EmpiricalPotential_contain_HomologyGraph_documentation Enable_parallel_make_install Enhance_userguide Enhanced_StructuralOptimization Enhanced_StructuralOptimization_continued Example_ManyWaysToTranslateAtom Exclude_Hydrogens_annealWithBondGraph FitPartialCharges_GlobalError Fix_BoundInBox_CenterInBox_MoleculeActions Fix_ChargeSampling_PBC Fix_ChronosMutex Fix_FitPartialCharges Fix_FitPotential_needs_atomicnumbers Fix_ForceAnnealing Fix_IndependentFragmentGrids Fix_ParseParticles Fix_ParseParticles_split_forward_backward_Actions Fix_PopActions Fix_QtFragmentList_sorted_selection Fix_Restrictedkeyset_FragmentMolecule Fix_StatusMsg Fix_StepWorldTime_single_argument Fix_Verbose_Codepatterns Fix_fitting_potentials Fixes ForceAnnealing_goodresults ForceAnnealing_oldresults ForceAnnealing_tocheck ForceAnnealing_with_BondGraph ForceAnnealing_with_BondGraph_continued ForceAnnealing_with_BondGraph_continued_betteresults ForceAnnealing_with_BondGraph_contraction-expansion FragmentAction_writes_AtomFragments FragmentMolecule_checks_bonddegrees GeometryObjects Gui_Fixes Gui_displays_atomic_force_velocity ImplicitCharges IndependentFragmentGrids IndependentFragmentGrids_IndividualZeroInstances IndependentFragmentGrids_IntegrationTest 
IndependentFragmentGrids_Sole_NN_Calculation JobMarket_RobustOnKillsSegFaults JobMarket_StableWorkerPool JobMarket_unresolvable_hostname_fix MoreRobust_FragmentAutomation ODR_violation_mpqc_open PartialCharges_OrthogonalSummation PdbParser_setsAtomName PythonUI_with_named_parameters QtGui_reactivate_TimeChanged_changes Recreated_GuiChecks Rewrite_FitPartialCharges RotateToPrincipalAxisSystem_UndoRedo SaturateAtoms_findBestMatching SaturateAtoms_singleDegree StoppableMakroAction Subpackage_CodePatterns Subpackage_JobMarket Subpackage_LinearAlgebra Subpackage_levmar Subpackage_mpqc_open Subpackage_vmg Switchable_LogView ThirdParty_MPQC_rebuilt_buildsystem TrajectoryDependenant_MaxOrder TremoloParser_IncreasedPrecision TremoloParser_MultipleTimesteps TremoloParser_setsAtomName Ubuntu_1604_changes stable
Last change on this file since 5adb84 was 0196c6, checked in by Frederik Heber <heber@…>, 13 years ago

Added Shutdown as choice to ControllerChoices.

  • new helper app Shutdowner that shuts down Server.
  • TESTFIX: Changed regression test Fragmentation/Automation, where Shutdowner is now used instead of Jobadder with 0 jobs to power down the controller socket.
  • Property mode set to 100644
File size: 11.1 KB
RevLine 
[72eaf7f]1/*
[cd4a6e]2 * Project: MoleCuilder
3 * Description: creates and alters molecular systems
4 * Copyright (C) 2011 University of Bonn. All rights reserved.
5 * Please see the LICENSE file or "Copyright notice" in builder.cpp for details.
6 */
7
8/*
9 * \file FragmentScheduler.cpp
10 *
11 * This file strongly follows the Serialization example from the boost::asio
12 * library (see server.cpp)
[72eaf7f]13 *
[cd4a6e]14 * Created on: Oct 19, 2011
[72eaf7f]15 * Author: heber
16 */
17
[f93842]18// include config.h
19#ifdef HAVE_CONFIG_H
20#include <config.h>
21#endif
22
[c6bcd0]23// boost asio needs specific operator new
[72eaf7f]24#include <boost/asio.hpp>
[c6bcd0]25
26#include "CodePatterns/MemDebug.hpp"
27
[72eaf7f]28#include <boost/bind.hpp>
29#include <boost/lexical_cast.hpp>
30#include <iostream>
31#include <vector>
[af3aed]32#include "Connection.hpp" // Must come before boost/serialization headers.
[72eaf7f]33#include <boost/serialization/vector.hpp>
[af3aed]34#include "CodePatterns/Info.hpp"
[b0b64c]35#include "CodePatterns/Log.hpp"
[31ca5f]36#include "FragmentJob.hpp"
[ef2767]37#include "JobId.hpp"
[72eaf7f]38
[cd4a6e]39#include "FragmentScheduler.hpp"
[72eaf7f]40
/** Static placeholder job, constructed with the name "NoJob" and the id
 * JobId::NoJob. handle_AcceptWorker() sends it to a worker when the queue
 * holds no job.
 */
[c7deca]41FragmentJob FragmentScheduler::NoJob(std::string("NoJob"), JobId::NoJob);
42
[db03d9]43/** Constructor of class FragmentScheduler.
44 *
45 * We setup both acceptors to accept connections from workers and Controller.
46 *
47 * \param io_service io_service of the asynchronous communications
48 * \param workerport port to listen for worker connections
49 * \param controllerport port to listen for controller connections.
50 */
51FragmentScheduler::FragmentScheduler(boost::asio::io_service& io_service, unsigned short workerport, unsigned short controllerport) :
52 worker_acceptor_(io_service,
53 boost::asio::ip::tcp::endpoint(boost::asio::ip::tcp::v4(), workerport)
54 ),
55 controller_acceptor_(io_service,
56 boost::asio::ip::tcp::endpoint(boost::asio::ip::tcp::v4(), controllerport)
[ef2767]57 ),
[db03d9]58 result(JobId::NoJob),
[778abb]59 choice(NoOperation),
[db03d9]60 Exitflag(OkFlag)
[ed2c5b]61{
[b0b64c]62 Info info(__FUNCTION__);
[72eaf7f]63
[778abb]64 // only initiate socket if jobs are already present
65 if (JobsQueue.isJobPresent()) {
66 LOG(1, "Listening for workers on port " << workerport << ".");
67 initiateWorkerSocket();
68 }
[402bde]69
70 initiateControllerSocket();
[778abb]71 LOG(1, "Listening for controller on port " << controllerport << ".");
[ed2c5b]72}
[72eaf7f]73
[402bde]74/** Internal function to start worker connection.
75 *
76 */
77void FragmentScheduler::initiateWorkerSocket()
78{
79 // Start an accept operation for worker connections.
80 connection_ptr new_conn(new Connection(worker_acceptor_.get_io_service()));
81 worker_acceptor_.async_accept(new_conn->socket(),
82 boost::bind(&FragmentScheduler::handle_AcceptWorker, this,
83 boost::asio::placeholders::error, new_conn));
84}
85
86/** Internal function to start controller connection.
87 *
88 */
89void FragmentScheduler::initiateControllerSocket()
90{
91 // Start an accept operation for controller connection.
92 connection_ptr new_conn(new Connection(controller_acceptor_.get_io_service()));
93 controller_acceptor_.async_accept(new_conn->socket(),
94 boost::bind(&FragmentScheduler::handle_AcceptController, this,
95 boost::asio::placeholders::error, new_conn));
96}
97
98
[db03d9]99/** Handle a new worker connection.
100 *
101 * We check whether jobs are in the JobsQueue. If present, job is sent.
102 *
103 * \sa handle_SendJobtoWorker()
104 *
105 * \param e error code if something went wrong
106 * \param conn reference with the connection
107 */
108void FragmentScheduler::handle_AcceptWorker(const boost::system::error_code& e, connection_ptr conn)
[ed2c5b]109{
[cd4a6e]110 Info info(__FUNCTION__);
[ed2c5b]111 if (!e)
[72eaf7f]112 {
[b0b64c]113 // Successfully accepted a new connection.
114 // Check whether there are jobs in the queue
115 if (JobsQueue.isJobPresent()) {
116 // pop a job and send it to the client.
[ef2767]117 FragmentJob job(JobsQueue.popJob());
[b0b64c]118 // The connection::async_write() function will automatically
119 // serialize the data structure for us.
[ef2767]120 LOG(1, "INFO: Sending job #" << job.getId() << ".");
121 conn->async_write(job,
[db03d9]122 boost::bind(&FragmentScheduler::handle_SendJobtoWorker, this,
[b0b64c]123 boost::asio::placeholders::error, conn));
[0bdd51b]124
[b0b64c]125 } else {
[c7deca]126 // send the static NoJob
127 conn->async_write(NoJob,
[db03d9]128 boost::bind(&FragmentScheduler::handle_SendJobtoWorker, this,
[c7deca]129 boost::asio::placeholders::error, conn));
130
[ef2767]131 // then there must be no read necesary
132
[b0b64c]133 ELOG(2, "There is currently no job present in the queue.");
134 }
[cd4a6e]135 }
136 else
137 {
138 // An error occurred. Log it and return. Since we are not starting a new
139 // accept operation the io_service will run out of work to do and the
140 // server will exit.
[3c4a5e]141 Exitflag = WorkerErrorFlag;
[b0b64c]142 ELOG(0, e.message());
[cd4a6e]143 }
[778abb]144
145 // Start an accept operation for a new Connection only when there
146 // are still jobs present
147 if (JobsQueue.isJobPresent())
148 initiateWorkerSocket();
[ed2c5b]149}
[72eaf7f]150
[db03d9]151/** Callback function when job has been sent.
152 *
153 * After job has been sent we start async_read() for the result.
154 *
155 * \sa handle_ReceiveResultFromWorker()
156 *
157 * \param e error code if something went wrong
158 * \param conn reference with the connection
159 */
160void FragmentScheduler::handle_SendJobtoWorker(const boost::system::error_code& e, connection_ptr conn)
[ed2c5b]161{
[af3aed]162 Info info(__FUNCTION__);
[ef2767]163 LOG(1, "INFO: Job sent.");
164 // obtain result
165 LOG(1, "INFO: Receiving result for a job ...");
166 conn->async_read(result,
[db03d9]167 boost::bind(&FragmentScheduler::handle_ReceiveResultFromWorker, this,
[ef2767]168 boost::asio::placeholders::error, conn));
169}
170
[db03d9]171/** Callback function when result has been received.
172 *
173 * \param e error code if something went wrong
174 * \param conn reference with the connection
175 */
176void FragmentScheduler::handle_ReceiveResultFromWorker(const boost::system::error_code& e, connection_ptr conn)
[ef2767]177{
[db03d9]178 Info info(__FUNCTION__);
179 LOG(1, "INFO: Received result for job #" << result.getId() << " ...");
180 ASSERT(result.getId() != (JobId_t)JobId::NoJob,
181 "FragmentScheduler::handle_ReceiveResultFromWorker() - result received has NoJob id.");
182 ASSERT(result.getId() != (JobId_t)JobId::IllegalJob,
183 "FragmentScheduler::handle_ReceiveResultFromWorker() - result received has IllegalJob id.");
[778abb]184 // place id into expected
[db03d9]185 if ((result.getId() != (JobId_t)JobId::NoJob) && (result.getId() != (JobId_t)JobId::IllegalJob))
186 JobsQueue.pushResult(result);
187 // erase result
188 result = FragmentResult(JobId::NoJob);
[778abb]189 LOG(1, "INFO: JobsQueue has " << JobsQueue.getDoneJobs() << " results.");
[db03d9]190}
191
192/** Handle a new controller connection.
193 *
194 * \sa handle_ReceiveJobs()
195 * \sa handle_CheckResultState()
196 * \sa handle_SendResults()
197 *
198 * \param e error code if something went wrong
199 * \param conn reference with the connection
200 */
201void FragmentScheduler::handle_AcceptController(const boost::system::error_code& e, connection_ptr conn)
202{
203 Info info(__FUNCTION__);
204 if (!e)
205 {
[778abb]206 conn->async_read(choice,
207 boost::bind(&FragmentScheduler::handle_ReadChoice, this,
208 boost::asio::placeholders::error, conn));
209 }
210 else
211 {
212 // An error occurred. Log it and return. Since we are not starting a new
213 // accept operation the io_service will run out of work to do and the
214 // server will exit.
215 Exitflag = ControllerErrorFlag;
216 ELOG(0, e.message());
217 }
218}
219
220/** Controller callback function to read the choice for next operation.
221 *
222 * \param e error code if something went wrong
223 * \param conn reference with the connection
224 */
225void FragmentScheduler::handle_ReadChoice(const boost::system::error_code& e, connection_ptr conn)
226{
227 Info info(__FUNCTION__);
228 if (!e)
229 {
[0196c6]230 bool LaunchNewAcceptor = true;
[778abb]231 // switch over the desired choice read previously
232 switch(choice) {
233 case NoOperation:
234 {
235 ELOG(1, "FragmentScheduler::handle_ReadChoice() - called with NoOperation.");
236 break;
237 }
238 case ReceiveJobs:
239 {
240 // The connection::async_write() function will automatically
241 // serialize the data structure for us.
242 LOG(1, "INFO: Receiving bunch of jobs from a controller ...");
243 conn->async_read(jobs,
244 boost::bind(&FragmentScheduler::handle_ReceiveJobs, this,
245 boost::asio::placeholders::error, conn));
246 break;
247 }
248 case CheckState:
249 {
[3c4a5e]250 // first update number
251 doneJobs = JobsQueue.getDoneJobs();
252 // now we accept connections to check for state of calculations
[778abb]253 LOG(1, "INFO: Sending state that "+toString(doneJobs)+" jobs are done to controller ...");
[3c4a5e]254 conn->async_write(doneJobs,
255 boost::bind(&FragmentScheduler::handle_CheckResultState, this,
256 boost::asio::placeholders::error, conn));
[778abb]257 break;
258 }
259 case SendResults:
260 {
261 const std::vector<FragmentResult> results = JobsQueue.getAllResults();
262 // ... or we give the results
263 LOG(1, "INFO: Sending "+toString(results.size())+" results to controller ...");
264 conn->async_write(results,
265 boost::bind(&FragmentScheduler::handle_SendResults, this,
266 boost::asio::placeholders::error, conn));
[0196c6]267 break;
268 }
269 case Shutdown:
270 {
271 LaunchNewAcceptor = false;
[778abb]272 break;
[db03d9]273 }
[778abb]274 default:
275 Exitflag = ControllerErrorFlag;
276 ELOG(1, "FragmentScheduler::handle_ReadChoice() - called with no valid choice.");
277 break;
278 }
279 // restore NoOperation choice such that choice is not read twice
280 choice = NoOperation;
281
[0196c6]282 if (LaunchNewAcceptor) {
283 LOG(1, "Launching new acceptor on socket.");
284 // Start an accept operation for a new Connection.
285 connection_ptr new_conn(new Connection(controller_acceptor_.get_io_service()));
286 controller_acceptor_.async_accept(new_conn->socket(),
287 boost::bind(&FragmentScheduler::handle_AcceptController, this,
288 boost::asio::placeholders::error, new_conn));
289 }
[db03d9]290 }
291 else
292 {
293 // An error occurred. Log it and return. Since we are not starting a new
294 // accept operation the io_service will run out of work to do and the
295 // server will exit.
[3c4a5e]296 Exitflag = ControllerErrorFlag;
[db03d9]297 ELOG(0, e.message());
298 }
299}
300
301/** Controller callback function when job has been sent.
[778abb]302 *
303 * We check here whether the worker socket is accepting, if there
304 * have been no jobs we re-activate it, as it is shut down after
305 * last job.
[db03d9]306 *
307 * \param e error code if something went wrong
308 * \param conn reference with the connection
309 */
310void FragmentScheduler::handle_ReceiveJobs(const boost::system::error_code& e, connection_ptr conn)
311{
312 Info info(__FUNCTION__);
[778abb]313 bool initiateSocket = !JobsQueue.isJobPresent();
314
[db03d9]315 // jobs are received, hence place in JobsQueue
316 if (!jobs.empty()) {
317 LOG(1, "INFO: Pushing " << jobs.size() << " jobs into queue.");
318 JobsQueue.pushJobs(jobs);
[778abb]319 // initiate socket if we had no jobs before
320 if (initiateSocket)
321 initiateWorkerSocket();
[db03d9]322 }
323
324 jobs.clear();
[778abb]325
[ed2c5b]326}
[cd4a6e]327
[3c4a5e]328/** Controller callback function when checking on state of results.
329 *
330 * \param e error code if something went wrong
331 * \param conn reference with the connection
332 */
333void FragmentScheduler::handle_CheckResultState(const boost::system::error_code& e, connection_ptr conn)
334{
335 Info info(__FUNCTION__);
336 // do nothing
337 LOG(1, "INFO: Sent that " << doneJobs << " jobs are done.");
338}
[778abb]339
340/** Controller callback function when result has been received.
341 *
342 * \param e error code if something went wrong
343 * \param conn reference with the connection
344 */
345void FragmentScheduler::handle_SendResults(const boost::system::error_code& e, connection_ptr conn)
346{
347 Info info(__FUNCTION__);
348 // do nothing
349 LOG(1, "INFO: Results have been sent.");
350}
351
Note: See TracBrowser for help on using the repository browser.