MADNESS 0.10.1
macrotaskq.h
Go to the documentation of this file.
1/**
2 \file macrotaskq.h
3 \brief Declares the \c macrotaskq and MacroTaskBase classes
4 \ingroup mra
5
6 A MacroTaskq executes tasks on World objects, e.g. differentiation of a function or other
7 arithmetic. Complex algorithms can be implemented.
8
9 The universe world is split into subworlds, each of them executing macrotasks of the task queue.
10 This improves locality and speedups for large number of compute nodes, by reducing communications
11 within worlds.
12
13 The user defines a macrotask (an example is found in test_vectormacrotask.cc), the tasks are
14 lightweight and carry only bookkeeping information, actual input and output are stored in a
15 cloud (see cloud.h)
16
17 The user-defined macrotask is derived from MacroTaskIntermediate and must implement the run()
18 method. A heterogeneous task queue is possible.
19
20 The result of a macrotask is an object that lives in the universe and that is accessible from all
21 subworlds. The result is accumulated in the universe and must therefore be a WorldObject. Currently we
22 have implemented
23 - Function<T,NDIM>
24 - std::vector<Function<T,NDIM>> (a vector of Function<T,NDIM>)
25 - ScalarResultImpl<T> (a scalar value)
26 - std::vector<std::shared_ptr<ScalarResultImpl<T>>> (a vector of scalar values), shared_ptr for technical reasons
27
28 - std::tuple<std::vector<XXX>, std::vector<YYY>> (a tuple of n vectors of WorldObjects: XXX, YYY, .. = {Function, ScalarResultImpl, ...})
29
30
31 TODO: priority q
32 TODO: task submission from inside task (serialize task instead of replicate)
33 TODO: update documentation
34 TODO: consider serializing task member variables
35
36*/
37
38
39
40#ifndef SRC_MADNESS_MRA_MACROTASKQ_H_
41#define SRC_MADNESS_MRA_MACROTASKQ_H_
42
43#include <madness/world/cloud.h>
44#include <madness/world/world.h>
46
47namespace madness {
48
49/// helper class for returning the result of a task, which is not a madness Function, but a simple scalar
50
51/// the result value is accumulated via gaxpy in universe rank=0, after completion of the taskq the final
52/// value can be obtained via get(), which includes a broadcast of the final value to all processes
53template<typename T>
54class ScalarResultImpl : public WorldObject<ScalarResultImpl<T>> {
55public:
56 typedef T value_type;
60
61 /// Disable the default copy constructor
62 ScalarResultImpl(const ScalarResultImpl& other) = delete;
63 // ScalarResultImpl<T>(ScalarResultImpl<T>&& ) = default;
64
65 /// disable assignment operator
67
69 // print("calling destructor of ScalarResultImpl",this->id());
70 // std::cout << std::flush;
71 }
72
73 /// simple assignment of the scalar value
75 value = x;
76 return *this;
77 }
78
80 gaxpy(1.0, x, 1.0,true);
81 return *this;
82 }
83
84 /// accumulate, optional fence
85 void gaxpy(const double a, const T& right, double b, const bool fence=true) {
86 if (this->get_world().rank()==0) {
87 value =a*value + b * right;
88 }
89 else this->send(0, &ScalarResultImpl<T>::gaxpy, a, right, b, fence);
90 }
91
92 template<typename Archive>
93 void serialize(Archive &ar) {
94 ar & value;
95 }
96
97 /// after completion of the taskq get the final value
98 T get() {
99 this->get_world().gop.broadcast_serializable(*this, 0);
100 return value;
101 }
102
103 /// get the local value of this rank, which might differ for different ranks
104 /// for the final value use get()
105 T get_local() const {
106 return value;
107 }
108
109private:
110 /// the scalar value
112};
113
114template<typename T=double>
116public:
118 std::shared_ptr<implT> impl;
119
120 ScalarResult() = default;
121 ScalarResult(World &world) : impl(new implT(world)) {}
122 ScalarResult(const std::shared_ptr<implT>& impl) : impl(impl) {}
124 *(this->impl) = x;
125 return *this;
126 }
127
128 std::shared_ptr<implT> get_impl() const {
129 return impl;
130 }
131
132 void set_impl(const std::shared_ptr<implT>& newimpl) {
133 impl=newimpl;
134 }
135
136 uniqueidT id() const {
137 return impl->id();
138 }
139
140 /// accumulate, optional fence
141 void gaxpy(const double a, const T& right, double b, const bool fence=true) {
142 impl->gaxpy(a,right,b,fence);
143 }
144
145 template<typename Archive>
146 void serialize(Archive &ar) {
147 ar & impl;
148 }
149
150 /// after completion of the taskq get the final value
151 T get() {
152 return impl->get();
153 }
154
155 /// after completion of the taskq get the final value
156 T get_local() const {
157 return impl->get_local();
158 }
159
160};
161
162/// helper function to create a vector of ScalarResultImpl, circumventing problems with the constructors
163template<typename T>
164std::vector<ScalarResult<T>> scalar_result_vector(World& world, std::size_t n) {
165 std::vector<ScalarResult<T>> v;
166 for (std::size_t i=0; i<n; ++i) v.emplace_back(ScalarResult<T>(world));
167 return v;
168}
169
170
171// type traits to check if a template parameter is a WorldContainer
172template<typename>
173struct is_scalar_result_ptr : std::false_type {};
174
175template <typename T>
176struct is_scalar_result_ptr<std::shared_ptr<madness::ScalarResultImpl<T>>> : std::true_type {};
177
178template<typename>
179struct is_scalar_result_ptr_vector : std::false_type {
180};
181
182template<typename T>
183struct is_scalar_result_ptr_vector<std::vector<std::shared_ptr<typename madness::ScalarResultImpl<T>>>> : std::true_type {
184};
185
186// type traits to check if a template parameter is a WorldContainer
187template<typename>
188struct is_scalar_result : std::false_type {};
189
190template <typename T>
191struct is_scalar_result<madness::ScalarResult<T>> : std::true_type {};
192
193template<typename>
194struct is_scalar_result_impl : std::false_type {};
195
196template <typename T>
197struct is_scalar_result<madness::ScalarResultImpl<T>> : std::true_type {};
198
199template<typename>
200struct is_scalar_result_vector : std::false_type {
201};
202
203template<typename T>
204struct is_scalar_result_vector<std::vector<typename madness::ScalarResult<T>>> : std::true_type {
205};
206
207/// check if type is a valid task result: it must be a WorldObject and must implement gaxpy
208template <typename T>
209inline constexpr bool is_valid_task_result_v =
210 is_madness_function<T>::value // Function<T,NDIM>
211 || is_madness_function_vector<T>::value // std::vector<Function<T,NDIM>>
212 || is_scalar_result<T>::value // ScalarResultImpl<T>
213 || is_scalar_result_vector<T>::value // std::vector<std::shared_ptr<ScalarResultImpl<T>>>
214 || is_scalar_result_ptr<T>::value // ScalarResultImpl<T>
215 || is_scalar_result_ptr_vector<T>::value; // std::vector<std::shared_ptr<ScalarResultImpl<T>>>
216
217
218template<typename> struct is_tuple : std::false_type { };
219template<typename ...T> struct is_tuple<std::tuple<T...>> : std::true_type { };
220
221/// given a tuple check recursively if all elements are valid task results
222template<typename tupleT, std::size_t I>
224
225 typedef decay_tuple <tupleT> argtupleT; // removes const, &, etc
226
227 if constexpr(I >= std::tuple_size_v<tupleT>) {
228 // Last case, if nothing is left to iterate, then exit the function
229 return true;
230 } else {
231 using typeT = typename std::tuple_element<I, argtupleT>::type;// use decay types for determining a vector
232 if constexpr (not is_valid_task_result_v<typeT>) {
233 return false;
234 } else {
235 // Going for next element.
236 return check_tuple_is_valid_task_result<tupleT,I+1>();
237 }
238 }
239}
240
241
242
243/// the result type of a macrotask must implement gaxpy
244template<typename T>
245void gaxpy(const double a, ScalarResult<T>& left, const double b, const T& right, const bool fence=true) {
246 left.gaxpy(a, right, b, fence);
247}
248
249template <class Archive, typename T>
250struct madness::archive::ArchiveStoreImpl<Archive, std::shared_ptr<ScalarResultImpl<T>>> {
251 static void store(const Archive& ar, const std::shared_ptr<ScalarResultImpl<T>>& ptr) {
252 bool exists=(ptr) ? true : false;
253 ar & exists;
254 if (exists) ar & ptr->id();
255 }
256};
257
258
259template <class Archive, typename T>
260struct madness::archive::ArchiveLoadImpl<Archive, std::shared_ptr<ScalarResultImpl<T>>> {
261 static void load(const Archive& ar, std::shared_ptr<ScalarResultImpl<T>>& ptr) {
262 bool exists=false;
263 ar & exists;
264 if (exists) {
265 uniqueidT id;
266 ar & id;
267 World* world = World::world_from_id(id.get_world_id());
268 MADNESS_ASSERT(world);
269 auto ptr_opt = (world->ptr_from_id< ScalarResultImpl<T> >(id));
270 if (!ptr_opt)
271 MADNESS_EXCEPTION("ScalarResultImpl: remote operation attempting to use a locally uninitialized object",0);
272 ptr.reset(ptr_opt.value(), [] (ScalarResultImpl<T> *p_) -> void {}); // disable destruction
273 if (!ptr)
274 MADNESS_EXCEPTION("ScalarResultImpl<T> operation attempting to use an unregistered object",0);
275 } else {
276 ptr=nullptr;
277 }
278 }
279};
280
281
282/// base class
284public:
285
286 typedef std::vector<std::shared_ptr<MacroTaskBase> > taskqT;
287
289 virtual ~MacroTaskBase() {};
290
291 double priority=1.0;
293
297
298 bool is_complete() const {return stat==Complete;}
299 bool is_running() const {return stat==Running;}
300 bool is_waiting() const {return stat==Waiting;}
301
302 virtual void run(World& world, Cloud& cloud, taskqT& taskq, const long element, const bool debug) = 0;
303 virtual void cleanup() = 0; // clear static data (presumably persistent input data)
304
305 virtual void print_me(std::string s="") const {
306 printf("this is task with priority %4.1f\n",priority);
307 }
308 virtual void print_me_as_table(std::string s="") const {
309 print("nothing to print");
310 }
312 std::stringstream ss;
313 ss << std::setw(5) << this->get_priority() << " " <<this->stat;
314 return ss.str();
315 }
316
317 double get_priority() const {return priority;}
318 void set_priority(const double p) {priority=p;}
319
320 friend std::ostream& operator<<(std::ostream& os, const MacroTaskBase::Status s) {
321 if (s==MacroTaskBase::Status::Running) os << "Running";
322 if (s==MacroTaskBase::Status::Waiting) os << "Waiting";
323 if (s==MacroTaskBase::Status::Complete) os << "Complete";
324 if (s==MacroTaskBase::Status::Unknown) os << "Unknown";
325 return os;
326 }
327};
328
329
330template<typename macrotaskT>
332
333public:
334
336
338
339 void cleanup() {};
340};
341
342
343
344class MacroTaskQ : public WorldObject< MacroTaskQ> {
345
347 std::shared_ptr<World> subworld_ptr;
349 std::mutex taskq_mutex;
351 long nsubworld=1;
352 std::shared_ptr< WorldDCPmapInterface< Key<1> > > pmap1;
353 std::shared_ptr< WorldDCPmapInterface< Key<2> > > pmap2;
354 std::shared_ptr< WorldDCPmapInterface< Key<3> > > pmap3;
355 std::shared_ptr< WorldDCPmapInterface< Key<4> > > pmap4;
356 std::shared_ptr< WorldDCPmapInterface< Key<5> > > pmap5;
357 std::shared_ptr< WorldDCPmapInterface< Key<6> > > pmap6;
358
359 bool printdebug() const {return printlevel>=10;}
360 bool printprogress() const {return (printlevel>=3) and (not (printdebug()));}
361 bool printtimings() const {return universe.rank()==0 and printlevel>=3;}
362
363public:
364
367 long get_nsubworld() const {return nsubworld;}
368 void set_printlevel(const long p) {printlevel=p;}
369
370 /// create an empty taskq and initialize the subworlds
371 MacroTaskQ(World& universe, int nworld, const long printlevel=0)
374 , taskq()
376 , nsubworld(nworld)
377 , cloud(universe)
378 {
379
381 this->process_pending();
382 }
383
385
386 /// for each process create a world using a communicator shared with other processes by round-robin
387 /// copy-paste from test_world.cc
388static std::shared_ptr<World> create_worlds(World& universe, const std::size_t nsubworld) {
389
390 int color = universe.rank() % nsubworld;
392
393 std::shared_ptr<World> all_worlds;
394 all_worlds.reset(new World(comm));
395
397 return all_worlds;
398 }
399
400 /// run all tasks
401 void run_all() {
402
403 if (printdebug()) print_taskq();
404 if (printtimings()) {
405 print("number of tasks in taskq",taskq.size());
406 print("redirecting output to files task.#####");
407 }
408
409 double cpu0=cpu_time();
412 double cpu1=cpu_time();
413 if (printtimings()) print("cloud replication wall time",cpu1-cpu0);
415 universe.gop.set_forbid_fence(true); // make sure there are no hidden universe fences
423
424 double cpu00=cpu_time();
425
426 World& subworld=get_subworld();
427// if (printdebug()) print("I am subworld",subworld.id());
428 double tasktime=0.0;
429 if (printprogress() and universe.rank()==0) std::cout << "progress in percent: " << std::flush;
430 while (true) {
431 long element=get_scheduled_task_number(subworld);
432 double cpu0=cpu_time();
433 if (element<0) break;
434 std::shared_ptr<MacroTaskBase> task=taskq[element];
435 if (printdebug()) print("starting task no",element, "in subworld",subworld.id(),"at time",wall_time());
436
437 task->run(subworld,cloud, taskq, element, printdebug());
438
439 double cpu1=cpu_time();
440 set_complete(element);
441 tasktime+=(cpu1-cpu0);
442 if (printdebug()) printf("completed task %3ld after %6.1fs at time %6.1fs\n",element,cpu1-cpu0,wall_time());
443
444 // print progress
445 const std::size_t ntask=taskq.size();
446 // return percentile of ntask for element
447 auto in_percentile = [&ntask](const long element) {
448 return std::floor(element/(0.1*(ntask+1)));
449 };
450 auto is_first_in_percentile = [&](const long element) {
451 return (in_percentile(element)!=in_percentile(element-1));
452 };
453 if (printprogress() and is_first_in_percentile(element)) {
454 std::cout << int(in_percentile(element)*10) << " " << std::flush;
455 }
456 }
459 universe.gop.sum(tasktime);
460 if (printprogress() and universe.rank()==0) std::cout << std::endl;
461 double cpu11=cpu_time();
463 if (printtimings()) {
464 printf("completed taskqueue after %4.1fs at time %4.1fs\n", cpu11 - cpu00, wall_time());
465 printf(" total cpu time / per world %4.1fs %4.1fs\n", tasktime, tasktime / universe.size());
466 }
467
468 // cleanup task-persistent input data
469 for (auto& task : taskq) task->cleanup();
470 cloud.clear_cache(subworld);
471 cloud.clear();
472 subworld.gop.fence();
473 subworld.gop.fence();
482 }
483
485 for (const auto& t : vtask) {
486 if (universe.rank()==0) t->set_waiting();
488 }
489 }
490
491 void print_taskq() const {
493 if (universe.rank()==0) {
494 print("\ntaskq on universe rank",universe.rank());
495 print("total number of tasks: ",taskq.size());
496 print(" task batch priority status");
497 for (const auto& t : taskq) t->print_me_as_table();
498 }
500 }
501
502private:
503 void add_replicated_task(const std::shared_ptr<MacroTaskBase>& task) {
504 taskq.push_back(task);
505 }
506
507 /// scheduler is located on universe.rank==0
509 long number=0;
510 if (subworld.rank()==0) {
512 number=r.get();
513 }
514 subworld.gop.broadcast_serializable(number, 0);
515 subworld.gop.fence();
516 return number;
517
518 }
519
522 std::lock_guard<std::mutex> lock(taskq_mutex);
523
524 auto is_Waiting = [](const std::shared_ptr<MacroTaskBase>& mtb_ptr) {return mtb_ptr->is_waiting();};
525 auto it=std::find_if(taskq.begin(),taskq.end(),is_Waiting);
526 if (it!=taskq.end()) {
527 it->get()->set_running();
528 long element=it-taskq.begin();
529 return element;
530 }
531// print("could not find task to schedule");
532 return -1;
533 }
534
535 /// scheduler is located on rank==0
536 void set_complete(const long task_number) const {
537 this->task(ProcessID(0), &MacroTaskQ::set_complete_local, task_number);
538 }
539
540 /// scheduler is located on rank==0
541 void set_complete_local(const long task_number) const {
543 taskq[task_number]->set_complete();
544 }
545
546public:
555private:
556 std::size_t size() const {
557 return taskq.size();
558 }
559
560};
561
562
563
564
565template<typename taskT>
568
569 template<typename Q>
570 struct is_vector : std::false_type {
571 };
572 template<typename Q>
573 struct is_vector<std::vector<Q>> : std::true_type {
574 };
575
576 typedef typename taskT::resultT resultT;
577 typedef typename taskT::argtupleT argtupleT;
579 taskT task;
580 bool debug=false;
581
582 /// RAII class to redirect cout to a file
583 struct io_redirect {
584 std::streambuf* stream_buffer_cout;
585 std::ofstream ofile;
586 bool debug=false;
587
588 io_redirect(const long task_number, std::string filename, bool debug=false) : debug(debug) {
589 constexpr std::size_t bufsize=256;
590 char cfilename[bufsize];
591 std::snprintf(cfilename,bufsize,"%s.%5.5ld",filename.c_str(),task_number);
592 ofile=std::ofstream(cfilename);
593 if (debug) std::cout << "redirecting to file " << cfilename << std::endl;
594 stream_buffer_cout = std::cout.rdbuf(ofile.rdbuf());
595 std::cout.sync_with_stdio(true);
596 }
597
599 std::cout.rdbuf(stream_buffer_cout);
600 ofile.close();
601 std::cout.sync_with_stdio(true);
602 if (debug) std::cout << "redirecting back to cout" << std::endl;
603 }
604 };
605
606
607public:
608
609 /// constructor takes the actual task
610 MacroTask(World &world, taskT &task, std::shared_ptr<MacroTaskQ> taskq_ptr = 0)
612 if (taskq_ptr) {
613 // for the time being this condition must hold because tasks are
614 // constructed as replicated objects and are not broadcast to other processes
615 MADNESS_CHECK(world.id()==taskq_ptr->get_world().id());
616 }
617 }
618
619 void set_debug(const bool value) {
620 debug=value;
621 }
622
623
624 /// this mimicks the original call to the task functor, called from the universe
625
626 /// store all input to the cloud, create output Function<T,NDIM> in the universe,
627 /// create the batched task and shove it into the taskq. Possibly execute the taskq.
628 template<typename ... Ts>
629 resultT operator()(const Ts &... args) {
630
631 const bool immediate_execution = (not taskq_ptr);
632 if (not taskq_ptr) taskq_ptr.reset(new MacroTaskQ(world, world.size()));
633 if (debug) taskq_ptr->set_printlevel(20);
634
635 auto argtuple = std::tie(args...);
636 static_assert(std::is_same<decltype(argtuple), argtupleT>::value, "type or number of arguments incorrect");
637
638 // partition the argument vector into batches
639 auto partitioner=task.partitioner;
640 if (not partitioner) partitioner.reset(new MacroTaskPartitioner);
641 partitioner->set_nsubworld(world.size());
642 partitionT partition = partitioner->partition_tasks(argtuple);
643
644 // store input and output: output being a pointer to a universe function (vector)
645 recordlistT inputrecords = taskq_ptr->cloud.store(world, argtuple);
646 resultT result = task.allocator(world, argtuple);
647 auto outputrecords =prepare_output_records(taskq_ptr->cloud, result);
648
649 // create tasks and add them to the taskq
651 for (const auto& batch_prio : partition) {
652 vtask.push_back(
653 std::shared_ptr<MacroTaskBase>(new MacroTaskInternal(task, batch_prio, inputrecords, outputrecords)));
654 }
655 taskq_ptr->add_tasks(vtask);
656
657 if (immediate_execution) taskq_ptr->run_all();
658
659 return result;
660 }
661
662//private:
663
665 std::shared_ptr<MacroTaskQ> taskq_ptr;
666private:
667
668
669 /// store *pointers* to the result WorldObject in the cloud and return the recordlist
671 if constexpr (is_tuple<resultT>::value) {
672 static_assert(check_tuple_is_valid_task_result<resultT,0>(),
673 "tuple has invalid result type in prepare_output_records");
674 } else {
675 static_assert(is_valid_task_result_v<resultT>, "unknown result type in prepare_output_records");
676 }
677
678 if (debug) print("storing pointers to output in cloud");
679 // store an element of the tuple only
680 auto store_output_records = [&](const auto& result) {
681 recordlistT outputrecords;
682 typedef std::decay_t<decltype(result)> argT;
683 if constexpr (is_madness_function<argT>::value) {
684 outputrecords += cloud.store(world, result.get_impl().get()); // store pointer to FunctionImpl
685 } else if constexpr (is_madness_function_vector<argT>::value) {
686 outputrecords += cloud.store(world, get_impl(result));
687 } else if constexpr (is_scalar_result<argT>::value) {
688 outputrecords += cloud.store(world, result.get_impl()); // store pointer to ScalarResultImpl
689 } else if constexpr (is_vector<argT>::value) {
691 // argT = std::vector<ScalarResult<T>>
692 std::vector<std::shared_ptr<typename argT::value_type::implT>> v;
693 for (const auto& ptr : result) v.push_back(ptr.get_impl());
694 outputrecords+=cloud.store(world,v);
695 } else {
696 MADNESS_EXCEPTION("\n\n unknown vector result type in prepare_input ", 1);
697 }
698 } else {
699 MADNESS_EXCEPTION("should not be here",1);
700 }
701 return outputrecords;
702 };
703
704 recordlistT outputrecords;
705 if constexpr (is_tuple<resultT>::value) {
706 // loop over tuple elements -- args is the individual tuple element
707 std::apply([&](auto &&... args) {
708 (( outputrecords+=store_output_records(args) ), ...);
709 }, result);
710 } else {
711 outputrecords=store_output_records(result);
712 }
713 return outputrecords;
714 }
715
716
717 class MacroTaskInternal : public MacroTaskIntermediate<MacroTask> {
718
719 typedef decay_tuple<typename taskT::argtupleT> argtupleT; // removes const, &, etc
720 typedef typename taskT::resultT resultT;
723 public:
724 taskT task;
725 std::string get_name() const {
726 if (task.name=="unknown_task") return typeid(task).name();
727 return task.name;
728 }
729
730 MacroTaskInternal(const taskT &task, const std::pair<Batch,double> &batch_prio,
733 if constexpr (is_tuple<resultT>::value) {
734 static_assert(check_tuple_is_valid_task_result<resultT,0>(),
735 "tuple has invalid result type in prepare_output_records");
736 } else {
737 static_assert(is_valid_task_result_v<resultT>, "unknown result type in prepare_output_records");
738 }
739 this->task.batch=batch_prio.first;
740 this->priority=batch_prio.second;
741 }
742
743
744 void print_me(std::string s="") const override {
745 print("this is task",get_name(),"with batch", task.batch,"priority",this->get_priority());
746 }
747
748 void print_me_as_table(std::string s="") const override {
749 std::stringstream ss;
750 std::string name=get_name();
751 std::size_t namesize=std::min(std::size_t(28),name.size());
752 name += std::string(28-namesize,' ');
753
754 std::stringstream ssbatch;
755 ssbatch << task.batch;
756 std::string strbatch=ssbatch.str();
757 int nspaces=std::max(int(0),35-int(ssbatch.str().size()));
758 strbatch+=std::string(nspaces,' ');
759
760 ss << name
761 << std::setw(10) << strbatch
763 print(ss.str());
764 }
765
766 /// loop over the tuple elements of both tuples and execute the operation op on each element pair
767 template<typename tupleT, typename tupleR, typename opT, std::size_t I=0>
768 void binary_tuple_loop(tupleT& tuple1, tupleR& tuple2, opT& op) const {
769 if constexpr(I < std::tuple_size_v<tupleT>) {
770 auto& element1=std::get<I>(tuple1);
771 auto& element2=std::get<I>(tuple2);
772 op(element1,element2);
773 binary_tuple_loop<tupleT, tupleR, opT, I+1>(tuple1,tuple2,op);
774 }
775 }
776
777 template<typename tupleT, typename opT, std::size_t I=0>
778 void unary_tuple_loop(tupleT& tuple, opT& op) const {
779 if constexpr(I < std::tuple_size_v<tupleT>) {
780 auto& element1=std::get<I>(tuple);
781 op(element1);
782 unary_tuple_loop<tupleT,opT, I+1>(tuple,op);
783 }
784 }
785
786 /// accumulate the result of the task into the final result living in the universe
787 template<typename resultT1, std::size_t I=0>
788 typename std::enable_if<is_tuple<resultT1>::value, void>::type
789 accumulate_into_final_result(World &subworld, resultT1 &final_result, const resultT1 &tmp_result, const argtupleT& argtuple) {
790 if constexpr(I < std::tuple_size_v<resultT1>) {
791 using elementT = typename std::tuple_element<I, resultT>::type;// use decay types for determining a vector
792 auto element_final=std::get<I>(final_result);
793 auto element_tmp=std::get<I>(tmp_result);
794 accumulate_into_final_result<elementT>(subworld, element_final, element_tmp, argtuple);
795 accumulate_into_final_result<resultT1,I+1>(subworld, final_result, tmp_result, argtuple);
796 }
797 }
798
799 /// accumulate the result of the task into the final result living in the universe
800 template<typename resultT1>
801 typename std::enable_if<not is_tuple<resultT1>::value, void>::type
802 accumulate_into_final_result(World &subworld, resultT1 &result, const resultT1 &result_tmp, const argtupleT& argtuple) {
804 // gaxpy can be done in reconstructed or compressed mode
805 TreeState operating_state=result_tmp.get_impl()->get_tensor_type()==TT_FULL ? compressed : reconstructed;
806 result_tmp.change_tree_state(operating_state);
807 gaxpy(1.0,result,1.0, result_tmp);
809 TreeState operating_state=result_tmp[0].get_impl()->get_tensor_type()==TT_FULL ? compressed : reconstructed;
810 change_tree_state(result_tmp,operating_state);
811 // compress(subworld, result_tmp);
812 // resultT1 tmp1=task.allocator(subworld,argtuple);
813 // tmp1=task.batch.template insert_result_batch(tmp1,result_tmp);
814 gaxpy(1.0,result,1.0,result_tmp,false);
815 // was using operator+=, but this requires a fence, which is not allowed here..
816 // result += tmp1;
817 } else if constexpr (is_scalar_result<resultT1>::value) {
818 gaxpy(1.0, result, 1.0, result_tmp.get_local(), false);
819 } else if constexpr (is_scalar_result_vector<resultT1>::value) {
820 // resultT1 tmp1=task.allocator(subworld,argtuple);
821 // tmp1=task.batch.template insert_result_batch(tmp1,result_tmp);
822 std::size_t sz=result.size();
823 for (int i=0; i<sz; ++i) {
824 gaxpy(1.0, result[i], 1.0, result_tmp[i].get_local(), false);
825 }
826 }
827
828 }
829
830
831 void run(World &subworld, Cloud &cloud, MacroTaskBase::taskqT &taskq, const long element, const bool debug) override {
832 io_redirect io(element,get_name()+"_task",debug);
833 const argtupleT argtuple = cloud.load<argtupleT>(subworld, inputrecords);
834 const argtupleT batched_argtuple = task.batch.template copy_input_batch(argtuple);
835 try {
836 print("starting task no",element, ", '",get_name(),"', in subworld",subworld.id(),"at time",wall_time());
837 double cpu0=cpu_time();
838 resultT result_batch = std::apply(task, batched_argtuple); // lives in the subworld, is a batch of the full vector (if applicable)
839 double cpu1=cpu_time();
840 constexpr std::size_t bufsize=256;
841 char buffer[bufsize];
842 std::snprintf(buffer,bufsize,"completed task %3ld after %6.1fs at time %6.1fs\n",element,cpu1-cpu0,wall_time());
843 print(std::string(buffer));
844
845 // move the result from the batch to the final result, all still in subworld
846 auto insert_batch = [&](auto& element1, auto& element2) {
847 typedef std::decay_t<decltype(element1)> decay_type;;
848 if constexpr (is_vector<decay_type>::value) {
849 element1=task.batch.template insert_result_batch(element1,element2);
850 } else {
851 std::swap(element1,element2);
852 }
853 };
854 resultT result_subworld=task.allocator(subworld,argtuple);
855 if constexpr (is_tuple<resultT>::value) {
856 binary_tuple_loop(result_subworld, result_batch, insert_batch);
857 } else {
858 insert_batch(result_subworld,result_batch);
859 }
860
861 // accumulate the subworld-local results into the final, universe result
862 resultT result_universe=get_output(subworld, cloud); // lives in the universe
863
864 accumulate_into_final_result<resultT>(subworld, result_universe, result_subworld, argtuple);
865
866 } catch (std::exception& e) {
867 print("failing task no",element,"in subworld",subworld.id(),"at time",wall_time());
868 print(e.what());
870 print("\n\n");
871 MADNESS_EXCEPTION("failing task",1);
872 }
873
874 };
875
876 // this is called after all tasks have been executed and the taskq has ended
877 void cleanup() override {
878 // resultT result_universe=get_output(subworld, cloud); // lives in the universe
879
880 }
881
882 template<typename T, std::size_t NDIM>
883 static Function<T,NDIM> pointer2WorldObject(const std::shared_ptr<FunctionImpl<T,NDIM>> impl) {
884 Function<T,NDIM> result;
885 result.set_impl(impl);
886 return result;
887 }
888
889 template<typename T, std::size_t NDIM>
890 static std::vector<Function<T,NDIM>> pointer2WorldObject(const std::vector<std::shared_ptr<FunctionImpl<T,NDIM>>> v_impl) {
891 std::vector<Function<T,NDIM>> vresult;
892 vresult.resize(v_impl.size());
893 set_impl(vresult,v_impl);
894 return vresult;
895 }
896
897 template<typename T>
898 static ScalarResult<T> pointer2WorldObject(const std::shared_ptr<ScalarResultImpl<T>> sr_impl) {
899 return ScalarResult(sr_impl);
900 }
901
902 template<typename T>
903 static std::vector<ScalarResult<T>> pointer2WorldObject(const std::vector<std::shared_ptr<ScalarResultImpl<T>>> v_sr_impl) {
904 std::vector<ScalarResult<T>> vresult(v_sr_impl.size());
905 for (auto i=0; i<v_sr_impl.size(); ++i) {
906 vresult[i].set_impl(v_sr_impl[i]);
907 }
908 return vresult;
909 }
910
911 /// return the WorldObjects or the result functions living in the universe
912
913 /// read the pointers to the universe WorldObjects from the cloud,
914 /// convert them to actual WorldObjects and return them
915 resultT get_output(World &subworld, Cloud &cloud) {
916 resultT result;
917
918 // save outputrecords, because they will be consumed by the cloud
919 auto outputrecords1 = this->outputrecords;
920
921 // turn an element of the tuple of pointers into an element of the tuple of WorldObjects
922 auto doit = [&](auto& element) {
923 typedef std::decay_t<decltype(element)> elementT;
924
925 // load the elements from the cloud -- they contain pointers to WorldObjects
927 typedef typename elementT::value_type::implT implT;
928 auto ptr_element = cloud.consuming_load<std::vector<std::shared_ptr<implT>>>(
929 subworld, outputrecords1);
930 element = pointer2WorldObject(ptr_element);
931 }
932 else if constexpr (is_madness_function<elementT>::value) {
933 typedef typename elementT::implT implT;
934 auto ptr_element = cloud.consuming_load<std::shared_ptr<implT>>(subworld, outputrecords1);
935 element = pointer2WorldObject(ptr_element);
936 }
937 else if constexpr (is_scalar_result_vector<elementT>::value) { // std::vector<ScalarResult<T>>
938 typedef typename elementT::value_type ScalarResultT;
939 typedef typename ScalarResultT::implT implT;
940 typedef std::vector<std::shared_ptr<implT>> vptrT;
941 auto ptr_element = cloud.consuming_load<vptrT>(subworld, outputrecords1);
942 element = pointer2WorldObject(ptr_element);
943 }
944 else if constexpr (is_scalar_result<elementT>::value) {
945 // elementT is a ScalarResultImpl<T>
946 // in cloud we store a std::shared_ptr<ScalarResultImpl<T>>
947 auto ptr_element = cloud.consuming_load<std::shared_ptr<typename elementT::implT>>(subworld, outputrecords1);
948 element = pointer2WorldObject(ptr_element);
949 }
950 else {
951 MADNESS_EXCEPTION("confused about the type of the result", 1);
952 }
953 };
954 if constexpr (is_tuple<resultT>::value) {
955 static_assert(check_tuple_is_valid_task_result<resultT, 0>(),
956 "invalid tuple task result -- must be vectors of functions");
957 static_assert(is_tuple<resultT>::value, "is a tuple");
958
959 // loop over all tuple elements
960 // 1. load the pointers to the WorldObjects living in the universe
961 // 2. create WorldObjects from the pointers and copy them into the tuple of type resultT
962
963 // turn the tuple of pointers into a tuple of WorldObjects
964 unary_tuple_loop(result,doit);
965
966
967 } else {
968 doit(result);
969
970 }
971 return result;
972 }
973
974 };
975
976};
977
979public:
981 std::string name="unknown_task";
982 std::shared_ptr<MacroTaskPartitioner> partitioner=0;
984};
985
986
987} /* namespace madness */
988
989#endif /* SRC_MADNESS_MRA_MACROTASKQ_H_ */
Wrapper around MPI_Comm. Has a shallow copy constructor; use Create(Get_group()) for deep copy.
Definition safempi.h:490
Intracomm Split(int Color, int Key=0) const
Definition safempi.h:635
a batch consists of a 2D-input batch and a 1D-output batch: K-batch <- (I-batch, J-batch)
Definition macrotaskpartitioner.h:124
cloud class
Definition cloud.h:147
void clear()
Definition cloud.h:258
recordlistT store(madness::World &world, const T &source)
Definition cloud.h:316
Recordlist< keyT > recordlistT
Definition cloud.h:160
void replicate(const std::size_t chunk_size=INT_MAX)
Definition cloud.h:339
void print_size(World &universe)
Definition cloud.h:193
T load(madness::World &world, const recordlistT recordlist) const
load a single object from the cloud, recordlist is kept unchanged
Definition cloud.h:276
void clear_cache(World &subworld)
Definition cloud.h:252
void print_timings(World &universe) const
Definition cloud.h:230
T consuming_load(madness::World &world, recordlistT &recordlist) const
similar to load, but will consume the recordlist
Definition cloud.h:289
static void set_default_pmap(World &world)
Sets the default process map.
Definition mraimpl.h:3548
static std::shared_ptr< WorldDCPmapInterface< Key< NDIM > > > & get_pmap()
Returns the default process map.
Definition funcdefaults.h:389
static void set_pmap(const std::shared_ptr< WorldDCPmapInterface< Key< NDIM > > > &value)
Sets the default process map (does not redistribute existing functions)
Definition funcdefaults.h:405
FunctionImpl holds all Function state to facilitate shallow copy semantics.
Definition funcimpl.h:945
A multiresolution adaptive numerical function.
Definition mra.h:139
void set_impl(const std::shared_ptr< FunctionImpl< T, NDIM > > &impl)
Replace current FunctionImpl with provided new one.
Definition mra.h:661
A future is a possibly yet unevaluated value.
Definition future.h:373
T & get(bool dowork=true) &
Gets the value, waiting if necessary.
Definition future.h:574
base class
Definition macrotaskq.h:283
void set_running()
Definition macrotaskq.h:295
virtual ~MacroTaskBase()
Definition macrotaskq.h:289
void set_waiting()
Definition macrotaskq.h:296
MacroTaskBase()
Definition macrotaskq.h:288
virtual void cleanup()=0
virtual void print_me(std::string s="") const
Definition macrotaskq.h:305
std::string print_priority_and_status_to_string() const
Definition macrotaskq.h:311
void set_complete()
Definition macrotaskq.h:294
double priority
Definition macrotaskq.h:291
bool is_complete() const
Definition macrotaskq.h:298
Status
Definition macrotaskq.h:292
@ Complete
Definition macrotaskq.h:292
@ Running
Definition macrotaskq.h:292
@ Unknown
Definition macrotaskq.h:292
@ Waiting
Definition macrotaskq.h:292
bool is_running() const
Definition macrotaskq.h:299
enum madness::MacroTaskBase::Status stat
double get_priority() const
Definition macrotaskq.h:317
void set_priority(const double p)
Definition macrotaskq.h:318
virtual void print_me_as_table(std::string s="") const
Definition macrotaskq.h:308
std::vector< std::shared_ptr< MacroTaskBase > > taskqT
Definition macrotaskq.h:286
virtual void run(World &world, Cloud &cloud, taskqT &taskq, const long element, const bool debug)=0
friend std::ostream & operator<<(std::ostream &os, const MacroTaskBase::Status s)
Definition macrotaskq.h:320
bool is_waiting() const
Definition macrotaskq.h:300
Definition macrotaskq.h:331
MacroTaskIntermediate()
Definition macrotaskq.h:335
void cleanup()
Definition macrotaskq.h:339
~MacroTaskIntermediate()
Definition macrotaskq.h:337
Definition macrotaskq.h:978
MacroTaskOperationBase()
Definition macrotaskq.h:983
Batch batch
Definition macrotaskq.h:980
std::shared_ptr< MacroTaskPartitioner > partitioner
Definition macrotaskq.h:982
std::string name
Definition macrotaskq.h:981
partition one (two) vectors into 1D (2D) batches.
Definition macrotaskpartitioner.h:182
std::list< std::pair< Batch, double > > partitionT
Definition macrotaskpartitioner.h:186
Definition macrotaskq.h:344
long nsubworld
Definition macrotaskq.h:351
std::mutex taskq_mutex
Definition macrotaskq.h:349
bool printdebug() const
Definition macrotaskq.h:359
static void set_pmap(World &world)
Definition macrotaskq.h:547
void run_all()
run all tasks
Definition macrotaskq.h:401
void set_complete(const long task_number) const
scheduler is located on rank==0
Definition macrotaskq.h:536
World & universe
Definition macrotaskq.h:346
std::shared_ptr< WorldDCPmapInterface< Key< 1 > > > pmap1
Definition macrotaskq.h:352
std::shared_ptr< WorldDCPmapInterface< Key< 3 > > > pmap3
Definition macrotaskq.h:354
MacroTaskBase::taskqT taskq
Definition macrotaskq.h:348
void add_tasks(MacroTaskBase::taskqT &vtask)
Definition macrotaskq.h:484
long get_scheduled_task_number(World &subworld)
scheduler is located on universe.rank==0
Definition macrotaskq.h:508
void set_complete_local(const long task_number) const
scheduler is located on rank==0
Definition macrotaskq.h:541
World & get_subworld()
Definition macrotaskq.h:366
MacroTaskQ(World &universe, int nworld, const long printlevel=0)
create an empty taskq and initialize the subworlds
Definition macrotaskq.h:371
std::shared_ptr< WorldDCPmapInterface< Key< 4 > > > pmap4
Definition macrotaskq.h:355
std::size_t size() const
Definition macrotaskq.h:556
std::shared_ptr< WorldDCPmapInterface< Key< 5 > > > pmap5
Definition macrotaskq.h:356
void print_taskq() const
Definition macrotaskq.h:491
std::shared_ptr< World > subworld_ptr
Definition macrotaskq.h:347
bool printtimings() const
Definition macrotaskq.h:361
std::shared_ptr< WorldDCPmapInterface< Key< 2 > > > pmap2
Definition macrotaskq.h:353
bool printprogress() const
Definition macrotaskq.h:360
std::shared_ptr< WorldDCPmapInterface< Key< 6 > > > pmap6
Definition macrotaskq.h:357
void set_printlevel(const long p)
Definition macrotaskq.h:368
long printlevel
Definition macrotaskq.h:350
madness::Cloud cloud
Definition macrotaskq.h:365
long get_nsubworld() const
Definition macrotaskq.h:367
void add_replicated_task(const std::shared_ptr< MacroTaskBase > &task)
Definition macrotaskq.h:503
~MacroTaskQ()
Definition macrotaskq.h:384
static std::shared_ptr< World > create_worlds(World &universe, const std::size_t nsubworld)
Definition macrotaskq.h:388
long get_scheduled_task_number_local()
Definition macrotaskq.h:520
Definition macrotaskq.h:717
taskT task
Definition macrotaskq.h:724
MacroTaskInternal(const taskT &task, const std::pair< Batch, double > &batch_prio, const recordlistT &inputrecords, const recordlistT &outputrecords)
Definition macrotaskq.h:730
std::enable_if< notis_tuple< resultT1 >::value, void >::type accumulate_into_final_result(World &subworld, resultT1 &result, const resultT1 &result_tmp, const argtupleT &argtuple)
accumulate the result of the task into the final result living in the universe
Definition macrotaskq.h:802
static ScalarResult< T > pointer2WorldObject(const std::shared_ptr< ScalarResultImpl< T > > sr_impl)
Definition macrotaskq.h:898
decay_tuple< typename taskT::argtupleT > argtupleT
Definition macrotaskq.h:719
static std::vector< Function< T, NDIM > > pointer2WorldObject(const std::vector< std::shared_ptr< FunctionImpl< T, NDIM > > > v_impl)
Definition macrotaskq.h:890
void cleanup() override
Definition macrotaskq.h:877
taskT::resultT resultT
Definition macrotaskq.h:720
recordlistT outputrecords
Definition macrotaskq.h:722
std::string get_name() const
Definition macrotaskq.h:725
void run(World &subworld, Cloud &cloud, MacroTaskBase::taskqT &taskq, const long element, const bool debug) override
Definition macrotaskq.h:831
void binary_tuple_loop(tupleT &tuple1, tupleR &tuple2, opT &op) const
loop over the tuple elements of both tuples and execute the operation op on each element pair
Definition macrotaskq.h:768
resultT get_output(World &subworld, Cloud &cloud)
return the WorldObjects or the result functions living in the universe
Definition macrotaskq.h:915
static Function< T, NDIM > pointer2WorldObject(const std::shared_ptr< FunctionImpl< T, NDIM > > impl)
Definition macrotaskq.h:883
static std::vector< ScalarResult< T > > pointer2WorldObject(const std::vector< std::shared_ptr< ScalarResultImpl< T > > > v_sr_impl)
Definition macrotaskq.h:903
void print_me_as_table(std::string s="") const override
Definition macrotaskq.h:748
void print_me(std::string s="") const override
Definition macrotaskq.h:744
void unary_tuple_loop(tupleT &tuple, opT &op) const
Definition macrotaskq.h:778
std::enable_if< is_tuple< resultT1 >::value, void >::type accumulate_into_final_result(World &subworld, resultT1 &final_result, const resultT1 &tmp_result, const argtupleT &argtuple)
accumulate the result of the task into the final result living in the universe
Definition macrotaskq.h:789
recordlistT inputrecords
Definition macrotaskq.h:721
Definition macrotaskq.h:566
taskT::resultT resultT
Definition macrotaskq.h:576
std::shared_ptr< MacroTaskQ > taskq_ptr
Definition macrotaskq.h:665
taskT::argtupleT argtupleT
Definition macrotaskq.h:577
MacroTask(World &world, taskT &task, std::shared_ptr< MacroTaskQ > taskq_ptr=0)
constructor takes the actual task
Definition macrotaskq.h:610
World & world
Definition macrotaskq.h:664
resultT operator()(const Ts &... args)
this mimicks the original call to the task functor, called from the universe
Definition macrotaskq.h:629
bool debug
Definition macrotaskq.h:580
taskT task
Definition macrotaskq.h:579
MacroTaskPartitioner::partitionT partitionT
Definition macrotaskq.h:567
Cloud::recordlistT recordlistT
Definition macrotaskq.h:578
void set_debug(const bool value)
Definition macrotaskq.h:619
recordlistT prepare_output_records(Cloud &cloud, resultT &result)
store pointers to the result WorldObject in the cloud and return the recordlist
Definition macrotaskq.h:670
helper class for returning the result of a task, which is not a madness Function, but a simple scalar
Definition macrotaskq.h:54
void gaxpy(const double a, const T &right, double b, const bool fence=true)
accumulate, optional fence
Definition macrotaskq.h:85
void serialize(Archive &ar)
Definition macrotaskq.h:93
T get()
after completion of the taskq get the final value
Definition macrotaskq.h:98
ScalarResultImpl< T > & operator=(const T &x)
simple assignment of the scalar value
Definition macrotaskq.h:74
ScalarResultImpl(const ScalarResultImpl &other)=delete
Disable the default copy constructor.
ScalarResultImpl< T > & operator=(const ScalarResultImpl< T > &other)=delete
disable assignment operator
ScalarResultImpl< T > & operator+=(const T &x)
Definition macrotaskq.h:79
~ScalarResultImpl()
Definition macrotaskq.h:68
T value
the scalar value
Definition macrotaskq.h:111
T get_local() const
Definition macrotaskq.h:105
T value_type
Definition macrotaskq.h:56
ScalarResultImpl(World &world)
Definition macrotaskq.h:57
Definition macrotaskq.h:115
void serialize(Archive &ar)
Definition macrotaskq.h:146
ScalarResult(const std::shared_ptr< implT > &impl)
Definition macrotaskq.h:122
void gaxpy(const double a, const T &right, double b, const bool fence=true)
accumulate, optional fence
Definition macrotaskq.h:141
ScalarResultImpl< T > implT
Definition macrotaskq.h:117
T get()
after completion of the taskq get the final value
Definition macrotaskq.h:151
ScalarResult(World &world)
Definition macrotaskq.h:121
std::shared_ptr< implT > impl
Definition macrotaskq.h:118
ScalarResult & operator=(const T &x)
Definition macrotaskq.h:123
std::shared_ptr< implT > get_impl() const
Definition macrotaskq.h:128
void set_impl(const std::shared_ptr< implT > &newimpl)
Definition macrotaskq.h:132
T get_local() const
after completion of the taskq get the final value
Definition macrotaskq.h:156
uniqueidT id() const
Definition macrotaskq.h:136
void broadcast_serializable(objT &obj, ProcessID root)
Broadcast a serializable object.
Definition worldgop.h:754
void fence(bool debug=false)
Synchronizes all processes in communicator AND globally ensures no pending AM or tasks.
Definition worldgop.cc:161
bool set_forbid_fence(bool value)
Set forbid_fence flag to new value and return old value.
Definition worldgop.h:674
void sum(T *buf, size_t nelem)
Inplace global sum while still processing AM & tasks.
Definition worldgop.h:870
SafeMPI::Intracomm & comm()
Returns the associated SafeMPI communicator.
Definition worldmpi.h:286
Implements most parts of a globally addressable object (via unique ID).
Definition world_object.h:364
World & get_world() const
Returns a reference to the world.
Definition world_object.h:717
World & world
The World this object belongs to. (Think globally, act locally).
Definition world_object.h:381
void process_pending()
To be called from derived constructor to process pending messages.
Definition world_object.h:656
detail::task_result_type< memfnT >::futureT send(ProcessID dest, memfnT memfn) const
Definition world_object.h:731
detail::task_result_type< memfnT >::futureT task(ProcessID dest, memfnT memfn, const TaskAttributes &attr=TaskAttributes()) const
Sends task to derived class method returnT (this->*memfn)().
Definition world_object.h:1005
A parallel world class.
Definition world.h:132
static World * world_from_id(std::uint64_t id)
Convert a World ID to a World pointer.
Definition world.h:492
ProcessID rank() const
Returns the process rank in this World (same as MPI_Comm_rank()).
Definition world.h:320
WorldMpiInterface & mpi
MPI interface.
Definition world.h:204
ProcessID size() const
Returns the number of processes in this World (same as MPI_Comm_size()).
Definition world.h:330
unsigned long id() const
Definition world.h:315
WorldGopInterface & gop
Global operations.
Definition world.h:207
std::optional< T * > ptr_from_id(uniqueidT id) const
Look up a local pointer from a world-wide unique ID.
Definition world.h:416
Class for unique global IDs.
Definition uniqueid.h:53
Declares the Cloud class for storing data and transfering them between worlds.
char * p(char *buf, const char *name, int k, int initial_level, double thresh, int order)
Definition derivatives.cc:72
const std::size_t bufsize
Definition derivatives.cc:16
static bool debug
Definition dirac-hatom.cc:16
auto T(World &world, response_space &f) -> response_space
Definition global_functions.cc:34
static const double v
Definition hatom_sf_dirac.cc:20
Tensor< double > op(const Tensor< double > &x)
Definition kain.cc:508
#define MADNESS_CHECK(condition)
Check a condition — even in a release build the condition is always evaluated so it can have side eff...
Definition madness_exception.h:182
#define MADNESS_EXCEPTION(msg, value)
Macro for throwing a MADNESS exception.
Definition madness_exception.h:119
#define MADNESS_ASSERT(condition)
Assert a condition that should be free of side-effects since in release builds this might be a no-op.
Definition madness_exception.h:134
Namespace for all elements and tools of MADNESS.
Definition DFParameters.h:10
std::vector< ScalarResult< T > > scalar_result_vector(World &world, std::size_t n)
helper function to create a vector of ScalarResultImpl, circumventing problems with the constructors
Definition macrotaskq.h:164
static const char * filename
Definition legendre.cc:96
static double cpu_time()
Returns the cpu time in seconds relative to an arbitrary origin.
Definition timers.h:127
void set_impl(std::vector< Function< T, NDIM > > &v, const std::vector< std::shared_ptr< FunctionImpl< T, NDIM > > > vimpl)
Definition vmra.h:688
std::vector< std::shared_ptr< FunctionImpl< T, NDIM > > > get_impl(const std::vector< Function< T, NDIM > > &v)
Definition vmra.h:681
TreeState
Definition funcdefaults.h:59
@ reconstructed
s coeffs at the leaves only
Definition funcdefaults.h:60
@ compressed
d coeffs in internal nodes, s and d coeffs at the root
Definition funcdefaults.h:61
constexpr bool check_tuple_is_valid_task_result()
given a tuple check recursively if all elements are valid task results
Definition macrotaskq.h:223
static const Slice _(0,-1, 1)
void print(const T &t, const Ts &... ts)
Print items to std::cout (items separated by spaces) and terminate with a new line.
Definition print.h:225
@ TT_FULL
Definition gentensor.h:120
constexpr bool is_valid_task_result_v
check if type is a valid task result: it must be a WorldObject and must implement gaxpy
Definition macrotaskq.h:209
const Function< T, NDIM > & change_tree_state(const Function< T, NDIM > &f, const TreeState finalstate, bool fence=true)
change tree state of a function
Definition mra.h:2807
decltype(decay_types(std::declval< T >())) decay_tuple
Definition macrotaskpartitioner.h:22
double wall_time()
Returns the wall time in seconds relative to an arbitrary origin.
Definition timers.cc:48
std::string type(const PairType &n)
Definition PNOParameters.h:18
std::string name(const FuncType &type, const int ex=-1)
Definition ccpairfunction.h:28
void gaxpy(const double a, ScalarResult< T > &left, const double b, const T &right, const bool fence=true)
the result type of a macrotask must implement gaxpy
Definition macrotaskq.h:245
Definition mraimpl.h:50
static const double b
Definition nonlinschro.cc:119
static const double a
Definition nonlinschro.cc:118
RAII class to redirect cout to a file.
Definition macrotaskq.h:583
io_redirect(const long task_number, std::string filename, bool debug=false)
Definition macrotaskq.h:588
std::streambuf * stream_buffer_cout
Definition macrotaskq.h:584
~io_redirect()
Definition macrotaskq.h:598
bool debug
Definition macrotaskq.h:586
std::ofstream ofile
Definition macrotaskq.h:585
Definition macrotaskq.h:570
Default load of an object via serialize(ar, t).
Definition archive.h:666
Default store of an object via serialize(ar, t).
Definition archive.h:611
Definition mra.h:2851
Definition macrotaskq.h:194
Definition macrotaskq.h:179
Definition macrotaskq.h:173
Definition macrotaskq.h:200
Definition macrotaskq.h:188
Definition macrotaskq.h:218
static void load(const Archive &ar, std::shared_ptr< ScalarResultImpl< T > > &ptr)
Definition macrotaskq.h:261
static void store(const Archive &ar, const std::shared_ptr< ScalarResultImpl< T > > &ptr)
Definition macrotaskq.h:251
static const double_complex I
Definition tdse1d.cc:164
void doit(World &world)
Definition tdse.cc:921
void e()
Definition test_sig.cc:75
Declares the World class for the parallel runtime environment.
int ProcessID
Used to clearly identify process number/rank.
Definition worldtypes.h:43