dataset.hpp 5.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161
  1. /**
  2. * @file
  3. * @author Caleb Fangmeier <caleb@fangmeier.tech>
  4. * @version 0.1
  5. *
  6. * @section LICENSE
  7. *
  8. *
  9. * MIT License
  10. *
  11. * Copyright (c) 2017 Caleb Fangmeier
  12. *
  13. * Permission is hereby granted, free of charge, to any person obtaining a copy
  14. * of this software and associated documentation files (the "Software"), to deal
  15. * in the Software without restriction, including without limitation the rights
  16. * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  17. * copies of the Software, and to permit persons to whom the Software is
  18. * furnished to do so, subject to the following conditions:
  19. *
  20. * The above copyright notice and this permission notice shall be included in all
  21. * copies or substantial portions of the Software.
  22. *
  23. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  24. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  25. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  26. * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  27. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  28. * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  29. * SOFTWARE.
  30. */
  31. #ifndef dataset_hpp
  32. #define dataset_hpp
  33. #include <iostream>
  34. #include "value.hpp"
  35. #include "container.hpp"
  36. #include "datafile.hpp"
  37. #include "log.hpp"
  38. namespace fv{
  39. /*
  40. * A DataSet is a generic source of data that is used to populate
  41. * ObservedValues. For each ObservedValue, it is recommended that the DataSet
  42. * have a field whose value is updated when the load_next() method is called. A
  43. * pointer to this value is then passed during the creation of the
  44. * ObservedValue. It is important, therefore, that the location in memory of
  45. * the data not change from event to event.
  46. */
  47. class DataSet{
  48. private:
  49. void summary(){
  50. INFO(GenValue::summary());
  51. INFO(GenFunction::summary());
  52. }
  53. Value<int>* current_event_number;
  54. int max_events;
  55. protected:
  56. std::map<std::string, GenContainer*> containers;
  57. virtual bool load_next() = 0;
  58. virtual int get_events() = 0;
  59. virtual int get_current_event() = 0;
  60. virtual util::DataFileDescriptor& get_current_file() = 0;
  61. std::map<std::string,std::string> get_container_name_value_map(){
  62. std::map<std::string, std::string> value_map;
  63. for(auto container : containers)
  64. value_map[container.first] = container.second->get_value_name();
  65. return value_map;
  66. }
  67. std::map<std::string,std::string> get_function_name_impl_map(){
  68. std::map<std::string, std::string> impl_map;
  69. for(auto fn : GenFunction::function_registry)
  70. if (fn.second != nullptr){
  71. impl_map[fn.first] = GenFunction::format_code(fn.second->get_impl());
  72. }
  73. return impl_map;
  74. }
  75. public:
  76. DataSet():max_events(0){
  77. auto event_check = GenFunction::reg_func<int()>("event_number",
  78. FUNC(([ds=this](){
  79. return ds->get_current_event();
  80. })));
  81. current_event_number = new BoundValue<int>(event_check);
  82. }
  83. void process(bool silent=false){
  84. int events, current_event;
  85. summary();
  86. events = get_events();
  87. if (max_events > 0) events = max_events;
  88. if (!silent) std::cout << std::endl;
  89. while( load_next() ){
  90. current_event = get_current_event();
  91. if (!silent) std::cout << "\rprocessing event: " << current_event+1 << "/" << events
  92. << " of file: " << get_current_file().filename << std::flush;
  93. GenValue::reset();
  94. for(auto con : containers){
  95. DEBUG("Filling container " << con.first << ".");
  96. con.second->fill();
  97. }
  98. if(max_events && current_event+1 >= max_events) break;
  99. }
  100. if (!silent) std::cout << " Finished!" << std::endl;
  101. }
  102. void set_max_events(const int& max_events){
  103. this->max_events = max_events;
  104. }
  105. int get_max_events(){
  106. return this->max_events;
  107. }
  108. virtual void save_all(){
  109. for(auto container : containers)
  110. container.second->save();
  111. }
  112. template<typename C, typename... ArgTypes>
  113. C* register_container(ArgTypes... args){
  114. C* container = new C(args...);
  115. if (containers[container->get_name()] != nullptr){
  116. CRITICAL("Container with name \""+container->get_name()+"\" already exists.", -1);
  117. }
  118. containers[container->get_name()] = container;
  119. return container;
  120. }
  121. void cut_set(GenContainer* base_container, std::vector<std::pair<Value<bool>*, std::string>> filters){
  122. for(auto p : filters){
  123. Value<bool>* filter;
  124. std::string new_name;
  125. std::tie(filter, new_name) = p;
  126. if (containers[new_name] != nullptr){
  127. CRITICAL("Container with name \""<<new_name<<"\" already exists.", -1);
  128. }
  129. auto new_container = base_container->clone_as(new_name);
  130. new_container->add_filter(filter);
  131. containers[new_container->get_name()] = new_container;
  132. }
  133. }
  134. GenContainer* get_container(std::string container_name){
  135. GenContainer* c = containers[container_name];
  136. if (c == nullptr){
  137. CRITICAL("Request for container \"" << container_name << "\" failed. Doesn't exist.", -1);
  138. }
  139. return c;
  140. }
  141. Value<int>* get_current_event_number(){
  142. return current_event_number;
  143. }
  144. };
  145. }
  146. #endif // dataset_hpp