BlackCat_Tensors
A GPU-supported autograd and linear algebra library, designed for neural network construction
host.h
Go to the documentation of this file.
1 /*
2 
3  * Common.h
4  *
5  * Created on: Jan 13, 2019
6  * Author: joseph
7  */
8 
9 #ifndef BC_STREAMS_COMMON_H_
10 #define BC_STREAMS_COMMON_H_
11 
12 #include <memory>
13 #include "stream_synchronization.h"
14 #include "host_stream.h"
15 
16 namespace bc {
17 namespace streams {
18 
19 template<class SystemTag>
20 class Stream;
21 
22 template<>
23 class Stream<host_tag> {
24 
25  struct Contents {
26  std::unique_ptr<HostEvent> m_event;
27  HostStream m_stream;
29  };
30 
31  static std::shared_ptr<Contents> get_default_contents()
32  {
33  static thread_local std::shared_ptr<Contents> default_contents =
34  std::shared_ptr<Contents>(new Contents());
35 
36  return default_contents;
37  }
38 
39  std::shared_ptr<Contents> m_contents = get_default_contents();
40 
41 public:
42 
45 
47  return m_contents->m_workspace;
48  }
49 
50  template<class RebindType>
52  {
53  return typename allocator_type::
54  template rebind<RebindType>::other(m_contents->m_workspace);
55  }
56 
59 
60  bool is_default() {
61  return m_contents == get_default_contents();
62  }
63 
64  void create() {
65  m_contents = std::shared_ptr<Contents>(new Contents());
66  }
67 
68  void destroy() {
69  m_contents = get_default_contents();
70  }
71 
72  void sync()
73  {
74  //** Pushing a job while syncing is undefined behavior.
75  if (!is_default()) {
76  if (!m_contents->m_stream.empty()) {
77  record_event();
78  this->m_contents->m_event->get_waiter().operator ()();
79  }
80  }
81  }
82 
83  void set_stream(Stream stream_) {
84  this->m_contents = stream_.m_contents;
85  }
86 
87  void record_event()
88  {
89  if (!is_default()) {
90  m_contents->m_event = std::unique_ptr<HostEvent>(new HostEvent());
91  this->enqueue(m_contents->m_event->get_recorder());
92  }
93  }
94 
95  void wait_event(Stream& stream)
96  {
97  if (!stream.is_default()) {
98  BC_ASSERT(
99  stream.m_contents->m_event.get(),
100  "Attempting to wait on an event that was never recorded");
101  this->enqueue(stream.m_contents->m_event->get_waiter());
102  }
103  }
104 
105  void wait_stream(Stream& stream)
106  {
107  stream.record_event();
108  this->wait_event(stream);
109  }
110 
111  template<class Functor>
112  void enqueue(Functor functor)
113  {
114  if (this->is_default()) {
115  host_sync();
116  functor();
117  } else {
118  m_contents->m_stream.push(functor);
119  }
120  }
121 
122  template<class Functor>
123  void enqueue_callback(Functor functor) {
124  enqueue(functor);
125  }
126 
127  bool operator == (const Stream& dev) {
128  return m_contents == dev.m_contents;
129  }
130 
131  bool operator != (const Stream& dev) {
132  return m_contents != dev.m_contents;
133  }
134 };
135 
136 
137 }
138 }
139 
140 
141 #endif /* COMMON_H_ */
void host_sync()
Definition: stream_synchronization.h:16
auto get_allocator_rebound()
Definition: host.h:51
void create()
Definition: host.h:64
void enqueue(Functor functor)
Definition: host.h:112
Definition: host_stream.h:17
bool is_default()
Definition: host.h:60
Definition: host_stream.h:56
void record_event()
Definition: host.h:87
void wait_event(Stream &stream)
Definition: host.h:95
void set_blas_pointer_mode_host()
Definition: host.h:57
An unsynced memory pool implemented as a stack.
Definition: stack_allocator.h:138
void enqueue_callback(Functor functor)
Definition: host.h:123
void set_blas_pointer_mode_device()
Definition: host.h:58
#define BC_ASSERT(condition, message)
Definition: common.h:185
allocator_type & get_allocator()
Definition: host.h:46
void set_stream(Stream stream_)
Definition: host.h:83
void wait_stream(Stream &stream)
Definition: host.h:105
Definition: common.h:26
auto operator==(const Expression_Base< Xpr > &param) const
Definition: expression_operations.h:38
Definition: device.h:27
void destroy()
Definition: host.h:68
void sync()
Definition: host.h:72
The Evaluator determines if an expression needs to be greedily optimized.
Definition: algorithms.h:22