BlackCat_Tensors
A GPU-supported autograd and linear algebra library, designed for neural network construction
polymorphic_layer_base.h
Go to the documentation of this file.
1  /*
2  * Layer.h
3  *
4  * Created on: Mar 1, 2018
5  * Author: joseph
6  */
7 
8 #ifndef BLACKCAT_NEURAL_NETWORKS_POLYMORPHIC_LAYER_H_
9 #define LAYER_H_
10 
11 #include "../layer_loader.h"
12 #include "layer_traits.h"
13 #include <string>
14 
15 #include <sys/types.h>
16 #include <sys/stat.h>
17 #include <fstream>
18 #include <ostream>
19 
20 namespace bc {
21 namespace nn {
22 
23 template<class LearningRateValueType>
24 struct network_runtime_traits
25 {
26  using value_type = LearningRateValueType;
28  int m_batch_size = 1;
29 };
30 
31 template<class SystemTag, class ValueType>
34 
35 template<
36  class Dimension,
37  class ValueType,
38  class SystemTag,
40  class OutputDimension=Dimension,
41  class OutputValueType=ValueType,
42  class OutputSystemTag=SystemTag,
43  class OutputAllocator=Allocator>
45 {
46  using allocator_type = Allocator;
47  using value_type = ValueType;
48  using system_tag = SystemTag;
49 
50  using input_tensor_dimension = Dimension;
52 
53  using output_tensor_dimension = OutputDimension;
55 
56  using output_value_type = OutputValueType;
57  using output_system_tag = OutputSystemTag;
58  using output_allocator_type = OutputAllocator;
59 
64 
67  value_type,
69 
72 
75 
76  using this_layer_pointer_type = std::shared_ptr<this_layer_type>;
77  using next_layer_pointer_type = std::shared_ptr<next_layer_type>;
78 
81 
82 private:
83 
84  const std::string m_classname;
85  std::shared_ptr<network_runtime_traits<value_type>> m_network_vars
86  = std::shared_ptr<network_runtime_traits<value_type>>(
88 
89 protected:
90 
91  std::shared_ptr<allocator_type> m_allocator;
92  std::weak_ptr<this_layer_type> m_input_layer;
93  std::shared_ptr<next_layer_type> m_output_layer;
94 
95  input_shape_type m_input_shape;
96  output_shape_type m_output_shape; //ptr??
97 
98 public:
99 
100  Polymorphic_Layer_Base(std::string classname):
101  m_classname(parse_classname(classname)) {}
102 
104 
105  virtual ~Polymorphic_Layer_Base()=default;
106 
107  template<int ADL=0>
108  std::string get_string_architecture() const {
109  return classname() + ':'
110  + "\n\tinput_shape: " + m_input_shape.to_string();
111  }
112 
113  virtual batched_output_tensor_type forward_propagation(
114  const batched_input_tensor_type& inputs) = 0;
115 
116  virtual batched_input_tensor_type back_propagation(
117  const batched_output_tensor_type& delta) = 0;
118 
120  const batched_input_tensor_type& inputs) {
121  return forward_propagation(inputs);
122  }
123 
125  const batched_output_tensor_type& delta) {
126  return back_propagation(delta);
127  }
128 
129  virtual void update_weights() {}
130  //post constructor initialization
131  virtual void init() = 0;
132 
133  void set_batch_size(int bs)
134  {
135  set_batch_size_hook(bs);
136  m_network_vars->m_batch_size = bs;
137  y = batched_output_tensor_type(this->batched_output_shape());
138  }
139 
140  void set_learning_rate(double lr)
141  {
142  set_learning_rate_hook(lr);
143  m_network_vars->m_learning_rate = lr;
144  }
145 
146  std::shared_ptr<this_layer_type> prev() {
147  return m_input_layer.lock();
148  }
149 
150  std::shared_ptr<this_layer_type> prev() const {
151  return m_input_layer.lock();
152  }
153 
154  std::shared_ptr<next_layer_type> next() {
155  return m_input_layer;
156  }
157 
158  std::shared_ptr<next_layer_type> next() const {
159  return m_output_layer;
160  }
161 
163  m_input_layer = prev_layer;
164  }
165 
167  m_output_layer = next_layer;
168  }
169 
170 protected:
171 
172  virtual void set_batch_size_hook(int bs) {}
173  virtual void set_learning_rate_hook(double lr) {}
174 
175 public:
176 
177  auto batch_size() const { return m_network_vars->m_batch_size; }
178 
179  auto learning_rate() const { return m_network_vars->m_learning_rate; }
180  auto batched_learning_rate() const { return learning_rate() / batch_size(); }
181 
182  auto input_shape() const { return m_input_shape; }
183  auto output_shape() const { return m_output_shape; }
184 
185  auto batched_input_shape() const { return m_input_shape.concat(batch_size()); }
186  auto batched_output_shape() const { return m_output_shape.concat(batch_size()); }
187 
188  std::string classname() const { return m_classname; }
189  virtual void save(Layer_Loader&) const = 0;
190  virtual void save_from_cache(Layer_Loader&, Cache&) const {}
191  virtual void load(Layer_Loader&) = 0;
192  virtual void load_to_cache(Layer_Loader&, Cache&) {}
193 
194  void copy_training_data_to_single_predict(Cache&, int batch_index) {}
195 
196  //push me
197  static std::string parse_classname(std::string classname) {
198  auto classname_ns = std::find(classname.rbegin(), classname.rend(), ':');
199  classname.erase(classname.rend().base(), classname_ns.base());
200  return classname;
201  }
202 };
203 
204 template<class... ArgsA, class... ArgsB>
205 void link(std::shared_ptr<Layer_Base<ArgsA...>> prev, std::shared_ptr<Layer_Base<ArgsB...>> next)
206 {
207  prev->set_next(next);
208  next->set_prev(prev);
209 }
210 
211 }
212 }
213 
214 
215 
216 #endif /* LAYER_H_ */
SystemTag system_tag
Definition: polymorphic_layer_base.h:48
LearningRateValueType value_type
Definition: polymorphic_layer_base.h:26
virtual void save_from_cache(Layer_Loader &, Cache &) const
Definition: polymorphic_layer_base.h:190
std::shared_ptr< next_layer_type > next() const
Definition: polymorphic_layer_base.h:158
batched_output_tensor_type fp(const batched_input_tensor_type &inputs)
Definition: polymorphic_layer_base.h:119
std::string to_string(int begin, int end) const
Definition: dim.h:270
virtual void load_to_cache(Layer_Loader &, Cache &)
Definition: polymorphic_layer_base.h:192
auto output_shape() const
Definition: polymorphic_layer_base.h:183
std::shared_ptr< next_layer_type > next()
Definition: polymorphic_layer_base.h:154
Definition: constexpr_int.h:14
void set_next(next_layer_pointer_type next_layer)
Definition: polymorphic_layer_base.h:166
Definition: layer_base.h:86
A Dictionary designed to store any type using the &#39;store&#39; and &#39;load&#39; functions.
Definition: layer_cache.h:46
Definition: layer_loader.h:19
virtual void set_batch_size_hook(int bs)
Definition: polymorphic_layer_base.h:172
void set_learning_rate(double lr)
Definition: polymorphic_layer_base.h:140
std::shared_ptr< this_layer_type > prev()
Definition: polymorphic_layer_base.h:146
std::shared_ptr< this_layer_type > this_layer_pointer_type
Definition: polymorphic_layer_base.h:76
virtual void set_learning_rate_hook(double lr)
Definition: polymorphic_layer_base.h:173
std::shared_ptr< this_layer_type > prev() const
Definition: polymorphic_layer_base.h:150
void set_batch_size(int bs)
Definition: polymorphic_layer_base.h:133
static std::string parse_classname(std::string classname)
Definition: polymorphic_layer_base.h:197
auto batched_input_shape() const
Definition: polymorphic_layer_base.h:185
class::::::Args static auto find(bc::streams::Stream< bc::host_tag > stream, Begin begin, End end, Args... args)
Definition: algorithms.h:124
Definition: polymorphic_allocator.h:127
int m_batch_size
Definition: polymorphic_layer_base.h:28
batched_input_tensor_type bp(const batched_output_tensor_type &delta)
Definition: polymorphic_layer_base.h:124
Dimension input_tensor_dimension
Definition: polymorphic_layer_base.h:50
auto batched_output_shape() const
Definition: polymorphic_layer_base.h:186
Polymorphic_Layer_Base(std::string classname)
Definition: polymorphic_layer_base.h:100
auto input_shape() const
Definition: polymorphic_layer_base.h:182
OutputAllocator output_allocator_type
Definition: polymorphic_layer_base.h:58
value_type m_learning_rate
Definition: polymorphic_layer_base.h:27
Definition: allocators.h:20
auto batched_learning_rate() const
Definition: polymorphic_layer_base.h:180
auto batch_size() const
Definition: polymorphic_layer_base.h:177
OutputValueType output_value_type
Definition: polymorphic_layer_base.h:56
auto learning_rate() const
Definition: polymorphic_layer_base.h:179
Definition: polymorphic_layer_base.h:44
void link(std::shared_ptr< Layer_Base< ArgsA... >> prev, std::shared_ptr< Layer_Base< ArgsB... >> next)
Definition: polymorphic_layer_base.h:205
void copy_training_data_to_single_predict(Cache &, int batch_index)
Definition: polymorphic_layer_base.h:194
void set_prev(this_layer_pointer_type prev_layer)
Definition: polymorphic_layer_base.h:162
std::string classname() const
Definition: polymorphic_layer_base.h:188
Definition: polymorphic_layer_base.h:24
OutputSystemTag output_system_tag
Definition: polymorphic_layer_base.h:57
OutputDimension output_tensor_dimension
Definition: polymorphic_layer_base.h:53
BCINLINE auto concat(Ints... value) const
Definition: dim.h:105
ValueType value_type
Definition: polymorphic_layer_base.h:47
std::string get_string_architecture() const
Definition: polymorphic_layer_base.h:108
virtual void update_weights()
Definition: polymorphic_layer_base.h:129
The Evaluator determines if an expression needs to be greedily optimized.
Definition: algorithms.h:22
std::shared_ptr< next_layer_type > next_layer_pointer_type
Definition: polymorphic_layer_base.h:77