BlackCat_Tensors
A GPU-supported autograd and linear algebra library, designed for neural network construction
binary.h
Go to the documentation of this file.
1 /* Project: BlackCat_Tensors
2  * Author: JosephJaspers
3  * Copyright 2018
4  *
5  * This Source Code Form is subject to the terms of the Mozilla Public
6  * License, v. 2.0. If a copy of the MPL was not distributed with this
7  * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
8 
9 #ifndef EXPRESSION_BINARY_FUNCTORS_H_
10 #define EXPRESSION_BINARY_FUNCTORS_H_
11 
12 
13 #include "operation_traits.h"
14 #include "tags.h"
15 #include "../common.h"
16 #include <type_traits>
17 #include <cmath>
18 
19 
20 namespace bc {
21 namespace oper {
22 
23 #define BC_FORWARD_TO_APPLY\
24  template<class Lv, class Rv> \
25  BCINLINE auto operator () (Lv&& lv, Rv&& rv) const \
26  -> decltype(apply(lv, rv)) { \
27  return apply(lv, rv); \
28 }
29 
30 #define BC_FORWARD_DEF(...) \
31  template<class Lv, class Rv> \
32  BCINLINE \
33  static auto apply (Lv&& lv, Rv&& rv) \
34  -> decltype(__VA_ARGS__) { \
35  return __VA_ARGS__; \
36  } \
37  BC_FORWARD_TO_APPLY
38 
39 #define BC_ADVANCED_FORWARD_DEF(...) \
40  template<class Lv, class Rv> \
41  BCINLINE \
42  static auto apply (Lv&& lv, Rv&& rv) \
43  { \
44  __VA_ARGS__; \
45  } \
46  BC_FORWARD_TO_APPLY
47 
51  BC_FORWARD_DEF(lv = rv)
52 } assign;
53 
57  BC_FORWARD_DEF(lv += rv)
58 } add_assign;
59 
63  BC_FORWARD_DEF(lv -= rv)
64 } sub_assign;
65 
69  BC_FORWARD_DEF(lv = rv)
70 } alias_assign;
71 
75  BC_FORWARD_DEF(lv += rv)
77 
81  BC_FORWARD_DEF(lv -= rv)
83 
87  BC_FORWARD_DEF(lv *= rv)
88 } mul_assign;
89 
93  BC_FORWARD_DEF(lv /= rv)
94 } div_assign;
95 
96 struct Scalar_Mul {
97  BC_FORWARD_DEF(lv * rv)
98 } scalar_mul;
99 
102  BC_FORWARD_DEF(lv + rv)
103 } add;
104 
105 struct Mul {
106  BC_FORWARD_DEF(lv * rv)
107 } mul;
108 
111  BC_FORWARD_DEF(lv - rv)
112 } sub;
113 
114 struct Div {
115  BC_FORWARD_DEF(lv / rv)
116 } div;
117 
118 struct Equal {
119  BC_FORWARD_DEF(lv == rv)
120 } equal;
121 
122 struct Approx_Equal {
123  BC_FORWARD_DEF(std::abs(lv - rv) < .01)
124 } approx_equal;
125 
126 struct Greater {
127  BC_FORWARD_DEF(lv > rv)
128 } greater;
129 
130 struct Lesser {
131  BC_FORWARD_DEF(lv < rv)
132 } lesser;
133 
135  BC_FORWARD_DEF(lv >= rv)
136 } greater_equal;
137 
138 struct Lesser_Equal {
139  BC_FORWARD_DEF(lv <= rv)
140 } lesser_equal;
141 
142 struct Max {
143  BC_FORWARD_DEF(lv > rv ? lv : rv)
144 } max;
145 
146 struct Min {
147  BC_FORWARD_DEF(lv < rv ? lv : rv)
148 } min;
149 
150 struct And {
151  BC_FORWARD_DEF(lv && rv)
152 } and_;
153 
154 struct Or {
155  BC_FORWARD_DEF(lv || rv)
156 } or_;
157 
158 struct Xor {
159  BC_FORWARD_DEF(lv ^ rv)
160 } xor_;
161 
163 {
166  lv += rv;
167  return lv;
168  )
170 
171 
173 {
176  lv *= rv;
177  return lv;
178  )
180 
182 {
185  lv -= rv;
186  return lv;
187  )
189 
193  lv /= rv;
194  return lv;
195  )
197 
198 
199 namespace detail {
200 
201 template<class T>
202 static constexpr bool is_host = std::is_same<T, host_tag>::value;
203 
204 }
205 
206 #ifdef __CUDACC__
209  return atomicAdd(&lv, rv);
210  )
212 
213 
216  static_assert(
217  std::is_same<void, Lv>::value,
218  "BLACKCAT_TENSORS: Atomic-reduction "
219  "mul-assign is currently not available on the GPU");
220  )
222 
225  return atomicAdd(&lv, -rv);
226  )
228 
231  static_assert(
232  std::is_same<void, Lv>::value,
233  "BLACKCAT_TENSORS: Atomic-reduction "
234  "div-assign is currently not available on the GPU");
235  )
237 
238 template<class SystemTag>
239 using Atomic_Add = std::conditional_t<detail::is_host<SystemTag>,
241 template<class SystemTag>
242 using Atomic_Sub = std::conditional_t<detail::is_host<SystemTag>,
244 template<class SystemTag>
245 using Atomic_Div = std::conditional_t<detail::is_host<SystemTag>,
247 template<class SystemTag>
248 using Atomic_Mul = std::conditional_t<detail::is_host<SystemTag>,
250 
251 #else //if __CUDACC__ is not defined
252 
253 template<class SystemTag>
254 using Atomic_Add = std::enable_if_t<detail::is_host<SystemTag>,
256 template<class SystemTag>
257 using Atomic_Sub = std::enable_if_t<detail::is_host<SystemTag>,
258  Host_Atomic_Add>;
259 template<class SystemTag>
260 using Atomic_Div = std::enable_if_t<detail::is_host<SystemTag>,
261  Host_Atomic_Add>;
262 template<class SystemTag>
263 using Atomic_Mul = std::enable_if_t<detail::is_host<SystemTag>,
264  Host_Atomic_Add>;
265 
266 
267 #endif
268 
269 }
270 }
271 
272 #undef BC_FORWARD_DEF
273 #undef BC_FORWARD_TO_APPLY
274 
275 #endif /* EXPRESSION_BINARY_FUNCTORS_H_ */
276 
Definition: binary.h:130
Definition: tags.h:16
Definition: binary.h:122
struct bc::oper::Or or_
bc::oper::Alias_Add_Assign alias_add_assign
bc::oper::Device_Atomic_Add device_atomic_add
Definition: binary.h:114
Definition: constexpr_int.h:14
bc::oper::Sub sub
Definition: binary.h:142
bc::oper::Assign assign
bc::oper::Add_Assign add_assign
Definition: binary.h:100
std::conditional_t< detail::is_host< SystemTag >, Host_Atomic_Add, Device_Atomic_Sub > Atomic_Sub
Definition: binary.h:243
struct bc::oper::Lesser lesser
Definition: binary.h:105
Definition: binary.h:162
Definition: binary.h:214
Definition: binary.h:181
struct bc::oper::Approx_Equal approx_equal
Definition: binary.h:190
Definition: binary.h:48
struct bc::oper::Xor xor_
Definition: binary.h:223
std::conditional_t< detail::is_host< SystemTag >, Host_Atomic_Add, Device_Atomic_Div > Atomic_Div
Definition: binary.h:246
bc::oper::Add add
struct bc::oper::cmath_functions::Abs abs
struct bc::oper::Greater greater
struct bc::oper::Min min
#define BC_FORWARD_DEF(...)
Definition: binary.h:30
Definition: binary.h:96
struct bc::oper::Mul mul
bc::oper::Device_Atomic_Sub device_atomic_sub
Definition: binary.h:154
std::conditional_t< detail::is_host< SystemTag >, Host_Atomic_Add, Device_Atomic_Add > Atomic_Add
Definition: binary.h:240
struct bc::oper::Div div
struct bc::oper::Max max
bc::oper::Alias_Sub_Assign alias_sub_assign
struct bc::oper::Equal equal
Definition: binary.h:84
bc::oper::Device_Atomic_Mul device_atomic_mul
Definition: binary.h:90
Definition: binary.h:172
Definition: binary.h:60
#define BC_ADVANCED_FORWARD_DEF(...)
Definition: binary.h:39
bc::oper::Host_Atomic_Div host_atomic_div
bc::oper::Div_Assign div_assign
Definition: binary.h:78
Definition: binary.h:109
bc::oper::Mul_Assign mul_assign
Definition: binary.h:158
std::conditional_t< detail::is_host< SystemTag >, Host_Atomic_Add, Device_Atomic_Mul > Atomic_Mul
Definition: binary.h:249
Definition: binary.h:134
Definition: binary.h:229
Definition: binary.h:126
Definition: binary.h:118
struct bc::oper::Greater_Equal greater_equal
bc::oper::Alias_Assign alias_assign
bc::oper::Host_Atomic_Mul host_atomic_mul
bc::oper::Host_Atomic_Add host_atomic_add
Definition: tags.h:19
struct bc::oper::Lesser_Equal lesser_equal
bc::oper::Host_Atomic_Sub host_atomic_sub
Definition: binary.h:72
Definition: binary.h:207
struct bc::oper::Scalar_Mul scalar_mul
Definition: binary.h:150
Definition: binary.h:138
Definition: binary.h:146
Definition: binary.h:66
bc::oper::Sub_Assign sub_assign
The Evaluator determines if an expression needs to be greedily optimized.
Definition: algorithms.h:22
Definition: binary.h:54
#define BC_omp_atomic__
Definition: common.h:268
bc::oper::Device_Atomic_Div device_atomic_div
struct bc::oper::And and_