WPILibC++ 2023.4.3
BFloat16.h
Go to the documentation of this file.
1/* Copyright 2017 The TensorFlow Authors. All Rights Reserved.
2
3Licensed under the Apache License, Version 2.0 (the "License");
4you may not use this file except in compliance with the License.
5You may obtain a copy of the License at
6
7 http://www.apache.org/licenses/LICENSE-2.0
8
9Unless required by applicable law or agreed to in writing, software
10distributed under the License is distributed on an "AS IS" BASIS,
11WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12See the License for the specific language governing permissions and
13limitations under the License.
14==============================================================================*/
15
16#ifndef EIGEN_BFLOAT16_H
17#define EIGEN_BFLOAT16_H
18
19#define BF16_PACKET_FUNCTION(PACKET_F, PACKET_BF16, METHOD) \
20 template <> \
21 EIGEN_DEFINE_FUNCTION_ALLOWING_MULTIPLE_DEFINITIONS EIGEN_UNUSED \
22 PACKET_BF16 METHOD<PACKET_BF16>(const PACKET_BF16& _x) { \
23 return F32ToBf16(METHOD<PACKET_F>(Bf16ToF32(_x))); \
24 }
25
26namespace Eigen {
27
28struct bfloat16;
29
30namespace bfloat16_impl {
31
32// Make our own __bfloat16_raw definition.
35 explicit EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR __bfloat16_raw(unsigned short raw) : value(raw) {}
36 unsigned short value;
37};
38
40template <bool AssumeArgumentIsNormalOrInfinityOrZero>
42// Forward declarations of template specializations, to avoid Visual C++ 2019 errors, saying:
43// > error C2908: explicit specialization; 'float_to_bfloat16_rtne' has already been instantiated
44template <>
46template <>
49
53};
54
55} // namespace bfloat16_impl
56
57// Class definition.
59
61
63
65
67 : bfloat16_impl::bfloat16_base(bfloat16_impl::raw_uint16_to_bfloat16(b ? 0x3f80 : 0)) {}
68
69 template<class T>
71 : bfloat16_impl::bfloat16_base(bfloat16_impl::float_to_bfloat16_rtne<internal::is_integral<T>::value>(static_cast<float>(val))) {}
72
73 explicit EIGEN_DEVICE_FUNC bfloat16(float f)
74 : bfloat16_impl::bfloat16_base(bfloat16_impl::float_to_bfloat16_rtne<false>(f)) {}
75
76 // Following the convention of numpy, converting between complex and
77 // float will lead to loss of imag value.
78 template<typename RealScalar>
79 explicit EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR bfloat16(const std::complex<RealScalar>& val)
80 : bfloat16_impl::bfloat16_base(bfloat16_impl::float_to_bfloat16_rtne<false>(static_cast<float>(val.real()))) {}
81
82 EIGEN_DEVICE_FUNC operator float() const { // NOLINT: Allow implicit conversion to float, because it is lossless.
84 }
85};
86} // namespace Eigen
87
88namespace std {
89template<>
90struct numeric_limits<Eigen::bfloat16> {
91 static const bool is_specialized = true;
92 static const bool is_signed = true;
93 static const bool is_integer = false;
94 static const bool is_exact = false;
95 static const bool has_infinity = true;
96 static const bool has_quiet_NaN = true;
97 static const bool has_signaling_NaN = true;
98 static const float_denorm_style has_denorm = std::denorm_absent;
99 static const bool has_denorm_loss = false;
100 static const std::float_round_style round_style = numeric_limits<float>::round_style;
101 static const bool is_iec559 = false;
102 static const bool is_bounded = true;
103 static const bool is_modulo = false;
104 static const int digits = 8;
105 static const int digits10 = 2;
106 static const int max_digits10 = 4;
107 static const int radix = 2;
108 static const int min_exponent = numeric_limits<float>::min_exponent;
109 static const int min_exponent10 = numeric_limits<float>::min_exponent10;
110 static const int max_exponent = numeric_limits<float>::max_exponent;
111 static const int max_exponent10 = numeric_limits<float>::max_exponent10;
112 static const bool traps = numeric_limits<float>::traps;
113 static const bool tinyness_before = numeric_limits<float>::tinyness_before;
114
119 static Eigen::bfloat16 round_error() { return Eigen::bfloat16(0x3f00); }
124};
125
126// If std::numeric_limits<T> is specialized, should also specialize
127// std::numeric_limits<const T>, std::numeric_limits<volatile T>, and
128// std::numeric_limits<const volatile T>
129// https://stackoverflow.com/a/16519653/
130template<>
131struct numeric_limits<const Eigen::bfloat16> : numeric_limits<Eigen::bfloat16> {};
132template<>
133struct numeric_limits<volatile Eigen::bfloat16> : numeric_limits<Eigen::bfloat16> {};
134template<>
135struct numeric_limits<const volatile Eigen::bfloat16> : numeric_limits<Eigen::bfloat16> {};
136} // namespace std
137
138namespace Eigen {
139
140namespace bfloat16_impl {
141
142// We need to distinguish ‘clang as the CUDA compiler’ from ‘clang as the host compiler,
143// invoked by NVCC’ (e.g. on MacOS). The former needs to see both host and device implementation
144// of the functions, while the latter can only deal with one of them.
145#if !defined(EIGEN_HAS_NATIVE_BF16) || (EIGEN_COMP_CLANG && !EIGEN_COMP_NVCC) // Emulate support for bfloat16 floats
146
147#if EIGEN_COMP_CLANG && defined(EIGEN_CUDACC)
148// We need to provide emulated *host-side* BF16 operators for clang.
149#pragma push_macro("EIGEN_DEVICE_FUNC")
150#undef EIGEN_DEVICE_FUNC
151#if defined(EIGEN_HAS_CUDA_BF16) && defined(EIGEN_HAS_NATIVE_BF16)
152#define EIGEN_DEVICE_FUNC __host__
153#else // both host and device need emulated ops.
154#define EIGEN_DEVICE_FUNC __host__ __device__
155#endif
156#endif
157
158// Definitions for CPUs, mostly working through conversion
159// to/from fp32.
160
162 return bfloat16(float(a) + float(b));
163}
165 return bfloat16(float(a) + static_cast<float>(b));
166}
168 return bfloat16(static_cast<float>(a) + float(b));
169}
171 return bfloat16(float(a) * float(b));
172}
174 return bfloat16(float(a) - float(b));
175}
177 return bfloat16(float(a) / float(b));
178}
181 result.value = a.value ^ 0x8000;
182 return result;
183}
185 a = bfloat16(float(a) + float(b));
186 return a;
187}
189 a = bfloat16(float(a) * float(b));
190 return a;
191}
193 a = bfloat16(float(a) - float(b));
194 return a;
195}
197 a = bfloat16(float(a) / float(b));
198 return a;
199}
201 a += bfloat16(1);
202 return a;
203}
205 a -= bfloat16(1);
206 return a;
207}
209 bfloat16 original_value = a;
210 ++a;
211 return original_value;
212}
214 bfloat16 original_value = a;
215 --a;
216 return original_value;
217}
219 return numext::equal_strict(float(a),float(b));
220}
222 return numext::not_equal_strict(float(a), float(b));
223}
225 return float(a) < float(b);
226}
228 return float(a) <= float(b);
229}
231 return float(a) > float(b);
232}
234 return float(a) >= float(b);
235}
236
237#if EIGEN_COMP_CLANG && defined(EIGEN_CUDACC)
238#pragma pop_macro("EIGEN_DEVICE_FUNC")
239#endif
240#endif // Emulate support for bfloat16 floats
241
242// Division by an index. Do it in full float precision to avoid accuracy
243// issues in converting the denominator to bfloat16.
245 return bfloat16(static_cast<float>(a) / static_cast<float>(b));
246}
247
249 __bfloat16_raw output;
251 output.value = std::signbit(v) ? 0xFFC0: 0x7FC0;
252 return output;
253 }
254 const uint16_t* p = reinterpret_cast<const uint16_t*>(&v);
255#if defined(__BYTE_ORDER__) && __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
256 output.value = p[0];
257#else
258 output.value = p[1];
259#endif
260 return output;
261}
262
264 return __bfloat16_raw(value);
265}
266
268 return bf.value;
269}
270
271// float_to_bfloat16_rtne template specialization that does not make any
272// assumption about the value of its function argument (ff).
273template <>
275#if (defined(EIGEN_HAS_CUDA_BF16) && defined(EIGEN_HAS_HIP_BF16))
276 // Nothing to do here
277#else
278 __bfloat16_raw output;
279
281 // If the value is a NaN, squash it to a qNaN with msb of fraction set,
282 // this makes sure after truncation we don't end up with an inf.
283 //
284 // qNaN magic: All exponent bits set + most significant bit of fraction
285 // set.
286 output.value = std::signbit(ff) ? 0xFFC0: 0x7FC0;
287 } else {
288 // Fast rounding algorithm that rounds a half value to nearest even. This
289 // reduces expected error when we convert a large number of floats. Here
290 // is how it works:
291 //
292 // Definitions:
293 // To convert a float 32 to bfloat16, a float 32 can be viewed as 32 bits
294 // with the following tags:
295 //
296 // Sign | Exp (8 bits) | Frac (23 bits)
297 // S EEEEEEEE FFFFFFLRTTTTTTTTTTTTTTT
298 //
299 // S: Sign bit.
300 // E: Exponent bits.
301 // F: First 6 bits of fraction.
302 // L: Least significant bit of resulting bfloat16 if we truncate away the
303 // rest of the float32. This is also the 7th bit of fraction
304 // R: Rounding bit, 8th bit of fraction.
305 // T: Sticky bits, rest of fraction, 15 bits.
306 //
307 // To round half to nearest even, there are 3 cases where we want to round
308 // down (simply truncate the result of the bits away, which consists of
309 // rounding bit and sticky bits) and two cases where we want to round up
310 // (truncate then add one to the result).
311 //
312 // The fast converting algorithm simply adds lsb (L) to 0x7fff (15 bits of
313 // 1s) as the rounding bias, adds the rounding bias to the input, then
314 // truncates the last 16 bits away.
315 //
316 // To understand how it works, we can analyze this algorithm case by case:
317 //
318 // 1. L = 0, R = 0:
319 // Expect: round down, this is less than half value.
320 //
321 // Algorithm:
322 // - Rounding bias: 0x7fff + 0 = 0x7fff
323 // - Adding rounding bias to input may create any carry, depending on
324 // whether there is any value set to 1 in T bits.
325 // - R may be set to 1 if there is a carry.
326 // - L remains 0.
327 // - Note that this case also handles Inf and -Inf, where all fraction
328 // bits, including L, R and Ts are all 0. The output remains Inf after
329 // this algorithm.
330 //
331 // 2. L = 1, R = 0:
332 // Expect: round down, this is less than half value.
333 //
334 // Algorithm:
335 // - Rounding bias: 0x7fff + 1 = 0x8000
336 // - Adding rounding bias to input doesn't change sticky bits but
337 // adds 1 to rounding bit.
338 // - L remains 1.
339 //
340 // 3. L = 0, R = 1, all of T are 0:
341 // Expect: round down, this is exactly at half, the result is already
342 // even (L=0).
343 //
344 // Algorithm:
345 // - Rounding bias: 0x7fff + 0 = 0x7fff
346 // - Adding rounding bias to input sets all sticky bits to 1, but
347 // doesn't create a carry.
348 // - R remains 1.
349 // - L remains 0.
350 //
351 // 4. L = 1, R = 1:
352 // Expect: round up, this is exactly at half, the result needs to be
353 // round to the next even number.
354 //
355 // Algorithm:
356 // - Rounding bias: 0x7fff + 1 = 0x8000
357 // - Adding rounding bias to input doesn't change sticky bits, but
358 // creates a carry from rounding bit.
359 // - The carry sets L to 0, creates another carry bit and propagate
360 // forward to F bits.
361 // - If all the F bits are 1, a carry then propagates to the exponent
362 // bits, which then creates the minimum value with the next exponent
363 // value. Note that we won't have the case where exponents are all 1,
364 // since that's either a NaN (handled in the other if condition) or inf
365 // (handled in case 1).
366 //
367 // 5. L = 0, R = 1, any of T is 1:
368 // Expect: round up, this is greater than half.
369 //
370 // Algorithm:
371 // - Rounding bias: 0x7fff + 0 = 0x7fff
372 // - Adding rounding bias to input creates a carry from sticky bits,
373 // sets rounding bit to 0, then create another carry.
374 // - The second carry sets L to 1.
375 //
376 // Examples:
377 //
378 // Exact half value that is already even:
379 // Input:
380 // Sign | Exp (8 bit) | Frac (first 7 bit) | Frac (last 16 bit)
381 // S E E E E E E E E F F F F F F L RTTTTTTTTTTTTTTT
382 // 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 0 1000000000000000
383 //
384 // This falls into case 3. We truncate the rest of 16 bits and no
385 // carry is created into F and L:
386 //
387 // Output:
388 // Sign | Exp (8 bit) | Frac (first 7 bit)
389 // S E E E E E E E E F F F F F F L
390 // 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 0
391 //
392 // Exact half value, round to next even number:
393 // Input:
394 // Sign | Exp (8 bit) | Frac (first 7 bit) | Frac (last 16 bit)
395 // S E E E E E E E E F F F F F F L RTTTTTTTTTTTTTTT
396 // 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 1000000000000000
397 //
398 // This falls into case 4. We create a carry from R and T,
399 // which then propagates into L and F:
400 //
401 // Output:
402 // Sign | Exp (8 bit) | Frac (first 7 bit)
403 // S E E E E E E E E F F F F F F L
404 // 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 0
405 //
406 //
407 // Max denormal value round to min normal value:
408 // Input:
409 // Sign | Exp (8 bit) | Frac (first 7 bit) | Frac (last 16 bit)
410 // S E E E E E E E E F F F F F F L RTTTTTTTTTTTTTTT
411 // 0 0 0 0 0 0 0 0 0 1 1 1 1 1 1 1 1111111111111111
412 //
413 // This falls into case 4. We create a carry from R and T,
414 // propagate into L and F, which then propagates into exponent
415 // bits:
416 //
417 // Output:
418 // Sign | Exp (8 bit) | Frac (first 7 bit)
419 // S E E E E E E E E F F F F F F L
420 // 0 0 0 0 0 0 0 0 1 0 0 0 0 0 0 0
421 //
422 // Max normal value round to Inf:
423 // Input:
424 // Sign | Exp (8 bit) | Frac (first 7 bit) | Frac (last 16 bit)
425 // S E E E E E E E E F F F F F F L RTTTTTTTTTTTTTTT
426 // 0 1 1 1 1 1 1 1 0 1 1 1 1 1 1 1 1111111111111111
427 //
428 // This falls into case 4. We create a carry from R and T,
429 // propagate into L and F, which then propagates into exponent
430 // bits:
431 //
432 // Sign | Exp (8 bit) | Frac (first 7 bit)
433 // S E E E E E E E E F F F F F F L
434 // 0 1 1 1 1 1 1 1 1 0 0 0 0 0 0 0
435
436 // At this point, ff must be either a normal float, or +/-infinity.
437 output = float_to_bfloat16_rtne<true>(ff);
438 }
439 return output;
440#endif
441}
442
443// float_to_bfloat16_rtne template specialization that assumes that its function
444// argument (ff) is either a normal floating point number, or +/-infinity, or
445// zero. Used to improve the runtime performance of conversion from an integer
446// type to bfloat16.
447template <>
449#if (defined(EIGEN_HAS_CUDA_BF16) && defined(EIGEN_HAS_HIP_BF16))
450 // Nothing to do here
451#else
452 numext::uint32_t input = numext::bit_cast<numext::uint32_t>(ff);
453 __bfloat16_raw output;
454
455 // Least significant bit of resulting bfloat.
456 numext::uint32_t lsb = (input >> 16) & 1;
457 numext::uint32_t rounding_bias = 0x7fff + lsb;
458 input += rounding_bias;
459 output.value = static_cast<numext::uint16_t>(input >> 16);
460 return output;
461#endif
462}
463
465 float result = 0;
466 unsigned short* q = reinterpret_cast<unsigned short*>(&result);
467#if defined(__BYTE_ORDER__) && __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
468 q[0] = h.value;
469#else
470 q[1] = h.value;
471#endif
472 return result;
473}
474// --- standard functions ---
475
478 return (isinf)(float(a));
479}
482 return (isnan)(float(a));
483}
485 return !(isinf EIGEN_NOT_A_MACRO (a)) && !(isnan EIGEN_NOT_A_MACRO (a));
486}
487
490 result.value = a.value & 0x7FFF;
491 return result;
492}
494 return bfloat16(::expf(float(a)));
495}
497 return bfloat16(numext::expm1(float(a)));
498}
500 return bfloat16(::logf(float(a)));
501}
503 return bfloat16(numext::log1p(float(a)));
504}
506 return bfloat16(::log10f(float(a)));
507}
509 return bfloat16(static_cast<float>(EIGEN_LOG2E) * ::logf(float(a)));
510}
512 return bfloat16(::sqrtf(float(a)));
513}
515 return bfloat16(::powf(float(a), float(b)));
516}
518 return bfloat16(::sinf(float(a)));
519}
521 return bfloat16(::cosf(float(a)));
522}
524 return bfloat16(::tanf(float(a)));
525}
527 return bfloat16(::asinf(float(a)));
528}
530 return bfloat16(::acosf(float(a)));
531}
533 return bfloat16(::atanf(float(a)));
534}
536 return bfloat16(::sinhf(float(a)));
537}
539 return bfloat16(::coshf(float(a)));
540}
542 return bfloat16(::tanhf(float(a)));
543}
544#if EIGEN_HAS_CXX11_MATH
546 return bfloat16(::asinhf(float(a)));
547}
548EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 acosh(const bfloat16& a) {
549 return bfloat16(::acoshf(float(a)));
550}
551EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 atanh(const bfloat16& a) {
552 return bfloat16(::atanhf(float(a)));
553}
554#endif
556 return bfloat16(::floorf(float(a)));
557}
559 return bfloat16(::ceilf(float(a)));
560}
562 return bfloat16(::rintf(float(a)));
563}
565 return bfloat16(::roundf(float(a)));
566}
568 return bfloat16(::fmodf(float(a), float(b)));
569}
570
572 const float f1 = static_cast<float>(a);
573 const float f2 = static_cast<float>(b);
574 return f2 < f1 ? b : a;
575}
577 const float f1 = static_cast<float>(a);
578 const float f2 = static_cast<float>(b);
579 return f1 < f2 ? b : a;
580}
581
583 const float f1 = static_cast<float>(a);
584 const float f2 = static_cast<float>(b);
585 return bfloat16(::fminf(f1, f2));
586}
588 const float f1 = static_cast<float>(a);
589 const float f2 = static_cast<float>(b);
590 return bfloat16(::fmaxf(f1, f2));
591}
592
593#ifndef EIGEN_NO_IO
594EIGEN_ALWAYS_INLINE std::ostream& operator << (std::ostream& os, const bfloat16& v) {
595 os << static_cast<float>(v);
596 return os;
597}
598#endif
599
600} // namespace bfloat16_impl
601
602namespace internal {
603
604template<>
605struct random_default_impl<bfloat16, false, false>
606{
607 static inline bfloat16 run(const bfloat16& x, const bfloat16& y)
608 {
609 return x + (y-x) * bfloat16(float(std::rand()) / float(RAND_MAX));
610 }
611 static inline bfloat16 run()
612 {
613 return run(bfloat16(-1.f), bfloat16(1.f));
614 }
615};
616
617template<> struct is_arithmetic<bfloat16> { enum { value = true }; };
618
619} // namespace internal
620
621template<> struct NumTraits<Eigen::bfloat16>
622 : GenericNumTraits<Eigen::bfloat16>
623{
624 enum {
625 IsSigned = true,
626 IsInteger = false,
627 IsComplex = false,
629 };
630
633 }
635 return bfloat16_impl::raw_uint16_to_bfloat16(0x3D4D); // bfloat16(5e-2f);
636
637 }
640 }
643 }
646 }
649 }
650};
651
652} // namespace Eigen
653
654namespace Eigen {
655namespace numext {
656
657template<>
659bool (isnan)(const Eigen::bfloat16& h) {
660 return (bfloat16_impl::isnan)(h);
661}
662
663template<>
665bool (isinf)(const Eigen::bfloat16& h) {
666 return (bfloat16_impl::isinf)(h);
667}
668
669template<>
671bool (isfinite)(const Eigen::bfloat16& h) {
672 return (bfloat16_impl::isfinite)(h);
673}
674
675template <>
676EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC Eigen::bfloat16 bit_cast<Eigen::bfloat16, uint16_t>(const uint16_t& src) {
678}
679
680template <>
681EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC uint16_t bit_cast<uint16_t, Eigen::bfloat16>(const Eigen::bfloat16& src) {
683}
684
685} // namespace numext
686} // namespace Eigen
687
688#if EIGEN_HAS_STD_HASH
689namespace std {
690template <>
691struct hash<Eigen::bfloat16> {
692 EIGEN_STRONG_INLINE std::size_t operator()(const Eigen::bfloat16& a) const {
693 return static_cast<std::size_t>(Eigen::numext::bit_cast<Eigen::numext::uint16_t>(a));
694 }
695};
696} // namespace std
697#endif
698
699
700#endif // EIGEN_BFLOAT16_H
EIGEN_DEVICE_FUNC RealReturnType real() const
Definition: CommonCwiseUnaryOps.h:100
internal::enable_if< internal::valid_indexed_view_overload< RowIndices, ColIndices >::value &&internal::traits< typenameEIGEN_INDEXED_VIEW_METHOD_TYPE< RowIndices, ColIndices >::type >::ReturnAsIndexedView, typenameEIGEN_INDEXED_VIEW_METHOD_TYPE< RowIndices, ColIndices >::type >::type operator()(const RowIndices &rowIndices, const ColIndices &colIndices) EIGEN_INDEXED_VIEW_METHOD_CONST
Definition: IndexedViewMethods.h:73
#define EIGEN_ALWAYS_INLINE
Definition: Macros.h:942
#define EIGEN_USING_STD(FUNC)
Definition: Macros.h:1195
#define EIGEN_CONSTEXPR
Definition: Macros.h:797
#define EIGEN_DEVICE_FUNC
Definition: Macros.h:986
#define EIGEN_NOT_A_MACRO
Definition: Macros.h:906
#define EIGEN_STRONG_INLINE
Definition: Macros.h:927
#define EIGEN_LOG2E
Definition: MathFunctions.h:17
constexpr return_t< T > acosh(const T x) noexcept
Compile-time inverse hyperbolic cosine function.
Definition: acosh.hpp:62
constexpr return_t< T > asinh(const T x) noexcept
Compile-time inverse hyperbolic sine function.
Definition: asinh.hpp:59
constexpr return_t< T > atanh(const T x) noexcept
Compile-time inverse hyperbolic tangent function.
Definition: atanh.hpp:73
Definition: core.h:1240
constexpr auto digits10() noexcept -> int
Definition: format.h:1154
bool_constant< is_integral< T >::value &&!std::is_same< T, bool >::value &&!std::is_same< T, char >::value &&!std::is_same< T, wchar_t >::value > is_integer
Definition: format.h:3418
std::integral_constant< bool, std::numeric_limits< T >::is_signed||std::is_same< T, int128_opt >::value > is_signed
Definition: format.h:996
constexpr common_t< T1, T2 > max(const T1 x, const T2 y) noexcept
Compile-time pairwise maximum function.
Definition: max.hpp:35
constexpr common_t< T1, T2 > min(const T1 x, const T2 y) noexcept
Compile-time pairwise minimum function.
Definition: min.hpp:35
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC __bfloat16_raw float_to_bfloat16_rtne(float ff)
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16() max(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:576
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 operator/(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:176
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 tanh(const bfloat16 &a)
Definition: BFloat16.h:541
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bool operator<(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:224
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 & operator*=(bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:188
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 floor(const bfloat16 &a)
Definition: BFloat16.h:555
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bool operator>=(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:233
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 operator+(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:161
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 cosh(const bfloat16 &a)
Definition: BFloat16.h:538
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16() min(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:571
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 ceil(const bfloat16 &a)
Definition: BFloat16.h:558
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 acos(const bfloat16 &a)
Definition: BFloat16.h:529
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 log2(const bfloat16 &a)
Definition: BFloat16.h:508
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR __bfloat16_raw raw_uint16_to_bfloat16(numext::uint16_t value)
Definition: BFloat16.h:263
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 rint(const bfloat16 &a)
Definition: BFloat16.h:561
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 & operator/=(bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:196
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 operator-(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:173
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC __bfloat16_raw truncate_to_bfloat16(const float v)
Definition: BFloat16.h:248
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 operator--(bfloat16 &a)
Definition: BFloat16.h:204
EIGEN_ALWAYS_INLINE std::ostream & operator<<(std::ostream &os, const bfloat16 &v)
Definition: BFloat16.h:594
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 & operator-=(bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:192
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 asin(const bfloat16 &a)
Definition: BFloat16.h:526
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bool() isfinite(const bfloat16 &a)
Definition: BFloat16.h:484
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 fmod(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:567
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 log10(const bfloat16 &a)
Definition: BFloat16.h:505
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR __bfloat16_raw raw_uint16_to_bfloat16(unsigned short value)
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 fmin(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:582
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 atan(const bfloat16 &a)
Definition: BFloat16.h:532
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 fmax(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:587
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 cos(const bfloat16 &a)
Definition: BFloat16.h:520
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 exp(const bfloat16 &a)
Definition: BFloat16.h:493
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 pow(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:514
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR numext::uint16_t raw_bfloat16_as_uint16(const __bfloat16_raw &bf)
Definition: BFloat16.h:267
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 expm1(const bfloat16 &a)
Definition: BFloat16.h:496
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 sqrt(const bfloat16 &a)
Definition: BFloat16.h:511
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bool operator==(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:218
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC __bfloat16_raw float_to_bfloat16_rtne< false >(float ff)
Definition: BFloat16.h:274
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 round(const bfloat16 &a)
Definition: BFloat16.h:564
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 log(const bfloat16 &a)
Definition: BFloat16.h:499
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bool operator!=(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:221
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bool operator>(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:230
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 abs(const bfloat16 &a)
Definition: BFloat16.h:488
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 sinh(const bfloat16 &a)
Definition: BFloat16.h:535
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bool() isnan(const bfloat16 &a)
Definition: BFloat16.h:480
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC __bfloat16_raw float_to_bfloat16_rtne< true >(float ff)
Definition: BFloat16.h:448
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 tan(const bfloat16 &a)
Definition: BFloat16.h:523
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 operator*(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:170
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bool operator<=(const bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:227
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 sin(const bfloat16 &a)
Definition: BFloat16.h:517
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 & operator+=(bfloat16 &a, const bfloat16 &b)
Definition: BFloat16.h:184
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bool() isinf(const bfloat16 &a)
Definition: BFloat16.h:476
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 log1p(const bfloat16 &a)
Definition: BFloat16.h:502
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC float bfloat16_to_float(__bfloat16_raw h)
Definition: BFloat16.h:464
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bfloat16 operator++(bfloat16 &a)
Definition: BFloat16.h:200
const Scalar & y
Definition: MathFunctions.h:821
::uint16_t uint16_t
Definition: Meta.h:54
EIGEN_DEVICE_FUNC bool() isfinite(const T &x)
Definition: MathFunctions.h:1372
EIGEN_DEVICE_FUNC bool() isinf(const T &x)
Definition: MathFunctions.h:1371
::uint32_t uint32_t
Definition: Meta.h:56
EIGEN_DEVICE_FUNC bool() isnan(const T &x)
Definition: MathFunctions.h:1370
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bool equal_strict(const X &x, const Y &y)
Definition: Meta.h:787
EIGEN_STRONG_INLINE EIGEN_DEVICE_FUNC bool not_equal_strict(const X &x, const Y &y)
Definition: Meta.h:798
Namespace containing all symbols from the Eigen library.
Definition: MatrixExponential.h:16
EIGEN_DEFAULT_DENSE_INDEX_TYPE Index
The Index type as used for the API.
Definition: Meta.h:74
Definition: format.h:2555
result
Definition: format.h:2556
Definition: Eigen_Colamd.h:50
Definition: StdDeque.h:50
static constexpr const unit_t< compound_unit< energy::joule, time::seconds > > h(6.626070040e-34)
Planck constant.
b
Definition: data.h:44
constexpr bool signbit(const T x) noexcept
Compile-time sign bit detection function.
Definition: signbit.hpp:34
Definition: NumTraits.h:153
@ RequireInitialization
Definition: NumTraits.h:158
@ IsSigned
Definition: NumTraits.h:156
@ IsInteger
Definition: NumTraits.h:155
@ IsComplex
Definition: NumTraits.h:157
EIGEN_DEVICE_FUNC static EIGEN_CONSTEXPR EIGEN_STRONG_INLINE Eigen::bfloat16 highest()
Definition: BFloat16.h:638
EIGEN_DEVICE_FUNC static EIGEN_CONSTEXPR EIGEN_STRONG_INLINE Eigen::bfloat16 lowest()
Definition: BFloat16.h:641
EIGEN_DEVICE_FUNC static EIGEN_CONSTEXPR EIGEN_STRONG_INLINE Eigen::bfloat16 infinity()
Definition: BFloat16.h:644
EIGEN_DEVICE_FUNC static EIGEN_CONSTEXPR EIGEN_STRONG_INLINE Eigen::bfloat16 quiet_NaN()
Definition: BFloat16.h:647
EIGEN_DEVICE_FUNC static EIGEN_CONSTEXPR EIGEN_STRONG_INLINE Eigen::bfloat16 dummy_precision()
Definition: BFloat16.h:634
EIGEN_DEVICE_FUNC static EIGEN_CONSTEXPR EIGEN_STRONG_INLINE Eigen::bfloat16 epsilon()
Definition: BFloat16.h:631
Holds information about the various numeric (i.e.
Definition: NumTraits.h:233
Definition: BFloat16.h:33
EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR __bfloat16_raw()
Definition: BFloat16.h:34
unsigned short value
Definition: BFloat16.h:36
EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR __bfloat16_raw(unsigned short raw)
Definition: BFloat16.h:35
Definition: BFloat16.h:50
EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR bfloat16_base()
Definition: BFloat16.h:51
EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR bfloat16_base(const __bfloat16_raw &h)
Definition: BFloat16.h:52
Definition: BFloat16.h:58
bfloat16_impl::__bfloat16_raw __bfloat16_raw
Definition: BFloat16.h:60
EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR bfloat16(const __bfloat16_raw &h)
Definition: BFloat16.h:64
EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR bfloat16(const std::complex< RealScalar > &val)
Definition: BFloat16.h:79
EIGEN_DEVICE_FUNC bfloat16(float f)
Definition: BFloat16.h:73
EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR bfloat16(T val)
Definition: BFloat16.h:70
EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR bfloat16()
Definition: BFloat16.h:62
EIGEN_DEVICE_FUNC EIGEN_CONSTEXPR bfloat16(bool b)
Definition: BFloat16.h:66
Definition: Meta.h:133
static bfloat16 run()
Definition: BFloat16.h:611
static bfloat16 run(const bfloat16 &x, const bfloat16 &y)
Definition: BFloat16.h:607
Definition: MathFunctions.h:810
Definition: format.h:989
static Eigen::bfloat16 signaling_NaN()
Definition: BFloat16.h:122
static Eigen::bfloat16 epsilon()
Definition: BFloat16.h:118
static Eigen::bfloat16 lowest()
Definition: BFloat16.h:116
static Eigen::bfloat16 denorm_min()
Definition: BFloat16.h:123
static Eigen::bfloat16 round_error()
Definition: BFloat16.h:119
static Eigen::bfloat16 quiet_NaN()
Definition: BFloat16.h:121
static Eigen::bfloat16 infinity()
Definition: BFloat16.h:120