Please help us learn more about our user community by answering this short survey: https://forms.gle/wpyrxWi18ox9Z5ae9
Eigen  3.4.0
 
Loading...
Searching...
No Matches
SSE/TypeCasting.h
1// This file is part of Eigen, a lightweight C++ template library
2// for linear algebra.
3//
4// Copyright (C) 2015 Benoit Steiner <benoit.steiner.goog@gmail.com>
5//
6// This Source Code Form is subject to the terms of the Mozilla
7// Public License v. 2.0. If a copy of the MPL was not distributed
8// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
9
10#ifndef EIGEN_TYPE_CASTING_SSE_H
11#define EIGEN_TYPE_CASTING_SSE_H
12
13namespace Eigen {
14
15namespace internal {
16
17#ifndef EIGEN_VECTORIZE_AVX
18template <>
19struct type_casting_traits<float, int> {
20 enum {
21 VectorizedCast = 1,
22 SrcCoeffRatio = 1,
23 TgtCoeffRatio = 1
24 };
25};
26
27template <>
28struct type_casting_traits<int, float> {
29 enum {
30 VectorizedCast = 1,
31 SrcCoeffRatio = 1,
32 TgtCoeffRatio = 1
33 };
34};
35
36template <>
37struct type_casting_traits<double, float> {
38 enum {
39 VectorizedCast = 1,
40 SrcCoeffRatio = 2,
41 TgtCoeffRatio = 1
42 };
43};
44
45template <>
46struct type_casting_traits<float, double> {
47 enum {
48 VectorizedCast = 1,
49 SrcCoeffRatio = 1,
50 TgtCoeffRatio = 2
51 };
52};
53#endif
54
55template<> EIGEN_STRONG_INLINE Packet4i pcast<Packet4f, Packet4i>(const Packet4f& a) {
56 return _mm_cvttps_epi32(a);
57}
58
59template<> EIGEN_STRONG_INLINE Packet4f pcast<Packet4i, Packet4f>(const Packet4i& a) {
60 return _mm_cvtepi32_ps(a);
61}
62
63template<> EIGEN_STRONG_INLINE Packet4f pcast<Packet2d, Packet4f>(const Packet2d& a, const Packet2d& b) {
64 return _mm_shuffle_ps(_mm_cvtpd_ps(a), _mm_cvtpd_ps(b), (1 << 2) | (1 << 6));
65}
66
67template<> EIGEN_STRONG_INLINE Packet2d pcast<Packet4f, Packet2d>(const Packet4f& a) {
68 // Simply discard the second half of the input
69 return _mm_cvtps_pd(a);
70}
71
72template<> EIGEN_STRONG_INLINE Packet4i preinterpret<Packet4i,Packet4f>(const Packet4f& a) {
73 return _mm_castps_si128(a);
74}
75
76template<> EIGEN_STRONG_INLINE Packet4f preinterpret<Packet4f,Packet4i>(const Packet4i& a) {
77 return _mm_castsi128_ps(a);
78}
79
80template<> EIGEN_STRONG_INLINE Packet2d preinterpret<Packet2d,Packet4i>(const Packet4i& a) {
81 return _mm_castsi128_pd(a);
82}
83
84template<> EIGEN_STRONG_INLINE Packet4i preinterpret<Packet4i,Packet2d>(const Packet2d& a) {
85 return _mm_castpd_si128(a);
86}
87
88// Disable the following code since it's broken on too many platforms / compilers.
89//#elif defined(EIGEN_VECTORIZE_SSE) && (!EIGEN_ARCH_x86_64) && (!EIGEN_COMP_MSVC)
90#if 0
91
92template <>
93struct type_casting_traits<Eigen::half, float> {
94 enum {
95 VectorizedCast = 1,
96 SrcCoeffRatio = 1,
97 TgtCoeffRatio = 1
98 };
99};
100
101template<> EIGEN_STRONG_INLINE Packet4f pcast<Packet4h, Packet4f>(const Packet4h& a) {
102 __int64_t a64 = _mm_cvtm64_si64(a.x);
103 Eigen::half h = raw_uint16_to_half(static_cast<unsigned short>(a64));
104 float f1 = static_cast<float>(h);
105 h = raw_uint16_to_half(static_cast<unsigned short>(a64 >> 16));
106 float f2 = static_cast<float>(h);
107 h = raw_uint16_to_half(static_cast<unsigned short>(a64 >> 32));
108 float f3 = static_cast<float>(h);
109 h = raw_uint16_to_half(static_cast<unsigned short>(a64 >> 48));
110 float f4 = static_cast<float>(h);
111 return _mm_set_ps(f4, f3, f2, f1);
112}
113
114template <>
115struct type_casting_traits<float, Eigen::half> {
116 enum {
117 VectorizedCast = 1,
118 SrcCoeffRatio = 1,
119 TgtCoeffRatio = 1
120 };
121};
122
123template<> EIGEN_STRONG_INLINE Packet4h pcast<Packet4f, Packet4h>(const Packet4f& a) {
124 EIGEN_ALIGN16 float aux[4];
125 pstore(aux, a);
126 Eigen::half h0(aux[0]);
127 Eigen::half h1(aux[1]);
128 Eigen::half h2(aux[2]);
129 Eigen::half h3(aux[3]);
130
131 Packet4h result;
132 result.x = _mm_set_pi16(h3.x, h2.x, h1.x, h0.x);
133 return result;
134}
135
136#endif
137
138} // end namespace internal
139
140} // end namespace Eigen
141
142#endif // EIGEN_TYPE_CASTING_SSE_H
Namespace containing all symbols from the Eigen library.
Definition: Core:141