2022-10-21-dev/doxygen/PSEUDO__F32vec4_8h_source.html

 #ifndef L1Algo_PSEUDO_F32vec4_H
 #define L1Algo_PSEUDO_F32vec4_H

 #include <iostream>
 #include <cmath>
 #include "vec_arithmetic.h"

 /**********************************
  *
  *   Vector of four floats
  *
  **********************************/

 float min(float x, float y);
 float max(float x, float y);
 float asgnb(float x, float y);
 float rsqrt(float x);
 float rcp(float x);
 float sgn(float x);

 class F32vec4 {

  public:
   float v[4];

   float &operator[](int i) { return ((float *)&v)[i]; }
   float operator[](int i) const { return ((float *)&v)[i]; }

   F32vec4() {}
   F32vec4(const F32vec4 &a)
   {
     v[0] = a.v[0];
     v[1] = a.v[1];
     v[2] = a.v[2];
     v[3] = a.v[3];
   }
   F32vec4(const float &a)
   {
     v[0] = a;
     v[1] = a;
     v[2] = a;
     v[3] = a;
   }

   F32vec4(const float &f0, const float &f1, const float &f2, const float &f3)
   {
     v[0] = f0;
     v[1] = f1;
     v[2] = f2;
     v[3] = f3;
   }

 #define _f2(A, B, F)          \
   F32vec4 z;                  \
   z.v[0] = F(A.v[0], B.v[0]); \
   z.v[1] = F(A.v[1], B.v[1]); \
   z.v[2] = F(A.v[2], B.v[2]); \
   z.v[3] = F(A.v[3], B.v[3]); \
   return z;
 #define _f1(A, F)     \
   F32vec4 z;          \
   z.v[0] = F(A.v[0]); \
   z.v[1] = F(A.v[1]); \
   z.v[2] = F(A.v[2]); \
   z.v[3] = F(A.v[3]); \
   return z;
 #define _op(A, B, O)        \
   F32vec4 z;                \
   z.v[0] = A.v[0] O B.v[0]; \
   z.v[1] = A.v[1] O B.v[1]; \
   z.v[2] = A.v[2] O B.v[2]; \
   z.v[3] = A.v[3] O B.v[3]; \
   return z;

   /* Arithmetic Operators */
   friend F32vec4 operator+(const F32vec4 &a, const F32vec4 &b) { _op(a, b, +) }
   friend F32vec4 operator-(const F32vec4 &a, const F32vec4 &b) { _op(a, b, -) }
   friend F32vec4 operator*(const F32vec4 &a, const F32vec4 &b) { _op(a, b, *) }
   friend F32vec4 operator/(const F32vec4 &a, const F32vec4 &b) { _op(a, b, /) }

   /* Comparison */
   friend F32vec4 operator<(const F32vec4 &a, const F32vec4 &b) { _op(a, b, <) }
   friend F32vec4 operator<=(const F32vec4 &a, const F32vec4 &b) { _op(a, b, <=) }
   friend F32vec4 operator>(const F32vec4 &a, const F32vec4 &b) { _op(a, b, >) }
   friend F32vec4 operator>=(const F32vec4 &a, const F32vec4 &b) { _op(a, b, >=) }

   /* Logic */
   friend F32vec4 operator&(const F32vec4 &a, const F32vec4 &b) { _op(a, b, &&) }
   friend F32vec4 operator|(const F32vec4 &a, const F32vec4 &b) { _op(a, b, ||) }
   friend F32vec4 operator||(const F32vec4 &a, const F32vec4 &b) { _op(a, b, ||) }

   friend F32vec4 operator!(const F32vec4 &a)
   {
     F32vec4 z;
     z[0] = !a[0];
     z[1] = !a[1];
     z[2] = !a[2];
     z[3] = !a[3];

     return z;
   }

   friend F32vec4 if3(const F32vec4 &a, const F32vec4 &b, const F32vec4 &c)
   {
     F32vec4 z;
     z[0] = (a[0]) ? b[0] : c[0];
     z[1] = (a[1]) ? b[1] : c[1];
     z[2] = (a[2]) ? b[2] : c[2];
     z[3] = (a[3]) ? b[3] : c[3];

     return z;
   }

 #define NotEmpty(a) bool((a)[0]) | bool((a)[1]) | bool((a)[2]) | bool((a)[3])
 #define Empty(a) !(bool((a)[0]) | bool((a)[1]) | bool((a)[2]) | bool((a)[3]))
   // bool NotEmpty(const F32vec4 &a) { return a[0]||a[1]||a[2]||a[3]; }
   // bool    Empty(const F32vec4 &a) { return !(a[0]||a[1]||a[2]||a[3]); } // optimize
   friend F32vec4 bool2int(const F32vec4 &a)
   { // mask returned
     return if3(a, 1, 0);
   }

   /* Functions */
   friend float min(float x, float y) { return x < y ? x : y; }
   friend float max(float x, float y) { return x < y ? y : x; }
   friend float asgnb(float x, float y) { return y >= 0 ? fabs(x) : -fabs(x); }
   friend float rsqrt(float x) { return 1. / sqrt(x); }
   friend float rcp(float x) { return 1. / x; }
   friend float sgn(float x) { return x >= 0 ? 1 : -1; }

   friend F32vec4 min(const F32vec4 &a, const F32vec4 &b) { _f2(a, b, min) }
   friend F32vec4 max(const F32vec4 &a, const F32vec4 &b) { _f2(a, b, max) }
   friend F32vec4 asgnb(const F32vec4 &a, const F32vec4 &b) { _f2(a, b, asgnb) }
   friend F32vec4 sqrt(const F32vec4 &a) { _f1(a, sqrt) }
   friend F32vec4 rsqrt(const F32vec4 &a) { _f1(a, rsqrt) }
   friend F32vec4 rcp(const F32vec4 &a) { _f1(a, rcp) }
   friend F32vec4 fabs(const F32vec4 &a) { _f1(a, fabs) }
   friend F32vec4 sgn(const F32vec4 &a) { _f1(a, sgn) }
   friend F32vec4 exp(const F32vec4 &a) { _f1(a, exp) }
   friend F32vec4 log(const F32vec4 &a) { _f1(a, log) }
   friend F32vec4 sin(const F32vec4 &a) { _f1(a, sin) }
   friend F32vec4 cos(const F32vec4 &a) { _f1(a, cos) }
 #undef _f1
 #undef _f2
 #undef _op

   /* Define all operators for consistensy */

   vec_arithmetic(F32vec4, float);

   friend ostream &operator<<(ostream &strm, const F32vec4 &a)
   {
     strm << a[0] << " " << a[1] << " " << a[2] << " " << a[3];
     return strm;
   }

   friend istream &operator>>(istream &strm, F32vec4 &a)
   {
     float tmp;
     strm >> tmp;
     a = tmp;
     return strm;
   }

 } __attribute__((aligned(16)));
 ;

 typedef F32vec4 fvec;
 typedef float fscal;
 const int fvecLen = 4;
 //#define fvec_true  _f32vec4_true
 //#define fvec_false _f32vec4_false
 #define _fvecalignment

 namespace nsL1 {
 template <typename T>
 struct vector {
   typedef std::vector<T> TStd;
   typedef std::vector<T> TSimd;
 };

 typedef nsL1::vector<fvec>::TSimd vector_fvec;
 }; // namespace nsL1

 template <typename T>
 struct nsL1vector : public nsL1::vector<T> // just for use std::vector simultaniosly
 {
 };

 #endif
F32vec4
Definition: P4_F32vec4.h:38

nsL1vector
Definition: PSEUDO_F32vec1.h:152

asgnb
float asgnb(float x, float y)
Definition: PSEUDO_F32vec4.h:124

fvecLen
const int fvecLen
Definition: PSEUDO_F32vec4.h:170

F32vec4::operator!
friend F32vec4 operator!(const F32vec4 &a)
Definition: PSEUDO_F32vec4.h:92

F32vec4::log
friend F32vec4 log(const F32vec4 &a)
Definition: P4_F32vec4.h:154

F32vec4::rcp
friend float rcp(float x)
Definition: PSEUDO_F32vec4.h:128

min
float min(float x, float y)
Definition: PSEUDO_F32vec4.h:122

_op
#define _op(A, B, O)
Definition: PSEUDO_F32vec4.h:65

F32vec4::F32vec4
F32vec4(const float &a)
Definition: PSEUDO_F32vec4.h:37

F32vec4::max
friend F32vec4 max(const F32vec4 &a, const F32vec4 &b)
Definition: P4_F32vec4.h:62

nsL1
Definition: PSEUDO_F32vec1.h:141

F32vec4::rsqrt
friend F32vec4 rsqrt(const F32vec4 &a)
Definition: P4_F32vec4.h:68

F32vec4::F32vec4
F32vec4(const float &f0, const float &f1, const float &f2, const float &f3)
Definition: PSEUDO_F32vec4.h:45

nsL1::vector_fvec
nsL1::vector< fvec >::TSimd vector_fvec
Definition: PSEUDO_F32vec1.h:148

_f2
#define _f2(A, B, F)
Definition: PSEUDO_F32vec4.h:51

i
unsigned int i
Definition: P4_F32vec4.h:21

vec_arithmetic.h

F32vec4::vec_arithmetic
vec_arithmetic(F32vec4, float)

F32vec4::operator>
friend F32vec4 operator>(const F32vec4 &a, const F32vec4 &b)
Definition: PSEUDO_F32vec4.h:84

rcp
float rcp(float x)
Definition: PSEUDO_F32vec4.h:126

F32vec4::operator+
friend F32vec4 operator+(const F32vec4 &a, const F32vec4 &b)
Definition: P4_F32vec4.h:55

F32vec4::exp
friend F32vec4 exp(const F32vec4 &a)
Definition: P4_F32vec4.h:153

F32vec4::operator||
friend F32vec4 operator||(const F32vec4 &a, const F32vec4 &b)
Definition: PSEUDO_F32vec4.h:90

F32vec4::rcp
friend F32vec4 rcp(const F32vec4 &a)
Definition: P4_F32vec4.h:76

nsL1::vector::TSimd
std::vector< T > TSimd
Definition: PSEUDO_F32vec4.h:179

F32vec4::operator/
friend F32vec4 operator/(const F32vec4 &a, const F32vec4 &b)
Definition: PSEUDO_F32vec4.h:79

fvec
F32vec4 fvec
Definition: PSEUDO_F32vec4.h:166

F32vec4::asgnb
friend F32vec4 asgnb(const F32vec4 &a, const F32vec4 &b)
Definition: P4_F32vec4.h:87

F32vec4::operator|
friend F32vec4 operator|(const F32vec4 &a, const F32vec4 &b)
Definition: PSEUDO_F32vec4.h:89

F32vec4::if3
friend F32vec4 if3(const F32vec4 &a, const F32vec4 &b, const F32vec4 &c)
Definition: PSEUDO_F32vec4.h:103

F32vec4::operator<
friend F32vec4 operator<(const F32vec4 &a, const F32vec4 &b)
Definition: P4_F32vec4.h:113

F32vec4::bool2int
friend F32vec4 bool2int(const F32vec4 &a)
Definition: PSEUDO_F32vec4.h:118

fscal
float fscal
Definition: PSEUDO_F32vec4.h:169

F32vec4::cos
friend F32vec4 cos(const F32vec4 &a)
Definition: PSEUDO_F32vec4.h:142

F32vec4::operator<=
friend F32vec4 operator<=(const F32vec4 &a, const F32vec4 &b)
Definition: P4_F32vec4.h:117

F32vec4::operator[]
float & operator[](int i)
Definition: PSEUDO_F32vec4.h:26

F32vec4::operator &
friend F32vec4 operator &(const F32vec4 &a, const F32vec4 &b)
Definition: P4_F32vec4.h:91

_f1
#define _f1(A, F)
Definition: PSEUDO_F32vec4.h:58

__attribute__
nsL1vector __attribute__

F32vec4::F32vec4
F32vec4()
Definition: PSEUDO_F32vec4.h:29

F32vec4::fabs
friend F32vec4 fabs(const F32vec4 &a)
Definition: P4_F32vec4.h:83

sgn
float sgn(float x)
Definition: PSEUDO_F32vec4.h:127

nsL1::vector
Definition: PSEUDO_F32vec1.h:143

F32vec4::operator-
friend F32vec4 operator-(const F32vec4 &a, const F32vec4 &b)
Definition: P4_F32vec4.h:56

rsqrt
float rsqrt(float x)
Definition: PSEUDO_F32vec4.h:125

max
float max(float x, float y)
Definition: PSEUDO_F32vec4.h:123

F32vec4::sgn
friend F32vec4 sgn(const F32vec4 &a)
Definition: P4_F32vec4.h:86

F32vec4::min
friend F32vec4 min(const F32vec4 &a, const F32vec4 &b)
Definition: P4_F32vec4.h:61

F32vec4::operator>=
friend F32vec4 operator>=(const F32vec4 &a, const F32vec4 &b)
Definition: PSEUDO_F32vec4.h:85

F32vec4::sqrt
friend F32vec4 sqrt(const F32vec4 &a)
Definition: P4_F32vec4.h:65

F32vec4::operator<<
friend ostream & operator<<(ostream &strm, const F32vec4 &a)
Definition: PSEUDO_F32vec4.h:151

F32vec4::operator*
friend F32vec4 operator*(const F32vec4 &a, const F32vec4 &b)
Definition: PSEUDO_F32vec4.h:78

F32vec4::sin
friend F32vec4 sin(const F32vec4 &a)
Definition: PSEUDO_F32vec4.h:141

nsL1::vector::TStd
std::vector< T > TStd
Definition: PSEUDO_F32vec4.h:178

F32vec4::operator>>
friend istream & operator>>(istream &strm, F32vec4 &a)
Definition: PSEUDO_F32vec4.h:157

F32vec4::v
__m128 v
Definition: P4_F32vec4.h:40

F32vec4::F32vec4
F32vec4(const F32vec4 &a)
Definition: PSEUDO_F32vec4.h:30