api6_1/c++/vectorize__pnacl_8h_source.html

 #ifndef OPENMM_VECTORIZE_PNACL_H_

 #define OPENMM_VECTORIZE_PNACL_H_


 /* -------------------------------------------------------------------------- *

  *                                   OpenMM                                   *

  * -------------------------------------------------------------------------- *

  * This is part of the OpenMM molecular simulation toolkit originating from   *

  * Simbios, the NIH National Center for Physics-Based Simulation of           *

  * Biological Structures at Stanford, funded under the NIH Roadmap for        *

  * Medical Research, grant U54 GM072970. See https://simtk.org.               *

  *                                                                            *

  * Portions copyright (c) 2013-2014 Stanford University and the Authors.      *

  * Authors: Peter Eastman                                                     *

  * Contributors:                                                              *

  *                                                                            *

  * Permission is hereby granted, free of charge, to any person obtaining a    *

  * copy of this software and associated documentation files (the "Software"), *

  * to deal in the Software without restriction, including without limitation  *

  * the rights to use, copy, modify, merge, publish, distribute, sublicense,   *

  * and/or sell copies of the Software, and to permit persons to whom the      *

  * Software is furnished to do so, subject to the following conditions:       *

  *                                                                            *

  * The above copyright notice and this permission notice shall be included in *

  * all copies or substantial portions of the Software.                        *

  *                                                                            *

  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR *

  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,   *

  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL    *

  * THE AUTHORS, CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,    *

  * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR      *

  * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE  *

  * USE OR OTHER DEALINGS IN THE SOFTWARE.                                     *

  * -------------------------------------------------------------------------- */


 #include <algorithm>
 #include <cmath>
 #include <cstdlib>


 // This file defines classes and functions to simplify vectorizing code with portable SIMD vectors.


 /**
  * Report whether four-element SIMD vectors can be used.
  *
  * This implementation unconditionally returns true.  It is declared inline,
  * like the other free functions in this header, so that a translation unit
  * which includes the header without calling it does not end up with an
  * unused static function.
  *
  * @return always true
  */
 static inline bool isVec4Supported() {
     return true;
 }


 // 16-byte vector types built with the compiler's vector extension (the names mirror the
 // SSE intrinsic types).  vector_size(16) makes each type 16 bytes wide and aligned(4)
 // sets its alignment to 4 bytes.
 // NOTE(review): the reduced alignment is presumably what lets fvec4/ivec4 load from and
 // store to ordinary float/int arrays through pointer casts -- confirm.
 typedef float __m128 __attribute__((vector_size(16), aligned(4)));

 typedef int __m128i __attribute__((vector_size(16), aligned(4)));


 // Forward declaration: fvec4 declares a conversion operator to ivec4 before ivec4 is defined.
 class ivec4;


 class fvec4 {

 public:

     __m128 val;


     fvec4() {}

     fvec4(float v) {

         val = {v, v, v, v};

     }

     fvec4(float v1, float v2, float v3, float v4) {

         val = {v1, v2, v3, v4};

     }

     fvec4(__m128 v) : val(v) {}

     fvec4(const float* v) {

         val = *((__m128*) v);

     }

     operator __m128() const {

         return val;

     }

     float operator[](int i) const {

         return val[i];

     }

     void store(float* v) const {

         *((__m128*) v) = val;

     }

     fvec4 operator+(const fvec4& other) const {

         return val+other;

     }

     fvec4 operator-(const fvec4& other) const {

         return val-other;

     }

     fvec4 operator*(const fvec4& other) const {

         return val*other;

     }

     fvec4 operator/(const fvec4& other) const {

         return val/other;

     }

     void operator+=(const fvec4& other) {

         val = val+other;

     }

     void operator-=(const fvec4& other) {

         val = val-other;

     }

     void operator*=(const fvec4& other) {

         val = val*other;

     }

     void operator/=(const fvec4& other) {

         val = val/other;

     }

     fvec4 operator-() const {

         return -val;

     }

     fvec4 operator&(const fvec4& other) const {

         return (fvec4) (((__m128i)val)&((__m128i)other.val));

     }

     fvec4 operator|(const fvec4& other) const {

         return (fvec4) (((__m128i)val)|((__m128i)other.val));

     }

     fvec4 operator==(const fvec4& other) const {

         return (val==other.val);

     }

     fvec4 operator!=(const fvec4& other) const {

         return (val!=other.val);

     }

     fvec4 operator>(const fvec4& other) const {

         return (val>other.val);

     }

     fvec4 operator<(const fvec4& other) const {

         return (val<other.val);

     }

     fvec4 operator>=(const fvec4& other) const {

         return (val>=other.val);

     }

     fvec4 operator<=(const fvec4& other) const {

         return (val<=other.val);

     }

     operator ivec4() const;

 };


 class ivec4 {

 public:

     __m128i val;


     ivec4() {}

     ivec4(int v) {

         val = {v, v, v, v};

     }

     ivec4(int v1, int v2, int v3, int v4) {

         val = {v1, v2, v3, v4};

     }

     ivec4(__m128i v) : val(v) {}

     ivec4(const int* v) {

         val = *((__m128*) v);

     }

     operator __m128i() const {

         return val;

     }

     int operator[](int i) const {

         return val[i];

     }

     void store(int* v) const {

         *((__m128*) v) = val;

     }

     ivec4 operator+(const ivec4& other) const {

         return val+other;

     }

     ivec4 operator-(const ivec4& other) const {

         return val-other;

     }

     ivec4 operator*(const ivec4& other) const {

         return val*other;

     }

     void operator+=(const ivec4& other) {

         val = val+other;

     }

     void operator-=(const ivec4& other) {

         val = val-other;

     }

     void operator*=(const ivec4& other) {

         val = val*other;

     }

     ivec4 operator-() const {

         return -val;

     }

     ivec4 operator&(const ivec4& other) const {

         return val&other.val;

     }

     ivec4 operator|(const ivec4& other) const {

         return val|other.val;

     }

     ivec4 operator==(const ivec4& other) const {

         return (val==other.val);

     }

     ivec4 operator!=(const ivec4& other) const {

         return (val!=other.val);

     }

     ivec4 operator>(const ivec4& other) const {

         return (val>other.val);

     }

     ivec4 operator<(const ivec4& other) const {

         return (val<other.val);

     }

     ivec4 operator>=(const ivec4& other) const {

         return (val>=other.val);

     }

     ivec4 operator<=(const ivec4& other) const {

         return (val<=other.val);

     }

     operator fvec4() const;

 };


 // Conversion operators.


 /**
  * Convert each float element to an int with __builtin_convertvector
  * (a numeric conversion, not a reinterpretation of the bits).
  */
 inline fvec4::operator ivec4() const {
     const __m128i asInts = __builtin_convertvector(val, __m128i);
     return ivec4(asInts);
 }


 /**
  * Convert each int element to a float with __builtin_convertvector
  * (a numeric conversion, not a reinterpretation of the bits).
  */
 inline ivec4::operator fvec4() const {
     const __m128 asFloats = __builtin_convertvector(val, __m128);
     return fvec4(asFloats);
 }


 // Functions that operate on fvec4s.


 /**
  * Apply std::floor to each of the four elements of v.
  */
 static inline fvec4 floor(const fvec4& v) {
     float out[4];
     for (int i = 0; i < 4; i++) {
         out[i] = std::floor(v[i]);
     }
     return fvec4(out[0], out[1], out[2], out[3]);
 }


 /**
  * Apply std::ceil to each of the four elements of v.
  */
 static inline fvec4 ceil(const fvec4& v) {
     float out[4];
     for (int i = 0; i < 4; i++) {
         out[i] = std::ceil(v[i]);
     }
     return fvec4(out[0], out[1], out[2], out[3]);
 }


 /**
  * Apply std::round to each of the four elements of v.
  */
 static inline fvec4 round(const fvec4& v) {
     float out[4];
     for (int i = 0; i < 4; i++) {
         out[i] = std::round(v[i]);
     }
     return fvec4(out[0], out[1], out[2], out[3]);
 }


 /**
  * Element-wise minimum of two float vectors, computed with std::min.
  */
 static inline fvec4 min(const fvec4& v1, const fvec4& v2) {
     const float m0 = std::min(v1[0], v2[0]);
     const float m1 = std::min(v1[1], v2[1]);
     const float m2 = std::min(v1[2], v2[2]);
     const float m3 = std::min(v1[3], v2[3]);
     return fvec4(m0, m1, m2, m3);
 }


 /**
  * Element-wise maximum of two float vectors, computed with std::max.
  */
 static inline fvec4 max(const fvec4& v1, const fvec4& v2) {
     const float m0 = std::max(v1[0], v2[0]);
     const float m1 = std::max(v1[1], v2[1]);
     const float m2 = std::max(v1[2], v2[2]);
     const float m3 = std::max(v1[3], v2[3]);
     return fvec4(m0, m1, m2, m3);
 }


 /**
  * Apply std::abs to each of the four elements of v.
  */
 static inline fvec4 abs(const fvec4& v) {
     float out[4];
     for (int i = 0; i < 4; i++) {
         out[i] = std::abs(v[i]);
     }
     return fvec4(out[0], out[1], out[2], out[3]);
 }


 /**
  * Apply std::sqrt to each of the four elements of v.
  */
 static inline fvec4 sqrt(const fvec4& v) {
     float out[4];
     for (int i = 0; i < 4; i++) {
         out[i] = std::sqrt(v[i]);
     }
     return fvec4(out[0], out[1], out[2], out[3]);
 }


 static inline float dot3(const fvec4& v1, const fvec4& v2) {

     fvec4 r = v1*v2;

     return r[0]+r[1]+r[2];

 }


 static inline float dot4(const fvec4& v1, const fvec4& v2) {

     fvec4 r = v1*v2;

     return r[0]+r[1]+r[2]+r[3];

 }


 /**
  * Transpose, in place, the 4x4 matrix whose rows are v1, v2, v3 and v4.
  * On return v1 holds the first element of each original row, v2 the second,
  * and so on.
  */
 static inline void transpose(fvec4& v1, fvec4& v2, fvec4& v3, fvec4& v4) {
     // Step 1: interleave each pair of rows.  Shuffle indices 0-3 select from
     // the first operand and 4-7 from the second.
     __m128 even12 = __builtin_shufflevector(v1.val, v2.val, 0, 4, 2, 6);
     __m128 odd12 = __builtin_shufflevector(v1.val, v2.val, 1, 5, 3, 7);
     __m128 even34 = __builtin_shufflevector(v3.val, v4.val, 0, 4, 2, 6);
     __m128 odd34 = __builtin_shufflevector(v3.val, v4.val, 1, 5, 3, 7);

     // Step 2: join the low halves and the high halves of the interleaved
     // pairs.  All inputs were read in step 1, so overwriting the rows is safe.
     v1.val = __builtin_shufflevector(even12, even34, 0, 1, 4, 5);
     v2.val = __builtin_shufflevector(odd12, odd34, 0, 1, 4, 5);
     v3.val = __builtin_shufflevector(even12, even34, 2, 3, 6, 7);
     v4.val = __builtin_shufflevector(odd12, odd34, 2, 3, 6, 7);
 }


 // Functions that operate on ivec4s.


 /**
  * Element-wise minimum of two int vectors, computed with std::min.
  */
 static inline ivec4 min(const ivec4& v1, const ivec4& v2) {
     const int m0 = std::min(v1[0], v2[0]);
     const int m1 = std::min(v1[1], v2[1]);
     const int m2 = std::min(v1[2], v2[2]);
     const int m3 = std::min(v1[3], v2[3]);
     return ivec4(m0, m1, m2, m3);
 }


 /**
  * Element-wise maximum of two int vectors, computed with std::max.
  */
 static inline ivec4 max(const ivec4& v1, const ivec4& v2) {
     const int m0 = std::max(v1[0], v2[0]);
     const int m1 = std::max(v1[1], v2[1]);
     const int m2 = std::max(v1[2], v2[2]);
     const int m3 = std::max(v1[3], v2[3]);
     return ivec4(m0, m1, m2, m3);
 }


 /**
  * Apply std::abs to each of the four elements of v.
  *
  * The call is qualified with std:: on purpose.  An unqualified abs(int) is
  * looked up among the overloads in scope here, which include this header's
  * own abs(const fvec4&) and abs(const ivec4&) (both reachable from an int
  * through implicit constructors).  It therefore only resolved to the C
  * library function when <cstdlib> also happened to declare ::abs globally.
  */
 static inline ivec4 abs(const ivec4& v) {
     return ivec4(std::abs(v[0]), std::abs(v[1]), std::abs(v[2]), std::abs(v[3]));
 }


 /**
  * Return true if at least one of the four elements of v is nonzero.
  */
 static inline bool any(const __m128i& v) {
     // OR-ing the elements together is nonzero exactly when some element is nonzero.
     const int combined = v[0] | v[1] | v[2] | v[3];
     return combined != 0;
 }


 // Mathematical operators involving a scalar and a vector.


 /**
  * Add the scalar v1 to every element of v2.
  */
 static inline fvec4 operator+(float v1, const fvec4& v2) {
     const fvec4 broadcast(v1);
     return broadcast+v2;
 }


 /**
  * Subtract every element of v2 from the scalar v1.
  */
 static inline fvec4 operator-(float v1, const fvec4& v2) {
     const fvec4 broadcast(v1);
     return broadcast-v2;
 }


 /**
  * Multiply every element of v2 by the scalar v1.
  */
 static inline fvec4 operator*(float v1, const fvec4& v2) {
     const fvec4 broadcast(v1);
     return broadcast*v2;
 }


 /**
  * Divide the scalar v1 by every element of v2.
  */
 static inline fvec4 operator/(float v1, const fvec4& v2) {
     const fvec4 broadcast(v1);
     return broadcast/v2;
 }


 // Operations for blending fvec4s based on an ivec4.


 /**
  * Build a vector by choosing each element from v1 or v2: element i comes
  * from v2 where mask[i] is nonzero and from v1 where it is zero.
  */
 static inline fvec4 blend(const fvec4& v1, const fvec4& v2, const __m128i& mask) {
     float picked[4];
     for (int i = 0; i < 4; i++) {
         if (mask[i]) {
             picked[i] = v2[i];
         } else {
             picked[i] = v1[i];
         }
     }
     return fvec4(picked[0], picked[1], picked[2], picked[3]);
 }


 #endif /*OPENMM_VECTORIZE_PNACL_H_*/


fvec4::operator>=
fvec4 operator>=(const fvec4 &other) const
Definition: vectorize_pnacl.h:124

fvec4::operator+
fvec4 operator+(const fvec4 &other) const
Definition: vectorize_pnacl.h:79

ivec4
A four element vector of ints.
Definition: vectorize_neon.h:150

ivec4::operator==
ivec4 operator==(const ivec4 &other) const
Definition: vectorize_pnacl.h:187

ivec4::operator[]
int operator[](int i) const
Definition: vectorize_pnacl.h:154

fvec4::operator-
fvec4 operator-(const fvec4 &other) const
Definition: vectorize_pnacl.h:82

fvec4::val
__m128 val
Definition: vectorize_pnacl.h:57

fvec4::operator[]
float operator[](int i) const
Definition: vectorize_pnacl.h:73

ivec4::operator<
ivec4 operator<(const ivec4 &other) const
Definition: vectorize_pnacl.h:196

fvec4::operator<
fvec4 operator<(const fvec4 &other) const
Definition: vectorize_pnacl.h:121

fvec4::fvec4
fvec4(__m128 v)
Definition: vectorize_pnacl.h:66

fvec4::operator/=
void operator/=(const fvec4 &other)
Definition: vectorize_pnacl.h:100

fvec4::operator*=
void operator*=(const fvec4 &other)
Definition: vectorize_pnacl.h:97

fvec4::fvec4
fvec4(const float *v)
Definition: vectorize_pnacl.h:67

ivec4::operator-
ivec4 operator-(const ivec4 &other) const
Definition: vectorize_pnacl.h:163

ivec4::store
void store(int *v) const
Definition: vectorize_pnacl.h:157

ivec4::operator>=
ivec4 operator>=(const ivec4 &other) const
Definition: vectorize_pnacl.h:199

ivec4::ivec4
ivec4(__m128i v)
Definition: vectorize_pnacl.h:147

fvec4
A four element vector of floats.
Definition: vectorize_neon.h:56

ivec4::operator!=
ivec4 operator!=(const ivec4 &other) const
Definition: vectorize_pnacl.h:190

ivec4::ivec4
ivec4(int v1, int v2, int v3, int v4)
Definition: vectorize_pnacl.h:144

ivec4::ivec4
ivec4(const int *v)
Definition: vectorize_pnacl.h:148

fvec4::operator==
fvec4 operator==(const fvec4 &other) const
Definition: vectorize_pnacl.h:112

fvec4::operator<=
fvec4 operator<=(const fvec4 &other) const
Definition: vectorize_pnacl.h:127

fvec4::store
void store(float *v) const
Definition: vectorize_pnacl.h:76

ivec4::operator-=
void operator-=(const ivec4 &other)
Definition: vectorize_pnacl.h:172

ivec4::operator+=
void operator+=(const ivec4 &other)
Definition: vectorize_pnacl.h:169

ivec4::operator+
ivec4 operator+(const ivec4 &other) const
Definition: vectorize_pnacl.h:160

fvec4::fvec4
fvec4()
Definition: vectorize_pnacl.h:59

ivec4::operator-
ivec4 operator-() const
Definition: vectorize_pnacl.h:178

fvec4::operator/
fvec4 operator/(const fvec4 &other) const
Definition: vectorize_pnacl.h:88

ivec4::operator|
ivec4 operator|(const ivec4 &other) const
Definition: vectorize_pnacl.h:184

fvec4::operator!=
fvec4 operator!=(const fvec4 &other) const
Definition: vectorize_pnacl.h:115

ivec4::operator>
ivec4 operator>(const ivec4 &other) const
Definition: vectorize_pnacl.h:193

ivec4::ivec4
ivec4()
Definition: vectorize_pnacl.h:140

fvec4::operator-=
void operator-=(const fvec4 &other)
Definition: vectorize_pnacl.h:94

fvec4::operator&
fvec4 operator&(const fvec4 &other) const
Definition: vectorize_pnacl.h:106

fvec4::operator*
fvec4 operator*(const fvec4 &other) const
Definition: vectorize_pnacl.h:85

fvec4::fvec4
fvec4(float v1, float v2, float v3, float v4)
Definition: vectorize_pnacl.h:63

fvec4::operator|
fvec4 operator|(const fvec4 &other) const
Definition: vectorize_pnacl.h:109

fvec4::fvec4
fvec4(float v)
Definition: vectorize_pnacl.h:60

fvec4::operator>
fvec4 operator>(const fvec4 &other) const
Definition: vectorize_pnacl.h:118

fvec4::operator-
fvec4 operator-() const
Definition: vectorize_pnacl.h:103

fvec4::operator+=
void operator+=(const fvec4 &other)
Definition: vectorize_pnacl.h:91

ivec4::ivec4
ivec4(int v)
Definition: vectorize_pnacl.h:141

ivec4::operator*
ivec4 operator*(const ivec4 &other) const
Definition: vectorize_pnacl.h:166

ivec4::operator<=
ivec4 operator<=(const ivec4 &other) const
Definition: vectorize_pnacl.h:202

ivec4::operator&
ivec4 operator&(const ivec4 &other) const
Definition: vectorize_pnacl.h:181

ivec4::operator*=
void operator*=(const ivec4 &other)
Definition: vectorize_pnacl.h:175

ivec4::val
__m128i val
Definition: vectorize_pnacl.h:138