NTrace/_math_8hpp_source.html

 /*

  *  Copyright (c) 2009-2011, NVIDIA Corporation

  *  All rights reserved.

  *

  *  Redistribution and use in source and binary forms, with or without

  *  modification, are permitted provided that the following conditions are met:

  *      * Redistributions of source code must retain the above copyright

  *        notice, this list of conditions and the following disclaimer.

  *      * Redistributions in binary form must reproduce the above copyright

  *        notice, this list of conditions and the following disclaimer in the

  *        documentation and/or other materials provided with the distribution.

  *      * Neither the name of NVIDIA Corporation nor the

  *        names of its contributors may be used to endorse or promote products

  *        derived from this software without specific prior written permission.

  *

  *  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND

  *  ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED

  *  WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE

  *  DISCLAIMED. IN NO EVENT SHALL <COPYRIGHT HOLDER> BE LIABLE FOR ANY

  *  DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES

  *  (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

  *  LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND

  *  ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

  *  (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS

  *  SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

  */


 #pragma once

 #include "base/DLLImports.hpp"


 #include <math.h>

 #include <vector_types.h>

 #include <stdio.h>


 namespace FW

 {

 //------------------------------------------------------------------------


 // Square root; each overload forwards to the C library routine for its type.
 FW_CUDA_FUNC F32 sqrt(F32 a)
 {
     return ::sqrtf(a);
 }

 FW_CUDA_FUNC F64 sqrt(F64 a)
 {
     return ::sqrt(a);
 }

 // Absolute value of an integer, computed inline: negative inputs are negated.
 FW_CUDA_FUNC S32 abs(S32 a)
 {
     if (a < 0)
         return -a;
     return a;
 }

 FW_CUDA_FUNC S64 abs(S64 a)
 {
     if (a < 0)
         return -a;
     return a;
 }

 // Absolute value of an F32, forwarded to ::fabsf.
 FW_CUDA_FUNC F32 abs(F32 a)
 {
     return ::fabsf(a);
 }

 // Absolute value of an F64. Calls ::fabs rather than ::abs: this header only
 // includes <math.h>, and on some toolchains ::abs then resolves to the integer
 // abs(int), which would silently truncate the argument.
 FW_CUDA_FUNC F64    abs             (F64 a)         { return ::fabs(a); }

 // F64 wrappers: each forwards to the global C math function of the same name.
 FW_CUDA_FUNC F64 pow(F64 a, F64 b)
 {
     return ::pow(a, b);
 }

 FW_CUDA_FUNC F64 exp(F64 a)
 {
     return ::exp(a);
 }

 FW_CUDA_FUNC F64 log(F64 a)
 {
     return ::log(a);
 }

 FW_CUDA_FUNC F64 sin(F64 a)
 {
     return ::sin(a);
 }

 FW_CUDA_FUNC F64 cos(F64 a)
 {
     return ::cos(a);
 }

 FW_CUDA_FUNC F64 tan(F64 a)
 {
     return ::tan(a);
 }

 // Inverse trigonometric functions; the F32 overloads use the f-suffixed C routines.
 FW_CUDA_FUNC F32 asin(F32 a)
 {
     return ::asinf(a);
 }

 FW_CUDA_FUNC F64 asin(F64 a)
 {
     return ::asin(a);
 }

 FW_CUDA_FUNC F32 acos(F32 a)
 {
     return ::acosf(a);
 }

 FW_CUDA_FUNC F64 acos(F64 a)
 {
     return ::acos(a);
 }

 FW_CUDA_FUNC F32 atan(F32 a)
 {
     return ::atanf(a);
 }

 FW_CUDA_FUNC F64 atan(F64 a)
 {
     return ::atan(a);
 }

 // Two-argument arctangent; arguments are passed through in (y, x) order.
 FW_CUDA_FUNC F64 atan2(F64 y, F64 x)
 {
     return ::atan2(y, x);
 }

 FW_CUDA_FUNC F32 atan2(F32 y, F32 x)
 {
     return ::atan2f(y, x);
 }

 // Rounding toward negative / positive infinity via ::floor(f) and ::ceil(f).
 FW_CUDA_FUNC F32 floor(F32 a)
 {
     return ::floorf(a);
 }

 FW_CUDA_FUNC F64 floor(F64 a)
 {
     return ::floor(a);
 }

 FW_CUDA_FUNC F32 ceil(F32 a)
 {
     return ::ceilf(a);
 }

 FW_CUDA_FUNC F64 ceil(F64 a)
 {
     return ::ceil(a);
 }

 // Reinterprets the storage of an F64 as a U64 (no numeric conversion).
 // NOTE(review): this reads the value through a pointer of a different type;
 // confirm the build does not rely on strict-aliasing optimizations.
 FW_CUDA_FUNC U64 doubleToBits(F64 a)
 {
     U64* bits = (U64*)&a;
     return *bits;
 }

 // Inverse of doubleToBits: reinterprets the storage of a U64 as an F64.
 FW_CUDA_FUNC F64 bitsToDouble(U64 a)
 {
     F64* value = (F64*)&a;
     return *value;
 }


 #if FW_CUDA

 // Variants compiled when FW_CUDA is set. The F32 pow/exp/log/log2/sin/cos/tan
 // overloads forward to the double-underscore routines (__powf, __expf, ...).
 FW_CUDA_FUNC F32 pow(F32 a, F32 b)
 {
     return ::__powf(a, b);
 }

 FW_CUDA_FUNC F32 exp(F32 a)
 {
     return ::__expf(a);
 }

 FW_CUDA_FUNC F32 exp2(F32 a)
 {
     return ::exp2f(a);
 }

 FW_CUDA_FUNC F64 exp2(F64 a)
 {
     return ::exp2(a);
 }

 FW_CUDA_FUNC F32 log(F32 a)
 {
     return ::__logf(a);
 }

 FW_CUDA_FUNC F32 log2(F32 a)
 {
     return ::__log2f(a);
 }

 FW_CUDA_FUNC F64 log2(F64 a)
 {
     return ::log2(a);
 }

 FW_CUDA_FUNC F32 sin(F32 a)
 {
     return ::__sinf(a);
 }

 FW_CUDA_FUNC F32 cos(F32 a)
 {
     return ::__cosf(a);
 }

 FW_CUDA_FUNC F32 tan(F32 a)
 {
     return ::__tanf(a);
 }

 // Bit-level reinterpretation between F32 and U32 via __float_as_int / __int_as_float.
 FW_CUDA_FUNC U32 floatToBits(F32 a)
 {
     return ::__float_as_int(a);
 }

 FW_CUDA_FUNC F32 bitsToFloat(U32 a)
 {
     return ::__int_as_float(a);
 }

 // Power of two for an integer exponent: the exponent is converted to F32 first.
 FW_CUDA_FUNC F32 exp2(int a)
 {
     return ::exp2f((F32)a);
 }

 // Minimum / maximum, forwarded to fminf/fmaxf (F32) and fmin/fmax (F64).
 FW_CUDA_FUNC F32 fastMin(F32 a, F32 b)
 {
     return ::fminf(a, b);
 }

 FW_CUDA_FUNC F32 fastMax(F32 a, F32 b)
 {
     return ::fmaxf(a, b);
 }

 FW_CUDA_FUNC F64 fastMin(F64 a, F64 b)
 {
     return ::fmin(a, b);
 }

 FW_CUDA_FUNC F64 fastMax(F64 a, F64 b)
 {
     return ::fmax(a, b);
 }

 #else

 // Variants compiled when FW_CUDA is not set; built on the C math library.
 inline F32 pow(F32 a, F32 b)
 {
     return ::powf(a, b);
 }

 inline F32 exp(F32 a)
 {
     return ::expf(a);
 }

 // 2^a, expressed as pow with base two.
 inline F32 exp2(F32 a)
 {
     return ::powf(2.0f, a);
 }

 inline F64 exp2(F64 a)
 {
     return ::pow(2.0, a);
 }

 inline F32 log(F32 a)
 {
     return ::logf(a);
 }

 // Base-two logarithm: natural log of a divided by natural log of two.
 inline F32 log2(F32 a)
 {
     const F32 numerator = ::logf(a);
     const F32 denominator = ::logf(2.0f);
     return numerator / denominator;
 }

 inline F64 log2(F64 a)
 {
     const F64 numerator = ::log(a);
     const F64 denominator = ::log(2.0);
     return numerator / denominator;
 }

 inline F32 sin(F32 a)
 {
     return ::sinf(a);
 }

 inline F32 cos(F32 a)
 {
     return ::cosf(a);
 }

 inline F32 tan(F32 a)
 {
     return ::tanf(a);
 }

 // Reinterprets the storage of an F32 as a U32 (no numeric conversion).
 inline U32 floatToBits(F32 a)
 {
     U32* bits = (U32*)&a;
     return *bits;
 }

 // Reinterprets the storage of a U32 as an F32 (no numeric conversion).
 inline F32 bitsToFloat(U32 a)
 {
     F32* value = (F32*)&a;
     return *value;
 }

 // Power of two for an integer exponent, assembled as a bit pattern: a + 127 is
 // clamped to [1, 254], shifted left by 23 and reinterpreted as an F32.
 // NOTE(review): presumably this fills the exponent field of an IEEE-754 single -- confirm.
 inline F32 exp2(int a)
 {
     return bitsToFloat(clamp(a + 127, 1, 254) << 23);
 }

 // Branch-free minimum / maximum: half of (a + b) minus / plus |a - b|.
 inline F32 fastMin(F32 a, F32 b)
 {
     const F32 spread = abs(a - b);
     return (a + b - spread) * 0.5f;
 }

 inline F32 fastMax(F32 a, F32 b)
 {
     const F32 spread = abs(a - b);
     return (a + b + spread) * 0.5f;
 }

 inline F64 fastMin(F64 a, F64 b)
 {
     const F64 spread = abs(a - b);
     return (a + b - spread) * 0.5f;
 }

 inline F64 fastMax(F64 a, F64 b)
 {
     const F64 spread = abs(a - b);
     return (a + b + spread) * 0.5f;
 }

 #endif


 // Multiplies a by two raised to the integer power b.
 FW_CUDA_FUNC F32 scale(F32 a, int b)
 {
     const F32 factor = exp2(b);
     return a * factor;
 }

 // Declarations only; the definitions are not in this part of the file.
 // NOTE(review): presumably popcN returns the number of set bits among the low
 // N bits of mask -- confirm against the definitions.
 FW_CUDA_FUNC int    popc8           (U32 mask);

 FW_CUDA_FUNC int    popc16          (U32 mask);

 FW_CUDA_FUNC int    popc32          (U32 mask);

 FW_CUDA_FUNC int    popc64          (U64 mask);


 // Clamps v into [lo, hi]: first raises it to at least lo with fastMax, then
 // limits the result to at most hi with fastMin.
 FW_CUDA_FUNC F32 fastClamp(F32 v, F32 lo, F32 hi)
 {
     const F32 raised = fastMax(v, lo);
     return fastMin(raised, hi);
 }

 FW_CUDA_FUNC F64 fastClamp(F64 v, F64 lo, F64 hi)
 {
     const F64 raised = fastMax(v, lo);
     return fastMin(raised, hi);
 }


 // Square of a.
 template <class T> FW_CUDA_FUNC T sqr(const T& a)
 {
     return a * a;
 }

 // Reciprocal of a, with the convention that a value testing false (zero) maps to zero
 // instead of dividing by it.
 template <class T> FW_CUDA_FUNC T rcp(const T& a)
 {
     if (a)
         return (T)1 / a;
     return (T)0;
 }

 // Linear interpolation: a weighted by (1 - t) plus b weighted by t, cast back to A.
 template <class A, class B> FW_CUDA_FUNC A lerp(const A& a, const A& b, const B& t)
 {
     return (A)(a * ((B)1 - t) + b * t);
 }


 //------------------------------------------------------------------------


 template <class T, int L> class Vector;

 // CRTP base shared by the vector classes. T is the component type, L the number
 // of components and S the concrete vector class deriving from this base.
 // S must provide getPtr(); every operation here reaches the L components
 // through it. Functions returning S build the result component by component.
 template <class T, int L, class S> class VectorBase
 {
 public:
     FW_CUDA_FUNC                    VectorBase  (void)                      {}

     // Component access. getPtr() is forwarded to S; get() asserts 0 <= idx < L.
     FW_CUDA_FUNC    const T*        getPtr      (void) const                { return ((S*)this)->getPtr(); }
     FW_CUDA_FUNC    T*              getPtr      (void)                      { return ((S*)this)->getPtr(); }
     FW_CUDA_FUNC    const T&        get         (int idx) const             { FW_ASSERT(idx >= 0 && idx < L); return getPtr()[idx]; }
     FW_CUDA_FUNC    T&              get         (int idx)                   { FW_ASSERT(idx >= 0 && idx < L); return getPtr()[idx]; }
     // Stores a at idx and returns the value that was there before.
     FW_CUDA_FUNC    T               set         (int idx, const T& a)       { T& slot = get(idx); T old = slot; slot = a; return old; }

     // Bulk assignment: from one value for all components, or from an array of L values (asserted non-null).
     FW_CUDA_FUNC    void            set         (const T& a)                { T* tp = getPtr(); for (int i = 0; i < L; i++) tp[i] = a; }
     FW_CUDA_FUNC    void            set         (const T* ptr)              { FW_ASSERT(ptr); T* tp = getPtr(); for (int i = 0; i < L; i++) tp[i] = ptr[i]; }
     FW_CUDA_FUNC    void            setZero     (void)                      { set((T)0); }

 #if !FW_CUDA
     // Prints every component with "%g", one per line.
                     void            print       (void) const                { const T* tp = getPtr(); for (int i = 0; i < L; i++) printf("%g\n", (F64)tp[i]); }

     // Formats the vector as "( a , b , ... )" with two decimals into vec, a buffer of s characters.
     // Each sprintf_s call is given only the space remaining behind the text already
     // written; formatting stops as soon as a call reports failure (negative return).
                     void            sprint      (char* vec, size_t s) const
     {
         size_t pos = 0;
         int written = sprintf_s(vec, s, "( ");
         if (written < 0)
             return;
         pos += (size_t)written;

         for (int i = 0; i < L-1; i++)
         {
             written = sprintf_s(vec + pos, s - pos, "%.2f , ", (F64)get(i));
             if (written < 0)
                 return;
             pos += (size_t)written;
         }

         sprintf_s(vec + pos, s - pos, "%.2f )", (F64)get(L-1));
     }
 #endif

     // Reductions over the components.
     FW_CUDA_FUNC    bool            isZero      (void) const                { const T* tp = getPtr(); for (int i = 0; i < L; i++) if (tp[i] != (T)0) return false; return true; }
     FW_CUDA_FUNC    T               lenSqr      (void) const                { const T* tp = getPtr(); T r = (T)0; for (int i = 0; i < L; i++) r += sqr(tp[i]); return r; }
     FW_CUDA_FUNC    T               length      (void) const                { return sqrt(lenSqr()); }
     // Scales the vector by len * rcp(length()), i.e. to length len.
     FW_CUDA_FUNC    S               normalized  (T len = (T)1) const        { return operator*(len * rcp(length())); }
     FW_CUDA_FUNC    void            normalize   (T len = (T)1)              { set(normalized(len)); }
     FW_CUDA_FUNC    T               min         (void) const                { const T* tp = getPtr(); T r = tp[0]; for (int i = 1; i < L; i++) r = FW::min(r, tp[i]); return r; }
     FW_CUDA_FUNC    T               max         (void) const                { const T* tp = getPtr(); T r = tp[0]; for (int i = 1; i < L; i++) r = FW::max(r, tp[i]); return r; }
     FW_CUDA_FUNC    T               sum         (void) const                { const T* tp = getPtr(); T r = tp[0]; for (int i = 1; i < L; i++) r += tp[i]; return r; }
     // Component-wise absolute value.
     FW_CUDA_FUNC    S               abs         (void) const                { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = FW::abs(tp[i]); return r; }

     // toHomogeneous appends a component equal to one; toCartesian multiplies the
     // first L-1 components by rcp() of the last one and drops it.
     FW_CUDA_FUNC    Vector<T, L + 1> toHomogeneous(void) const              { const T* tp = getPtr(); Vector<T, L + 1> r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i]; rp[L] = (T)1; return r; }
     FW_CUDA_FUNC    Vector<T, L - 1> toCartesian(void) const                { const T* tp = getPtr(); Vector<T, L - 1> r; T* rp = r.getPtr(); T c = rcp(tp[L - 1]); for (int i = 0; i < L - 1; i++) rp[i] = tp[i] * c; return r; }

     FW_CUDA_FUNC    const T&        operator[]  (int idx) const             { return get(idx); }
     FW_CUDA_FUNC    T&              operator[]  (int idx)                   { return get(idx); }

     // Compound assignment with a scalar: applies the matching binary operator and stores the result.
     FW_CUDA_FUNC    S&              operator=   (const T& a)                { set(a); return *(S*)this; }
     FW_CUDA_FUNC    S&              operator+=  (const T& a)                { set(operator+(a)); return *(S*)this; }
     FW_CUDA_FUNC    S&              operator-=  (const T& a)                { set(operator-(a)); return *(S*)this; }
     FW_CUDA_FUNC    S&              operator*=  (const T& a)                { set(operator*(a)); return *(S*)this; }
     FW_CUDA_FUNC    S&              operator/=  (const T& a)                { set(operator/(a)); return *(S*)this; }
     FW_CUDA_FUNC    S&              operator%=  (const T& a)                { set(operator%(a)); return *(S*)this; }
     FW_CUDA_FUNC    S&              operator&=  (const T& a)                { set(operator&(a)); return *(S*)this; }
     FW_CUDA_FUNC    S&              operator|=  (const T& a)                { set(operator|(a)); return *(S*)this; }
     FW_CUDA_FUNC    S&              operator^=  (const T& a)                { set(operator^(a)); return *(S*)this; }
     FW_CUDA_FUNC    S&              operator<<= (const T& a)                { set(operator<<(a)); return *(S*)this; }
     FW_CUDA_FUNC    S&              operator>>= (const T& a)                { set(operator>>(a)); return *(S*)this; }

     // Unary operators, applied per component.
     FW_CUDA_FUNC    S               operator+   (void) const                { return *this; }
     FW_CUDA_FUNC    S               operator-   (void) const                { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = -tp[i]; return r; }
     FW_CUDA_FUNC    S               operator~   (void) const                { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = ~tp[i]; return r; }

     // Binary operators with a scalar on the right-hand side, applied per component.
     FW_CUDA_FUNC    S               operator+   (const T& a) const          { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] + a; return r; }
     FW_CUDA_FUNC    S               operator-   (const T& a) const          { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] - a; return r; }
     FW_CUDA_FUNC    S               operator*   (const T& a) const          { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] * a; return r; }
     FW_CUDA_FUNC    S               operator/   (const T& a) const          { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] / a; return r; }
     FW_CUDA_FUNC    S               operator%   (const T& a) const          { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] % a; return r; }
     FW_CUDA_FUNC    S               operator&   (const T& a) const          { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] & a; return r; }
     FW_CUDA_FUNC    S               operator|   (const T& a) const          { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] | a; return r; }
     FW_CUDA_FUNC    S               operator^   (const T& a) const          { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] ^ a; return r; }
     FW_CUDA_FUNC    S               operator<<  (const T& a) const          { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] << a; return r; }
     FW_CUDA_FUNC    S               operator>>  (const T& a) const          { const T* tp = getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] >> a; return r; }

     // Operations taking another vector with the same T and L (any concrete class V).
     template <class V> FW_CUDA_FUNC void    set         (const VectorBase<T, L, V>& v)          { set(v.getPtr()); }
     template <class V> FW_CUDA_FUNC T       dot         (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); T r = (T)0; for (int i = 0; i < L; i++) r += tp[i] * vp[i]; return r; }
     template <class V> FW_CUDA_FUNC S       min         (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = FW::min(tp[i], vp[i]); return r; }
     template <class V> FW_CUDA_FUNC S       max         (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = FW::max(tp[i], vp[i]); return r; }
     template <class V, class W> FW_CUDA_FUNC S clamp    (const VectorBase<T, L, V>& lo, const VectorBase<T, L, W>& hi) const { const T* tp = getPtr(); const T* lop = lo.getPtr(); const T* hip = hi.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = FW::clamp(tp[i], lop[i], hip[i]); return r; }

     // Compound assignment with a vector: applies the matching binary operator and stores the result.
     template <class V> FW_CUDA_FUNC S&      operator=   (const VectorBase<T, L, V>& v)          { set(v); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S&      operator+=  (const VectorBase<T, L, V>& v)          { set(operator+(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S&      operator-=  (const VectorBase<T, L, V>& v)          { set(operator-(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S&      operator*=  (const VectorBase<T, L, V>& v)          { set(operator*(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S&      operator/=  (const VectorBase<T, L, V>& v)          { set(operator/(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S&      operator%=  (const VectorBase<T, L, V>& v)          { set(operator%(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S&      operator&=  (const VectorBase<T, L, V>& v)          { set(operator&(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S&      operator|=  (const VectorBase<T, L, V>& v)          { set(operator|(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S&      operator^=  (const VectorBase<T, L, V>& v)          { set(operator^(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S&      operator<<= (const VectorBase<T, L, V>& v)          { set(operator<<(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S&      operator>>= (const VectorBase<T, L, V>& v)          { set(operator>>(v)); return *(S*)this; }

     // Binary operators with a vector on the right-hand side, applied per component.
     template <class V> FW_CUDA_FUNC S       operator+   (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] +  vp[i]; return r; }
     template <class V> FW_CUDA_FUNC S       operator-   (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] -  vp[i]; return r; }
     template <class V> FW_CUDA_FUNC S       operator*   (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] *  vp[i]; return r; }
     template <class V> FW_CUDA_FUNC S       operator/   (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] /  vp[i]; return r; }
     template <class V> FW_CUDA_FUNC S       operator%   (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] %  vp[i]; return r; }
     template <class V> FW_CUDA_FUNC S       operator&   (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] &  vp[i]; return r; }
     template <class V> FW_CUDA_FUNC S       operator|   (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] |  vp[i]; return r; }
     template <class V> FW_CUDA_FUNC S       operator^   (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] ^  vp[i]; return r; }
     template <class V> FW_CUDA_FUNC S       operator<<  (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] << vp[i]; return r; }
     template <class V> FW_CUDA_FUNC S       operator>>  (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); S r; T* rp = r.getPtr(); for (int i = 0; i < L; i++) rp[i] = tp[i] >> vp[i]; return r; }

     // Exact component-wise equality.
     template <class V> FW_CUDA_FUNC bool    operator==  (const VectorBase<T, L, V>& v) const    { const T* tp = getPtr(); const T* vp = v.getPtr(); for (int i = 0; i < L; i++) if (tp[i] != vp[i]) return false; return true; }
     template <class V> FW_CUDA_FUNC bool    operator!=  (const VectorBase<T, L, V>& v) const    { return (!operator==(v)); }
 };


 //------------------------------------------------------------------------


 // Generic vector of L components of type T, stored in a member array.
 // Inherited members are called through this-> because the base class depends
 // on the template parameters: unqualified names are not looked up in a
 // dependent base class, so plain setZero()/set() only compiles on compilers
 // that skip two-phase name lookup.
 template <class T, int L> class Vector : public VectorBase<T, L, Vector<T, L> >
 {
 public:
     // Default: all components zero. Single value: every component set to a.
     FW_CUDA_FUNC                    Vector      (void)                      { this->setZero(); }
     FW_CUDA_FUNC                    Vector      (T a)                       { this->set(a); }

     // Storage accessors used by VectorBase.
     FW_CUDA_FUNC    const T*        getPtr      (void) const                { return m_values; }
     FW_CUDA_FUNC    T*              getPtr      (void)                      { return m_values; }
     // Builds a vector from an array of L values.
     static FW_CUDA_FUNC Vector      fromPtr     (const T* ptr)              { Vector v; v.set(ptr); return v; }

     // Copy from any vector class with the same T and L.
     template <class V> FW_CUDA_FUNC Vector(const VectorBase<T, L, V>& v) { this->set(v); }
     template <class V> FW_CUDA_FUNC Vector& operator=(const VectorBase<T, L, V>& v) { this->set(v); return *this; }

 private:
     T               m_values[L];
 };


 //------------------------------------------------------------------------


 // Two-component S32 vector. The x/y fields are inherited from int2 and the
 // generic operations from VectorBase, which reaches the components via getPtr().
 class Vec2i : public VectorBase<S32, 2, Vec2i>, public int2
 {
 public:
     // All components zero.
     FW_CUDA_FUNC Vec2i(void)
     {
         x = 0;
         y = 0;
     }

     // Both components set to a.
     FW_CUDA_FUNC Vec2i(S32 a)
     {
         x = a;
         y = a;
     }

     FW_CUDA_FUNC Vec2i(S32 xx, S32 yy)
     {
         x = xx;
         y = yy;
     }

     // Address of the first component.
     FW_CUDA_FUNC const S32* getPtr(void) const { return &x; }
     FW_CUDA_FUNC S32*       getPtr(void)       { return &x; }

     // Builds a vector from ptr[0] and ptr[1].
     static FW_CUDA_FUNC Vec2i fromPtr(const S32* ptr)
     {
         const S32 first = ptr[0];
         const S32 second = ptr[1];
         return Vec2i(first, second);
     }

     // Returns (-y, x).
     FW_CUDA_FUNC Vec2i perpendicular(void) const
     {
         Vec2i result(-y, x);
         return result;
     }

     // Copy from any S32 vector class with two components.
     template <class V> FW_CUDA_FUNC Vec2i(const VectorBase<S32, 2, V>& v)
     {
         set(v);
     }

     template <class V> FW_CUDA_FUNC Vec2i& operator=(const VectorBase<S32, 2, V>& v)
     {
         set(v);
         return *this;
     }
 };


 //------------------------------------------------------------------------


 // Three-component S32 vector. The x/y/z fields are inherited from int3 and the
 // generic operations from VectorBase, which reaches the components via getPtr().
 class Vec3i : public VectorBase<S32, 3, Vec3i>, public int3
 {
 public:
     // All components zero.
     FW_CUDA_FUNC Vec3i(void)
     {
         x = 0;
         y = 0;
         z = 0;
     }

     // Every component set to a.
     FW_CUDA_FUNC Vec3i(S32 a)
     {
         x = a;
         y = a;
         z = a;
     }

     FW_CUDA_FUNC Vec3i(S32 xx, S32 yy, S32 zz)
     {
         x = xx;
         y = yy;
         z = zz;
     }

     // x and y taken from xy, z given separately.
     FW_CUDA_FUNC Vec3i(const Vec2i& xy, S32 zz)
     {
         x = xy.x;
         y = xy.y;
         z = zz;
     }

     // Address of the first component.
     FW_CUDA_FUNC const S32* getPtr(void) const { return &x; }
     FW_CUDA_FUNC S32*       getPtr(void)       { return &x; }

     // Builds a vector from ptr[0..2].
     static FW_CUDA_FUNC Vec3i fromPtr(const S32* ptr)
     {
         const S32 first = ptr[0];
         const S32 second = ptr[1];
         const S32 third = ptr[2];
         return Vec3i(first, second, third);
     }

     // The first two components as a Vec2i.
     FW_CUDA_FUNC Vec2i getXY(void) const
     {
         Vec2i result(x, y);
         return result;
     }

     // Copy from any S32 vector class with three components.
     template <class V> FW_CUDA_FUNC Vec3i(const VectorBase<S32, 3, V>& v)
     {
         set(v);
     }

     template <class V> FW_CUDA_FUNC Vec3i& operator=(const VectorBase<S32, 3, V>& v)
     {
         set(v);
         return *this;
     }
 };


 //------------------------------------------------------------------------


 // Four-component S32 vector. The x/y/z/w fields are inherited from int4 and the
 // generic operations from VectorBase, which reaches the components via getPtr().
 class Vec4i : public VectorBase<S32, 4, Vec4i>, public int4
 {
 public:
     // All components zero.
     FW_CUDA_FUNC Vec4i(void)
     {
         x = 0;
         y = 0;
         z = 0;
         w = 0;
     }

     // Every component set to a.
     FW_CUDA_FUNC Vec4i(S32 a)
     {
         x = a;
         y = a;
         z = a;
         w = a;
     }

     FW_CUDA_FUNC Vec4i(S32 xx, S32 yy, S32 zz, S32 ww)
     {
         x = xx;
         y = yy;
         z = zz;
         w = ww;
     }

     // Composition from smaller vectors plus the remaining components.
     FW_CUDA_FUNC Vec4i(const Vec2i& xy, S32 zz, S32 ww)
     {
         x = xy.x;
         y = xy.y;
         z = zz;
         w = ww;
     }

     FW_CUDA_FUNC Vec4i(const Vec3i& xyz, S32 ww)
     {
         x = xyz.x;
         y = xyz.y;
         z = xyz.z;
         w = ww;
     }

     FW_CUDA_FUNC Vec4i(const Vec2i& xy, const Vec2i& zw)
     {
         x = xy.x;
         y = xy.y;
         z = zw.x;
         w = zw.y;
     }

     // Address of the first component.
     FW_CUDA_FUNC const S32* getPtr(void) const { return &x; }
     FW_CUDA_FUNC S32*       getPtr(void)       { return &x; }

     // Builds a vector from ptr[0..3].
     static FW_CUDA_FUNC Vec4i fromPtr(const S32* ptr)
     {
         const S32 first = ptr[0];
         const S32 second = ptr[1];
         const S32 third = ptr[2];
         const S32 fourth = ptr[3];
         return Vec4i(first, second, third, fourth);
     }

     // Sub-vectors built from the named components.
     FW_CUDA_FUNC Vec2i getXY(void) const
     {
         Vec2i result(x, y);
         return result;
     }

     FW_CUDA_FUNC Vec3i getXYZ(void) const
     {
         Vec3i result(x, y, z);
         return result;
     }

     FW_CUDA_FUNC Vec3i getXYW(void) const
     {
         Vec3i result(x, y, w);
         return result;
     }

     // Copy from any S32 vector class with four components.
     template <class V> FW_CUDA_FUNC Vec4i(const VectorBase<S32, 4, V>& v)
     {
         set(v);
     }

     template <class V> FW_CUDA_FUNC Vec4i& operator=(const VectorBase<S32, 4, V>& v)
     {
         set(v);
         return *this;
     }
 };


 //------------------------------------------------------------------------


 // Two-component F32 vector. The x/y fields are inherited from float2 and the
 // generic operations from VectorBase, which reaches the components via getPtr().
 class Vec2f : public VectorBase<F32, 2, Vec2f>, public float2
 {
 public:
     // All components zero.
     FW_CUDA_FUNC Vec2f(void)
     {
         x = (F32)0;
         y = (F32)0;
     }

     // Both components set to a.
     FW_CUDA_FUNC Vec2f(F32 a)
     {
         x = a;
         y = a;
     }

     FW_CUDA_FUNC Vec2f(F32 xx, F32 yy)
     {
         x = xx;
         y = yy;
     }

     // Conversion from the integer vector, component by component.
     FW_CUDA_FUNC Vec2f(const Vec2i& v)
     {
         x = (F32)v.x;
         y = (F32)v.y;
     }

     // Address of the first component.
     FW_CUDA_FUNC const F32* getPtr(void) const { return &x; }
     FW_CUDA_FUNC F32*       getPtr(void)       { return &x; }

     // Builds a vector from ptr[0] and ptr[1].
     static FW_CUDA_FUNC Vec2f fromPtr(const F32* ptr)
     {
         const F32 first = ptr[0];
         const F32 second = ptr[1];
         return Vec2f(first, second);
     }

     // Conversion to the integer vector; each component is cast to S32.
     FW_CUDA_FUNC operator Vec2i(void) const
     {
         const S32 ix = (S32)x;
         const S32 iy = (S32)y;
         return Vec2i(ix, iy);
     }

     // Returns (-y, x).
     FW_CUDA_FUNC Vec2f perpendicular(void) const
     {
         Vec2f result(-y, x);
         return result;
     }

     // Scalar 2D cross product: x * v.y - y * v.x.
     FW_CUDA_FUNC F32 cross(const Vec2f& v) const
     {
         return x * v.y - y * v.x;
     }

     // Copy from any F32 vector class with two components.
     template <class V> FW_CUDA_FUNC Vec2f(const VectorBase<F32, 2, V>& v)
     {
         set(v);
     }

     template <class V> FW_CUDA_FUNC Vec2f& operator=(const VectorBase<F32, 2, V>& v)
     {
         set(v);
         return *this;
     }
 };


 //------------------------------------------------------------------------


 // Three-component F32 vector. The x/y/z fields are inherited from float3 and the
 // generic operations from VectorBase, which reaches the components via getPtr().
 class Vec3f : public VectorBase<F32, 3, Vec3f>, public float3
 {
 public:
     // All components zero.
     FW_CUDA_FUNC Vec3f(void)
     {
         x = (F32)0;
         y = (F32)0;
         z = (F32)0;
     }

     // Every component set to a.
     FW_CUDA_FUNC Vec3f(F32 a)
     {
         x = a;
         y = a;
         z = a;
     }

     FW_CUDA_FUNC Vec3f(F32 xx, F32 yy, F32 zz)
     {
         x = xx;
         y = yy;
         z = zz;
     }

     // x and y taken from xy, z given separately.
     FW_CUDA_FUNC Vec3f(const Vec2f& xy, F32 zz)
     {
         x = xy.x;
         y = xy.y;
         z = zz;
     }

     // Conversion from the integer vector, component by component.
     FW_CUDA_FUNC Vec3f(const Vec3i& v)
     {
         x = (F32)v.x;
         y = (F32)v.y;
         z = (F32)v.z;
     }

     // Address of the first component.
     FW_CUDA_FUNC const F32* getPtr(void) const { return &x; }
     FW_CUDA_FUNC F32*       getPtr(void)       { return &x; }

     // Builds a vector from ptr[0..2].
     static FW_CUDA_FUNC Vec3f fromPtr(const F32* ptr)
     {
         const F32 first = ptr[0];
         const F32 second = ptr[1];
         const F32 third = ptr[2];
         return Vec3f(first, second, third);
     }

     // Conversion to the integer vector; each component is cast to S32.
     FW_CUDA_FUNC operator Vec3i(void) const
     {
         const S32 ix = (S32)x;
         const S32 iy = (S32)y;
         const S32 iz = (S32)z;
         return Vec3i(ix, iy, iz);
     }

     // The first two components as a Vec2f.
     FW_CUDA_FUNC Vec2f getXY(void) const
     {
         Vec2f result(x, y);
         return result;
     }

     // 3D cross product of this vector with v.
     FW_CUDA_FUNC Vec3f cross(const Vec3f& v) const
     {
         const F32 cx = y * v.z - z * v.y;
         const F32 cy = z * v.x - x * v.z;
         const F32 cz = x * v.y - y * v.x;
         return Vec3f(cx, cy, cz);
     }

     // Copy from any F32 vector class with three components.
     template <class V> FW_CUDA_FUNC Vec3f(const VectorBase<F32, 3, V>& v)
     {
         set(v);
     }

     template <class V> FW_CUDA_FUNC Vec3f& operator=(const VectorBase<F32, 3, V>& v)
     {
         set(v);
         return *this;
     }
 };


 //------------------------------------------------------------------------


 // Four-component F32 vector. The x/y/z/w fields are inherited from float4 and the
 // generic operations from VectorBase, which reaches the components via getPtr().
 class Vec4f : public VectorBase<F32, 4, Vec4f>, public float4
 {
 public:
     // All components zero.
     FW_CUDA_FUNC Vec4f(void)
     {
         x = (F32)0;
         y = (F32)0;
         z = (F32)0;
         w = (F32)0;
     }

     // Every component set to a.
     FW_CUDA_FUNC Vec4f(F32 a)
     {
         x = a;
         y = a;
         z = a;
         w = a;
     }

     FW_CUDA_FUNC Vec4f(F32 xx, F32 yy, F32 zz, F32 ww)
     {
         x = xx;
         y = yy;
         z = zz;
         w = ww;
     }

     // Composition from smaller vectors plus the remaining components.
     FW_CUDA_FUNC Vec4f(const Vec2f& xy, F32 zz, F32 ww)
     {
         x = xy.x;
         y = xy.y;
         z = zz;
         w = ww;
     }

     FW_CUDA_FUNC Vec4f(const Vec3f& xyz, F32 ww)
     {
         x = xyz.x;
         y = xyz.y;
         z = xyz.z;
         w = ww;
     }

     FW_CUDA_FUNC Vec4f(const Vec2f& xy, const Vec2f& zw)
     {
         x = xy.x;
         y = xy.y;
         z = zw.x;
         w = zw.y;
     }

     // Conversion from the integer vector, component by component.
     FW_CUDA_FUNC Vec4f(const Vec4i& v)
     {
         x = (F32)v.x;
         y = (F32)v.y;
         z = (F32)v.z;
         w = (F32)v.w;
     }

     // Address of the first component.
     FW_CUDA_FUNC const F32* getPtr(void) const { return &x; }
     FW_CUDA_FUNC F32*       getPtr(void)       { return &x; }

     // Builds a vector from ptr[0..3].
     static FW_CUDA_FUNC Vec4f fromPtr(const F32* ptr)
     {
         const F32 first = ptr[0];
         const F32 second = ptr[1];
         const F32 third = ptr[2];
         const F32 fourth = ptr[3];
         return Vec4f(first, second, third, fourth);
     }

     // Conversion to the integer vector; each component is cast to S32.
     FW_CUDA_FUNC operator Vec4i(void) const
     {
         const S32 ix = (S32)x;
         const S32 iy = (S32)y;
         const S32 iz = (S32)z;
         const S32 iw = (S32)w;
         return Vec4i(ix, iy, iz, iw);
     }

     // Sub-vectors built from the named components.
     FW_CUDA_FUNC Vec2f getXY(void) const
     {
         Vec2f result(x, y);
         return result;
     }

     FW_CUDA_FUNC Vec3f getXYZ(void) const
     {
         Vec3f result(x, y, z);
         return result;
     }

     FW_CUDA_FUNC Vec3f getXYW(void) const
     {
         Vec3f result(x, y, w);
         return result;
     }

 #if !FW_CUDA
     // Declared only when FW_CUDA is not set; defined elsewhere.
     // NOTE(review): presumably converts to/from a packed 32-bit ABGR color -- confirm against the definitions.
     static Vec4f    fromABGR        (U32 abgr);
     U32             toABGR          (void) const;
 #endif

     // Copy from any F32 vector class with four components.
     template <class V> FW_CUDA_FUNC Vec4f(const VectorBase<F32, 4, V>& v)
     {
         set(v);
     }

     template <class V> FW_CUDA_FUNC Vec4f& operator=(const VectorBase<F32, 4, V>& v)
     {
         set(v);
         return *this;
     }
 };


 //------------------------------------------------------------------------


 // Two-component F64 vector. The x/y fields are inherited from double2 and the
 // generic operations from VectorBase, which reaches the components via getPtr().
 class Vec2d : public VectorBase<F64, 2, Vec2d>, public double2
 {
 public:
     // All components zero.
     FW_CUDA_FUNC Vec2d(void)
     {
         x = (F64)0;
         y = (F64)0;
     }

     // Both components set to a.
     FW_CUDA_FUNC Vec2d(F64 a)
     {
         x = a;
         y = a;
     }

     FW_CUDA_FUNC Vec2d(F64 xx, F64 yy)
     {
         x = xx;
         y = yy;
     }

     // Conversions from the integer and F32 vectors, component by component.
     FW_CUDA_FUNC Vec2d(const Vec2i& v)
     {
         x = (F64)v.x;
         y = (F64)v.y;
     }

     FW_CUDA_FUNC Vec2d(const Vec2f& v)
     {
         x = v.x;
         y = v.y;
     }

     // Address of the first component.
     FW_CUDA_FUNC const F64* getPtr(void) const { return &x; }
     FW_CUDA_FUNC F64*       getPtr(void)       { return &x; }

     // Builds a vector from ptr[0] and ptr[1].
     static FW_CUDA_FUNC Vec2d fromPtr(const F64* ptr)
     {
         const F64 first = ptr[0];
         const F64 second = ptr[1];
         return Vec2d(first, second);
     }

     // Conversions to the integer and F32 vectors; each component is cast.
     FW_CUDA_FUNC operator Vec2i(void) const
     {
         const S32 ix = (S32)x;
         const S32 iy = (S32)y;
         return Vec2i(ix, iy);
     }

     FW_CUDA_FUNC operator Vec2f(void) const
     {
         const F32 fx = (F32)x;
         const F32 fy = (F32)y;
         return Vec2f(fx, fy);
     }

     // Returns (-y, x).
     FW_CUDA_FUNC Vec2d perpendicular(void) const
     {
         Vec2d result(-y, x);
         return result;
     }

     // Scalar 2D cross product: x * v.y - y * v.x.
     FW_CUDA_FUNC F64 cross(const Vec2d& v) const
     {
         return x * v.y - y * v.x;
     }

     // Copy from any F64 vector class with two components.
     template <class V> FW_CUDA_FUNC Vec2d(const VectorBase<F64, 2, V>& v)
     {
         set(v);
     }

     template <class V> FW_CUDA_FUNC Vec2d& operator=(const VectorBase<F64, 2, V>& v)
     {
         set(v);
         return *this;
     }
 };


 //------------------------------------------------------------------------


 // Three-component F64 vector. The x/y/z fields are inherited from double3 and the
 // generic operations from VectorBase, which reaches the components via getPtr().
 class Vec3d : public VectorBase<F64, 3, Vec3d>, public double3
 {
 public:
     // All components zero.
     FW_CUDA_FUNC Vec3d(void)
     {
         x = (F64)0;
         y = (F64)0;
         z = (F64)0;
     }

     // Every component set to a.
     FW_CUDA_FUNC Vec3d(F64 a)
     {
         x = a;
         y = a;
         z = a;
     }

     FW_CUDA_FUNC Vec3d(F64 xx, F64 yy, F64 zz)
     {
         x = xx;
         y = yy;
         z = zz;
     }

     // x and y taken from xy, z given separately.
     FW_CUDA_FUNC Vec3d(const Vec2d& xy, F64 zz)
     {
         x = xy.x;
         y = xy.y;
         z = zz;
     }

     // Conversions from the integer and F32 vectors, component by component.
     FW_CUDA_FUNC Vec3d(const Vec3i& v)
     {
         x = (F64)v.x;
         y = (F64)v.y;
         z = (F64)v.z;
     }

     FW_CUDA_FUNC Vec3d(const Vec3f& v)
     {
         x = v.x;
         y = v.y;
         z = v.z;
     }

     // Address of the first component.
     FW_CUDA_FUNC const F64* getPtr(void) const { return &x; }
     FW_CUDA_FUNC F64*       getPtr(void)       { return &x; }

     // Builds a vector from ptr[0..2].
     static FW_CUDA_FUNC Vec3d fromPtr(const F64* ptr)
     {
         const F64 first = ptr[0];
         const F64 second = ptr[1];
         const F64 third = ptr[2];
         return Vec3d(first, second, third);
     }

     // Conversions to the integer and F32 vectors; each component is cast.
     FW_CUDA_FUNC operator Vec3i(void) const
     {
         const S32 ix = (S32)x;
         const S32 iy = (S32)y;
         const S32 iz = (S32)z;
         return Vec3i(ix, iy, iz);
     }

     FW_CUDA_FUNC operator Vec3f(void) const
     {
         const F32 fx = (F32)x;
         const F32 fy = (F32)y;
         const F32 fz = (F32)z;
         return Vec3f(fx, fy, fz);
     }

     // The first two components as a Vec2d.
     FW_CUDA_FUNC Vec2d getXY(void) const
     {
         Vec2d result(x, y);
         return result;
     }

     // 3D cross product of this vector with v.
     FW_CUDA_FUNC Vec3d cross(const Vec3d& v) const
     {
         const F64 cx = y * v.z - z * v.y;
         const F64 cy = z * v.x - x * v.z;
         const F64 cz = x * v.y - y * v.x;
         return Vec3d(cx, cy, cz);
     }

     // Copy from any F64 vector class with three components.
     template <class V> FW_CUDA_FUNC Vec3d(const VectorBase<F64, 3, V>& v)
     {
         set(v);
     }

     template <class V> FW_CUDA_FUNC Vec3d& operator=(const VectorBase<F64, 3, V>& v)
     {
         set(v);
         return *this;
     }
 };


 //------------------------------------------------------------------------


 // Four-component F64 vector. The x/y/z/w members are inherited from double4
 // and the generic vector interface is inherited from VectorBase.
 class Vec4d : public VectorBase<F64, 4, Vec4d>, public double4
 {
 public:
     // Construction: default (via setZero), scalar broadcast (via set),
     // per-component, and several ways of gluing smaller vectors together.
     FW_CUDA_FUNC Vec4d(void)                                { setZero(); }
     FW_CUDA_FUNC Vec4d(F64 a)                               { set(a); }
     FW_CUDA_FUNC Vec4d(F64 xx, F64 yy, F64 zz, F64 ww)      { x = xx; y = yy; z = zz; w = ww; }
     FW_CUDA_FUNC Vec4d(const Vec2d& xy, F64 zz, F64 ww)     { x = xy.x; y = xy.y; z = zz; w = ww; }
     FW_CUDA_FUNC Vec4d(const Vec3d& xyz, F64 ww)            { x = xyz.x; y = xyz.y; z = xyz.z; w = ww; }
     FW_CUDA_FUNC Vec4d(const Vec2d& xy, const Vec2d& zw)    { x = xy.x; y = xy.y; z = zw.x; w = zw.y; }

     // Conversions from the S32 and F32 vector types.
     FW_CUDA_FUNC Vec4d(const Vec4i& v)
     {
         x = static_cast<F64>(v.x);
         y = static_cast<F64>(v.y);
         z = static_cast<F64>(v.z);
         w = static_cast<F64>(v.w);
     }
     FW_CUDA_FUNC Vec4d(const Vec4f& v)                      { x = v.x; y = v.y; z = v.z; w = v.w; }

     // Raw component access: pointer to x.
     FW_CUDA_FUNC const F64* getPtr(void) const { return &x; }
     FW_CUDA_FUNC F64*       getPtr(void)       { return &x; }

     // Builds a vector from the first four values at ptr.
     static FW_CUDA_FUNC Vec4d fromPtr(const F64* ptr)
     {
         const F64 first  = ptr[0];
         const F64 second = ptr[1];
         const F64 third  = ptr[2];
         const F64 fourth = ptr[3];
         return Vec4d(first, second, third, fourth);
     }

     // Implicit conversions to the S32 and F32 vector types (component-wise casts).
     FW_CUDA_FUNC operator Vec4i(void) const
     {
         return Vec4i(static_cast<S32>(x), static_cast<S32>(y), static_cast<S32>(z), static_cast<S32>(w));
     }
     FW_CUDA_FUNC operator Vec4f(void) const
     {
         return Vec4f(static_cast<F32>(x), static_cast<F32>(y), static_cast<F32>(z), static_cast<F32>(w));
     }

     // Sub-vector extraction.
     FW_CUDA_FUNC Vec2d getXY (void) const { return Vec2d(x, y); }
     FW_CUDA_FUNC Vec3d getXYZ(void) const { return Vec3d(x, y, z); }
     FW_CUDA_FUNC Vec3d getXYW(void) const { return Vec3d(x, y, w); }

     // Construction / assignment from any other 4-component F64 vector type.
     template <class V> FW_CUDA_FUNC Vec4d(const VectorBase<F64, 4, V>& v) { set(v); }
     template <class V> FW_CUDA_FUNC Vec4d& operator=(const VectorBase<F64, 4, V>& v)
     {
         set(v);
         return *this;
     }
 };


 //------------------------------------------------------------------------


 // Free-function spellings of VectorBase member operations. Each one simply
 // forwards to the member function of the same (or corresponding) name.

 template <class T, int L, class S>
 FW_CUDA_FUNC T lenSqr(const VectorBase<T, L, S>& v)
 {
     return v.lenSqr();
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC T length(const VectorBase<T, L, S>& v)
 {
     return v.length();
 }

 // Forwards to v.normalized(len); len defaults to 1.
 template <class T, int L, class S>
 FW_CUDA_FUNC S normalize(const VectorBase<T, L, S>& v, T len = (T)1)
 {
     return v.normalized(len);
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC T min(const VectorBase<T, L, S>& v)
 {
     return v.min();
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC T max(const VectorBase<T, L, S>& v)
 {
     return v.max();
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC T sum(const VectorBase<T, L, S>& v)
 {
     return v.sum();
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC S abs(const VectorBase<T, L, S>& v)
 {
     return v.abs();
 }


 // Binary operators with the scalar on the left-hand side and a vector on the
 // right. Operators where the operand order is interchangeable reuse the
 // vector-scalar member operators; the rest are evaluated per component.

 template <class T, int L, class S>
 FW_CUDA_FUNC S operator+(const T& a, const VectorBase<T, L, S>& b)
 {
     return b + a;
 }

 // a - b is evaluated as (-b) + a.
 template <class T, int L, class S>
 FW_CUDA_FUNC S operator-(const T& a, const VectorBase<T, L, S>& b)
 {
     return -b + a;
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC S operator*(const T& a, const VectorBase<T, L, S>& b)
 {
     return b * a;
 }

 // Component k of the result is a / b[k].
 template <class T, int L, class S>
 FW_CUDA_FUNC S operator/(const T& a, const VectorBase<T, L, S>& b)
 {
     const T* src = b.getPtr();
     S result;
     T* dst = result.getPtr();
     for (int k = 0; k < L; ++k)
         dst[k] = a / src[k];
     return result;
 }

 // Component k of the result is a % b[k].
 template <class T, int L, class S>
 FW_CUDA_FUNC S operator%(const T& a, const VectorBase<T, L, S>& b)
 {
     const T* src = b.getPtr();
     S result;
     T* dst = result.getPtr();
     for (int k = 0; k < L; ++k)
         dst[k] = a % src[k];
     return result;
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC S operator&(const T& a, const VectorBase<T, L, S>& b)
 {
     return b & a;
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC S operator|(const T& a, const VectorBase<T, L, S>& b)
 {
     return b | a;
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC S operator^(const T& a, const VectorBase<T, L, S>& b)
 {
     return b ^ a;
 }

 // Component k of the result is a << b[k].
 template <class T, int L, class S>
 FW_CUDA_FUNC S operator<<(const T& a, const VectorBase<T, L, S>& b)
 {
     const T* src = b.getPtr();
     S result;
     T* dst = result.getPtr();
     for (int k = 0; k < L; ++k)
         dst[k] = a << src[k];
     return result;
 }

 // Component k of the result is a >> b[k].
 template <class T, int L, class S>
 FW_CUDA_FUNC S operator>>(const T& a, const VectorBase<T, L, S>& b)
 {
     const T* src = b.getPtr();
     S result;
     T* dst = result.getPtr();
     for (int k = 0; k < L; ++k)
         dst[k] = a >> src[k];
     return result;
 }


 // Free-function form of a.dot(b); the two operands may be different vector
 // classes as long as element type and length agree.
 template <class T, int L, class S, class V>
 FW_CUDA_FUNC T dot(const VectorBase<T, L, S>& a, const VectorBase<T, L, V>& b)
 {
     return a.dot(b);
 }

 // Free-function forms of the perpendicular() members of the 2D vectors.
 FW_CUDA_FUNC Vec2f perpendicular(const Vec2f& v) { return v.perpendicular(); }
 FW_CUDA_FUNC Vec2d perpendicular(const Vec2d& v) { return v.perpendicular(); }

 // Free-function forms of the cross() members: the 2D overloads return a
 // scalar, the 3D overloads return a vector.
 FW_CUDA_FUNC F32   cross(const Vec2f& a, const Vec2f& b) { return a.cross(b); }
 FW_CUDA_FUNC F64   cross(const Vec2d& a, const Vec2d& b) { return a.cross(b); }
 FW_CUDA_FUNC Vec3f cross(const Vec3f& a, const Vec3f& b) { return a.cross(b); }
 FW_CUDA_FUNC Vec3d cross(const Vec3d& a, const Vec3d& b) { return a.cross(b); }


 // MINMAX(T) stamps out free-function min / max (2, 3 and 4 operands) and
 // clamp for a concrete vector type T, each forwarding to T's member
 // min() / max() / clamp(). Every overload exists in a const-reference and a
 // non-const-reference flavour.
 // NOTE(review): the non-const flavours presumably exist so that non-const
 // lvalues select these overloads over the generic min/max templates; confirm.
 //
 // The macro body must be contiguous: each continued line ends with a
 // backslash directly followed by the newline. An empty line after a
 // backslash ends the #define, which would leave the overloads below as
 // ordinary definitions with T undeclared.
 #define MINMAX(T) \
     FW_CUDA_FUNC T min(const T& a, const T& b)                          { return a.min(b); } \
     FW_CUDA_FUNC T min(T& a, T& b)                                      { return a.min(b); } \
     FW_CUDA_FUNC T max(const T& a, const T& b)                          { return a.max(b); } \
     FW_CUDA_FUNC T max(T& a, T& b)                                      { return a.max(b); } \
     FW_CUDA_FUNC T min(const T& a, const T& b, const T& c)              { return a.min(b).min(c); } \
     FW_CUDA_FUNC T min(T& a, T& b, T& c)                                { return a.min(b).min(c); } \
     FW_CUDA_FUNC T max(const T& a, const T& b, const T& c)              { return a.max(b).max(c); } \
     FW_CUDA_FUNC T max(T& a, T& b, T& c)                                { return a.max(b).max(c); } \
     FW_CUDA_FUNC T min(const T& a, const T& b, const T& c, const T& d)  { return a.min(b).min(c).min(d); } \
     FW_CUDA_FUNC T min(T& a, T& b, T& c, T& d)                          { return a.min(b).min(c).min(d); } \
     FW_CUDA_FUNC T max(const T& a, const T& b, const T& c, const T& d)  { return a.max(b).max(c).max(d); } \
     FW_CUDA_FUNC T max(T& a, T& b, T& c, T& d)                          { return a.max(b).max(c).max(d); } \
     FW_CUDA_FUNC T clamp(const T& v, const T& lo, const T& hi)          { return v.clamp(lo, hi); } \
     FW_CUDA_FUNC T clamp(T& v, T& lo, T& hi)                            { return v.clamp(lo, hi); }

 // Instantiate the helpers for every concrete S32 / F32 / F64 vector type.
 MINMAX(Vec2i) MINMAX(Vec3i) MINMAX(Vec4i)
 MINMAX(Vec2f) MINMAX(Vec3f) MINMAX(Vec4f)
 MINMAX(Vec2d) MINMAX(Vec3d) MINMAX(Vec4d)

 // The macro is an implementation detail of this header.
 #undef MINMAX


 //------------------------------------------------------------------------


 // CRTP base class for square L x L matrices with element type T.
 // The derived class S owns the storage and exposes it through getPtr().
 // Element (r, c) is stored at linear index r + c * L, i.e. each column
 // occupies L consecutive elements.
 template <class T, int L, class S> class MatrixBase
 {
 public:
     FW_CUDA_FUNC MatrixBase(void) {}

     // Static factories (declared only; the definitions live outside the class).
     template <class V> static FW_CUDA_FUNC S translate(const VectorBase<T, L - 1, V>& v);
     template <class V> static FW_CUDA_FUNC S scale(const VectorBase<T, L - 1, V>& v);
     template <class V> static FW_CUDA_FUNC S scale(const VectorBase<T, L, V>& v);

     // Raw storage access, forwarded to the derived class.
     FW_CUDA_FUNC const T* getPtr(void) const { return ((S*)this)->getPtr(); }
     FW_CUDA_FUNC T*       getPtr(void)       { return ((S*)this)->getPtr(); }

     // Element access by linear index.
     FW_CUDA_FUNC const T& get(int idx) const { FW_ASSERT(idx >= 0 && idx < L * L); const T* base = getPtr(); return base[idx]; }
     FW_CUDA_FUNC T&       get(int idx)       { FW_ASSERT(idx >= 0 && idx < L * L); T* base = getPtr(); return base[idx]; }

     // Element access by (row, column).
     FW_CUDA_FUNC const T& get(int r, int c) const { FW_ASSERT(r >= 0 && r < L && c >= 0 && c < L); const T* base = getPtr(); return base[r + c * L]; }
     FW_CUDA_FUNC T&       get(int r, int c)       { FW_ASSERT(r >= 0 && r < L && c >= 0 && c < L); T* base = getPtr(); return base[r + c * L]; }

     // Element stores; both return the value that was stored there before.
     FW_CUDA_FUNC T set(int idx, const T& a)
     {
         T& target = get(idx);
         T previous = target;
         target = a;
         return previous;
     }
     FW_CUDA_FUNC T set(int r, int c, const T& a)
     {
         T& target = get(r, c);
         T previous = target;
         target = a;
         return previous;
     }

     // Column c viewed in place as a Vector<T, L> (no copy is made).
     FW_CUDA_FUNC const Vector<T, L>& col(int c) const { FW_ASSERT(c >= 0 && c < L); const T* first = getPtr() + c * L; return *(const Vector<T, L>*)first; }
     FW_CUDA_FUNC Vector<T, L>&       col(int c)       { FW_ASSERT(c >= 0 && c < L); T* first = getPtr() + c * L; return *(Vector<T, L>*)first; }
     FW_CUDA_FUNC const Vector<T, L>& getCol(int c) const { return col(c); }

     // Row r as a vector (declared only).
     FW_CUDA_FUNC Vector<T, L> getRow(int r) const;

     // Bulk stores: fill with one value, or copy L * L values from ptr.
     FW_CUDA_FUNC void set(const T& a)
     {
         for (int k = 0; k < L * L; ++k)
             get(k) = a;
     }
     FW_CUDA_FUNC void set(const T* ptr)
     {
         FW_ASSERT(ptr);
         for (int k = 0; k < L * L; ++k)
             get(k) = ptr[k];
     }
     FW_CUDA_FUNC void setZero(void) { set((T)0); }
     FW_CUDA_FUNC void setIdentity(void)
     {
         setZero();
         for (int d = 0; d < L; ++d)
             get(d, d) = (T)1;
     }

 #if !FW_CUDA
     // Only declared when FW_CUDA is false.
     void print(void) const;
 #endif

     // Determinant / transpose / inverse (declared only), plus in-place
     // variants that overwrite *this with the corresponding result.
     FW_CUDA_FUNC T    det(void) const;
     FW_CUDA_FUNC S    transposed(void) const;
     FW_CUDA_FUNC S    inverted(void) const;
     FW_CUDA_FUNC void transpose(void) { set(transposed()); }
     FW_CUDA_FUNC void invert(void)    { set(inverted()); }

     // m(r, c) is shorthand for m.get(r, c).
     FW_CUDA_FUNC const T& operator()(int r, int c) const { return get(r, c); }
     FW_CUDA_FUNC T&       operator()(int r, int c)       { return get(r, c); }

     // Scalar assignment and compound assignment; all return the derived object.
     FW_CUDA_FUNC S& operator=  (const T& a) { set(a); return *(S*)this; }
     FW_CUDA_FUNC S& operator+= (const T& a) { set(this->operator+(a)); return *(S*)this; }
     FW_CUDA_FUNC S& operator-= (const T& a) { set(this->operator-(a)); return *(S*)this; }
     FW_CUDA_FUNC S& operator*= (const T& a) { set(this->operator*(a)); return *(S*)this; }
     FW_CUDA_FUNC S& operator/= (const T& a) { set(this->operator/(a)); return *(S*)this; }
     FW_CUDA_FUNC S& operator%= (const T& a) { set(this->operator%(a)); return *(S*)this; }
     FW_CUDA_FUNC S& operator&= (const T& a) { set(this->operator&(a)); return *(S*)this; }
     FW_CUDA_FUNC S& operator|= (const T& a) { set(this->operator|(a)); return *(S*)this; }
     FW_CUDA_FUNC S& operator^= (const T& a) { set(this->operator^(a)); return *(S*)this; }
     FW_CUDA_FUNC S& operator<<=(const T& a) { set(this->operator<<(a)); return *(S*)this; }
     FW_CUDA_FUNC S& operator>>=(const T& a) { set(this->operator>>(a)); return *(S*)this; }

     // Unary operators, applied to every element.
     FW_CUDA_FUNC S operator+(void) const { return *this; }
     FW_CUDA_FUNC S operator-(void) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = -get(k); return out; }
     FW_CUDA_FUNC S operator~(void) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = ~get(k); return out; }

     // Matrix (op) scalar, applied to every element.
     FW_CUDA_FUNC S operator+ (const T& a) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) + a; return out; }
     FW_CUDA_FUNC S operator- (const T& a) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) - a; return out; }
     FW_CUDA_FUNC S operator* (const T& a) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) * a; return out; }
     FW_CUDA_FUNC S operator/ (const T& a) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) / a; return out; }
     FW_CUDA_FUNC S operator% (const T& a) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) % a; return out; }
     FW_CUDA_FUNC S operator& (const T& a) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) & a; return out; }
     FW_CUDA_FUNC S operator| (const T& a) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) | a; return out; }
     FW_CUDA_FUNC S operator^ (const T& a) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) ^ a; return out; }
     FW_CUDA_FUNC S operator<<(const T& a) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) << a; return out; }
     FW_CUDA_FUNC S operator>>(const T& a) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) >> a; return out; }

     // Column / row / whole-matrix stores from other vector or matrix types.
     template <class V> FW_CUDA_FUNC void setCol(int c, const VectorBase<T, L, V>& v) { col(c) = v; }
     template <class V> FW_CUDA_FUNC void setRow(int r, const VectorBase<T, L, V>& v);
     template <class V> FW_CUDA_FUNC void set(const MatrixBase<T, L, V>& v) { const T* src = v.getPtr(); set(src); }

     // Matrix assignment and compound assignment; all return the derived object.
     template <class V> FW_CUDA_FUNC S& operator=  (const MatrixBase<T, L, V>& v) { set(v); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S& operator+= (const MatrixBase<T, L, V>& v) { set(this->operator+(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S& operator-= (const MatrixBase<T, L, V>& v) { set(this->operator-(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S& operator*= (const MatrixBase<T, L, V>& v) { set(this->operator*(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S& operator/= (const MatrixBase<T, L, V>& v) { set(this->operator/(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S& operator%= (const MatrixBase<T, L, V>& v) { set(this->operator%(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S& operator&= (const MatrixBase<T, L, V>& v) { set(this->operator&(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S& operator|= (const MatrixBase<T, L, V>& v) { set(this->operator|(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S& operator^= (const MatrixBase<T, L, V>& v) { set(this->operator^(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S& operator<<=(const MatrixBase<T, L, V>& v) { set(this->operator<<(v)); return *(S*)this; }
     template <class V> FW_CUDA_FUNC S& operator>>=(const MatrixBase<T, L, V>& v) { set(this->operator>>(v)); return *(S*)this; }

     // Matrix * vector products for L- and (L-1)-component vectors (declared only).
     template <class V> FW_CUDA_FUNC V operator*(const VectorBase<T, L, V>& v) const;
     template <class V> FW_CUDA_FUNC V operator*(const VectorBase<T, L - 1, V>& v) const;

     // Matrix (op) matrix. operator* is declared only; operator/ multiplies
     // by v.inverted(); every other operator works element by element.
     template <class V> FW_CUDA_FUNC S operator+ (const MatrixBase<T, L, V>& v) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) + v.get(k); return out; }
     template <class V> FW_CUDA_FUNC S operator- (const MatrixBase<T, L, V>& v) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) - v.get(k); return out; }
     template <class V> FW_CUDA_FUNC S operator* (const MatrixBase<T, L, V>& v) const;
     template <class V> FW_CUDA_FUNC S operator/ (const MatrixBase<T, L, V>& v) const { return this->operator*(v.inverted()); }
     template <class V> FW_CUDA_FUNC S operator% (const MatrixBase<T, L, V>& v) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) % v.get(k); return out; }
     template <class V> FW_CUDA_FUNC S operator& (const MatrixBase<T, L, V>& v) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) & v.get(k); return out; }
     template <class V> FW_CUDA_FUNC S operator| (const MatrixBase<T, L, V>& v) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) | v.get(k); return out; }
     template <class V> FW_CUDA_FUNC S operator^ (const MatrixBase<T, L, V>& v) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) ^ v.get(k); return out; }
     template <class V> FW_CUDA_FUNC S operator<<(const MatrixBase<T, L, V>& v) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) << v.get(k); return out; }
     template <class V> FW_CUDA_FUNC S operator>>(const MatrixBase<T, L, V>& v) const { S out; for (int k = 0; k < L * L; ++k) out.get(k) = get(k) >> v.get(k); return out; }

     // Exact element-wise comparison.
     template <class V> FW_CUDA_FUNC bool operator==(const MatrixBase<T, L, V>& v) const
     {
         for (int k = 0; k < L * L; ++k)
         {
             if (get(k) != v.get(k))
                 return false;
         }
         return true;
     }
     template <class V> FW_CUDA_FUNC bool operator!=(const MatrixBase<T, L, V>& v) const
     {
         const bool equal = this->operator==(v);
         return !equal;
     }
 };


 //------------------------------------------------------------------------


 // Generic L x L matrix with element type T, storing its L * L values in a
 // private array. Default construction calls setIdentity().
 //
 // Members inherited from MatrixBase<T, L, Matrix<T, L> > are reached through
 // "this->": the base class depends on the template parameters, so a plain
 // unqualified call such as setIdentity() is not looked up in it by compilers
 // that implement two-phase name lookup.
 template <class T, int L> class Matrix : public MatrixBase<T, L, Matrix<T, L> >
 {
 public:
     FW_CUDA_FUNC                    Matrix      (void)                      { this->setIdentity(); }
     // Fills every element with a.
     FW_CUDA_FUNC    explicit        Matrix      (T a)                       { this->set(a); }

     // Raw storage access: pointer to the first element of the value array.
     FW_CUDA_FUNC    const T*        getPtr      (void) const                { return m_values; }
     FW_CUDA_FUNC    T*              getPtr      (void)                      { return m_values; }

     // Builds a matrix by copying L * L values from ptr.
     static FW_CUDA_FUNC Matrix      fromPtr     (const T* ptr)              { Matrix v; v.set(ptr); return v; }

     // Construction / assignment from any other L x L matrix type over T.
     template <class V> FW_CUDA_FUNC Matrix(const MatrixBase<T, L, V>& v) { this->set(v); }
     template <class V> FW_CUDA_FUNC Matrix& operator=(const MatrixBase<T, L, V>& v) { this->set(v); return *this; }

 private:
     T               m_values[L * L];
 };


 //------------------------------------------------------------------------


 // 2x2 F32 matrix with named element members mRC (R = row, C = column).
 // Default construction calls setIdentity().
 class Mat2f : public MatrixBase<F32, 2, Mat2f>
 {
 public:
     FW_CUDA_FUNC Mat2f(void)                    { setIdentity(); }
     // Fills every element with a.
     FW_CUDA_FUNC explicit Mat2f(F32 a)          { set(a); }

     // Raw storage access: pointer to m00.
     FW_CUDA_FUNC const F32* getPtr(void) const  { return &m00; }
     FW_CUDA_FUNC F32*       getPtr(void)        { return &m00; }

     // Builds a matrix by copying 2 * 2 values from ptr.
     static FW_CUDA_FUNC Mat2f fromPtr(const F32* ptr)
     {
         Mat2f result;
         result.set(ptr);
         return result;
     }

     // Construction / assignment from any other 2x2 F32 matrix type.
     template <class V> FW_CUDA_FUNC Mat2f(const MatrixBase<F32, 2, V>& v) { set(v); }
     template <class V> FW_CUDA_FUNC Mat2f& operator=(const MatrixBase<F32, 2, V>& v)
     {
         set(v);
         return *this;
     }

 public:
     // One declaration line per column; declaration order defines the layout.
     F32 m00, m10;
     F32 m01, m11;
 };


 //------------------------------------------------------------------------


 // 3x3 F32 matrix with named element members mRC (R = row, C = column).
 // Default construction calls setIdentity().
 class Mat3f : public MatrixBase<F32, 3, Mat3f>
 {
 public:
     FW_CUDA_FUNC Mat3f(void)                    { setIdentity(); }
     // Fills every element with a.
     FW_CUDA_FUNC explicit Mat3f(F32 a)          { set(a); }

     // Raw storage access: pointer to m00.
     FW_CUDA_FUNC const F32* getPtr(void) const  { return &m00; }
     FW_CUDA_FUNC F32*       getPtr(void)        { return &m00; }

     // Builds a matrix by copying 3 * 3 values from ptr.
     static FW_CUDA_FUNC Mat3f fromPtr(const F32* ptr)
     {
         Mat3f result;
         result.set(ptr);
         return result;
     }

     // Construction / assignment from any other 3x3 F32 matrix type.
     template <class V> FW_CUDA_FUNC Mat3f(const MatrixBase<F32, 3, V>& v) { set(v); }
     template <class V> FW_CUDA_FUNC Mat3f& operator=(const MatrixBase<F32, 3, V>& v)
     {
         set(v);
         return *this;
     }

 #if !FW_CUDA
     // Rotation of "angle" radians around "axis". Axis must be unit!
     // Only declared when FW_CUDA is false.
     static Mat3f rotation(const Vec3f& axis, F32 angle);
 #endif

 public:
     // One declaration line per column; declaration order defines the layout.
     F32 m00, m10, m20;
     F32 m01, m11, m21;
     F32 m02, m12, m22;
 };


 //------------------------------------------------------------------------


 // 4x4 F32 matrix with named element members mRC (R = row, C = column).
 // Default construction calls setIdentity().
 class Mat4f : public MatrixBase<F32, 4, Mat4f>
 {
 public:
     FW_CUDA_FUNC Mat4f(void)                    { setIdentity(); }
     // Fills every element with a.
     FW_CUDA_FUNC explicit Mat4f(F32 a)          { set(a); }

     // Raw storage access: pointer to m00.
     FW_CUDA_FUNC const F32* getPtr(void) const  { return &m00; }
     FW_CUDA_FUNC F32*       getPtr(void)        { return &m00; }

     // Builds a matrix by copying 4 * 4 values from ptr.
     static FW_CUDA_FUNC Mat4f fromPtr(const F32* ptr)
     {
         Mat4f result;
         result.set(ptr);
         return result;
     }

 #if !FW_CUDA
     // Helpers that are only declared when FW_CUDA is false; their
     // definitions are not part of this header section.
     Mat3f        getXYZ     (void) const;
     static Mat4f fitToView  (const Vec2f& pos, const Vec2f& size, const Vec2f& viewSize);
     static Mat4f perspective(F32 fov, F32 nearDist, F32 farDist);
 #endif

     // Construction / assignment from any other 4x4 F32 matrix type.
     template <class V> FW_CUDA_FUNC Mat4f(const MatrixBase<F32, 4, V>& v) { set(v); }
     template <class V> FW_CUDA_FUNC Mat4f& operator=(const MatrixBase<F32, 4, V>& v)
     {
         set(v);
         return *this;
     }

 public:
     // One declaration line per column; declaration order defines the layout.
     F32 m00, m10, m20, m30;
     F32 m01, m11, m21, m31;
     F32 m02, m12, m22, m32;
     F32 m03, m13, m23, m33;
 };


 //------------------------------------------------------------------------


 // 2x2 F64 matrix with named element members mRC (R = row, C = column).
 // Default construction calls setIdentity(). Converts implicitly from and
 // to Mat2f.
 class Mat2d : public MatrixBase<F64, 2, Mat2d>
 {
 public:
     FW_CUDA_FUNC                    Mat2d       (void)                      { setIdentity(); }
     // Widening conversion from Mat2f. Elements are written through get(i)
     // rather than set(i, value): set(idx, a) first copies out the previous
     // element value, and here the members have not been initialized yet.
     FW_CUDA_FUNC                    Mat2d       (const Mat2f& a)            { for (int i = 0; i < 2 * 2; i++) get(i) = (F64)a.get(i); }
     // Fills every element with a.
     FW_CUDA_FUNC    explicit        Mat2d       (F64 a)                     { set(a); }

     // Raw storage access: pointer to m00.
     FW_CUDA_FUNC    const F64*      getPtr      (void) const                { return &m00; }
     FW_CUDA_FUNC    F64*            getPtr      (void)                      { return &m00; }

     // Builds a matrix by copying 2 * 2 values from ptr.
     static FW_CUDA_FUNC Mat2d       fromPtr     (const F64* ptr)            { Mat2d v; v.set(ptr); return v; }

     // Narrowing conversion to Mat2f (element-wise cast to F32).
     FW_CUDA_FUNC    operator        Mat2f       (void) const                { Mat2f r; for (int i = 0; i < 2 * 2; i++) r.set(i, (F32)get(i)); return r; }

     // Construction / assignment from any other 2x2 F64 matrix type.
     template <class V> FW_CUDA_FUNC Mat2d(const MatrixBase<F64, 2, V>& v) { set(v); }
     template <class V> FW_CUDA_FUNC Mat2d& operator=(const MatrixBase<F64, 2, V>& v) { set(v); return *this; }

 public:
     // One declaration line per column; declaration order defines the layout.
     F64             m00, m10;
     F64             m01, m11;
 };


 //------------------------------------------------------------------------


 // 3x3 F64 matrix with named element members mRC (R = row, C = column).
 // Default construction calls setIdentity(). Converts implicitly from and
 // to Mat3f.
 class Mat3d : public MatrixBase<F64, 3, Mat3d>
 {
 public:
     FW_CUDA_FUNC                    Mat3d       (void)                      { setIdentity(); }
     // Widening conversion from Mat3f. Elements are written through get(i)
     // rather than set(i, value): set(idx, a) first copies out the previous
     // element value, and here the members have not been initialized yet.
     FW_CUDA_FUNC                    Mat3d       (const Mat3f& a)            { for (int i = 0; i < 3 * 3; i++) get(i) = (F64)a.get(i); }
     // Fills every element with a.
     FW_CUDA_FUNC    explicit        Mat3d       (F64 a)                     { set(a); }

     // Raw storage access: pointer to m00.
     FW_CUDA_FUNC    const F64*      getPtr      (void) const                { return &m00; }
     FW_CUDA_FUNC    F64*            getPtr      (void)                      { return &m00; }

     // Builds a matrix by copying 3 * 3 values from ptr.
     static FW_CUDA_FUNC Mat3d       fromPtr     (const F64* ptr)            { Mat3d v; v.set(ptr); return v; }

     // Narrowing conversion to Mat3f (element-wise cast to F32).
     FW_CUDA_FUNC    operator        Mat3f       (void) const                { Mat3f r; for (int i = 0; i < 3 * 3; i++) r.set(i, (F32)get(i)); return r; }

 #if !FW_CUDA
     // Only declared when FW_CUDA is false.
     static          Mat3d           rotation    (const Vec3d& axis, F64 angle);     // Rotation of "angle" radians around "axis". Axis must be unit!
 #endif

     // Construction / assignment from any other 3x3 F64 matrix type.
     template <class V> FW_CUDA_FUNC Mat3d(const MatrixBase<F64, 3, V>& v) { set(v); }
     template <class V> FW_CUDA_FUNC Mat3d& operator=(const MatrixBase<F64, 3, V>& v) { set(v); return *this; }

 public:
     // One declaration line per column; declaration order defines the layout.
     F64             m00, m10, m20;
     F64             m01, m11, m21;
     F64             m02, m12, m22;
 };


 //------------------------------------------------------------------------


 // 4x4 F64 matrix with named element members mRC (R = row, C = column).
 // Default construction calls setIdentity(). Converts implicitly from and
 // to Mat4f.
 class Mat4d : public MatrixBase<F64, 4, Mat4d>
 {
 public:
     FW_CUDA_FUNC                    Mat4d       (void)                      { setIdentity(); }
     // Widening conversion from Mat4f. Elements are written through get(i)
     // rather than set(i, value): set(idx, a) first copies out the previous
     // element value, and here the members have not been initialized yet.
     FW_CUDA_FUNC                    Mat4d       (const Mat4f& a)            { for (int i = 0; i < 4 * 4; i++) get(i) = (F64)a.get(i); }
     // Fills every element with a.
     FW_CUDA_FUNC    explicit        Mat4d       (F64 a)                     { set(a); }

     // Raw storage access: pointer to m00.
     FW_CUDA_FUNC    const F64*      getPtr      (void) const                { return &m00; }
     FW_CUDA_FUNC    F64*            getPtr      (void)                      { return &m00; }

     // Builds a matrix by copying 4 * 4 values from ptr.
     static FW_CUDA_FUNC Mat4d       fromPtr     (const F64* ptr)            { Mat4d v; v.set(ptr); return v; }

     // Narrowing conversion to Mat4f (element-wise cast to F32).
     FW_CUDA_FUNC    operator        Mat4f       (void) const                { Mat4f r; for (int i = 0; i < 4 * 4; i++) r.set(i, (F32)get(i)); return r; }

     // Construction / assignment from any other 4x4 F64 matrix type.
     template <class V> FW_CUDA_FUNC Mat4d(const MatrixBase<F64, 4, V>& v) { set(v); }
     template <class V> FW_CUDA_FUNC Mat4d& operator=(const MatrixBase<F64, 4, V>& v) { set(v); return *this; }

 public:
     // One declaration line per column; declaration order defines the layout.
     F64             m00, m10, m20, m30;
     F64             m01, m11, m21, m31;
     F64             m02, m12, m22, m32;
     F64             m03, m13, m23, m33;
 };


 //------------------------------------------------------------------------


 // Declaration only: produces an L x L matrix from two L-component vectors
 // of the same class.
 template <class T, int L, class S>
 FW_CUDA_FUNC Matrix<T, L> outerProduct(const VectorBase<T, L, S>& a, const VectorBase<T, L, S>& b);

 // Free-function spellings of the MatrixBase members det(), transposed()
 // and inverted(). None of them modifies its argument.
 template <class T, int L, class S>
 FW_CUDA_FUNC T det(const MatrixBase<T, L, S>& v)
 {
     return v.det();
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC S transpose(const MatrixBase<T, L, S>& v)
 {
     return v.transposed();
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC S invert(const MatrixBase<T, L, S>& v)
 {
     return v.inverted();
 }


 // Binary operators with the scalar on the left-hand side and a matrix on the
 // right. Operators where the operand order is interchangeable reuse the
 // matrix-scalar member operators; the rest are evaluated element by element.

 template <class T, int L, class S>
 FW_CUDA_FUNC S operator+(const T& a, const MatrixBase<T, L, S>& b)
 {
     return b + a;
 }

 // a - b is evaluated as (-b) + a.
 template <class T, int L, class S>
 FW_CUDA_FUNC S operator-(const T& a, const MatrixBase<T, L, S>& b)
 {
     return -b + a;
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC S operator*(const T& a, const MatrixBase<T, L, S>& b)
 {
     return b * a;
 }

 // Element k of the result is a / b.get(k).
 template <class T, int L, class S>
 FW_CUDA_FUNC S operator/(const T& a, const MatrixBase<T, L, S>& b)
 {
     S result;
     for (int k = 0; k < L * L; ++k)
         result.get(k) = a / b.get(k);
     return result;
 }

 // Element k of the result is a % b.get(k).
 template <class T, int L, class S>
 FW_CUDA_FUNC S operator%(const T& a, const MatrixBase<T, L, S>& b)
 {
     S result;
     for (int k = 0; k < L * L; ++k)
         result.get(k) = a % b.get(k);
     return result;
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC S operator&(const T& a, const MatrixBase<T, L, S>& b)
 {
     return b & a;
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC S operator|(const T& a, const MatrixBase<T, L, S>& b)
 {
     return b | a;
 }

 template <class T, int L, class S>
 FW_CUDA_FUNC S operator^(const T& a, const MatrixBase<T, L, S>& b)
 {
     return b ^ a;
 }

 // Element k of the result is a << b.get(k).
 template <class T, int L, class S>
 FW_CUDA_FUNC S operator<<(const T& a, const MatrixBase<T, L, S>& b)
 {
     S result;
     for (int k = 0; k < L * L; ++k)
         result.get(k) = a << b.get(k);
     return result;
 }

 // Element k of the result is a >> b.get(k).
 template <class T, int L, class S>
 FW_CUDA_FUNC S operator>>(const T& a, const MatrixBase<T, L, S>& b)
 {
     S result;
     for (int k = 0; k < L * L; ++k)
         result.get(k) = a >> b.get(k);
     return result;
 }


 //------------------------------------------------------------------------


 // Lookup table with 256 entries: entry i holds the number of set bits in the
 // 8-bit value i. Each row below covers 16 consecutive values. The popc8 /
 // popc16 / popc32 / popc64 functions index it one byte at a time.
 FW_CUDA_CONST int c_popc8LUT[] =

 {

     0, 1, 1, 2, 1, 2, 2, 3, 1, 2, 2, 3, 2, 3, 3, 4,

     1, 2, 2, 3, 2, 3, 3, 4, 2, 3, 3, 4, 3, 4, 4, 5,

     1, 2, 2, 3, 2, 3, 3, 4, 2, 3, 3, 4, 3, 4, 4, 5,

     2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6,

     1, 2, 2, 3, 2, 3, 3, 4, 2, 3, 3, 4, 3, 4, 4, 5,

     2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6,

     2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6,

     3, 4, 4, 5, 4, 5, 5, 6, 4, 5, 5, 6, 5, 6, 6, 7,

     1, 2, 2, 3, 2, 3, 3, 4, 2, 3, 3, 4, 3, 4, 4, 5,

     2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6,

     2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6,

     3, 4, 4, 5, 4, 5, 5, 6, 4, 5, 5, 6, 5, 6, 6, 7,

     2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6,

     3, 4, 4, 5, 4, 5, 5, 6, 4, 5, 5, 6, 5, 6, 6, 7,

     3, 4, 4, 5, 4, 5, 5, 6, 4, 5, 5, 6, 5, 6, 6, 7,

     4, 5, 5, 6, 5, 6, 6, 7, 5, 6, 6, 7, 6, 7, 7, 8,

 };


 // Number of set bits in the lowest 8 bits of mask; higher bits are ignored.
 FW_CUDA_FUNC int popc8(U32 mask)
 {
     const U32 lowByte = mask & 0xFFu;
     return c_popc8LUT[lowByte];
 }


 // Number of set bits in the lowest 16 bits of mask; higher bits are ignored.
 FW_CUDA_FUNC int popc16(U32 mask)
 {
     const U32 byte0 = mask & 0xFFu;
     const U32 byte1 = (mask >> 8) & 0xFFu;
     return c_popc8LUT[byte0] + c_popc8LUT[byte1];
 }


 // Number of set bits in a 32-bit mask, summed from one table lookup per byte.
 FW_CUDA_FUNC int popc32(U32 mask)
 {
     int bits = 0;
     // Visit the four bytes from least to most significant.
     for (int shift = 0; shift < 32; shift += 8)
         bits += c_popc8LUT[(mask >> shift) & 0xFFu];
     return bits;
 }


 // Number of set bits in a 64-bit mask. The mask is split into two 32-bit
 // halves, and each half is counted with one table lookup per byte.
 FW_CUDA_FUNC int popc64(U64 mask)
 {
     const U32 lower = (U32)mask;
     const U32 upper = (U32)(mask >> 32);

     int bits = 0;
     for (int shift = 0; shift < 32; shift += 8)
     {
         bits += c_popc8LUT[(lower >> shift) & 0xffu];
         bits += c_popc8LUT[(upper >> shift) & 0xffu];
     }
     return bits;
 }


 //------------------------------------------------------------------------


 // Starts from a default-constructed S and writes the components of v into
 // rows 0 .. L-2 of the last column. All other elements keep whatever the
 // default constructor of S produced.
 template <class T, int L, class S> template <class V> S MatrixBase<T, L, S>::translate(const VectorBase<T, L - 1, V>& v)
 {
     const int lastCol = L - 1;
     S result;
     for (int row = 0; row < lastCol; ++row)
         result(row, lastCol) = v[row];
     return result;
 }


 //------------------------------------------------------------------------


 // Starts from a default-constructed S and writes the components of v onto
 // the first L-1 diagonal elements. The last diagonal element and all
 // off-diagonal elements keep whatever the default constructor of S produced.
 template <class T, int L, class S> template <class V> S MatrixBase<T, L, S>::scale(const VectorBase<T, L - 1, V>& v)
 {
     const int count = L - 1;
     S result;
     for (int d = 0; d < count; ++d)
         result(d, d) = v[d];
     return result;
 }


 //------------------------------------------------------------------------


 // Builds a matrix whose full diagonal (all L elements) is taken from v.
 // Off-diagonal elements keep the value produced by S's default
 // constructor (presumably zero via an identity default -- confirm).
 template <class T, int L, class S>
 template <class V>
 S MatrixBase<T, L, S>::scale(const VectorBase<T, L, V>& v)
 {
     S result;
     for (int diag = 0; diag != L; ++diag)
         result(diag, diag) = v[diag];
     return result;
 }


 //------------------------------------------------------------------------


 // Copies row idx of this matrix into a freshly constructed Vector<T, L>,
 // one element per column, and returns it by value.
 template <class T, int L, class S>
 Vector<T, L> MatrixBase<T, L, S>::getRow(int idx) const
 {
     Vector<T, L> rowVec;
     for (int colIdx = 0; colIdx < L; ++colIdx)
         rowVec[colIdx] = get(idx, colIdx);
     return rowVec;
 }


 //------------------------------------------------------------------------


 #if !FW_CUDA

 // Writes the matrix to stdout with printf: one text line per matrix row,
 // each element converted to F64 and printed left-aligned in a field of
 // 16 characters using the %g format.
 template <class T, int L, class S>
 void MatrixBase<T, L, S>::print(void) const
 {
     for (int rowIdx = 0; rowIdx < L; ++rowIdx)
     {
         int colIdx = 0;
         while (colIdx < L)
         {
             const F64 value = (F64)get(rowIdx, colIdx);
             printf("%-16g", value);
             ++colIdx;
         }
         printf("\n");
     }
 }

 #endif


 //------------------------------------------------------------------------


 // General determinant: cofactor expansion along column 0.
 // For every row i, the (L-1)x(L-1) matrix obtained by removing row i and
 // column 0 is built, its determinant is multiplied by v(i, 0) and an
 // alternating sign (+, -, +, ...), and the products are summed.
 template <class T, int L, class S>
 FW_CUDA_FUNC T detImpl(const MatrixBase<T, L, S>& v)
 {
     T total = (T)0;
     T sign = (T)1;
     for (int pivotRow = 0; pivotRow < L; ++pivotRow)
     {
         Matrix<T, L - 1> reduced;
         for (int dstRow = 0; dstRow < L - 1; ++dstRow)
         {
             // Skip over the pivot row when reading from the source matrix.
             const int srcRow = (dstRow >= pivotRow) ? dstRow + 1 : dstRow;
             for (int dstCol = 0; dstCol < L - 1; ++dstCol)
                 reduced(dstRow, dstCol) = v(srcRow, dstCol + 1);
         }
         total += reduced.det() * v(pivotRow, 0) * sign;
         sign = -sign;
     }
     return total;
 }


 //------------------------------------------------------------------------


 // Determinant overload for 1x1 matrices: the single element itself.
 template <class T, class S>
 FW_CUDA_FUNC T detImpl(const MatrixBase<T, 1, S>& v)
 {
     const T onlyElement = v(0, 0);
     return onlyElement;
 }


 //------------------------------------------------------------------------


 // Determinant overload for 2x2 matrices, written in closed form:
 // product of the main diagonal minus product of the other diagonal.
 // v(r, c) is used as the element accessor (row r, column c).
 template <class T, class S> FW_CUDA_FUNC T detImpl(const MatrixBase<T, 2, S>& v)

 {

     return v(0, 0) * v(1, 1) - v(0, 1) * v(1, 0);

 }


 //------------------------------------------------------------------------


 // Determinant overload for 3x3 matrices, written as a fully expanded sum
 // of six triple products. Each source line below holds the positive and
 // the negative term that share the same column-0 factor:
 // v(0, 0), then v(1, 0), then v(2, 0).
 template <class T, class S> FW_CUDA_FUNC T detImpl(const MatrixBase<T, 3, S>& v)

 {

     return v(0, 0) * v(1, 1) * v(2, 2) - v(0, 0) * v(1, 2) * v(2, 1) +

            v(1, 0) * v(2, 1) * v(0, 2) - v(1, 0) * v(2, 2) * v(0, 1) +

            v(2, 0) * v(0, 1) * v(1, 2) - v(2, 0) * v(0, 2) * v(1, 1);

 }


 //------------------------------------------------------------------------


 // Returns the determinant of this matrix by forwarding to the detImpl()
 // overload selected for this matrix's size.
 template <class T, int L, class S>
 T MatrixBase<T, L, S>::det(void) const
 {
     const MatrixBase<T, L, S>& self = *this;
     return detImpl(self);
 }


 //------------------------------------------------------------------------


 // Returns a new matrix in which element (c, r) equals element (r, c) of
 // this matrix. This matrix is left unmodified.
 template <class T, int L, class S>
 S MatrixBase<T, L, S>::transposed(void) const
 {
     S mirrored;
     for (int srcRow = 0; srcRow < L; ++srcRow)
     {
         for (int srcCol = 0; srcCol < L; ++srcCol)
             mirrored(srcCol, srcRow) = get(srcRow, srcCol);
     }
     return mirrored;
 }


 //------------------------------------------------------------------------


 // Returns the inverse of this matrix computed from signed minors.
 //
 // Output element (i, j) is the determinant of this matrix with row j and
 // column i removed, times the alternating sign for (i, j). While filling
 // output row i, the same values are multiplied by get(j, i) and summed,
 // which is one cofactor expansion along column i. The running sum
 // therefore ends up holding L expansions of the determinant; the final
 // "* L" compensates for that after multiplying by rcp() of the sum.
 // No check is made here for a zero determinant.
 template <class T, int L, class S>
 S MatrixBase<T, L, S>::inverted(void) const
 {
     S adjugate;
     T detSum = (T)0;
     T rowStartSign = (T)1;
     for (int outRow = 0; outRow < L; ++outRow)
     {
         T sign = rowStartSign;
         for (int outCol = 0; outCol < L; ++outCol)
         {
             // Copy this matrix minus row outCol and column outRow.
             Matrix<T, L - 1> reduced;
             for (int dstRow = 0; dstRow < L - 1; ++dstRow)
             {
                 const int srcRow = (dstRow >= outCol) ? dstRow + 1 : dstRow;
                 for (int dstCol = 0; dstCol < L - 1; ++dstCol)
                 {
                     const int srcCol = (dstCol >= outRow) ? dstCol + 1 : dstCol;
                     reduced(dstRow, dstCol) = get(srcRow, srcCol);
                 }
             }

             const T cofactor = reduced.det() * sign;
             adjugate(outRow, outCol) = cofactor;
             detSum += cofactor * get(outCol, outRow);
             sign = -sign;
         }
         rowStartSign = -rowStartSign;
     }
     return adjugate * rcp(detSum) * L;
 }


 //------------------------------------------------------------------------


 // Overwrites row idx of this matrix with the L components of v,
 // component i going to column i.
 template <class T, int L, class S>
 template <class V>
 void MatrixBase<T, L, S>::setRow(int idx, const VectorBase<T, L, V>& v)
 {
     int colIdx = 0;
     while (colIdx < L)
     {
         get(idx, colIdx) = v[colIdx];
         ++colIdx;
     }
 }


 //------------------------------------------------------------------------


 // Matrix * vector product for a vector of the same dimension L.
 // Component i of the result is the sum over j of get(i, j) * v[j],
 // accumulated in increasing j starting from zero.
 template <class T, int L, class S>
 template <class V>
 V MatrixBase<T, L, S>::operator*(const VectorBase<T, L, V>& v) const
 {
     V product;
     for (int rowIdx = 0; rowIdx < L; ++rowIdx)
     {
         T acc = (T)0;
         for (int colIdx = 0; colIdx < L; ++colIdx)
             acc += get(rowIdx, colIdx) * v[colIdx];
         product[rowIdx] = acc;
     }
     return product;
 }


 //------------------------------------------------------------------------


 // Matrix * vector product for a vector with one component fewer than the
 // matrix dimension. The vector is treated as if it had an extra trailing
 // component equal to one: the last matrix column is added to each row sum,
 // and every output component is multiplied by rcp() of the value computed
 // from the last matrix row. No check is made for that value being zero.
 template <class T, int L, class S>
 template <class V>
 V MatrixBase<T, L, S>::operator*(const VectorBase<T, L - 1, V>& v) const
 {
     const int last = L - 1;

     // Value produced by the last matrix row.
     T w = get(last, last);
     for (int colIdx = 0; colIdx < last; ++colIdx)
         w += get(last, colIdx) * v[colIdx];
     const T invW = rcp(w);

     V projected;
     for (int rowIdx = 0; rowIdx < last; ++rowIdx)
     {
         T acc = get(rowIdx, last);
         for (int colIdx = 0; colIdx < last; ++colIdx)
             acc += get(rowIdx, colIdx) * v[colIdx];
         projected[rowIdx] = acc * invW;
     }
     return projected;
 }


 //------------------------------------------------------------------------


 // Matrix * matrix product. Element (i, j) of the result is the sum over k
 // of get(i, k) * v(k, j), accumulated in increasing k starting from zero.
 // The result has this matrix's concrete type S.
 template <class T, int L, class S>
 template <class V>
 S MatrixBase<T, L, S>::operator*(const MatrixBase<T, L, V>& v) const
 {
     S product;
     for (int rowIdx = 0; rowIdx < L; ++rowIdx)
         for (int colIdx = 0; colIdx < L; ++colIdx)
         {
             T acc = (T)0;
             for (int inner = 0; inner < L; ++inner)
                 acc += get(rowIdx, inner) * v(inner, colIdx);
             product(rowIdx, colIdx) = acc;
         }
     return product;
 }


 //------------------------------------------------------------------------


 // Returns the L x L matrix whose element (i, j) is a.get(i) * b.get(j).
 // Both vectors must share the same concrete vector type S.
 template <class T, int L, class S>
 Matrix<T, L> outerProduct(const VectorBase<T, L, S>& a, const VectorBase<T, L, S>& b)
 {
     Matrix<T, L> product;
     for (int rowIdx = 0; rowIdx < L; ++rowIdx)
     {
         const T& lhs = a.get(rowIdx);
         for (int colIdx = 0; colIdx < L; ++colIdx)
             product.get(rowIdx, colIdx) = lhs * b.get(colIdx);
     }
     return product;
 }


 //------------------------------------------------------------------------

 }

FW::MatrixBase::getPtr
FW_CUDA_FUNC const T * getPtr(void) const
Definition: Math.hpp:518

FW::Mat4f::m20
F32 m20
Definition: Math.hpp:696

FW::Vec4d::Vec4d
FW_CUDA_FUNC Vec4d(const Vec3d &xyz, F64 ww)
Definition: Math.hpp:437

FW::Mat3d::m20
F64 m20
Definition: Math.hpp:748

FW::Vector::Vector
FW_CUDA_FUNC Vector(void)
Definition: Math.hpp:222

FW::VectorBase::set
FW_CUDA_FUNC void set(const T *ptr)
Definition: Math.hpp:133

FW::operator+
FW_CUDA_FUNC S operator+(const T &a, const VectorBase< T, L, S > &b)
Definition: Math.hpp:466

FW::VectorBase::set
FW_CUDA_FUNC void set(const VectorBase< T, L, V > &v)
Definition: Math.hpp:184

FW::operator&
FW_CUDA_FUNC S operator&(const T &a, const VectorBase< T, L, S > &b)
Definition: Math.hpp:471

FW::Vec4d::Vec4d
FW_CUDA_FUNC Vec4d(const Vec4i &v)
Definition: Math.hpp:439

mask
CUdevice int ordinal char int CUdevice dev CUdevprop CUdevice dev CUcontext ctx CUcontext ctx CUcontext pctx CUmodule const void image CUmodule const void fatCubin CUfunction CUmodule const char name void p CUfunction unsigned int bytes CUtexref pTexRef CUtexref CUarray unsigned int Flags CUtexref int CUaddress_mode am CUtexref unsigned int Flags CUaddress_mode CUtexref int dim CUarray_format int CUtexref hTexRef CUfunction unsigned int numbytes CUfunction int float value CUfunction int CUtexref hTexRef CUfunction int int grid_height CUevent unsigned int Flags CUevent hEvent CUevent hEvent CUstream unsigned int Flags CUstream hStream GLuint bufferobj unsigned int CUdevice dev CUdeviceptr unsigned int CUmodule const char name CUdeviceptr unsigned int bytesize CUdeviceptr dptr void unsigned int bytesize void CUdeviceptr unsigned int ByteCount CUarray unsigned int CUdeviceptr unsigned int ByteCount CUarray unsigned int const void unsigned int ByteCount CUarray unsigned int CUarray unsigned int unsigned int ByteCount void CUarray unsigned int unsigned int CUstream hStream const CUDA_MEMCPY2D pCopy CUdeviceptr const void unsigned int CUstream hStream const CUDA_MEMCPY2D CUstream hStream CUdeviceptr unsigned char unsigned int N CUdeviceptr unsigned int unsigned int N CUdeviceptr unsigned int unsigned short unsigned int unsigned int Height CUarray const CUDA_ARRAY_DESCRIPTOR pAllocateArray CUarray const CUDA_ARRAY3D_DESCRIPTOR pAllocateArray unsigned int CUtexref CUdeviceptr unsigned int bytes CUcontext unsigned int CUdevice device GLenum texture GLenum GLuint buffer GLenum GLuint renderbuffer GLenum GLsizeiptr const GLvoid GLenum usage GLuint shader GLenum type GLsizei const GLuint framebuffers GLsizei const GLuint renderbuffers GLuint v GLuint v GLenum GLenum GLenum GLuint GLint level GLsizei GLuint framebuffers GLuint const GLchar name GLenum GLintptr GLsizeiptr GLvoid data GLuint GLenum GLint param GLuint GLenum GLint param GLhandleARB programObj GLenum GLenum GLsizei 
GLsizei height GLenum GLint GLint GLsizei GLsizei GLsizei GLint GLenum GLenum const GLvoid pixels GLint GLsizei const GLfloat value GLint GLfloat GLfloat v1 GLint GLfloat GLfloat GLfloat v2 GLint GLsizei const GLfloat value GLint GLsizei GLboolean const GLfloat value GLuint program GLuint GLfloat GLfloat GLfloat z GLuint GLint GLenum GLboolean GLsizei const GLvoid pointer GLuint GLuint const GLchar name GLenum GLsizei GLenum GLsizei GLsizei height GLenum GLuint renderbuffer GLenum GLenum GLint params GLuint GLsizei range GLuint GLsizei const GLubyte GLsizei GLenum const GLvoid coords GLuint GLsizei GLsizei GLsizei const GLubyte GLsizei GLenum const GLvoid coords GLuint GLenum GLsizei const GLvoid pathString GLuint GLenum const GLvoid GLbitfield GLuint GLsizei GLenum GLuint GLfloat emScale GLuint GLuint srcPath GLuint GLuint GLenum const GLfloat transformValues GLuint GLenum GLint value GLuint GLenum GLfloat value GLenum GLint GLuint mask
Definition: DLLImports.inl:400

FW::floatToBits
U32 floatToBits(F32 a)
Definition: Math.hpp:95

FW::MatrixBase::operator<<
FW_CUDA_FUNC S operator<<(const T &a) const
Definition: Math.hpp:573

FW::MatrixBase::getPtr
FW_CUDA_FUNC T * getPtr(void)
Definition: Math.hpp:519

FW::Vec4d::Vec4d
FW_CUDA_FUNC Vec4d(const Vec2d &xy, F64 zz, F64 ww)
Definition: Math.hpp:436

FW::MatrixBase::set
FW_CUDA_FUNC void set(const T *ptr)
Definition: Math.hpp:532

FW::length
FW_CUDA_FUNC T length(const VectorBase< T, L, S > &v)
Definition: Math.hpp:459

FW::Mat4d::m13
F64 m13
Definition: Math.hpp:775

FW::Vec4d::Vec4d
FW_CUDA_FUNC Vec4d(const VectorBase< F64, 4, V > &v)
Definition: Math.hpp:452

FW::MatrixBase::setRow
FW_CUDA_FUNC void setRow(int r, const VectorBase< T, L, V > &v)

FW::Vec3f::Vec3f
FW_CUDA_FUNC Vec3f(F32 a)
Definition: Math.hpp:328

FW::Vec4i::getXYZ
FW_CUDA_FUNC Vec3i getXYZ(void) const
Definition: Math.hpp:292

FW::Vec4i::getXYW
FW_CUDA_FUNC Vec3i getXYW(void) const
Definition: Math.hpp:293

FW::Vec4f::getXY
FW_CUDA_FUNC Vec2f getXY(void) const
Definition: Math.hpp:364

FW::Mat2f::getPtr
FW_CUDA_FUNC const F32 * getPtr(void) const
Definition: Math.hpp:637

FW::Vec3f::operator=
FW_CUDA_FUNC Vec3f & operator=(const VectorBase< F32, 3, V > &v)
Definition: Math.hpp:343

FW::Mat3f::m11
F32 m11
Definition: Math.hpp:670

FW::MatrixBase::operator+
FW_CUDA_FUNC S operator+(void) const
Definition: Math.hpp:561

FW::Mat3d::operator=
FW_CUDA_FUNC Mat3d & operator=(const MatrixBase< F64, 3, V > &v)
Definition: Math.hpp:745

FW::abs
FW_CUDA_FUNC S abs(const VectorBase< T, L, S > &v)
Definition: Math.hpp:464

FW::Mat3d::m00
F64 m00
Definition: Math.hpp:748

FW::popc64
FW_CUDA_FUNC int popc64(U64 mask)
Definition: Math.hpp:838

FW::Mat4d
Definition: Math.hpp:755

FW::Vec4d::getPtr
FW_CUDA_FUNC F64 * getPtr(void)
Definition: Math.hpp:443

FW::Mat4f::Mat4f
FW_CUDA_FUNC Mat4f(void)
Definition: Math.hpp:679

FW::Mat2d::Mat2d
FW_CUDA_FUNC Mat2d(const MatrixBase< F64, 2, V > &v)
Definition: Math.hpp:717

FW::Vec4i::operator=
FW_CUDA_FUNC Vec4i & operator=(const VectorBase< S32, 4, V > &v)
Definition: Math.hpp:296

FW::Mat3f::fromPtr
static FW_CUDA_FUNC Mat3f fromPtr(const F32 *ptr)
Definition: Math.hpp:659

FW::Mat3d::m02
F64 m02
Definition: Math.hpp:750

FW::Vec2i::Vec2i
FW_CUDA_FUNC Vec2i(void)
Definition: Math.hpp:241

FW::Vec3i::Vec3i
FW_CUDA_FUNC Vec3i(const Vec2i &xy, S32 zz)
Definition: Math.hpp:263

FW::Vec2f::operator=
FW_CUDA_FUNC Vec2f & operator=(const VectorBase< F32, 2, V > &v)
Definition: Math.hpp:319

FW::log2
F64 log2(F64 a)
Definition: Math.hpp:91

FW::Mat4d::m02
F64 m02
Definition: Math.hpp:774

FW::Mat4f::m32
F32 m32
Definition: Math.hpp:698

FW::Vec2f::fromPtr
static FW_CUDA_FUNC Vec2f fromPtr(const F32 *ptr)
Definition: Math.hpp:311

FW::acos
FW_CUDA_FUNC F32 acos(F32 a)
Definition: Math.hpp:53

FW::Mat4f::m01
F32 m01
Definition: Math.hpp:697

FW::Mat4f::m21
F32 m21
Definition: Math.hpp:697

FW::VectorBase::operator=
FW_CUDA_FUNC S & operator=(const T &a)
Definition: Math.hpp:157

FW::exp
FW_CUDA_FUNC F64 exp(F64 a)
Definition: Math.hpp:46

FW::MatrixBase::set
FW_CUDA_FUNC T set(int idx, const T &a)
Definition: Math.hpp:524

FW::Mat3f::Mat3f
FW_CUDA_FUNC Mat3f(F32 a)
Definition: Math.hpp:655

FW::MatrixBase::operator>>=
FW_CUDA_FUNC S & operator>>=(const T &a)
Definition: Math.hpp:559

FW::Vec2f::Vec2f
FW_CUDA_FUNC Vec2f(F32 a)
Definition: Math.hpp:305

FW::Mat2d::m00
F64 m00
Definition: Math.hpp:721

FW::Vec4f::getPtr
FW_CUDA_FUNC const F32 * getPtr(void) const
Definition: Math.hpp:359

FW::atan2
FW_CUDA_FUNC F64 atan2(F64 y, F64 x)
Definition: Math.hpp:57

FW::Vec3d
Definition: Math.hpp:404

FW::Mat3f::Mat3f
FW_CUDA_FUNC Mat3f(void)
Definition: Math.hpp:654

FW::lenSqr
FW_CUDA_FUNC T lenSqr(const VectorBase< T, L, S > &v)
Definition: Math.hpp:458

FW::Matrix::Matrix
FW_CUDA_FUNC Matrix(void)
Definition: Math.hpp:615

FW::Vec2d::perpendicular
FW_CUDA_FUNC Vec2d perpendicular(void) const
Definition: Math.hpp:395

FW::scale
FW_CUDA_FUNC F32 scale(F32 a, int b)
Definition: Math.hpp:104

FW::Mat4d::Mat4d
FW_CUDA_FUNC Mat4d(const Mat4f &a)
Definition: Math.hpp:759

FW::Vec2i::Vec2i
FW_CUDA_FUNC Vec2i(S32 xx, S32 yy)
Definition: Math.hpp:243

FW::VectorBase::max
FW_CUDA_FUNC T max(void) const
Definition: Math.hpp:147

FW::Vec3d::Vec3d
FW_CUDA_FUNC Vec3d(void)
Definition: Math.hpp:407

FW::Vec4d::Vec4d
FW_CUDA_FUNC Vec4d(const Vec4f &v)
Definition: Math.hpp:440

FW::Vec4i::Vec4i
FW_CUDA_FUNC Vec4i(const Vec2i &xy, const Vec2i &zw)
Definition: Math.hpp:285

FW::Mat4d::operator=
FW_CUDA_FUNC Mat4d & operator=(const MatrixBase< F64, 4, V > &v)
Definition: Math.hpp:769

FW::Mat2f::Mat2f
FW_CUDA_FUNC Mat2f(void)
Definition: Math.hpp:634

FW::fastMax
F32 fastMax(F32 a, F32 b)
Definition: Math.hpp:99

FW::Vec4d::getXYW
FW_CUDA_FUNC Vec3d getXYW(void) const
Definition: Math.hpp:450

FW::Mat2d::m01
F64 m01
Definition: Math.hpp:722

FW::Vec3i::fromPtr
static FW_CUDA_FUNC Vec3i fromPtr(const S32 *ptr)
Definition: Math.hpp:267

ptr
void ** ptr
Definition: DLLImports.cpp:74

FW::Vec2f::getPtr
FW_CUDA_FUNC const F32 * getPtr(void) const
Definition: Math.hpp:309

FW::Vec3d::Vec3d
FW_CUDA_FUNC Vec3d(const VectorBase< F64, 3, V > &v)
Definition: Math.hpp:424

FW::Vec2d::Vec2d
FW_CUDA_FUNC Vec2d(const Vec2i &v)
Definition: Math.hpp:385

FW::Mat4f::Mat4f
FW_CUDA_FUNC Mat4f(F32 a)
Definition: Math.hpp:680

FW::cos
FW_CUDA_FUNC F64 cos(F64 a)
Definition: Math.hpp:49

FW::Vec4d::getPtr
FW_CUDA_FUNC const F64 * getPtr(void) const
Definition: Math.hpp:442

FW::Vec2d::Vec2d
FW_CUDA_FUNC Vec2d(const VectorBase< F64, 2, V > &v)
Definition: Math.hpp:398

FW::tan
F32 tan(F32 a)
Definition: Math.hpp:94

FW::Vec3d::fromPtr
static FW_CUDA_FUNC Vec3d fromPtr(const F64 *ptr)
Definition: Math.hpp:416

FW::MatrixBase::det
FW_CUDA_FUNC T det(void) const
Definition: Math.hpp:946

FW::atan2
FW_CUDA_FUNC F32 atan2(F32 y, F32 x)
Definition: Math.hpp:58

FW::MatrixBase::col
FW_CUDA_FUNC Vector< T, L > & col(int c)
Definition: Math.hpp:527

FW::MatrixBase::transpose
FW_CUDA_FUNC void transpose(void)
Definition: Math.hpp:543

FW::Vector::Vector
FW_CUDA_FUNC Vector(T a)
Definition: Math.hpp:223

FW::MatrixBase::operator>>
FW_CUDA_FUNC S operator>>(const T &a) const
Definition: Math.hpp:574

FW::perpendicular
FW_CUDA_FUNC Vec2f perpendicular(const Vec2f &v)
Definition: Math.hpp:479

FW::Vec2d::Vec2d
FW_CUDA_FUNC Vec2d(F64 a)
Definition: Math.hpp:383

FW::MatrixBase::invert
FW_CUDA_FUNC void invert(void)
Definition: Math.hpp:544

FW::pow
FW_CUDA_FUNC F64 pow(F64 a, F64 b)
Definition: Math.hpp:45

FW::Mat2d::Mat2d
FW_CUDA_FUNC Mat2d(const Mat2f &a)
Definition: Math.hpp:708

FW::VectorBase::operator>>=
FW_CUDA_FUNC S & operator>>=(const T &a)
Definition: Math.hpp:167

FW::VectorBase::operator==
FW_CUDA_FUNC bool operator==(const VectorBase< T, L, V > &v) const
Definition: Math.hpp:213

FW::MatrixBase::operator^=
FW_CUDA_FUNC S & operator^=(const T &a)
Definition: Math.hpp:557

FW::sqr
FW_CUDA_FUNC T sqr(const T &a)
Definition: Math.hpp:113

FW::Vector::getPtr
FW_CUDA_FUNC const T * getPtr(void) const
Definition: Math.hpp:225

FW::Mat2f::Mat2f
FW_CUDA_FUNC Mat2f(const MatrixBase< F32, 2, V > &v)
Definition: Math.hpp:641

FW::U64
unsigned __int64 U64
Definition: Defs.hpp:97

FW::VectorBase::VectorBase
FW_CUDA_FUNC VectorBase(void)
Definition: Math.hpp:124

FW::Mat4f::m30
F32 m30
Definition: Math.hpp:696

FW::L
int L
Definition: Math.hpp:509

FW::F64
double F64
Definition: Defs.hpp:90

FW::Vec2f
Definition: Math.hpp:301

FW::Vec4f::toABGR
U32 toABGR(void) const
Definition: Math.cpp:45

FW::Mat2f::m01
F32 m01
Definition: Math.hpp:646

FW::Vec2d::operator=
FW_CUDA_FUNC Vec2d & operator=(const VectorBase< F64, 2, V > &v)
Definition: Math.hpp:399

FW::Mat4d::m30
F64 m30
Definition: Math.hpp:772

FW::VectorBase::toCartesian
FW_CUDA_FUNC Vector< T, L-1 > toCartesian(void) const
Definition: Math.hpp:152

FW::VectorBase::operator|=
FW_CUDA_FUNC S & operator|=(const T &a)
Definition: Math.hpp:164

FW::Mat4f::m10
F32 m10
Definition: Math.hpp:696

FW::Mat3d::getPtr
FW_CUDA_FUNC F64 * getPtr(void)
Definition: Math.hpp:735

FW::Vec3f::Vec3f
FW_CUDA_FUNC Vec3f(const Vec3i &v)
Definition: Math.hpp:331

FW::Vec2i::getPtr
FW_CUDA_FUNC const S32 * getPtr(void) const
Definition: Math.hpp:245

FW::Mat3f::rotation
static Mat3f rotation(const Vec3f &axis, F32 angle)
Definition: Math.cpp:96

FW::MatrixBase::MatrixBase
FW_CUDA_FUNC MatrixBase(void)
Definition: Math.hpp:512

FW::VectorBase::toHomogeneous
FW_CUDA_FUNC Vector< T, L+1 > toHomogeneous(void) const
Definition: Math.hpp:151

FW::floor
FW_CUDA_FUNC F32 floor(F32 a)
Definition: Math.hpp:59

FW::MatrixBase::scale
static FW_CUDA_FUNC S scale(const VectorBase< T, L-1, V > &v)

FW::Mat2d::getPtr
FW_CUDA_FUNC const F64 * getPtr(void) const
Definition: Math.hpp:711

FW::tan
FW_CUDA_FUNC F64 tan(F64 a)
Definition: Math.hpp:50

FW::Vec4f::getXYZ
FW_CUDA_FUNC Vec3f getXYZ(void) const
Definition: Math.hpp:365

FW::sqrt
FW_CUDA_FUNC F32 sqrt(F32 a)
Definition: Math.hpp:39

FW::Mat3d::Mat3d
FW_CUDA_FUNC Mat3d(const MatrixBase< F64, 3, V > &v)
Definition: Math.hpp:744

FW::Mat3f::Mat3f
FW_CUDA_FUNC Mat3f(const MatrixBase< F32, 3, V > &v)
Definition: Math.hpp:661

FW::Vec2f::cross
FW_CUDA_FUNC F32 cross(const Vec2f &v) const
Definition: Math.hpp:316

FW::Mat2f::m10
F32 m10
Definition: Math.hpp:645

FW::Vec2d::fromPtr
static FW_CUDA_FUNC Vec2d fromPtr(const F64 *ptr)
Definition: Math.hpp:390

FW::MatrixBase::operator==
FW_CUDA_FUNC bool operator==(const MatrixBase< T, L, V > &v) const
Definition: Math.hpp:606

FW_CUDA_FUNC
#define FW_CUDA_FUNC
Definition: Defs.hpp:74

FW::VectorBase::sprint
void sprint(char *vec, size_t s) const
Definition: Math.hpp:138

FW::Mat2d::Mat2d
FW_CUDA_FUNC Mat2d(void)
Definition: Math.hpp:707

FW::Mat2f::operator=
FW_CUDA_FUNC Mat2f & operator=(const MatrixBase< F32, 2, V > &v)
Definition: Math.hpp:642

FW::VectorBase::getPtr
FW_CUDA_FUNC T * getPtr(void)
Definition: Math.hpp:127

FW::Vec2d::cross
FW_CUDA_FUNC F64 cross(const Vec2d &v) const
Definition: Math.hpp:396

FW::Mat3d::m11
F64 m11
Definition: Math.hpp:749

FW::Vec3f::getXY
FW_CUDA_FUNC Vec2f getXY(void) const
Definition: Math.hpp:338

FW::atan
FW_CUDA_FUNC F64 atan(F64 a)
Definition: Math.hpp:56

FW::Vector
Definition: Math.hpp:119

FW::Mat4d::m00
F64 m00
Definition: Math.hpp:772

FW::Mat4d::m23
F64 m23
Definition: Math.hpp:775

FW::Mat3f::operator=
FW_CUDA_FUNC Mat3f & operator=(const MatrixBase< F32, 3, V > &v)
Definition: Math.hpp:662

FW::Vec4i::getPtr
FW_CUDA_FUNC const S32 * getPtr(void) const
Definition: Math.hpp:287

FW::MatrixBase::operator()
FW_CUDA_FUNC const T & operator()(int r, int c) const
Definition: Math.hpp:546

FW::VectorBase::lenSqr
FW_CUDA_FUNC T lenSqr(void) const
Definition: Math.hpp:142

FW::VectorBase::clamp
FW_CUDA_FUNC S clamp(const VectorBase< T, L, V > &lo, const VectorBase< T, L, W > &hi) const
Definition: Math.hpp:188

FW::MatrixBase::operator!=
FW_CUDA_FUNC bool operator!=(const MatrixBase< T, L, V > &v) const
Definition: Math.hpp:607

FW::Vec3d::Vec3d
FW_CUDA_FUNC Vec3d(F64 a)
Definition: Math.hpp:408

FW::MatrixBase::operator&=
FW_CUDA_FUNC S & operator&=(const T &a)
Definition: Math.hpp:555

FW::Vec4f
Definition: Math.hpp:348

FW::Mat3d::getPtr
FW_CUDA_FUNC const F64 * getPtr(void) const
Definition: Math.hpp:734

FW::dot
FW_CUDA_FUNC T dot(const VectorBase< T, L, S > &a, const VectorBase< T, L, V > &b)
Definition: Math.hpp:477

FW::Vec3i
Definition: Math.hpp:257

FW::Mat2d::m10
F64 m10
Definition: Math.hpp:721

FW::asin
FW_CUDA_FUNC F64 asin(F64 a)
Definition: Math.hpp:52

FW::Vec2f::perpendicular
FW_CUDA_FUNC Vec2f perpendicular(void) const
Definition: Math.hpp:315

x
CUdevice int ordinal char int CUdevice dev CUdevprop CUdevice dev CUcontext ctx CUcontext ctx CUcontext pctx CUmodule const void image CUmodule const void fatCubin CUfunction CUmodule const char name void p CUfunction unsigned int bytes CUtexref pTexRef CUtexref CUarray unsigned int Flags CUtexref int CUaddress_mode am CUtexref unsigned int Flags CUaddress_mode CUtexref int dim CUarray_format int CUtexref hTexRef CUfunction unsigned int numbytes CUfunction int float value CUfunction int CUtexref hTexRef CUfunction int int grid_height CUevent unsigned int Flags CUevent hEvent CUevent hEvent CUstream unsigned int Flags CUstream hStream GLuint bufferobj unsigned int CUdevice dev CUdeviceptr unsigned int CUmodule const char name CUdeviceptr unsigned int bytesize CUdeviceptr dptr void unsigned int bytesize void CUdeviceptr unsigned int ByteCount CUarray unsigned int CUdeviceptr unsigned int ByteCount CUarray unsigned int const void unsigned int ByteCount CUarray unsigned int CUarray unsigned int unsigned int ByteCount void CUarray unsigned int unsigned int CUstream hStream const CUDA_MEMCPY2D pCopy CUdeviceptr const void unsigned int CUstream hStream const CUDA_MEMCPY2D CUstream hStream CUdeviceptr unsigned char unsigned int N CUdeviceptr unsigned int unsigned int N CUdeviceptr unsigned int unsigned short unsigned int unsigned int Height CUarray const CUDA_ARRAY_DESCRIPTOR pAllocateArray CUarray const CUDA_ARRAY3D_DESCRIPTOR pAllocateArray unsigned int CUtexref CUdeviceptr unsigned int bytes CUcontext unsigned int CUdevice device GLenum texture GLenum GLuint buffer GLenum GLuint renderbuffer GLenum GLsizeiptr const GLvoid GLenum usage GLuint shader GLenum type GLsizei const GLuint framebuffers GLsizei const GLuint renderbuffers GLuint v GLuint v GLenum GLenum GLenum GLuint GLint level GLsizei GLuint framebuffers GLuint const GLchar name GLenum GLintptr GLsizeiptr GLvoid data GLuint GLenum GLint param GLuint GLenum GLint param GLhandleARB programObj GLenum GLenum GLsizei 
GLsizei height GLenum GLint GLint GLsizei GLsizei GLsizei GLint GLenum GLenum const GLvoid pixels GLint GLsizei const GLfloat value GLint GLfloat GLfloat v1 GLint GLfloat GLfloat GLfloat v2 GLint GLsizei const GLfloat value GLint GLsizei GLboolean const GLfloat value GLuint program GLuint GLfloat x
Definition: DLLImports.inl:363

FW::MatrixBase::set
FW_CUDA_FUNC void set(const MatrixBase< T, L, V > &v)
Definition: Math.hpp:578

FW::Mat3d::Mat3d
FW_CUDA_FUNC Mat3d(void)
Definition: Math.hpp:730

FW::Vec3i::getXY
FW_CUDA_FUNC Vec2i getXY(void) const
Definition: Math.hpp:269

FW::Mat3f::m22
F32 m22
Definition: Math.hpp:671

FW::Mat4f::m02
F32 m02
Definition: Math.hpp:698

FW::MatrixBase::print
void print(void) const
Definition: Math.hpp:892

FW::Vec4i::Vec4i
FW_CUDA_FUNC Vec4i(const Vec2i &xy, S32 zz, S32 ww)
Definition: Math.hpp:283

FW::Vec2d::Vec2d
FW_CUDA_FUNC Vec2d(F64 xx, F64 yy)
Definition: Math.hpp:384

FW::Mat4d::m22
F64 m22
Definition: Math.hpp:774

FW::Mat2d::m11
F64 m11
Definition: Math.hpp:722

FW::Vec4d::Vec4d
FW_CUDA_FUNC Vec4d(void)
Definition: Math.hpp:433

FW::VectorBase::operator+
FW_CUDA_FUNC S operator+(void) const
Definition: Math.hpp:169

FW::MatrixBase::set
FW_CUDA_FUNC void set(const T &a)
Definition: Math.hpp:531

FW::Mat4d::Mat4d
FW_CUDA_FUNC Mat4d(F64 a)
Definition: Math.hpp:760

FW::Vec3d::getXY
FW_CUDA_FUNC Vec2d getXY(void) const
Definition: Math.hpp:420

FW::Mat4f::getPtr
FW_CUDA_FUNC const F32 * getPtr(void) const
Definition: Math.hpp:682

FW::VectorBase::abs
FW_CUDA_FUNC S abs(void) const
Definition: Math.hpp:149

FW::Mat3d::m22
F64 m22
Definition: Math.hpp:750

z
CUdevice int ordinal char int CUdevice dev CUdevprop CUdevice dev CUcontext ctx CUcontext ctx CUcontext pctx CUmodule const void image CUmodule const void fatCubin CUfunction CUmodule const char name void p CUfunction unsigned int bytes CUtexref pTexRef CUtexref CUarray unsigned int Flags CUtexref int CUaddress_mode am CUtexref unsigned int Flags CUaddress_mode CUtexref int dim CUarray_format int CUtexref hTexRef CUfunction unsigned int numbytes CUfunction int float value CUfunction int CUtexref hTexRef CUfunction int int grid_height CUevent unsigned int Flags CUevent hEvent CUevent hEvent CUstream unsigned int Flags CUstream hStream GLuint bufferobj unsigned int CUdevice dev CUdeviceptr unsigned int CUmodule const char name CUdeviceptr unsigned int bytesize CUdeviceptr dptr void unsigned int bytesize void CUdeviceptr unsigned int ByteCount CUarray unsigned int CUdeviceptr unsigned int ByteCount CUarray unsigned int const void unsigned int ByteCount CUarray unsigned int CUarray unsigned int unsigned int ByteCount void CUarray unsigned int unsigned int CUstream hStream const CUDA_MEMCPY2D pCopy CUdeviceptr const void unsigned int CUstream hStream const CUDA_MEMCPY2D CUstream hStream CUdeviceptr unsigned char unsigned int N CUdeviceptr unsigned int unsigned int N CUdeviceptr unsigned int unsigned short unsigned int unsigned int Height CUarray const CUDA_ARRAY_DESCRIPTOR pAllocateArray CUarray const CUDA_ARRAY3D_DESCRIPTOR pAllocateArray unsigned int CUtexref CUdeviceptr unsigned int bytes CUcontext unsigned int CUdevice device GLenum texture GLenum GLuint buffer GLenum GLuint renderbuffer GLenum GLsizeiptr const GLvoid GLenum usage GLuint shader GLenum type GLsizei const GLuint framebuffers GLsizei const GLuint renderbuffers GLuint v GLuint v GLenum GLenum GLenum GLuint GLint level GLsizei GLuint framebuffers GLuint const GLchar name GLenum GLintptr GLsizeiptr GLvoid data GLuint GLenum GLint param GLuint GLenum GLint param GLhandleARB programObj GLenum GLenum GLsizei 
GLsizei height GLenum GLint GLint GLsizei GLsizei GLsizei GLint GLenum GLenum const GLvoid pixels GLint GLsizei const GLfloat value GLint GLfloat GLfloat v1 GLint GLfloat GLfloat GLfloat v2 GLint GLsizei const GLfloat value GLint GLsizei GLboolean const GLfloat value GLuint program GLuint GLfloat GLfloat GLfloat z
Definition: DLLImports.inl:363

FW::VectorBase::isZero
FW_CUDA_FUNC bool isZero(void) const
Definition: Math.hpp:141

FW::VectorBase::get
FW_CUDA_FUNC const T & get(int idx) const
Definition: Math.hpp:128

FW::Vec4f::Vec4f
FW_CUDA_FUNC Vec4f(const VectorBase< F32, 4, V > &v)
Definition: Math.hpp:373

FW::VectorBase::operator*=
FW_CUDA_FUNC S & operator*=(const T &a)
Definition: Math.hpp:160

FW::Mat3d::m12
F64 m12
Definition: Math.hpp:750

FW::sin
F32 sin(F32 a)
Definition: Math.hpp:92

FW::Vec3i::Vec3i
FW_CUDA_FUNC Vec3i(S32 xx, S32 yy, S32 zz)
Definition: Math.hpp:262

FW::Mat4f::m23
F32 m23
Definition: Math.hpp:699

FW::VectorBase::operator%
FW_CUDA_FUNC S operator%(const T &a) const
Definition: Math.hpp:177

FW::Vec3i::getPtr
FW_CUDA_FUNC S32 * getPtr(void)
Definition: Math.hpp:266

FW::MatrixBase::operator~
FW_CUDA_FUNC S operator~(void) const
Definition: Math.hpp:563

FW::VectorBase::dot
FW_CUDA_FUNC T dot(const VectorBase< T, L, V > &v) const
Definition: Math.hpp:185

FW::Mat3d::Mat3d
FW_CUDA_FUNC Mat3d(const Mat3f &a)
Definition: Math.hpp:731

FW::sum
FW_CUDA_FUNC T sum(const VectorBase< T, L, S > &v)
Definition: Math.hpp:463

FW::popc16
FW_CUDA_FUNC int popc16(U32 mask)
Definition: Math.hpp:824

FW::operator/
FW_CUDA_FUNC S operator/(const T &a, const VectorBase< T, L, S > &b)
Definition: Math.hpp:469

FW::F32
float F32
Definition: Defs.hpp:89

FW::Vector::Vector
FW_CUDA_FUNC Vector(const VectorBase< T, L, V > &v)
Definition: Math.hpp:229

y
CUdevice int ordinal char int CUdevice dev CUdevprop CUdevice dev CUcontext ctx CUcontext ctx CUcontext pctx CUmodule const void image CUmodule const void fatCubin CUfunction CUmodule const char name void p CUfunction unsigned int bytes CUtexref pTexRef CUtexref CUarray unsigned int Flags CUtexref int CUaddress_mode am CUtexref unsigned int Flags CUaddress_mode CUtexref int dim CUarray_format int CUtexref hTexRef CUfunction unsigned int numbytes CUfunction int float value CUfunction int CUtexref hTexRef CUfunction int int grid_height CUevent unsigned int Flags CUevent hEvent CUevent hEvent CUstream unsigned int Flags CUstream hStream GLuint bufferobj unsigned int CUdevice dev CUdeviceptr unsigned int CUmodule const char name CUdeviceptr unsigned int bytesize CUdeviceptr dptr void unsigned int bytesize void CUdeviceptr unsigned int ByteCount CUarray unsigned int CUdeviceptr unsigned int ByteCount CUarray unsigned int const void unsigned int ByteCount CUarray unsigned int CUarray unsigned int unsigned int ByteCount void CUarray unsigned int unsigned int CUstream hStream const CUDA_MEMCPY2D pCopy CUdeviceptr const void unsigned int CUstream hStream const CUDA_MEMCPY2D CUstream hStream CUdeviceptr unsigned char unsigned int N CUdeviceptr unsigned int unsigned int N CUdeviceptr unsigned int unsigned short unsigned int unsigned int Height CUarray const CUDA_ARRAY_DESCRIPTOR pAllocateArray CUarray const CUDA_ARRAY3D_DESCRIPTOR pAllocateArray unsigned int CUtexref CUdeviceptr unsigned int bytes CUcontext unsigned int CUdevice device GLenum texture GLenum GLuint buffer GLenum GLuint renderbuffer GLenum GLsizeiptr const GLvoid GLenum usage GLuint shader GLenum type GLsizei const GLuint framebuffers GLsizei const GLuint renderbuffers GLuint v GLuint v GLenum GLenum GLenum GLuint GLint level GLsizei GLuint framebuffers GLuint const GLchar name GLenum GLintptr GLsizeiptr GLvoid data GLuint GLenum GLint param GLuint GLenum GLint param GLhandleARB programObj GLenum GLenum GLsizei 
GLsizei height GLenum GLint GLint GLsizei GLsizei GLsizei GLint GLenum GLenum const GLvoid pixels GLint GLsizei const GLfloat value GLint GLfloat GLfloat v1 GLint GLfloat GLfloat GLfloat v2 GLint GLsizei const GLfloat value GLint GLsizei GLboolean const GLfloat value GLuint program GLuint GLfloat GLfloat y
Definition: DLLImports.inl:363

FW::Mat3d
Definition: Math.hpp:727

FW::Vec3f::Vec3f
FW_CUDA_FUNC Vec3f(const Vec2f &xy, F32 zz)
Definition: Math.hpp:330

FW::Mat4f::m12
F32 m12
Definition: Math.hpp:698

FW::VectorBase::operator>>
FW_CUDA_FUNC S operator>>(const T &a) const
Definition: Math.hpp:182

FW::operator^
FW_CUDA_FUNC S operator^(const T &a, const VectorBase< T, L, S > &b)
Definition: Math.hpp:473

FW::VectorBase::max
FW_CUDA_FUNC S max(const VectorBase< T, L, V > &v) const
Definition: Math.hpp:187

FW::Mat4d::Mat4d
FW_CUDA_FUNC Mat4d(void)
Definition: Math.hpp:758

FW::Vec3i::Vec3i
FW_CUDA_FUNC Vec3i(S32 a)
Definition: Math.hpp:261

FW::Vec2d::getPtr
FW_CUDA_FUNC const F64 * getPtr(void) const
Definition: Math.hpp:388

FW::Mat4f::operator=
FW_CUDA_FUNC Mat4f & operator=(const MatrixBase< F32, 4, V > &v)
Definition: Math.hpp:693

FW::Mat3d::fromPtr
static FW_CUDA_FUNC Mat3d fromPtr(const F64 *ptr)
Definition: Math.hpp:736

FW::MatrixBase::operator^
FW_CUDA_FUNC S operator^(const T &a) const
Definition: Math.hpp:572

FW::MatrixBase::translate
static FW_CUDA_FUNC S translate(const VectorBase< T, L-1, V > &v)

FW::Vec3f::Vec3f
FW_CUDA_FUNC Vec3f(const VectorBase< F32, 3, V > &v)
Definition: Math.hpp:342

FW::invert
FW_CUDA_FUNC S invert(const MatrixBase< T, L, S > &v)
Definition: Math.hpp:784

FW::VectorBase::min
FW_CUDA_FUNC S min(const VectorBase< T, L, V > &v) const
Definition: Math.hpp:186

FW::log2
F32 log2(F32 a)
Definition: Math.hpp:90

v
CUdevice int ordinal char int CUdevice dev CUdevprop CUdevice dev CUcontext ctx CUcontext ctx CUcontext pctx CUmodule const void image CUmodule const void fatCubin CUfunction CUmodule const char name void p CUfunction unsigned int bytes CUtexref pTexRef CUtexref CUarray unsigned int Flags CUtexref int CUaddress_mode am CUtexref unsigned int Flags CUaddress_mode CUtexref int dim CUarray_format int CUtexref hTexRef CUfunction unsigned int numbytes CUfunction int float value CUfunction int CUtexref hTexRef CUfunction int int grid_height CUevent unsigned int Flags CUevent hEvent CUevent hEvent CUstream unsigned int Flags CUstream hStream GLuint bufferobj unsigned int CUdevice dev CUdeviceptr unsigned int CUmodule const char name CUdeviceptr unsigned int bytesize CUdeviceptr dptr void unsigned int bytesize void CUdeviceptr unsigned int ByteCount CUarray unsigned int CUdeviceptr unsigned int ByteCount CUarray unsigned int const void unsigned int ByteCount CUarray unsigned int CUarray unsigned int unsigned int ByteCount void CUarray unsigned int unsigned int CUstream hStream const CUDA_MEMCPY2D pCopy CUdeviceptr const void unsigned int CUstream hStream const CUDA_MEMCPY2D CUstream hStream CUdeviceptr unsigned char unsigned int N CUdeviceptr unsigned int unsigned int N CUdeviceptr unsigned int unsigned short unsigned int unsigned int Height CUarray const CUDA_ARRAY_DESCRIPTOR pAllocateArray CUarray const CUDA_ARRAY3D_DESCRIPTOR pAllocateArray unsigned int CUtexref CUdeviceptr unsigned int bytes CUcontext unsigned int CUdevice device GLenum texture GLenum GLuint buffer GLenum GLuint renderbuffer GLenum GLsizeiptr const GLvoid GLenum usage GLuint shader GLenum type GLsizei const GLuint framebuffers GLsizei const GLuint renderbuffers GLuint v
Definition: DLLImports.inl:329

FW::pow
F32 pow(F32 a, F32 b)
Definition: Math.hpp:85

FW::Mat4d::getPtr
FW_CUDA_FUNC F64 * getPtr(void)
Definition: Math.hpp:763

FW::Vec2i::Vec2i
FW_CUDA_FUNC Vec2i(const VectorBase< S32, 2, V > &v)
Definition: Math.hpp:251

FW::Vec3f::Vec3f
FW_CUDA_FUNC Vec3f(F32 xx, F32 yy, F32 zz)
Definition: Math.hpp:329

FW::Mat3f::m02
F32 m02
Definition: Math.hpp:671

FW::Vec4i::Vec4i
FW_CUDA_FUNC Vec4i(S32 a)
Definition: Math.hpp:281

FW::Vec3d::operator=
FW_CUDA_FUNC Vec3d & operator=(const VectorBase< F64, 3, V > &v)
Definition: Math.hpp:425

FW::VectorBase
Definition: Math.hpp:121

FW::MatrixBase::operator=
FW_CUDA_FUNC S & operator=(const T &a)
Definition: Math.hpp:549

FW::bitsToDouble
FW_CUDA_FUNC F64 bitsToDouble(U64 a)
Definition: Math.hpp:64

FW::Mat2f::fromPtr
static FW_CUDA_FUNC Mat2f fromPtr(const F32 *ptr)
Definition: Math.hpp:639

FW::VectorBase::getPtr
FW_CUDA_FUNC const T * getPtr(void) const
Definition: Math.hpp:126

FW::VectorBase::operator/
FW_CUDA_FUNC S operator/(const T &a) const
Definition: Math.hpp:176

FW::VectorBase::operator<<=
FW_CUDA_FUNC S & operator<<=(const T &a)
Definition: Math.hpp:166

FW::Vec4i::getPtr
FW_CUDA_FUNC S32 * getPtr(void)
Definition: Math.hpp:288

FW::Mat4f::perspective
static Mat4f perspective(F32 fov, F32 nearDist, F32 farDist)
Definition: Math.cpp:79

FW::Vec4f::Vec4f
FW_CUDA_FUNC Vec4f(F32 xx, F32 yy, F32 zz, F32 ww)
Definition: Math.hpp:353

FW::Vec3d::Vec3d
FW_CUDA_FUNC Vec3d(const Vec3f &v)
Definition: Math.hpp:412

FW::Mat4f::m22
F32 m22
Definition: Math.hpp:698

FW::min
FW_CUDA_FUNC T min(const VectorBase< T, L, S > &v)
Definition: Math.hpp:461

FW::Mat4d::m01
F64 m01
Definition: Math.hpp:773

FW::MatrixBase::transposed
FW_CUDA_FUNC S transposed(void) const
Definition: Math.hpp:953

FW::max
FW_CUDA_FUNC T max(const VectorBase< T, L, S > &v)
Definition: Math.hpp:462

FW::Vec3d::cross
FW_CUDA_FUNC Vec3d cross(const Vec3d &v) const
Definition: Math.hpp:422

FW::Vec4f::Vec4f
FW_CUDA_FUNC Vec4f(F32 a)
Definition: Math.hpp:352

FW::VectorBase::operator&=
FW_CUDA_FUNC S & operator&=(const T &a)
Definition: Math.hpp:163

FW::MatrixBase::get
FW_CUDA_FUNC const T & get(int idx) const
Definition: Math.hpp:520

FW::Mat2f
Definition: Math.hpp:631

FW::Mat4d::m33
F64 m33
Definition: Math.hpp:775

FW::abs
FW_CUDA_FUNC S32 abs(S32 a)
Definition: Math.hpp:41

FW::MatrixBase::operator*
FW_CUDA_FUNC S operator*(const T &a) const
Definition: Math.hpp:567

FW::MatrixBase::operator<<=
FW_CUDA_FUNC S & operator<<=(const T &a)
Definition: Math.hpp:558

FW::MatrixBase::set
FW_CUDA_FUNC T set(int r, int c, const T &a)
Definition: Math.hpp:525

FW_ASSERT
#define FW_ASSERT(X)
Definition: Defs.hpp:67

FW::VectorBase::operator%=
FW_CUDA_FUNC S & operator%=(const T &a)
Definition: Math.hpp:162

FW::Vector::getPtr
FW_CUDA_FUNC T * getPtr(void)
Definition: Math.hpp:226

FW::fastClamp
FW_CUDA_FUNC F32 fastClamp(F32 v, F32 lo, F32 hi)
Definition: Math.hpp:110

FW::Vec3f::cross
FW_CUDA_FUNC Vec3f cross(const Vec3f &v) const
Definition: Math.hpp:340

FW::S32
signed int S32
Definition: Defs.hpp:88

FW::Vec4f::fromPtr
static FW_CUDA_FUNC Vec4f fromPtr(const F32 *ptr)
Definition: Math.hpp:361

FW::VectorBase::operator^=
FW_CUDA_FUNC S & operator^=(const T &a)
Definition: Math.hpp:165

FW::VectorBase::set
FW_CUDA_FUNC T set(int idx, const T &a)
Definition: Math.hpp:130

FW::asin
FW_CUDA_FUNC F32 asin(F32 a)
Definition: Math.hpp:51

FW::MINMAX
MINMAX(Vec2i) MINMAX(Vec3i) MINMAX(Vec4i) MINMAX(Vec2f) MINMAX(Vec3f) MINMAX(Vec4f) MINMAX(Vec2d) MINMAX(Vec3d) MINMAX(Vec4d) template< class T

FW::Vec4i::Vec4i
FW_CUDA_FUNC Vec4i(S32 xx, S32 yy, S32 zz, S32 ww)
Definition: Math.hpp:282

FW::Vec3d::getPtr
FW_CUDA_FUNC const F64 * getPtr(void) const
Definition: Math.hpp:414

FW::Vec3i::getPtr
FW_CUDA_FUNC const S32 * getPtr(void) const
Definition: Math.hpp:265

FW::Vec4i::getXY
FW_CUDA_FUNC Vec2i getXY(void) const
Definition: Math.hpp:291

FW::VectorBase::operator^
FW_CUDA_FUNC S operator^(const T &a) const
Definition: Math.hpp:180

FW_CUDA_CONST
#define FW_CUDA_CONST
Definition: Defs.hpp:75

FW::Vec3f::getPtr
FW_CUDA_FUNC F32 * getPtr(void)
Definition: Math.hpp:334

FW::Mat3d::m10
F64 m10
Definition: Math.hpp:748

FW::VectorBase::setZero
FW_CUDA_FUNC void setZero(void)
Definition: Math.hpp:134

FW::Vec4f::getPtr
FW_CUDA_FUNC F32 * getPtr(void)
Definition: Math.hpp:360

FW::Vec4d::Vec4d
FW_CUDA_FUNC Vec4d(F64 xx, F64 yy, F64 zz, F64 ww)
Definition: Math.hpp:435

FW::Matrix::getPtr
FW_CUDA_FUNC T * getPtr(void)
Definition: Math.hpp:619

FW::Mat4d::m03
F64 m03
Definition: Math.hpp:775

FW::acos
FW_CUDA_FUNC F64 acos(F64 a)
Definition: Math.hpp:54

FW::Vec2f::Vec2f
FW_CUDA_FUNC Vec2f(const VectorBase< F32, 2, V > &v)
Definition: Math.hpp:318

FW::Mat4f::m03
F32 m03
Definition: Math.hpp:699

FW::MatrixBase::inverted
FW_CUDA_FUNC S inverted(void) const
Definition: Math.hpp:964

FW::ceil
FW_CUDA_FUNC F32 ceil(F32 a)
Definition: Math.hpp:61

FW::rcp
FW_CUDA_FUNC T rcp(const T &a)
Definition: Math.hpp:114

FW::MatrixBase
Definition: Math.hpp:509

FW::Vec2d::Vec2d
FW_CUDA_FUNC Vec2d(const Vec2f &v)
Definition: Math.hpp:386

FW::Mat4d::fromPtr
static FW_CUDA_FUNC Mat4d fromPtr(const F64 *ptr)
Definition: Math.hpp:764

FW::Mat3d::m21
F64 m21
Definition: Math.hpp:749

FW::MatrixBase::col
FW_CUDA_FUNC const Vector< T, L > & col(int c) const
Definition: Math.hpp:526

len
CUdevice int ordinal char int len
Definition: DLLImports.inl:48

FW::Vec2i::getPtr
FW_CUDA_FUNC S32 * getPtr(void)
Definition: Math.hpp:246

FW::Mat4f::fitToView
static Mat4f fitToView(const Vec2f &pos, const Vec2f &size, const Vec2f &viewSize)
Definition: Math.cpp:66

FW::Vec2f::Vec2f
FW_CUDA_FUNC Vec2f(void)
Definition: Math.hpp:304

FW::Mat4f::m31
F32 m31
Definition: Math.hpp:697

FW::VectorBase::operator-=
FW_CUDA_FUNC S & operator-=(const T &a)
Definition: Math.hpp:159

FW::Vec2i::fromPtr
static FW_CUDA_FUNC Vec2i fromPtr(const S32 *ptr)
Definition: Math.hpp:247

FW::Vec3f::getPtr
FW_CUDA_FUNC const F32 * getPtr(void) const
Definition: Math.hpp:333

FW::VectorBase::operator+=
FW_CUDA_FUNC S & operator+=(const T &a)
Definition: Math.hpp:158

FW::Vec4f::Vec4f
FW_CUDA_FUNC Vec4f(const Vec4i &v)
Definition: Math.hpp:357

FW::Vec3f::fromPtr
static FW_CUDA_FUNC Vec3f fromPtr(const F32 *ptr)
Definition: Math.hpp:335

FW::doubleToBits
FW_CUDA_FUNC U64 doubleToBits(F64 a)
Definition: Math.hpp:63

FW::Mat3f::m01
F32 m01
Definition: Math.hpp:670

FW::Mat4f
Definition: Math.hpp:676

FW::Mat4f::m11
F32 m11
Definition: Math.hpp:697

FW::S64
signed __int64 S64
Definition: Defs.hpp:98

FW::popc8
FW_CUDA_FUNC int popc8(U32 mask)
Definition: Math.hpp:819

FW::exp2
F32 exp2(F32 a)
Definition: Math.hpp:87

FW::MatrixBase::operator-=
FW_CUDA_FUNC S & operator-=(const T &a)
Definition: Math.hpp:551

FW::VectorBase::operator<<
FW_CUDA_FUNC S operator<<(const T &a) const
Definition: Math.hpp:181

FW::Vec4f::Vec4f
FW_CUDA_FUNC Vec4f(const Vec2f &xy, F32 zz, F32 ww)
Definition: Math.hpp:354

FW::MatrixBase::operator*=
FW_CUDA_FUNC S & operator*=(const T &a)
Definition: Math.hpp:552

FW::exp
F32 exp(F32 a)
Definition: Math.hpp:86

FW::Mat3f::getPtr
FW_CUDA_FUNC const F32 * getPtr(void) const
Definition: Math.hpp:657

FW::U32
unsigned int U32
Definition: Defs.hpp:85

FW::Vec4f::Vec4f
FW_CUDA_FUNC Vec4f(void)
Definition: Math.hpp:351

FW::Mat4f::Mat4f
FW_CUDA_FUNC Mat4f(const MatrixBase< F32, 4, V > &v)
Definition: Math.hpp:692

FW::Matrix::Matrix
FW_CUDA_FUNC Matrix(const MatrixBase< T, L, V > &v)
Definition: Math.hpp:622

FW::cos
F32 cos(F32 a)
Definition: Math.hpp:93

FW::Matrix::operator=
FW_CUDA_FUNC Matrix & operator=(const MatrixBase< T, L, V > &v)
Definition: Math.hpp:623

FW::Vec4d::Vec4d
FW_CUDA_FUNC Vec4d(const Vec2d &xy, const Vec2d &zw)
Definition: Math.hpp:438

FW::Vec2f::Vec2f
FW_CUDA_FUNC Vec2f(const Vec2i &v)
Definition: Math.hpp:307

FW::Mat3f::m20
F32 m20
Definition: Math.hpp:669

FW::Mat4f::fromPtr
static FW_CUDA_FUNC Mat4f fromPtr(const F32 *ptr)
Definition: Math.hpp:684

FW::Vec2d
Definition: Math.hpp:379

FW::operator>>
FW_CUDA_FUNC S operator>>(const T &a, const VectorBase< T, L, S > &b)
Definition: Math.hpp:475

FW::operator|
FW_CUDA_FUNC S operator|(const T &a, const VectorBase< T, L, S > &b)
Definition: Math.hpp:472

FW::MatrixBase::getRow
FW_CUDA_FUNC Vector< T, L > getRow(int r) const
Definition: Math.hpp:881

FW::MatrixBase::setIdentity
FW_CUDA_FUNC void setIdentity(void)
Definition: Math.hpp:534

FW::popc32
FW_CUDA_FUNC int popc32(U32 mask)
Definition: Math.hpp:829

FW::Mat3d::m01
F64 m01
Definition: Math.hpp:749

FW::Vec4i::Vec4i
FW_CUDA_FUNC Vec4i(void)
Definition: Math.hpp:280

FW::MatrixBase::operator+=
FW_CUDA_FUNC S & operator+=(const T &a)
Definition: Math.hpp:550

FW::VectorBase::normalize
FW_CUDA_FUNC void normalize(T len=(T) 1)
Definition: Math.hpp:145

FW::operator-
FW_CUDA_FUNC S operator-(const T &a, const VectorBase< T, L, S > &b)
Definition: Math.hpp:467

FW::Mat4d::m10
F64 m10
Definition: Math.hpp:772

FW::bitsToFloat
F32 bitsToFloat(U32 a)
Definition: Math.hpp:96

f
CUdevice int ordinal char int CUdevice dev CUdevprop CUdevice dev CUcontext ctx CUcontext ctx CUcontext pctx CUmodule const void image CUmodule const void fatCubin CUfunction CUmodule const char name void p CUfunction unsigned int bytes CUtexref pTexRef CUtexref CUarray unsigned int Flags CUtexref int CUaddress_mode am CUtexref unsigned int Flags CUaddress_mode CUtexref int dim CUarray_format int CUtexref hTexRef CUfunction unsigned int numbytes CUfunction int float value CUfunction int CUtexref hTexRef CUfunction f
Definition: DLLImports.inl:88

FW::Vec2d::getPtr
FW_CUDA_FUNC F64 * getPtr(void)
Definition: Math.hpp:389

FW::Mat4d::m20
F64 m20
Definition: Math.hpp:772

FW::cross
FW_CUDA_FUNC F32 cross(const Vec2f &a, const Vec2f &b)
Definition: Math.hpp:481

FW::Vec3f
Definition: Math.hpp:324

FW::Vec4d::getXY
FW_CUDA_FUNC Vec2d getXY(void) const
Definition: Math.hpp:448

FW::Mat2d::fromPtr
static FW_CUDA_FUNC Mat2d fromPtr(const F64 *ptr)
Definition: Math.hpp:713

FW::Mat3d::Mat3d
FW_CUDA_FUNC Mat3d(F64 a)
Definition: Math.hpp:732

FW::sqrt
FW_CUDA_FUNC F64 sqrt(F64 a)
Definition: Math.hpp:40

FW::Mat3f::m21
F32 m21
Definition: Math.hpp:670

FW::Mat2d::operator=
FW_CUDA_FUNC Mat2d & operator=(const MatrixBase< F64, 2, V > &v)
Definition: Math.hpp:718

FW::Vec4f::operator=
FW_CUDA_FUNC Vec4f & operator=(const VectorBase< F32, 4, V > &v)
Definition: Math.hpp:374

FW::Mat4d::Mat4d
FW_CUDA_FUNC Mat4d(const MatrixBase< F64, 4, V > &v)
Definition: Math.hpp:768

FW::Vec2d::Vec2d
FW_CUDA_FUNC Vec2d(void)
Definition: Math.hpp:382

FW::floor
FW_CUDA_FUNC F64 floor(F64 a)
Definition: Math.hpp:60

FW::Vec4d::getXYZ
FW_CUDA_FUNC Vec3d getXYZ(void) const
Definition: Math.hpp:449

FW::Vec3d::getPtr
FW_CUDA_FUNC F64 * getPtr(void)
Definition: Math.hpp:415

FW::printf
void printf(const char *fmt,...)
Definition: Defs.cpp:225

FW::Mat4d::m32
F64 m32
Definition: Math.hpp:774

FW::Vec2i::Vec2i
FW_CUDA_FUNC Vec2i(S32 a)
Definition: Math.hpp:242

FW::Matrix
Definition: Math.hpp:612

FW::VectorBase::operator-
FW_CUDA_FUNC S operator-(void) const
Definition: Math.hpp:170

FW::normalize
FW_CUDA_FUNC S normalize(const VectorBase< T, L, S > &v, T len=(T) 1)
Definition: Math.hpp:460

FW::fastMin
F32 fastMin(F32 a, F32 b)
Definition: Math.hpp:98

FW::ceil
FW_CUDA_FUNC F64 ceil(F64 a)
Definition: Math.hpp:62

FW::Matrix::getPtr
FW_CUDA_FUNC const T * getPtr(void) const
Definition: Math.hpp:618

FW::Mat2f::getPtr
FW_CUDA_FUNC F32 * getPtr(void)
Definition: Math.hpp:638

FW::VectorBase::operator!=
FW_CUDA_FUNC bool operator!=(const VectorBase< T, L, V > &v) const
Definition: Math.hpp:214

FW::VectorBase::sum
FW_CUDA_FUNC T sum(void) const
Definition: Math.hpp:148

FW::Mat2d::Mat2d
FW_CUDA_FUNC Mat2d(F64 a)
Definition: Math.hpp:709

DLLImports.hpp

FW::log
FW_CUDA_FUNC F64 log(F64 a)
Definition: Math.hpp:47

FW::VectorBase::operator[]
FW_CUDA_FUNC const T & operator[](int idx) const
Definition: Math.hpp:154

FW::MatrixBase::getCol
FW_CUDA_FUNC const Vector< T, L > & getCol(int c) const
Definition: Math.hpp:528

FW::VectorBase::operator/=
FW_CUDA_FUNC S & operator/=(const T &a)
Definition: Math.hpp:161

FW::Vec4d
Definition: Math.hpp:430

FW::outerProduct
FW_CUDA_FUNC Matrix< T, L > outerProduct(const VectorBase< T, L, S > &a, const VectorBase< T, L, S > &b)
Definition: Math.hpp:1051

FW::Vector::fromPtr
static FW_CUDA_FUNC Vector fromPtr(const T *ptr)
Definition: Math.hpp:227

FW::Mat3d::rotation
static Mat3d rotation(const Vec3d &axis, F64 angle)
Definition: Math.cpp:107

FW::Vec2f::Vec2f
FW_CUDA_FUNC Vec2f(F32 xx, F32 yy)
Definition: Math.hpp:306

FW::Mat2f::m00
F32 m00
Definition: Math.hpp:645

FW::Vec2i::perpendicular
FW_CUDA_FUNC Vec2i perpendicular(void) const
Definition: Math.hpp:249

FW::Vec4f::getXYW
FW_CUDA_FUNC Vec3f getXYW(void) const
Definition: Math.hpp:366

FW::VectorBase::normalized
FW_CUDA_FUNC S normalized(T len=(T) 1) const
Definition: Math.hpp:144

FW::Vec4i::Vec4i
FW_CUDA_FUNC Vec4i(const VectorBase< S32, 4, V > &v)
Definition: Math.hpp:295

FW::Vec2f::getPtr
FW_CUDA_FUNC F32 * getPtr(void)
Definition: Math.hpp:310

FW::Mat4f::m13
F32 m13
Definition: Math.hpp:699

FW::Vec3i::Vec3i
FW_CUDA_FUNC Vec3i(void)
Definition: Math.hpp:260

FW::atan
FW_CUDA_FUNC F32 atan(F32 a)
Definition: Math.hpp:55

FW::MatrixBase::setZero
FW_CUDA_FUNC void setZero(void)
Definition: Math.hpp:533

FW::VectorBase::operator&
FW_CUDA_FUNC S operator&(const T &a) const
Definition: Math.hpp:178

FW::Vec4f::fromABGR
static Vec4f fromABGR(U32 abgr)
Definition: Math.cpp:34

FW::Mat2f::Mat2f
FW_CUDA_FUNC Mat2f(F32 a)
Definition: Math.hpp:635

FW::sin
FW_CUDA_FUNC F64 sin(F64 a)
Definition: Math.hpp:48

FW::Vec3i::Vec3i
FW_CUDA_FUNC Vec3i(const VectorBase< S32, 3, V > &v)
Definition: Math.hpp:271

FW::exp2
F32 exp2(int a)
Definition: Math.hpp:97

FW::Mat4d::getPtr
FW_CUDA_FUNC const F64 * getPtr(void) const
Definition: Math.hpp:762

FW::MatrixBase::operator/=
FW_CUDA_FUNC S & operator/=(const T &a)
Definition: Math.hpp:553

FW::Vec4f::Vec4f
FW_CUDA_FUNC Vec4f(const Vec2f &xy, const Vec2f &zw)
Definition: Math.hpp:356

FW::Vec4f::Vec4f
FW_CUDA_FUNC Vec4f(const Vec3f &xyz, F32 ww)
Definition: Math.hpp:355

FW::Vec3d::Vec3d
FW_CUDA_FUNC Vec3d(const Vec2d &xy, F64 zz)
Definition: Math.hpp:410

FW::det
FW_CUDA_FUNC T det(const MatrixBase< T, L, S > &v)
Definition: Math.hpp:782

FW::transpose
FW_CUDA_FUNC S transpose(const MatrixBase< T, L, S > &v)
Definition: Math.hpp:783

FW::Vec3d::Vec3d
FW_CUDA_FUNC Vec3d(F64 xx, F64 yy, F64 zz)
Definition: Math.hpp:409

FW::Vec4d::operator=
FW_CUDA_FUNC Vec4d & operator=(const VectorBase< F64, 4, V > &v)
Definition: Math.hpp:453

FW::MatrixBase::operator%
FW_CUDA_FUNC S operator%(const T &a) const
Definition: Math.hpp:569

FW::VectorBase::print
void print(void) const
Definition: Math.hpp:137

FW::Vec4i::Vec4i
FW_CUDA_FUNC Vec4i(const Vec3i &xyz, S32 ww)
Definition: Math.hpp:284

FW::VectorBase::operator~
FW_CUDA_FUNC S operator~(void) const
Definition: Math.hpp:171

FW::Vec3d::Vec3d
FW_CUDA_FUNC Vec3d(const Vec3i &v)
Definition: Math.hpp:411

FW::Vec3f::Vec3f
FW_CUDA_FUNC Vec3f(void)
Definition: Math.hpp:327

FW::MatrixBase::operator|=
FW_CUDA_FUNC S & operator|=(const T &a)
Definition: Math.hpp:556

FW::Mat4d::m21
F64 m21
Definition: Math.hpp:773

FW::detImpl
FW_CUDA_FUNC T detImpl(const MatrixBase< T, L, S > &v)
Definition: Math.hpp:905

FW::MatrixBase::operator%=
FW_CUDA_FUNC S & operator%=(const T &a)
Definition: Math.hpp:554

FW::Vector::operator=
FW_CUDA_FUNC Vector & operator=(const VectorBase< T, L, V > &v)
Definition: Math.hpp:230

FW::Mat4f::getPtr
FW_CUDA_FUNC F32 * getPtr(void)
Definition: Math.hpp:683

FW::MatrixBase::operator|
FW_CUDA_FUNC S operator|(const T &a) const
Definition: Math.hpp:571

FW::Vec4i::fromPtr
static FW_CUDA_FUNC Vec4i fromPtr(const S32 *ptr)
Definition: Math.hpp:289

FW::Vec2i
Definition: Math.hpp:238

FW::VectorBase::set
FW_CUDA_FUNC void set(const T &a)
Definition: Math.hpp:132

FW::MatrixBase::setCol
FW_CUDA_FUNC void setCol(int c, const VectorBase< T, L, V > &v)
Definition: Math.hpp:576

FW::c_popc8LUT
FW_CUDA_CONST int c_popc8LUT[]
Definition: Math.hpp:799

FW::log
F32 log(F32 a)
Definition: Math.hpp:89

FW::Mat4f::m00
F32 m00
Definition: Math.hpp:696

FW::Mat2f::m11
F32 m11
Definition: Math.hpp:646

size
CUdevice int ordinal char int CUdevice dev CUdevprop CUdevice dev CUcontext ctx CUcontext ctx CUcontext pctx CUmodule const void image CUmodule const void fatCubin CUfunction CUmodule const char name void p CUfunction unsigned int bytes CUtexref pTexRef CUtexref CUarray unsigned int Flags CUtexref int CUaddress_mode am CUtexref unsigned int Flags CUaddress_mode CUtexref int dim CUarray_format int CUtexref hTexRef CUfunction unsigned int numbytes CUfunction int float value CUfunction int CUtexref hTexRef CUfunction int int grid_height CUevent unsigned int Flags CUevent hEvent CUevent hEvent CUstream unsigned int Flags CUstream hStream GLuint bufferobj unsigned int CUdevice dev CUdeviceptr unsigned int CUmodule const char name CUdeviceptr unsigned int bytesize CUdeviceptr dptr void unsigned int bytesize void CUdeviceptr unsigned int ByteCount CUarray unsigned int CUdeviceptr unsigned int ByteCount CUarray unsigned int const void unsigned int ByteCount CUarray unsigned int CUarray unsigned int unsigned int ByteCount void CUarray unsigned int unsigned int CUstream hStream const CUDA_MEMCPY2D pCopy CUdeviceptr const void unsigned int CUstream hStream const CUDA_MEMCPY2D CUstream hStream CUdeviceptr unsigned char unsigned int N CUdeviceptr unsigned int unsigned int N CUdeviceptr unsigned int unsigned short unsigned int unsigned int Height CUarray const CUDA_ARRAY_DESCRIPTOR pAllocateArray CUarray const CUDA_ARRAY3D_DESCRIPTOR pAllocateArray unsigned int CUtexref CUdeviceptr unsigned int bytes CUcontext unsigned int CUdevice device GLenum texture GLenum GLuint buffer GLenum GLuint renderbuffer GLenum GLsizeiptr size
Definition: DLLImports.inl:319

FW::Mat3f::m12
F32 m12
Definition: Math.hpp:671

FW::Mat3f::m00
F32 m00
Definition: Math.hpp:669

FW::MatrixBase::operator&
FW_CUDA_FUNC S operator&(const T &a) const
Definition: Math.hpp:570

FW::Mat4f::m33
F32 m33
Definition: Math.hpp:699

FW::VectorBase::operator|
FW_CUDA_FUNC S operator|(const T &a) const
Definition: Math.hpp:179

FW::Mat4d::m31
F64 m31
Definition: Math.hpp:773

FW::Mat4f::getXYZ
Mat3f getXYZ(void) const
Definition: Math.cpp:56

FW::VectorBase::min
FW_CUDA_FUNC T min(void) const
Definition: Math.hpp:146

FW::Mat3f::getPtr
FW_CUDA_FUNC F32 * getPtr(void)
Definition: Math.hpp:658

FW::MatrixBase::operator-
FW_CUDA_FUNC S operator-(void) const
Definition: Math.hpp:562

FW::operator%
FW_CUDA_FUNC S operator%(const T &a, const VectorBase< T, L, S > &b)
Definition: Math.hpp:470

FW::Vec4d::fromPtr
static FW_CUDA_FUNC Vec4d fromPtr(const F64 *ptr)
Definition: Math.hpp:444

FW::Mat4d::m11
F64 m11
Definition: Math.hpp:773

FW::lerp
FW_CUDA_FUNC A lerp(const A &a, const A &b, const B &t)
Definition: Math.hpp:115

FW::Mat4d::m12
F64 m12
Definition: Math.hpp:774

FW::Vec2i::operator=
FW_CUDA_FUNC Vec2i & operator=(const VectorBase< S32, 2, V > &v)
Definition: Math.hpp:252

FW::Matrix::Matrix
FW_CUDA_FUNC Matrix(T a)
Definition: Math.hpp:616

FW::Mat2d
Definition: Math.hpp:704

FW::Mat3f::m10
F32 m10
Definition: Math.hpp:669

FW::Vec3i::operator=
FW_CUDA_FUNC Vec3i & operator=(const VectorBase< S32, 3, V > &v)
Definition: Math.hpp:272

FW::MatrixBase::operator/
FW_CUDA_FUNC S operator/(const T &a) const
Definition: Math.hpp:568

FW::Vec4i
Definition: Math.hpp:277

FW::VectorBase::operator*
FW_CUDA_FUNC S operator*(const T &a) const
Definition: Math.hpp:175

FW::VectorBase::length
FW_CUDA_FUNC T length(void) const
Definition: Math.hpp:143

FW::Mat3f
Definition: Math.hpp:651

FW::Mat2d::getPtr
FW_CUDA_FUNC F64 * getPtr(void)
Definition: Math.hpp:712

FW::Matrix::fromPtr
static FW_CUDA_FUNC Matrix fromPtr(const T *ptr)
Definition: Math.hpp:620

FW::operator*
FW_CUDA_FUNC S operator*(const T &a, const VectorBase< T, L, S > &b)
Definition: Math.hpp:468

FW::Vec4d::Vec4d
FW_CUDA_FUNC Vec4d(F64 a)
Definition: Math.hpp:434