doxygen/html/fixed_size_square_matrix_ops_impl_8hpp_source.html

 /*
  * Copyright (c) 2021, Lawrence Livermore National Security, LLC and LvArray contributors.
  * All rights reserved.
  * See the LICENSE file for details.
  * SPDX-License-Identifier: (BSD-3-Clause)
  */

 #pragma once

 #include "genericTensorOps.hpp"

 namespace LvArray
 {
 namespace tensorOps
 {
 namespace internal
 {

 /**
  * @brief Shift a packed symmetric matrix so its trace is zero and scale its entries to roughly [-1, 1].
  * @tparam M The size of the (M x M) symmetric matrix.
  * @tparam FloatingPoint The scalar type of the matrix entries.
  * @param matrix The packed symmetric matrix, modified in place.
  * @param shift Set to trace( matrix ) / M, the value subtracted from the diagonal by the first shift.
  * @param maxEntryAfterShift Set to the largest absolute entry found after the first shift. The matrix
  *   is divided by this value unless it is zero.
  */
 template< std::ptrdiff_t M, typename FloatingPoint >
 LVARRAY_HOST_DEVICE inline
 static void shiftAndScale( FloatingPoint (& matrix)[ ( M * ( M + 1 ) ) / 2 ],
                            FloatingPoint & shift,
                            FloatingPoint & maxEntryAfterShift )
 {
   // The mean of the diagonal is the average eigenvalue; removing it centers the spectrum on zero.
   shift = symTrace< M >( matrix ) / FloatingPoint( M );
   symAddIdentity< M >( matrix, -shift );

   // Normalize the entries to the range [-1, 1]. An all-zero matrix is left untouched.
   maxEntryAfterShift = maxAbsoluteEntry< SYM_SIZE< M > >( matrix );
   if( maxEntryAfterShift > 0 )
   {
     scale< SYM_SIZE< M > >( matrix, 1 / maxEntryAfterShift );
   }

   // Round off can leave a small non-zero trace, but the eigenvalue algorithm expects exactly zero,
   // so the mean is removed a second time. This correction is not reported to the caller because it
   // would be lost to round off when the eigenvalues of the original matrix are reconstructed.
   FloatingPoint const residualShift = symTrace< M >( matrix ) / FloatingPoint( M );
   symAddIdentity< M >( matrix, -residualShift );
 }

 /**
  * @brief Primary template of the fixed size square matrix operations.
  * @tparam M The size of the (M x M) matrix.
  * @details The generic case is empty; the operations are supplied by the explicit
  *   specializations that follow (SquareMatrixOps< 2 > and SquareMatrixOps< 3 >).
  */
 template< std::ptrdiff_t M >
 struct SquareMatrixOps
 {};

 template<>
 struct SquareMatrixOps< 2 >
 {
   /**
    * @brief Compute the determinant of a 2x2 matrix.
    * @tparam MATRIX The type of @p matrix.
    * @param matrix The 2x2 matrix.
    * @return matrix[0][0] * matrix[1][1] - matrix[0][1] * matrix[1][0].
    */
   template< typename MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static auto determinant( MATRIX const & matrix )
   {
     checkSizes< 2, 2 >( matrix );

     auto const mainDiagonalProduct = matrix[ 0 ][ 0 ] * matrix[ 1 ][ 1 ];
     auto const offDiagonalProduct = matrix[ 0 ][ 1 ] * matrix[ 1 ][ 0 ];
     return mainDiagonalProduct - offDiagonalProduct;
   }

   /**
    * @brief Write the inverse of the 2x2 matrix @p srcMatrix into @p dstMatrix.
    * @tparam DST_MATRIX The type of @p dstMatrix.
    * @tparam SRC_MATRIX The type of @p srcMatrix.
    * @param dstMatrix The 2x2 matrix that receives the inverse.
    * @param srcMatrix The 2x2 matrix to invert.
    * @return The determinant of @p srcMatrix.
    * @note The determinant is not tested against zero before dividing.
    */
   template< typename DST_MATRIX, typename SRC_MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static auto invert( DST_MATRIX && LVARRAY_RESTRICT_REF dstMatrix,
                       SRC_MATRIX const & LVARRAY_RESTRICT_REF srcMatrix )
   {
     checkSizes< 2, 2 >( dstMatrix );
     checkSizes< 2, 2 >( srcMatrix );

     // The reciprocal of the determinant is held in the scalar type of the destination.
     using DstScalar = std::decay_t< decltype( dstMatrix[ 0 ][ 0 ] ) >;

     auto const det = determinant( srcMatrix );
     DstScalar const oneOverDet = DstScalar( 1 ) / det;

     // Adjugate of a 2x2 matrix: swap the diagonal entries ...
     dstMatrix[ 0 ][ 0 ] = srcMatrix[ 1 ][ 1 ] * oneOverDet;
     dstMatrix[ 1 ][ 1 ] = srcMatrix[ 0 ][ 0 ] * oneOverDet;

     // ... and negate the off-diagonal entries.
     dstMatrix[ 0 ][ 1 ] = srcMatrix[ 0 ][ 1 ] * -oneOverDet;
     dstMatrix[ 1 ][ 0 ] = srcMatrix[ 1 ][ 0 ] * -oneOverDet;

     return det;
   }

   /**
    * @brief Invert a 2x2 matrix in place.
    * @tparam MATRIX The type of @p matrix.
    * @param matrix The 2x2 matrix, overwritten with its inverse.
    * @return The determinant of the matrix as it was on entry.
    * @note The determinant is not tested against zero before dividing.
    */
   template< typename MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static auto invert( MATRIX && matrix )
   {
     checkSizes< 2, 2 >( matrix );

     auto const det = determinant( matrix );
     auto const oneOverDet = 1 / det;

     // Entry (0, 0) is overwritten first, so keep its original value for entry (1, 1).
     auto const originalTopLeft = matrix[ 0 ][ 0 ];
     matrix[ 0 ][ 0 ] = matrix[ 1 ][ 1 ] * oneOverDet;
     matrix[ 1 ][ 1 ] = originalTopLeft * oneOverDet;

     // The off-diagonal entries stay in place and only change sign and scale.
     matrix[ 0 ][ 1 ] *= -oneOverDet;
     matrix[ 1 ][ 0 ] *= -oneOverDet;

     return det;
   }

   /**
    * @brief Compute the determinant of a packed 2x2 symmetric matrix.
    * @tparam SYM_MATRIX The type of @p symMatrix.
    * @param symMatrix The packed symmetric matrix, of length 3. Entries 0 and 1 hold the diagonal
    *   and entry 2 holds the off-diagonal value.
    * @return symMatrix[0] * symMatrix[1] - symMatrix[2] * symMatrix[2].
    */
   template< typename SYM_MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static auto symDeterminant( SYM_MATRIX const & symMatrix )
   {
     checkSizes< 3 >( symMatrix );

     auto const diagonalProduct = symMatrix[ 0 ] * symMatrix[ 1 ];
     auto const offDiagonalSquared = symMatrix[ 2 ] * symMatrix[ 2 ];
     return diagonalProduct - offDiagonalSquared;
   }

   /**
    * @brief Write the inverse of the packed 2x2 symmetric matrix @p srcSymMatrix into @p dstSymMatrix.
    * @tparam DST_SYM_MATRIX The type of @p dstSymMatrix.
    * @tparam SRC_SYM_MATRIX The type of @p srcSymMatrix.
    * @param dstSymMatrix The packed symmetric matrix (length 3) that receives the inverse.
    * @param srcSymMatrix The packed symmetric matrix (length 3) to invert.
    * @return The determinant of @p srcSymMatrix.
    * @note The determinant is not tested against zero before dividing.
    */
   template< typename DST_SYM_MATRIX, typename SRC_SYM_MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static auto symInvert( DST_SYM_MATRIX && LVARRAY_RESTRICT_REF dstSymMatrix,
                          SRC_SYM_MATRIX const & LVARRAY_RESTRICT_REF srcSymMatrix )
   {
     checkSizes< 3 >( dstSymMatrix );
     checkSizes< 3 >( srcSymMatrix );

     // The reciprocal of the determinant is held in the scalar type of the destination.
     using DstScalar = std::decay_t< decltype( dstSymMatrix[ 0 ] ) >;

     auto const det = symDeterminant( srcSymMatrix );
     DstScalar const oneOverDet = DstScalar( 1 ) / det;

     // Swap the two diagonal entries and negate the off-diagonal entry.
     dstSymMatrix[ 0 ] = srcSymMatrix[ 1 ] * oneOverDet;
     dstSymMatrix[ 1 ] = srcSymMatrix[ 0 ] * oneOverDet;
     dstSymMatrix[ 2 ] = srcSymMatrix[ 2 ] * -oneOverDet;

     return det;
   }

   /**
    * @brief Invert a packed 2x2 symmetric matrix in place.
    * @tparam SYM_MATRIX The type of @p symMatrix.
    * @param symMatrix The packed symmetric matrix (length 3), overwritten with its inverse.
    * @return The determinant of the matrix as it was on entry.
    * @note The determinant is not tested against zero before dividing.
    */
   template< typename SYM_MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static auto symInvert( SYM_MATRIX && symMatrix )
   {
     checkSizes< 3 >( symMatrix );

     auto const det = symDeterminant( symMatrix );
     auto const oneOverDet = 1 / det;

     // Entry 0 is overwritten first, so keep its original value for entry 1.
     auto const originalFirstDiagonal = symMatrix[ 0 ];
     symMatrix[ 0 ] = symMatrix[ 1 ] * oneOverDet;
     symMatrix[ 1 ] = originalFirstDiagonal * oneOverDet;

     // The off-diagonal entry stays in place and only changes sign and scale.
     symMatrix[ 2 ] *= -oneOverDet;

     return det;
   }

   /**
    * @brief Multiply a packed 2x2 symmetric matrix with a vector: dstVector[i] = A[i][j] * vectorB[j].
    * @tparam DST_VECTOR The type of @p dstVector.
    * @tparam SYM_MATRIX_A The type of @p symMatrixA.
    * @tparam VECTOR_B The type of @p vectorB.
    * @param dstVector The vector of length 2 that receives the product.
    * @param symMatrixA The packed symmetric matrix (length 3); entries 0 and 1 are the diagonal,
    *   entry 2 is the off-diagonal value.
    * @param vectorB The vector of length 2 being multiplied.
    */
   template< typename DST_VECTOR, typename SYM_MATRIX_A, typename VECTOR_B >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void Ri_eq_symAijBj( DST_VECTOR && LVARRAY_RESTRICT_REF dstVector,
                               SYM_MATRIX_A const & LVARRAY_RESTRICT_REF symMatrixA,
                               VECTOR_B const & LVARRAY_RESTRICT_REF vectorB )
   {
     checkSizes< 2 >( dstVector );
     checkSizes< 3 >( symMatrixA );
     checkSizes< 2 >( vectorB );

     // Unpack the symmetric storage into dense entry names.
     auto const a00 = symMatrixA[ 0 ];
     auto const a11 = symMatrixA[ 1 ];
     auto const a01 = symMatrixA[ 2 ];

     dstVector[ 0 ] = a00 * vectorB[ 0 ] + a01 * vectorB[ 1 ];
     dstVector[ 1 ] = a01 * vectorB[ 0 ] + a11 * vectorB[ 1 ];
   }

   /**
    * @brief Add the product of a packed 2x2 symmetric matrix and a vector to @p dstVector:
    *   dstVector[i] = dstVector[i] + A[i][j] * vectorB[j].
    * @tparam DST_VECTOR The type of @p dstVector.
    * @tparam SYM_MATRIX_A The type of @p symMatrixA.
    * @tparam VECTOR_B The type of @p vectorB.
    * @param dstVector The vector of length 2 that is added to.
    * @param symMatrixA The packed symmetric matrix (length 3); entries 0 and 1 are the diagonal,
    *   entry 2 is the off-diagonal value.
    * @param vectorB The vector of length 2 being multiplied.
    */
   template< typename DST_VECTOR, typename SYM_MATRIX_A, typename VECTOR_B >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void Ri_add_symAijBj( DST_VECTOR && LVARRAY_RESTRICT_REF dstVector,
                                SYM_MATRIX_A const & LVARRAY_RESTRICT_REF symMatrixA,
                                VECTOR_B const & LVARRAY_RESTRICT_REF vectorB )
   {
     checkSizes< 2 >( dstVector );
     checkSizes< 3 >( symMatrixA );
     checkSizes< 2 >( vectorB );

     // Unpack the symmetric storage into dense entry names.
     auto const a00 = symMatrixA[ 0 ];
     auto const a11 = symMatrixA[ 1 ];
     auto const a01 = symMatrixA[ 2 ];

     // The existing value is the left-most operand so the summation order is
     // ( ( dst + first term ) + second term ).
     dstVector[ 0 ] = dstVector[ 0 ] + a00 * vectorB[ 0 ] + a01 * vectorB[ 1 ];
     dstVector[ 1 ] = dstVector[ 1 ] + a01 * vectorB[ 0 ] + a11 * vectorB[ 1 ];
   }

   /**
    * @brief Multiply a packed 2x2 symmetric matrix with the transpose of a 2x2 matrix:
    *   dstMatrix[i][j] = A[i][k] * matrixB[j][k].
    * @tparam DST_MATRIX The type of @p dstMatrix.
    * @tparam SYM_MATRIX_A The type of @p symMatrixA.
    * @tparam MATRIX_B The type of @p matrixB.
    * @param dstMatrix The 2x2 matrix that receives the product.
    * @param symMatrixA The packed symmetric matrix (length 3); entries 0 and 1 are the diagonal,
    *   entry 2 is the off-diagonal value.
    * @param matrixB The 2x2 matrix whose rows are contracted against the rows of A.
    */
   template< typename DST_MATRIX, typename SYM_MATRIX_A, typename MATRIX_B >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void Rij_eq_symAikBjk( DST_MATRIX && LVARRAY_RESTRICT_REF dstMatrix,
                                 SYM_MATRIX_A const & LVARRAY_RESTRICT_REF symMatrixA,
                                 MATRIX_B const & LVARRAY_RESTRICT_REF matrixB )
   {
     checkSizes< 2, 2 >( dstMatrix );
     checkSizes< 3 >( symMatrixA );
     checkSizes< 2, 2 >( matrixB );

     // Unpack the symmetric storage into dense entry names.
     auto const a00 = symMatrixA[ 0 ];
     auto const a11 = symMatrixA[ 1 ];
     auto const a01 = symMatrixA[ 2 ];

     // Column j of the result is A applied to row j of matrixB.
     for( int j = 0; j < 2; ++j )
     {
       dstMatrix[ 0 ][ j ] = a00 * matrixB[ j ][ 0 ] + a01 * matrixB[ j ][ 1 ];
       dstMatrix[ 1 ][ j ] = a01 * matrixB[ j ][ 0 ] + a11 * matrixB[ j ][ 1 ];
     }
   }

   /**
    * @brief Compute the packed symmetric product dst[i][j] = matrixA[i][k] * B[k][l] * matrixA[j][l]
    *   for 2x2 matrices.
    * @tparam DST_SYM_MATRIX The type of @p dstSymMatrix.
    * @tparam MATRIX_A The type of @p matrixA.
    * @tparam SYM_MATRIX_B The type of @p symMatrixB.
    * @param dstSymMatrix The packed symmetric matrix (length 3) that receives the result.
    * @param matrixA The 2x2 matrix applied on both sides.
    * @param symMatrixB The packed symmetric matrix (length 3); entries 0 and 1 are the diagonal,
    *   entry 2 is the off-diagonal value.
    */
   template< typename DST_SYM_MATRIX, typename MATRIX_A, typename SYM_MATRIX_B >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void Rij_eq_AikSymBklAjl( DST_SYM_MATRIX && LVARRAY_RESTRICT_REF dstSymMatrix,
                                    MATRIX_A const & LVARRAY_RESTRICT_REF matrixA,
                                    SYM_MATRIX_B const & LVARRAY_RESTRICT_REF symMatrixB )
   {
     checkSizes< 3 >( dstSymMatrix );
     checkSizes< 2, 2 >( matrixA );
     checkSizes< 3 >( symMatrixB );

     // Dense entry names for the two inputs.
     auto const a00 = matrixA[ 0 ][ 0 ];
     auto const a01 = matrixA[ 0 ][ 1 ];
     auto const a10 = matrixA[ 1 ][ 0 ];
     auto const a11 = matrixA[ 1 ][ 1 ];

     auto const b00 = symMatrixB[ 0 ];
     auto const b11 = symMatrixB[ 1 ];
     auto const b01 = symMatrixB[ 2 ];

     // Entry (0, 0): row 0 of A on both sides.
     dstSymMatrix[ 0 ] = a00 * b00 * a00 +
                         a00 * b01 * a01 +
                         a01 * b01 * a00 +
                         a01 * b11 * a01;

     // Entry (1, 1): row 1 of A on both sides.
     dstSymMatrix[ 1 ] = a10 * b00 * a10 +
                         a10 * b01 * a11 +
                         a11 * b01 * a10 +
                         a11 * b11 * a11;

     // Entry (1, 0), which equals entry (0, 1): row 1 of A on the left, row 0 on the right.
     dstSymMatrix[ 2 ] = a10 * b00 * a00 +
                         a10 * b01 * a01 +
                         a11 * b01 * a00 +
                         a11 * b11 * a01;
   }


   /**
    * @brief Store the outer product of a length 2 vector with itself as a packed symmetric matrix.
    * @tparam DST_MATRIX The type of @p dstMatrix.
    * @tparam VECTOR_A The type of @p vectorA.
    * @param dstMatrix The packed symmetric matrix (length 3) that receives vectorA[i] * vectorA[j].
    * @param vectorA The vector of length 2.
    */
   template< typename DST_MATRIX, typename VECTOR_A >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void symRij_eq_AiAj( DST_MATRIX && LVARRAY_RESTRICT_REF dstMatrix,
                               VECTOR_A const & LVARRAY_RESTRICT_REF vectorA )
   {
     internal::checkSizes< 3 >( dstMatrix );
     internal::checkSizes< 2 >( vectorA );

     auto const a0 = vectorA[ 0 ];
     auto const a1 = vectorA[ 1 ];

     // Diagonal entries first, then the single off-diagonal entry.
     dstMatrix[ 0 ] = a0 * a0;
     dstMatrix[ 1 ] = a1 * a1;
     dstMatrix[ 2 ] = a0 * a1;
   }

   /**
    * @brief Store the symmetric sum vectorA[i] * vectorB[j] + vectorA[j] * vectorB[i] for length 2
    *   vectors as a packed symmetric matrix.
    * @tparam DST_SYM_MATRIX The type of @p dstMatrix.
    * @tparam VECTOR_A The type of @p vectorA.
    * @tparam VECTOR_B The type of @p vectorB.
    * @param dstMatrix The packed symmetric matrix (length 3) that receives the result.
    * @param vectorA The first vector of length 2.
    * @param vectorB The second vector of length 2.
    */
   template< typename DST_SYM_MATRIX, typename VECTOR_A, typename VECTOR_B >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void symRij_eq_AiBj_plus_AjBi( DST_SYM_MATRIX && LVARRAY_RESTRICT_REF dstMatrix,
                                         VECTOR_A const & LVARRAY_RESTRICT_REF vectorA,
                                         VECTOR_B const & LVARRAY_RESTRICT_REF vectorB )
   {
     internal::checkSizes< 3 >( dstMatrix );
     internal::checkSizes< 2 >( vectorA );
     internal::checkSizes< 2 >( vectorB );

     auto const a0 = vectorA[ 0 ];
     auto const a1 = vectorA[ 1 ];
     auto const b0 = vectorB[ 0 ];
     auto const b1 = vectorB[ 1 ];

     // On the diagonal both terms of the sum coincide, hence the factor of two.
     dstMatrix[ 0 ] = 2 * a0 * b0;
     dstMatrix[ 1 ] = 2 * a1 * b1;

     // Off the diagonal the two terms are distinct.
     dstMatrix[ 2 ] = a0 * b1 + a1 * b0;
   }

   /**
    * @brief Compute the eigenvalues of a packed 2x2 symmetric matrix.
    * @tparam DST_VECTOR The type of @p eigenvalues.
    * @tparam SYM_MATRIX The type of @p symMatrix.
    * @param eigenvalues The vector of length 2 that receives the eigenvalues. The arithmetic is done
    *   in the scalar type of this vector.
    * @param symMatrix The packed symmetric matrix (length 3); it is not modified.
    */
   template< typename DST_VECTOR, typename SYM_MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void symEigenvalues( DST_VECTOR && LVARRAY_RESTRICT_REF eigenvalues,
                               SYM_MATRIX const & LVARRAY_RESTRICT_REF symMatrix )
   {
     checkSizes< 2 >( eigenvalues );
     checkSizes< 3 >( symMatrix );

     using Scalar = std::decay_t< decltype( eigenvalues[ 0 ] ) >;

     // Work on a local copy converted to the scalar type of the output.
     Scalar workMatrix[ 3 ];
     copy< 3 >( workMatrix, symMatrix );

     // Remove the mean eigenvalue and normalize the entries.
     Scalar shift, maxEntryAfterShift;
     shiftAndScale< 2 >( workMatrix, shift, maxEntryAfterShift );

     // Eigenvalues of the shifted and scaled matrix.
     eigenvaluesOfShiftedMatrix( eigenvalues, workMatrix );

     // Undo the scaling and then the shift to recover the eigenvalues of the input.
     for( int i = 0; i < 2; ++i )
     {
       eigenvalues[ i ] = eigenvalues[ i ] * maxEntryAfterShift + shift;
     }
   }

   /**
    * @brief Compute the eigenvalues and eigenvectors of a packed 2x2 symmetric matrix.
    * @tparam DST_VECTOR The type of @p eigenvalues.
    * @tparam DST_MATRIX The type of @p eigenvectors.
    * @tparam SYM_MATRIX The type of @p symMatrix.
    * @param eigenvalues The vector of length 2 that receives the eigenvalues. The arithmetic is done
    *   in the scalar type of this vector.
    * @param eigenvectors The 2x2 matrix that receives the eigenvectors. Column 1 holds the vector
    *   computed for eigenvalues[ 1 ] and column 0 the vector orthogonal to it. When the two
    *   eigenvalues are considered equal the identity is written instead.
    * @param symMatrix The packed symmetric matrix (length 3); it is not modified.
    */
   template< typename DST_VECTOR, typename DST_MATRIX, typename SYM_MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void symEigenvectors( DST_VECTOR && LVARRAY_RESTRICT_REF eigenvalues,
                                DST_MATRIX && LVARRAY_RESTRICT_REF eigenvectors,
                                SYM_MATRIX const & LVARRAY_RESTRICT_REF symMatrix )
   {
     checkSizes< 2 >( eigenvalues );
     checkSizes< 2, 2 >( eigenvectors );
     checkSizes< 3 >( symMatrix );

     using FloatingPoint = std::decay_t< decltype( eigenvalues[ 0 ] ) >;

     // Shift and scale a local copy of the matrix.
     FloatingPoint shift, maxEntryAfterShift;
     FloatingPoint fpCopy[ 3 ];
     copy< 3 >( fpCopy, symMatrix );
     shiftAndScale< 2 >( fpCopy, shift, maxEntryAfterShift );

     // Compute the eigenvalues of the shifted matrix.
     eigenvaluesOfShiftedMatrix( eigenvalues, fpCopy );

     // If the eigenvalues are equal. The comparison is made on the eigenvalues of the scaled
     // matrix, before they are rescaled at the end of this function.
     if( ( eigenvalues[ 1 ] - eigenvalues[ 0 ] ) <= NumericLimits< FloatingPoint >::epsilon )
     {
       LVARRAY_TENSOROPS_ASSIGN_2x2( eigenvectors,
                                     1, 0,
                                     0, 1 );
     }
     else
     {
       // Compute the eigenvector corresponding to the largest eigenvalue.
       // Done by constructing a rank 1 matrix and extracting the kernel.
       symAddIdentity< 2 >( fpCopy, -eigenvalues[ 1 ] );
       FloatingPoint const a2 = fpCopy[ 0 ] * fpCopy[ 0 ];
       FloatingPoint const c2 = fpCopy[ 1 ] * fpCopy[ 1 ];
       FloatingPoint const b2 = fpCopy[ 2 ] * fpCopy[ 2 ];

       // Pick the row with the greatest magnitude. Both rows share the off-diagonal entry, so
       // comparing the squared diagonal entries is enough.
       if( a2 > c2 )
       {
         // Row 0 is ( fpCopy[ 0 ], fpCopy[ 2 ] ); the vector below is perpendicular to it.
         FloatingPoint const inv = math::invSqrt( a2 + b2 );
         eigenvectors[ 0 ][ 1 ] = -fpCopy[ 2 ] * inv;
         eigenvectors[ 1 ][ 1 ] = fpCopy[ 0 ] * inv;
       }
       else
       {
         // Row 1 is ( fpCopy[ 2 ], fpCopy[ 1 ] ); the vector below is perpendicular to it.
         FloatingPoint const inv = math::invSqrt( c2 + b2 );
         eigenvectors[ 0 ][ 1 ] = -fpCopy[ 1 ] * inv;
         eigenvectors[ 1 ][ 1 ] = fpCopy[ 2 ] * inv;
       }

       // The other eigenvector is orthonormal to the one just computed.
       eigenvectors[ 0 ][ 0 ] = -eigenvectors[ 1 ][ 1 ];
       eigenvectors[ 1 ][ 0 ] = eigenvectors[ 0 ][ 1 ];
     }

     // Rescale the eigenvalues.
     eigenvalues[ 0 ] = eigenvalues[ 0 ] * maxEntryAfterShift + shift;
     eigenvalues[ 1 ] = eigenvalues[ 1 ] * maxEntryAfterShift + shift;
   }

   /**
    * @brief Pack a dense 2x2 matrix into symmetric storage.
    * @tparam DST_SYM_MATRIX The type of @p dstSymMatrix.
    * @tparam SRC_MATRIX The type of @p srcMatrix.
    * @param dstSymMatrix The packed symmetric matrix (length 3) that is written.
    * @param srcMatrix The dense 2x2 matrix. Only the diagonal and entry (0, 1) are read;
    *   entry (1, 0) is ignored.
    */
   template< typename DST_SYM_MATRIX, typename SRC_MATRIX >
   LVARRAY_HOST_DEVICE inline CONSTEXPR_WITHOUT_BOUNDS_CHECK
   static void denseToSymmetric( DST_SYM_MATRIX && dstSymMatrix, SRC_MATRIX const & srcMatrix )
   {
     tensorOps::internal::checkSizes< 3 >( dstSymMatrix );
     tensorOps::internal::checkSizes< 2, 2 >( srcMatrix );

     // The diagonal goes into the first two slots.
     for( int i = 0; i < 2; ++i )
     {
       dstSymMatrix[ i ] = srcMatrix[ i ][ i ];
     }

     // The off-diagonal slot is taken from the upper triangle.
     dstSymMatrix[ 2 ] = srcMatrix[ 0 ][ 1 ];
   }

   /**
    * @brief Expand a packed 2x2 symmetric matrix into dense storage.
    * @tparam DST_MATRIX The type of @p dstMatrix.
    * @tparam SRC_SYM_MATRIX The type of @p srcSymMatrix.
    * @param dstMatrix The dense 2x2 matrix that is written.
    * @param srcSymMatrix The packed symmetric matrix (length 3); entries 0 and 1 are the diagonal,
    *   entry 2 is the off-diagonal value.
    */
   template< typename DST_MATRIX, typename SRC_SYM_MATRIX >
   LVARRAY_HOST_DEVICE inline CONSTEXPR_WITHOUT_BOUNDS_CHECK
   static void symmetricToDense( DST_MATRIX && dstMatrix, SRC_SYM_MATRIX const & srcSymMatrix )
   {
     tensorOps::internal::checkSizes< 2, 2 >( dstMatrix );
     tensorOps::internal::checkSizes< 3 >( srcSymMatrix );

     // The first two slots hold the diagonal.
     for( int i = 0; i < 2; ++i )
     {
       dstMatrix[ i ][ i ] = srcSymMatrix[ i ];
     }

     // The single off-diagonal slot is mirrored across the diagonal.
     dstMatrix[ 0 ][ 1 ] = srcSymMatrix[ 2 ];
     dstMatrix[ 1 ][ 0 ] = srcSymMatrix[ 2 ];
   }

 private:

   /**
    * @brief Compute the eigenvalues of a packed 2x2 symmetric matrix whose trace is zero.
    * @tparam FloatingPoint The scalar type of @p matrix.
    * @tparam VECTOR The type of @p eigenvalues.
    * @param eigenvalues The vector that receives the eigenvalues; entry 0 is the negative of entry 1.
    * @param matrix The packed symmetric matrix, expected to have already been shifted to zero trace.
    */
   template< typename FloatingPoint, typename VECTOR >
   LVARRAY_HOST_DEVICE inline
   static void eigenvaluesOfShiftedMatrix( VECTOR && eigenvalues, FloatingPoint const ( &matrix )[ 3 ] )
   {
     /*
        Write the 2x2 symmetric matrix as
           a0, a2
           a2, a1
        An eigenvalue x satisfies the characteristic equation
           x^2 - (a0 + a1) * x + a0 * a1 - a2^2 = 0
        and because the shifted matrix has zero trace the linear term drops out, leaving
           x^2 = a2^2 - a0 * a1
      */
     FloatingPoint const a0 = matrix[ 0 ];
     FloatingPoint const a1 = matrix[ 1 ];
     FloatingPoint const a2 = matrix[ 2 ];

     // The two roots are symmetric about zero; the positive one is stored last.
     eigenvalues[ 1 ] = math::sqrt( a2 * a2 - a0 * a1 );
     eigenvalues[ 0 ] = -eigenvalues[ 1 ];
   }
 };

 template<>
 struct SquareMatrixOps< 3 >
 {
   /**
    * @brief Compute the determinant of a 3x3 matrix.
    * @tparam MATRIX The type of @p matrix.
    * @param matrix The 3x3 matrix.
    * @return The determinant, expanded along the first column.
    */
   template< typename MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static auto determinant( MATRIX const & matrix )
   {
     checkSizes< 3, 3 >( matrix );

     // Signed cofactors of the three entries in the first column.
     auto const cofactor00 = matrix[ 1 ][ 1 ] * matrix[ 2 ][ 2 ] - matrix[ 1 ][ 2 ] * matrix[ 2 ][ 1 ];
     auto const cofactor10 = matrix[ 0 ][ 2 ] * matrix[ 2 ][ 1 ] - matrix[ 0 ][ 1 ] * matrix[ 2 ][ 2 ];
     auto const cofactor20 = matrix[ 0 ][ 1 ] * matrix[ 1 ][ 2 ] - matrix[ 0 ][ 2 ] * matrix[ 1 ][ 1 ];

     return matrix[ 0 ][ 0 ] * cofactor00 +
            matrix[ 1 ][ 0 ] * cofactor10 +
            matrix[ 2 ][ 0 ] * cofactor20;
   }

   /**
    * @brief Write the inverse of the 3x3 matrix @p srcMatrix into @p dstMatrix.
    * @tparam DST_MATRIX The type of @p dstMatrix.
    * @tparam SRC_MATRIX The type of @p srcMatrix.
    * @param dstMatrix The 3x3 matrix that receives the inverse.
    * @param srcMatrix The 3x3 matrix to invert.
    * @return The determinant of @p srcMatrix, accumulated from the cofactors stored in @p dstMatrix.
    * @note The determinant is not tested against zero before dividing.
    */
   template< typename DST_MATRIX, typename SRC_MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static auto invert( DST_MATRIX && LVARRAY_RESTRICT_REF dstMatrix,
                       SRC_MATRIX const & LVARRAY_RESTRICT_REF srcMatrix )
   {
     checkSizes< 3, 3 >( dstMatrix );
     checkSizes< 3, 3 >( srcMatrix );

     // The reciprocal of the determinant is held in the scalar type of the destination.
     using DstScalar = std::decay_t< decltype( dstMatrix[ 0 ][ 0 ] ) >;

     // First row of the adjugate, stored unscaled for now because the determinant needs it.
     dstMatrix[ 0 ][ 0 ] = srcMatrix[ 1 ][ 1 ] * srcMatrix[ 2 ][ 2 ] - srcMatrix[ 1 ][ 2 ] * srcMatrix[ 2 ][ 1 ];
     dstMatrix[ 0 ][ 1 ] = srcMatrix[ 0 ][ 2 ] * srcMatrix[ 2 ][ 1 ] - srcMatrix[ 0 ][ 1 ] * srcMatrix[ 2 ][ 2 ];
     dstMatrix[ 0 ][ 2 ] = srcMatrix[ 0 ][ 1 ] * srcMatrix[ 1 ][ 2 ] - srcMatrix[ 0 ][ 2 ] * srcMatrix[ 1 ][ 1 ];

     // Expand the determinant along the first column of the source using those cofactors.
     auto const det = srcMatrix[ 0 ][ 0 ] * dstMatrix[ 0 ][ 0 ] +
                      srcMatrix[ 1 ][ 0 ] * dstMatrix[ 0 ][ 1 ] +
                      srcMatrix[ 2 ][ 0 ] * dstMatrix[ 0 ][ 2 ];
     DstScalar const oneOverDet = DstScalar( 1 ) / det;

     // Scale the first row now that the determinant is known.
     for( int j = 0; j < 3; ++j )
     {
       dstMatrix[ 0 ][ j ] *= oneOverDet;
     }

     // Second row of the adjugate, scaled as it is written.
     dstMatrix[ 1 ][ 0 ] = ( srcMatrix[ 1 ][ 2 ] * srcMatrix[ 2 ][ 0 ] - srcMatrix[ 1 ][ 0 ] * srcMatrix[ 2 ][ 2 ] ) * oneOverDet;
     dstMatrix[ 1 ][ 1 ] = ( srcMatrix[ 0 ][ 0 ] * srcMatrix[ 2 ][ 2 ] - srcMatrix[ 0 ][ 2 ] * srcMatrix[ 2 ][ 0 ] ) * oneOverDet;
     dstMatrix[ 1 ][ 2 ] = ( srcMatrix[ 0 ][ 2 ] * srcMatrix[ 1 ][ 0 ] - srcMatrix[ 0 ][ 0 ] * srcMatrix[ 1 ][ 2 ] ) * oneOverDet;

     // Third row of the adjugate, scaled as it is written.
     dstMatrix[ 2 ][ 0 ] = ( srcMatrix[ 1 ][ 0 ] * srcMatrix[ 2 ][ 1 ] - srcMatrix[ 1 ][ 1 ] * srcMatrix[ 2 ][ 0 ] ) * oneOverDet;
     dstMatrix[ 2 ][ 1 ] = ( srcMatrix[ 0 ][ 1 ] * srcMatrix[ 2 ][ 0 ] - srcMatrix[ 0 ][ 0 ] * srcMatrix[ 2 ][ 1 ] ) * oneOverDet;
     dstMatrix[ 2 ][ 2 ] = ( srcMatrix[ 0 ][ 0 ] * srcMatrix[ 1 ][ 1 ] - srcMatrix[ 0 ][ 1 ] * srcMatrix[ 1 ][ 0 ] ) * oneOverDet;

     return det;
   }

   /**
    * @brief Invert a 3x3 matrix in place.
    * @tparam MATRIX The type of @p matrix.
    * @param matrix The 3x3 matrix, overwritten with its inverse.
    * @return The determinant of the matrix as it was on entry.
    * @note The determinant is not tested against zero before dividing.
    * @note NOTE(review): unlike the other methods of this struct, this overload does not call
    *   checkSizes< 3, 3 >( matrix ) -- confirm whether that is intentional.
    */
   template< typename MATRIX >
   LVARRAY_HOST_DEVICE constexpr inline
   static auto invert( MATRIX && matrix )
   {
     using realType = std::remove_reference_t< decltype( matrix[ 0 ][ 0 ] ) >;

     // The adjugate is built in a local array so that every cofactor is computed from the original
     // entries before any of them is overwritten. This form is used instead of copying the matrix
     // and calling the two argument overload because cuda kernels use a couple fewer registers in
     // some cases with this implementation.
     realType const temp[3][3] =
     { { matrix[1][1]*matrix[2][2] - matrix[1][2]*matrix[2][1], matrix[0][2]*matrix[2][1] - matrix[0][1]*matrix[2][2], matrix[0][1]*matrix[1][2] - matrix[0][2]*matrix[1][1] },
       { matrix[1][2]*matrix[2][0] - matrix[1][0]*matrix[2][2], matrix[0][0]*matrix[2][2] - matrix[0][2]*matrix[2][0], matrix[0][2]*matrix[1][0] - matrix[0][0]*matrix[1][2] },
       { matrix[1][0]*matrix[2][1] - matrix[1][1]*matrix[2][0], matrix[0][1]*matrix[2][0] - matrix[0][0]*matrix[2][1], matrix[0][0]*matrix[1][1] - matrix[0][1]*matrix[1][0] } };

     // Expand the determinant along the first column using the first row of the adjugate.
     realType const det =  matrix[0][0] * temp[0][0] + matrix[1][0] * temp[0][1] + matrix[2][0] * temp[0][2];

     // The literal one is written in realType so that a single precision matrix is not promoted to
     // a double precision division, matching the two argument overload.
     realType const invDet = realType( 1 ) / det;

     for( int i=0; i<3; ++i )
     {
       for( int j=0; j<3; ++j )
       {
         matrix[i][j] = temp[i][j] * invDet;
       }
     }
     return det;
   }

   /**
    * @brief Compute the determinant of a packed 3x3 symmetric matrix.
    * @tparam SYM_MATRIX The type of @p symMatrix.
    * @param symMatrix The packed symmetric matrix (length 6), holding the dense entries
    *   (0,0), (1,1), (2,2), (1,2), (0,2), (0,1) in that order.
    * @return The determinant of the matrix.
    */
   template< typename SYM_MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static auto symDeterminant( SYM_MATRIX const & symMatrix )
   {
     checkSizes< 6 >( symMatrix );

     // Unpack the symmetric storage into dense entry names.
     auto const s00 = symMatrix[ 0 ];
     auto const s11 = symMatrix[ 1 ];
     auto const s22 = symMatrix[ 2 ];
     auto const s12 = symMatrix[ 3 ];
     auto const s02 = symMatrix[ 4 ];
     auto const s01 = symMatrix[ 5 ];

     return s00 * s11 * s22 +
            s01 * s02 * s12 * 2 -
            s00 * s12 * s12 -
            s11 * s02 * s02 -
            s22 * s01 * s01;
   }

   /**
    * @brief Write the inverse of the packed 3x3 symmetric matrix @p srcSymMatrix into @p dstSymMatrix.
    * @tparam DST_SYM_MATRIX The type of @p dstSymMatrix.
    * @tparam SRC_SYM_MATRIX The type of @p srcSymMatrix.
    * @param dstSymMatrix The packed symmetric matrix (length 6) that receives the inverse.
    * @param srcSymMatrix The packed symmetric matrix (length 6) to invert, holding the dense entries
    *   (0,0), (1,1), (2,2), (1,2), (0,2), (0,1) in that order.
    * @return The determinant of @p srcSymMatrix, accumulated from the cofactors stored in
    *   @p dstSymMatrix.
    * @note The determinant is not tested against zero before dividing.
    */
   template< typename DST_SYM_MATRIX, typename SRC_SYM_MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static auto symInvert( DST_SYM_MATRIX && LVARRAY_RESTRICT_REF dstSymMatrix,
                          SRC_SYM_MATRIX const & LVARRAY_RESTRICT_REF srcSymMatrix )
   {
     checkSizes< 6 >( dstSymMatrix );
     checkSizes< 6 >( srcSymMatrix );

     // The reciprocal of the determinant is held in the scalar type of the destination.
     using DstScalar = std::decay_t< decltype( dstSymMatrix[ 0 ] ) >;

     // Unpack the symmetric storage into dense entry names.
     auto const s00 = srcSymMatrix[ 0 ];
     auto const s11 = srcSymMatrix[ 1 ];
     auto const s22 = srcSymMatrix[ 2 ];
     auto const s12 = srcSymMatrix[ 3 ];
     auto const s02 = srcSymMatrix[ 4 ];
     auto const s01 = srcSymMatrix[ 5 ];

     // Cofactors of the first row, stored unscaled for now because the determinant needs them.
     dstSymMatrix[ 0 ] = s11 * s22 - s12 * s12;
     dstSymMatrix[ 5 ] = s02 * s12 - s01 * s22;
     dstSymMatrix[ 4 ] = s01 * s12 - s02 * s11;

     // Expand the determinant along the first row using those cofactors.
     auto const det = s00 * dstSymMatrix[ 0 ] +
                      s01 * dstSymMatrix[ 5 ] +
                      s02 * dstSymMatrix[ 4 ];
     DstScalar const oneOverDet = DstScalar( 1 ) / det;

     // Scale the first row now that the determinant is known.
     dstSymMatrix[ 0 ] *= oneOverDet;
     dstSymMatrix[ 5 ] *= oneOverDet;
     dstSymMatrix[ 4 ] *= oneOverDet;

     // The remaining three independent entries are scaled as they are written.
     dstSymMatrix[ 1 ] = ( s00 * s22 - s02 * s02 ) * oneOverDet;
     dstSymMatrix[ 3 ] = ( s01 * s02 - s00 * s12 ) * oneOverDet;
     dstSymMatrix[ 2 ] = ( s00 * s11 - s01 * s01 ) * oneOverDet;

     return det;
   }

   /**
    * @brief Invert a packed 3x3 symmetric matrix in place.
    * @tparam SYM_MATRIX The type of @p symMatrix.
    * @param symMatrix The packed symmetric matrix (length 6), overwritten with its inverse.
    * @return The determinant of the matrix as it was on entry.
    */
   template< typename SYM_MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static auto symInvert( SYM_MATRIX && symMatrix )
   {
     using Scalar = std::remove_reference_t< decltype( symMatrix[ 0 ] ) >;

     // Compute the inverse into scratch storage with the two argument overload, then copy it back.
     Scalar inverse[ 6 ];
     auto const det = symInvert( inverse, symMatrix );
     copy< 6 >( symMatrix, inverse );

     return det;
   }

   /**
    * @brief Multiply a packed 3x3 symmetric matrix with a vector: dstVector[i] = A[i][j] * vectorB[j].
    * @tparam DST_VECTOR The type of @p dstVector.
    * @tparam SYM_MATRIX_A The type of @p symMatrixA.
    * @tparam VECTOR_B The type of @p vectorB.
    * @param dstVector The vector of length 3 that receives the product.
    * @param symMatrixA The packed symmetric matrix (length 6), holding the dense entries
    *   (0,0), (1,1), (2,2), (1,2), (0,2), (0,1) in that order.
    * @param vectorB The vector of length 3 being multiplied.
    */
   template< typename DST_VECTOR, typename SYM_MATRIX_A, typename VECTOR_B >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void Ri_eq_symAijBj( DST_VECTOR && LVARRAY_RESTRICT_REF dstVector,
                               SYM_MATRIX_A const & LVARRAY_RESTRICT_REF symMatrixA,
                               VECTOR_B const & LVARRAY_RESTRICT_REF vectorB )
   {
     checkSizes< 3 >( dstVector );
     checkSizes< 6 >( symMatrixA );
     checkSizes< 3 >( vectorB );

     // Unpack the symmetric storage into dense entry names.
     auto const a00 = symMatrixA[ 0 ];
     auto const a11 = symMatrixA[ 1 ];
     auto const a22 = symMatrixA[ 2 ];
     auto const a12 = symMatrixA[ 3 ];
     auto const a02 = symMatrixA[ 4 ];
     auto const a01 = symMatrixA[ 5 ];

     dstVector[ 0 ] = a00 * vectorB[ 0 ] + a01 * vectorB[ 1 ] + a02 * vectorB[ 2 ];
     dstVector[ 1 ] = a01 * vectorB[ 0 ] + a11 * vectorB[ 1 ] + a12 * vectorB[ 2 ];
     dstVector[ 2 ] = a02 * vectorB[ 0 ] + a12 * vectorB[ 1 ] + a22 * vectorB[ 2 ];
   }

   /**
    * @brief Add the product of a packed 3x3 symmetric matrix and a vector to @p dstVector:
    *   dstVector[i] = dstVector[i] + A[i][j] * vectorB[j].
    * @tparam DST_VECTOR The type of @p dstVector.
    * @tparam SYM_MATRIX_A The type of @p symMatrixA.
    * @tparam VECTOR_B The type of @p vectorB.
    * @param dstVector The vector of length 3 that is added to.
    * @param symMatrixA The packed symmetric matrix (length 6), holding the dense entries
    *   (0,0), (1,1), (2,2), (1,2), (0,2), (0,1) in that order.
    * @param vectorB The vector of length 3 being multiplied.
    */
   template< typename DST_VECTOR, typename SYM_MATRIX_A, typename VECTOR_B >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void Ri_add_symAijBj( DST_VECTOR && LVARRAY_RESTRICT_REF dstVector,
                                SYM_MATRIX_A const & LVARRAY_RESTRICT_REF symMatrixA,
                                VECTOR_B const & LVARRAY_RESTRICT_REF vectorB )
   {
     checkSizes< 3 >( dstVector );
     checkSizes< 6 >( symMatrixA );
     checkSizes< 3 >( vectorB );

     // Unpack the symmetric storage into dense entry names.
     auto const a00 = symMatrixA[ 0 ];
     auto const a11 = symMatrixA[ 1 ];
     auto const a22 = symMatrixA[ 2 ];
     auto const a12 = symMatrixA[ 3 ];
     auto const a02 = symMatrixA[ 4 ];
     auto const a01 = symMatrixA[ 5 ];

     // The existing value is the left-most operand so the terms are accumulated onto it one by one.
     dstVector[ 0 ] = dstVector[ 0 ] + a00 * vectorB[ 0 ] + a01 * vectorB[ 1 ] + a02 * vectorB[ 2 ];
     dstVector[ 1 ] = dstVector[ 1 ] + a01 * vectorB[ 0 ] + a11 * vectorB[ 1 ] + a12 * vectorB[ 2 ];
     dstVector[ 2 ] = dstVector[ 2 ] + a02 * vectorB[ 0 ] + a12 * vectorB[ 1 ] + a22 * vectorB[ 2 ];
   }

   /**
    * @brief Multiply a packed 3x3 symmetric matrix with the transpose of a 3x3 matrix:
    *   dstMatrix[i][j] = A[i][k] * matrixB[j][k].
    * @tparam DST_MATRIX The type of @p dstMatrix.
    * @tparam SYM_MATRIX_A The type of @p symMatrixA.
    * @tparam MATRIX_B The type of @p matrixB.
    * @param dstMatrix The 3x3 matrix that receives the product.
    * @param symMatrixA The packed symmetric matrix (length 6), holding the dense entries
    *   (0,0), (1,1), (2,2), (1,2), (0,2), (0,1) in that order.
    * @param matrixB The 3x3 matrix whose rows are contracted against the rows of A.
    */
   template< typename DST_MATRIX, typename SYM_MATRIX_A, typename MATRIX_B >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void Rij_eq_symAikBjk( DST_MATRIX && LVARRAY_RESTRICT_REF dstMatrix,
                                 SYM_MATRIX_A const & LVARRAY_RESTRICT_REF symMatrixA,
                                 MATRIX_B const & LVARRAY_RESTRICT_REF matrixB )
   {
     checkSizes< 3, 3 >( dstMatrix );
     checkSizes< 6 >( symMatrixA );
     checkSizes< 3, 3 >( matrixB );

     // Unpack the symmetric storage into dense entry names.
     auto const a00 = symMatrixA[ 0 ];
     auto const a11 = symMatrixA[ 1 ];
     auto const a22 = symMatrixA[ 2 ];
     auto const a12 = symMatrixA[ 3 ];
     auto const a02 = symMatrixA[ 4 ];
     auto const a01 = symMatrixA[ 5 ];

     // Column j of the result is A applied to row j of matrixB.
     for( int j = 0; j < 3; ++j )
     {
       dstMatrix[ 0 ][ j ] = a00 * matrixB[ j ][ 0 ] +
                             a01 * matrixB[ j ][ 1 ] +
                             a02 * matrixB[ j ][ 2 ];
       dstMatrix[ 1 ][ j ] = a01 * matrixB[ j ][ 0 ] +
                             a11 * matrixB[ j ][ 1 ] +
                             a12 * matrixB[ j ][ 2 ];
       dstMatrix[ 2 ][ j ] = a02 * matrixB[ j ][ 0 ] +
                             a12 * matrixB[ j ][ 1 ] +
                             a22 * matrixB[ j ][ 2 ];
     }
   }

   /**
    * @brief Compute the packed symmetric product dst[i][j] = matrixA[i][k] * B[k][l] * matrixA[j][l]
    *   for 3x3 matrices.
    * @tparam DST_SYM_MATRIX The type of @p dstSymMatrix.
    * @tparam MATRIX_A The type of @p matrixA.
    * @tparam SYM_MATRIX_B The type of @p symMatrixB.
    * @param dstSymMatrix The packed symmetric matrix (length 6) that receives the result.
    * @param matrixA The 3x3 matrix applied on both sides.
    * @param symMatrixB The packed symmetric matrix (length 6), holding the dense entries
    *   (0,0), (1,1), (2,2), (1,2), (0,2), (0,1) in that order.
    */
   template< typename DST_SYM_MATRIX, typename MATRIX_A, typename SYM_MATRIX_B >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void Rij_eq_AikSymBklAjl( DST_SYM_MATRIX && LVARRAY_RESTRICT_REF dstSymMatrix,
                                    MATRIX_A const & LVARRAY_RESTRICT_REF matrixA,
                                    SYM_MATRIX_B const & LVARRAY_RESTRICT_REF symMatrixB )
   {
     checkSizes< 6 >( dstSymMatrix );
     checkSizes< 3, 3 >( matrixA );
     checkSizes< 6 >( symMatrixB );

     // Unpack the symmetric storage into dense entry names.
     auto const b00 = symMatrixB[ 0 ];
     auto const b11 = symMatrixB[ 1 ];
     auto const b22 = symMatrixB[ 2 ];
     auto const b12 = symMatrixB[ 3 ];
     auto const b02 = symMatrixB[ 4 ];
     auto const b01 = symMatrixB[ 5 ];

     // For each packed slot, the row of matrixA used on the left and the row used on the right.
     // The slots are (0,0), (1,1), (2,2), (1,2), (0,2), (0,1).
     int const leftRow[ 6 ] = { 0, 1, 2, 1, 0, 0 };
     int const rightRow[ 6 ] = { 0, 1, 2, 2, 2, 1 };

     for( int slot = 0; slot < 6; ++slot )
     {
       int const i = leftRow[ slot ];
       int const j = rightRow[ slot ];

       // The nine terms are summed with k as the outer index and l as the inner index.
       dstSymMatrix[ slot ] = matrixA[ i ][ 0 ] * b00 * matrixA[ j ][ 0 ] +
                              matrixA[ i ][ 0 ] * b01 * matrixA[ j ][ 1 ] +
                              matrixA[ i ][ 0 ] * b02 * matrixA[ j ][ 2 ] +
                              matrixA[ i ][ 1 ] * b01 * matrixA[ j ][ 0 ] +
                              matrixA[ i ][ 1 ] * b11 * matrixA[ j ][ 1 ] +
                              matrixA[ i ][ 1 ] * b12 * matrixA[ j ][ 2 ] +
                              matrixA[ i ][ 2 ] * b02 * matrixA[ j ][ 0 ] +
                              matrixA[ i ][ 2 ] * b12 * matrixA[ j ][ 1 ] +
                              matrixA[ i ][ 2 ] * b22 * matrixA[ j ][ 2 ];
     }
   }

   /**
    * @brief Store the outer product of a length 3 vector with itself as a packed symmetric matrix.
    * @tparam DST_MATRIX The type of @p dstMatrix.
    * @tparam VECTOR_A The type of @p vectorA.
    * @param dstMatrix The packed symmetric matrix (length 6) that receives vectorA[i] * vectorA[j],
    *   in the order (0,0), (1,1), (2,2), (1,2), (0,2), (0,1).
    * @param vectorA The vector of length 3.
    */
   template< typename DST_MATRIX, typename VECTOR_A >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void symRij_eq_AiAj( DST_MATRIX && LVARRAY_RESTRICT_REF dstMatrix,
                               VECTOR_A const & LVARRAY_RESTRICT_REF vectorA )
   {
     internal::checkSizes< 6 >( dstMatrix );
     internal::checkSizes< 3 >( vectorA );

     auto const a0 = vectorA[ 0 ];
     auto const a1 = vectorA[ 1 ];
     auto const a2 = vectorA[ 2 ];

     // Diagonal entries.
     dstMatrix[ 0 ] = a0 * a0;
     dstMatrix[ 1 ] = a1 * a1;
     dstMatrix[ 2 ] = a2 * a2;

     // Off-diagonal entries (1,2), (0,2) and (0,1).
     dstMatrix[ 3 ] = a1 * a2;
     dstMatrix[ 4 ] = a0 * a2;
     dstMatrix[ 5 ] = a0 * a1;
   }

   /**
    * @brief Store the symmetric sum vectorA[i] * vectorB[j] + vectorA[j] * vectorB[i] for length 3
    *   vectors as a packed symmetric matrix.
    * @tparam DST_SYM_MATRIX The type of @p dstMatrix.
    * @tparam VECTOR_A The type of @p vectorA.
    * @tparam VECTOR_B The type of @p vectorB.
    * @param dstMatrix The packed symmetric matrix (length 6) that receives the result, in the order
    *   (0,0), (1,1), (2,2), (1,2), (0,2), (0,1).
    * @param vectorA The first vector of length 3.
    * @param vectorB The second vector of length 3.
    */
   template< typename DST_SYM_MATRIX, typename VECTOR_A, typename VECTOR_B >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void symRij_eq_AiBj_plus_AjBi( DST_SYM_MATRIX && LVARRAY_RESTRICT_REF dstMatrix,
                                         VECTOR_A const & LVARRAY_RESTRICT_REF vectorA,
                                         VECTOR_B const & LVARRAY_RESTRICT_REF vectorB )
   {
     internal::checkSizes< 6 >( dstMatrix );
     internal::checkSizes< 3 >( vectorA );
     internal::checkSizes< 3 >( vectorB );

     auto const a0 = vectorA[ 0 ];
     auto const a1 = vectorA[ 1 ];
     auto const a2 = vectorA[ 2 ];
     auto const b0 = vectorB[ 0 ];
     auto const b1 = vectorB[ 1 ];
     auto const b2 = vectorB[ 2 ];

     // On the diagonal both terms of the sum coincide, hence the factor of two.
     dstMatrix[ 0 ] = 2 * a0 * b0;
     dstMatrix[ 1 ] = 2 * a1 * b1;
     dstMatrix[ 2 ] = 2 * a2 * b2;

     // Off-diagonal entries (1,2), (0,2) and (0,1).
     dstMatrix[ 3 ] = a1 * b2 + a2 * b1;
     dstMatrix[ 4 ] = a0 * b2 + a2 * b0;
     dstMatrix[ 5 ] = a0 * b1 + a1 * b0;
   }

   /**
    * @brief Compute the eigenvalues of the 3x3 symmetric matrix @p symMatrix.
    * @param eigenvalues Output of length 3. Its entry type is used as the working
    *   floating point type.
    * @param symMatrix Input of length 6. It is copied, not modified.
    */
   template< typename DST_VECTOR, typename SYM_MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void symEigenvalues( DST_VECTOR && LVARRAY_RESTRICT_REF eigenvalues,
                               SYM_MATRIX const & LVARRAY_RESTRICT_REF symMatrix )
   {
     checkSizes< 3 >( eigenvalues );
     checkSizes< 6 >( symMatrix );

     using FloatingPoint = std::decay_t< decltype( eigenvalues[ 0 ] ) >;

     // Shift and scale a local copy so that the input stays untouched.
     FloatingPoint scaledMatrix[ 6 ];
     copy< 6 >( scaledMatrix, symMatrix );

     FloatingPoint traceShift;
     FloatingPoint scaleFactor;
     shiftAndScale< 3 >( scaledMatrix, traceShift, scaleFactor );

     eigenvaluesOfShiftedMatrix( eigenvalues, scaledMatrix );

     // Undo the scaling and then the shift to recover the eigenvalues of the input.
     for( int i = 0; i < 3; ++i )
     {
       eigenvalues[ i ] = scaleFactor * eigenvalues[ i ] + traceShift;
     }
   }

   /**
    * @brief Compute the eigenvalues and eigenvectors of the 3x3 symmetric matrix @p symMatrix.
    * @param eigenvalues Output of length 3. Its entry type is used as the working
    *   floating point type.
    * @param eigenvectors 3x3 output; row i receives the eigenvector paired with eigenvalues[ i ].
    * @param symMatrix Input of length 6. It is copied, not modified.
    */
   template< typename DST_VECTOR, typename DST_MATRIX, typename SYM_MATRIX >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static void symEigenvectors( DST_VECTOR && LVARRAY_RESTRICT_REF eigenvalues,
                                DST_MATRIX && LVARRAY_RESTRICT_REF eigenvectors,
                                SYM_MATRIX const & LVARRAY_RESTRICT_REF symMatrix )
   {
     checkSizes< 3 >( eigenvalues );
     checkSizes< 3, 3 >( eigenvectors );
     checkSizes< 6 >( symMatrix );

     using FloatingPoint = std::decay_t< decltype( eigenvalues[ 0 ] ) >;

     // Shift and scale a local copy so that the input stays untouched.
     FloatingPoint scaledMatrix[ 6 ];
     copy< 6 >( scaledMatrix, symMatrix );

     FloatingPoint traceShift;
     FloatingPoint scaleFactor;
     shiftAndScale< 3 >( scaledMatrix, traceShift, scaleFactor );

     eigenvaluesOfShiftedMatrix( eigenvalues, scaledMatrix );

     // The eigenvectors are computed from the shifted and scaled problem.
     FloatingPoint const spread = eigenvalues[ 2 ] - eigenvalues[ 0 ];
     if( spread <= NumericLimits< FloatingPoint >::epsilon )
     {
       // The three eigenvalues are numerically equal, so the identity is returned.
       LVARRAY_TENSOROPS_ASSIGN_3x3( eigenvectors,
                                     1, 0, 0,
                                     0, 1, 0,
                                     0, 0, 1 );
     }
     else
     {
       // Start with the eigenvalue that is furthest from its neighbour. The eigenvalues
       // are sorted, so this is either the last or the first one.
       auto const upperGap = eigenvalues[ 2 ] - eigenvalues[ 1 ];
       auto const lowerGap = eigenvalues[ 1 ] - eigenvalues[ 0 ];
       int const mostDistinct = ( upperGap > lowerGap ) ? 2 : 0;
       int const secondMostDistinct = 2 - mostDistinct;

       // Subtracting that eigenvalue from the diagonal leaves a rank 2 matrix whose
       // nullspace is the eigenvector we are after.
       FloatingPoint const firstValue = eigenvalues[ mostDistinct ];
       FloatingPoint tmp[ 3 ][ 3 ] = {
         { scaledMatrix[ 0 ] - firstValue, scaledMatrix[ 5 ], scaledMatrix[ 4 ] },
         { scaledMatrix[ 5 ], scaledMatrix[ 1 ] - firstValue, scaledMatrix[ 3 ] },
         { scaledMatrix[ 4 ], scaledMatrix[ 3 ], scaledMatrix[ 2 ] - firstValue }
       };

       int const row = getNullVector( eigenvectors[ mostDistinct ], tmp );

       // Now handle the eigenvector at the opposite end of the spectrum.
       FloatingPoint const minEigenvalueSpacing = math::abs( eigenvalues[ secondMostDistinct ] - eigenvalues[ 1 ] );
       if( minEigenvalueSpacing <= 2 * NumericLimits< FloatingPoint >::epsilon * spread )
       {
         // The remaining two eigenvalues are numerically equal, so the normalized
         // row picked by getNullVector is used directly.
         FloatingPoint const rowNormSquared = l2NormSquared< 3 >( tmp[ row ] );
         scaledCopy< 3 >( eigenvectors[ secondMostDistinct ], tmp[ row ], math::invSqrt( rowNormSquared ) );
       }
       else
       {
         // Only the diagonal changes when the subtracted eigenvalue changes.
         for( int i = 0; i < 3; ++i )
         {
           tmp[ i ][ i ] = scaledMatrix[ i ] - eigenvalues[ secondMostDistinct ];
         }

         getNullVector( eigenvectors[ secondMostDistinct ], tmp );
       }

       // The middle eigenvector is the normalized cross product of the outer two.
       crossProduct( eigenvectors[ 1 ], eigenvectors[ 2 ], eigenvectors[ 0 ] );
       normalize< 3 >( eigenvectors[ 1 ] );
     }

     // Undo the scaling and then the shift to recover the eigenvalues of the input.
     for( int i = 0; i < 3; ++i )
     {
       eigenvalues[ i ] = scaleFactor * eigenvalues[ i ] + traceShift;
     }
   }

   /**
    * @brief Pack the diagonal and upper triangle of the 3x3 @p srcMatrix into @p dstSymMatrix.
    * @param dstSymMatrix Destination of length 6. Slots 0-2 take the diagonal and
    *   slots 3-5 take the (1,2), (0,2), (0,1) entries.
    * @param srcMatrix The 3x3 source; entries below the diagonal are not read.
    */
   template< typename DST_SYM_MATRIX, typename SRC_MATRIX >
   LVARRAY_HOST_DEVICE inline CONSTEXPR_WITHOUT_BOUNDS_CHECK
   static void denseToSymmetric( DST_SYM_MATRIX && dstSymMatrix, SRC_MATRIX const & srcMatrix )
   {
     tensorOps::internal::checkSizes< 6 >( dstSymMatrix );
     tensorOps::internal::checkSizes< 3, 3 >( srcMatrix );

     // Diagonal entries come first.
     for( int i = 0; i < 3; ++i )
     {
       dstSymMatrix[ i ] = srcMatrix[ i ][ i ];
     }

     // Then the upper triangle: (1,2), (0,2), (0,1).
     dstSymMatrix[ 3 ] = srcMatrix[ 1 ][ 2 ];
     dstSymMatrix[ 4 ] = srcMatrix[ 0 ][ 2 ];
     dstSymMatrix[ 5 ] = srcMatrix[ 0 ][ 1 ];
   }

   /**
    * @brief Expand the length-6 @p srcSymMatrix into the full 3x3 @p dstMatrix.
    * @param dstMatrix The 3x3 destination; all nine entries are written.
    * @param srcSymMatrix Source of length 6. Slots 0-2 are the diagonal and
    *   slots 3-5 are the (1,2), (0,2), (0,1) entries.
    */
   template< typename DST_MATRIX, typename SRC_SYM_MATRIX >
   LVARRAY_HOST_DEVICE inline CONSTEXPR_WITHOUT_BOUNDS_CHECK
   static void symmetricToDense( DST_MATRIX && dstMatrix, SRC_SYM_MATRIX const & srcSymMatrix )
   {
     tensorOps::internal::checkSizes< 3, 3 >( dstMatrix );
     tensorOps::internal::checkSizes< 6 >( srcSymMatrix );

     // Diagonal.
     for( int i = 0; i < 3; ++i )
     {
       dstMatrix[ i ][ i ] = srcSymMatrix[ i ];
     }

     // Upper triangle.
     dstMatrix[ 0 ][ 1 ] = srcSymMatrix[ 5 ];
     dstMatrix[ 0 ][ 2 ] = srcSymMatrix[ 4 ];
     dstMatrix[ 1 ][ 2 ] = srcSymMatrix[ 3 ];

     // Lower triangle mirrors the upper one.
     dstMatrix[ 1 ][ 0 ] = srcSymMatrix[ 5 ];
     dstMatrix[ 2 ][ 0 ] = srcSymMatrix[ 4 ];
     dstMatrix[ 2 ][ 1 ] = srcSymMatrix[ 3 ];
   }

 private:
   /**
    * @brief Compute the eigenvalues of a 3x3 symmetric matrix whose trace is zero.
    * @param eigenvalues Output of length 3, written in ascending order.
    * @param matrix The length-6 symmetric matrix; the computation relies on its trace being zero.
    */
   template< typename FloatingPoint, typename VECTOR >
   LVARRAY_HOST_DEVICE inline
   static void eigenvaluesOfShiftedMatrix( VECTOR && eigenvalues,
                                           FloatingPoint const ( &matrix )[ 6 ] )
   {
     /*
        Write the 3x3 symmetric matrix A as
           a0, a5, a4
           a5, a1, a3
           a4, a3, a2
        An eigenvalue x of A satisfies the characteristic equation
           x^3 - tr(A) * x^2 - 0.5 * (tr(A^2) - tr(A)^2) * x - det( A ) = 0
        Because the shifted matrix has zero trace this reduces to
           x^3 - 0.5 * tr(A^2) * x - det( A ) = 0

        The method mixes the wikipedia algorithm with Eigen's algorithm: the wikipedia
        route to theta needs one less sqrt, while Eigen's conversion from theta to the
        roots is faster.

        https://en.wikipedia.org/wiki/Eigenvalue_algorithm#3%C3%973_matrices.
        https://gitlab.com/libeigen/eigen/-/blob/3.3/Eigen/src/Eigenvalues/SelfAdjointEigenSolver.h#L567
      */

     // trace(A) = 0 means a2 = -a1 - a0, which is what lets trace(A^2) / 6 be written this way.
     FloatingPoint const oneSixthTraceASquared =
       ( matrix[ 2 ] * matrix[ 2 ] - matrix[ 0 ] * matrix[ 1 ] + matrix[ 3 ] * matrix[ 3 ] +
         matrix[ 4 ] * matrix[ 4 ] + matrix[ 5 ] * matrix[ 5 ] ) / 3;

     FloatingPoint const rho = math::sqrt( oneSixthTraceASquared );

     // Determinant of the matrix divided by rho; left at zero when rho is not positive.
     FloatingPoint scaledDet = 0;
     if( rho > 0 )
     {
       scaledDet = symDeterminant( matrix ) / ( rho * rho * rho );
     }

     // scaledDet should lie in [-2, 2], but floating point error can push it slightly
     // outside, so half of it is clamped to [-1, 1] before calling acos.
     FloatingPoint halfScaledDet = scaledDet / 2;
     if( scaledDet > 2 )
     {
       halfScaledDet = 1;
     }
     else if( scaledDet < -2 )
     {
       halfScaledDet = -1;
     }

     FloatingPoint const theta = math::acos( halfScaledDet ) / 3;

     FloatingPoint sinTheta, cosTheta;
     math::sincos( theta, sinTheta, cosTheta );

     // theta lies in [0, pi/3], so the three roots below come out in ascending order.
     constexpr FloatingPoint sqrtThree = 1.73205080756887729352744;
     eigenvalues[ 0 ] = -rho * ( cosTheta + sqrtThree * sinTheta ); // == 2 * rho * cos( theta + 2pi/3 )
     eigenvalues[ 1 ] = -rho * ( cosTheta - sqrtThree * sinTheta ); // == 2 * rho * cos( theta - 2pi/3 )
     eigenvalues[ 2 ] = 2 * rho * cosTheta;
   }

   /**
    * @brief Compute a unit vector spanning the nullspace of the rank 2 3x3 symmetric matrix @p mat.
    * @param nullVector Output of length 3 that receives the normalized null vector.
    * @param mat The 3x3 matrix.
    * @return The index of the row of @p mat whose diagonal entry has the largest absolute value.
    */
   template< typename FLOAT, typename VECTOR >
   LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK inline
   static int getNullVector( VECTOR && nullVector, FLOAT const (&mat)[ 3 ][ 3 ] )
   {
     // Pick the row whose diagonal entry is largest in magnitude; ties fall to the later row.
     FLOAT const diag0 = math::abs( mat[ 0 ][ 0 ] );
     FLOAT const diag1 = math::abs( mat[ 1 ][ 1 ] );
     FLOAT const diag2 = math::abs( mat[ 2 ][ 2 ] );

     int row = 2;
     if( diag0 > diag1 )
     {
       if( diag0 > diag2 )
       { row = 0; }
     }
     else if( diag1 > diag2 )
     { row = 1; }

     int const nextRow = ( row + 1 ) % 3;
     int const lastRow = ( row + 2 ) % 3;

     // Cross the chosen row with each of the other two rows to get two candidates.
     crossProduct( nullVector, mat[ row ], mat[ nextRow ] );
     FLOAT const firstNormSquared = l2NormSquared< 3 >( nullVector );

     FLOAT otherCandidate[ 3 ];
     crossProduct( otherCandidate, mat[ row ], mat[ lastRow ] );
     FLOAT const otherNormSquared = l2NormSquared< 3 >( otherCandidate );

     // Keep whichever candidate is longer and normalize it.
     if( firstNormSquared > otherNormSquared )
     {
       scale< 3 >( nullVector, math::invSqrt( firstNormSquared ) );
     }
     else
     {
       scaledCopy< 3 >( nullVector, otherCandidate, math::invSqrt( otherNormSquared ) );
     }

     return row;
   }
 };

 } // namespace internal
 } // namespace tensorOps
 } // namespace LvArray
LvArray::tensorOps::internal::SquareMatrixOps< 3 >::symDeterminant
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK auto symDeterminant(SYM_MATRIX const &symMatrix)
Definition: fixedSizeSquareMatrixOpsImpl.hpp:667

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::symEigenvectors
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void symEigenvectors(DST_VECTOR &&LVARRAY_RESTRICT_REF eigenvalues, DST_MATRIX &&LVARRAY_RESTRICT_REF eigenvectors, SYM_MATRIX const &LVARRAY_RESTRICT_REF symMatrix)
Compute the eigenvalues and eigenvectors of the symmetric matrix symMatrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:431

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::getNullVector
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK int getNullVector(VECTOR &&nullVector, FLOAT const (&mat)[3][3])
Extract the nullspace of the rank 2 3x3 symmetric matrix mat.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:1230

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::symEigenvectors
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void symEigenvectors(DST_VECTOR &&LVARRAY_RESTRICT_REF eigenvalues, DST_MATRIX &&LVARRAY_RESTRICT_REF eigenvectors, SYM_MATRIX const &LVARRAY_RESTRICT_REF symMatrix)
Compute the eigenvalues and eigenvectors of the symmetric matrix symMatrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:1043

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::symDeterminant
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK auto symDeterminant(SYM_MATRIX const &symMatrix)
Definition: fixedSizeSquareMatrixOpsImpl.hpp:156

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::symInvert
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK auto symInvert(DST_SYM_MATRIX &&LVARRAY_RESTRICT_REF dstSymMatrix, SRC_SYM_MATRIX const &LVARRAY_RESTRICT_REF srcSymMatrix)
Invert the symmetric matrix srcSymMatrix and store the result in dstSymMatrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:689

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::symEigenvalues
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void symEigenvalues(DST_VECTOR &&LVARRAY_RESTRICT_REF eigenvalues, SYM_MATRIX const &LVARRAY_RESTRICT_REF symMatrix)
Compute the eigenvalues of the symmetric matrix symMatrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:394

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::symInvert
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK auto symInvert(SYM_MATRIX &&symMatrix)
Invert the symmetric matrix symMatrix, overwriting it.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:725

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::invert
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK auto invert(MATRIX &&matrix)
Invert the matrix matrix, overwriting it.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:133

LvArray::tensorOps::internal::SquareMatrixOps
Performs operations on square matrices.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:71

LvArray::tensorOps::internal::shiftAndScale
static LVARRAY_HOST_DEVICE void shiftAndScale(FloatingPoint(&matrix)[(M *(M+1))/2], FloatingPoint &shift, FloatingPoint &maxEntryAfterShift)
Shift and scale the MxM symmetric matrix matrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:38

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::eigenvaluesOfShiftedMatrix
static LVARRAY_HOST_DEVICE void eigenvaluesOfShiftedMatrix(VECTOR &&eigenvalues, FloatingPoint const (&matrix)[6])
Compute the eigenvalues of the 3x3 symmetric matrix matrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:1175

LvArray::tensorOps::invert
LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK auto invert(DST_MATRIX &&LVARRAY_RESTRICT_REF dstMatrix, SRC_MATRIX const &LVARRAY_RESTRICT_REF srcMatrix)
Invert the source matrix srcMatrix and store the result in dstMatrix.
Definition: fixedSizeSquareMatrixOps.hpp:53

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::Rij_eq_AikSymBklAjl
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void Rij_eq_AikSymBklAjl(DST_SYM_MATRIX &&LVARRAY_RESTRICT_REF dstSymMatrix, MATRIX_A const &LVARRAY_RESTRICT_REF matrixA, SYM_MATRIX_B const &LVARRAY_RESTRICT_REF symMatrixB)
Multiply the transpose of matrix matrixA by the symmetric matrix symMatrixB then by matrixA and store...
Definition: fixedSizeSquareMatrixOpsImpl.hpp:867

LvArray::tensorOps::symDeterminant
LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK auto symDeterminant(SYM_MATRIX const &symMatrix)
Definition: fixedSizeSquareMatrixOps.hpp:229

LvArray::math::acos
LVARRAY_HOST_DEVICE float acos(float const x)
Definition: math.hpp:888

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::Rij_eq_symAikBjk
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void Rij_eq_symAikBjk(DST_MATRIX &&LVARRAY_RESTRICT_REF dstMatrix, SYM_MATRIX_A const &LVARRAY_RESTRICT_REF symMatrixA, MATRIX_B const &LVARRAY_RESTRICT_REF matrixB)
Multiply the transpose of matrix matrixB by the symmetric matrix symMatrixA and store the result in d...
Definition: fixedSizeSquareMatrixOpsImpl.hpp:813

LVARRAY_TENSOROPS_ASSIGN_3x3
#define LVARRAY_TENSOROPS_ASSIGN_3x3(var, exp00, exp01, exp02, exp10, exp11, exp12, exp20, exp21, exp22)
Assign to the 3x3 matrix var.
Definition: genericTensorOps.hpp:137

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::symmetricToDense
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void symmetricToDense(DST_MATRIX &&dstMatrix, SRC_SYM_MATRIX const &srcSymMatrix)
Convert the srcSymMatrix into a dense matrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:520

genericTensorOps.hpp
Contains the implementation of arbitrary sized vector and matrix operations.

CONSTEXPR_WITHOUT_BOUNDS_CHECK
#define CONSTEXPR_WITHOUT_BOUNDS_CHECK
Expands to constexpr when array bound checking is disabled.
Definition: Macros.hpp:609

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::Ri_add_symAijBj
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void Ri_add_symAijBj(DST_VECTOR &&LVARRAY_RESTRICT_REF dstVector, SYM_MATRIX_A const &LVARRAY_RESTRICT_REF symMatrixA, VECTOR_B const &LVARRAY_RESTRICT_REF vectorB)
Multiply the vector vectorB by the symmetric matrix symMatrixA and add the result to dstVector...
Definition: fixedSizeSquareMatrixOpsImpl.hpp:252

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::symmetricToDense
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void symmetricToDense(DST_MATRIX &&dstMatrix, SRC_SYM_MATRIX const &srcSymMatrix)
Convert the srcSymMatrix into a dense matrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:1147

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::symInvert
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK auto symInvert(SYM_MATRIX &&symMatrix)
Invert the symmetric matrix symMatrix, overwriting it.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:200

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::determinant
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK auto determinant(MATRIX const &matrix)
Definition: fixedSizeSquareMatrixOpsImpl.hpp:573

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::symInvert
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK auto symInvert(DST_SYM_MATRIX &&LVARRAY_RESTRICT_REF dstSymMatrix, SRC_SYM_MATRIX const &LVARRAY_RESTRICT_REF srcSymMatrix)
Invert the symmetric matrix srcSymMatrix and store the result in dstSymMatrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:173

LvArray::math::sincos
LVARRAY_HOST_DEVICE void sincos(float const theta, float &sinTheta, float &cosTheta)
Compute the sine and cosine of theta.
Definition: math.hpp:636

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::invert
LVARRAY_HOST_DEVICE static constexpr auto invert(MATRIX &&matrix)
Invert the matrix matrix, overwriting it.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:632

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::invert
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK auto invert(DST_MATRIX &&LVARRAY_RESTRICT_REF dstMatrix, SRC_MATRIX const &LVARRAY_RESTRICT_REF srcMatrix)
Invert the source matrix srcMatrix and store the result in dstMatrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:593

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::Rij_eq_AikSymBklAjl
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void Rij_eq_AikSymBklAjl(DST_SYM_MATRIX &&LVARRAY_RESTRICT_REF dstSymMatrix, MATRIX_A const &LVARRAY_RESTRICT_REF matrixA, SYM_MATRIX_B const &LVARRAY_RESTRICT_REF symMatrixB)
Multiply the transpose of matrix matrixA by the symmetric matrix symMatrixB then by matrixA and store...
Definition: fixedSizeSquareMatrixOpsImpl.hpp:307

LvArray::math::sqrt
LVARRAY_HOST_DEVICE float sqrt(float const x)
Definition: math.hpp:461

LvArray
The top level namespace.
Definition: Array.hpp:24

LvArray::tensorOps::crossProduct
LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK void crossProduct(DST_VECTOR &&LVARRAY_RESTRICT_REF dstVector, VECTOR_A const &LVARRAY_RESTRICT_REF vectorA, VECTOR_B const &LVARRAY_RESTRICT_REF vectorB)
Compute the cross product of vectorA and vectorB and put it in dstVector.
Definition: genericTensorOps.hpp:792

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::symEigenvalues
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void symEigenvalues(DST_VECTOR &&LVARRAY_RESTRICT_REF eigenvalues, SYM_MATRIX const &LVARRAY_RESTRICT_REF symMatrix)
Compute the eigenvalues of the symmetric matrix symMatrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:1007

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::invert
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK auto invert(DST_MATRIX &&LVARRAY_RESTRICT_REF dstMatrix, SRC_MATRIX const &LVARRAY_RESTRICT_REF srcMatrix)
Invert the source matrix srcMatrix and store the result in dstMatrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:105

LvArray::tensorOps::determinant
LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK auto determinant(MATRIX const &matrix)
Definition: fixedSizeSquareMatrixOps.hpp:38

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::symRij_eq_AiBj_plus_AjBi
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void symRij_eq_AiBj_plus_AjBi(DST_SYM_MATRIX &&LVARRAY_RESTRICT_REF dstMatrix, VECTOR_A const &LVARRAY_RESTRICT_REF vectorA, VECTOR_B const &LVARRAY_RESTRICT_REF vectorB)
Perform the unscaled symmetric outer product of vectorA and vectorB writing the result to dstMatrix...
Definition: fixedSizeSquareMatrixOpsImpl.hpp:370

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::symRij_eq_AiAj
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void symRij_eq_AiAj(DST_MATRIX &&LVARRAY_RESTRICT_REF dstMatrix, VECTOR_A const &LVARRAY_RESTRICT_REF vectorA)
Perform the outer product of vectorA with itself writing the result to dstMatrix. ...
Definition: fixedSizeSquareMatrixOpsImpl.hpp:346

LvArray::NumericLimits
A wrapper for the std::numeric_limits< T > member functions, this allows their values to be used on d...
Definition: limits.hpp:36

LvArray::math::abs
LVARRAY_HOST_DEVICE constexpr T abs(T const x)
Definition: math.hpp:402

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::symRij_eq_AiAj
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void symRij_eq_AiAj(DST_MATRIX &&LVARRAY_RESTRICT_REF dstMatrix, VECTOR_A const &LVARRAY_RESTRICT_REF vectorA)
Perform the outer product of vectorA with itself writing the result to dstMatrix. ...
Definition: fixedSizeSquareMatrixOpsImpl.hpp:953

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::Ri_eq_symAijBj
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void Ri_eq_symAijBj(DST_VECTOR &&LVARRAY_RESTRICT_REF dstVector, SYM_MATRIX_A const &LVARRAY_RESTRICT_REF symMatrixA, VECTOR_B const &LVARRAY_RESTRICT_REF vectorB)
Multiply the vector vectorB by the symmetric matrix symMatrixA and store the result in dstVector...
Definition: fixedSizeSquareMatrixOpsImpl.hpp:747

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::eigenvaluesOfShiftedMatrix
static LVARRAY_HOST_DEVICE void eigenvaluesOfShiftedMatrix(VECTOR &&eigenvalues, FloatingPoint const (&matrix)[3])
Compute the eigenvalues of the 2x2 symmetric matrix matrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:543

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::symRij_eq_AiBj_plus_AjBi
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void symRij_eq_AiBj_plus_AjBi(DST_SYM_MATRIX &&LVARRAY_RESTRICT_REF dstMatrix, VECTOR_A const &LVARRAY_RESTRICT_REF vectorA, VECTOR_B const &LVARRAY_RESTRICT_REF vectorB)
Perform the unscaled symmetric outer product of vectorA and vectorB writing the result to dstMatrix...
Definition: fixedSizeSquareMatrixOpsImpl.hpp:980

LvArray::math::invSqrt
LVARRAY_HOST_DEVICE float invSqrt(float const x)
Definition: math.hpp:503

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::Ri_eq_symAijBj
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void Ri_eq_symAijBj(DST_VECTOR &&LVARRAY_RESTRICT_REF dstVector, SYM_MATRIX_A const &LVARRAY_RESTRICT_REF symMatrixA, VECTOR_B const &LVARRAY_RESTRICT_REF vectorB)
Multiply the vector vectorB by the symmetric matrix symMatrixA and store the result in dstVector...
Definition: fixedSizeSquareMatrixOpsImpl.hpp:228

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::determinant
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK auto determinant(MATRIX const &matrix)
Definition: fixedSizeSquareMatrixOpsImpl.hpp:88

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::denseToSymmetric
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void denseToSymmetric(DST_SYM_MATRIX &&dstSymMatrix, SRC_MATRIX const &srcMatrix)
Convert the upper triangular part of srcMatrix to a symmetric matrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:501

LVARRAY_TENSOROPS_ASSIGN_2x2
#define LVARRAY_TENSOROPS_ASSIGN_2x2(var, exp00, exp01, exp10, exp11)
Assign to the 2x2 matrix var.
Definition: genericTensorOps.hpp:111

LvArray::tensorOps::symInvert
LVARRAY_HOST_DEVICE CONSTEXPR_WITHOUT_BOUNDS_CHECK auto symInvert(DST_SYM_MATRIX &&LVARRAY_RESTRICT_REF dstSymMatrix, SRC_SYM_MATRIX const &LVARRAY_RESTRICT_REF srcSymMatrix)
Invert the symmetric matrix srcSymMatrix and store the result in dstSymMatrix.
Definition: fixedSizeSquareMatrixOps.hpp:244

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::Ri_add_symAijBj
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void Ri_add_symAijBj(DST_VECTOR &&LVARRAY_RESTRICT_REF dstVector, SYM_MATRIX_A const &LVARRAY_RESTRICT_REF symMatrixA, VECTOR_B const &LVARRAY_RESTRICT_REF vectorB)
Multiply the vector vectorB by the symmetric matrix symMatrixA and add the result to dstVector...
Definition: fixedSizeSquareMatrixOpsImpl.hpp:778

LVARRAY_HOST_DEVICE
#define LVARRAY_HOST_DEVICE
Mark a function for both host and device usage.
Definition: Macros.hpp:549

LvArray::tensorOps::internal::SquareMatrixOps< 2 >::Rij_eq_symAikBjk
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void Rij_eq_symAikBjk(DST_MATRIX &&LVARRAY_RESTRICT_REF dstMatrix, SYM_MATRIX_A const &LVARRAY_RESTRICT_REF symMatrixA, MATRIX_B const &LVARRAY_RESTRICT_REF matrixB)
Multiply the transpose of matrix matrixB by the symmetric matrix symMatrixA and store the result in d...
Definition: fixedSizeSquareMatrixOpsImpl.hpp:277

LvArray::tensorOps::internal::SquareMatrixOps< 3 >::denseToSymmetric
LVARRAY_HOST_DEVICE static CONSTEXPR_WITHOUT_BOUNDS_CHECK void denseToSymmetric(DST_SYM_MATRIX &&dstSymMatrix, SRC_MATRIX const &srcMatrix)
Convert the upper triangular part of srcMatrix to a symmetric matrix.
Definition: fixedSizeSquareMatrixOpsImpl.hpp:1125