Go to the source code of this file.
Defines | |
#define | B_ID(index, i) (index+(bStride*(i))) |
#define | C_ID(index, i) (index+(cStride*(i))) |
Functions | |
template<typename T > | |
dxGlobal void | cudaComputeAdcfmBT (int4 *bodyIDs, typename vec4< T >::Type *j0, typename vec4< T >::Type *j1, typename vec4< T >::Type *j2, typename vec4< T >::Type *j3, typename vec4< T >::Type *ij0, typename vec4< T >::Type *ij1, typename vec4< T >::Type *ij2, typename vec4< T >::Type *ij3, T *adcfm, T *rhs, T sorParam, int numConstraints) |
template<typename T > | |
dxGlobal void | cudaComputeInvMJTT (int4 *bodyIDs, typename vec4< T >::Type *j0, typename vec4< T >::Type *j1, typename vec4< T >::Type *j2, typename vec4< T >::Type *j3, typename vec4< T >::Type *ij0, typename vec4< T >::Type *ij1, typename vec4< T >::Type *ij2, typename vec4< T >::Type *ij3, T *iMass, int numConstraints, typename vec4< T >::Type *ii0, typename vec4< T >::Type *ii1, typename vec4< T >::Type *ii2) |
template<typename T > | |
dxGlobal void | cudaIntegrateT (typename vec4< T >::Type *pos, typename vec4< T >::Type *lVel, typename vec4< T >::Type *aVel, float deltaTime, int numConstraints) |
template<typename T > | |
dxGlobal void | cudaReduceIterativeCompactT (typename vec4< T >::Type *fc0_reduction, typename vec4< T >::Type *fc1_reduction, const int treePower) |
template<typename T > | |
dxGlobal void | cudaReduceLoopedCompactT (typename vec4< T >::Type *fc0_reduction, typename vec4< T >::Type *fc1_reduction, const int size, const int step) |
template<typename T , unsigned int blockSize> | |
dxGlobal void | cudaReduceSequentialT (typename vec4< T >::Type *fc0, typename vec4< T >::Type *fc1, typename vec4< T >::Type *fc0_reduction, typename vec4< T >::Type *fc1_reduction, int n) |
template<typename T > | |
dxGlobal void | cudaReduceStridedT (typename vec4< T >::Type *fc0, typename vec4< T >::Type *fc1, const typename vec4< T >::Type *fc0_reduction, const typename vec4< T >::Type *fc1_reduction, const int reductionStride, const int bodySize, const int reductionSize) |
template<typename T > | |
dxGlobal void | cudaSORLCPT (typename vec4< T >::Type *fc0_reduction, typename vec4< T >::Type *fc1_reduction, T *lambda, const int4 *bodyIDs, const int *fIDs, const typename vec4< T >::Type *j, const typename vec4< T >::Type *ij, const typename vec4< T >::Type *fc0, const typename vec4< T >::Type *fc1, const T *adcfm, const T *rhs, const T *hilo, const int offset, const int numConstraints, const int bStride, const int cStride) |
template<typename T > | |
dxGlobal void | cudaZeroT (T *buffer, const int bufferSize) |
template<typename T > | |
static dxDevice T | parallel_inf () |
template<> | |
dxDevice double | parallel_inf< double > () |
template<> | |
dxDevice float | parallel_inf< float > () |
template<typename T > | |
static dxDevice T | parallel_zero () |
template<> | |
dxDevice double | parallel_zero< double > () |
template<> | |
dxDevice double4 | parallel_zero< double4 > () |
template<> | |
dxDevice float | parallel_zero< float > () |
template<> | |
dxDevice float4 | parallel_zero< float4 > () |
Variables | |
static uint2 | s_blockDim |
static uint2 | s_blockIdx |
static uint2 | s_threadIdx |
#define B_ID(index, i) (index+(bStride*(i)))
Definition at line 5 of file parallel_kernels.h.
#define C_ID(index, i) (index+(cStride*(i)))
Definition at line 4 of file parallel_kernels.h.
dxGlobal void cudaComputeAdcfmBT | ( | int4 * | bodyIDs, |
typename vec4< T >::Type * | j0, | ||
typename vec4< T >::Type * | j1, | ||
typename vec4< T >::Type * | j2, | ||
typename vec4< T >::Type * | j3, | ||
typename vec4< T >::Type * | ij0, | ||
typename vec4< T >::Type * | ij1, | ||
typename vec4< T >::Type * | ij2, | ||
typename vec4< T >::Type * | ij3, | ||
T * | adcfm, | ||
T * | rhs, | ||
T | sorParam, | ||
int | numConstraints | ||
) |
Definition at line 399 of file parallel_kernels.h.
dxGlobal void cudaComputeInvMJTT | ( | int4 * | bodyIDs, |
typename vec4< T >::Type * | j0, | ||
typename vec4< T >::Type * | j1, | ||
typename vec4< T >::Type * | j2, | ||
typename vec4< T >::Type * | j3, | ||
typename vec4< T >::Type * | ij0, | ||
typename vec4< T >::Type * | ij1, | ||
typename vec4< T >::Type * | ij2, | ||
typename vec4< T >::Type * | ij3, | ||
T * | iMass, | ||
int | numConstraints, | ||
typename vec4< T >::Type * | ii0, | ||
typename vec4< T >::Type * | ii1, | ||
typename vec4< T >::Type * | ii2 | ||
) |
Definition at line 321 of file parallel_kernels.h.
dxGlobal void cudaIntegrateT | ( | typename vec4< T >::Type * | pos, |
typename vec4< T >::Type * | lVel, | ||
typename vec4< T >::Type * | aVel, | ||
float | deltaTime, | ||
int | numConstraints | ||
) |
Definition at line 457 of file parallel_kernels.h.
dxGlobal void cudaReduceIterativeCompactT | ( | typename vec4< T >::Type * | fc0_reduction, |
typename vec4< T >::Type * | fc1_reduction, | ||
const int | treePower | ||
) |
Definition at line 157 of file parallel_kernels.h.
dxGlobal void cudaReduceLoopedCompactT | ( | typename vec4< T >::Type * | fc0_reduction, |
typename vec4< T >::Type * | fc1_reduction, | ||
const int | size, | ||
const int | step | ||
) |
Definition at line 180 of file parallel_kernels.h.
dxGlobal void cudaReduceSequentialT | ( | typename vec4< T >::Type * | fc0, |
typename vec4< T >::Type * | fc1, | ||
typename vec4< T >::Type * | fc0_reduction, | ||
typename vec4< T >::Type * | fc1_reduction, | ||
int | n | ||
) |
Definition at line 240 of file parallel_kernels.h.
dxGlobal void cudaReduceStridedT | ( | typename vec4< T >::Type * | fc0, |
typename vec4< T >::Type * | fc1, | ||
const typename vec4< T >::Type * | fc0_reduction, | ||
const typename vec4< T >::Type * | fc1_reduction, | ||
const int | reductionStride, | ||
const int | bodySize, | ||
const int | reductionSize | ||
) |
Definition at line 209 of file parallel_kernels.h.
dxGlobal void cudaSORLCPT | ( | typename vec4< T >::Type * | fc0_reduction, |
typename vec4< T >::Type * | fc1_reduction, | ||
T * | lambda, | ||
const int4 * | bodyIDs, | ||
const int * | fIDs, | ||
const typename vec4< T >::Type * | j, | ||
const typename vec4< T >::Type * | ij, | ||
const typename vec4< T >::Type * | fc0, | ||
const typename vec4< T >::Type * | fc1, | ||
const T * | adcfm, | ||
const T * | rhs, | ||
const T * | hilo, | ||
const int | offset, | ||
const int | numConstraints, | ||
const int | bStride, | ||
const int | cStride | ||
) |
Definition at line 38 of file parallel_kernels.h.
dxGlobal void cudaZeroT | ( | T * | buffer, |
const int | bufferSize | ||
) |
Definition at line 27 of file parallel_kernels.h.
static dxDevice T parallel_inf | ( | ) | [inline, static] |
Definition at line 9 of file parallel_kernels.h.
dxDevice double parallel_inf< double > | ( | ) | [inline] |
Definition at line 20 of file parallel_kernels.h.
dxDevice float parallel_inf< float > | ( | ) | [inline] |
Definition at line 12 of file parallel_kernels.h.
static dxDevice T parallel_zero | ( | ) | [inline, static] |
Definition at line 10 of file parallel_kernels.h.
dxDevice double parallel_zero< double > | ( | ) | [inline] |
Definition at line 21 of file parallel_kernels.h.
dxDevice double4 parallel_zero< double4 > | ( | ) | [inline] |
Definition at line 22 of file parallel_kernels.h.
dxDevice float parallel_zero< float > | ( | ) | [inline] |
Definition at line 13 of file parallel_kernels.h.
dxDevice float4 parallel_zero< float4 > | ( | ) | [inline] |
Definition at line 14 of file parallel_kernels.h.
uint2 s_blockDim [static] |
Definition at line 7 of file parallel_kernels.h.
uint2 s_blockIdx [static] |
Definition at line 7 of file parallel_kernels.h.
uint2 s_threadIdx [static] |
Definition at line 7 of file parallel_kernels.h.