bullet-2.82-html/html/btSoftBodySolver__DX11SIMDAware_8cpp_source.html

 /*

 Bullet Continuous Collision Detection and Physics Library

 Copyright (c) 2003-2006 Erwin Coumans  http://continuousphysics.com/Bullet/


 This software is provided 'as-is', without any express or implied warranty.

 In no event will the authors be held liable for any damages arising from the use of this software.

 Permission is granted to anyone to use this software for any purpose,

 including commercial applications, and to alter it and redistribute it freely,

 subject to the following restrictions:


 1. The origin of this software must not be misrepresented; you must not claim that you wrote the original software. If you use this software in a product, an acknowledgment in the product documentation would be appreciated but is not required.

 2. Altered source versions must be plainly marked as such, and must not be misrepresented as being the original software.

 3. This notice may not be removed or altered from any source distribution.

 */


 #include <cstdio>


 // Wavefront width used by this solver; passed to the link data as m_wavefrontSize.
 #define WAVEFRONT_SIZE 32

 // Number of wavefronts packed into one dispatched thread group
 // (see the numBlocks computation in solveLinksForPosition and the shader macros in buildShaders).
 #define WAVEFRONT_BLOCK_MULTIPLIER 2

 // Thread-group size; optimize() rounds each cloth's vertex capacity to a multiple of this.
 #define GROUP_SIZE (WAVEFRONT_SIZE*WAVEFRONT_BLOCK_MULTIPLIER)

 // Links handled per SIMD lane; passed to the link data as m_linksPerWorkItem.
 #define LINKS_PER_SIMD_LANE 16


 // Two-level stringification so that a macro argument is expanded before being turned into a string literal.
 #define STRINGIFY( S ) STRINGIFY2( S )

 #define STRINGIFY2( S ) #S


 #include "BulletCollision/CollisionShapes/btTriangleIndexVertexArray.h"

 #include "vectormath/vmInclude.h"


 #include "btSoftBodySolverLinkData_DX11SIMDAware.h"

 #include "btSoftBodySolver_DX11SIMDAware.h"

 #include "btSoftBodySolverVertexBuffer_DX11.h"

 #include "BulletSoftBody/btSoftBody.h"

 #include "BulletCollision/CollisionShapes/btCapsuleShape.h"


 // Turns its argument into a string literal.
 // Presumably each included .hlsl file wraps its shader source in MSTRINGIFY(...) and supplies
 // the terminating ';' for the declaration it completes - TODO confirm against the HLSL directory.
 #define MSTRINGIFY(A) #A

 // Embedded compute shader sources. Every declaration below is completed by the text of the
 // #include that follows it. buildShaders() hands these strings to
 // dxFunctions.compileComputeShaderFromString().
 // NOTE(review): if the included text is a string literal, binding it to a non-const char*
 // relies on a deprecated conversion - confirm before changing the type.
 static char* UpdatePositionsFromVelocitiesHLSLString =

 #include "HLSL/UpdatePositionsFromVelocities.hlsl"

 static char* SolvePositionsSIMDBatchedHLSLString =

 #include "HLSL/SolvePositionsSIMDBatched.hlsl"

 static char* UpdateNodesHLSLString =

 #include "HLSL/UpdateNodes.hlsl"

 static char* UpdatePositionsHLSLString =

 #include "HLSL/UpdatePositions.hlsl"

 static char* UpdateConstantsHLSLString =

 #include "HLSL/UpdateConstants.hlsl"

 static char* IntegrateHLSLString =

 #include "HLSL/Integrate.hlsl"

 static char* ApplyForcesHLSLString =

 #include "HLSL/ApplyForces.hlsl"

 static char* UpdateNormalsHLSLString =

 #include "HLSL/UpdateNormals.hlsl"

 static char* OutputToVertexArrayHLSLString =

 #include "HLSL/OutputToVertexArray.hlsl"

 static char* VSolveLinksHLSLString =

 #include "HLSL/VSolveLinks.hlsl"

 static char* ComputeBoundsHLSLString =

 #include "HLSL/ComputeBounds.hlsl"

 static char* SolveCollisionsAndUpdateVelocitiesHLSLString =

 #include "HLSL/solveCollisionsAndUpdateVelocitiesSIMDBatched.hlsl"


 // Builds the SIMD-aware link data store.
 //
 // d3dDevice / d3dDeviceContext are stored and also handed to every DX11 buffer wrapper,
 // each of which is bound to the host-side array whose address it receives.
 // The wavefront size and links-per-work-item come from the file-level WAVEFRONT_SIZE and
 // LINKS_PER_SIMD_LANE macros; m_maxLinksPerWavefront is their product.
 btSoftBodyLinkDataDX11SIMDAware::btSoftBodyLinkDataDX11SIMDAware( ID3D11Device *d3dDevice, ID3D11DeviceContext *d3dDeviceContext ) :
         m_d3dDevice( d3dDevice ),
         m_d3dDeviceContext( d3dDeviceContext ),
         m_wavefrontSize( WAVEFRONT_SIZE ),
         m_linksPerWorkItem( LINKS_PER_SIMD_LANE ),
         m_maxBatchesWithinWave( 0 ),
         m_maxLinksPerWavefront( m_wavefrontSize * m_linksPerWorkItem ),
         m_numWavefronts( 0 ),
         m_maxVertex( 0 ),
         m_dx11NumBatchesAndVerticesWithinWaves( d3dDevice, d3dDeviceContext, &m_numBatchesAndVerticesWithinWaves, true ),
         m_dx11WavefrontVerticesGlobalAddresses( d3dDevice, d3dDeviceContext, &m_wavefrontVerticesGlobalAddresses, true ),
         m_dx11LinkVerticesLocalAddresses( d3dDevice, d3dDeviceContext, &m_linkVerticesLocalAddresses, true ),
         m_dx11LinkStrength( d3dDevice, d3dDeviceContext, &m_linkStrength, true ),
         m_dx11LinksMassLSC( d3dDevice, d3dDeviceContext, &m_linksMassLSC, true ),
         m_dx11LinksRestLengthSquared( d3dDevice, d3dDeviceContext, &m_linksRestLengthSquared, true ),
         m_dx11LinksRestLength( d3dDevice, d3dDeviceContext, &m_linksRestLength, true ),
         m_dx11LinksMaterialLinearStiffnessCoefficient( d3dDevice, d3dDeviceContext, &m_linksMaterialLinearStiffnessCoefficient, true )
 {
         // onAccelerator() returns m_onGPU, so it must have a defined value before the first
         // moveToAccelerator(); nothing has been uploaded at construction time.
         // Assigned here rather than in the initialiser list so the fix does not depend on
         // where the member is declared.
         m_onGPU = false;
 }


 // Nothing to release explicitly here; the destructor body is intentionally empty.
 btSoftBodyLinkDataDX11SIMDAware::~btSoftBodyLinkDataDX11SIMDAware() {}


 // Converts a btVector3 into a Vectormath Vector3 by copying its X, Y and Z components.
 static Vectormath::Aos::Vector3 toVector3( const btVector3 &vec )
 {
         return Vectormath::Aos::Vector3( vec.getX(), vec.getY(), vec.getZ() );
 }


 // Appends room for numLinks further links, keeping m_linkAddresses the same length as the link storage.
 void btSoftBodyLinkDataDX11SIMDAware::createLinks( int numLinks )
 {
         // Work out the target size before the base class grows m_links.
         const int grownSize = m_links.size() + numLinks;

         btSoftBodyLinkData::createLinks( numLinks );

         // The per-link address table grows alongside the links.
         m_linkAddresses.resize( grownSize );
 }


 // Stores the link description at linkIndex, tracks the largest vertex index seen so far,
 // and initialises the link's address to its own index.
 void btSoftBodyLinkDataDX11SIMDAware::setLinkAt( const btSoftBodyLinkData::LinkDescription &link, int linkIndex )
 {
         btSoftBodyLinkData::setLinkAt( link, linkIndex );

         // Raise the running maximum with each endpoint in turn.
         if( m_maxVertex < link.getVertex0() )
         {
                 m_maxVertex = link.getVertex0();
         }
         if( m_maxVertex < link.getVertex1() )
         {
                 m_maxVertex = link.getVertex1();
         }

         // Identity mapping until the links are reordered elsewhere.
         m_linkAddresses[linkIndex] = linkIndex;
 }


 // Reports the m_onGPU flag maintained by moveToAccelerator() / moveFromAccelerator().
 bool btSoftBodyLinkDataDX11SIMDAware::onAccelerator() { return m_onGPU; }


 // Moves every link buffer to the GPU in a fixed order, stopping at the first failure.
 // Returns true, and sets m_onGPU, only if all of the moves succeeded.
 bool btSoftBodyLinkDataDX11SIMDAware::moveToAccelerator()
 {
         // The && chain short-circuits, so buffers after a failed move are not attempted.
         const bool allMoved =
                 m_dx11NumBatchesAndVerticesWithinWaves.moveToGPU() &&
                 m_dx11WavefrontVerticesGlobalAddresses.moveToGPU() &&
                 m_dx11LinkVerticesLocalAddresses.moveToGPU() &&
                 m_dx11LinkStrength.moveToGPU() &&
                 m_dx11LinksMassLSC.moveToGPU() &&
                 m_dx11LinksRestLengthSquared.moveToGPU() &&
                 m_dx11LinksRestLength.moveToGPU() &&
                 m_dx11LinksMaterialLinearStiffnessCoefficient.moveToGPU();

         if( allMoved )
         {
                 m_onGPU = true;
         }
         return allMoved;
 }


 // Moves every link buffer back from the GPU in a fixed order, stopping at the first failure.
 // Returns true, and clears m_onGPU, only if all of the moves succeeded.
 bool btSoftBodyLinkDataDX11SIMDAware::moveFromAccelerator()
 {
         // The && chain short-circuits, so buffers after a failed move are not attempted.
         const bool allMoved =
                 m_dx11NumBatchesAndVerticesWithinWaves.moveFromGPU() &&
                 m_dx11WavefrontVerticesGlobalAddresses.moveFromGPU() &&
                 m_dx11LinkVerticesLocalAddresses.moveFromGPU() &&
                 m_dx11LinkStrength.moveFromGPU() &&
                 m_dx11LinksMassLSC.moveFromGPU() &&
                 m_dx11LinksRestLengthSquared.moveFromGPU() &&
                 m_dx11LinksRestLength.moveFromGPU() &&
                 m_dx11LinksMaterialLinearStiffnessCoefficient.moveFromGPU();

         if( allMoved )
         {
                 m_onGPU = false;
         }
         return allMoved;
 }


 // Constructs the SIMD-aware solver on top of the generic DX11 solver and creates its link data
 // with the device and context members m_dx11Device / m_dx11Context.
 btDX11SIMDAwareSoftBodySolver::btDX11SIMDAwareSoftBodySolver(ID3D11Device * dx11Device, ID3D11DeviceContext* dx11Context, DXFunctions::CompileFromMemoryFunc dx11CompileFromMemory) :
         btDX11SoftBodySolver( dx11Device, dx11Context, dx11CompileFromMemory ),
         m_linkData(m_dx11Device, m_dx11Context)
 {
         // No kernels have been compiled yet.
         m_shadersInitialized = false;

         // The solver constants have never been computed, so the first updateConstants() must do the work.
         // This flag is currently global to all cloths attached to the solver; making it per-body
         // may be worthwhile once it is clearer when constants actually need refreshing.
         m_updateSolverConstants = true;
 }


 // Releases the compiled kernels when the solver is destroyed.
 btDX11SIMDAwareSoftBodySolver::~btDX11SIMDAwareSoftBodySolver() { releaseKernels(); }


 // Gives access to the solver's SIMD-aware link data through the generic link data interface.
 // TODO: Consider flagging the link data as "changed" whenever it is handed out.
 btSoftBodyLinkData &btDX11SIMDAwareSoftBodySolver::getLinkData() { return m_linkData; }


 // Rebuilds the solver's flattened vertex, triangle and link data from the given soft bodies.
 //
 // softBodies  - the set of soft bodies the solver should simulate.
 // forceUpdate - rebuild even if the number of soft bodies is unchanged.
 //
 // Nothing happens unless forceUpdate is set or the number of bodies differs from the number
 // currently held. On a rebuild all previously loaded data is discarded, every body is copied
 // into the shared arrays, link constants are recomputed, the link and triangle batches are
 // regenerated and the shaders are rebuilt.
 void btDX11SIMDAwareSoftBodySolver::optimize( btAlignedObjectArray< btSoftBody * > &softBodies , bool forceUpdate)
 {
         if( !forceUpdate && m_softBodySet.size() == softBodies.size() )
                 return;

         using Vectormath::Aos::Point3;

         // The soft body set changed: drop everything and reload.
         getVertexData().clear();
         getTriangleData().clear();
         getLinkData().clear();

         // The interface objects are allocated with new below, so free the old ones
         // before forgetting their pointers.
         for( int oldBody = 0; oldBody < m_softBodySet.size(); ++oldBody )
         {
                 delete m_softBodySet[oldBody];
         }
         m_softBodySet.resize(0);

         // The per-cloth arrays are indexed by soft body index and refilled with push_back
         // below, so stale entries from a previous load must go first.
         m_perClothAcceleration.clear();
         m_perClothDampingFactor.clear();
         m_perClothVelocityCorrectionCoefficient.clear();
         m_perClothLiftFactor.clear();
         m_perClothDragFactor.clear();
         m_perClothMediumDensity.clear();
         m_perClothMinBounds.clear();
         m_perClothMaxBounds.clear();
         m_perClothFriction.clear();
         m_perClothCollisionObjects.clear();

         const int numSoftBodies = softBodies.size();
         for( int softBodyIndex = 0; softBodyIndex < numSoftBodies; ++softBodyIndex )
         {
                 btSoftBody *softBody = softBodies[ softBodyIndex ];

                 // Create the object that records where this body lives inside the solver arrays
                 btAcceleratedSoftBodyInterface *newSoftBody = new btAcceleratedSoftBodyInterface( softBody );
                 m_softBodySet.push_back( newSoftBody );

                 m_perClothAcceleration.push_back( toVector3(softBody->getWorldInfo()->m_gravity) );
                 m_perClothDampingFactor.push_back(softBody->m_cfg.kDP);
                 m_perClothVelocityCorrectionCoefficient.push_back( softBody->m_cfg.kVCF );
                 m_perClothLiftFactor.push_back( softBody->m_cfg.kLF );
                 m_perClothDragFactor.push_back( softBody->m_cfg.kDG );
                 m_perClothMediumDensity.push_back(softBody->getWorldInfo()->air_density);
                 // Simple init values. Actually we'll put 0 and -1 into them at the appropriate time
                 m_perClothMinBounds.push_back( UIntVector3( 0, 0, 0 ) );
                 m_perClothMaxBounds.push_back( UIntVector3( UINT_MAX, UINT_MAX, UINT_MAX ) );
                 m_perClothFriction.push_back( softBody->getFriction() );
                 m_perClothCollisionObjects.push_back( CollisionObjectIndices(-1, -1) );

                 // Add space for new vertices and triangles in the default solver for now
                 // TODO: Include space here for tearing too later
                 const int firstVertex = getVertexData().getNumVertices();
                 const int numVertices = softBody->m_nodes.size();
                 // Round maxVertices to a multiple of the workgroup size so we know we're safe to run over in a given group.
                 // Note this always reserves at least one spare slot: an exact multiple gets a whole extra group.
                 // maxVertices can be increased to allow tearing, but should be used sparingly because these extra verts will always be processed
                 const int maxVertices = GROUP_SIZE*((numVertices+GROUP_SIZE)/GROUP_SIZE);
                 // Allocate space for new vertices in all the vertex arrays
                 getVertexData().createVertices( numVertices, softBodyIndex, maxVertices );

                 const int firstTriangle = getTriangleData().getNumTriangles();
                 const int numTriangles = softBody->m_faces.size();
                 const int maxTriangles = numTriangles;
                 getTriangleData().createTriangles( maxTriangles );

                 // Copy vertices from softbody into the solver
                 for( int vertex = 0; vertex < numVertices; ++vertex )
                 {
                         Point3 multPoint(softBody->m_nodes[vertex].m_x.getX(), softBody->m_nodes[vertex].m_x.getY(), softBody->m_nodes[vertex].m_x.getZ());
                         btSoftBodyVertexData::VertexDescription desc;

                         // TODO: Position in the softbody might be pre-transformed
                         // or we may need to adapt for the pose.
                         //desc.setPosition( cloth.getMeshTransform()*multPoint );
                         desc.setPosition( multPoint );

                         float vertexInverseMass = softBody->m_nodes[vertex].m_im;
                         desc.setInverseMass(vertexInverseMass);
                         getVertexData().setVertexAt( desc, firstVertex + vertex );
                 }

                 // Copy triangles similarly.
                 // Face node pointers are turned into indices relative to this body's first node;
                 // the shared arrays are indexed globally, so firstVertex is added to each one.
                 for( int triangle = 0; triangle < numTriangles; ++triangle )
                 {
                         const int vertexIndex0 = static_cast<int>( softBody->m_faces[triangle].m_n[0] - &(softBody->m_nodes[0]) );
                         const int vertexIndex1 = static_cast<int>( softBody->m_faces[triangle].m_n[1] - &(softBody->m_nodes[0]) );
                         const int vertexIndex2 = static_cast<int>( softBody->m_faces[triangle].m_n[2] - &(softBody->m_nodes[0]) );
                         btSoftBodyTriangleData::TriangleDescription newTriangle(vertexIndex0 + firstVertex, vertexIndex1 + firstVertex, vertexIndex2 + firstVertex);
                         getTriangleData().setTriangleAt( newTriangle, firstTriangle + triangle );

                         // Increase vertex triangle counts for this triangle
                         getVertexData().getTriangleCount(newTriangle.getVertexSet().vertex0)++;
                         getVertexData().getTriangleCount(newTriangle.getVertexSet().vertex1)++;
                         getVertexData().getTriangleCount(newTriangle.getVertexSet().vertex2)++;
                 }

                 const int firstLink = getLinkData().getNumLinks();
                 const int numLinks = softBody->m_links.size();

                 // Allocate space for the links
                 getLinkData().createLinks( numLinks );

                 // Add the links, again converting node pointers to global vertex indices
                 for( int link = 0; link < numLinks; ++link )
                 {
                         const int vertexIndex0 = static_cast<int>( softBody->m_links[link].m_n[0] - &(softBody->m_nodes[0]) );
                         const int vertexIndex1 = static_cast<int>( softBody->m_links[link].m_n[1] - &(softBody->m_nodes[0]) );

                         btSoftBodyLinkData::LinkDescription newLink(vertexIndex0 + firstVertex, vertexIndex1 + firstVertex, softBody->m_links[link].m_material->m_kLST);
                         newLink.setLinkStrength(1.f);
                         getLinkData().setLinkAt(newLink, firstLink + link);
                 }

                 newSoftBody->setFirstVertex( firstVertex );
                 newSoftBody->setFirstTriangle( firstTriangle );
                 newSoftBody->setNumVertices( numVertices );
                 newSoftBody->setMaxVertices( maxVertices );
                 newSoftBody->setNumTriangles( numTriangles );
                 newSoftBody->setMaxTriangles( maxTriangles );
                 newSoftBody->setFirstLink( firstLink );
                 newSoftBody->setNumLinks( numLinks );
         }

         // The links were recreated from scratch, so their rest lengths and mass terms must be
         // recomputed; updateConstants() only does that while this flag is set.
         m_updateSolverConstants = true;
         updateConstants(0.f);

         m_linkData.generateBatches();
         m_triangleData.generateBatches();

         // Build the shaders to match the batching parameters
         buildShaders();
 }


 // Runs the position-based link solve and then the collision / velocity update for one step.
 //
 // solverdt - the solver time step; its reciprocal is passed to solveCollisionsAndUpdateVelocities(),
 //            so it must be non-zero.
 void btDX11SIMDAwareSoftBodySolver::solveConstraints( float solverdt )
 {
         // Both values are forwarded unchanged to every solveLinksForPosition() call.
         const float kst = 1.f;
         const float ti = 0.f;

         m_dx11PerClothDampingFactor.moveToGPU();
         m_dx11PerClothVelocityCorrectionCoefficient.moveToGPU();

         // Ensure data is on accelerator
         m_linkData.moveToAccelerator();
         m_vertexData.moveToAccelerator();

         prepareCollisionConstraints();

         // Solve drift: every iteration walks all wavefront batches in order.
         const int numBatches = m_linkData.m_wavefrontBatchStartLengths.size();
         for( int iteration = 0; iteration < m_numberOfPositionIterations ; ++iteration )
         {
                 for( int batch = 0; batch < numBatches; ++batch )
                 {
                         const int startWave = m_linkData.m_wavefrontBatchStartLengths[batch].start;
                         const int numWaves = m_linkData.m_wavefrontBatchStartLengths[batch].length;

                         solveLinksForPosition( startWave, numWaves, kst, ti );
                 }
         }

         // At this point assume that the force array is blank - we will overwrite it
         solveCollisionsAndUpdateVelocities( 1.f/solverdt );
 } // btDX11SIMDAwareSoftBodySolver::solveConstraints


 void btDX11SIMDAwareSoftBodySolver::updateConstants( float timeStep )

 {

         using namespace Vectormath::Aos;


         if( m_updateSolverConstants )

         {

                 m_updateSolverConstants = false;


                 // Will have to redo this if we change the structure (tear, maybe) or various other possible changes


                 // Initialise link constants

                 const int numLinks = m_linkData.getNumLinks();

                 for( int linkIndex = 0; linkIndex < numLinks; ++linkIndex )

                 {

                         btSoftBodyLinkData::LinkNodePair &vertices( m_linkData.getVertexPair(linkIndex) );

                         m_linkData.getRestLength(linkIndex) = length((m_vertexData.getPosition( vertices.vertex0 ) - m_vertexData.getPosition( vertices.vertex1 )));

                         float invMass0 = m_vertexData.getInverseMass(vertices.vertex0);

                         float invMass1 = m_vertexData.getInverseMass(vertices.vertex1);

                         float linearStiffness = m_linkData.getLinearStiffnessCoefficient(linkIndex);

                         float massLSC = (invMass0 + invMass1)/linearStiffness;

                         m_linkData.getMassLSC(linkIndex) = massLSC;

                         float restLength = m_linkData.getRestLength(linkIndex);

                         float restLengthSquared = restLength*restLength;

                         m_linkData.getRestLengthSquared(linkIndex) = restLengthSquared;

                 }

         }

 } // btDX11SIMDAwareSoftBodySolver::updateConstants


 // Kernel dispatches


 // Dispatches the SIMD-batched position solve kernel for one batch of wavefronts.
 //
 // startWave - index of the first wavefront in the batch.
 // numWaves  - number of wavefronts in the batch.
 // kst, ti   - copied unchanged into the kernel's constant buffer.
 //
 // If the constant buffer cannot be mapped the dispatch is skipped, since the kernel would
 // otherwise run with stale parameters.
 void btDX11SIMDAwareSoftBodySolver::solveLinksForPosition( int startWave, int numWaves, float kst, float ti )
 {
         m_vertexData.moveToAccelerator();
         m_linkData.moveToAccelerator();

         // Kernel parameters to upload
         SolvePositionsFromLinksKernelCB constBuffer;

         // First wave of the batch and the number of waves
         constBuffer.startWave = startWave;
         constBuffer.numWaves = numWaves;

         constBuffer.kst = kst;
         constBuffer.ti = ti;

         D3D11_MAPPED_SUBRESOURCE MappedResource = {0};
         // Map returns an HRESULT; negative values are failures. The original ignored it and
         // would then memcpy into a null pData.
         if( m_dx11Context->Map( solvePositionsFromLinksKernel.constBuffer, 0, D3D11_MAP_WRITE_DISCARD, 0, &MappedResource ) < 0
                 || MappedResource.pData == NULL )
         {
                 return;
         }
         memcpy( MappedResource.pData, &constBuffer, sizeof(SolvePositionsFromLinksKernelCB) );
         m_dx11Context->Unmap( solvePositionsFromLinksKernel.constBuffer, 0 );
         m_dx11Context->CSSetConstantBuffers( 0, 1, &solvePositionsFromLinksKernel.constBuffer );

         // Read-only inputs occupy shader resource slots 0-5
         m_dx11Context->CSSetShaderResources( 0, 1, &(m_linkData.m_dx11NumBatchesAndVerticesWithinWaves.getSRV()) );
         m_dx11Context->CSSetShaderResources( 1, 1, &(m_linkData.m_dx11WavefrontVerticesGlobalAddresses.getSRV()) );
         m_dx11Context->CSSetShaderResources( 2, 1, &(m_vertexData.m_dx11VertexInverseMass.getSRV()) );
         m_dx11Context->CSSetShaderResources( 3, 1, &(m_linkData.m_dx11LinkVerticesLocalAddresses.getSRV()) );
         m_dx11Context->CSSetShaderResources( 4, 1, &(m_linkData.m_dx11LinksMassLSC.getSRV()) );
         m_dx11Context->CSSetShaderResources( 5, 1, &(m_linkData.m_dx11LinksRestLengthSquared.getSRV()) );

         // Vertex positions are the only writable resource
         m_dx11Context->CSSetUnorderedAccessViews( 0, 1, &(m_vertexData.m_dx11VertexPosition.getUAV()), NULL );

         // Execute the kernel: one thread group per WAVEFRONT_BLOCK_MULTIPLIER waves, rounded up
         m_dx11Context->CSSetShader( solvePositionsFromLinksKernel.kernel, NULL, 0 );

         const int numBlocks = ( numWaves + WAVEFRONT_BLOCK_MULTIPLIER - 1 ) / WAVEFRONT_BLOCK_MULTIPLIER;
         m_dx11Context->Dispatch( numBlocks, 1, 1 );

         {
                 // Tidy up: unbind everything that was bound above
                 ID3D11ShaderResourceView* pViewNULL = NULL;
                 for( int slot = 0; slot < 6; ++slot )
                 {
                         m_dx11Context->CSSetShaderResources( slot, 1, &pViewNULL );
                 }

                 ID3D11UnorderedAccessView* pUAViewNULL = NULL;
                 m_dx11Context->CSSetUnorderedAccessViews( 0, 1, &pUAViewNULL, NULL );

                 ID3D11Buffer *pBufferNull = NULL;
                 m_dx11Context->CSSetConstantBuffers( 0, 1, &pBufferNull );
         }
 } // btDX11SIMDAwareSoftBodySolver::solveLinksForPosition


 // End kernel dispatches


 // Compiles every compute kernel used by the solver from the embedded HLSL strings.
 //
 // Returns true if each compiled kernel ended up with a constant buffer (or if the shaders
 // were already flagged as initialised); m_shadersInitialized is set only on full success.
 //
 // NOTE(review): releaseKernels() runs before the m_shadersInitialized test. Unless
 // releaseKernels() also clears that flag, an initialised solver would release its kernels
 // and then return without rebuilding them - confirm.
 bool btDX11SIMDAwareSoftBodySolver::buildShaders()
 {
         // Ensure current kernels are released first
         releaseKernels();

         if( m_shadersInitialized )
                 return true;

         bool allBuilt = true;

         updatePositionsFromVelocitiesKernel = dxFunctions.compileComputeShaderFromString( UpdatePositionsFromVelocitiesHLSLString, "UpdatePositionsFromVelocitiesKernel", sizeof(UpdatePositionsFromVelocitiesCB) );
         allBuilt = allBuilt && ( updatePositionsFromVelocitiesKernel.constBuffer != 0 );

         // The position solve kernel is specialised through preprocessor macros whose values
         // are passed as decimal strings.
         char maxVerticesPerWavefront[20];
         sprintf(maxVerticesPerWavefront, "%d", m_linkData.getMaxVerticesPerWavefront());

         char maxBatchesPerWavefront[20];
         sprintf(maxBatchesPerWavefront, "%d", m_linkData.getMaxBatchesPerWavefront());

         char waveFrontSize[20];
         sprintf(waveFrontSize, "%d", m_linkData.getWavefrontSize());

         char waveFrontBlockMultiplier[20];
         sprintf(waveFrontBlockMultiplier, "%d", WAVEFRONT_BLOCK_MULTIPLIER);

         char blockSize[20];
         sprintf(blockSize, "%d", WAVEFRONT_BLOCK_MULTIPLIER*m_linkData.getWavefrontSize());

         // Name/value pairs, closed by a null pair.
         D3D10_SHADER_MACRO solvePositionsMacros[6] = { "MAX_NUM_VERTICES_PER_WAVE", maxVerticesPerWavefront, "MAX_BATCHES_PER_WAVE", maxBatchesPerWavefront, "WAVEFRONT_SIZE", waveFrontSize, "WAVEFRONT_BLOCK_MULTIPLIER", waveFrontBlockMultiplier, "BLOCK_SIZE", blockSize, 0, 0 };

         solvePositionsFromLinksKernel = dxFunctions.compileComputeShaderFromString( SolvePositionsSIMDBatchedHLSLString, "SolvePositionsFromLinksKernel", sizeof(SolvePositionsFromLinksKernelCB), solvePositionsMacros );
         allBuilt = allBuilt && ( solvePositionsFromLinksKernel.constBuffer != 0 );

         updateVelocitiesFromPositionsWithVelocitiesKernel = dxFunctions.compileComputeShaderFromString( UpdateNodesHLSLString, "updateVelocitiesFromPositionsWithVelocitiesKernel", sizeof(UpdateVelocitiesFromPositionsWithVelocitiesCB) );
         allBuilt = allBuilt && ( updateVelocitiesFromPositionsWithVelocitiesKernel.constBuffer != 0 );

         updateVelocitiesFromPositionsWithoutVelocitiesKernel = dxFunctions.compileComputeShaderFromString( UpdatePositionsHLSLString, "updateVelocitiesFromPositionsWithoutVelocitiesKernel", sizeof(UpdateVelocitiesFromPositionsWithoutVelocitiesCB));
         allBuilt = allBuilt && ( updateVelocitiesFromPositionsWithoutVelocitiesKernel.constBuffer != 0 );

         integrateKernel = dxFunctions.compileComputeShaderFromString( IntegrateHLSLString, "IntegrateKernel", sizeof(IntegrateCB) );
         allBuilt = allBuilt && ( integrateKernel.constBuffer != 0 );

         applyForcesKernel = dxFunctions.compileComputeShaderFromString( ApplyForcesHLSLString, "ApplyForcesKernel", sizeof(ApplyForcesCB) );
         allBuilt = allBuilt && ( applyForcesKernel.constBuffer != 0 );

         solveCollisionsAndUpdateVelocitiesKernel = dxFunctions.compileComputeShaderFromString( SolveCollisionsAndUpdateVelocitiesHLSLString, "SolveCollisionsAndUpdateVelocitiesKernel", sizeof(SolveCollisionsAndUpdateVelocitiesCB) );
         allBuilt = allBuilt && ( solveCollisionsAndUpdateVelocitiesKernel.constBuffer != 0 );

         // The three normal/area kernels are separate entry points in the same HLSL source.
         resetNormalsAndAreasKernel = dxFunctions.compileComputeShaderFromString( UpdateNormalsHLSLString, "ResetNormalsAndAreasKernel", sizeof(UpdateSoftBodiesCB) );
         allBuilt = allBuilt && ( resetNormalsAndAreasKernel.constBuffer != 0 );

         normalizeNormalsAndAreasKernel = dxFunctions.compileComputeShaderFromString( UpdateNormalsHLSLString, "NormalizeNormalsAndAreasKernel", sizeof(UpdateSoftBodiesCB) );
         allBuilt = allBuilt && ( normalizeNormalsAndAreasKernel.constBuffer != 0 );

         updateSoftBodiesKernel = dxFunctions.compileComputeShaderFromString( UpdateNormalsHLSLString, "UpdateSoftBodiesKernel", sizeof(UpdateSoftBodiesCB) );
         allBuilt = allBuilt && ( updateSoftBodiesKernel.constBuffer != 0 );

         computeBoundsKernel = dxFunctions.compileComputeShaderFromString( ComputeBoundsHLSLString, "ComputeBoundsKernel", sizeof(ComputeBoundsCB) );
         allBuilt = allBuilt && ( computeBoundsKernel.constBuffer != 0 );

         if( allBuilt )
         {
                 m_shadersInitialized = true;
         }
         return allBuilt;
 } // btDX11SIMDAwareSoftBodySolver::buildShaders


 // Converts a btTransform into a Vectormath Transform3: columns 0-2 receive the basis columns
 // and column 3 receives the origin.
 static Vectormath::Aos::Transform3 toTransform3( const btTransform &transform )
 {
         Vectormath::Aos::Transform3 converted;

         for( int column = 0; column < 3; ++column )
         {
                 converted.setCol( column, toVector3( transform.getBasis().getColumn( column ) ) );
         }
         converted.setCol( 3, toVector3( transform.getOrigin() ) );

         return converted;
 }


 static void generateBatchesOfWavefronts( btAlignedObjectArray < btAlignedObjectArray <int> > &linksForWavefronts, btSoftBodyLinkData &linkData, int numVertices, btAlignedObjectArray < btAlignedObjectArray <int> > &wavefrontBatches )

 {

         // A per-batch map of truth values stating whether a given vertex is in that batch

         // This allows us to significantly optimize the batching

         btAlignedObjectArray <btAlignedObjectArray<bool> > mapOfVerticesInBatches;


         for( int waveIndex = 0; waveIndex < linksForWavefronts.size(); ++waveIndex )

         {

                 btAlignedObjectArray <int> &wavefront( linksForWavefronts[waveIndex] );


                 int batch = 0;

                 bool placed = false;

                 while( batch < wavefrontBatches.size() && !placed )

                 {

                         // Test the current batch, see if this wave shares any vertex with the waves in the batch

                         bool foundSharedVertex = false;

                         for( int link = 0; link < wavefront.size(); ++link )

                         {

                                 btSoftBodyLinkData::LinkNodePair vertices = linkData.getVertexPair( wavefront[link] );

                                 if( (mapOfVerticesInBatches[batch])[vertices.vertex0] || (mapOfVerticesInBatches[batch])[vertices.vertex1] )

                                 {

                                         foundSharedVertex = true;

                                 }

                         }


                         if( !foundSharedVertex )

                         {

                                 wavefrontBatches[batch].push_back( waveIndex );

                                 // Insert vertices into this batch too

                                 for( int link = 0; link < wavefront.size(); ++link )

                                 {

                                         btSoftBodyLinkData::LinkNodePair vertices = linkData.getVertexPair( wavefront[link] );

                                         (mapOfVerticesInBatches[batch])[vertices.vertex0] = true;

                                         (mapOfVerticesInBatches[batch])[vertices.vertex1] = true;

                                 }

                                 placed = true;

                         }

                         batch++;

                 }

                 if( batch == wavefrontBatches.size() && !placed )

                 {

                         wavefrontBatches.resize( batch + 1 );

                         wavefrontBatches[batch].push_back( waveIndex );


                         // And resize map as well

                         mapOfVerticesInBatches.resize( batch + 1 );


                         // Resize maps with total number of vertices

                         mapOfVerticesInBatches[batch].resize( numVertices+1, false );


                         // Insert vertices into this batch too

                         for( int link = 0; link < wavefront.size(); ++link )

                         {

                                 btSoftBodyLinkData::LinkNodePair vertices = linkData.getVertexPair( wavefront[link] );

                                 (mapOfVerticesInBatches[batch])[vertices.vertex0] = true;

                                 (mapOfVerticesInBatches[batch])[vertices.vertex1] = true;

                         }

                 }

         }

         mapOfVerticesInBatches.clear();

 }


 // Function to remove an object from a vector maintaining correct ordering of the vector

 // Removes the element at indexToRemove while keeping the order of the remaining elements:
 // later elements are shifted down one place and the array shrinks by one (if it was non-empty).
 template< typename T > static void removeFromVector( btAlignedObjectArray< T > &vectorToUpdate, int indexToRemove )
 {
         const int lastIndex = vectorToUpdate.size() - 1;

         for( int dst = indexToRemove; dst < lastIndex; ++dst )
         {
                 vectorToUpdate[dst] = vectorToUpdate[dst + 1];
         }

         if( lastIndex >= 0 )
         {
                 vectorToUpdate.resize( lastIndex );
         }
 }


 // Inserts element at position index, growing the array by one and shifting the elements
 // from index onwards up one place.
 template< typename T > static void insertAtIndex( btAlignedObjectArray< T > &vectorToUpdate, int index, T element )
 {
         const int oldSize = vectorToUpdate.size();
         vectorToUpdate.resize( oldSize + 1 );

         // Walk down from the new last slot so nothing is overwritten before it is moved.
         for( int dst = oldSize; dst > index; --dst )
         {
                 vectorToUpdate[dst] = vectorToUpdate[dst - 1];
         }

         vectorToUpdate[index] = element;
 }


 // Inserts element into an ascending array at its ordered position, unless the element found
 // at that position already compares equal to it.
 template< typename T > static void insertUniqueAndOrderedIntoVector( btAlignedObjectArray<T> &vectorToUpdate, T element )
 {
         const int count = vectorToUpdate.size();

         // Find the first slot whose value is not less than the element.
         int position = 0;
         for( ; position < count; ++position )
         {
                 if( !( vectorToUpdate[position] < element ) )
                         break;
         }

         const bool alreadyPresent = ( position < count ) && !( vectorToUpdate[position] != element );
         if( !alreadyPresent )
         {
                 insertAtIndex( vectorToUpdate, position, element );
         }
 }


 static void generateLinksPerVertex( int numVertices, btSoftBodyLinkData &linkData, btAlignedObjectArray< int > &listOfLinksPerVertex, btAlignedObjectArray <int> &numLinksPerVertex, int &maxLinks )

 {

         for( int linkIndex = 0; linkIndex < linkData.getNumLinks(); ++linkIndex )

         {

                 btSoftBodyLinkData::LinkNodePair nodes( linkData.getVertexPair(linkIndex) );

                 numLinksPerVertex[nodes.vertex0]++;

                 numLinksPerVertex[nodes.vertex1]++;

         }

         int maxLinksPerVertex = 0;

         for( int vertexIndex = 0; vertexIndex < numVertices; ++vertexIndex )

         {

                 maxLinksPerVertex = btMax(numLinksPerVertex[vertexIndex], maxLinksPerVertex);

         }

         maxLinks = maxLinksPerVertex;


         btAlignedObjectArray< int > linksFoundPerVertex;

         linksFoundPerVertex.resize( numVertices, 0 );


         listOfLinksPerVertex.resize( maxLinksPerVertex * numVertices );


         for( int linkIndex = 0; linkIndex < linkData.getNumLinks(); ++linkIndex )

         {

                 btSoftBodyLinkData::LinkNodePair nodes( linkData.getVertexPair(linkIndex) );

                 {

                         // Do vertex 0

                         int vertexIndex = nodes.vertex0;

                         int linkForVertex = linksFoundPerVertex[nodes.vertex0];

                         int linkAddress = vertexIndex * maxLinksPerVertex + linkForVertex;


                         listOfLinksPerVertex[linkAddress] = linkIndex;


                         linksFoundPerVertex[nodes.vertex0] = linkForVertex + 1;

                 }

                 {

                         // Do vertex 1

                         int vertexIndex = nodes.vertex1;

                         int linkForVertex = linksFoundPerVertex[nodes.vertex1];

                         int linkAddress = vertexIndex * maxLinksPerVertex + linkForVertex;


                         listOfLinksPerVertex[linkAddress] = linkIndex;


                         linksFoundPerVertex[nodes.vertex1] = linkForVertex + 1;

                 }

         }

 }


 // Group the links of linkData into wavefronts and, inside every wavefront,
 // into batches of links that do not share a vertex.
 //
 // Links are collected by walking the link graph breadth-first from vertex 0,
 // so a wavefront tends to hold links that are close to one another. A
 // wavefront is closed when it holds maxLinksPerWavefront links or when no
 // links remain.
 //
 //  linkData              - links to partition.
 //  wavefrontSize         - upper bound on the number of links in one batch.
 //  linksPerWorkItem      - not used by this function.
 //  maxLinksPerWavefront  - upper bound on the number of links in one wavefront.
 //  linksForWavefronts    - output, appended to: link indices per wavefront.
 //  batchesWithinWaves    - output, appended to: [wave][batch][link in batch].
 //  verticesForWavefronts - output: [wavefront] ascending, duplicate-free list
 //                          of the vertices used by that wavefront's links.
 static void computeBatchingIntoWavefronts(
     btSoftBodyLinkData &linkData,
     int wavefrontSize,
     int linksPerWorkItem,
     int maxLinksPerWavefront,
     btAlignedObjectArray < btAlignedObjectArray <int> > &linksForWavefronts,
     btAlignedObjectArray< btAlignedObjectArray < btAlignedObjectArray <int> > > &batchesWithinWaves, /* wave, batch, links in batch */
     btAlignedObjectArray< btAlignedObjectArray< int > > &verticesForWavefronts /* wavefront, vertex */
     )
 {
     const int totalLinks = linkData.getNumLinks();

     // One flag per link, raised once the link has been given to a wavefront.
     btAlignedObjectArray< bool > linkTaken;
     linkTaken.resize( totalLinks );

     // The vertex count is one more than the highest vertex index that any
     // link refers to.
     int vertexCount = 0;
     for( int link = 0; link < totalLinks; ++link )
     {
         const btSoftBodyLinkData::LinkNodePair ends( linkData.getVertexPair( link ) );
         if( ends.vertex0 + 1 > vertexCount )
             vertexCount = ends.vertex0 + 1;
         if( ends.vertex1 + 1 > vertexCount )
             vertexCount = ends.vertex1 + 1;
     }

     // Per-vertex link counts and the table of links touching each vertex.
     btAlignedObjectArray< int > valence;
     valence.resize( vertexCount, 0 );

     btAlignedObjectArray< int > adjacency;
     int adjacencyStride = 0;
     generateLinksPerVertex( vertexCount, linkData, adjacency, valence, adjacencyStride );

     // Breadth-first walk state. The queue of pending vertices is kept
     // across wavefronts so the walk continues where the last one stopped.
     int frontierVertex = 0;
     int assignedLinks = 0;
     btAlignedObjectArray< int > pendingVertices;

     while( assignedLinks < totalLinks )
     {
         // Open a new wavefront in both per-wavefront outputs.
         const int waveIndex = linksForWavefronts.size();
         linksForWavefronts.resize( waveIndex + 1 );
         btAlignedObjectArray< int > &waveLinks = linksForWavefronts[waveIndex];
         verticesForWavefronts.resize( waveIndex + 1 );
         btAlignedObjectArray< int > &waveVertices = verticesForWavefronts[waveIndex];

         waveLinks.resize( 0 );

         // Collect links until the wavefront is full or none are left.
         while( assignedLinks < totalLinks && waveLinks.size() < maxLinksPerWavefront )
         {
             const int degree = valence[frontierVertex];
             for( int n = 0; n < degree; ++n )
             {
                 if( waveLinks.size() >= maxLinksPerWavefront )
                     break;

                 const int candidate = adjacency[frontierVertex * adjacencyStride + n];
                 if( linkTaken[candidate] )
                     continue;

                 // Claim the link and queue the vertex at its far end.
                 waveLinks.push_back( candidate );
                 ++assignedLinks;
                 linkTaken[candidate] = true;

                 const btSoftBodyLinkData::LinkNodePair &ends = linkData.getVertexPair( candidate );
                 if( ends.vertex0 == frontierVertex )
                     pendingVertices.push_back( ends.vertex1 );
                 else
                     pendingVertices.push_back( ends.vertex0 );
             }

             if( pendingVertices.size() > 0 )
             {
                 // Continue from the vertex at the front of the queue.
                 frontierVertex = pendingVertices[0];
                 removeFromVector( pendingVertices, 0 );
             }
             else if( assignedLinks < totalLinks )
             {
                 // Queue exhausted but links remain: restart from an end
                 // vertex of the first link that has not been taken yet.
                 int seedLink = 0;
                 while( linkTaken[seedLink] )
                     ++seedLink;
                 frontierVertex = linkData.getVertexPair( seedLink ).vertex0;
             }
         }

         // The wavefront is complete; gather its vertices as an ordered set.
         const int linksInWave = waveLinks.size();
         for( int i = 0; i < linksInWave; ++i )
         {
             const int endA = linkData.getVertexPair( waveLinks[i] ).vertex0;
             const int endB = linkData.getVertexPair( waveLinks[i] ).vertex1;
             insertUniqueAndOrderedIntoVector( waveVertices, endA );
             insertUniqueAndOrderedIntoVector( waveVertices, endB );
         }

         // Split the wavefront's links into batches. Each link goes into the
         // first batch that is not full and has no link sharing a vertex
         // with it; if there is none, a new batch is opened.
         const int waveSlot = batchesWithinWaves.size();
         batchesWithinWaves.resize( waveSlot + 1 );
         btAlignedObjectArray< btAlignedObjectArray< int > > &waveBatches = batchesWithinWaves[waveSlot];

         for( int i = 0; i < linksInWave; ++i )
         {
             const int linkIndex = waveLinks[i];
             const btSoftBodyLinkData::LinkNodePair ends = linkData.getVertexPair( linkIndex );

             const int existingBatches = waveBatches.size();
             int target = 0;
             for( ; target < existingBatches; ++target )
             {
                 btAlignedObjectArray< int > &candidateBatch = waveBatches[target];
                 const int occupancy = candidateBatch.size();

                 // A full batch is treated the same way as a conflicting one.
                 bool rejected = ( occupancy >= wavefrontSize );
                 for( int other = 0; !rejected && other < occupancy; ++other )
                 {
                     const btSoftBodyLinkData::LinkNodePair taken = linkData.getVertexPair( candidateBatch[other] );
                     rejected = ends.vertex0 == taken.vertex0 ||
                                ends.vertex1 == taken.vertex0 ||
                                ends.vertex0 == taken.vertex1 ||
                                ends.vertex1 == taken.vertex1;
                 }

                 if( !rejected )
                     break;
             }

             // No existing batch accepted the link: append a fresh one.
             if( target == existingBatches )
                 waveBatches.resize( existingBatches + 1 );

             waveBatches[target].push_back( linkIndex );
         }
     }
 }


 void btSoftBodyLinkDataDX11SIMDAware::generateBatches()

 {

         btAlignedObjectArray < btAlignedObjectArray <int> > linksForWavefronts;

         btAlignedObjectArray < btAlignedObjectArray <int> > wavefrontBatches;

         btAlignedObjectArray< btAlignedObjectArray < btAlignedObjectArray <int> > > batchesWithinWaves;

         btAlignedObjectArray< btAlignedObjectArray< int > > verticesForWavefronts; // wavefronts, vertices in wavefront as an ordered set


         // Group the links into wavefronts

         computeBatchingIntoWavefronts( *this, m_wavefrontSize, m_linksPerWorkItem, m_maxLinksPerWavefront, linksForWavefronts, batchesWithinWaves, verticesForWavefronts );


         // Batch the wavefronts

         generateBatchesOfWavefronts( linksForWavefronts, *this, m_maxVertex, wavefrontBatches );


         m_numWavefronts = linksForWavefronts.size();


         // At this point we have a description of which links we need to process in each wavefront


         // First correctly fill the batch ranges vector

         int numBatches = wavefrontBatches.size();

         m_wavefrontBatchStartLengths.resize(0);

         int prefixSum = 0;

         for( int batchIndex = 0; batchIndex < numBatches; ++batchIndex )

         {

                 int wavesInBatch = wavefrontBatches[batchIndex].size();

                 int nextPrefixSum = prefixSum + wavesInBatch;

                 m_wavefrontBatchStartLengths.push_back( BatchPair( prefixSum, nextPrefixSum - prefixSum ) );


                 prefixSum += wavesInBatch;

         }


         // Also find max number of batches within a wave

         m_maxBatchesWithinWave = 0;

         m_maxVerticesWithinWave = 0;

         m_numBatchesAndVerticesWithinWaves.resize( m_numWavefronts );

         for( int waveIndex = 0; waveIndex < m_numWavefronts; ++waveIndex )

         {

                 // See if the number of batches in this wave is greater than the current maxium

                 int batchesInCurrentWave = batchesWithinWaves[waveIndex].size();

                 int verticesInCurrentWave = verticesForWavefronts[waveIndex].size();

                 m_maxBatchesWithinWave = btMax( batchesInCurrentWave, m_maxBatchesWithinWave );

                 m_maxVerticesWithinWave = btMax( verticesInCurrentWave, m_maxVerticesWithinWave );

         }


         // Add padding values both for alignment and as dudd addresses within LDS to compute junk rather than branch around

         m_maxVerticesWithinWave = 16*((m_maxVerticesWithinWave/16)+2);


         // Now we know the maximum number of vertices per-wave we can resize the global vertices array

         m_wavefrontVerticesGlobalAddresses.resize( m_maxVerticesWithinWave * m_numWavefronts );


         // Grab backup copies of all the link data arrays for the sorting process

         btAlignedObjectArray<btSoftBodyLinkData::LinkNodePair>                          m_links_Backup(m_links);

         btAlignedObjectArray<float>                                                                                     m_linkStrength_Backup(m_linkStrength);

         btAlignedObjectArray<float>                                                                                     m_linksMassLSC_Backup(m_linksMassLSC);

         btAlignedObjectArray<float>                                                                                     m_linksRestLengthSquared_Backup(m_linksRestLengthSquared);

         //btAlignedObjectArray<Vectormath::Aos::Vector3>                                                m_linksCLength_Backup(m_linksCLength);

         //btAlignedObjectArray<float>                                                                                   m_linksLengthRatio_Backup(m_linksLengthRatio);

         btAlignedObjectArray<float>                                                                                     m_linksRestLength_Backup(m_linksRestLength);

         btAlignedObjectArray<float>                                                                                     m_linksMaterialLinearStiffnessCoefficient_Backup(m_linksMaterialLinearStiffnessCoefficient);


         // Resize to a wavefront sized batch per batch per wave so we get perfectly coherent memory accesses.

         m_links.resize( m_maxBatchesWithinWave * m_wavefrontSize * m_numWavefronts );

         m_linkVerticesLocalAddresses.resize( m_maxBatchesWithinWave * m_wavefrontSize * m_numWavefronts );

         m_linkStrength.resize( m_maxBatchesWithinWave * m_wavefrontSize * m_numWavefronts );

         m_linksMassLSC.resize( m_maxBatchesWithinWave * m_wavefrontSize * m_numWavefronts );

         m_linksRestLengthSquared.resize( m_maxBatchesWithinWave * m_wavefrontSize * m_numWavefronts );

         m_linksRestLength.resize( m_maxBatchesWithinWave * m_wavefrontSize * m_numWavefronts );

         m_linksMaterialLinearStiffnessCoefficient.resize( m_maxBatchesWithinWave * m_wavefrontSize * m_numWavefronts );


         // Then re-order links into wavefront blocks


         // Total number of wavefronts moved. This will decide the ordering of sorted wavefronts.

         int wavefrontCount = 0;


         // Iterate over batches of wavefronts, then wavefronts in the batch

         for( int batchIndex = 0; batchIndex < numBatches; ++batchIndex )

         {

                 btAlignedObjectArray <int> &batch( wavefrontBatches[batchIndex] );

                 int wavefrontsInBatch = batch.size();


                 for( int wavefrontIndex = 0; wavefrontIndex < wavefrontsInBatch; ++wavefrontIndex )

                 {


                         int originalWavefrontIndex = batch[wavefrontIndex];

                         btAlignedObjectArray< int > &wavefrontVertices( verticesForWavefronts[originalWavefrontIndex] );

                         int verticesUsedByWavefront = wavefrontVertices.size();


                         // Copy the set of vertices into the correctly structured array for use on the device

                         // Fill the non-vertices with -1s

                         // so we can mask out those reads

                         for( int vertex = 0; vertex < verticesUsedByWavefront; ++vertex )

                         {

                                 m_wavefrontVerticesGlobalAddresses[m_maxVerticesWithinWave * wavefrontCount + vertex] = wavefrontVertices[vertex];

                         }

                         for( int vertex = verticesUsedByWavefront; vertex < m_maxVerticesWithinWave; ++vertex )

                         {

                                 m_wavefrontVerticesGlobalAddresses[m_maxVerticesWithinWave * wavefrontCount + vertex] = -1;

                         }


                         // Obtain the set of batches within the current wavefront

                         btAlignedObjectArray < btAlignedObjectArray <int> > &batchesWithinWavefront( batchesWithinWaves[originalWavefrontIndex] );

                         // Set the size of the batches for use in the solver, correctly ordered

                         NumBatchesVerticesPair batchesAndVertices;

                         batchesAndVertices.numBatches = batchesWithinWavefront.size();

                         batchesAndVertices.numVertices = verticesUsedByWavefront;

                         m_numBatchesAndVerticesWithinWaves[wavefrontCount] = batchesAndVertices;


                         // Now iterate over batches within the wavefront to structure the links correctly

                         for( int wavefrontBatch = 0; wavefrontBatch < batchesWithinWavefront.size(); ++wavefrontBatch )

                         {

                                 btAlignedObjectArray <int> &linksInBatch( batchesWithinWavefront[wavefrontBatch] );

                                 int wavefrontBatchSize = linksInBatch.size();


                                 int batchAddressInTarget = m_maxBatchesWithinWave * m_wavefrontSize * wavefrontCount + m_wavefrontSize * wavefrontBatch;


                                 for( int linkIndex = 0; linkIndex < wavefrontBatchSize; ++linkIndex )

                                 {

                                         int originalLinkAddress = linksInBatch[linkIndex];

                                         // Reorder simple arrays trivially

                                         m_links[batchAddressInTarget + linkIndex] = m_links_Backup[originalLinkAddress];

                                         m_linkStrength[batchAddressInTarget + linkIndex] = m_linkStrength_Backup[originalLinkAddress];

                                         m_linksMassLSC[batchAddressInTarget + linkIndex] = m_linksMassLSC_Backup[originalLinkAddress];

                                         m_linksRestLengthSquared[batchAddressInTarget + linkIndex] = m_linksRestLengthSquared_Backup[originalLinkAddress];

                                         m_linksRestLength[batchAddressInTarget + linkIndex] = m_linksRestLength_Backup[originalLinkAddress];

                                         m_linksMaterialLinearStiffnessCoefficient[batchAddressInTarget + linkIndex] = m_linksMaterialLinearStiffnessCoefficient_Backup[originalLinkAddress];


                                         // The local address is more complicated. We need to work out where a given vertex will end up

                                         // by searching the set of vertices for this link and using the index as the local address

                                         btSoftBodyLinkData::LinkNodePair localPair;

                                         btSoftBodyLinkData::LinkNodePair globalPair = m_links[batchAddressInTarget + linkIndex];

                                         localPair.vertex0 = wavefrontVertices.findLinearSearch( globalPair.vertex0 );

                                         localPair.vertex1 = wavefrontVertices.findLinearSearch( globalPair.vertex1 );

                                         m_linkVerticesLocalAddresses[batchAddressInTarget + linkIndex] = localPair;

                                 }

                                 for( int linkIndex = wavefrontBatchSize; linkIndex < m_wavefrontSize; ++linkIndex )

                                 {

                                         // Put 0s into these arrays for padding for cleanliness

                                         m_links[batchAddressInTarget + linkIndex] = btSoftBodyLinkData::LinkNodePair(0, 0);

                                         m_linkStrength[batchAddressInTarget + linkIndex] = 0.f;

                                         m_linksMassLSC[batchAddressInTarget + linkIndex] = 0.f;

                                         m_linksRestLengthSquared[batchAddressInTarget + linkIndex] = 0.f;

                                         m_linksRestLength[batchAddressInTarget + linkIndex] = 0.f;

                                         m_linksMaterialLinearStiffnessCoefficient[batchAddressInTarget + linkIndex] = 0.f;


                                         // For local addresses of junk data choose a set of addresses just above the range of valid ones

                                         // and cycling tyhrough % 16 so that we don't have bank conficts between all dud addresses

                                         // The valid addresses will do scatter and gather in the valid range, the junk ones should happily work

                                         // off the end of that range so we need no control

                                         btSoftBodyLinkData::LinkNodePair localPair;

                                         localPair.vertex0 = verticesUsedByWavefront + (linkIndex % 16);

                                         localPair.vertex1 = verticesUsedByWavefront + (linkIndex % 16);

                                         m_linkVerticesLocalAddresses[batchAddressInTarget + linkIndex] = localPair;

                                 }


                         }


                         wavefrontCount++;

                 }


         }


 } // void btSoftBodyLinkDataDX11SIMDAware::generateBatches()

btDX11SIMDAwareSoftBodySolver::optimize
virtual void optimize(btAlignedObjectArray< btSoftBody * > &softBodies, bool forceUpdate=false)
Optimize soft bodies in this solver.
Definition: btSoftBodySolver_DX11SIMDAware.cpp:202

insertAtIndex
static void insertAtIndex(btAlignedObjectArray< T > &vectorToUpdate, int index, T element)
Insert element into vectorToUpdate at index index.
Definition: btSoftBodySolver_DX11SIMDAware.cpp:652

btSoftBodyTriangleData::setTriangleAt
virtual void setTriangleAt(const TriangleDescription &triangle, int triangleIndex)
Definition: btSoftBodySolverData.h:677

btDX11SoftBodySolver::UpdateSoftBodiesCB
Definition: btSoftBodySolver_DX11.h:351

length
btScalar length(const btQuaternion &q)
Return the length of a quaternion.
Definition: btQuaternion.h:835

LINKS_PER_SIMD_LANE
#define LINKS_PER_SIMD_LANE
Definition: btSoftBodySolver_DX11SIMDAware.cpp:22

btSoftBodyVertexData::createVertices
void createVertices(int numVertices, int clothIdentifier, int maxVertices=0)
Create numVertices new vertices for cloth clothIdentifier maxVertices allows a buffer zone of extra v...
Definition: btSoftBodySolverData.h:442

generateBatchesOfWavefronts
static void generateBatchesOfWavefronts(btAlignedObjectArray< btAlignedObjectArray< int > > &linksForWavefronts, btSoftBodyLinkData &linkData, int numVertices, btAlignedObjectArray< btAlignedObjectArray< int > > &wavefrontBatches)
Definition: btSoftBodySolver_DX11SIMDAware.cpp:575

btDX11SoftBodySolver::UpdateVelocitiesFromPositionsWithVelocitiesCB
Definition: btSoftBodySolver_DX11.h:343

m_dx11NumBatchesAndVerticesWithinWaves
static char m_dx11NumBatchesAndVerticesWithinWaves(d3dDevice, d3dDeviceContext,&m_numBatchesAndVerticesWithinWaves, true)

btAlignedObjectArray::push_back
void push_back(const T &_Val)
Definition: btAlignedObjectArray.h:276

btSoftBodyTriangleDataDX11::generateBatches
void generateBatches()
Generate (and later update) the batching for the entire triangle set.
Definition: btSoftBodySolver_DX11.cpp:427

btSoftBodyLinkDataDX11SIMDAware::m_onGPU
bool m_onGPU
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:29

btSoftBodySolver_DX11SIMDAware.h

btSoftBodyLinkDataDX11SIMDAware::btSoftBodyLinkDataDX11SIMDAware
btSoftBodyLinkDataDX11SIMDAware(ID3D11Device *d3dDevice, ID3D11DeviceContext *d3dDeviceContext)

btSoftBodyLinkDataDX11SIMDAware::generateBatches
void generateBatches()
Generate (and later update) the batching for the entire link set.
Definition: btSoftBodySolver_DX11SIMDAware.cpp:885

btDX11SIMDAwareSoftBodySolver::SolvePositionsFromLinksKernelCB::ti
float ti
Definition: btSoftBodySolver_DX11SIMDAware.h:35

btSoftBody::m_cfg
Config m_cfg
Definition: btSoftBody.h:648

btDX11SoftBodySolver::m_dx11Context
ID3D11DeviceContext * m_dx11Context
Definition: btSoftBodySolver_DX11.h:409

btSoftBodySolverVertexBuffer_DX11.h

btDX11SIMDAwareSoftBodySolver::solveConstraints
virtual void solveConstraints(float solverdt)
Solve constraints for a set of soft bodies.
Definition: btSoftBodySolver_DX11SIMDAware.cpp:329

btSoftBodyTriangleData::createTriangles
virtual void createTriangles(int numTriangles)
Definition: btSoftBodySolverData.h:682

GROUP_SIZE
#define GROUP_SIZE
Definition: btSoftBodySolver_DX11SIMDAware.cpp:21

btSoftBodyVertexData::VertexDescription::setPosition
void setPosition(const Vectormath::Aos::Point3 &position)
Definition: btSoftBodySolverData.h:341

btDX11Buffer::moveToGPU
bool moveToGPU()
Move the data to the GPU if it is not there already.
Definition: btSoftBodySolverBuffer_DX11.h:183

btCapsuleShape.h

btDX11SoftBodySolver::m_dx11PerClothDampingFactor
btDX11Buffer< float > m_dx11PerClothDampingFactor
Definition: btSoftBodySolver_DX11.h:445

btSoftBodyLinkData::LinkNodePair::vertex1
int vertex1
Definition: btSoftBodySolverData.h:33

btSoftBodyLinkData::setLinkAt
virtual void setLinkAt(const LinkDescription &link, int linkIndex)
Insert the link described into the correct data structures assuming space has already been allocated ...
Definition: btSoftBodySolverData.h:188

btDX11SoftBodySolver::computeBoundsKernel
DXFunctions::KernelDesc computeBoundsKernel
Definition: btSoftBodySolver_DX11.h:512

DXFunctions::KernelDesc::kernel
ID3D11ComputeShader * kernel
Definition: btSoftBodySolver_DX11.h:53

btDX11SoftBodySolver
Definition: btSoftBodySolver_DX11.h:76

btAlignedObjectArray< btSoftBody * >

btDX11SoftBodySolver::updatePositionsFromVelocitiesKernel
DXFunctions::KernelDesc updatePositionsFromVelocitiesKernel
Definition: btSoftBodySolver_DX11.h:506

Vectormath::Aos::Transform3
Definition: neon/vectormath_aos.h:1661

btSoftBodyLinkData::LinkNodePair::vertex0
int vertex0
Definition: btSoftBodySolverData.h:32

btDX11SoftBodySolver::getTriangleData
virtual btSoftBodyTriangleData & getTriangleData()
Definition: btSoftBodySolver_DX11.cpp:809

btDX11SoftBodySolver::ComputeBoundsCB
Definition: btSoftBodySolver_DX11.h:388

btSoftBodyLinkDataDX11SIMDAware::NumBatchesVerticesPair
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:42

btSoftBodyVertexData::clear
virtual void clear()
Definition: btSoftBodySolverData.h:403

Vectormath::Aos::Matrix3
Definition: neon/vectormath_aos.h:1136

btSoftBodyLinkData::getRestLengthSquared
float & getRestLengthSquared(int linkIndex)
Return reference to rest length squared for link linkIndex as stored on the host. ...
Definition: btSoftBodySolverData.h:283

btSoftBodyLinkDataDX11SIMDAware::NumBatchesVerticesPair::numBatches
int numBatches
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:44

m_dx11LinksRestLength
static char m_dx11LinksRestLength(d3dDevice, d3dDeviceContext,&m_linksRestLength, true)

Vectormath::Aos::Point3
Definition: neon/vectormath_aos.h:634

btDX11SoftBodySolver::btAcceleratedSoftBodyInterface::setNumTriangles
void setNumTriangles(int numTriangles)
Definition: btSoftBodySolver_DX11.h:224

btSoftBodyVertexData::getTriangleCount
int & getTriangleCount(int vertexIndex)
Get access to the array of how many triangles touch each vertex.
Definition: btSoftBodySolverData.h:537

size
static DBVT_INLINE btScalar size(const btDbvtVolume &a)
Definition: btDbvt.cpp:51

btSoftBody::Config::kVCF
btScalar kVCF
Definition: btSoftBody.h:565

DXFunctions::KernelDesc::constBuffer
ID3D11Buffer * constBuffer
Definition: btSoftBodySolver_DX11.h:54

btSoftBodyVertexData::getNumVertices
int getNumVertices()
Definition: btSoftBodySolverData.h:416

m_dx11LinksRestLengthSquared
static char m_dx11LinksRestLengthSquared(d3dDevice, d3dDeviceContext,&m_linksRestLengthSquared, true)

Vectormath::Aos::Vector3
Definition: neon/vectormath_aos.h:46

btDX11SoftBodySolver::m_perClothVelocityCorrectionCoefficient
btAlignedObjectArray< float > m_perClothVelocityCorrectionCoefficient
Velocity correction coefficient.
Definition: btSoftBodySolver_DX11.h:448

btSoftBodyLinkDataDX11SIMDAware::m_wavefrontBatchStartLengths
btAlignedObjectArray< BatchPair > m_wavefrontBatchStartLengths
Start and length values for computation batches over link data.
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:93

btSoftBodyLinkData::getLinearStiffnessCoefficient
float & getLinearStiffnessCoefficient(int linkIndex)
Return reference to linear stiffness coefficient for link linkIndex as stored on the host...
Definition: btSoftBodySolverData.h:267

btDX11SoftBodySolver::UpdateVelocitiesFromPositionsWithoutVelocitiesCB
Definition: btSoftBodySolver_DX11.h:335

btSoftBodyLinkData::getVertexPair
LinkNodePair & getVertexPair(int linkIndex)
Return reference to the vertex index pair for link linkIndex as stored on the host.
Definition: btSoftBodySolverData.h:234

btTriangleIndexVertexArray.h

m_maxLinksPerWavefront
static char m_maxLinksPerWavefront(m_wavefrontSize *m_linksPerWorkItem)

m_dx11WavefrontVerticesGlobalAddresses
static char m_dx11WavefrontVerticesGlobalAddresses(d3dDevice, d3dDeviceContext,&m_wavefrontVerticesGlobalAddresses, true)

btSoftBodyVertexData::VertexDescription
Class describing a vertex for input into the system.
Definition: btSoftBodySolverData.h:318

btMatrix3x3::getColumn
btVector3 getColumn(int i) const
Get a column of the matrix as a vector.
Definition: btMatrix3x3.h:134

btSoftBody::Config::kDG
btScalar kDG
Definition: btSoftBody.h:567

btDX11SoftBodySolver::btAcceleratedSoftBodyInterface::setMaxTriangles
void setMaxTriangles(int maxTriangles)
Definition: btSoftBodySolver_DX11.h:234

btDX11SIMDAwareSoftBodySolver::SolvePositionsFromLinksKernelCB::kst
float kst
Definition: btSoftBodySolver_DX11SIMDAware.h:34

btSoftBodyLinkDataDX11SIMDAware::onAccelerator
virtual bool onAccelerator()
Return true if data is on the accelerator.
Definition: btSoftBodySolver_DX11SIMDAware.cpp:120

btDX11SoftBodySolver::m_perClothCollisionObjects
btAlignedObjectArray< CollisionObjectIndices > m_perClothCollisionObjects
Collision shape details: pair of index of first collision shape for the cloth and number of collision...
Definition: btSoftBodySolver_DX11.h:467

btDX11SoftBodySolver::applyForcesKernel
DXFunctions::KernelDesc applyForcesKernel
Definition: btSoftBodySolver_DX11.h:515

removeFromVector
static void removeFromVector(btAlignedObjectArray< T > &vectorToUpdate, int indexToRemove)
Definition: btSoftBodySolver_DX11SIMDAware.cpp:638

m_dx11LinkStrength
static char m_dx11LinkStrength(d3dDevice, d3dDeviceContext,&m_linkStrength, true)

btSoftBody::m_nodes
tNodeArray m_nodes
Definition: btSoftBody.h:654

btSoftBody::m_links
tLinkArray m_links
Definition: btSoftBody.h:655

btDX11SIMDAwareSoftBodySolver::m_updateSolverConstants
bool m_updateSolverConstants
Variable to define whether we need to update solver constants on the next iteration.
Definition: btSoftBodySolver_DX11SIMDAware.h:43

btDX11SIMDAwareSoftBodySolver::solveLinksForPosition
void solveLinksForPosition(int startLink, int numLinks, float kst, float ti)
Definition: btSoftBodySolver_DX11SIMDAware.cpp:415

btSoftBodyLinkDataDX11SIMDAware::m_dx11WavefrontVerticesGlobalAddresses
btDX11Buffer< int > m_dx11WavefrontVerticesGlobalAddresses
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:57

btDX11SoftBodySolver::dxFunctions
DXFunctions dxFunctions
Definition: btSoftBodySolver_DX11.h:411

btSoftBodyTriangleData::TriangleDescription::getVertexSet
TriangleNodeSet getVertexSet() const
Definition: btSoftBodySolverData.h:636

btDX11SoftBodySolver::btAcceleratedSoftBodyInterface::setNumLinks
void setNumLinks(int numLinks)
Definition: btSoftBodySolver_DX11.h:254

btVector3::getZ
const btScalar & getZ() const
Return the z value.
Definition: btVector3.h:565

m_numWavefronts
static char m_numWavefronts(0)

toVector3
static Vectormath::Aos::Vector3 toVector3(const btVector3 &vec)
Definition: btSoftBodySolver_DX11SIMDAware.cpp:90

btAlignedObjectArray::clear
void clear()
Clear the array, deallocating memory. Generally it is better to use array.resize(0), to reduce performance overhead of run-time memory (de)allocations.
Definition: btAlignedObjectArray.h:184

btDX11SoftBodySolver::m_perClothMinBounds
btAlignedObjectArray< UIntVector3 > m_perClothMinBounds
Minimum bounds for each cloth.
Definition: btSoftBodySolver_DX11.h:482

btSoftBody::Config::kLF
btScalar kLF
Definition: btSoftBody.h:568

btSoftBodyVertexDataDX11::m_dx11VertexInverseMass
btDX11Buffer< float > m_dx11VertexInverseMass
Definition: btSoftBodySolverVertexData_DX11.h:44

Vectormath::Aos::Transform3::setCol
Transform3 & setCol(int col, const Vector3 &vec)
Definition: neon/mat_aos.h:1174

btSoftBodyLinkData::getMassLSC
float & getMassLSC(int linkIndex)
Return reference to the MassLSC value for link linkIndex as stored on the host.
Definition: btSoftBodySolverData.h:275

btSoftBodyLinkDataDX11SIMDAware::NumBatchesVerticesPair::numVertices
int numVertices
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:45

btDX11SoftBodySolver::solvePositionsFromLinksKernel
DXFunctions::KernelDesc solvePositionsFromLinksKernel
Definition: btSoftBodySolver_DX11.h:502

btDX11SIMDAwareSoftBodySolver::getLinkData
virtual btSoftBodyLinkData & getLinkData()
Definition: btSoftBodySolver_DX11SIMDAware.cpp:194

btDX11SoftBodySolver::m_dx11PerClothVelocityCorrectionCoefficient
btDX11Buffer< float > m_dx11PerClothVelocityCorrectionCoefficient
Definition: btSoftBodySolver_DX11.h:449

Vectormath::Aos::lengthSqr
float lengthSqr(const Vector3 &vec)
Definition: neon/vec_aos.h:447

btSoftBody::getWorldInfo
btSoftBodyWorldInfo * getWorldInfo()
Definition: btSoftBody.h:697

generateLinksPerVertex
static void generateLinksPerVertex(int numVertices, btSoftBodyLinkData &linkData, btAlignedObjectArray< int > &listOfLinksPerVertex, btAlignedObjectArray< int > &numLinksPerVertex, int &maxLinks)
Definition: btSoftBodySolver_DX11SIMDAware.cpp:677

btSoftBody.h

btDX11SoftBodySolver::m_perClothMediumDensity
btAlignedObjectArray< float > m_perClothMediumDensity
Density of the medium in which each cloth sits.
Definition: btSoftBodySolver_DX11.h:460

btSoftBodyLinkDataDX11SIMDAware::getMaxVerticesPerWavefront
int getMaxVerticesPerWavefront()
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:122

btAlignedObjectArray::size
int size() const
return the number of elements in the array
Definition: btAlignedObjectArray.h:149

btTransform::getOrigin
btVector3 & getOrigin()
Return the origin vector translation.
Definition: btTransform.h:117

btDX11SoftBodySolver::ApplyForcesCB
Definition: btSoftBodySolver_DX11.h:360

btDX11SIMDAwareSoftBodySolver::SolvePositionsFromLinksKernelCB::startWave
int startWave
Definition: btSoftBodySolver_DX11SIMDAware.h:32

btDX11SoftBodySolver::CollisionObjectIndices
Definition: btSoftBodySolver_DX11.h:287

btDX11SoftBodySolver::btAcceleratedSoftBodyInterface::setFirstVertex
void setFirstVertex(int firstVertex)
Definition: btSoftBodySolver_DX11.h:239

btSoftBody::Config::kDP
btScalar kDP
Definition: btSoftBody.h:566

btSoftBodyLinkDataDX11SIMDAware::~btSoftBodyLinkDataDX11SIMDAware
virtual ~btSoftBodyLinkDataDX11SIMDAware()
Definition: btSoftBodySolver_DX11SIMDAware.cpp:86

btDX11SoftBodySolver::solveCollisionsAndUpdateVelocitiesKernel
DXFunctions::KernelDesc solveCollisionsAndUpdateVelocitiesKernel
Definition: btSoftBodySolver_DX11.h:509

DXFunctions::compileComputeShaderFromString
KernelDesc compileComputeShaderFromString(const char *shaderString, const char *shaderName, int constBufferSize, D3D10_SHADER_MACRO *compileMacros=0)
Compile a compute shader kernel from a string and return the appropriate KernelDesc object...
Definition: btSoftBodySolver_DX11.cpp:1995

btDX11SoftBodySolver::updateSoftBodiesKernel
DXFunctions::KernelDesc updateSoftBodiesKernel
Definition: btSoftBodySolver_DX11.h:513

m_maxVertex
static char m_maxVertex(0)

btDX11SoftBodySolver::getVertexData
virtual btSoftBodyVertexData & getVertexData()
Definition: btSoftBodySolver_DX11.cpp:803

btSoftBodyLinkData::m_links
btAlignedObjectArray< LinkNodePair > m_links
Definition: btSoftBodySolverData.h:133

btDX11SoftBodySolver::m_perClothDampingFactor
btAlignedObjectArray< float > m_perClothDampingFactor
Velocity damping factor.
Definition: btSoftBodySolver_DX11.h:444

btDX11SoftBodySolver::btAcceleratedSoftBodyInterface
SoftBody class to maintain information about a soft body instance within a solver.
Definition: btSoftBodySolver_DX11.h:139

btDX11SIMDAwareSoftBodySolver::~btDX11SIMDAwareSoftBodySolver
virtual ~btDX11SIMDAwareSoftBodySolver()
Definition: btSoftBodySolver_DX11SIMDAware.cpp:188

btDX11SoftBodySolver::resetNormalsAndAreasKernel
DXFunctions::KernelDesc resetNormalsAndAreasKernel
Definition: btSoftBodySolver_DX11.h:510

btSoftBodyLinkDataDX11SIMDAware::m_linkAddresses
btAlignedObjectArray< int > m_linkAddresses
Link addressing information for each cloth.
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:88

btSoftBodyLinkData::LinkNodePair
Class representing a link as a pair of indices into the vertex array.
Definition: btSoftBodySolverData.h:29

btDX11SoftBodySolver::btAcceleratedSoftBodyInterface::setNumVertices
void setNumVertices(int numVertices)
Definition: btSoftBodySolver_DX11.h:219

computeBatchingIntoWavefronts
static void computeBatchingIntoWavefronts(btSoftBodyLinkData &linkData, int wavefrontSize, int linksPerWorkItem, int maxLinksPerWavefront, btAlignedObjectArray< btAlignedObjectArray< int > > &linksForWavefronts, btAlignedObjectArray< btAlignedObjectArray< btAlignedObjectArray< int > > > &batchesWithinWaves, btAlignedObjectArray< btAlignedObjectArray< int > > &verticesForWavefronts)
Definition: btSoftBodySolver_DX11SIMDAware.cpp:723

btVector3::getY
const btScalar & getY() const
Return the y value.
Definition: btVector3.h:563

btDX11SIMDAwareSoftBodySolver::updateConstants
void updateConstants(float timeStep)
Definition: btSoftBodySolver_DX11SIMDAware.cpp:383

m_linksPerWorkItem
static char m_linksPerWorkItem(LINKS_PER_SIMD_LANE)

btDX11SoftBodySolver::normalizeNormalsAndAreasKernel
DXFunctions::KernelDesc normalizeNormalsAndAreasKernel
Definition: btSoftBodySolver_DX11.h:511

btTransform::getBasis
btMatrix3x3 & getBasis()
Return the basis matrix for the rotation.
Definition: btTransform.h:112

UpdatePositionsFromVelocitiesHLSLString
static char * UpdatePositionsFromVelocitiesHLSLString
Definition: btSoftBodySolver_DX11SIMDAware.cpp:37

btVector3::getX
const btScalar & getX() const
Return the x value.
Definition: btVector3.h:561

btSoftBodyLinkDataDX11SIMDAware::BatchPair
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:66

btSoftBodyLinkData::getRestLength
float & getRestLength(int linkIndex)
Return reference to the rest length of link linkIndex as stored on the host.
Definition: btSoftBodySolverData.h:259

btSoftBodyLinkDataDX11SIMDAware::m_dx11LinksRestLength
btDX11Buffer< float > m_dx11LinksRestLength
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:63

btDX11SoftBodySolver::m_perClothFriction
btAlignedObjectArray< float > m_perClothFriction
Friction coefficient for each cloth.
Definition: btSoftBodySolver_DX11.h:498

btDX11SoftBodySolver::btAcceleratedSoftBodyInterface::setMaxVertices
void setMaxVertices(int maxVertices)
Definition: btSoftBodySolver_DX11.h:229

btDX11SoftBodySolver::integrateKernel
DXFunctions::KernelDesc integrateKernel
Definition: btSoftBodySolver_DX11.h:504

btDX11SoftBodySolver::IntegrateCB
Definition: btSoftBodySolver_DX11.h:319

m_maxBatchesWithinWave
static char m_maxBatchesWithinWave(0)

btSoftBodyLinkDataDX11SIMDAware::moveToAccelerator
virtual bool moveToAccelerator()
Move data from host memory to the accelerator.
Definition: btSoftBodySolver_DX11SIMDAware.cpp:125

vmInclude.h

toTransform3
static Vectormath::Aos::Transform3 toTransform3(const btTransform &transform)
Definition: btSoftBodySolver_DX11SIMDAware.cpp:554

btDX11SIMDAwareSoftBodySolver::btDX11SIMDAwareSoftBodySolver
btDX11SIMDAwareSoftBodySolver(ID3D11Device *dx11Device, ID3D11DeviceContext *dx11Context, DXFunctions::CompileFromMemoryFunc dx11CompileFromMemory=&D3DX11CompileFromMemory)
Definition: btSoftBodySolver_DX11SIMDAware.cpp:176

btVector3
btVector3 can be used to represent 3D points and vectors.
Definition: btVector3.h:83

btDX11SoftBodySolver::m_softBodySet
btAlignedObjectArray< btAcceleratedSoftBodyInterface * > m_softBodySet
Cloths owned by this solver.
Definition: btSoftBodySolver_DX11.h:429

btDX11SIMDAwareSoftBodySolver::buildShaders
virtual bool buildShaders()
Definition: btSoftBodySolver_DX11SIMDAware.cpp:485

btSoftBodyLinkDataDX11SIMDAware::m_maxVertex
int m_maxVertex
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:40

btSoftBodyTriangleData::getNumTriangles
int getNumTriangles()
Definition: btSoftBodySolverData.h:672

btSoftBodyTriangleData::TriangleNodeSet::vertex2
int vertex2
Definition: btSoftBodySolverData.h:595

btSoftBodyLinkData::LinkDescription
Class describing a link for input into the system.
Definition: btSoftBodySolverData.h:51

btTransform
The btTransform class supports rigid transforms with only translation and rotation and no scaling/she...
Definition: btTransform.h:34

btDX11SoftBodySolver::UIntVector3
Definition: btSoftBodySolver_DX11.h:107

btSoftBodyLinkData::clear
virtual void clear()
Definition: btSoftBodySolverData.h:154

btDX11SIMDAwareSoftBodySolver::SolvePositionsFromLinksKernelCB
Definition: btSoftBodySolver_DX11SIMDAware.h:30

m_dx11LinkVerticesLocalAddresses
static char m_dx11LinkVerticesLocalAddresses(d3dDevice, d3dDeviceContext,&m_linkVerticesLocalAddresses, true)

btSoftBodyTriangleData::TriangleNodeSet::vertex0
int vertex0
Definition: btSoftBodySolverData.h:593

WAVEFRONT_SIZE
#define WAVEFRONT_SIZE
Definition: btSoftBodySolver_DX11SIMDAware.cpp:19

btSoftBodyLinkDataDX11SIMDAware::setLinkAt
virtual void setLinkAt(const LinkDescription &link, int linkIndex)
Insert the link described into the correct data structures assuming space has already been allocated ...
Definition: btSoftBodySolver_DX11SIMDAware.cpp:107

btSoftBodyLinkData
Definition: btSoftBodySolverData.h:23

btDX11SoftBodySolver::m_perClothDragFactor
btAlignedObjectArray< float > m_perClothDragFactor
Drag parameter for wind effect on cloth.
Definition: btSoftBodySolver_DX11.h:456

btSoftBodySolverLinkData_DX11SIMDAware.h

btAlignedObjectArray::resize
void resize(int newsize, const T &fillData=T())
Definition: btAlignedObjectArray.h:220

btSoftBodyLinkData::getNumLinks
int getNumLinks()
Definition: btSoftBodySolverData.h:165

btDX11Buffer::getSRV
ID3D11ShaderResourceView *& getSRV()
Definition: btSoftBodySolverBuffer_DX11.h:165

btSoftBodyVertexData::getInverseMass
float & getInverseMass(int vertexIndex)
Return a reference to the inverse mass of vertex vertexIndex as stored on the host.
Definition: btSoftBodySolverData.h:521

btAlignedObjectArray::findLinearSearch
int findLinearSearch(const T &key) const
Definition: btAlignedObjectArray.h:465

btSoftBodyVertexDataDX11::moveToAccelerator
virtual bool moveToAccelerator()
Move data from host memory to the accelerator.
Definition: btSoftBodySolver_DX11.cpp:292

btSoftBodyLinkData::LinkDescription::getVertex1
int getVertex1() const
Definition: btSoftBodySolverData.h:110

btSoftBodyLinkDataDX11SIMDAware::m_dx11LinksRestLengthSquared
btDX11Buffer< float > m_dx11LinksRestLengthSquared
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:62

btSoftBodyVertexData::getPosition
Vectormath::Aos::Point3 & getPosition(int vertexIndex)
Return a reference to the position of vertex vertexIndex as stored on the host.
Definition: btSoftBodySolverData.h:471

btDX11SoftBodySolver::m_vertexData
btSoftBodyVertexDataDX11 m_vertexData
Definition: btSoftBodySolver_DX11.h:415

btCollisionObject::getFriction
btScalar getFriction() const
Definition: btCollisionObject.h:281

btDX11Buffer::getUAV
ID3D11UnorderedAccessView *& getUAV()
Definition: btSoftBodySolverBuffer_DX11.h:170

btDX11SoftBodySolver::releaseKernels
void releaseKernels()
Definition: btSoftBodySolver_DX11.cpp:608

m_dx11LinksMassLSC
static char m_dx11LinksMassLSC(d3dDevice, d3dDeviceContext,&m_linksMassLSC, true)

btMax
const T & btMax(const T &a, const T &b)
Definition: btMinMax.h:29

btSoftBodyTriangleData::TriangleDescription
Definition: btSoftBodySolverData.h:614

btSoftBodyLinkDataDX11SIMDAware::m_dx11LinkStrength
btDX11Buffer< float > m_dx11LinkStrength
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:60

btDX11SoftBodySolver::m_perClothLiftFactor
btAlignedObjectArray< float > m_perClothLiftFactor
Lift parameter for wind effect on cloth.
Definition: btSoftBodySolver_DX11.h:452

btSoftBodyVertexDataDX11::m_dx11VertexPosition
btDX11Buffer< Vectormath::Aos::Point3 > m_dx11VertexPosition
Definition: btSoftBodySolverVertexData_DX11.h:39

m_wavefrontSize
static char m_wavefrontSize(WAVEFRONT_SIZE)

btSoftBodyTriangleData::clear
virtual void clear()
Definition: btSoftBodySolverData.h:665

btSoftBodyLinkDataDX11SIMDAware::createLinks
virtual void createLinks(int numLinks)
Allocate enough space in all link-related arrays to fit numLinks links.
Definition: btSoftBodySolver_DX11SIMDAware.cpp:96

btDX11SoftBodySolver::updateVelocitiesFromPositionsWithoutVelocitiesKernel
DXFunctions::KernelDesc updateVelocitiesFromPositionsWithoutVelocitiesKernel
Definition: btSoftBodySolver_DX11.h:507

btSoftBodyLinkDataDX11SIMDAware::getMaxBatchesPerWavefront
int getMaxBatchesPerWavefront()
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:142

m_d3dDeviceContext
static char m_d3dDeviceContext(d3dDeviceContext)

btDX11SoftBodySolver::btAcceleratedSoftBodyInterface::setFirstLink
void setFirstLink(int firstLink)
Definition: btSoftBodySolver_DX11.h:259

btDX11SoftBodySolver::UpdatePositionsFromVelocitiesCB
Definition: btSoftBodySolver_DX11.h:327

btSoftBodyLinkData::LinkDescription::getVertex0
int getVertex0() const
Definition: btSoftBodySolverData.h:105

btSoftBodyWorldInfo::air_density
btScalar air_density
Definition: btSoftBody.h:45

btDX11SIMDAwareSoftBodySolver::SolvePositionsFromLinksKernelCB::numWaves
int numWaves
Definition: btSoftBodySolver_DX11SIMDAware.h:33

m_dx11LinksMaterialLinearStiffnessCoefficient
static char m_dx11LinksMaterialLinearStiffnessCoefficient(d3dDevice, d3dDeviceContext,&m_linksMaterialLinearStiffnessCoefficient, true)
Definition: btSoftBodySolver_DX11SIMDAware.cpp:80

btDX11SoftBodySolver::m_triangleData
btSoftBodyTriangleDataDX11 m_triangleData
Definition: btSoftBodySolver_DX11.h:416

Vectormath::Aos::dot
float dot(const Quat &quat0, const Quat &quat1)
Definition: neon/quat_aos.h:268

btSoftBodyLinkDataDX11SIMDAware::getWavefrontSize
int getWavefrontSize()
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:127

btSoftBodyWorldInfo::m_gravity
btVector3 m_gravity
Definition: btSoftBody.h:52

btDX11SoftBodySolver::updateVelocitiesFromPositionsWithVelocitiesKernel
DXFunctions::KernelDesc updateVelocitiesFromPositionsWithVelocitiesKernel
Definition: btSoftBodySolver_DX11.h:508

btSoftBodyLinkData::LinkDescription::setLinkStrength
void setLinkStrength(float strength)
Definition: btSoftBodySolverData.h:100

btSoftBodyLinkDataDX11SIMDAware::moveFromAccelerator
virtual bool moveFromAccelerator()
Move data from the accelerator back to host memory.
Definition: btSoftBodySolver_DX11SIMDAware.cpp:144

btDX11SoftBodySolver::SolveCollisionsAndUpdateVelocitiesCB
Definition: btSoftBodySolver_DX11.h:396

btSoftBodyLinkDataDX11SIMDAware::m_dx11LinksMassLSC
btDX11Buffer< float > m_dx11LinksMassLSC
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:61

btDX11SoftBodySolver::prepareCollisionConstraints
void prepareCollisionConstraints()
Sort the collision object details array and generate indexing into it for the per-cloth collision obj...
Definition: btSoftBodySolver_DX11.cpp:1235

btSoftBody
The btSoftBody is a class to simulate cloth and volumetric soft bodies.
Definition: btSoftBody.h:71

btDX11SoftBodySolver::solveCollisionsAndUpdateVelocities
void solveCollisionsAndUpdateVelocities(float isolverdt)
Definition: btSoftBodySolver_DX11.cpp:1695

insertUniqueAndOrderedIntoVector
static void insertUniqueAndOrderedIntoVector(btAlignedObjectArray< T > &vectorToUpdate, T element)
Insert into btAlignedObjectArray assuming the array is ordered and maintaining both ordering and uniq...
Definition: btSoftBodySolver_DX11SIMDAware.cpp:666

DXFunctions::CompileFromMemoryFunc
HRESULT(WINAPI * CompileFromMemoryFunc)(LPCSTR, SIZE_T, LPCSTR, const D3D10_SHADER_MACRO *, LPD3D10INCLUDE, LPCSTR, LPCSTR, UINT, UINT, ID3DX11ThreadPump *, ID3D10Blob **, ID3D10Blob **, HRESULT *)
Definition: btSoftBodySolver_DX11.h:33

btSoftBodyVertexData::setVertexAt
void setVertexAt(const VertexDescription &vertex, int vertexIndex)
Definition: btSoftBodySolverData.h:426

btSoftBodyLinkDataDX11SIMDAware::m_dx11LinkVerticesLocalAddresses
btDX11Buffer< LinkNodePair > m_dx11LinkVerticesLocalAddresses
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:59

WAVEFRONT_BLOCK_MULTIPLIER
#define WAVEFRONT_BLOCK_MULTIPLIER
Definition: btSoftBodySolver_DX11SIMDAware.cpp:20

btDX11SoftBodySolver::m_shadersInitialized
bool m_shadersInitialized
Definition: btSoftBodySolver_DX11.h:423

btSoftBodySolver::m_numberOfPositionIterations
int m_numberOfPositionIterations
Definition: btSoftBodySolvers.h:45

btDX11SIMDAwareSoftBodySolver::m_linkData
btSoftBodyLinkDataDX11SIMDAware m_linkData
Link data for all cloths.
Definition: btSoftBodySolver_DX11SIMDAware.h:40

btSoftBodyTriangleData::TriangleNodeSet::vertex1
int vertex1
Definition: btSoftBodySolverData.h:594

btDX11SoftBodySolver::btAcceleratedSoftBodyInterface::setFirstTriangle
void setFirstTriangle(int firstTriangle)
Definition: btSoftBodySolver_DX11.h:244

btSoftBodyLinkDataDX11SIMDAware::m_dx11NumBatchesAndVerticesWithinWaves
btDX11Buffer< NumBatchesVerticesPair > m_dx11NumBatchesAndVerticesWithinWaves
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:51

btSoftBodyLinkData::createLinks
virtual void createLinks(int numLinks)
Allocate enough space in all link-related arrays to fit numLinks links.
Definition: btSoftBodySolverData.h:171

btSoftBody::m_faces
tFaceArray m_faces
Definition: btSoftBody.h:656

btDX11Buffer::moveFromGPU
bool moveFromGPU()
Move the data back from the GPU if it is on there and isn't read only.
Definition: btSoftBodySolverBuffer_DX11.h:227

btDX11SoftBodySolver::m_perClothMaxBounds
btAlignedObjectArray< UIntVector3 > m_perClothMaxBounds
Maximum bounds for each cloth.
Definition: btSoftBodySolver_DX11.h:491

btSoftBodyLinkDataDX11SIMDAware::m_dx11LinksMaterialLinearStiffnessCoefficient
btDX11Buffer< float > m_dx11LinksMaterialLinearStiffnessCoefficient
Definition: btSoftBodySolverLinkData_DX11SIMDAware.h:64

btDX11SoftBodySolver::m_perClothAcceleration
btAlignedObjectArray< Vectormath::Aos::Vector3 > m_perClothAcceleration
Acceleration value to be applied to all non-static vertices in the solver.
Definition: btSoftBodySolver_DX11.h:434