mirror of
https://github.com/PixarAnimationStudios/OpenSubdiv
synced 2025-01-02 13:20:10 +00:00
8da827336d
This is the first step to tease off Osd compute controller/contexts from Far API. Currently FarStencilTable only creates a kernelbatch for the entire range, so we can use [0, numStencils) for all cases instead of KernelBatch. This might not be true if we apply non-factorized level-wise stencils, then we'll add another modular utility to serve those cases.
223 lines
6.4 KiB
C++
223 lines
6.4 KiB
C++
//
|
|
// Copyright 2013 Pixar
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "Apache License")
|
|
// with the following modification; you may not use this file except in
|
|
// compliance with the Apache License and the following modification to it:
|
|
// Section 6. Trademarks. is deleted and replaced with:
|
|
//
|
|
// 6. Trademarks. This License does not grant permission to use the trade
|
|
// names, trademarks, service marks, or product names of the Licensor
|
|
// and its affiliates, except as required to comply with Section 4(c) of
|
|
// the License and to reproduce the content of the NOTICE file.
|
|
//
|
|
// You may obtain a copy of the Apache License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the Apache License with the above modification is
|
|
// distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the Apache License for the specific
|
|
// language governing permissions and limitations under the Apache License.
|
|
//
|
|
|
|
#include "../far/stencilTables.h"
|
|
|
|
#include "../osd/cudaComputeContext.h"
|
|
|
|
#include <cuda_runtime.h>
|
|
#include <vector>
|
|
|
|
namespace OpenSubdiv {
|
|
namespace OPENSUBDIV_VERSION {
|
|
|
|
namespace Osd {
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
template <class T> void *
|
|
createCudaBuffer(std::vector<T> const & src) {
|
|
|
|
void * devicePtr=0;
|
|
|
|
size_t size = src.size()*sizeof(T);
|
|
|
|
cudaError_t err = cudaMalloc(&devicePtr, size);
|
|
if (err != cudaSuccess) {
|
|
return devicePtr;
|
|
}
|
|
|
|
err = cudaMemcpy(devicePtr, &src.at(0), size, cudaMemcpyHostToDevice);
|
|
if (err != cudaSuccess) {
|
|
cudaFree(devicePtr);
|
|
return 0;
|
|
}
|
|
return devicePtr;
|
|
}
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
class CudaComputeContext::CudaStencilTables {
|
|
|
|
public:
|
|
|
|
CudaStencilTables(Far::StencilTables const & stencilTables) {
|
|
_sizes = createCudaBuffer(stencilTables.GetSizes());
|
|
_offsets = createCudaBuffer(stencilTables.GetOffsets());
|
|
_indices = createCudaBuffer(stencilTables.GetControlIndices());
|
|
_weights = createCudaBuffer(stencilTables.GetWeights());
|
|
_numStencils = stencilTables.GetNumStencils();
|
|
}
|
|
|
|
~CudaStencilTables() {
|
|
if (_sizes) { cudaFree(_sizes); }
|
|
if (_offsets) { cudaFree(_offsets); }
|
|
if (_indices) { cudaFree(_indices); }
|
|
if (_weights) { cudaFree(_weights); }
|
|
}
|
|
|
|
bool IsValid() const {
|
|
return _sizes and _offsets and _indices and _weights;
|
|
}
|
|
|
|
void * GetSizes() const {
|
|
return _sizes;
|
|
}
|
|
|
|
void * GetOffsets() const {
|
|
return _offsets;
|
|
}
|
|
|
|
void * GetIndices() const {
|
|
return _indices;
|
|
}
|
|
|
|
void * GetWeights() const {
|
|
return _weights;
|
|
}
|
|
|
|
int GetNumStencils() const {
|
|
return _numStencils;
|
|
}
|
|
|
|
private:
|
|
void * _sizes,
|
|
* _offsets,
|
|
* _indices,
|
|
* _weights;
|
|
int _numStencils;
|
|
};
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
CudaComputeContext::CudaComputeContext(
|
|
Far::StencilTables const * vertexStencilTables,
|
|
Far::StencilTables const * varyingStencilTables) :
|
|
_vertexStencilTables(0), _varyingStencilTables(0),
|
|
_numControlVertices(0) {
|
|
|
|
if (vertexStencilTables) {
|
|
_vertexStencilTables = new CudaStencilTables(*vertexStencilTables);
|
|
_numControlVertices = vertexStencilTables->GetNumControlVertices();
|
|
}
|
|
|
|
if (varyingStencilTables) {
|
|
_varyingStencilTables = new CudaStencilTables(*varyingStencilTables);
|
|
|
|
if (_numControlVertices) {
|
|
assert(_numControlVertices==varyingStencilTables->GetNumControlVertices());
|
|
} else {
|
|
_numControlVertices = varyingStencilTables->GetNumControlVertices();
|
|
}
|
|
}
|
|
}
|
|
|
|
CudaComputeContext::~CudaComputeContext() {
|
|
delete _vertexStencilTables;
|
|
delete _varyingStencilTables;
|
|
}
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
bool
|
|
CudaComputeContext::HasVertexStencilTables() const {
|
|
return _vertexStencilTables ? _vertexStencilTables->IsValid() : false;
|
|
}
|
|
|
|
bool
|
|
CudaComputeContext::HasVaryingStencilTables() const {
|
|
return _varyingStencilTables ? _varyingStencilTables->IsValid() : false;
|
|
}
|
|
|
|
int
|
|
CudaComputeContext::GetNumStencilsInVertexStencilTables() const {
|
|
return _vertexStencilTables ? _vertexStencilTables->GetNumStencils() : 0;
|
|
}
|
|
|
|
int
|
|
CudaComputeContext::GetNumStencilsInVaryingStencilTables() const {
|
|
return _varyingStencilTables ? _varyingStencilTables->GetNumStencils() : 0;
|
|
}
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
void *
|
|
CudaComputeContext::GetVertexStencilTablesSizes() const {
|
|
return _vertexStencilTables ? _vertexStencilTables->GetSizes() : 0;
|
|
}
|
|
|
|
void *
|
|
CudaComputeContext::GetVertexStencilTablesOffsets() const {
|
|
return _vertexStencilTables ? _vertexStencilTables->GetOffsets() : 0;
|
|
}
|
|
|
|
void *
|
|
CudaComputeContext::GetVertexStencilTablesIndices() const {
|
|
return _vertexStencilTables ? _vertexStencilTables->GetIndices() : 0;
|
|
}
|
|
|
|
void *
|
|
CudaComputeContext::GetVertexStencilTablesWeights() const {
|
|
return _vertexStencilTables ? _vertexStencilTables->GetWeights() : 0;
|
|
}
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
void *
|
|
CudaComputeContext::GetVaryingStencilTablesSizes() const {
|
|
return _varyingStencilTables ? _varyingStencilTables->GetSizes() : 0;
|
|
}
|
|
|
|
void *
|
|
CudaComputeContext::GetVaryingStencilTablesOffsets() const {
|
|
return _varyingStencilTables ? _varyingStencilTables->GetOffsets() : 0;
|
|
}
|
|
|
|
void *
|
|
CudaComputeContext::GetVaryingStencilTablesIndices() const {
|
|
return _varyingStencilTables ? _varyingStencilTables->GetIndices() : 0;
|
|
}
|
|
|
|
void *
|
|
CudaComputeContext::GetVaryingStencilTablesWeights() const {
|
|
return _varyingStencilTables ? _varyingStencilTables->GetWeights() : 0;
|
|
}
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
CudaComputeContext *
|
|
CudaComputeContext::Create(Far::StencilTables const * vertexStencilTables,
|
|
Far::StencilTables const * varyingStencilTables) {
|
|
|
|
CudaComputeContext *result =
|
|
new CudaComputeContext(vertexStencilTables, varyingStencilTables);
|
|
|
|
return result;
|
|
}
|
|
|
|
} // end namespace Osd
|
|
|
|
} // end namespace OPENSUBDIV_VERSION
|
|
} // end namespace OpenSubdiv
|