mirror of
https://github.com/PixarAnimationStudios/OpenSubdiv
synced 2025-01-10 08:30:11 +00:00
82a0513326
refactor CL/CUDA specific initialization stuffs into examples/common/clDeviceContext and cudaDeviceContext, and update examples to use those structs. also - remove CL/CUDA tests from osd_regression. The tests for those kernels will be covered by glImaging. - update cuda initialization to use the GL-interoperable device if available. - remove CL specialization from glShareTopology, following the same pattern as we took in the previous OsdGLMesh refactoring. (still something strange with XFB kernels though) - fix file permissions.
168 lines
4.7 KiB
C++
168 lines
4.7 KiB
C++
//
|
|
// Copyright 2013 Pixar
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "Apache License")
|
|
// with the following modification; you may not use this file except in
|
|
// compliance with the Apache License and the following modification to it:
|
|
// Section 6. Trademarks. is deleted and replaced with:
|
|
//
|
|
// 6. Trademarks. This License does not grant permission to use the trade
|
|
// names, trademarks, service marks, or product names of the Licensor
|
|
// and its affiliates, except as required to comply with Section 4(c) of
|
|
// the License and to reproduce the content of the NOTICE file.
|
|
//
|
|
// You may obtain a copy of the Apache License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the Apache License with the above modification is
|
|
// distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the Apache License for the specific
|
|
// language governing permissions and limitations under the Apache License.
|
|
//
|
|
|
|
#include "../osd/cudaGLVertexBuffer.h"
|
|
#include "../osd/opengl.h"
|
|
#include "../far/error.h"
|
|
|
|
#include <cuda_runtime.h>
|
|
#include <cuda_gl_interop.h>
|
|
|
|
#include <cassert>
|
|
|
|
namespace OpenSubdiv {
|
|
namespace OPENSUBDIV_VERSION {
|
|
|
|
namespace Osd {
|
|
|
|
CudaGLVertexBuffer::CudaGLVertexBuffer(int numElements, int numVertices)
|
|
: _numElements(numElements), _numVertices(numVertices),
|
|
_vbo(0), _devicePtr(0), _cudaResource(0) {
|
|
}
|
|
|
|
CudaGLVertexBuffer::~CudaGLVertexBuffer() {
|
|
|
|
unmap();
|
|
cudaGraphicsUnregisterResource(_cudaResource);
|
|
glDeleteBuffers(1, &_vbo);
|
|
}
|
|
|
|
CudaGLVertexBuffer *
|
|
CudaGLVertexBuffer::Create(int numElements, int numVertices, void *) {
|
|
CudaGLVertexBuffer *instance =
|
|
new CudaGLVertexBuffer(numElements, numVertices);
|
|
if (instance->allocate()) return instance;
|
|
Far::Error(Far::FAR_RUNTIME_ERROR, "CudaGLVertexBuffer::Create failed.\n");
|
|
delete instance;
|
|
return NULL;
|
|
}
|
|
|
|
void
|
|
CudaGLVertexBuffer::UpdateData(const float *src,
|
|
int startVertex, int numVertices,
|
|
void * /*deviceContext*/) {
|
|
|
|
map();
|
|
cudaError_t err = cudaMemcpy((float*)_devicePtr + _numElements * startVertex,
|
|
src,
|
|
_numElements * numVertices * sizeof(float),
|
|
cudaMemcpyHostToDevice);
|
|
if (err != cudaSuccess)
|
|
Far::Error(Far::FAR_RUNTIME_ERROR,
|
|
"CudaGLVertexBuffer::UpdateData failed. : %s\n",
|
|
cudaGetErrorString(err));
|
|
}
|
|
|
|
int
|
|
CudaGLVertexBuffer::GetNumElements() const {
|
|
|
|
return _numElements;
|
|
}
|
|
|
|
int
|
|
CudaGLVertexBuffer::GetNumVertices() const {
|
|
|
|
return _numVertices;
|
|
}
|
|
|
|
float *
|
|
CudaGLVertexBuffer::BindCudaBuffer() {
|
|
|
|
map();
|
|
return static_cast<float*>(_devicePtr);
|
|
}
|
|
|
|
GLuint
|
|
CudaGLVertexBuffer::BindVBO(void * /*deviceContext*/) {
|
|
|
|
unmap();
|
|
return _vbo;
|
|
}
|
|
|
|
bool
|
|
CudaGLVertexBuffer::allocate() {
|
|
|
|
int size = _numElements * _numVertices * sizeof(float);
|
|
|
|
glGenBuffers(1, &_vbo);
|
|
|
|
#if defined(GL_EXT_direct_state_access)
|
|
if (glNamedBufferDataEXT) {
|
|
glNamedBufferDataEXT(_vbo, size, 0, GL_DYNAMIC_DRAW);
|
|
} else {
|
|
#else
|
|
{
|
|
#endif
|
|
glBindBuffer(GL_ARRAY_BUFFER, _vbo);
|
|
glBufferData(GL_ARRAY_BUFFER, size, 0, GL_DYNAMIC_DRAW);
|
|
glBindBuffer(GL_ARRAY_BUFFER, 0);
|
|
}
|
|
|
|
// register vbo as cuda resource
|
|
cudaError_t err = cudaGraphicsGLRegisterBuffer(
|
|
&_cudaResource, _vbo, cudaGraphicsMapFlagsWriteDiscard);
|
|
|
|
if (err != cudaSuccess) return false;
|
|
return true;
|
|
}
|
|
|
|
void
|
|
CudaGLVertexBuffer::map() {
|
|
|
|
if (_devicePtr) return;
|
|
size_t num_bytes;
|
|
void *ptr;
|
|
|
|
cudaError_t err = cudaGraphicsMapResources(1, &_cudaResource, 0);
|
|
if (err != cudaSuccess)
|
|
Far::Error(Far::FAR_RUNTIME_ERROR,
|
|
"CudaGLVertexBuffer::map failed.\n%s\n",
|
|
cudaGetErrorString(err));
|
|
err = cudaGraphicsResourceGetMappedPointer(&ptr, &num_bytes, _cudaResource);
|
|
if (err != cudaSuccess)
|
|
Far::Error(Far::FAR_RUNTIME_ERROR,
|
|
"CudaGLVertexBuffer::map failed.\n%s\n",
|
|
cudaGetErrorString(err));
|
|
_devicePtr = ptr;
|
|
}
|
|
|
|
void
|
|
CudaGLVertexBuffer::unmap() {
|
|
|
|
if (_devicePtr == NULL) return;
|
|
cudaError_t err = cudaGraphicsUnmapResources(1, &_cudaResource, 0);
|
|
if (err != cudaSuccess)
|
|
Far::Error(Far::FAR_RUNTIME_ERROR,
|
|
"CudaGLVertexBuffer::unmap failed.\n%s\n",
|
|
cudaGetErrorString(err));
|
|
_devicePtr = NULL;
|
|
}
|
|
|
|
|
|
} // end namespace Osd
|
|
|
|
} // end namespace OPENSUBDIV_VERSION
|
|
} // end namespace OpenSubdiv
|
|
|