mirror of
https://github.com/PixarAnimationStudios/OpenSubdiv
synced 2025-01-10 00:30:07 +00:00
82a0513326
Refactor CL/CUDA-specific initialization code into examples/common/clDeviceContext and cudaDeviceContext, and update the examples to use those structs. Also: - remove the CL/CUDA tests from osd_regression; the tests for those kernels will be covered by glImaging. - update CUDA initialization to use the GL-interoperable device if available. - remove the CL specialization from glShareTopology, following the same pattern we used in the previous OsdGLMesh refactoring (there is still something strange with the XFB kernels, though). - fix file permissions.
152 lines
4.2 KiB
C++
152 lines
4.2 KiB
C++
//
|
|
// Copyright 2013 Pixar
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "Apache License")
|
|
// with the following modification; you may not use this file except in
|
|
// compliance with the Apache License and the following modification to it:
|
|
// Section 6. Trademarks. is deleted and replaced with:
|
|
//
|
|
// 6. Trademarks. This License does not grant permission to use the trade
|
|
// names, trademarks, service marks, or product names of the Licensor
|
|
// and its affiliates, except as required to comply with Section 4(c) of
|
|
// the License and to reproduce the content of the NOTICE file.
|
|
//
|
|
// You may obtain a copy of the Apache License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the Apache License with the above modification is
|
|
// distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the Apache License for the specific
|
|
// language governing permissions and limitations under the Apache License.
|
|
//
|
|
|
|
#include "../osd/cudaD3D11VertexBuffer.h"
|
|
#include "../far/error.h"
|
|
|
|
#include <D3D11.h>
|
|
#include <cuda_runtime.h>
|
|
#include <cuda_d3d11_interop.h>
|
|
#include <cassert>
|
|
|
|
namespace OpenSubdiv {
|
|
namespace OPENSUBDIV_VERSION {
|
|
|
|
namespace Osd {
|
|
|
|
// Records the requested dimensions and starts with every resource handle
// set to NULL. No D3D11 or CUDA call is made here; the resources are created
// later by allocate().
CudaD3D11VertexBuffer::CudaD3D11VertexBuffer(int numElements, int numVertices)
    : _numElements(numElements),
      _numVertices(numVertices),
      _d3d11Buffer(NULL),
      _cudaBuffer(NULL),
      _cudaResource(NULL) {
}
|
|
|
|
// Tears the buffer down: ends any active CUDA mapping, unregisters the CUDA
// graphics resource and releases the D3D11 buffer, in that order.
//
// Create() deletes the instance when allocate() fails, so either handle may
// still be NULL at this point. Each one is checked before it is used, so a
// partially constructed object can be destroyed safely.
CudaD3D11VertexBuffer::~CudaD3D11VertexBuffer() {

    // does nothing unless the resource is currently mapped
    unmap();

    if (_cudaResource != NULL) {
        cudaGraphicsUnregisterResource(_cudaResource);
        _cudaResource = NULL;
    }

    if (_d3d11Buffer != NULL) {
        _d3d11Buffer->Release();
        _d3d11Buffer = NULL;
    }
}
|
|
|
|
// Factory: builds a vertex buffer of numVertices * numElements floats on the
// device that owns deviceContext.
//
// Returns the new instance, or NULL when deviceContext is NULL, its device
// cannot be obtained, or allocate() fails. The caller owns the returned
// object.
CudaD3D11VertexBuffer *
CudaD3D11VertexBuffer::Create(int numElements, int numVertices,
                              ID3D11DeviceContext *deviceContext) {

    if (deviceContext == NULL) return NULL;

    ID3D11Device *device = NULL;
    deviceContext->GetDevice(&device);
    if (device == NULL) return NULL;

    CudaD3D11VertexBuffer *instance =
        new CudaD3D11VertexBuffer(numElements, numVertices);

    bool const allocated = instance->allocate(device);

    // GetDevice() returns the device with an added reference; drop it now
    // that allocation is done so the device is not leaked.
    device->Release();

    if (allocated) return instance;

    delete instance;
    return NULL;
}
|
|
|
|
void
|
|
CudaD3D11VertexBuffer::UpdateData(const float *src,
|
|
int startVertex, int numVertices,
|
|
void * /*deviceContext*/) {
|
|
|
|
map();
|
|
cudaMemcpy((float*)_cudaBuffer + _numElements * startVertex,
|
|
src, _numElements * numVertices * sizeof(float),
|
|
cudaMemcpyHostToDevice);
|
|
}
|
|
|
|
int
|
|
CudaD3D11VertexBuffer::GetNumElements() const {
|
|
|
|
return _numElements;
|
|
}
|
|
|
|
int
|
|
CudaD3D11VertexBuffer::GetNumVertices() const {
|
|
|
|
return _numVertices;
|
|
}
|
|
|
|
float *
|
|
CudaD3D11VertexBuffer::BindCudaBuffer() {
|
|
|
|
map();
|
|
return (float*)_cudaBuffer;
|
|
}
|
|
|
|
// Ends any active CUDA mapping and returns the underlying D3D11 buffer.
// The deviceContext argument is not used by this implementation.
ID3D11Buffer *
CudaD3D11VertexBuffer::BindD3D11Buffer(ID3D11DeviceContext *deviceContext) {
    unmap();
    ID3D11Buffer *buffer = _d3d11Buffer;
    return buffer;
}
|
|
|
|
bool
|
|
CudaD3D11VertexBuffer::allocate(ID3D11Device *device) {
|
|
|
|
D3D11_BUFFER_DESC hBufferDesc;
|
|
hBufferDesc.ByteWidth = _numElements * _numVertices * sizeof(float);
|
|
hBufferDesc.Usage = D3D11_USAGE_DYNAMIC;
|
|
hBufferDesc.BindFlags = D3D11_BIND_VERTEX_BUFFER | D3D11_BIND_SHADER_RESOURCE;
|
|
hBufferDesc.CPUAccessFlags = D3D11_CPU_ACCESS_WRITE;
|
|
hBufferDesc.MiscFlags = 0;
|
|
hBufferDesc.StructureByteStride = sizeof(float);
|
|
|
|
HRESULT hr;
|
|
hr = device->CreateBuffer(&hBufferDesc, NULL, &_d3d11Buffer);
|
|
if(FAILED(hr)) {
|
|
Far::Error(Far::FAR_RUNTIME_ERROR,
|
|
"Fail in CreateBuffer\n");
|
|
return false;
|
|
}
|
|
|
|
// register d3d11buffer as cuda resource
|
|
cudaError_t err = cudaGraphicsD3D11RegisterResource(
|
|
&_cudaResource, _d3d11Buffer, cudaGraphicsRegisterFlagsNone);
|
|
|
|
if (err != cudaSuccess) return false;
|
|
return true;
|
|
}
|
|
|
|
void
|
|
CudaD3D11VertexBuffer::map() {
|
|
|
|
if (_cudaBuffer) return;
|
|
size_t num_bytes;
|
|
void *ptr;
|
|
|
|
cudaGraphicsMapResources(1, &_cudaResource, 0);
|
|
cudaGraphicsResourceGetMappedPointer(&ptr, &num_bytes, _cudaResource);
|
|
_cudaBuffer = ptr;
|
|
}
|
|
|
|
void
|
|
CudaD3D11VertexBuffer::unmap() {
|
|
|
|
if (_cudaBuffer == NULL) return;
|
|
cudaGraphicsUnmapResources(1, &_cudaResource, 0);
|
|
_cudaBuffer = NULL;
|
|
}
|
|
|
|
} // end namespace Osd
|
|
|
|
} // end namespace OPENSUBDIV_VERSION
|
|
} // end namespace OpenSubdiv
|
|
|