mirror of
https://github.com/PixarAnimationStudios/OpenSubdiv
synced 2024-11-23 20:20:09 +00:00
de0082ba95
Removed the OpenCL/D3D11 specializations and added DEVICE_CONTEXT as a template parameter. Kernels which don't need a context object (e.g. CPU, OpenGL, CUDA) just ignore the context, and kernels which use a context (e.g. OpenCL, DirectX) take a context or a user-defined class which encapsulates device contexts. Note that OpenCL requires two objects, cl_context and cl_command_queue. The user-defined class must provide GetContext() and GetCommandQueue() for strongly typed binding to osd VertexBuffers and ComputeContexts. Osd::Mesh and MeshInterface have been used as a handy harness to host multiple GPU kernels and graphics APIs. However, it has CL/DirectX specializations and duplicates a large amount of plumbing code. With this change, glMesh.h and d3d11Mesh.h become just typedefs and all logic is put into mesh.h without specializations. Also cleaned up unused header files and code formatting.
152 lines
4.3 KiB
C++
152 lines
4.3 KiB
C++
//
|
|
// Copyright 2013 Pixar
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "Apache License")
|
|
// with the following modification; you may not use this file except in
|
|
// compliance with the Apache License and the following modification to it:
|
|
// Section 6. Trademarks. is deleted and replaced with:
|
|
//
|
|
// 6. Trademarks. This License does not grant permission to use the trade
|
|
// names, trademarks, service marks, or product names of the Licensor
|
|
// and its affiliates, except as required to comply with Section 4(c) of
|
|
// the License and to reproduce the content of the NOTICE file.
|
|
//
|
|
// You may obtain a copy of the Apache License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the Apache License with the above modification is
|
|
// distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the Apache License for the specific
|
|
// language governing permissions and limitations under the Apache License.
|
|
//
|
|
|
|
#include "../osd/cudaD3D11VertexBuffer.h"
|
|
#include "../far/error.h"
|
|
|
|
#include <D3D11.h>
|
|
#include <cuda_runtime.h>
|
|
#include <cuda_d3d11_interop.h>
|
|
#include <cassert>
|
|
|
|
namespace OpenSubdiv {
|
|
namespace OPENSUBDIV_VERSION {
|
|
|
|
namespace Osd {
|
|
|
|
// Records the buffer dimensions only. No D3D11 or CUDA object is created
// here: the D3D11 buffer and the CUDA graphics resource are set up by
// allocate(), and the mapped CUDA pointer by map(), so all three handles
// start out as NULL.
CudaD3D11VertexBuffer::CudaD3D11VertexBuffer(int numElements, int numVertices)
    : _numElements(numElements),
      _numVertices(numVertices),
      _d3d11Buffer(NULL),
      _cudaBuffer(NULL),
      _cudaResource(NULL) {
}
|
|
|
|
// Releases whatever this buffer owns.
//
// The instance may be only partially initialized: Create() deletes an
// instance whose allocate() failed, in which case the D3D11 buffer and/or
// the CUDA graphics resource are still NULL. Each handle is therefore
// checked before it is released.
CudaD3D11VertexBuffer::~CudaD3D11VertexBuffer() {

    // unmap first so the resource is not unregistered while still mapped
    unmap();

    if (_cudaResource != NULL) {
        cudaGraphicsUnregisterResource(_cudaResource);
        _cudaResource = NULL;
    }

    if (_d3d11Buffer != NULL) {
        _d3d11Buffer->Release();
        _d3d11Buffer = NULL;
    }
}
|
|
|
|
// Factory: builds a vertex buffer of numVertices vertices with numElements
// floats each, backed by a D3D11 buffer registered with CUDA.
//
//   numElements    number of floats per vertex
//   numVertices    number of vertices
//   deviceContext  D3D11 device context; only used to look up its device
//
// Returns the new instance, or NULL if deviceContext is NULL, no device
// could be obtained from it, or allocate() failed.
CudaD3D11VertexBuffer *
CudaD3D11VertexBuffer::Create(int numElements, int numVertices,
                              ID3D11DeviceContext *deviceContext) {

    if (deviceContext == NULL) return NULL;

    // the device has to be looked up before anything can use it
    ID3D11Device *device = NULL;
    deviceContext->GetDevice(&device);
    if (device == NULL) return NULL;

    CudaD3D11VertexBuffer *instance =
        new CudaD3D11VertexBuffer(numElements, numVertices);

    bool allocated = instance->allocate(device);

    // GetDevice() returns an AddRef'ed interface; drop our reference now
    // that allocation is done so the device is not leaked.
    device->Release();

    if (allocated) return instance;

    delete instance;
    return NULL;
}
|
|
|
|
void
|
|
CudaD3D11VertexBuffer::UpdateData(const float *src,
|
|
int startVertex, int numVertices,
|
|
void * /*deviceContext*/) {
|
|
|
|
map();
|
|
cudaMemcpy((float*)_cudaBuffer + _numElements * startVertex,
|
|
src, _numElements * numVertices * sizeof(float),
|
|
cudaMemcpyHostToDevice);
|
|
}
|
|
|
|
int
|
|
CudaD3D11VertexBuffer::GetNumElements() const {
|
|
|
|
return _numElements;
|
|
}
|
|
|
|
int
|
|
CudaD3D11VertexBuffer::GetNumVertices() const {
|
|
|
|
return _numVertices;
|
|
}
|
|
|
|
float *
|
|
CudaD3D11VertexBuffer::BindCudaBuffer() {
|
|
|
|
map();
|
|
return (float*)_cudaBuffer;
|
|
}
|
|
|
|
// Ends any outstanding CUDA mapping and returns the underlying D3D11
// buffer. The device context argument is accepted but not used here.
ID3D11Buffer *
CudaD3D11VertexBuffer::BindD3D11Buffer(ID3D11DeviceContext *deviceContext) {

    (void)deviceContext;

    unmap();

    ID3D11Buffer *buffer = _d3d11Buffer;
    return buffer;
}
|
|
|
|
bool
|
|
CudaD3D11VertexBuffer::allocate(ID3D11Device *device) {
|
|
|
|
D3D11_BUFFER_DESC hBufferDesc;
|
|
hBufferDesc.ByteWidth = _numElements * _numVertices * sizeof(float);
|
|
hBufferDesc.Usage = D3D11_USAGE_DYNAMIC;
|
|
hBufferDesc.BindFlags = D3D11_BIND_VERTEX_BUFFER | D3D11_BIND_SHADER_RESOURCE;
|
|
hBufferDesc.CPUAccessFlags = D3D11_CPU_ACCESS_WRITE;
|
|
hBufferDesc.MiscFlags = 0;
|
|
hBufferDesc.StructureByteStride = sizeof(float);
|
|
|
|
HRESULT hr;
|
|
hr = device->CreateBuffer(&hBufferDesc, NULL, &_d3d11Buffer);
|
|
if(FAILED(hr)) {
|
|
Far::Error(Far::FAR_RUNTIME_ERROR,
|
|
"Fail in CreateBuffer\n");
|
|
return false;
|
|
}
|
|
|
|
// register d3d11buffer as cuda resource
|
|
cudaError_t err = cudaGraphicsD3D11RegisterResource(
|
|
&_cudaResource, _d3d11Buffer, cudaGraphicsRegisterFlagsNone);
|
|
|
|
if (err != cudaSuccess) return false;
|
|
return true;
|
|
}
|
|
|
|
void
|
|
CudaD3D11VertexBuffer::map() {
|
|
|
|
if (_cudaBuffer) return;
|
|
size_t num_bytes;
|
|
void *ptr;
|
|
|
|
cudaGraphicsMapResources(1, &_cudaResource, 0);
|
|
cudaGraphicsResourceGetMappedPointer(&ptr, &num_bytes, _cudaResource);
|
|
_cudaBuffer = ptr;
|
|
}
|
|
|
|
void
|
|
CudaD3D11VertexBuffer::unmap() {
|
|
|
|
if (_cudaBuffer == NULL) return;
|
|
cudaGraphicsUnmapResources(1, &_cudaResource, 0);
|
|
_cudaBuffer = NULL;
|
|
}
|
|
|
|
} // end namespace Osd
|
|
|
|
} // end namespace OPENSUBDIV_VERSION
|
|
} // end namespace OpenSubdiv
|
|
|