OpenSubdiv/opensubdiv/osd/cudaD3D11VertexBuffer.cpp
Takahito Tejima de0082ba95 Simplify Osd::MeshInterface.
Removed the OpenCL/D3D11 specializations and added DEVICE_CONTEXT as a
template parameter. Kernels which don't need a context object (e.g.
CPU, OpenGL, CUDA) just ignore the context, and kernels which use a
context (e.g. OpenCL, DirectX) take a context or a user-defined class
which encapsulates device contexts. Note that OpenCL requires
two objects, cl_context and cl_command_queue. The user-defined
class must provide GetContext() and GetCommandQueue() for strongly typed
binding to osd VertexBuffers and ComputeContexts.

Osd::Mesh and MeshInterface have been used as a handy harness to host
multiple GPU kernels and graphics APIs. However, it has CL/DirectX
specializations and duplicates a large amount of plumbing code. With this
change, glMesh.h and d3d11Mesh.h become just typedefs and all logic is
put into mesh.h without specializations.

Also cleaned up unused header files and code formatting.
2015-04-27 11:27:05 -07:00

152 lines
4.3 KiB
C++

//
// Copyright 2013 Pixar
//
// Licensed under the Apache License, Version 2.0 (the "Apache License")
// with the following modification; you may not use this file except in
// compliance with the Apache License and the following modification to it:
// Section 6. Trademarks. is deleted and replaced with:
//
// 6. Trademarks. This License does not grant permission to use the trade
// names, trademarks, service marks, or product names of the Licensor
// and its affiliates, except as required to comply with Section 4(c) of
// the License and to reproduce the content of the NOTICE file.
//
// You may obtain a copy of the Apache License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the Apache License with the above modification is
// distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the Apache License for the specific
// language governing permissions and limitations under the Apache License.
//
#include "../osd/cudaD3D11VertexBuffer.h"
#include "../far/error.h"
#include <D3D11.h>
#include <cuda_runtime.h>
#include <cuda_d3d11_interop.h>
#include <cassert>
namespace OpenSubdiv {
namespace OPENSUBDIV_VERSION {
namespace Osd {
// Stores the buffer layout (number of floats per vertex and number of
// vertices) and clears every resource handle. No D3D11 or CUDA object is
// created here.
CudaD3D11VertexBuffer::CudaD3D11VertexBuffer(int numElements, int numVertices)
    : _numElements(numElements),
      _numVertices(numVertices),
      _d3d11Buffer(NULL),
      _cudaBuffer(NULL),
      _cudaResource(NULL) {
}
// Tears down the CUDA/D3D11 interop state: unmaps the resource if it is
// currently mapped, unregisters it from CUDA and drops the reference held on
// the D3D11 buffer.
CudaD3D11VertexBuffer::~CudaD3D11VertexBuffer() {
    // The resource must not stay mapped while it is being unregistered.
    unmap();

    // Create() deletes the instance when allocate() fails, and allocate() can
    // fail before either handle has been set, so both may still be NULL here.
    if (_cudaResource != NULL) {
        cudaGraphicsUnregisterResource(_cudaResource);
        _cudaResource = NULL;
    }
    if (_d3d11Buffer != NULL) {
        _d3d11Buffer->Release();
        _d3d11Buffer = NULL;
    }
}
// Factory: builds a vertex buffer of numVertices vertices with numElements
// floats each, backed by a D3D11 buffer created on the device that owns
// deviceContext.
//
// Returns the new instance, or NULL when deviceContext is NULL, its device
// cannot be obtained, or allocate() fails. The caller owns the returned
// object.
CudaD3D11VertexBuffer *
CudaD3D11VertexBuffer::Create(int numElements, int numVertices,
                              ID3D11DeviceContext *deviceContext) {
    if (deviceContext == NULL) return NULL;

    // GetDevice() returns the device with its reference count incremented,
    // so it has to be released once we are done with it.
    ID3D11Device *device = NULL;
    deviceContext->GetDevice(&device);
    if (device == NULL) return NULL;

    // The constructor only takes the layout; the device is needed solely by
    // allocate().
    CudaD3D11VertexBuffer *instance =
        new CudaD3D11VertexBuffer(numElements, numVertices);
    const bool allocated = instance->allocate(device);
    device->Release();

    if (allocated) return instance;
    delete instance;
    return NULL;
}
void
CudaD3D11VertexBuffer::UpdateData(const float *src,
int startVertex, int numVertices,
void * /*deviceContext*/) {
map();
cudaMemcpy((float*)_cudaBuffer + _numElements * startVertex,
src, _numElements * numVertices * sizeof(float),
cudaMemcpyHostToDevice);
}
int
CudaD3D11VertexBuffer::GetNumElements() const {
return _numElements;
}
int
CudaD3D11VertexBuffer::GetNumVertices() const {
return _numVertices;
}
// Maps the buffer for CUDA access (no-op when it is already mapped) and
// returns the mapped pointer viewed as an array of floats.
float *
CudaD3D11VertexBuffer::BindCudaBuffer() {
    map();
    float *mapped = static_cast<float *>(_cudaBuffer);
    return mapped;
}
// Ends any active CUDA mapping and returns the underlying D3D11 buffer.
// The deviceContext argument is not used by this implementation.
ID3D11Buffer *
CudaD3D11VertexBuffer::BindD3D11Buffer(ID3D11DeviceContext *deviceContext) {
    (void)deviceContext;
    unmap();
    ID3D11Buffer *buffer = _d3d11Buffer;
    return buffer;
}
// Creates the D3D11 buffer sized for _numElements * _numVertices floats on
// the given device and registers it with CUDA as a graphics resource.
//
// Returns true on success. On failure an error is reported through
// Far::Error and false is returned; a D3D11 buffer that was already created
// stays in _d3d11Buffer.
bool
CudaD3D11VertexBuffer::allocate(ID3D11Device *device) {
    if (device == NULL) {
        Far::Error(Far::FAR_RUNTIME_ERROR,
                   "Fail in allocate: no D3D11 device\n");
        return false;
    }

    D3D11_BUFFER_DESC hBufferDesc;
    hBufferDesc.ByteWidth = _numElements * _numVertices * sizeof(float);
    hBufferDesc.Usage = D3D11_USAGE_DYNAMIC;
    hBufferDesc.BindFlags = D3D11_BIND_VERTEX_BUFFER | D3D11_BIND_SHADER_RESOURCE;
    hBufferDesc.CPUAccessFlags = D3D11_CPU_ACCESS_WRITE;
    hBufferDesc.MiscFlags = 0;
    hBufferDesc.StructureByteStride = sizeof(float);

    HRESULT hr = device->CreateBuffer(&hBufferDesc, NULL, &_d3d11Buffer);
    if (FAILED(hr)) {
        Far::Error(Far::FAR_RUNTIME_ERROR,
                   "Fail in CreateBuffer\n");
        return false;
    }

    // register d3d11buffer as cuda resource
    cudaError_t err = cudaGraphicsD3D11RegisterResource(
        &_cudaResource, _d3d11Buffer, cudaGraphicsRegisterFlagsNone);
    if (err != cudaSuccess) {
        // Report this failure the same way as the CreateBuffer failure and
        // make sure no stale resource handle is left behind.
        _cudaResource = NULL;
        Far::Error(Far::FAR_RUNTIME_ERROR,
                   "Fail in cudaGraphicsD3D11RegisterResource\n");
        return false;
    }
    return true;
}
void
CudaD3D11VertexBuffer::map() {
if (_cudaBuffer) return;
size_t num_bytes;
void *ptr;
cudaGraphicsMapResources(1, &_cudaResource, 0);
cudaGraphicsResourceGetMappedPointer(&ptr, &num_bytes, _cudaResource);
_cudaBuffer = ptr;
}
// Ends the CUDA mapping of the resource, if one is active, and clears the
// cached mapped pointer. Does nothing when the buffer is not mapped.
void
CudaD3D11VertexBuffer::unmap() {
    if (_cudaBuffer != NULL) {
        cudaGraphicsUnmapResources(1, &_cudaResource, 0);
        _cudaBuffer = NULL;
    }
}
} // end namespace Osd
} // end namespace OPENSUBDIV_VERSION
} // end namespace OpenSubdiv