mirror of
https://github.com/PixarAnimationStudios/OpenSubdiv
synced 2025-01-07 23:40:12 +00:00
eb09b9e14c
Further leverage cmake object libraries to share object files for CPU and GPU OSD libraries, avoiding duplicate complation for dynamic/static build passes. CMake restricts object library inputs to header and source files, so the .inc files were renamed to .gen.h (which seems like a better name anyway) to make CMake happy. Also updated the .gitignore file to ignore .gen.h files. Conflicts: opensubdiv/osd/CMakeLists.txt
377 lines
12 KiB
C++
377 lines
12 KiB
C++
//
|
|
// Copyright 2013 Pixar
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "Apache License")
|
|
// with the following modification; you may not use this file except in
|
|
// compliance with the Apache License and the following modification to it:
|
|
// Section 6. Trademarks. is deleted and replaced with:
|
|
//
|
|
// 6. Trademarks. This License does not grant permission to use the trade
|
|
// names, trademarks, service marks, or product names of the Licensor
|
|
// and its affiliates, except as required to comply with Section 4(c) of
|
|
// the License and to reproduce the content of the NOTICE file.
|
|
//
|
|
// You may obtain a copy of the Apache License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the Apache License with the above modification is
|
|
// distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the Apache License for the specific
|
|
// language governing permissions and limitations under the Apache License.
|
|
//
|
|
|
|
#include "../osd/debug.h"
|
|
#include "../osd/error.h"
|
|
#include "../osd/d3d11KernelBundle.h"
|
|
|
|
#define INITGUID // for IID_ID3D11ShaderReflection
|
|
#include <D3D11.h>
|
|
#include <D3D11shader.h>
|
|
#include <D3Dcompiler.h>
|
|
|
|
#include <cassert>
|
|
#include <cstring>
|
|
#include <sstream>
|
|
#include <string>
|
|
|
|
namespace OpenSubdiv {
|
|
namespace OPENSUBDIV_VERSION {
|
|
|
|
static const char *shaderSource =
|
|
#include "../osd/hlslComputeKernel.gen.h"
|
|
;
|
|
|
|
#define SAFE_RELEASE(p) { if(p) { (p)->Release(); (p)=NULL; } }
|
|
|
|
OsdD3D11ComputeKernelBundle::OsdD3D11ComputeKernelBundle(
|
|
ID3D11DeviceContext * deviceContext) :
|
|
_deviceContext(deviceContext),
|
|
_computeShader(0),
|
|
_classLinkage(0),
|
|
_kernelCB(0),
|
|
_kernelComputeFace(0),
|
|
_kernelComputeEdge(0),
|
|
_kernelComputeBilinearEdge(0),
|
|
_kernelComputeVertex(0),
|
|
_kernelComputeVertexA(0),
|
|
_kernelComputeCatmarkVertexB(0),
|
|
_kernelComputeLoopVertexB(0),
|
|
_kernelEditAdd(0) {
|
|
|
|
// XXX: too rough!
|
|
_workGroupSize = 64;
|
|
}
|
|
|
|
OsdD3D11ComputeKernelBundle::~OsdD3D11ComputeKernelBundle() {
|
|
SAFE_RELEASE(_computeShader);
|
|
SAFE_RELEASE(_classLinkage);
|
|
SAFE_RELEASE(_kernelCB);
|
|
SAFE_RELEASE(_kernelComputeFace);
|
|
SAFE_RELEASE(_kernelComputeEdge);
|
|
SAFE_RELEASE(_kernelComputeBilinearEdge);
|
|
SAFE_RELEASE(_kernelComputeVertex);
|
|
SAFE_RELEASE(_kernelComputeVertexA);
|
|
SAFE_RELEASE(_kernelComputeCatmarkVertexB);
|
|
SAFE_RELEASE(_kernelComputeLoopVertexB);
|
|
SAFE_RELEASE(_kernelEditAdd);
|
|
}
|
|
|
|
bool
|
|
OsdD3D11ComputeKernelBundle::Compile(int numVertexElements,
|
|
int numVaryingElements) {
|
|
|
|
_vdesc.Set( numVertexElements, numVaryingElements );
|
|
|
|
DWORD dwShaderFlags = D3DCOMPILE_ENABLE_STRICTNESS;
|
|
#ifdef _DEBUG
|
|
dwShaderFlags |= D3DCOMPILE_DEBUG;
|
|
#endif
|
|
|
|
std::ostringstream ss;
|
|
ss << numVertexElements;
|
|
std::string numVertexElementsStr(ss.str());
|
|
ss.str("");
|
|
ss << numVaryingElements;
|
|
std::string numVaryingElementsStr(ss.str());
|
|
ss.str("");
|
|
ss << _workGroupSize;
|
|
std::string workGroupSizeStr(ss.str());
|
|
|
|
D3D_SHADER_MACRO shaderDefines[] = {
|
|
"NUM_VERTEX_ELEMENTS", numVertexElementsStr.c_str(),
|
|
"NUM_VARYING_ELEMENTS", numVaryingElementsStr.c_str(),
|
|
"WORK_GROUP_SIZE", workGroupSizeStr.c_str(),
|
|
0, 0
|
|
};
|
|
|
|
ID3DBlob* pComputeShaderBuffer = NULL;
|
|
ID3DBlob* pErrorBuffer = NULL;
|
|
|
|
HRESULT hr = D3DCompile(shaderSource, strlen(shaderSource),
|
|
NULL, &shaderDefines[0], NULL,
|
|
"cs_main", "cs_5_0",
|
|
dwShaderFlags, 0,
|
|
&pComputeShaderBuffer, &pErrorBuffer);
|
|
if (FAILED(hr)) {
|
|
if (pErrorBuffer != NULL) {
|
|
OsdError(OSD_D3D11_COMPILE_ERROR,
|
|
"Error compiling HLSL shader: %s\n",
|
|
(CHAR*)pErrorBuffer->GetBufferPointer());
|
|
pErrorBuffer->Release();
|
|
return false;
|
|
}
|
|
}
|
|
|
|
ID3D11Device *device = NULL;
|
|
_deviceContext->GetDevice(&device);
|
|
assert(device);
|
|
|
|
device->CreateClassLinkage(&_classLinkage);
|
|
assert(_classLinkage);
|
|
|
|
device->CreateComputeShader(pComputeShaderBuffer->GetBufferPointer(),
|
|
pComputeShaderBuffer->GetBufferSize(),
|
|
_classLinkage,
|
|
&_computeShader);
|
|
assert(_computeShader);
|
|
|
|
ID3D11ShaderReflection *reflector;
|
|
D3DReflect(pComputeShaderBuffer->GetBufferPointer(),
|
|
pComputeShaderBuffer->GetBufferSize(),
|
|
IID_ID3D11ShaderReflection, (void**) &reflector);
|
|
assert(reflector);
|
|
|
|
assert(reflector->GetNumInterfaceSlots() == 1);
|
|
reflector->Release();
|
|
|
|
pComputeShaderBuffer->Release();
|
|
|
|
_classLinkage->GetClassInstance(
|
|
"catmarkComputeFace", 0, &_kernelComputeFace);
|
|
assert(_kernelComputeFace);
|
|
_classLinkage->GetClassInstance(
|
|
"catmarkComputeEdge", 0, &_kernelComputeEdge);
|
|
assert(_kernelComputeEdge);
|
|
_classLinkage->GetClassInstance(
|
|
"bilinearComputeEdge", 0, &_kernelComputeBilinearEdge);
|
|
assert(_kernelComputeBilinearEdge);
|
|
_classLinkage->GetClassInstance(
|
|
"bilinearComputeVertex", 0, &_kernelComputeVertex);
|
|
assert(_kernelComputeVertex);
|
|
_classLinkage->GetClassInstance(
|
|
"catmarkComputeVertexA", 0, &_kernelComputeVertexA);
|
|
assert(_kernelComputeVertexA);
|
|
_classLinkage->GetClassInstance(
|
|
"catmarkComputeVertexB", 0, &_kernelComputeCatmarkVertexB);
|
|
assert(_kernelComputeCatmarkVertexB);
|
|
_classLinkage->GetClassInstance(
|
|
"loopComputeVertexB", 0, &_kernelComputeLoopVertexB);
|
|
assert(_kernelComputeLoopVertexB);
|
|
_classLinkage->GetClassInstance(
|
|
"editAdd", 0, &_kernelEditAdd);
|
|
assert(_kernelEditAdd);
|
|
|
|
return true;
|
|
}
|
|
|
|
// must match constant buffer declaration in hlslComputeKernel.hlsl
|
|
__declspec(align(16))
|
|
struct OsdD3D11ComputeKernelBundle::KernelCB {
|
|
int vertexOffset; // vertex index offset for the batch
|
|
int tableOffset; // offset of subdivision table
|
|
int indexStart; // start index relative to tableOffset
|
|
int indexEnd; // end index relative to tableOffset
|
|
BOOL vertexPass; // 4-byte bool
|
|
|
|
// vertex edit kernel
|
|
int editPrimVarOffset;
|
|
int editPrimVarWidth;
|
|
};
|
|
|
|
void
|
|
OsdD3D11ComputeKernelBundle::dispatchCompute(
|
|
ID3D11ClassInstance * kernel, KernelCB const & args) {
|
|
|
|
int count = args.indexEnd - args.indexStart;
|
|
if (count <= 0) return;
|
|
|
|
if (! _kernelCB) {
|
|
ID3D11Device *device = NULL;
|
|
_deviceContext->GetDevice(&device);
|
|
assert(device);
|
|
|
|
D3D11_BUFFER_DESC cbDesc;
|
|
ZeroMemory(&cbDesc, sizeof(cbDesc));
|
|
cbDesc.Usage = D3D11_USAGE_DYNAMIC;
|
|
cbDesc.BindFlags = D3D11_BIND_CONSTANT_BUFFER;
|
|
cbDesc.CPUAccessFlags = D3D11_CPU_ACCESS_WRITE;
|
|
cbDesc.MiscFlags = 0;
|
|
cbDesc.ByteWidth = sizeof(KernelCB);
|
|
device->CreateBuffer(&cbDesc, NULL, &_kernelCB);
|
|
}
|
|
assert(_kernelCB);
|
|
|
|
D3D11_MAPPED_SUBRESOURCE MappedResource;
|
|
_deviceContext->Map(_kernelCB, 0, D3D11_MAP_WRITE_DISCARD, 0, &MappedResource);
|
|
CopyMemory(MappedResource.pData, &args, sizeof(KernelCB));
|
|
_deviceContext->Unmap(_kernelCB, 0);
|
|
_deviceContext->CSSetConstantBuffers(0, 1, &_kernelCB); // b0
|
|
|
|
_deviceContext->CSSetShader(_computeShader, &kernel, 1);
|
|
_deviceContext->Dispatch(count/_workGroupSize + 1, 1, 1);
|
|
}
|
|
|
|
void
|
|
OsdD3D11ComputeKernelBundle::ApplyBilinearFaceVerticesKernel(
|
|
int vertexOffset, int tableOffset, int start, int end) {
|
|
|
|
KernelCB args;
|
|
ZeroMemory(&args, sizeof(args));
|
|
args.vertexOffset = vertexOffset;
|
|
args.tableOffset = tableOffset;
|
|
args.indexStart = start;
|
|
args.indexEnd = end;
|
|
dispatchCompute(_kernelComputeFace, args);
|
|
}
|
|
|
|
void
|
|
OsdD3D11ComputeKernelBundle::ApplyBilinearEdgeVerticesKernel(
|
|
int vertexOffset, int tableOffset, int start, int end) {
|
|
|
|
KernelCB args;
|
|
ZeroMemory(&args, sizeof(args));
|
|
args.vertexOffset = vertexOffset;
|
|
args.tableOffset = tableOffset;
|
|
args.indexStart = start;
|
|
args.indexEnd = end;
|
|
dispatchCompute(_kernelComputeBilinearEdge, args);
|
|
}
|
|
|
|
void
|
|
OsdD3D11ComputeKernelBundle::ApplyBilinearVertexVerticesKernel(
|
|
int vertexOffset, int tableOffset, int start, int end) {
|
|
|
|
KernelCB args;
|
|
ZeroMemory(&args, sizeof(args));
|
|
args.vertexOffset = vertexOffset;
|
|
args.tableOffset = tableOffset;
|
|
args.indexStart = start;
|
|
args.indexEnd = end;
|
|
dispatchCompute(_kernelComputeVertex, args);
|
|
}
|
|
|
|
|
|
void
|
|
OsdD3D11ComputeKernelBundle::ApplyCatmarkFaceVerticesKernel(
|
|
int vertexOffset, int tableOffset, int start, int end) {
|
|
|
|
KernelCB args;
|
|
ZeroMemory(&args, sizeof(args));
|
|
args.vertexOffset = vertexOffset;
|
|
args.tableOffset = tableOffset;
|
|
args.indexStart = start;
|
|
args.indexEnd = end;
|
|
dispatchCompute(_kernelComputeFace, args);
|
|
}
|
|
|
|
void
|
|
OsdD3D11ComputeKernelBundle::ApplyCatmarkEdgeVerticesKernel(
|
|
int vertexOffset, int tableOffset, int start, int end) {
|
|
|
|
KernelCB args;
|
|
ZeroMemory(&args, sizeof(args));
|
|
args.vertexOffset = vertexOffset;
|
|
args.tableOffset = tableOffset;
|
|
args.indexStart = start;
|
|
args.indexEnd = end;
|
|
dispatchCompute(_kernelComputeEdge, args);
|
|
}
|
|
|
|
void
|
|
OsdD3D11ComputeKernelBundle::ApplyCatmarkVertexVerticesKernelB(
|
|
int vertexOffset, int tableOffset, int start, int end) {
|
|
|
|
KernelCB args;
|
|
ZeroMemory(&args, sizeof(args));
|
|
args.vertexOffset = vertexOffset;
|
|
args.tableOffset = tableOffset;
|
|
args.indexStart = start;
|
|
args.indexEnd = end;
|
|
dispatchCompute(_kernelComputeCatmarkVertexB, args);
|
|
}
|
|
|
|
void
|
|
OsdD3D11ComputeKernelBundle::ApplyCatmarkVertexVerticesKernelA(
|
|
int vertexOffset, int tableOffset, int start, int end, bool pass) {
|
|
|
|
KernelCB args;
|
|
ZeroMemory(&args, sizeof(args));
|
|
args.vertexOffset = vertexOffset;
|
|
args.tableOffset = tableOffset;
|
|
args.indexStart = start;
|
|
args.indexEnd = end;
|
|
args.vertexPass = pass ? 1 : 0;
|
|
dispatchCompute(_kernelComputeVertexA, args);
|
|
}
|
|
|
|
void
|
|
OsdD3D11ComputeKernelBundle::ApplyLoopEdgeVerticesKernel(
|
|
int vertexOffset, int tableOffset, int start, int end) {
|
|
|
|
KernelCB args;
|
|
ZeroMemory(&args, sizeof(args));
|
|
args.vertexOffset = vertexOffset;
|
|
args.tableOffset = tableOffset;
|
|
args.indexStart = start;
|
|
args.indexEnd = end;
|
|
dispatchCompute(_kernelComputeEdge, args);
|
|
}
|
|
|
|
void
|
|
OsdD3D11ComputeKernelBundle::ApplyLoopVertexVerticesKernelB(
|
|
int vertexOffset, int tableOffset, int start, int end) {
|
|
|
|
KernelCB args;
|
|
ZeroMemory(&args, sizeof(args));
|
|
args.vertexOffset = vertexOffset;
|
|
args.tableOffset = tableOffset;
|
|
args.indexStart = start;
|
|
args.indexEnd = end;
|
|
dispatchCompute(_kernelComputeLoopVertexB, args);
|
|
}
|
|
|
|
void
|
|
OsdD3D11ComputeKernelBundle::ApplyLoopVertexVerticesKernelA(
|
|
int vertexOffset, int tableOffset, int start, int end, bool pass) {
|
|
|
|
KernelCB args;
|
|
ZeroMemory(&args, sizeof(args));
|
|
args.vertexOffset = vertexOffset;
|
|
args.tableOffset = tableOffset;
|
|
args.indexStart = start;
|
|
args.indexEnd = end;
|
|
args.vertexPass = pass ? 1 : 0;
|
|
dispatchCompute(_kernelComputeVertexA, args);
|
|
}
|
|
|
|
void
|
|
OsdD3D11ComputeKernelBundle::ApplyEditAdd(
|
|
int primvarOffset, int primvarWidth,
|
|
int vertexOffset, int tableOffset, int start, int end) {
|
|
|
|
KernelCB args;
|
|
ZeroMemory(&args, sizeof(args));
|
|
args.vertexOffset = vertexOffset;
|
|
args.tableOffset = tableOffset;
|
|
args.indexStart = start;
|
|
args.indexEnd = end;
|
|
args.editPrimVarOffset = primvarOffset;
|
|
args.editPrimVarWidth = primvarWidth;
|
|
dispatchCompute(_kernelEditAdd, args);
|
|
}
|
|
|
|
} // end namespace OPENSUBDIV_VERSION
|
|
} // end namespace OpenSubdiv
|