OpenSubdiv/opensubdiv/osd/cudaComputeContext.cpp
Takahito Tejima a57dd034e7 Reorganize ComputeContext and ComputeController.
Moved transient states (current vertex buffer etc) to controller.
ComputeContext becomes constant so that it's well suited for coarse-grain
parallelism on cpu. The prims sharing same topology (ComputeContext) can
be refined simultaneously by having mutiple compute controllers.
Client facing API doesn't change.
2014-05-06 08:53:36 -07:00

214 lines
5.9 KiB
C++

//
// Copyright 2013 Pixar
//
// Licensed under the Apache License, Version 2.0 (the "Apache License")
// with the following modification; you may not use this file except in
// compliance with the Apache License and the following modification to it:
// Section 6. Trademarks. is deleted and replaced with:
//
// 6. Trademarks. This License does not grant permission to use the trade
// names, trademarks, service marks, or product names of the Licensor
// and its affiliates, except as required to comply with Section 4(c) of
// the License and to reproduce the content of the NOTICE file.
//
// You may obtain a copy of the Apache License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the Apache License with the above modification is
// distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the Apache License for the specific
// language governing permissions and limitations under the Apache License.
//
#include "../osd/cudaComputeContext.h"
#include <cuda_runtime.h>
namespace OpenSubdiv {
namespace OPENSUBDIV_VERSION {
bool
OsdCudaTable::createCudaBuffer(size_t size, const void *ptr) {
cudaError_t err = cudaMalloc(&_devicePtr, size);
if (err != cudaSuccess) {
return false;
}
err = cudaMemcpy(_devicePtr, ptr, size, cudaMemcpyHostToDevice);
if (err != cudaSuccess) {
cudaFree(_devicePtr);
_devicePtr = NULL;
return false;
}
return true;
}
OsdCudaTable::~OsdCudaTable() {
if (_devicePtr) cudaFree(_devicePtr);
}
void *
OsdCudaTable::GetCudaMemory() const {
return _devicePtr;
}
// ----------------------------------------------------------------------------
OsdCudaHEditTable::OsdCudaHEditTable()
: _primvarIndicesTable(NULL), _editValuesTable(NULL) {
}
OsdCudaHEditTable::~OsdCudaHEditTable() {
delete _primvarIndicesTable;
delete _editValuesTable;
}
OsdCudaHEditTable *
OsdCudaHEditTable::Create(const FarVertexEditTables::VertexEditBatch &batch) {
OsdCudaHEditTable *result = new OsdCudaHEditTable();
result->_operation = batch.GetOperation();
result->_primvarOffset = batch.GetPrimvarIndex();
result->_primvarWidth = batch.GetPrimvarWidth();
result->_primvarIndicesTable = OsdCudaTable::Create(batch.GetVertexIndices());
result->_editValuesTable = OsdCudaTable::Create(batch.GetValues());
if (result->_primvarIndicesTable == NULL or
result->_editValuesTable == NULL) {
delete result;
return NULL;
}
return result;
}
const OsdCudaTable *
OsdCudaHEditTable::GetPrimvarIndices() const {
return _primvarIndicesTable;
}
const OsdCudaTable *
OsdCudaHEditTable::GetEditValues() const {
return _editValuesTable;
}
int
OsdCudaHEditTable::GetOperation() const {
return _operation;
}
int
OsdCudaHEditTable::GetPrimvarOffset() const {
return _primvarOffset;
}
int
OsdCudaHEditTable::GetPrimvarWidth() const {
return _primvarWidth;
}
// ----------------------------------------------------------------------------
OsdCudaComputeContext::OsdCudaComputeContext() {
}
OsdCudaComputeContext::~OsdCudaComputeContext() {
for (size_t i = 0; i < _tables.size(); ++i) {
delete _tables[i];
}
for (size_t i = 0; i < _editTables.size(); ++i) {
delete _editTables[i];
}
}
bool
OsdCudaComputeContext::initialize(FarSubdivisionTables const *subdivisionTables,
FarVertexEditTables const *vertexEditTables) {
// allocate 5 or 7 tables
_tables.resize(subdivisionTables->GetNumTables(), 0);
_tables[FarSubdivisionTables::E_IT] = OsdCudaTable::Create(subdivisionTables->Get_E_IT());
_tables[FarSubdivisionTables::V_IT] = OsdCudaTable::Create(subdivisionTables->Get_V_IT());
_tables[FarSubdivisionTables::V_ITa] = OsdCudaTable::Create(subdivisionTables->Get_V_ITa());
_tables[FarSubdivisionTables::E_W] = OsdCudaTable::Create(subdivisionTables->Get_E_W());
_tables[FarSubdivisionTables::V_W] = OsdCudaTable::Create(subdivisionTables->Get_V_W());
if (subdivisionTables->GetNumTables() > 5) {
_tables[FarSubdivisionTables::F_IT] = OsdCudaTable::Create(subdivisionTables->Get_F_IT());
_tables[FarSubdivisionTables::F_ITa] = OsdCudaTable::Create(subdivisionTables->Get_F_ITa());
}
// error check
for (size_t i = 0; i < _tables.size(); ++i) {
if (_tables[i] == NULL) {
return false;
}
}
// create hedit tables
if (vertexEditTables) {
int numEditBatches = vertexEditTables->GetNumBatches();
_editTables.reserve(numEditBatches);
for (int i = 0; i < numEditBatches; ++i) {
const FarVertexEditTables::VertexEditBatch & edit =
vertexEditTables->GetBatch(i);
_editTables.push_back(OsdCudaHEditTable::Create(edit));
}
}
// error check
for (size_t i = 0; i < _editTables.size(); ++i) {
if (_editTables[i] == NULL) return false;
}
return true;
}
const OsdCudaTable *
OsdCudaComputeContext::GetTable(int tableIndex) const {
return _tables[tableIndex];
}
int
OsdCudaComputeContext::GetNumEditTables() const {
return static_cast<int>(_editTables.size());
}
const OsdCudaHEditTable *
OsdCudaComputeContext::GetEditTable(int tableIndex) const {
return _editTables[tableIndex];
}
OsdCudaComputeContext *
OsdCudaComputeContext::Create(FarSubdivisionTables const *subdivisionTables,
FarVertexEditTables const *vertexEditTables) {
OsdCudaComputeContext *result = new OsdCudaComputeContext();
if (result->initialize(subdivisionTables, vertexEditTables) == false) {
delete result;
return NULL;
}
return result;
}
} // end namespace OPENSUBDIV_VERSION
} // end namespace OpenSubdiv