2015-05-09 00:31:26 +00:00
|
|
|
//
|
|
|
|
// Copyright 2015 Pixar
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "Apache License")
|
|
|
|
// with the following modification; you may not use this file except in
|
|
|
|
// compliance with the Apache License and the following modification to it:
|
|
|
|
// Section 6. Trademarks. is deleted and replaced with:
|
|
|
|
//
|
|
|
|
// 6. Trademarks. This License does not grant permission to use the trade
|
|
|
|
// names, trademarks, service marks, or product names of the Licensor
|
|
|
|
// and its affiliates, except as required to comply with Section 4(c) of
|
|
|
|
// the License and to reproduce the content of the NOTICE file.
|
|
|
|
//
|
|
|
|
// You may obtain a copy of the Apache License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the Apache License with the above modification is
|
|
|
|
// distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
|
|
// KIND, either express or implied. See the Apache License for the specific
|
|
|
|
// language governing permissions and limitations under the Apache License.
|
|
|
|
//
|
|
|
|
|
|
|
|
#include "../osd/cudaEvaluator.h"
|
|
|
|
|
|
|
|
#include <cuda_runtime.h>
|
|
|
|
#include <vector>
|
|
|
|
|
2015-05-22 18:50:01 +00:00
|
|
|
#include "../far/stencilTable.h"
|
2015-05-09 00:31:26 +00:00
|
|
|
|
|
|
|
extern "C" {
|
|
|
|
void CudaEvalStencils(const float *src,
|
|
|
|
float *dst,
|
|
|
|
int length,
|
|
|
|
int srcStride,
|
|
|
|
int dstStride,
|
2015-05-19 17:16:56 +00:00
|
|
|
const int * sizes,
|
2015-05-09 00:31:26 +00:00
|
|
|
const int * offsets,
|
|
|
|
const int * indices,
|
|
|
|
const float * weights,
|
|
|
|
int start,
|
|
|
|
int end);
|
|
|
|
}
|
|
|
|
|
|
|
|
namespace OpenSubdiv {
|
|
|
|
namespace OPENSUBDIV_VERSION {
|
|
|
|
|
|
|
|
namespace Osd {
|
|
|
|
|
|
|
|
template <class T> void *
|
|
|
|
createCudaBuffer(std::vector<T> const & src) {
|
|
|
|
void * devicePtr = 0;
|
|
|
|
|
|
|
|
size_t size = src.size()*sizeof(T);
|
|
|
|
|
|
|
|
cudaError_t err = cudaMalloc(&devicePtr, size);
|
|
|
|
if (err != cudaSuccess) {
|
|
|
|
return devicePtr;
|
|
|
|
}
|
|
|
|
|
|
|
|
err = cudaMemcpy(devicePtr, &src.at(0), size, cudaMemcpyHostToDevice);
|
|
|
|
if (err != cudaSuccess) {
|
|
|
|
cudaFree(devicePtr);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
return devicePtr;
|
|
|
|
}
|
|
|
|
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
|
2015-05-22 18:50:01 +00:00
|
|
|
CudaStencilTable::CudaStencilTable(Far::StencilTable const *stencilTable) {
|
|
|
|
_numStencils = stencilTable->GetNumStencils();
|
2015-05-09 00:31:26 +00:00
|
|
|
if (_numStencils > 0) {
|
2015-05-22 18:50:01 +00:00
|
|
|
_sizes = createCudaBuffer(stencilTable->GetSizes());
|
|
|
|
_offsets = createCudaBuffer(stencilTable->GetOffsets());
|
|
|
|
_indices = createCudaBuffer(stencilTable->GetControlIndices());
|
|
|
|
_weights = createCudaBuffer(stencilTable->GetWeights());
|
2015-05-09 00:31:26 +00:00
|
|
|
} else {
|
|
|
|
_sizes = _offsets = _indices = _weights = NULL;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-05-22 18:50:01 +00:00
|
|
|
CudaStencilTable::~CudaStencilTable() {
|
2015-05-09 00:31:26 +00:00
|
|
|
if (_sizes) cudaFree(_sizes);
|
|
|
|
if (_offsets) cudaFree(_offsets);
|
|
|
|
if (_indices) cudaFree(_indices);
|
|
|
|
if (_weights) cudaFree(_weights);
|
|
|
|
}
|
|
|
|
|
|
|
|
// ---------------------------------------------------------------------------
|
|
|
|
|
|
|
|
/* static */
|
|
|
|
bool
|
|
|
|
CudaEvaluator::EvalStencils(const float *src,
|
|
|
|
VertexBufferDescriptor const &srcDesc,
|
|
|
|
float *dst,
|
|
|
|
VertexBufferDescriptor const &dstDesc,
|
2015-05-19 17:16:56 +00:00
|
|
|
const int * sizes,
|
2015-05-09 00:31:26 +00:00
|
|
|
const int * offsets,
|
|
|
|
const int * indices,
|
|
|
|
const float * weights,
|
|
|
|
int start,
|
|
|
|
int end) {
|
|
|
|
CudaEvalStencils(src + srcDesc.offset,
|
|
|
|
dst + dstDesc.offset,
|
|
|
|
srcDesc.length,
|
|
|
|
srcDesc.stride,
|
|
|
|
dstDesc.stride,
|
|
|
|
sizes, offsets, indices, weights,
|
|
|
|
start, end);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* static */
|
|
|
|
void
|
|
|
|
CudaEvaluator::Synchronize(void * /*deviceContext*/) {
|
|
|
|
cudaThreadSynchronize();
|
|
|
|
}
|
|
|
|
|
|
|
|
} // end namespace Osd
|
|
|
|
|
|
|
|
} // end namespace OPENSUBDIV_VERSION
|
|
|
|
} // end namespace OpenSubdiv
|