OpenSubdiv/opensubdiv/osd/cudaComputeContext.cpp

//
//   Copyright 2013 Pixar
//
//   Licensed under the Apache License, Version 2.0 (the "Apache License")
//   with the following modification; you may not use this file except in
//   compliance with the Apache License and the following modification to it:
//   Section 6. Trademarks. is deleted and replaced with:
//
//   6. Trademarks. This License does not grant permission to use the trade
//      names, trademarks, service marks, or product names of the Licensor
//      and its affiliates, except as required to comply with Section 4(c) of
//      the License and to reproduce the content of the NOTICE file.
//
//   You may obtain a copy of the Apache License at
//
//       http://www.apache.org/licenses/LICENSE-2.0
//
//   Unless required by applicable law or agreed to in writing, software
//   distributed under the Apache License with the above modification is
//   distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
//   KIND, either express or implied. See the Apache License for the specific
//   language governing permissions and limitations under the Apache License.
//

#include "../far/stencilTables.h"

#include "../osd/cudaComputeContext.h"

#include <cuda_runtime.h>
#include <vector>

namespace OpenSubdiv {
namespace OPENSUBDIV_VERSION {

namespace Osd {

// ----------------------------------------------------------------------------

template <class T> void *
createCudaBuffer(std::vector<T> const & src) {

    void * devicePtr=0;

    size_t size = src.size()*sizeof(T);

    cudaError_t err = cudaMalloc(&devicePtr, size);
    if (err != cudaSuccess) {
        return devicePtr;
    }

    err = cudaMemcpy(devicePtr, &src.at(0), size, cudaMemcpyHostToDevice);
    if (err != cudaSuccess) {
        cudaFree(devicePtr);
        return 0;
    }
    return devicePtr;
}

// ----------------------------------------------------------------------------

class CudaComputeContext::CudaStencilTables {

public:

    CudaStencilTables(Far::StencilTables const & stencilTables) {
        _sizes = createCudaBuffer(stencilTables.GetSizes());
        _offsets = createCudaBuffer(stencilTables.GetOffsets());
        _indices = createCudaBuffer(stencilTables.GetControlIndices());
        _weights = createCudaBuffer(stencilTables.GetWeights());
        _numStencils = stencilTables.GetNumStencils();
    }

    ~CudaStencilTables() {
        if (_sizes) { cudaFree(_sizes); }
        if (_offsets) { cudaFree(_offsets); }
        if (_indices) { cudaFree(_indices); }
        if (_weights) { cudaFree(_weights); }
    }

    bool IsValid() const {
        return _sizes and _offsets and _indices and _weights;
    }

    void * GetSizes() const {
        return _sizes;
    }

    void * GetOffsets() const {
        return _offsets;
    }

    void * GetIndices() const {
        return _indices;
    }

    void * GetWeights() const {
        return _weights;
    }

    int GetNumStencils() const {
        return _numStencils;
    }

private:
    void * _sizes,
         * _offsets,
         * _indices,
         * _weights;
    int _numStencils;
};

// ----------------------------------------------------------------------------

CudaComputeContext::CudaComputeContext(
    Far::StencilTables const * vertexStencilTables,
        Far::StencilTables const * varyingStencilTables) :
            _vertexStencilTables(0), _varyingStencilTables(0),
                _numControlVertices(0) {

    if (vertexStencilTables) {
        _vertexStencilTables = new CudaStencilTables(*vertexStencilTables);
        _numControlVertices = vertexStencilTables->GetNumControlVertices();
    }

    if (varyingStencilTables) {
        _varyingStencilTables = new CudaStencilTables(*varyingStencilTables);

        if (_numControlVertices) {
            assert(_numControlVertices==varyingStencilTables->GetNumControlVertices());
        } else {
            _numControlVertices = varyingStencilTables->GetNumControlVertices();
        }
    }
}

CudaComputeContext::~CudaComputeContext() {
    delete _vertexStencilTables;
    delete _varyingStencilTables;
}

// ----------------------------------------------------------------------------

bool
CudaComputeContext::HasVertexStencilTables() const {
    return _vertexStencilTables ? _vertexStencilTables->IsValid() : false;
}

bool
CudaComputeContext::HasVaryingStencilTables() const {
    return _varyingStencilTables ? _varyingStencilTables->IsValid() : false;
}

int
CudaComputeContext::GetNumStencilsInVertexStencilTables() const {
    return _vertexStencilTables ? _vertexStencilTables->GetNumStencils() : 0;
}

int
CudaComputeContext::GetNumStencilsInVaryingStencilTables() const {
    return _varyingStencilTables ? _varyingStencilTables->GetNumStencils() : 0;
}

// ----------------------------------------------------------------------------

void *
CudaComputeContext::GetVertexStencilTablesSizes() const {
    return _vertexStencilTables ? _vertexStencilTables->GetSizes() : 0;
}

void *
CudaComputeContext::GetVertexStencilTablesOffsets() const {
    return _vertexStencilTables ? _vertexStencilTables->GetOffsets() : 0;
}

void *
CudaComputeContext::GetVertexStencilTablesIndices() const {
    return _vertexStencilTables ? _vertexStencilTables->GetIndices() : 0;
}

void *
CudaComputeContext::GetVertexStencilTablesWeights() const {
    return _vertexStencilTables ? _vertexStencilTables->GetWeights() : 0;
}

// ----------------------------------------------------------------------------

void *
CudaComputeContext::GetVaryingStencilTablesSizes() const {
    return _varyingStencilTables ? _varyingStencilTables->GetSizes() : 0;
}

void *
CudaComputeContext::GetVaryingStencilTablesOffsets() const {
    return _varyingStencilTables ? _varyingStencilTables->GetOffsets() : 0;
}

void *
CudaComputeContext::GetVaryingStencilTablesIndices() const {
    return _varyingStencilTables ? _varyingStencilTables->GetIndices() : 0;
}

void *
CudaComputeContext::GetVaryingStencilTablesWeights() const {
    return _varyingStencilTables ? _varyingStencilTables->GetWeights() : 0;
}

// ----------------------------------------------------------------------------

CudaComputeContext *
CudaComputeContext::Create(Far::StencilTables const * vertexStencilTables,
                              Far::StencilTables const * varyingStencilTables) {

    CudaComputeContext *result =
        new CudaComputeContext(vertexStencilTables, varyingStencilTables);

    return result;
}

}  // end namespace Osd

}  // end namespace OPENSUBDIV_VERSION
}  // end namespace OpenSubdiv