cavis/libnd4j/include/helpers/PointersManager.h

84 lines
2.2 KiB
C
Raw Normal View History

2021-02-01 13:31:45 +01:00
/* ******************************************************************************
*
*
* This program and the accompanying materials are made available under the
* terms of the Apache License, Version 2.0 which is available at
* https://www.apache.org/licenses/LICENSE-2.0.
*
* See the NOTICE file distributed with this work for additional
* information regarding copyright ownership.
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and limitations
* under the License.
*
* SPDX-License-Identifier: Apache-2.0
******************************************************************************/
//
// @author Yurii Shyrma (iuriish@yahoo.com), created on 06.02.2019
// @author raver119@gmail.com
//
#ifndef CUDAMANAGER_H
#define CUDAMANAGER_H
#include <vector>
#include <string>
#include <execution/LaunchContext.h>
#include <types/types.h>
2019-06-06 14:21:15 +02:00
namespace sd {
2019-06-06 14:21:15 +02:00
class ND4J_EXPORT PointersManager {
2019-06-06 14:21:15 +02:00
private:
sd::LaunchContext *_context;
2019-06-06 14:21:15 +02:00
std::vector<void*> _pOnGlobMem;
std::string _funcName;
public:
PointersManager(const sd::LaunchContext* context, const std::string& funcName = "");
2019-06-06 14:21:15 +02:00
~PointersManager();
void* replicatePointer(const void* src, const size_t size);
void synchronize() const;
template<typename T>
void printDevContentOnHost(const void* pDev, const Nd4jLong len) const;
#ifdef __CUDABLAS__
template<typename T>
static void printDevContentOnDevFromHost(const void* pDev, const Nd4jLong len, const int tid = 0);
#endif
#ifdef __CUDACC__
template<typename T>
static FORCEINLINE __device__ void printDevContentOnDev(const void* pDev, const Nd4jLong len, const int tid = 0) {
if(blockIdx.x * blockDim.x + threadIdx.x != tid)
return;
printf("device print out: \n");
for(Nd4jLong i = 0; i < len; ++i)
printf("%f, ", (double)reinterpret_cast<const T*>(pDev)[i]);
printf("\n");
}
#endif
};
}
#endif // CUDAMANAGER_H