2020-01-24 08:11:09 +01:00
|
|
|
/*******************************************************************************
|
|
|
|
* Copyright (c) 2020 Konduit K.K.
|
|
|
|
*
|
|
|
|
* This program and the accompanying materials are made available under the
|
|
|
|
* terms of the Apache License, Version 2.0 which is available at
|
|
|
|
* https://www.apache.org/licenses/LICENSE-2.0.
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
|
|
|
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
|
|
|
* License for the specific language governing permissions and limitations
|
|
|
|
* under the License.
|
|
|
|
*
|
|
|
|
* SPDX-License-Identifier: Apache-2.0
|
|
|
|
******************************************************************************/
|
|
|
|
|
|
|
|
//
|
|
|
|
// @author raver119@gmail.com
|
|
|
|
//
|
|
|
|
|
|
|
|
#include "../MemoryCounter.h"
|
|
|
|
#include <execution/AffinityManager.h>
|
2020-03-02 10:49:41 +01:00
|
|
|
#include <system/Environment.h>
|
2020-01-24 08:11:09 +01:00
|
|
|
#include <helpers/logger.h>
|
|
|
|
|
2020-03-02 10:49:41 +01:00
|
|
|
namespace sd {
|
2020-01-24 08:11:09 +01:00
|
|
|
namespace memory {
|
|
|
|
|
|
|
|
MemoryCounter::MemoryCounter() {
|
2020-03-02 10:49:41 +01:00
|
|
|
auto numDevices = sd::AffinityManager::numberOfDevices();
|
2020-01-24 08:11:09 +01:00
|
|
|
|
|
|
|
// setting default 0s
|
|
|
|
for (int e = 0; e < numDevices; e++) {
|
|
|
|
_deviceLimits[e] = 0;
|
|
|
|
_deviceCounters[e] = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
// setting initial values for limits
|
2020-03-02 10:49:41 +01:00
|
|
|
_groupLimits[sd::memory::MemoryType::HOST] = sd::Environment::getInstance()->maxPrimaryMemory();
|
|
|
|
_groupLimits[sd::memory::MemoryType::DEVICE] = sd::Environment::getInstance()->maxSpecialMemory();
|
2020-01-24 08:11:09 +01:00
|
|
|
|
|
|
|
// setting initial counter values
|
2020-03-02 10:49:41 +01:00
|
|
|
_groupCounters[sd::memory::MemoryType::HOST] = 0;
|
|
|
|
_groupCounters[sd::memory::MemoryType::DEVICE] = 0;
|
2020-01-24 08:11:09 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
MemoryCounter* MemoryCounter::getInstance() {
|
|
|
|
if (_INSTANCE == 0)
|
|
|
|
_INSTANCE = new MemoryCounter();
|
|
|
|
|
|
|
|
return _INSTANCE;
|
|
|
|
}
|
|
|
|
|
|
|
|
void MemoryCounter::countIn(int deviceId, Nd4jLong numBytes) {
|
|
|
|
std::lock_guard<std::mutex> lock(_locker);
|
|
|
|
_deviceCounters[deviceId] += numBytes;
|
|
|
|
}
|
|
|
|
|
2020-03-02 10:49:41 +01:00
|
|
|
void MemoryCounter::countIn(sd::memory::MemoryType group, Nd4jLong numBytes) {
|
2020-01-24 08:11:09 +01:00
|
|
|
std::lock_guard<std::mutex> lock(_locker);
|
|
|
|
_groupCounters[group] += numBytes;
|
|
|
|
}
|
|
|
|
|
|
|
|
void MemoryCounter::countOut(int deviceId, Nd4jLong numBytes) {
|
|
|
|
std::lock_guard<std::mutex> lock(_locker);
|
|
|
|
_deviceCounters[deviceId] -= numBytes;
|
|
|
|
}
|
|
|
|
|
2020-03-02 10:49:41 +01:00
|
|
|
void MemoryCounter::countOut(sd::memory::MemoryType group, Nd4jLong numBytes) {
|
2020-01-24 08:11:09 +01:00
|
|
|
std::lock_guard<std::mutex> lock(_locker);
|
|
|
|
_groupCounters[group] -= numBytes;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool MemoryCounter::validate(Nd4jLong numBytes) {
|
2020-03-02 10:49:41 +01:00
|
|
|
auto deviceId = sd::AffinityManager::currentDeviceId();
|
2020-01-24 08:11:09 +01:00
|
|
|
return validateDevice(deviceId, numBytes);
|
|
|
|
}
|
|
|
|
|
|
|
|
bool MemoryCounter::validateDevice(int deviceId, Nd4jLong numBytes) {
|
|
|
|
std::lock_guard<std::mutex> lock(_locker);
|
|
|
|
auto dLimit = _deviceLimits[deviceId];
|
|
|
|
if (dLimit <= 0)
|
|
|
|
return true;
|
|
|
|
|
|
|
|
auto dAlloc = _deviceCounters[deviceId];
|
|
|
|
|
|
|
|
return numBytes + dAlloc <= dLimit;
|
|
|
|
}
|
|
|
|
|
2020-03-02 10:49:41 +01:00
|
|
|
bool MemoryCounter::validateGroup(sd::memory::MemoryType group, Nd4jLong numBytes) {
|
2020-01-24 08:11:09 +01:00
|
|
|
std::lock_guard<std::mutex> lock(_locker);
|
|
|
|
auto gLimit = _groupLimits[group];
|
|
|
|
if (gLimit <= 0)
|
|
|
|
return true;
|
|
|
|
|
|
|
|
auto gAlloc = _groupCounters[group];
|
|
|
|
|
|
|
|
return numBytes + gAlloc <= gLimit;
|
|
|
|
}
|
|
|
|
|
|
|
|
Nd4jLong MemoryCounter::allocatedDevice(int deviceId) {
|
|
|
|
std::lock_guard<std::mutex> lock(_locker);
|
|
|
|
return _deviceCounters[deviceId];
|
|
|
|
}
|
|
|
|
|
2020-03-02 10:49:41 +01:00
|
|
|
Nd4jLong MemoryCounter::allocatedGroup(sd::memory::MemoryType group) {
|
2020-01-24 08:11:09 +01:00
|
|
|
std::lock_guard<std::mutex> lock(_locker);
|
|
|
|
return _groupCounters[group];
|
|
|
|
}
|
|
|
|
|
|
|
|
void MemoryCounter::setDeviceLimit(int deviceId, Nd4jLong numBytes) {
|
|
|
|
std::lock_guard<std::mutex> lock(_locker);
|
|
|
|
_deviceLimits[deviceId] = numBytes;
|
|
|
|
}
|
|
|
|
|
2020-03-02 10:49:41 +01:00
|
|
|
void MemoryCounter::setGroupLimit(sd::memory::MemoryType group, Nd4jLong numBytes) {
|
2020-01-24 08:11:09 +01:00
|
|
|
std::lock_guard<std::mutex> lock(_locker);
|
|
|
|
_groupLimits[group] = numBytes;
|
|
|
|
}
|
|
|
|
|
|
|
|
Nd4jLong MemoryCounter::deviceLimit(int deviceId) {
|
|
|
|
std::lock_guard<std::mutex> lock(_locker);
|
|
|
|
return _deviceLimits[deviceId];
|
|
|
|
}
|
|
|
|
|
2020-03-02 10:49:41 +01:00
|
|
|
Nd4jLong MemoryCounter::groupLimit(sd::memory::MemoryType group) {
|
2020-01-24 08:11:09 +01:00
|
|
|
std::lock_guard<std::mutex> lock(_locker);
|
|
|
|
return _groupLimits[group];
|
|
|
|
}
|
|
|
|
|
|
|
|
MemoryCounter* MemoryCounter::_INSTANCE = 0;
|
|
|
|
}
|
|
|
|
}
|