1459 lines
57 KiB
C++
1459 lines
57 KiB
C++
/*******************************************************************************
|
|
* Copyright (c) 2015-2018 Skymind, Inc.
|
|
*
|
|
* This program and the accompanying materials are made available under the
|
|
* terms of the Apache License, Version 2.0 which is available at
|
|
* https://www.apache.org/licenses/LICENSE-2.0.
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
|
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
|
* License for the specific language governing permissions and limitations
|
|
* under the License.
|
|
*
|
|
* SPDX-License-Identifier: Apache-2.0
|
|
******************************************************************************/
|
|
|
|
//
|
|
// @author raver119@gmail.com
|
|
//
|
|
|
|
#include <graph/Graph.h>
|
|
#include <array/DataTypeUtils.h>
|
|
#include <helpers/EnumUtils.h>
|
|
#include <graph/FlatUtils.h>
|
|
#include <legacy/NativeOps.h>
|
|
#include <vector>
|
|
#include <helpers/ShapeUtils.h>
|
|
#include <ops/declarable/OpRegistrator.h>
|
|
#include <graph/VariableProxy.h>
|
|
#include <exceptions/graph_exception.h>
|
|
#include <graph/exceptions/unresolved_input_exception.h>
|
|
#include <graph/exceptions/unresolved_output_exception.h>
|
|
|
|
namespace sd {
|
|
namespace graph {
|
|
std::vector<Node*>* Graph::getAllNodes() {
|
|
return &_handles;
|
|
}
|
|
|
|
std::vector<Variable*>* Graph::getPlaceholders() {
|
|
return _variableSpace->getPlaceholders();
|
|
}
|
|
|
|
int Graph::numberOfPlaceholders() {
|
|
return _variableSpace->numberOfPlaceholders();
|
|
};
|
|
|
|
Nd4jLong Graph::estimateRequiredMemory() {
|
|
|
|
Nd4jLong result = 0L;
|
|
Nd4jLong lastStep = 0L;
|
|
|
|
std::vector<Nd4jLong const*> shapes;
|
|
MAP_IMPL<std::pair<int,int>, Nd4jLong const*> shapesMap;
|
|
|
|
int cntFD = 0;
|
|
|
|
// we loop in similar way to execution
|
|
for (int l = 0; l < (int) _onion->size(); l++) {
|
|
int layerSize = _onion->count(l) == 1 ? _onion->at(l)->size() : 0;
|
|
|
|
|
|
for (int n = 0; n < layerSize; n++) {
|
|
Node* node = _onion->at(l)->at(n);
|
|
|
|
/*
|
|
* Limited number of options here:
|
|
*
|
|
* 1) Op is inplace, so adds nothing to total
|
|
* 2) Op is not inplace, and 1:1 transform
|
|
* 3) Op is reduction (i.e. sum)
|
|
* 4) Op is multiplicator (i.e. im2col)
|
|
*/
|
|
if (node->hasCustomOp()) {
|
|
//if (node->isInplace()) {
|
|
// continue;
|
|
//}
|
|
|
|
|
|
nd4j_debug("Trying estimation [%i] on [%s]\n", node->id(), node->getCustomOp()->getOpName()->c_str());
|
|
|
|
auto op = node->getCustomOp();
|
|
auto in = node->input()->at(0);
|
|
|
|
auto block = node->getContextPrototype();
|
|
std::vector<Nd4jLong const*> inputShapes;
|
|
int *oldShape;
|
|
for (auto v: *node->input()) {
|
|
nd4j_debug(" inputs for estimation are: %i:%i\n", v.first, v.second);
|
|
if (v.first < 0) {
|
|
inputShapes.push_back(_variableSpace->getVariable(v.first)->getNDArray()->shapeInfo());
|
|
} else {
|
|
inputShapes.push_back(shapesMap.at(v));
|
|
}
|
|
}
|
|
|
|
Context ctx(block, _variableSpace);
|
|
|
|
ShapeList inSha(inputShapes);
|
|
auto outSha = op->calculateOutputShape(&inSha, ctx);
|
|
|
|
int cnt = 0;
|
|
for (auto newShape: *outSha->asVector()) {
|
|
std::pair<int, int> pairAddr(node->id(), cnt++);
|
|
std::pair<std::pair<int, int>, Nd4jLong const*> pairShape(pairAddr, newShape);
|
|
|
|
shapesMap.insert(pairShape);
|
|
|
|
if (!block->isInplace() && !node->isInplace())
|
|
result += shape::length(newShape) * DataTypeUtils::sizeOfElement(node->dataType());
|
|
|
|
shapes.push_back(newShape);
|
|
}
|
|
|
|
delete outSha;
|
|
} else if (node->getOpClass() == OpClass_TRANSFORM) {
|
|
auto vec = node->input();
|
|
|
|
auto in = node->input()->at(0);
|
|
if (in.first < 0) {
|
|
|
|
auto x = _variableSpace->getVariable(in);
|
|
auto z = _variableSpace->getVariable(node->id());
|
|
|
|
auto newShape = new Nd4jLong[shape::shapeInfoLength(x->getNDArray()->shapeInfo())];
|
|
memcpy(newShape, x->getNDArray()->shapeInfo(), shape::shapeInfoByteLength(x->getNDArray()->shapeInfo()));
|
|
|
|
std::pair<int, int> pairAddr(node->id(), 0);
|
|
std::pair<std::pair<int, int>, Nd4jLong const*> pairShape(pairAddr, newShape);
|
|
|
|
shapesMap.insert(pairShape);
|
|
|
|
if (!node->isInplace())
|
|
result += shape::length(newShape) * DataTypeUtils::sizeOfElement(node->dataType());
|
|
|
|
shapes.push_back(newShape);
|
|
} else {
|
|
auto prevShape = shapesMap.at(in);
|
|
|
|
auto newShape = new Nd4jLong[shape::shapeInfoLength(prevShape)];
|
|
memcpy(newShape, prevShape, shape::shapeInfoByteLength(prevShape));
|
|
|
|
std::pair<int, int> pairAddr(node->id(), 0);
|
|
std::pair<std::pair<int, int>, Nd4jLong const*> pairShape(pairAddr, newShape);
|
|
|
|
shapesMap.insert(pairShape);
|
|
|
|
if (!node->isInplace())
|
|
result += shape::length(newShape) * DataTypeUtils::sizeOfElement(node->dataType());
|
|
|
|
shapes.push_back(newShape);
|
|
}
|
|
|
|
} else if (node->getOpClass() == OpClass_REDUCTION) {
|
|
Nd4jLong const* newShape = nullptr;
|
|
|
|
// if that's scalar output - we don't care about previous node
|
|
if (node->getDimensions()->size() == 0 || (node->getDimensions()->size() == 1 && node->getDimensions()->at(0) == sd::DataTypeUtils::max<int>())) {
|
|
// auto aNewShape = new Nd4jLong[8];
|
|
//
|
|
// aNewShape[0] = 2;
|
|
// aNewShape[1] = 1;
|
|
// aNewShape[2] = 1;
|
|
// aNewShape[3] = 1;
|
|
// aNewShape[4] = 1;
|
|
// aNewShape[5] = 8192; // set type as FLOAT32 by default
|
|
// aNewShape[6] = 1;
|
|
// aNewShape[7] = 99;
|
|
newShape = ConstantShapeHelper::getInstance()->createShapeInfo(DataType::FLOAT32, 'c', {1,1});
|
|
} else {
|
|
auto in = node->input()->at(0);
|
|
|
|
Nd4jLong const* oldShape = nullptr;
|
|
// calculate tads here
|
|
if (in.first < 0) {
|
|
auto x = _variableSpace->getVariable(in)->getNDArray();
|
|
|
|
oldShape = x->shapeInfo();
|
|
} else {
|
|
|
|
oldShape = shapesMap.at(in);
|
|
}
|
|
|
|
//shape::TAD tad(oldShape, node->getDimensions()->data(), node->getDimensions()->size());
|
|
auto numTads = shape::tadLength(oldShape, node->getDimensions()->data(), node->getDimensions()->size());
|
|
Nd4jLong shape[2] = {1, (int) numTads};
|
|
newShape = ConstantShapeHelper::getInstance()->createShapeInfo(ArrayOptions::dataType(oldShape), 'c', 2, shape);
|
|
}
|
|
|
|
std::pair<int, int> pairAddr(node->id(), 0);
|
|
std::pair<std::pair<int, int>, Nd4jLong const*> pairShape(pairAddr, newShape);
|
|
|
|
shapesMap.insert(pairShape);
|
|
|
|
result += shape::length(newShape) * DataTypeUtils::sizeOfElement(node->dataType());
|
|
|
|
shapes.push_back(newShape);
|
|
} else if (node->getOpClass() == OpClass_MULTIPLICATOR) {
|
|
// can't be in non-special op
|
|
}
|
|
|
|
|
|
cntFD++;
|
|
}
|
|
}
|
|
|
|
// this is the only place where we deallocate shapes.
|
|
//if (_variableSpace->launchContext()->getWorkspace() == nullptr)
|
|
// for (auto v: shapes)
|
|
// delete[] v;
|
|
|
|
return result;
|
|
}
|
|
|
|
void Graph::pushToOutputOnce(int id) {
|
|
if (std::find(_output.begin(), _output.end(), id) == _output.end())
|
|
_output.emplace_back(id);
|
|
}
|
|
|
|
void Graph::addOutput(int id) {
|
|
if (_configuration->_outputMode == OutputMode_EXPLICIT || _configuration->_outputMode == OutputMode_EXPLICIT_AND_IMPLICIT)
|
|
pushToOutputOnce(id);
|
|
}
|
|
|
|
ExecutorConfiguration * Graph::getExecutorConfiguration() {
|
|
return _configuration;
|
|
}
|
|
|
|
std::vector<Variable *> * Graph::fetchOutputs() {
|
|
auto res = new std::vector<Variable *>();
|
|
|
|
nd4j_debug("Graph output size: %i\n", _output.size());
|
|
for (int e = 0; e < (int) _output.size(); e++) {
|
|
auto nodeId = _output.at(e);
|
|
nd4j_debug("Output node: %i\n", nodeId);
|
|
|
|
for (int e = 0; e < DataTypeUtils::max<int>(); e++) {
|
|
if (_variableSpace->hasVariable(nodeId, e)) {
|
|
res->push_back(_variableSpace->getVariable(nodeId, e));
|
|
} else {
|
|
if (e == 0) {
|
|
throw unresolved_output_exception::build("Can't find output variable", nodeId, e);
|
|
} else
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
return res;
|
|
}
|
|
|
|
MAP_IMPL<int, Node *> * Graph::getMapped() {
|
|
return _mapped;
|
|
}
|
|
|
|
MAP_IMPL<int, std::vector<Node *> *>* Graph::getOnion() {
|
|
return _onion;
|
|
}
|
|
|
|
void Graph::injectNode(Node *node) {
|
|
if (node->getLayer() < 0)
|
|
throw std::runtime_error("Only nodes with non-negative layer defined can be inserted");
|
|
|
|
std::pair<int, Node *> pair(node->id(), node);
|
|
if (_mapped->count(pair.first) > 0)
|
|
return;
|
|
|
|
nd4j_debug("Node_%i mapped to layer_%i\n", node->id(), node->getLayer());
|
|
|
|
|
|
_onion->at(node->getLayer())->push_back(node);
|
|
_mapped->insert(pair);
|
|
}
|
|
|
|
void Graph::expandOnion(int newLayer) {
|
|
if (_onion->count(newLayer) > 0)
|
|
return;
|
|
|
|
std::vector<Node *> *rootList = new std::vector<Node *>();
|
|
std::pair<int, std::vector<Node *>*> pair(newLayer, rootList);
|
|
_onion->insert(pair);
|
|
}
|
|
|
|
VariableSpace * Graph::getVariableSpace() {
|
|
return _variableSpace;
|
|
}
|
|
|
|
Graph::~Graph() {
|
|
for (auto &v: *_mapped)
|
|
delete v.second;
|
|
|
|
for (auto &v: _unmapped)
|
|
delete v.second;
|
|
|
|
for (auto &v: *_onion)
|
|
delete v.second;
|
|
|
|
|
|
for (auto v: _scopes)
|
|
delete v;
|
|
|
|
delete _mapped;
|
|
delete _nodes;
|
|
delete _variableSpace;
|
|
delete _onion;
|
|
delete _configuration;
|
|
}
|
|
|
|
void Graph::addNode(Node *node) {
|
|
_built.store(false);
|
|
|
|
if (node->opType() == OpType_LOGIC) {
|
|
// nd4j_debug("Adding LogicOp [%i]\n", node->opNum());
|
|
// SCOPE
|
|
if (node->opNum() == logic::Scope) {
|
|
auto scope = new Scope(node->id(), node->getName() != nullptr ? node->getName()->c_str() : "");
|
|
_mappedScopes[node->id()] = scope;
|
|
_scopes.push_back(scope);
|
|
}
|
|
}
|
|
|
|
auto cname = node->getName() == nullptr ? nullptr : node->getName()->c_str();
|
|
auto nodeState = _variableSpace->hasVariable(node->id()) ? _variableSpace->getVariable(node->id()) :new Variable(nullptr, cname, node->id());
|
|
if (node->getName() != nullptr)
|
|
nodeState->setName(node->getName());
|
|
|
|
|
|
if (node->isInplace())
|
|
nodeState->markRemovable(false);
|
|
|
|
_handles.push_back(node);
|
|
|
|
|
|
_nodes->emplace_back(node->id());
|
|
|
|
// storing node state now
|
|
_variableSpace->putVariable(node->id(), nodeState);
|
|
|
|
// here we're filling our blocks with future variables
|
|
if (node->opType() == OpType_LOGIC && node->opNum() == logic::While) {
|
|
// filling while
|
|
int inputs = node->input()->size();
|
|
for (int e = 0; e < inputs - 2; e++){
|
|
auto deepVar = new Variable(nullptr, nullptr, node->id(), e);
|
|
|
|
std::pair<int,int> id(node->id(), e);
|
|
_variableSpace->putVariable(id, deepVar);
|
|
}
|
|
|
|
} else if (node->hasCustomOp()) {
|
|
// custom ops require Block inside. but we'll set it inside buildGraph
|
|
|
|
// TODO: we want to change this, to make blocks thread-local/session-local
|
|
ContextPrototype* block = nullptr;
|
|
|
|
if (!node->hasBlockAttached()) {
|
|
block = new ContextPrototype(node->getCustomOp()->getOpDescriptor(), node->id());
|
|
node->setContextPrototype(block);
|
|
} else
|
|
block = node->getContextPrototype();
|
|
|
|
|
|
if (!block->hasVariablesFilled()) {
|
|
|
|
for (uint32_t e = 0; e < node->input()->size(); e++) {
|
|
auto p = node->input()->at(e);
|
|
|
|
block->pickInput(p);
|
|
}
|
|
}
|
|
|
|
// and might have > 1 output
|
|
if (node->getCustomOp()->getOpDescriptor()->getNumberOfOutputs() > 1) {
|
|
for (int e = 1; e < node->getCustomOp()->getOpDescriptor()->getNumberOfOutputs(); e++) {
|
|
auto deepVar = new Variable(nullptr, nullptr, node->id());
|
|
//deepVar->setId(node->id());
|
|
deepVar->setId(node->id(), e);
|
|
if (node->isInplace())
|
|
deepVar->markRemovable(false);
|
|
|
|
std::pair<int,int> id(node->id(), e);
|
|
_variableSpace->putVariable(id, deepVar);
|
|
}
|
|
} else {
|
|
// we need to check, if we should propagate output of this variable somewhere
|
|
for (int e = 0; e < node->output()->size(); e++) {
|
|
auto out = node->output()->at(e);
|
|
if (out.first < 0) {
|
|
nd4j_debug("Node [%i] will be propagating its output to Variable [%i]\n", node->id(), out.first);
|
|
auto extVar = _variableSpace->getVariable(out);
|
|
if (extVar->hasNDArray()) {
|
|
nodeState->setNDArray(extVar->getNDArray());
|
|
nodeState->markRemovable(false);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// we're saving only ops that have internal outpus here
|
|
if (_configuration->_outputMode == OutputMode_VARIABLE_SPACE)
|
|
if (node->hasInternalOutputs())
|
|
pushToOutputOnce(node->id());
|
|
|
|
// if outputs are undefined, we have to auto-create variable
|
|
if (node->output()->size() == 0 || (node->output()->size() == 1 && node->output()->at(0).first == 0)){
|
|
Variable* var;
|
|
if (!_variableSpace->hasVariable(node->id())) {
|
|
var = new Variable();
|
|
} else {
|
|
var = _variableSpace->getVariable(node->id());
|
|
}
|
|
// nd4j_logger("Adding auto output variable; Output size: %i\n", node->output()->size());
|
|
|
|
var->setId(node->id());
|
|
var->setName(node->getName());
|
|
_variableSpace->putOutputVariable(var);
|
|
//node->pickExternalOutput(var->id());
|
|
|
|
this->_autos.push_back(var->id());
|
|
|
|
// }
|
|
} else if (node->hasExternalOutputs()) {
|
|
// TODO: we might want this behavior configurable!
|
|
nd4j_logger("Adding specific output variable: Outputs: %i; HasInternal: %i;\n", node->output()->size(), node->hasInternalOutputs());
|
|
|
|
// we're pushing this node to output only
|
|
if ((!node->hasInternalOutputs() && (_configuration->_outputMode == OutputMode_IMPLICIT || _configuration->_outputMode == OutputMode_EXPLICIT_AND_IMPLICIT)) ) {
|
|
for (int e = 0; e < (int) node->output()->size(); e++) {
|
|
if (node->output()->at(e).first < 0)
|
|
pushToOutputOnce(node->output()->at(e).first);
|
|
}
|
|
|
|
nd4j_logger("Loop finished: %i outputs now\n", this->_output.size());
|
|
}
|
|
}
|
|
|
|
// ops that are tied to specific scope are never placed into the structure.
|
|
if (node->isScoped()) {
|
|
if (_mappedScopes.count(node->scopeId()) < 1) {
|
|
nd4j_printf("Requested scope [%i/%s] wasn't created yet\n", node->scopeId(), node->scopeName()->c_str());
|
|
throw std::invalid_argument("Unknown scope requested");
|
|
}
|
|
|
|
Scope* scope = _mappedScopes.at(node->scopeId());
|
|
scope->push_back(node);
|
|
|
|
return;
|
|
}
|
|
|
|
std::pair<int, Node *> pair(node->id(), node);
|
|
// nd4j_debug("Adding node_%i\n", node->id());
|
|
// if model has only external variables as input - it goes to first layer, no matter what.
|
|
if (node->hasExternalInputs() && !node->hasInternalInputs()) {
|
|
node->setLayer(0);
|
|
|
|
injectNode(node);
|
|
|
|
// nd4j_logger("A Node_%i mapped to layer_%i; Output: %i;\n", node->id(), node->getLayer(), node->output()->at(0));
|
|
|
|
return;
|
|
} else {
|
|
// in some cases we're able to put stuff immediately
|
|
if (node->hasInternalInputs() && !node->hasExternalInputs() && node->input()->size() == 1) {
|
|
|
|
bool automapAllowed = true;
|
|
for (int e = 0; e < node->input()->size(); e++) {
|
|
auto cInput = node->input()->at(e);
|
|
int cFirst = cInput.first;
|
|
if (_mapped->count(cFirst) == 0) {
|
|
automapAllowed = false;
|
|
break;
|
|
}
|
|
}
|
|
|
|
// we only can put single input nodes, whose outputs were not mapped yet
|
|
//if (_mapped->count(node->input()->at(0).first) == 1 && (node->output()->size() == 0 || _mapped->count(node->output()->at(0).first) == 0)) {
|
|
if (automapAllowed) {
|
|
auto parent = _mapped->at(node->input()->at(0).first);
|
|
int nLayer = parent->getLayer() + 1;
|
|
|
|
expandOnion(nLayer);
|
|
node->setLayer(nLayer);
|
|
injectNode(node);
|
|
|
|
if (node->output()->size() > 0) {
|
|
nd4j_logger("Node_%i mapped to layer_%i; Output: %i;\n", node->id(), node->getLayer(), node->output()->at(0));
|
|
} else {
|
|
nd4j_logger("Node_%i mapped to layer_%i; Output: none;\n", node->id(), node->getLayer());
|
|
}
|
|
|
|
return;
|
|
}
|
|
} /*else if (node->opType() == OpType_LOGIC && node->opNum() == 10) {
|
|
// Scopes are just being added. They won't be executed on their own anyway.
|
|
|
|
int nLayer = _onion->size();
|
|
|
|
expandOnion(nLayer);
|
|
node->setLayer(nLayer);
|
|
injectNode(node);
|
|
|
|
nd4j_logger("Node_%i mapped Scope to layer_%i; Output: %i;\n", node->id(), node->getLayer(), node->output()->at(0));
|
|
|
|
return;
|
|
}
|
|
*/
|
|
// otherwise we're putting it to unmapped space for further sorting
|
|
_unmapped.insert(pair);
|
|
_unmappedMap.emplace_back(pair.first);
|
|
nd4j_debug("adding: %i\n", pair.first);
|
|
}
|
|
}
|
|
|
|
Nd4jStatus Graph::buildGraph() {
|
|
if (_built.load()) {
|
|
prepareOutputs();
|
|
return ND4J_STATUS_OK;
|
|
}
|
|
|
|
typename MAP_IMPL<int, Node *>::iterator fit;
|
|
int cnts = 0;
|
|
for ( fit = _unmapped.begin(); fit != _unmapped.end(); fit++ ) {
|
|
int tK = fit->first;
|
|
int tF = _unmappedMap.at(cnts++);
|
|
}
|
|
|
|
int buildCnt = 0;
|
|
int buildLimit = _unmapped.size() * 2;
|
|
while (_unmapped.size() > 0) {
|
|
|
|
int sz = _unmapped.size();
|
|
int sf = _unmappedMap.size();
|
|
|
|
std::vector<int> queue;
|
|
|
|
// first pass for unmapped nodes, we try to build tale here
|
|
typename MAP_IMPL<int, Node *>::iterator it;
|
|
int cntf = 0;
|
|
nd4j_debug("-----------\n","");
|
|
for ( it = _unmapped.begin(); it != _unmapped.end(); it++ ) {
|
|
auto node = it->second;
|
|
int tK = it->first;
|
|
int tF = _unmappedMap.at(cntf++);
|
|
|
|
//nd4j_printf("tK: %i; tF: %i\n", tK, tF);
|
|
//for (int f = 0; f < sz; f++) {
|
|
// auto node = _unmapped.at(_unmappedMap.at(f));
|
|
|
|
|
|
// single-input node
|
|
if (node->input()->size() == 1) {
|
|
|
|
if (node->getName() == nullptr) {
|
|
nd4j_debug("Trying SI Node_%i\n", node->id());
|
|
} else {
|
|
nd4j_debug("Trying SI Node_%i:[%s]\n", node->id(), node->getName()->c_str());
|
|
}
|
|
|
|
int iNode = node->input()->at(0).first;
|
|
if (iNode < 0 || _variableSpace->hasExternalVariable(iNode)) {
|
|
// this is external variable, should we check, who's the last user of this variable?
|
|
int lastLayer = _onion->size();
|
|
expandOnion(lastLayer);
|
|
|
|
node->setLayer(lastLayer);
|
|
this->injectNode(node);
|
|
|
|
if (node->hasCustomOp()) {
|
|
ContextPrototype* block = nullptr;
|
|
|
|
if (!node->hasBlockAttached()) {
|
|
block = new ContextPrototype(node->getCustomOp()->getOpDescriptor(), node->id());
|
|
node->setContextPrototype(block);
|
|
} else
|
|
block = node->getContextPrototype();
|
|
|
|
|
|
if (!block->hasVariablesFilled()) {
|
|
|
|
for (int e = 0; e < node->input()->size(); e++) {
|
|
auto p = node->input()->at(e);
|
|
|
|
block->pickInput(p);
|
|
}
|
|
}
|
|
}
|
|
} else if (_mapped->count(iNode) > 0) {
|
|
int maxLayer = _mapped->at(iNode)->getLayer() + 1;
|
|
|
|
node->setLayer(maxLayer);
|
|
if (_onion->count(maxLayer) == 0)
|
|
expandOnion(maxLayer);
|
|
|
|
this->injectNode(node);
|
|
queue.emplace_back(node->id());
|
|
|
|
if (node->hasCustomOp()) {
|
|
ContextPrototype* block = nullptr;
|
|
|
|
if (!node->hasBlockAttached()) {
|
|
block = new ContextPrototype(node->getCustomOp()->getOpDescriptor(), node->id());
|
|
node->setContextPrototype(block);
|
|
} else
|
|
block = node->getContextPrototype();
|
|
|
|
|
|
if (!block->hasVariablesFilled()) {
|
|
|
|
for (uint32_t e = 0; e < node->input()->size(); e++) {
|
|
auto p = node->input()->at(e);
|
|
|
|
block->pickInput(p);
|
|
}
|
|
}
|
|
}
|
|
} else
|
|
continue;
|
|
|
|
//_unmapped.erase(node->id());
|
|
queue.emplace_back(node->id());
|
|
} else {
|
|
// multi-input node
|
|
if (node->getName() == nullptr) {
|
|
nd4j_debug("Trying MI Node_%i\n", node->id());
|
|
} else {
|
|
std::string np = *(node->getName());
|
|
nd4j_debug("Trying MI Node_%i:[%s]\n", node->id(), node->getName()->c_str());
|
|
}
|
|
|
|
int maxLayer = 0;
|
|
bool breaker = false;
|
|
for (unsigned int e = 0; e < node->input()->size(); e++) {
|
|
int nodeId = node->input()->at(e).first;
|
|
|
|
// if input node wasn't mapped yet - we'll have skip it in this round
|
|
if (_mapped->count(nodeId) == 1) {
|
|
auto iNode = _mapped->at(nodeId);
|
|
|
|
if (maxLayer < iNode->getLayer())
|
|
maxLayer = iNode->getLayer();
|
|
} else
|
|
if (node->opType() == OpType_LOGIC) {
|
|
// just allow it?
|
|
} else // checking if that's static variable
|
|
if (nodeId > 0 && !_variableSpace->hasExternalVariable(nodeId)) {
|
|
breaker = true;
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (breaker)
|
|
continue;
|
|
|
|
maxLayer++;
|
|
if (_onion->count(maxLayer) == 0)
|
|
expandOnion(maxLayer);
|
|
|
|
node->setLayer(maxLayer);
|
|
injectNode(node);
|
|
queue.emplace_back(node->id());
|
|
|
|
if (node->hasCustomOp()) {
|
|
ContextPrototype* block = nullptr;
|
|
|
|
if (!node->hasBlockAttached()) {
|
|
block = new ContextPrototype(node->getCustomOp()->getOpDescriptor(), node->id());
|
|
node->setContextPrototype(block);
|
|
} else
|
|
block = node->getContextPrototype();
|
|
|
|
if (!block->hasVariablesFilled()) {
|
|
|
|
for (uint32_t e = 0; e < node->input()->size(); e++) {
|
|
auto p = node->input()->at(e);
|
|
|
|
block->pickInput(p);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
for (auto &v: queue)
|
|
_unmapped.erase(v);
|
|
|
|
// second pass is mover, we'll be moving onion layers around here
|
|
buildCnt++;
|
|
if (buildCnt > buildLimit) {
|
|
nd4j_printf("Unable to build graph, probably unmapped nodes, or something: %i nodes left\n", _unmapped.size());
|
|
for (auto v: _unmapped) {
|
|
Node* node = v.second;
|
|
nd4j_printf("Unmapped node: [%i]\n", node->id());
|
|
}
|
|
|
|
throw std::runtime_error("Unable to build graph");
|
|
}
|
|
}
|
|
|
|
if (_unmapped.size() == 0)
|
|
_built.store(true);
|
|
|
|
prepareOutputs();
|
|
|
|
return sd::Status::OK();
|
|
}
|
|
|
|
void Graph::tagInplaceNodes() {
|
|
// just calling, in case it wasn't built before
|
|
if (!_built.load())
|
|
this->buildGraph();
|
|
|
|
bool buildRef = false;
|
|
|
|
// checking for non-refenenced nodes
|
|
for (auto v: *_nodes) {
|
|
// skipping unmapped nodes
|
|
if (_mapped->count(v) == 0)
|
|
continue;
|
|
|
|
Node* node = _mapped->at(v);
|
|
if (node->totalReferences() == 0) {
|
|
buildRef = true;
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (buildRef) {
|
|
for (auto v: *_nodes) {
|
|
// skipping unmapped nodes
|
|
if (_mapped->count(v) == 0)
|
|
continue;
|
|
|
|
Node* node = _mapped->at(v);
|
|
auto inputs = node->input();
|
|
for (auto &t: *inputs) {
|
|
if (_mapped->count(t.first) == 0)
|
|
continue;
|
|
|
|
Node* inode = _mapped->at(t.first);
|
|
inode->addReference(node->id());
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
for (auto v: *_nodes) {
|
|
// skipping unmapped nodes
|
|
if (_mapped->count(v) == 0)
|
|
continue;
|
|
|
|
Node* node = _mapped->at(v);
|
|
|
|
/**
|
|
* Node can be inplace if 2 requirements met:
|
|
* 1) current node allows in-place modification
|
|
* 2) source node has only 1 output
|
|
*/
|
|
|
|
// checking for first requirement first
|
|
if (node->getCustomOp() != nullptr)
|
|
if (node->getCustomOp()->getOpDescriptor()->allowsInplace()){
|
|
bool singleInput = true;
|
|
auto inputs = node->input();
|
|
for (auto &t: *inputs) {
|
|
if (_mapped->count(t.first) == 0)
|
|
continue;
|
|
|
|
Node* inode = _mapped->at(t.first);
|
|
|
|
int output_size = inode->output()->size();
|
|
|
|
// checking for second requirement: inputNode must not be used as input anywhere
|
|
if (inode->totalReferences() > 1) {
|
|
singleInput = false;
|
|
break;
|
|
}
|
|
}
|
|
|
|
node->markInplace(singleInput);
|
|
}
|
|
}
|
|
}
|
|
|
|
void Graph::prepareOutputs() {
|
|
// if we're dumping everything out there - we'll add external variables as well
|
|
if (_configuration->_outputMode == OutputMode_VARIABLE_SPACE) {
|
|
auto ext = _variableSpace->getExternalVariables();
|
|
nd4j_verbose("Number of external variables: %i\n", ext->size())
|
|
for (unsigned int e = 0; e < ext->size(); e++) {
|
|
pushToOutputOnce(ext->at(e)->id());
|
|
}
|
|
|
|
for (auto v: *_nodes) {
|
|
if (_mapped->count(v) == 0)
|
|
continue;
|
|
|
|
Node* node = _mapped->at(v);
|
|
|
|
if (std::find(_output.begin(), _output.end(), node->id()) == _output.end())
|
|
_output.emplace_back(node->id());
|
|
}
|
|
|
|
} else if (_configuration->_outputMode == OutputMode_IMPLICIT) {
|
|
// we're adding final nodes of the graph. those, not used as input anywhere
|
|
nd4j_debug("Paring nodes... \n", "");
|
|
|
|
if (Environment::getInstance()->isDebugAndVerbose()) {
|
|
// nd4j_printv("current _output", _output);
|
|
}
|
|
//_output.clear();
|
|
|
|
for (auto v: *_nodes) {
|
|
// we should check for scopes, and other possible non-mapped stuff
|
|
if (_mapped->count(v) == 0)
|
|
continue;
|
|
|
|
Node* node = _mapped->at(v);
|
|
if (node->name() != nullptr) {
|
|
nd4j_debug("Node %i; Name: [%s]\n", v, node->name()->c_str());
|
|
} else {
|
|
nd4j_debug("Node %i\n", v);
|
|
}
|
|
|
|
// updating outputs now
|
|
for (int e = 0; e < node->input()->size(); e++) {
|
|
auto inP = node->input()->at(e);
|
|
|
|
// input can be variable, or node. we only care about nodes
|
|
if (_mapped->count(inP.first) > 0) {
|
|
_mapped->at(inP.first)->pickOutputOnce(v);
|
|
}
|
|
}
|
|
}
|
|
// at this point all nodes have filled inputs/outputs, so we know nodes that do not have any connected outputs
|
|
|
|
for (auto v: *_nodes) {
|
|
// we should check for scopes, and other possible non-mapped stuff
|
|
if (_mapped->count(v) == 0)
|
|
continue;
|
|
|
|
Node* node = _mapped->at(v);
|
|
|
|
if (!node->hasInternalOutputs()) {
|
|
if (node->name() != nullptr) {
|
|
nd4j_debug("Output node found: [%i:<%s>]\n", v, node->name()->c_str());
|
|
} else {
|
|
nd4j_debug("Output node found: [%i]\n", v);
|
|
}
|
|
|
|
// FIXME: we don't really need search here.
|
|
|
|
if (std::find(_output.begin(), _output.end(), node->id()) == _output.end())
|
|
_output.emplace_back(node->id());
|
|
} else if (Environment::getInstance()->isDebugAndVerbose()) {
|
|
nd4j_debug("Node [%i:<%s>] has %i outputs announced:\n", v, node->name()->c_str(), node->output()->size());
|
|
printf("{");
|
|
for (auto s : *node->output()) {
|
|
printf("[%i:%i], ", s.first, s.second);
|
|
}
|
|
printf("}\n");
|
|
fflush(stdout);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
Graph::Graph(const FlatGraph *flatGraph, VariableSpace *variableSpace) {
|
|
this->_onion = new MAP_IMPL<int, std::vector<Node *> *>();
|
|
this->_mapped = new MAP_IMPL<int, Node *> ();
|
|
this->_nodes = new std::vector<int>();
|
|
this->_variableSpace = variableSpace == nullptr ? new VariableSpace() : variableSpace;
|
|
bool trusted = flatGraph != nullptr;
|
|
|
|
// add 0 layer
|
|
this->expandOnion(0);
|
|
|
|
// if there was no exec configuration in flatgraph - create default one
|
|
if (flatGraph != nullptr && flatGraph->configuration() != nullptr) {
|
|
_configuration = new ExecutorConfiguration(flatGraph->configuration());
|
|
} else
|
|
_configuration = new ExecutorConfiguration();
|
|
|
|
// if memory reqs were set - initialize workspace
|
|
if (_configuration->_footprintForward > 0) {
|
|
sd::memory::Workspace *workspace = this->_variableSpace->launchContext()->getWorkspace();
|
|
workspace->expandBy(_configuration->_footprintForward);
|
|
}
|
|
|
|
// parsing variables here
|
|
if (flatGraph != nullptr && flatGraph->variables() != nullptr && flatGraph->variables()->size() > 0) {
|
|
for (unsigned int e = 0; e < flatGraph->variables()->size(); e++) {
|
|
auto flatVar = flatGraph->variables()->Get(e);
|
|
|
|
auto var = new Variable(flatVar);
|
|
std::pair<int, int> pair(flatVar->id()->first(), flatVar->id()->second());
|
|
_variableSpace->putVariable(pair, var);
|
|
|
|
// if that's VariableSpace mode - we're pushing it to _output
|
|
if (_configuration->_outputMode == OutputMode_VARIABLE_SPACE)
|
|
pushToOutputOnce(var->id());
|
|
|
|
}
|
|
}
|
|
|
|
// at this point we expect all variables are already registered
|
|
// we're saving outputs only if explicit mode is set
|
|
if (_configuration->_outputMode == OutputMode_EXPLICIT || _configuration->_outputMode == OutputMode_EXPLICIT_AND_IMPLICIT) {
|
|
if (flatGraph != nullptr && flatGraph->outputs() != nullptr) {
|
|
for (unsigned int e = 0; e < flatGraph->outputs()->size(); e++) {
|
|
auto out = flatGraph->outputs()->Get(e);
|
|
std::pair<int, int> vp(out->first(), out->second());
|
|
if (!_variableSpace->hasVariable(vp)) {
|
|
nd4j_verbose("Non-existent variable requested: %i\n", out);
|
|
throw std::runtime_error("Non-existent variable requested");
|
|
}
|
|
|
|
// TODO: fix this .first
|
|
pushToOutputOnce(vp.first);
|
|
}
|
|
}
|
|
}
|
|
|
|
// rolling through nodes
|
|
if (flatGraph != nullptr && flatGraph->nodes() != nullptr && flatGraph->nodes()->size() > 0) {
|
|
for (unsigned int e = 0; e < flatGraph->nodes()->size(); e++) {
|
|
auto node = flatGraph->nodes()->Get(e);
|
|
|
|
if (node->output() == nullptr || node->output()->size() == 0) {
|
|
nd4j_verbose("Orphan node detected: %i; AutoOutput to be considered\n", node->id());
|
|
}
|
|
|
|
nd4j_debug("Node name: [%s]\n", node->name()->c_str());
|
|
auto nnode = new Node(node);
|
|
/*
|
|
expandOnion(e);
|
|
nnode->setLayer(e);
|
|
this->addNode(nnode);
|
|
injectNode(nnode);
|
|
_unmapped.erase(nnode->id());
|
|
*/
|
|
// just filling list of nodes
|
|
_unmapped[nnode->id()] = nnode;
|
|
}
|
|
|
|
|
|
this->toposortNodes();
|
|
|
|
_built = true;
|
|
}
|
|
|
|
/**
|
|
* we allow in-place execution optimizations ONLY if 2 requirements met:
|
|
* 1) this is FeedForward pass ONLY
|
|
* 2) OPTIMIZED mode is set, so no intermediate results are going to be used
|
|
*/
|
|
if (_configuration->_direction == Direction_FORWARD_ONLY && _configuration->_outputMode == OutputMode_OPTIMIZED)
|
|
this->tagInplaceNodes();
|
|
}
|
|
|
|
|
|
void Graph::toposortNodes() {
|
|
int attempts = 0;
|
|
|
|
// in worst possible case number of rolls equals to the number of nodes
|
|
int limit = _unmapped.size() + 1;
|
|
|
|
std::vector<int> tbd;
|
|
while (!_unmapped.empty() && attempts < limit) {
|
|
for (auto np:_unmapped) {
|
|
auto id = np.first;
|
|
tbd.emplace_back(id);
|
|
}
|
|
|
|
// rolling through unmapped nodes
|
|
for (auto np:tbd) {
|
|
auto id = np;
|
|
auto node = _unmapped[id];
|
|
|
|
// this variables contains the layer of maximal dependency
|
|
int maxDependencyLayer = -1;
|
|
|
|
// simple flag
|
|
bool canMap = true;
|
|
|
|
// looping through inputs, to check if they were already mapped
|
|
auto inputs = node->input();
|
|
for (auto in:*inputs) {
|
|
// only 2 options here, in either refers to the node, or to the variable
|
|
// however, node can be already mapped, or not yet. this makes it 3 options :)
|
|
|
|
if (hasNode(in.first)) { // node was mapped
|
|
auto dependency = nodeById(in.first);
|
|
auto layer = dependency->getLayer();
|
|
if (layer > maxDependencyLayer)
|
|
maxDependencyLayer = layer;
|
|
|
|
} else if (_unmapped.count(in.first) > 0) { // node is unmapped yet
|
|
// can't map this node yet, due to non-resolved dependencies
|
|
canMap = false;
|
|
} else if (_variableSpace->hasVariable(in.first)){ // that's probably variable. if not - we'll throw exception later
|
|
// do nothing, maxDepLayer is -1 here, because it's a variable input
|
|
} else {
|
|
throw graph::unresolved_input_exception::build("Unknown input specified", id, in);
|
|
}
|
|
}
|
|
|
|
if (canMap) {
|
|
auto layer = maxDependencyLayer + 1;
|
|
this->expandOnion(layer);
|
|
node->setLayer(layer);
|
|
this->addNode(node);
|
|
this->injectNode(node);
|
|
_unmapped.erase(id);
|
|
}
|
|
}
|
|
|
|
// if something was successfully mapped - remove it from unmapped entries
|
|
if (!tbd.empty())
|
|
tbd.clear();
|
|
|
|
attempts++;
|
|
}
|
|
|
|
if (!_unmapped.empty())
|
|
throw graph_exception("Graph wasn't toposorted", 0);
|
|
|
|
_built = true;
|
|
}
|
|
|
|
|
|
/**
|
|
* This method returns number of root nodes in this graph
|
|
* @return
|
|
*/
|
|
int Graph::rootNodes() {
|
|
return this->_onion->at(0)->size();
|
|
}
|
|
|
|
/**
|
|
* This method returns total number of nodes in this graph
|
|
* @return
|
|
*/
|
|
int Graph::totalNodes() {
|
|
if (_built.load() != true)
|
|
buildGraph();
|
|
|
|
return _mapped->size();
|
|
}
|
|
|
|
Nd4jStatus Graph::validate() {
|
|
if (!_built) {
|
|
_mutexPreprocessing.lock();
|
|
if (!_built) {
|
|
this->buildGraph();
|
|
}
|
|
_mutexPreprocessing.unlock();
|
|
}
|
|
|
|
if (_built.load() != true)
|
|
return ND4J_STATUS_BAD_GRAPH;
|
|
|
|
return ND4J_STATUS_OK;
|
|
};
|
|
|
|
void Graph::printOutNode(Node* node) {
|
|
nd4j_printf("%i. ", node->id());
|
|
switch(node->opType()) {
|
|
case OpType_CUSTOM: {
|
|
printf("%s; ", node->getCustomOp()->getOpName()->c_str());
|
|
}
|
|
break;
|
|
case OpType_LOGIC: {
|
|
printf("%s; ", EnumUtils::_LogicOpToString(node->opNum()));
|
|
}
|
|
break;
|
|
default: {
|
|
printf("%s:{%i}; ", EnumUtils::_OpTypeToString(node->opType()), (int) node->opNum());
|
|
}
|
|
}
|
|
|
|
nd4j_printf("Inputs: [", "");
|
|
//auto block = node->getBlock();
|
|
for (int e = 0; e < node->input()->size(); e++) {
|
|
|
|
auto in = node->input()->at(e);
|
|
printf("{%i:%i}", in.first, in.second);
|
|
if (e < node->input()->size() - 1)
|
|
nd4j_printf(", ", "");
|
|
}
|
|
|
|
if (node->opType() == OpType_CUSTOM) {
|
|
auto ctx = node->protoContext();
|
|
if (ctx->getIArguments()->size() > 0) {
|
|
printf("]; iArgs: [");
|
|
|
|
for (int e = 0; e < ctx->getIArguments()->size(); e++) {
|
|
printf("%i", ctx->getIArguments()->at(e));
|
|
if (e < ctx->getIArguments()->size() - 1)
|
|
nd4j_printf(", ", "");
|
|
}
|
|
}
|
|
}
|
|
|
|
nd4j_printf("]; \n", "");
|
|
|
|
|
|
// printf("\n");
|
|
fflush(stdout);
|
|
}
|
|
|
|
void Graph::printOut() {
|
|
buildGraph();
|
|
|
|
// print variables first
|
|
if (_variableSpace->totalEntries() > 0) {
|
|
nd4j_printf("\nPrinting out Variables...\n", "");
|
|
auto vars = _variableSpace->getVariables();
|
|
|
|
for (Variable* v: vars) {
|
|
if (v->hasNDArray()) {
|
|
auto shape = ShapeUtils::shapeAsString(v->getNDArray());
|
|
auto values = v->getNDArray()->asString(16);
|
|
auto dtype = DataTypeUtils::asString(v->getNDArray()->dataType());
|
|
|
|
if (v->getName() != nullptr && !v->getName()->empty()) {
|
|
nd4j_printf("<%s> <%i:%i> dtype: %s; shape: %s; values: %s;\n", v->getName()->c_str(), v->id(), v->index(), dtype.c_str(), shape.c_str(), values.c_str());
|
|
} else {
|
|
nd4j_printf("<%i:%i> dtype: %s; shape: %s; values: %s;\n", v->id(), v->index(), dtype.c_str(), shape.c_str(), values.c_str());
|
|
}
|
|
} else if (v->hasNDArrayList()) {
|
|
// TODO: add better NDArrayList printout
|
|
nd4j_printf("<%i:%i> holds ArrayList", v->id(), v->index());
|
|
}
|
|
}
|
|
}
|
|
|
|
if (_onion->size() > 0)
|
|
nd4j_printf("\nPrinting out Graph...\n", "");
|
|
|
|
int opCnt = 0;
|
|
for (int l = 0; l < _onion->size(); l++) {
|
|
int layerSize = _onion->count(l) == 1 ? _onion->at(l)->size() : 0;
|
|
|
|
for (int n = 0; n < layerSize; n++) {
|
|
Node* node = _onion->at(l)->at(n);
|
|
|
|
// we're skipping Scopes here
|
|
if (node->opType() == OpType_LOGIC && node->opNum() == logic::Scope)
|
|
continue;
|
|
|
|
printOutNode(node);
|
|
}
|
|
}
|
|
|
|
|
|
if (_scopes.size() > 0)
|
|
nd4j_printf("\nPrinting out Scopes...\n","");
|
|
|
|
for (int s = 0; s < _scopes.size(); s++) {
|
|
Scope* scope = _scopes.at(s);
|
|
nd4j_printf("Scope %i:<%s>:\n", scope->id(), scope->name()->c_str());
|
|
|
|
for (int n = 0; n < scope->nodes()->size(); n++) {
|
|
Node* node = scope->nodes()->at(n);
|
|
printOutNode(node);
|
|
}
|
|
}
|
|
|
|
fflush(stdout);
|
|
}
|
|
|
|
Nd4jStatus Graph::validateNode(Node *node) {
|
|
// TODO: to be implemented
|
|
return ND4J_STATUS_OK;
|
|
}
|
|
|
|
std::vector<sd::ops::OpDescriptor> Graph::getOperations() {
|
|
buildGraph();
|
|
// nd4j_printf("\nRetrieving ops from the Graph and collect them...\n", "");
|
|
std::vector<sd::ops::OpDescriptor> res;
|
|
|
|
int opCnt = 0;
|
|
for (int l = 0; l < _onion->size(); l++) {
|
|
int layerSize = _onion->count(l) == 1 ? _onion->at(l)->size() : 0;
|
|
|
|
for (int n = 0; n < layerSize; n++) {
|
|
Node* node = _onion->at(l)->at(n);
|
|
if (node->name() == nullptr) continue;
|
|
sd::ops::OpDescriptor* pOpDescriptor = nullptr;
|
|
std::string opNameStr; //node->name();
|
|
int numInputs = 0;
|
|
int numOutputs = 0;
|
|
|
|
switch(node->opType()) {
|
|
case OpType_CUSTOM: {
|
|
pOpDescriptor = node->getCustomOp()->getOpDescriptor();
|
|
}
|
|
break;
|
|
case OpType_LOGIC: {
|
|
opNameStr = std::string(EnumUtils::_LogicOpToString(node->opNum()));
|
|
}
|
|
break;
|
|
default: {
|
|
opNameStr = std::string(EnumUtils::_OpTypeToString(node->opType()))+"{" + ops::OpRegistrator::getInstance()->local_to_string<int>((int) node->opNum()) + "}";
|
|
}
|
|
}
|
|
|
|
if (node->input())
|
|
numInputs = node->input()->size();
|
|
|
|
if (node->output())
|
|
numOutputs = node->output()->size();
|
|
bool inplace = node->isInplace();
|
|
|
|
//OpDescriptor opDescriptor(numInputs, numOutputs, opNameStr, inplace);
|
|
|
|
// we're skipping Scopes here
|
|
if (node->opType() == OpType_LOGIC && node->opNum() == logic::Scope)
|
|
continue;
|
|
if (pOpDescriptor)
|
|
res.emplace_back(*pOpDescriptor);
|
|
else
|
|
res.emplace_back(sd::ops::OpDescriptor(numInputs, numOutputs, opNameStr, inplace));
|
|
}
|
|
}
|
|
|
|
|
|
// nd4j_printf("\nCollecting out Scopes...\n","");
|
|
for (int s = 0; s < _scopes.size(); s++) {
|
|
Scope* scope = _scopes.at(s);
|
|
// nd4j_printf("Scope %i:<%s>:\n", scope->id(), scope->name()->c_str());
|
|
|
|
for (int n = 0; n < scope->nodes()->size(); n++) {
|
|
Node* node = scope->nodes()->at(n);
|
|
//printOutNode(node);
|
|
if (node->name() == nullptr) continue;
|
|
std::string opNameStr; //node->name();
|
|
sd::ops::OpDescriptor* pOpDescriptor = nullptr;
|
|
int numInputs = 0;
|
|
int numOutputs = 0;
|
|
|
|
switch(node->opType()) {
|
|
case OpType_CUSTOM: {
|
|
pOpDescriptor = node->getCustomOp()->getOpDescriptor();
|
|
}
|
|
break;
|
|
case OpType_LOGIC: {
|
|
opNameStr = std::string(EnumUtils::_LogicOpToString(node->opNum()));
|
|
}
|
|
break;
|
|
default: {
|
|
opNameStr = std::string(EnumUtils::_OpTypeToString(node->opType()))+"{" + ops::OpRegistrator::getInstance()->local_to_string<int>((int) node->opNum()) + "}";
|
|
}
|
|
}
|
|
|
|
if (node->input())
|
|
numInputs = node->input()->size();
|
|
|
|
if (node->output())
|
|
numOutputs = node->output()->size();
|
|
bool inplace = node->isInplace();
|
|
|
|
if (pOpDescriptor != nullptr)
|
|
res.emplace_back(*pOpDescriptor);
|
|
else
|
|
res.emplace_back(sd::ops::OpDescriptor(numInputs, numOutputs, opNameStr, inplace));
|
|
}
|
|
}
|
|
|
|
return res;
|
|
}
|
|
|
|
Scope *Graph::scopeById(int id) {
|
|
if (_mappedScopes.count(id) == 0) {
|
|
nd4j_printf("Requested Scope [%i] doesn't exist\n", id);
|
|
throw std::runtime_error("Non-existent Scope was requested");
|
|
}
|
|
|
|
return _mappedScopes.at(id);
|
|
}
|
|
|
|
void Graph::forgetVariableSpace() {
|
|
_variableSpace = nullptr;
|
|
}
|
|
|
|
void Graph::replaceState(VariableSpace *state, ExecutorConfiguration *configuration) {
|
|
delete _variableSpace;
|
|
delete _configuration;
|
|
|
|
_variableSpace = state;
|
|
_configuration = configuration;
|
|
}
|
|
|
|
Graph* Graph::cloneWithProxy() {
|
|
auto clone = new Graph();
|
|
|
|
clone->replaceState(new VariableProxy(this->_variableSpace), this->_configuration->clone());
|
|
|
|
// transfer nodes
|
|
for (int e = 0; e < _nodes->size(); e++)
|
|
clone->_nodes->emplace_back(_nodes->at(e));
|
|
|
|
// transfer outputs
|
|
for (auto v: _output)
|
|
clone->_output.emplace_back(v);
|
|
|
|
// transfer autos
|
|
for (auto v: _autos)
|
|
clone->_autos.emplace_back(v);
|
|
|
|
// transfer scopes
|
|
for (auto &v: _mappedScopes) {
|
|
auto scp = v.second->clone();
|
|
clone->_mappedScopes[v.first] = scp;
|
|
clone->_scopes.emplace_back(scp);
|
|
}
|
|
|
|
// transfer mapped nodes
|
|
for (auto &v: *_onion) {
|
|
auto vec = clone->_onion->count(v.first) > 0 ? clone->_onion->at(v.first) : new std::vector<Node*>();
|
|
|
|
|
|
// cloning actual nodes
|
|
auto ovec = (*_onion)[v.first];
|
|
for (auto x: *(ovec)) {
|
|
auto n = x->clone();
|
|
vec->emplace_back(n);
|
|
_handles.emplace_back(n);
|
|
(*clone->_mapped)[n->id()] = n;
|
|
}
|
|
|
|
if (clone->_onion->count(v.first) < 1)
|
|
(*clone->_onion)[v.first] = vec;
|
|
}
|
|
|
|
// transfer mapped nodes
|
|
for (auto &v: _unmapped)
|
|
clone->_unmapped[v.first] = v.second->clone();
|
|
|
|
clone->_built.store(_built.load());
|
|
|
|
return clone;
|
|
}
|
|
|
|
Graph* Graph::clone() {
|
|
auto clone = new Graph();
|
|
|
|
clone->replaceState(this->_variableSpace->clone(), this->_configuration->clone());
|
|
|
|
// transfer nodes
|
|
for (int e = 0; e < _nodes->size(); e++)
|
|
clone->_nodes->emplace_back(_nodes->at(e));
|
|
|
|
// transfer outputs
|
|
for (auto v: _output)
|
|
clone->_output.emplace_back(v);
|
|
|
|
// transfer autos
|
|
for (auto v: _autos)
|
|
clone->_autos.emplace_back(v);
|
|
|
|
// transfer scopes
|
|
for (auto &v: _mappedScopes) {
|
|
auto scp = v.second->clone();
|
|
clone->_mappedScopes[v.first] = scp;
|
|
clone->_scopes.emplace_back(scp);
|
|
}
|
|
|
|
// transfer mapped nodes
|
|
for (auto &v: *_onion) {
|
|
auto vec = clone->_onion->count(v.first) > 0 ? clone->_onion->at(v.first) : new std::vector<Node*>();
|
|
|
|
|
|
// cloning actual nodes
|
|
auto ovec = (*_onion)[v.first];
|
|
for (auto x: *(ovec)) {
|
|
auto n = x->clone();
|
|
vec->emplace_back(n);
|
|
_handles.emplace_back(n);
|
|
(*clone->_mapped)[n->id()] = n;
|
|
}
|
|
|
|
if (clone->_onion->count(v.first) < 1)
|
|
(*clone->_onion)[v.first] = vec;
|
|
}
|
|
|
|
// transfer mapped nodes
|
|
for (auto &v: _unmapped)
|
|
clone->_unmapped[v.first] = v.second->clone();
|
|
|
|
clone->_built.store(_built.load());
|
|
|
|
return clone;
|
|
}
|
|
|
|
bool Graph::hasNode(int id) {
|
|
return _mapped->count(id) > 0;
|
|
}
|
|
|
|
Node* Graph::nodeById(int id) {
|
|
return _mapped->at(id);
|
|
}
|
|
|
|
bool Graph::hasScope(int id) {
|
|
return _mappedScopes.count(id) > 0;
|
|
}
|
|
|
|
Nd4jLong Graph::hashCode() {
|
|
if (!_built.load())
|
|
this->buildGraph();
|
|
|
|
Nd4jLong hash = 0L;
|
|
std::string localStamp;
|
|
/**
|
|
* Plan is:
|
|
* 1) get shapes of existing variables
|
|
* 2) get hash codes of individual ops
|
|
* 3) optionally: get node names, if they are defined
|
|
* 4) use long hash on that
|
|
*/
|
|
int cnt = 0;
|
|
/*
|
|
if (_variableSpace != nullptr) {
|
|
// loop over existing variables
|
|
for (auto v: *(_variableSpace->handles())) {
|
|
if (v->hasNDArray()) {
|
|
NDArray *arr = v->getNDArray();
|
|
if (arr != nullptr && arr->nonNull()) {
|
|
auto shape = arr->getShapeAsVector();
|
|
auto string = ShapeUtils::shapeAsString(shape);
|
|
localStamp += string;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
*/
|
|
|
|
// loop over nodes in graph
|
|
for (auto &v: *_mapped) {
|
|
Node *node = v.second;
|
|
|
|
// optional part: node names
|
|
if (!node->name()->empty()) {
|
|
localStamp += *(node->name());
|
|
}
|
|
}
|
|
|
|
|
|
hash = ops::HashHelper::getInstance()->getLongHash(localStamp);
|
|
|
|
nd4j_debug("Graph hash: %lld\n", hash);
|
|
|
|
return hash;
|
|
}
|
|
}
|
|
}
|
|
|