Publishing 2019 R1 content
[platform/upstream/dldt.git] / inference-engine / src / inference_engine / graph_transformer.cpp
index af0dd63..8c40f08 100644 (file)
-// Copyright (C) 2018 Intel Corporation
+// Copyright (C) 2018-2019 Intel Corporation
 // SPDX-License-Identifier: Apache-2.0
 //
 
-#include <assert.h>
+#include <cpp/ie_cnn_network.h>
+#include <details/ie_cnn_network_tools.h>
+#include <details/caseless.hpp>
 #include "graph_transformer.h"
+#include "cnn_network_impl.hpp"
+#include "blob_factory.hpp"
+#include "graph_tools.hpp"
+#include <vector>
+#include <string>
+#include <iterator>
+#include <map>
+#include <memory>
+#include <shape_infer/const_infer/ie_const_infer_holder.hpp>
 
 namespace InferenceEngine {
 
-void replaceLayerWithNewLayer(ICNNNetwork &network, const CNNLayerPtr &layer, const CNNLayerPtr &newLayer) {
-    assert(layer->name == newLayer->name);
+std::vector<std::string>
+ConstTransformer::foldConstSubgraphsInternal(const std::map<std::string, bool>& constLayers, const BlobMap& constData,
+                                               const std::vector<CNNLayerPtr>& sortedLayers) {
+    std::vector<std::string> remainingConstLayers;
+    for (const auto& layer : sortedLayers) {
+        if (constLayers.find(layer->name) != constLayers.end()) {
+            // const layer doesn't need parent connections -> erase them
+            for (const auto& insData : layer->insData) {
+                auto& inputTo = insData.lock()->getInputTo();
+                inputTo.erase(layer->name);
+                // Notr: to resolve corner case above layers can be marked as const with const data, just to be removed properly..
+                // and maybe this logic wouldn't be needed
+                if (inputTo.empty()) {
+                    auto creator = insData.lock()->creatorLayer.lock();
+                    auto it = std::find(creator->outData.begin(), creator->outData.end(), insData.lock());
+                    if (it != creator->outData.end()) {
+                        network->removeData((*it)->name);
+                        creator->outData.erase(it);
+                    }
+                }
+            }
+            layer->insData.clear();
 
-    // Redirect srd data
-    for (auto& src : layer->insData) {
-        src.lock()->getInputTo()[layer->name] = newLayer;
+            if (constLayers.at(layer->name)) {
+                for (const auto& outData : layer->outData) {
+                    for (const auto& inputTo : outData->getInputTo()) {
+                        CNNLayerPtr inputToLayer;
+                        std::string inputToName;
+                        std::tie(inputToName, inputToLayer) = inputTo;
+                        auto& insData = inputToLayer->insData;
+                        auto insDataIt = std::find_if(insData.begin(), insData.end(),
+                                                      [&outData](const DataWeakPtr& current) {
+                                                          return current.lock()->name == outData->name;
+                                                      });
+                        // remove connection with const data, because for const child it's not needed, for dynamic - new one will be created
+                        if (insDataIt != insData.end()) {
+                            insDataIt = inputToLayer->insData.erase(insDataIt);
+                        }
+                    }
+                    network->removeData(outData->name);
+                }
+                network->removeLayer(layer->name);
+            } else {
+                // if only one output data is not const - do nothing, otherwise - run procedure below
+                // note: multiple const output data requires multiple layers with blob["custom"] to keep const data
+                bool keepConstData = layer->outData.size() == 1;
+                if (keepConstData) {
+                    auto outData = layer->outData[0];
+                    for (const auto& inputTo : outData->getInputTo()) {
+                        if (constLayers.find(inputTo.first) != constLayers.end()) {
+                            keepConstData = false;
+                        }
+                    }
+                }
+                if (keepConstData) {
+                    if (!constLayers.at(layer->name)) {
+                        auto outData = layer->outData[0];
+                        if (layer->blobs.find("custom") == layer->blobs.end()) {
+                            // if there's no const data - set it
+                            const auto it = constData.find(outData->name);
+                            if (it != constData.end()) {
+                                layer->blobs["custom"] = it->second;
+                            }
+                        }
+                        if (layer->type != "Const") {
+                            // layer was calculated during the Const Propagation, need to hide its semantic (type, params)
+                            LayerParams layerParams{layer->name + "__" + outData->name + "__Const", "Const",
+                                                    layer->precision};
+                            auto newLayer = std::make_shared<CNNLayer>(layerParams);
+                            for (const auto& data : layer->outData) {
+                                data->creatorLayer = newLayer;
+                            }
+                            newLayer->outData = layer->outData;
+                            newLayer->blobs["custom"] = layer->blobs["custom"];
+                            network->removeLayer(layer->name);
+                            network->addLayer(newLayer);
+                            remainingConstLayers.push_back(newLayer->name);
+                        } else {
+                            // Layer with `Const` type should be also considered on trimming shape inputs
+                            remainingConstLayers.push_back(layer->name);
+                        }
+                    }
+                } else {
+                    for (const auto& outData : layer->outData) {
+                        for (const auto& inputTo : outData->getInputTo()) {
+                            CNNLayerPtr inputToLayer;
+                            std::string inputToName;
+                            std::tie(inputToName, inputToLayer) = inputTo;
+                            auto& insData = inputToLayer->insData;
+                            auto insDataIt = std::find_if(insData.begin(), insData.end(),
+                                                          [&outData](const DataWeakPtr& current) {
+                                                              return current.lock()->name == outData->name;
+                                                          });
+                            // remove connection with const data, because for const child it's not needed, for dynamic - new one will be created
+                            if (insDataIt != insData.end()) {
+                                insDataIt = inputToLayer->insData.erase(insDataIt);
+                            }
+                            if (constLayers.find(inputToName) == constLayers.end()) {
+                                // next layer is not const, need to attach const data to it via blobs["custom"] of new Const layer
+                                LayerParams layerParams{layer->name + "__" + outData->name + "__Const", "Const",
+                                                        layer->precision};
+                                auto newLayer = std::make_shared<CNNLayer>(layerParams);
+                                remainingConstLayers.push_back(newLayer->name);
+                                const auto it = constData.find(outData->name);
+                                if (it != constData.end()) {
+                                    newLayer->blobs["custom"] = it->second;
+                                }
+                                auto newData = std::make_shared<Data>(outData->name + "__" + inputToName,
+                                                                      outData->getTensorDesc());
+                                newData->creatorLayer = newLayer;
+                                newData->inputTo[inputToName] = inputToLayer;
+                                newLayer->outData = {newData};
+                                network->addLayer(newLayer);
+                                network->getData(newData->name) = newData;
+                                inputToLayer->insData.insert(insDataIt, newData);
+                            }
+                        }
+                    }
+                    for (const auto& data : layer->outData) {
+                        network->removeData(data->name);
+                    }
+                    network->removeLayer(layer->name);
+                }
+            }
+        }
     }
-    newLayer->insData = layer->insData;
+    return remainingConstLayers;
+}
+
+const std::map<std::string, bool> ConstTransformer::getConstLayers(const std::vector<CNNLayerPtr>& sortedLayers) {
+    std::map<std::string, bool> mapConstLayers;
+    // collect all const layers, which inputs are const layers.
+    for (const auto& layer : sortedLayers) {
+        // Layers with "Shape" and "Const" type are Const by definition
+        if (layer->type == "Shape" || layer->type == "Const") {
+            mapConstLayers[layer->name] = false;
+        } else {
+            bool isAllInputsConst = true;
+            for (auto const& data : layer->insData) {
+                auto creatorName = data.lock()->creatorLayer.lock()->name;
+                if (mapConstLayers.find(creatorName) == mapConstLayers.end()) {
+                    isAllInputsConst = false;
+                }
+            }
+            if (isAllInputsConst && !layer->insData.empty()) mapConstLayers[layer->name] = false;
+        }
+    }
+    // Add mark for const layers, if it's used for shape taking layers as second input
+    // true - is used and can be deleted from graph, as no influence on data, false - opposite
+    std::map<std::string, bool> mapVisitedLayers = mapConstLayers;
+    for (auto rit = sortedLayers.rbegin(); rit != sortedLayers.rend(); rit++) {
+        auto currentLayer = (*rit);
+        std::string currentLayerName = currentLayer->name;
+        bool isCurrentConst = mapConstLayers.find(currentLayerName) != mapConstLayers.end();
+        for (int i = 0; i < currentLayer->insData.size(); i++) {
+            std::string creatorName;
+            if (currentLayer->insData[i].lock()) {
+                auto creator = currentLayer->insData[i].lock()->creatorLayer.lock();
+                if (creator) {
+                    creatorName = creator->name;
+                }
+            }
+            bool isCreatorConst = mapConstLayers.find(creatorName) != mapConstLayers.end();
+            if (isCreatorConst) {
+                // mark second const input of shape taking layers (Reshape, Interp..), if they wasn't visited before
+                if ((i == 1) && (shapeTaking.find(currentLayer->type)) != shapeTaking.end()) {
+                    if (!mapConstLayers[creatorName]) {
+                        if (!mapVisitedLayers.at(creatorName)) {
+                            mapConstLayers[creatorName] = true;
+                        }
+                    }
+                } else {
+                    if (isCurrentConst) {
+                        if (mapConstLayers.at(currentLayerName)) {
+                            if (!mapConstLayers[creatorName]) {
+                                if (!mapVisitedLayers.at(creatorName)) {
+                                    mapConstLayers[creatorName] = true;
+                                }
+                            }
+                        } else {
+                            mapConstLayers[creatorName] = false;
+                        }
+                    } else {
+                        mapConstLayers[creatorName] = false;
+                    }
+                }
+            }
+            mapVisitedLayers[creatorName] = true;
+        }
+        mapVisitedLayers[currentLayerName] = true;
+    }
+    return mapConstLayers;
+}
+
+const BlobMap ConstTransformer::getConstData(const std::map<std::string, bool>& constLayers, const std::vector<CNNLayerPtr>& sortedLayers) {
+    ShapeInfer::ConstInferHolder holder;
+    BlobMap constData;
+    auto getInputBlobs = [&constData](const std::vector<DataWeakPtr>& insData,
+                                      bool isForShape) -> std::vector<Blob::CPtr> {
+        std::vector<Blob::CPtr> inputBlobs;
+        // special case of Const layers: no inputs, no input blobs
+        if (insData.empty()) {
+            return {};
+        }
+        for (const auto& data : insData) {
+            std::string dataName = data.lock()->name;
+            if (constData.find(dataName) != constData.end()) {
+                // get blobs, inferred before
+                inputBlobs.push_back(constData.at(dataName));
+            } else {
+                // special case of Shape layer: no input data, but blob contains info about dimensions, layout and etc...
+                auto blob = make_blob_with_precision(data.lock()->getTensorDesc());
+                inputBlobs.push_back(blob);
+            }
+        }
+        return inputBlobs;
+    };
+
+    auto getOutputBlobs = [](const std::vector<DataPtr>& outData) -> std::vector<Blob::Ptr> {
+        std::vector<Blob::Ptr> outputBlobs;
+        for (const auto& data : outData) {
+            auto blob = make_blob_with_precision(data->getTensorDesc());
+            blob->allocate();
+            outputBlobs.push_back(blob);
+        }
+        return outputBlobs;
+    };
 
-    // Redirect dst data
-    for (auto& dst : layer->outData) {
-        dst->creatorLayer = newLayer;
+    for (const auto& layer : sortedLayers) {
+        if (constLayers.find(layer->name) != constLayers.end()) {
+            std::string layerName = layer->name;
+            bool isForShape = constLayers.at(layerName);
+            CNNNetwork cnnNetwork(network);
+            auto layer = cnnNetwork.getLayerByName(layerName.c_str());
+            auto implPtr = holder.getConstInferImpl(layer->type);
+            if (!implPtr && !isForShape)
+                THROW_IE_EXCEPTION << "Failed to find reference implementation for `"
+                                      + layer->name + "` Layer with `" + layer->type + "` Type on constant propagation";
+            if (!isForShape) {
+                auto outputBlobs = getOutputBlobs(layer->outData);
+                implPtr->infer(getInputBlobs(layer->insData, isForShape), layer->params, layer->blobs, outputBlobs);
+                for (int i = 0; i < layer->outData.size(); i++) {
+                    std::string dataName = layer->outData[i]->name;
+                    auto shapes = layer->outData[i]->getTensorDesc().getDims();
+                    outputBlobs[i]->Reshape(SizeVector(shapes.rbegin(), shapes.rend()),
+                                            TensorDesc::getLayoutByDims(shapes));
+                    constData[dataName] = outputBlobs[i];
+                }
+            }
+        }
     }
-    newLayer->outData = layer->outData;
+    return constData;
+}
+
+void ConstTransformer::trimShapeInputs(const std::vector<std::string>& constLayers) {
+    for (const auto& layerName : constLayers) {
+        auto layer = cnnNetwork.getLayerByName(layerName.c_str());
+        if (layer->outData.size() == 1 && layer->type == "Const" && layer->insData.empty()) {
+            auto constData = layer->outData[0];
+            std::map<std::string, CNNLayerPtr> inputToMap = constData->getInputTo();
+            for (const auto& inputTo : inputToMap) {
+                CNNLayerPtr inputToLayer = inputTo.second;
+                if (shapeTaking.find(inputToLayer->type) != shapeTaking.end()) {
+                    auto& insData = inputToLayer->insData;
+                    auto it = std::find_if(insData.begin(), insData.end(),
+                                           [&constData](const DataWeakPtr& current) {
+                                               return current.lock()->name == constData->name;
+                                           });
+                    if (it != insData.end() && std::distance(insData.begin(), it) == 1) {
+                        inputToLayer->insData.erase(it);
+                        constData->getInputTo().erase(inputTo.first);
+                    }
+                }
+            }
+            if (constData->inputTo.empty()) {
+                network->removeData(constData->name);
+                network->removeLayer(layer->name);
+            }
+        }
+    }
+}
+
+void ConstTransformer::foldConstSubgraphs() {
+    auto sortedLayers = details::CNNNetSortTopologically(*network);
+    auto constLayers = getConstLayers(sortedLayers);
+    auto constData = getConstData(constLayers, sortedLayers);
+    foldConstSubgraphsInternal(constLayers, constData, sortedLayers);
+}
 
-    network.addLayer(newLayer);
+void ConstTransformer::fullTrim() {
+    auto sortedLayers = details::CNNNetSortTopologically(*network);
+    auto constMapLayers = getConstLayers(sortedLayers);
+    auto constData = getConstData(constMapLayers, sortedLayers);
+    auto constLayers = foldConstSubgraphsInternal(constMapLayers, constData, sortedLayers);
+    trimShapeInputs(constLayers);
 }
 
 }  // namespace InferenceEngine