// This file is part of OpenCV project. // It is subject to the license terms in the LICENSE file found in the top-level directory // of this distribution and at http://opencv.org/license.html. #ifndef __OPENCV_DNN_SRC_NET_IMPL_HPP__ #define __OPENCV_DNN_SRC_NET_IMPL_HPP__ #include "op_halide.hpp" #include "op_inf_engine.hpp" #include "ie_ngraph.hpp" #include "op_vkcom.hpp" #include "op_cuda.hpp" #include "op_webnn.hpp" #include "op_timvx.hpp" #include #include #include #include #include #include "layer_internals.hpp" // LayerPin LayerData DataLayer #include "legacy_backend.hpp" // wrapMat BlobManager OpenCLBackendWrapper namespace cv { namespace dnn { CV__DNN_INLINE_NS_BEGIN using std::make_pair; using std::string; // NB: Implementation is divided between of multiple .cpp files struct Net::Impl : public detail::NetImplBase { typedef std::map LayersShapesMap; typedef std::map MapIdToLayerData; Impl(); Ptr netInputLayer; std::vector blobsToKeep; MapIdToLayerData layers; std::map layerNameToId; std::map outputNameToId; // use registerOutput() to populate outputs BlobManager blobManager; int preferableBackend; int preferableTarget; String halideConfigFile; bool skipInfEngineInit; bool hasDynamicShapes; // Map host data to backend specific wrapper. std::map> backendWrappers; int lastLayerId; bool netWasAllocated; bool netWasQuantized; bool fusion; bool isAsync; std::vector layersTimings; bool empty() const; void setPreferableBackend(int backendId); void setPreferableTarget(int targetId); // FIXIT use inheritance Ptr wrap(Mat& host); void clear(); void setUpNet(const std::vector& blobsToKeep_ = std::vector()); Ptr getLayer(int layerId) const; Ptr getLayer(const LayerId& layerId) const; int getLayerId(const String& layerName) const; int getLayerId(int id) const; int getLayerId(DictValue& layerDesc) const; String getLayerName(int id) const; LayerData& getLayerData(int id) const; LayerData& getLayerData(const String& layerName) const; LayerData& getLayerData(const DictValue& layerDesc) const; static void addLayerInput(LayerData& ld, int inNum, LayerPin from); int resolvePinOutputName(LayerData& ld, const String& outName) const; LayerPin getPinByAlias(const String& layerName) const; std::vector getLayerOutPins(const String& layerName) const; // FIXIT remove dtype int addLayer(const String& name, const String& type, const int& dtype, LayerParams& params); int addLayerToPrev(const String& name, const String& type, const int& dtype, LayerParams& params); void connect(int outLayerId, int outNum, int inLayerId, int inNum); int registerOutput(const std::string& outputName, int layerId, int outputPort); // FIXIT drop "unconnected" API std::vector getUnconnectedOutLayers() const; std::vector getUnconnectedOutLayersNames() /*const*/; void setInputsNames(const std::vector& inputBlobNames); void setInputShape(const String& inputName, const MatShape& shape); void setInput(InputArray blob, const String& name, double scalefactor, const Scalar& mean); Mat getParam(int layer, int numParam) const; void setParam(int layer, int numParam, const Mat& blob); std::vector> getLayerInputs(int layerId) const; std::vector getLayerNames() const; // TODO drop? void getLayerTypes(std::vector& layersTypes) const; int getLayersCount(const String& layerType) const; // FIXIT use inheritance void initBackend(const std::vector& blobsToKeep_); void setHalideScheduler(const String& scheduler); #ifdef HAVE_HALIDE void compileHalide(); void initHalideBackend(); #endif #ifdef HAVE_DNN_NGRAPH void addNgraphOutputs(LayerData& ld); void initNgraphBackend(const std::vector& blobsToKeep_); #endif #ifdef HAVE_WEBNN void addWebnnOutputs(LayerData& ld); void initWebnnBackend(const std::vector& blobsToKeep_); #endif #ifdef HAVE_VULKAN void initVkComBackend(); #endif #ifdef HAVE_TIMVX // Create timVxInfo for reserve tvGraphList. TimVXInfo timVxInfo = TimVXInfo(); void tvUpdateConfictMap(int graphIndex, LayerData& ld, std::vector >& graphConflictMap); void tvConvertToOutputNode(const LayerData& ld, Ptr& targetWrap); void initTimVXBackend(); #endif #ifdef HAVE_CUDA struct CudaInfo_t { CudaInfo_t(cuda4dnn::csl::CSLContext ctxt, cuda4dnn::csl::Stream d2h_stream_) : context(std::move(ctxt)) , d2h_stream(std::move(d2h_stream_)) {} cuda4dnn::csl::CSLContext context; cuda4dnn::csl::Stream d2h_stream; cuda4dnn::csl::Workspace workspace; }; std::unique_ptr cudaInfo; void initCUDABackend(const std::vector& blobsToKeep_); #endif void allocateLayer(int lid, const LayersShapesMap& layersShapes); // TODO add getter void enableFusion(bool fusion_); void fuseLayers(const std::vector& blobsToKeep_); void allocateLayers(const std::vector& blobsToKeep_); void forwardLayer(LayerData& ld); void forwardToLayer(LayerData& ld, bool clearFlags = true); Mat forward(const String& outputName); AsyncArray forwardAsync(const String& outputName); void forward(OutputArrayOfArrays outputBlobs, const String& outputName); void forward(OutputArrayOfArrays outputBlobs, const std::vector& outBlobNames); void forward(std::vector>& outputBlobs, const std::vector& outBlobNames); void getLayerShapesRecursively(int id, LayersShapesMap& inOutShapes); void getLayersShapes( const ShapesVec& netInputShapes, std::vector& layersIds, std::vector& inLayersShapes, std::vector& outLayersShapes) /*const*/; void getLayersShapes(const ShapesVec& netInputShapes, LayersShapesMap& inOutShapes); void getLayerShapes(const ShapesVec& netInputShapes, const int layerId, LayerShapes& shapes); void updateLayersShapes(); int64 getFLOPS(const std::vector& netInputShapes) /*const*/; int64 getFLOPS( const int layerId, const std::vector& netInputShapes) /*const*/; void getMemoryConsumption( const int layerId, const std::vector& netInputShapes, size_t& weights, size_t& blobs) /*const*/; void getMemoryConsumption( const std::vector& netInputShapes, size_t& weights, size_t& blobs) /*const*/; void getMemoryConsumption( const std::vector& netInputShapes, std::vector& layerIds, std::vector& weights, std::vector& blobs) /*const*/; int64 getPerfProfile(std::vector& timings) const; // TODO drop LayerPin getLatestLayerPin(const std::vector& pins) const; Mat getBlob(const LayerPin& pin) const; Mat getBlob(String outputName) const; #ifdef CV_CXX11 AsyncArray getBlobAsync(const LayerPin& pin); AsyncArray getBlobAsync(String outputName); #endif // CV_CXX11 #ifdef HAVE_INF_ENGINE static Net createNetworkFromModelOptimizer(InferenceEngine::CNNNetwork& ieNet); #endif string dump(bool forceAllocation = false) const; void dumpNetworkToFile() const; // FIXIT drop from inference API Net quantize(InputArrayOfArrays calibData, int inputsDtype, int outputsDtype, bool perChannel) /*const*/; void getInputDetails(std::vector& scales, std::vector& zeropoints) /*const*/; void getOutputDetails(std::vector& scales, std::vector& zeropoints) /*const*/; }; // Net::Impl CV__DNN_INLINE_NS_END }} // namespace cv::dnn #endif // __OPENCV_DNN_SRC_NET_IMPL_HPP__