Skip to content

Commit 3e12647

Browse files
kevinch-nv, pranavm-nvidia, jywu-msft, JuHyung-Son, dsandler-bos-msk
authored
Merge master into 7.0 (onnx#494)
* Updating linear resize dimensions check (onnx#362) * Updates global pooling functions to work correctly with dynamic shapes (onnx#365) * Support empty initializers for optional inputs (onnx#366) * Add support for empty initializers for optional inputs * Alphabetize importPluginFactory * Support ceiling mode padding for dynamic inputs (onnx#368) * Register empty Constant node outputs to support empty weights (onnx#369) * Update myelin library name on Windows (onnx#371) * Update logic to import ONNX initializers (onnx#375) * Adding more type checks (onnx#380) * Add type check for gather and shapedweights attribute imports (onnx#384) * Throw warning if seed input is provided for randomuniform nodes (onnx#386) * Update spacetodepth importer to support fulldims and dynamic shapes (onnx#392) * Add check to avoid console spam of warnings (onnx#402) * fix some build warnings/errors on Windows VS2019 (onnx#403) * remove c++11/14 non-compliant constexpr lambdas * fix build warnings on VS2019 * disable shape input tensor * Revert "disable shape input tensor" This reverts commit 9a49e03. * Support opset11 padding (onnx#408) * Fix loop importer scan output calculation (onnx#412) * Fix typo in operators.md supported onnx operators (onnx#399) There are two overlapping RNN operators, one supporting and the other not. Since onnx supports RNN, the one with supported N should be removed. Signed-off-by: juhyung <sonju0427@gmail.com> * Added optimization only mode which runs optimization passes on the model without converting it to tensorrt. (onnx#420) * New command line options. * Updated documentation. * Currently requires linking against onnx project. 
* Support opset8 scan (onnx#433) * Fix deconv importer and remove instancenormalization epsilon clamp value (onnx#434) * Fix deconv importer and remove instancenormalization epsilon clamp value * Remove dilations * Add check for shape tensor outputs (onnx#437) * Fix slice calculation for -INT_MAX (onnx#438) * Support boolean weight conversion to tensors (onnx#439) * Fix node output accessor for older versions of protobuf (onnx#441) * Add const qualifier to isNullTensor() (onnx#446) * Support negative slicing across an entire axis (onnx#453) * Keep track of Loop tensor mappings (onnx#454) * Fix fp16 weight import (onnx#484) * Fix GEMM import assertion (onnx#485) Co-authored-by: pranavm-nvidia <49246958+pranavm-nvidia@users.noreply.github.com> Co-authored-by: George Wu <jywu@microsoft.com> Co-authored-by: JuHyung Son <sonju0427@gmail.com> Co-authored-by: Dennis Sandler <sandler.denis@gmail.com>
1 parent 84b5be1 commit 3e12647

13 files changed

Lines changed: 823 additions & 283 deletions

CMakeLists.txt

Lines changed: 10 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -111,9 +111,15 @@ find_library(TENSORRT_LIBRARY_INFER nvinfer
111111
find_library(TENSORRT_LIBRARY_INFER_PLUGIN nvinfer_plugin
112112
HINTS ${TENSORRT_ROOT} ${TENSORRT_BUILD} ${CUDA_TOOLKIT_ROOT_DIR}
113113
PATH_SUFFIXES lib lib64 lib/x64)
114-
find_library(TENSORRT_LIBRARY_MYELIN myelin
115-
HINTS ${TENSORRT_ROOT} ${TENSORRT_BUILD} ${CUDA_TOOLKIT_ROOT_DIR}
116-
PATH_SUFFIXES lib lib64 lib/x64)
114+
if(WIN32)
115+
find_library(TENSORRT_LIBRARY_MYELIN myelin64_1
116+
HINTS ${TENSORRT_ROOT} ${TENSORRT_BUILD} ${CUDA_TOOLKIT_ROOT_DIR}
117+
PATH_SUFFIXES lib lib64 lib/x64)
118+
else()
119+
find_library(TENSORRT_LIBRARY_MYELIN myelin
120+
HINTS ${TENSORRT_ROOT} ${TENSORRT_BUILD} ${CUDA_TOOLKIT_ROOT_DIR}
121+
PATH_SUFFIXES lib lib64 lib/x64)
122+
endif()
117123
set(TENSORRT_LIBRARY ${TENSORRT_LIBRARY_INFER} ${TENSORRT_LIBRARY_INFER_PLUGIN} ${TENSORRT_LIBRARY_MYELIN})
118124
MESSAGE(STATUS "Find TensorRT libs at ${TENSORRT_LIBRARY}")
119125
find_package_handle_standard_args(
@@ -152,7 +158,7 @@ endif()
152158
# --------------------------------
153159
add_executable(onnx2trt ${EXECUTABLE_SOURCES})
154160
target_include_directories(onnx2trt PUBLIC ${ONNX_INCLUDE_DIRS})
155-
target_link_libraries(onnx2trt PUBLIC ${PROTOBUF_LIB} nvonnxparser_static ${CMAKE_THREAD_LIBS_INIT} ${CMAKE_DL_LIBS}) #${CUDA_LIBRARIES}
161+
target_link_libraries(onnx2trt PUBLIC ${PROTOBUF_LIB} onnx nvonnxparser_static ${CMAKE_THREAD_LIBS_INIT} ${CMAKE_DL_LIBS}) #${CUDA_LIBRARIES}
156162

157163
# --------------------------------
158164
# API Tests

ImporterContext.hpp

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -48,6 +48,8 @@ class ImporterContext final : public IImporterContext
4848
mTensorNameCounts; // Keep track of how many times a tensor name shows up, to avoid duplicate naming in TRT.
4949
StringMap<size_t>
5050
mLayerNameCounts; // Keep track of how many times a tensor name shows up, to avoid duplicate naming in TRT.
51+
std::unordered_set<std::string> mUnsupportedShapeTensors; // Container to hold any shape tensors that are the output of layers that do not support shape tensors.
52+
StringMap<std::string> mLoopTensors; // Container to map subgraph tensors to their original outer graph names.
5153
public:
5254
ImporterContext(nvinfer1::INetworkDefinition* network, nvinfer1::ILogger* logger)
5355
: _network(network)
@@ -78,6 +80,14 @@ class ImporterContext final : public IImporterContext
7880
{
7981
return mLayerPrecisions;
8082
}
83+
virtual std::unordered_set<std::string>& unsupportedShapeTensors() override
84+
{
85+
return mUnsupportedShapeTensors;
86+
}
87+
virtual StringMap<std::string>& loopTensors() override
88+
{
89+
return mLoopTensors;
90+
}
8191

8292
// This actually handles weights as well, but is named this way to be consistent with the tensors()
8393
virtual void registerTensor(TensorOrWeights tensor, const std::string& basename) override

ModelImporter.cpp

Lines changed: 27 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -172,7 +172,8 @@ Status parseGraph(
172172
auto& output = outputs.at(i);
173173
ssOutputs << "[" << outputName << " -> " << output.shape() << "], ";
174174
// Note: This condition is to allow ONNX outputs to be ignored
175-
if (output && !outputName.empty())
175+
// Always register output weights (even empty ones) as it may be mapped to an unused input
176+
if ((output || output.is_weights()) && !outputName.empty())
176177
{
177178
ctx->registerTensor(std::move(output), outputName);
178179
}
@@ -331,11 +332,11 @@ bool ModelImporter::supportsModel(
331332
}
332333
}
333334
}
334-
335-
auto checkForInput = [&input_node](::ONNX_NAMESPACE::NodeProto const& node) {
335+
auto* ctx = &_importer_ctx;
336+
auto checkForInput = [&input_node, &ctx](::ONNX_NAMESPACE::NodeProto const& node) {
336337
for (auto input : node.input())
337338
{
338-
if (input_node == input)
339+
if (input_node == input || ctx->loopTensors()[input_node] == input)
339340
{
340341
return true;
341342
}
@@ -351,17 +352,23 @@ bool ModelImporter::supportsModel(
351352
cout << "Failed to sort model topologically, exiting ..." << endl;
352353
return false;
353354
}
355+
354356
for (int node_idx : topological_order)
355357
{
356358
::ONNX_NAMESPACE::NodeProto const& node = model.graph().node(node_idx);
359+
357360
// Add the node to the subgraph if:
358-
// 1. Importer function is regestiered for the operator type
359-
// 2. It is not directly connected to an unsupported input
360-
// 3. Parsing did not hit an error on the node
361+
// 1. Importer function is registered for the operator type
362+
// 2. It is NOT directly connected to an unsupported input
363+
// 3. Parsing did NOT hit an error on the node
364+
// 4. Any shape tensor output is coming from a supported node
361365
bool registered = supportsOperator(node.op_type().c_str());
362366
bool containsInput = (input_node.empty()) ? false : checkForInput(node);
363367
bool containsIndex = node_idx == error_node;
364-
if (registered && !containsInput && !containsIndex)
368+
auto const tensor = node.output(0);
369+
bool supportedShapeTensorOutput = ctx->unsupportedShapeTensors().count(tensor) == 0 ? true : false;
370+
371+
if (registered && !containsInput && !containsIndex && supportedShapeTensorOutput)
365372
{
366373
if (newSubGraph)
367374
{
@@ -447,6 +454,18 @@ void removeShapeTensorCasts(IImporterContext* ctx)
447454
{
448455
t.setType(SHAPE_TENSOR_TYPE);
449456
}
457+
// Some layers do not support shape tensor outputs. Keep track of these tensor names
458+
// for supportsModel().
459+
auto type = layer->getType();
460+
auto elementwiseOp = layer->getType() == nvinfer1::LayerType::kELEMENTWISE ? (static_cast<nvinfer1::IElementWiseLayer*>(layer))->getOperation() : nvinfer1::ElementWiseOperation::kSUM;
461+
auto reduceOp = layer->getType() == nvinfer1::LayerType::kREDUCE ? (static_cast<nvinfer1::IReduceLayer*>(layer))->getOperation() : nvinfer1::ReduceOperation::kSUM;
462+
463+
if (!supportsShapeTensor(type, elementwiseOp, reduceOp))
464+
{
465+
auto name = layer->getOutput(0)->getName();
466+
ctx->unsupportedShapeTensors().insert(name);
467+
LOG_ERROR("Found " << name << " as a shape tensor output from a layer that does not support it!");
468+
}
450469
}
451470
}
452471
}

OnnxAttrs.cpp

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -109,7 +109,11 @@ onnx2trt::ShapedWeights OnnxAttrs::get<onnx2trt::ShapedWeights>(const std::strin
109109
{
110110
::ONNX_NAMESPACE::TensorProto const& onnx_weights_tensor = this->at(key)->t();
111111
onnx2trt::ShapedWeights weights;
112-
convertOnnxWeights(onnx_weights_tensor, &weights, mCtx);
112+
// Return empty weights if conversion failed
113+
if (!convertOnnxWeights(onnx_weights_tensor, &weights, mCtx))
114+
{
115+
return onnx2trt::ShapedWeights::empty(::ONNX_NAMESPACE::TensorProto_DataType_FLOAT);
116+
}
113117
return weights;
114118
}
115119

README.md

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -58,6 +58,15 @@ ONNX models can also be converted to human-readable text:
5858

5959
onnx2trt my_model.onnx -t my_model.onnx.txt
6060

61+
ONNX models can also be optimized by ONNX's optimization libraries.
62+
To optimize an ONNX model and output a new one use `-m` to specify the output model name and `-O` to specify a semicolon-separated list of optimization passes to apply:
63+
64+
onnx2trt my_model.onnx -O "pass_1;pass_2;pass_3" -m my_model_optimized.onnx
65+
66+
See more all available optimization passes by running:
67+
68+
onnx2trt -p
69+
6170
See more usage information by running:
6271

6372
onnx2trt -h

TensorOrWeights.hpp

Lines changed: 10 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -67,14 +67,18 @@ class TensorOrWeights
6767
{
6868
return _variant == NODE_WEIGHTS;
6969
}
70+
bool isNullTensor() const
71+
{
72+
return is_tensor() && _tensor == nullptr;
73+
}
7074
nvinfer1::ITensor& tensor()
7175
{
72-
assert(is_tensor());
76+
assert(!isNullTensor());
7377
return *_tensor;
7478
}
7579
nvinfer1::ITensor const& tensor() const
7680
{
77-
assert(is_tensor());
81+
assert(!isNullTensor());
7882
return *_tensor;
7983
}
8084
ShapedWeights& weights()
@@ -99,6 +103,10 @@ class TensorOrWeights
99103
{
100104
return is_tensor() ? _tensor->getType() == nvinfer1::DataType::kINT32 : _weights.type == ::ONNX_NAMESPACE::TensorProto_DataType_INT32;
101105
}
106+
bool isBool() const
107+
{
108+
return is_tensor() ? _tensor->getType() == nvinfer1::DataType::kBOOL : _weights.type == ::ONNX_NAMESPACE::TensorProto_DataType_BOOL;
109+
}
102110
};
103111

104112
} // namespace onnx2trt

0 commit comments

Comments
 (0)