feat(//cpp/trtorchc): Adding a new CLI application for TRTorch which

narendasan · narendasan · commit 4f349a12de03 · 2020-05-30T18:55:34.000-07:00
will serve as a replacement to trtorchexec and act like a GCC style
compiler for TorchScript

Signed-off-by: Naren Dasan <naren@narendasan.com>
Signed-off-by: Naren Dasan <narens@nvidia.com>
diff --git a/cpp/api/include/trtorch/ptq.h b/cpp/api/include/trtorch/ptq.h
@@ -104,18 +104,17 @@ class Int8Calibrator : Algorithm {
             std::stringstream ss;
             ss << "Reading Calibration Cache from " << cache_file_path_;
             logging::log(logging::Level::kINFO, ss.str());
+
             cache_.clear();
-            std::ifstream cache_file(cache_file_path_, std::ios::binary);
-            cache_file >> std::noskipws;
-            if (cache_file.good()) {
-                std::copy(std::istream_iterator<char>(cache_file),
-                            std::istream_iterator<char>(),
-                            std::back_inserter(cache_));
-                ss << "Cache read";
-                logging::log(logging::Level::kDEBUG, ss.str());
+            std::ifstream input(cache_file_path_, std::ios::binary);
+            input >> std::noskipws;
+            if (input.good()) {
+                std::copy(std::istream_iterator<char>(input), std::istream_iterator<char>(),
+                    std::back_inserter(cache_));
+                logging::log(logging::Level::kDEBUG, "Cache read");
             }
-            cache_size_ = cache_.size();
-            return cache_size_ ? cache_.data() : nullptr;
+            length = cache_.size();
+            return length ? cache_.data() : nullptr;
         }
         return nullptr;
     }
@@ -220,23 +219,17 @@ class Int8CacheCalibrator : Algorithm {
         std::stringstream ss;
         ss << "Reading Calibration Cache from " << cache_file_path_;
         logging::log(logging::Level::kINFO, ss.str());
+
         cache_.clear();
-        std::ifstream cache_file;
-        cache_file.open(cache_file_path_, std::ios::in | std::ios::binary);
-        cache_file.unsetf(std::ios::skipws);
-        cache_file.seekg(0, std::ios::beg);
-        cache_.reserve(cache_file.tellg());
-        cache_file.seekg(0, std::ios::beg);
-        if (cache_file.good()) {
-            std::cout << "Trying to read cache" << std::endl;
-            std::copy(std::istreambuf_iterator<char>(cache_file),
-                        std::istreambuf_iterator<char>(),
-                        std::back_inserter(cache_));
-            ss << "Cache read";
-            logging::log(logging::Level::kDEBUG, ss.str());
+        std::ifstream input(cache_file_path_, std::ios::binary);
+        input >> std::noskipws;
+        if (input.good()) {
+            std::copy(std::istream_iterator<char>(input), std::istream_iterator<char>(),
+                std::back_inserter(cache_));
+            logging::log(logging::Level::kDEBUG, "Cache read");
         }
-        cache_size_ = cache_.size();
-        return cache_size_ ? cache_.data() : nullptr;
+        length = cache_.size();
+        return length ? cache_.data() : nullptr;
     }
 
 
diff --git a/cpp/api/include/trtorch/trtorch.h b/cpp/api/include/trtorch/trtorch.h
@@ -142,6 +142,14 @@ struct TRTORCH_API ExtraInfo {
          * @return false
          */
         constexpr bool operator==(DataType other) const { return value == other.value; }
+        /**
+         * @brief Equality comparison of a DataType against a raw DataType::Value
+         *
+         * @param other
+         * @return true
+         * @return false
+         */
+        constexpr bool operator==(DataType::Value other) const { return value == other; }
         /**
          * @brief Comparision operator for DataType
          *
@@ -150,6 +158,14 @@ struct TRTORCH_API ExtraInfo {
          * @return false
          */
         constexpr bool operator!=(DataType other) const { return value != other.value; }
+        /**
+         * @brief Inequality comparison of a DataType against a raw DataType::Value
+         *
+         * @param other
+         * @return true
+         * @return false
+         */
+        constexpr bool operator!=(DataType::Value other) const { return value != other; }
     private:
         Value value;
     };
diff --git a/cpp/trtorchc/BUILD b/cpp/trtorchc/BUILD
@@ -0,0 +1,14 @@
+package(default_visibility = ["//visibility:public"])
+
+cc_binary(
+    name = "trtorchc",
+    srcs = [
+        "main.cpp"
+    ],
+    deps = [
+        "@libtorch//:libtorch",
+        "@libtorch//:caffe2",
+        "//third_party/args",
+        "//cpp/api:trtorch"
+    ],
+)
diff --git a/cpp/trtorchc/README.md b/cpp/trtorchc/README.md
@@ -0,0 +1,87 @@
+# trtorchc
+
+trtorchc is a compiler CLI application using the TRTorch compiler. It serves as an easy way to compile a
+TorchScript Module with TRTorch from the command-line to quickly check support or as part of
+a deployment pipeline. All basic features of the compiler are supported including post training
+quantization (though you must already have a calibration cache file to use). The compiler can
+output two formats, either a TorchScript program with the TensorRT engine embedded or
+the TensorRT engine itself as a PLAN file.
+
+All that is required to run the program after compilation is linking against libtrtorch.so in C++
+or importing the trtorch package in Python. All other aspects of using compiled modules are identical
+to standard TorchScript. Load with `torch.jit.load()` and run like you would run any other module.
+
+
+```
+trtorchc [input_file_path] [output_file_path]
+    [input_shapes...] {OPTIONS}
+
+    TRTorch is a compiler for TorchScript, it will compile and optimize
+    TorchScript programs to run on NVIDIA GPUs using TensorRT
+
+  OPTIONS:
+
+      -h, --help                        Display this help menu
+      Verbosity of the compiler
+        -v, --verbose                     Dumps debugging information about the
+                                          compilation process onto the console
+        -w, --warnings                    Disables warnings generated during
+                                          compilation onto the console (warnings
+                                          are on by default)
+        --info                            Dumps info messages generated during
+                                          compilation onto the console
+      --build-debuggable-engine         Creates a debuggable engine
+      --use-strict-types                Restrict operating type to only use set
+                                        default operation precision
+                                        (op_precision)
+      --allow-gpu-fallback              (Only used when targeting DLA
+                                        (device-type)) Lets engine run layers on
+                                        GPU if they are not supported on DLA
+      -p[precision],
+      --default-op-precision=[precision]
+                                        Default operating precision for the
+                                        engine (Int8 requires a
+                                        calibration-cache argument) [ float |
+                                        float32 | f32 | half | float16 | f16 |
+                                        int8 | i8 ] (default: float)
+      -d[type], --device-type=[type]    The type of device the engine should be
+                                        built for [ gpu | dla ] (default: gpu)
+      --engine-capability=[capability]  The capability the engine should be
+                                        built for [ default | safe_gpu |
+                                        safe_dla ]
+      --calibration-cache-file=[file_path]
+                                        Path to calibration cache file to use
+                                        for post training quantization
+      --num-min-timing-iter=[num_iters] Number of minimization timing iterations
+                                        used to select kernels
+      --num-avg-timing-iters=[num_iters]
+                                        Number of averaging timing iterations
+                                        used to select kernels
+      --workspace-size=[workspace_size] Maximum size of workspace given to
+                                        TensorRT
+      --max-batch-size=[max_batch_size] Maximum batch size (must be >= 1 to be
+                                        set, 0 means not set)
+      -t[threshold],
+      --threshold=[threshold]           Maximum acceptable numerical deviation
+                                        from standard torchscript output
+                                        (default 2e-5)
+      --save-engine                     Instead of compiling a full
+                                        TorchScript program, save the created
+                                        engine to the path specified as the
+                                        output path
+      input_file_path                   Path to input TorchScript file
+      output_file_path                  Path for compiled TorchScript (or
+                                        TensorRT engine) file
+      input_shapes...                   Sizes for inputs to engine, can either
+                                        be a single size or a range defined by
+                                        Min, Optimal, Max sizes, e.g.
+                                        "(N,..,C,H,W)"
+                                        "[(MIN_N,..,MIN_C,MIN_H,MIN_W);(OPT_N,..,OPT_C,OPT_H,OPT_W);(MAX_N,..,MAX_C,MAX_H,MAX_W)]"
+      "--" can be used to terminate flag options and force all following
+      arguments to be treated as positional options
+```
+
+e.g.
+```
+trtorchc tests/modules/ssd_traced.jit.pt ssd_trt.ts "[(1,3,300,300); (1,3,512,512); (1, 3, 1024, 1024)]" -p f16
+```
diff --git a/cpp/trtorchc/main.cpp b/cpp/trtorchc/main.cpp