Commit 118ed0a

ONNX-TensorRT 10.8-GA Release (#1012)
* ONNX-TensorRT 10.8-GA Release
* update date

Signed-off-by: Yuan Yao <[email protected]>
1 parent 9c69a24 commit 118ed0a

File tree

13 files changed: +177 -118 lines

README.md

Lines changed: 4 additions & 4 deletions

```diff
@@ -16,7 +16,7 @@ For press and other inquiries, please contact Hector Marinez at hmarinez@nvidia.

 ## Supported TensorRT Versions

-Development on the this branch is for the latest version of [TensorRT 10.7](https://developer.nvidia.com/nvidia-tensorrt-download) with full-dimensions and dynamic shape support.
+Development on the this branch is for the latest version of [TensorRT 10.8](https://developer.nvidia.com/nvidia-tensorrt-download) with full-dimensions and dynamic shape support.

 For previous versions of TensorRT, refer to their respective branches.

@@ -29,8 +29,8 @@ Current supported ONNX operators are found in the [operator support matrix](docs
 ### Dependencies

 - [Protobuf >= 3.0.x](https://github.com/google/protobuf/releases)
-- [TensorRT 10.7](https://developer.nvidia.com/tensorrt)
-- [TensorRT 10.7 open source libaries] (https://github.com/NVIDIA/TensorRT/)
+- [TensorRT 10.8](https://developer.nvidia.com/tensorrt)
+- [TensorRT 10.8 open source libaries] (https://github.com/NVIDIA/TensorRT/)

 ### Building

@@ -82,7 +82,7 @@ Refer to the link or run `polygraphy run -h` for more information on CLI options

 Python bindings for the ONNX-TensorRT parser are packaged in the shipped `.whl` files.

-TensorRT 10.7 supports ONNX release 1.17.0. Install it with:
+TensorRT 10.8 supports ONNX release 1.17.0. Install it with:

     python3 -m pip install onnx==1.17.0
```

Status.hpp

Lines changed: 1 addition & 0 deletions

```diff
@@ -204,6 +204,7 @@ static std::ostream& operator<<(std::ostream& stream, nvinfer1::DataType const&
     case nvinfer1::DataType::kBOOL: return stream << "bool";
     case nvinfer1::DataType::kFP8: return stream << "float8";
     case nvinfer1::DataType::kINT4: return stream << "int4";
+    case nvinfer1::DataType::kFP4: return stream << "fp4";

     default: throw std::runtime_error("Unknown dtype");
     }
```
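
As a plain illustration of the pattern this hunk extends, here is a minimal, self-contained sketch (using a mock enum standing in for `nvinfer1::DataType`, so the names are assumptions, not the real header) of mapping each enum value to a printable name via `operator<<`:

```cpp
#include <iostream>
#include <stdexcept>

// Mock stand-in for nvinfer1::DataType; the real enum lives in NvInfer.h.
enum class DataType { kBOOL, kFP8, kINT4, kFP4 };

static std::ostream& operator<<(std::ostream& stream, DataType const& dtype)
{
    switch (dtype)
    {
    case DataType::kBOOL: return stream << "bool";
    case DataType::kFP8: return stream << "float8";
    case DataType::kINT4: return stream << "int4";
    case DataType::kFP4: return stream << "fp4"; // the case added in this commit
    }
    throw std::runtime_error("Unknown dtype");
}

int main()
{
    std::cout << DataType::kFP4 << "\n"; // prints "fp4"
    return 0;
}
```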

TensorOrWeights.cpp

Lines changed: 4 additions & 0 deletions

```diff
@@ -24,6 +24,7 @@ std::string TensorOrWeights::getType() const
     case nvinfer1::DataType::kBOOL: return "BOOL";
     case nvinfer1::DataType::kFP8: return "FP8";
     case nvinfer1::DataType::kINT4: return "INT4";
+    case nvinfer1::DataType::kFP4: return "FP4";
     }
 }
 else
@@ -42,6 +43,7 @@ std::string TensorOrWeights::getType() const
     case ::ONNX_NAMESPACE::TensorProto::INT64: return "INT64";
     case ::ONNX_NAMESPACE::TensorProto::FLOAT8E4M3FN: return "FP8";
     case ::ONNX_NAMESPACE::TensorProto::INT4: return "INT4";
+    case ::ONNX_NAMESPACE::TensorProto::FLOAT4E2M1: return "FP4";
     }
 }
 return "UNKNOWN TYPE";
@@ -62,6 +64,7 @@ nvinfer1::DataType TensorOrWeights::convertONNXDataType(ShapedWeights::DataType
     case ::ONNX_NAMESPACE::TensorProto::INT64: return nvinfer1::DataType::kINT64;
     case ::ONNX_NAMESPACE::TensorProto::FLOAT8E4M3FN: return nvinfer1::DataType::kFP8;
     case ::ONNX_NAMESPACE::TensorProto::INT4: return nvinfer1::DataType::kINT4;
+    case ::ONNX_NAMESPACE::TensorProto::FLOAT4E2M1: return nvinfer1::DataType::kFP4;
     }
     assert(false && "Unknown datatype");
     return nvinfer1::DataType::kFLOAT;
@@ -81,6 +84,7 @@ ShapedWeights::DataType TensorOrWeights::convertTRTDataType(nvinfer1::DataType d
     case nvinfer1::DataType::kINT64: return ::ONNX_NAMESPACE::TensorProto::INT64;
     case nvinfer1::DataType::kFP8: return ::ONNX_NAMESPACE::TensorProto::FLOAT8E4M3FN;
     case nvinfer1::DataType::kINT4: return ::ONNX_NAMESPACE::TensorProto::INT4;
+    case nvinfer1::DataType::kFP4: return ::ONNX_NAMESPACE::TensorProto::FLOAT4E2M1;
     }
     assert(false && "Unknown datatype");
     return ::ONNX_NAMESPACE::TensorProto::FLOAT;
```

WeightsContext.cpp

Lines changed: 3 additions & 1 deletion

```diff
@@ -356,7 +356,7 @@ bool WeightsContext::convertOnnxWeights(
     else if (onnxDtype == ::ONNX_NAMESPACE::TensorProto::INT32 || onnxDtype == ::ONNX_NAMESPACE::TensorProto::INT64
         || onnxDtype == ::ONNX_NAMESPACE::TensorProto::FLOAT16 || onnxDtype == ::ONNX_NAMESPACE::TensorProto::BFLOAT16
         || onnxDtype == ::ONNX_NAMESPACE::TensorProto::INT8 || onnxDtype == ::ONNX_NAMESPACE::TensorProto::BOOL
-        || onnxDtype == ::ONNX_NAMESPACE::TensorProto::INT4)
+        || onnxDtype == ::ONNX_NAMESPACE::TensorProto::INT4 || onnxDtype == ::ONNX_NAMESPACE::TensorProto::FLOAT4E2M1)
     {
         if (onnxTensor.raw_data().size() > 0)
         {
@@ -399,6 +399,8 @@ bool WeightsContext::convertOnnxWeights(
         break;
     case ::ONNX_NAMESPACE::TensorProto::INT4:
         // int4 data is packed, each int32 element contains one byte (two int4 nibbles)
+    case ::ONNX_NAMESPACE::TensorProto::FLOAT4E2M1:
+        // int4/fp4 data is packed, each int32 element contains one byte (two int4/fp4 nibbles)
         nbytes = onnxTensor.int32_data().size();
         dataPtr = convertPackedInt32Data(onnxTensor.int32_data().data(), shape, nbytes, onnxDtype);
         break;
```
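
To make the packing comment concrete: the following self-contained sketch (an illustration only, not the parser's actual `convertPackedInt32Data`; it assumes the low nibble holds the first element, and hand-decodes FP4 E2M1 as 1 sign, 2 exponent, and 1 mantissa bit) unpacks two 4-bit values from each byte-sized `int32_data` element:

```cpp
#include <cstdint>
#include <cstdio>
#include <vector>

// Decode a single FP4 E2M1 nibble to float: bit 3 = sign, bits 2-1 = exponent
// (bias 1), bit 0 = mantissa. Representable magnitudes: 0, 0.5, 1, 1.5, 2, 3, 4, 6.
float fp4E2M1ToFloat(uint8_t nibble)
{
    float const sign = (nibble & 0x8) ? -1.0f : 1.0f;
    uint8_t const exponent = (nibble >> 1) & 0x3;
    uint8_t const mantissa = nibble & 0x1;
    if (exponent == 0)
    {
        return sign * 0.5f * mantissa; // subnormal: +-0 or +-0.5
    }
    return sign * static_cast<float>(1 << (exponent - 1)) * (1.0f + 0.5f * mantissa);
}

int main()
{
    // Each int32 element carries one byte, i.e. two packed FP4 values
    // (low nibble first, by assumption).
    std::vector<int32_t> const int32Data = {0x2C, 0x91};
    for (int32_t word : int32Data)
    {
        auto const byte = static_cast<uint8_t>(word & 0xFF);
        printf("%g %g\n", fp4E2M1ToFloat(byte & 0xF), fp4E2M1ToFloat(byte >> 4));
    }
    return 0; // prints: "-2 1" then "0.5 -0.5"
}
```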

docs/Changelog.md

Lines changed: 9 additions & 1 deletion

```diff
@@ -2,7 +2,15 @@

 # ONNX-TensorRT Changelog

-# TensorRT 10.7 GA Release - 2024-12-3
+# TensorRT 10.8 GA Release - 2025-1-30
+For more details, see the 10.8 GA release notes
+
+- Added support for `FLOAT4E2M1` types for quantized networks
+- Added support for dynamic axes and improved performance of `CumSum` operations
+- Fixed the import of local functions when their input tensor names aliased one from an outside scope
+- Added support for `Pow` ops with integer-typed exponent values
+
+# TensorRT 10.7 GA Release - 2024-11-26
 For more details, see the 10.7 GA release notes

 - Now prioritizes using plugins over local functions when a corresponding plugin is available in the registry
```

docs/operators.md

Lines changed: 8 additions & 8 deletions

```diff
@@ -2,13 +2,13 @@

 # Supported ONNX Operators

-TensorRT 10.7 supports operators in the inclusive range of opset 9 to opset 22. Latest information of ONNX operators can be found [here](https://github.com/onnx/onnx/blob/main/docs/Operators.md). More details and limitations are documented in the chart below.
+TensorRT 10.8 supports operators in the inclusive range of opset 9 to opset 22. Latest information of ONNX operators can be found [here](https://github.com/onnx/onnx/blob/main/docs/Operators.md). More details and limitations are documented in the chart below.

-TensorRT supports the following ONNX data types: DOUBLE, FLOAT32, FLOAT16, BFLOAT16, INT32, INT64, FP8, INT8, INT4, UINT8, and BOOL
+TensorRT supports the following ONNX data types: DOUBLE, FLOAT32, FLOAT16, BFLOAT16, FP8, FP4, INT32, INT64, INT8, INT4, UINT8, and BOOL

 > Note: There is limited support for DOUBLE type. TensorRT will attempt to cast DOUBLE down to FLOAT, clamping values to `+-FLT_MAX` if necessary.

-> Note: INT8, INT4, and FP8 are treated as `Quantized Types` in TensorRT, where support is available only through quantization from a floating-point type with higher precision. See [section 7.4.2](https://docs.nvidia.com/deeplearning/tensorrt/developer-guide/index.html#qat-models-work) of the developer guide for more information.
+> Note: INT8, INT4, FP8 and FP4 are treated as `Quantized Types` in TensorRT, where support is available only through quantization from a floating-point type with higher precision. See [section 7.4.2](https://docs.nvidia.com/deeplearning/tensorrt/developer-guide/index.html#qat-models-work) of the developer guide for more information.

 > Note: UINT8 is only supported as network input or output tensor types.

@@ -47,22 +47,22 @@ TensorRT supports the following ONNX data types: DOUBLE, FLOAT32, FLOAT16, BFLOA
 | Compress | N |
 | Concat | Y | FP32, FP16, BF16, INT32, INT64, BOOL |
 | ConcatFromSequence | N |
-| Constant | Y | FP32, FP16, BF16, INT32, INT64, BOOL | `sparse_value`, `value_string`, and `value_strings` attributes are unsupported.
-| ConstantOfShape | Y | FP32, FP16, BF16, INT32, INF64, BOOL |
+| Constant | Y | FP32, FP16, BF16, FP8, FP4, INT4, INT32, INT64, BOOL | `sparse_value`, `value_string`, and `value_strings` attributes are unsupported.
+| ConstantOfShape | Y | FP32, FP16, BF16, FP8, FP4, INT4, INT32, INF64, BOOL |
 | Conv | Y | FP32, FP16, BF16 |
 | ConvInteger | N |
 | ConvTranspose | Y | FP32, FP16, BF16 |
 | Cos | Y | FP32, FP16, BF16 |
 | Cosh | Y | FP32, FP16, BF16 |
-| CumSum | Y | FP32, FP16, BF16 | `axis` must be an initializer |
+| CumSum | Y | FP32, FP16, BF16 | `axis` must be a build-time constant |
 | DFT | N |
 | DeformConv | Y | FP32, FP16 | `input` must have 1D or 2D spatial dimensions. `pads` for the beginning and end along each spatial axis must be the same
 | DepthToSpace | Y | FP32, FP16, BF16, INT32, INT64 |
-| DequantizeLinear | Y | INT8, FP8, INT4 | `x_zero_point` must be zero |
+| DequantizeLinear | Y | INT8, FP8, FP4, INT4 | `x_zero_point` must be zero |
 | Det | N |
 | Div | Y | FP32, FP16, BF16, INT32, INT64 |
 | Dropout | Y | FP32, FP16, BF16 | `is_traning` must be an initializer and evaluate to False.
-| DynamicQuantizeLinear | N |
+| DynamicQuantizeLinear | N | Not supported. TensorRT's IDynamicQuantize can be composed from ONNX operators in the form of a model local function.
 | Einsum | Y | FP32, FP16, BF16 |
 | Elu | Y | FP32, FP16, BF16 |
 | Equal | Y | FP32, FP16, BF16, INT32, INT64 |
```
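
Since the new FP4 support (like the other quantized types) flows through `QuantizeLinear`/`DequantizeLinear` nodes at parse time, a minimal sketch of loading such a model through this parser's public entry points looks like the following; these are the standard TensorRT/nvonnxparser APIs, but the model filename is hypothetical:

```cpp
#include <iostream>
#include "NvInfer.h"
#include "NvOnnxParser.h"

// Minimal logger required by the TensorRT builder and parser entry points.
class Logger : public nvinfer1::ILogger
{
    void log(Severity severity, char const* msg) noexcept override
    {
        if (severity <= Severity::kWARNING)
        {
            std::cout << msg << std::endl;
        }
    }
};

int main()
{
    Logger logger;
    auto* builder = nvinfer1::createInferBuilder(logger);
    auto* network = builder->createNetworkV2(0);
    auto* parser = nvonnxparser::createParser(*network, logger);

    // Hypothetical model containing QuantizeLinear/DequantizeLinear pairs over
    // FLOAT4E2M1 tensors; the parser maps them to TensorRT Q/DQ layers.
    bool const ok = parser->parseFromFile(
        "model_fp4_qdq.onnx", static_cast<int32_t>(nvinfer1::ILogger::Severity::kWARNING));
    if (!ok)
    {
        for (int32_t i = 0; i < parser->getNbErrors(); ++i)
        {
            std::cout << parser->getError(i)->desc() << std::endl;
        }
    }

    delete parser;
    delete network;
    delete builder;
    return ok ? 0 : 1;
}
```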

importerUtils.cpp

Lines changed: 11 additions & 7 deletions

```diff
@@ -333,6 +333,7 @@ bool convertDtype(int32_t onnx_dtype, nvinfer1::DataType* trt_dtype)
     case ::ONNX_NAMESPACE::TensorProto::INT64: *trt_dtype = nvinfer1::DataType::kINT64; break;
     case ::ONNX_NAMESPACE::TensorProto::FLOAT8E4M3FN: *trt_dtype = nvinfer1::DataType::kFP8; break;
     case ::ONNX_NAMESPACE::TensorProto::INT4: *trt_dtype = nvinfer1::DataType::kINT4; break;
+    case ::ONNX_NAMESPACE::TensorProto::FLOAT4E2M1: *trt_dtype = nvinfer1::DataType::kFP4; break;
     default:
         std::cerr << "Unsupported ONNX data type: " << getDtypeName(onnx_dtype) << " (" << std::to_string(onnx_dtype)
             << ")" << std::endl;
@@ -506,6 +507,7 @@ std::string getTrtDtypeName(nvinfer1::DataType TrtDtype)
     case nvinfer1::DataType::kBF16: return "BF16";
     case nvinfer1::DataType::kINT64: return "INT64";
     case nvinfer1::DataType::kINT4: return "INT4";
+    case nvinfer1::DataType::kFP4: return "FP4";
     default: return "<UNKNOWN>";
     }
 }
@@ -903,9 +905,9 @@ nvinfer1::IPluginCreatorInterface* importPluginCreator(ImporterContext* ctx, std
     return creator;
 }

-std::unique_ptr<nvinfer1::IPluginV2, PluginDeleter> createPlugin(std::string const& name,
-    std::string const& /* pluginNamespace */, nvinfer1::IPluginCreator* pluginCreator,
-    std::vector<nvinfer1::PluginField> const& pluginFields)
+std::unique_ptr<nvinfer1::IPluginV2, PluginDeleter> createPlugin(ImporterContext* ctx,
+    ::ONNX_NAMESPACE::NodeProto const& node, std::string const& name, std::string const& /* pluginNamespace */,
+    nvinfer1::IPluginCreator* pluginCreator, std::vector<nvinfer1::PluginField> const& pluginFields)
 {
     if (!pluginCreator)
     {
@@ -953,8 +955,9 @@ CreatorVersion getPluginCreatorVersion(nvinfer1::IPluginCreatorInterface const*
     ONNXTRT_CHECK(false && "Unknown plugin creator version.", ErrorCode::kINTERNAL_ERROR);
 }

-std::unique_ptr<nvinfer1::IPluginV3> createPlugin(std::string const& name, std::string const& pluginNamespace,
-    nvinfer1::IPluginCreatorInterface* pluginCreator, std::vector<nvinfer1::PluginField> const& pluginFields)
+std::unique_ptr<nvinfer1::IPluginV3> createPlugin(ImporterContext* ctx, ::ONNX_NAMESPACE::NodeProto const& node,
+    std::string const& name, std::string const& pluginNamespace, nvinfer1::IPluginCreatorInterface* pluginCreator,
+    std::vector<nvinfer1::PluginField> const& pluginFields)
 {
     if (!pluginCreator)
     {
@@ -1178,7 +1181,7 @@ NodeOutputs modulatedDeformableConvPluginHelper(ImporterContext* ctx, ::ONNX_NAM
     f.emplace_back("dilation", dilationValues.data(), nvinfer1::PluginFieldType::kINT32, listAttrSize);

     // Create plugin from registry
-    auto const plugin = createPlugin(pluginName, kTRT_STD_PLUGIN_NAMESPACE,
+    auto const plugin = createPlugin(ctx, node, pluginName, kTRT_STD_PLUGIN_NAMESPACE,
         static_cast<nvinfer1::IPluginCreator*>(importPluginCreator(ctx, pluginName, pluginVersion)), f);

     ONNXTRT_CHECK_NODE(plugin != nullptr, "ModulatedDeformConv2d plugin was not found in the plugin registry!", node,
@@ -1295,7 +1298,7 @@ NodeOutputs instanceNormPluginHelper(ImporterContext* ctx, ::ONNX_NAMESPACE::Nod
     f.emplace_back("alpha", &alpha, nvinfer1::PluginFieldType::kFLOAT32, 1);

     // Create plugin from registry
-    auto const plugin = createPlugin(getNodeName(node), kTRT_STD_PLUGIN_NAMESPACE,
+    auto const plugin = createPlugin(ctx, node, getNodeName(node), kTRT_STD_PLUGIN_NAMESPACE,
         static_cast<nvinfer1::IPluginCreatorV3One*>(importPluginCreator(ctx, pluginName, pluginVersion)), f);

     ONNXTRT_CHECK_NODE(plugin != nullptr, "InstanceNormalization plugin was not found in the plugin registry!", node,
@@ -1717,6 +1720,7 @@ ::ONNX_NAMESPACE::TensorProto_DataType trtDataTypeToONNX(nvinfer1::DataType dt)
     case nvinfer1::DataType::kUINT8: return ::ONNX_NAMESPACE::TensorProto::UINT8;
     case nvinfer1::DataType::kFP8: return ::ONNX_NAMESPACE::TensorProto::FLOAT8E4M3FN;
     case nvinfer1::DataType::kINT4: return ::ONNX_NAMESPACE::TensorProto::INT4;
+    case nvinfer1::DataType::kFP4: return ::ONNX_NAMESPACE::TensorProto::FLOAT4E2M1;
     }
     return ::ONNX_NAMESPACE::TensorProto_DataType_UNDEFINED;
 }
```

importerUtils.hpp

Lines changed: 6 additions & 5 deletions

```diff
@@ -250,13 +250,14 @@ nvinfer1::IPluginCreatorInterface* importPluginCreator(ImporterContext* ctx, std
     std::string const& pluginVersion, std::string const& pluginNamespace = kTRT_STD_PLUGIN_NAMESPACE);

 // Helper function to get a plugin from the PluginRegistry
-std::unique_ptr<nvinfer1::IPluginV2, PluginDeleter> createPlugin(std::string const& name,
-    std::string const& pluginNamespace, nvinfer1::IPluginCreator* pluginCreator,
-    std::vector<nvinfer1::PluginField> const& pluginFields);
+std::unique_ptr<nvinfer1::IPluginV2, PluginDeleter> createPlugin(ImporterContext* ctx,
+    ::ONNX_NAMESPACE::NodeProto const& node, std::string const& name, std::string const& pluginNamespace,
+    nvinfer1::IPluginCreator* pluginCreator, std::vector<nvinfer1::PluginField> const& pluginFields);

 // Helper function to get a V3 plugin from the PluginRegistry
-std::unique_ptr<nvinfer1::IPluginV3> createPlugin(std::string const& name, std::string const& pluginNamespace,
-    nvinfer1::IPluginCreatorInterface* pluginCreator, std::vector<nvinfer1::PluginField> const& pluginFields);
+std::unique_ptr<nvinfer1::IPluginV3> createPlugin(ImporterContext* ctx, ::ONNX_NAMESPACE::NodeProto const& node,
+    std::string const& name, std::string const& pluginNamespace, nvinfer1::IPluginCreatorInterface* pluginCreator,
+    std::vector<nvinfer1::PluginField> const& pluginFields);

 // Helper function to return the identity of a TensorOrWeights
 TensorOrWeights identity(ImporterContext* ctx, TensorOrWeights input);
```

onnxOpCheckers.cpp

Lines changed: 7 additions & 1 deletion

```diff
@@ -269,6 +269,7 @@ DEFINE_OP_EMPTY_CHECKER(TRT_INT4QuantizeLinear)

 DEFINE_OP_EMPTY_CHECKER(TRT_INT4DequantizeLinear)

+DEFINE_OP_EMPTY_CHECKER(TRT_FP4DynamicQuantize)

 DECLARE_OP_CHECKER(Mul);

@@ -526,7 +527,12 @@ DEFINE_OP_EMPTY_CHECKER(Pad)

 DEFINE_OP_EMPTY_CHECKER(ParametricSoftplus)

-DEFINE_OP_EMPTY_CHECKER(Pow)
+DEFINE_OP_CHECKER(Pow)
+{
+    int32_t const nbInputs = node.input().size();
+    STATIC_CHECK(
+        nbInputs == 2 && "POW operator expects two inputs!", ErrorCode::kINVALID_NODE, node, errors, nodeIndex);
+}

 DEFINE_OP_EMPTY_CHECKER(PRelu)
```
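
The changelog's `Pow` item above is what this checker guards at parse time: exactly two inputs, with integer-typed exponents now accepted. As a sketch of a conforming node, one can be built with the ONNX protobuf API (it requires the ONNX protobuf headers; the tensor names here are hypothetical):

```cpp
#include "onnx/onnx_pb.h"

// Build a Pow node whose exponent may be an integer-typed tensor, which the
// 10.8 parser now accepts; the two-input shape is what the checker validates.
::ONNX_NAMESPACE::NodeProto makeIntExponentPow()
{
    ::ONNX_NAMESPACE::NodeProto node;
    node.set_op_type("Pow");
    node.set_name("pow_int_exponent");
    node.add_input("x");        // e.g. a FLOAT tensor
    node.add_input("exponent"); // e.g. an INT32 initializer
    node.add_output("y");
    return node;
}
```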
