tensorrt_provider_options.h
// Copyright (c) Microsoft Corporation. All rights reserved.
// Licensed under the MIT License.

#pragma once

/// <summary>
/// Options for the TensorRT provider that are passed to SessionOptionsAppendExecutionProvider_TensorRT_V2.
/// Please note that this struct is *similar* to OrtTensorRTProviderOptions but is only to be used internally.
/// Going forward, new TRT provider options are to be supported via this struct, and usage of the publicly defined
/// OrtTensorRTProviderOptions will be deprecated over time.
/// Users can only obtain an instance of OrtTensorRTProviderOptionsV2 via CreateTensorRTProviderOptions.
/// Illustrative usage sketches follow the struct definition below.
/// </summary>
struct OrtTensorRTProviderOptionsV2 {
  OrtTensorRTProviderOptionsV2& operator=(const OrtTensorRTProviderOptionsV2& other);  // copy assignment operator

  int device_id{0};  // cuda device id.
  int has_user_compute_stream{0};  // indicator of user specified CUDA compute stream.
  void* user_compute_stream{nullptr};  // user specified CUDA compute stream.
                                       // can be updated using: UpdateTensorRTProviderOptionsWithValue
  int trt_max_partition_iterations{1000};  // maximum iterations for TensorRT parser to get capability
  int trt_min_subgraph_size{1};  // minimum size of TensorRT subgraphs
  size_t trt_max_workspace_size{0};  // maximum workspace size for TensorRT. Default 0 means use the maximum device memory size
  int trt_fp16_enable{0};  // enable TensorRT FP16 precision. Default 0 = false, nonzero = true
  int trt_int8_enable{0};  // enable TensorRT INT8 precision. Default 0 = false, nonzero = true
  const char* trt_int8_calibration_table_name{nullptr};  // TensorRT INT8 calibration table name.
  int trt_int8_use_native_calibration_table{0};  // use native TensorRT generated calibration table. Default 0 = false, nonzero = true
  int trt_dla_enable{0};  // enable DLA. Default 0 = false, nonzero = true
  int trt_dla_core{0};  // DLA core number. Default 0
  int trt_dump_subgraphs{0};  // dump TRT subgraph. Default 0 = false, nonzero = true
  int trt_engine_cache_enable{0};  // enable engine caching. Default 0 = false, nonzero = true
  const char* trt_engine_cache_path{nullptr};  // specify engine cache path, defaults to the working directory
  int trt_engine_decryption_enable{0};  // enable engine decryption. Default 0 = false, nonzero = true
  const char* trt_engine_decryption_lib_path{nullptr};  // specify engine decryption library path
  int trt_force_sequential_engine_build{0};  // force building TensorRT engine sequentially. Default 0 = false, nonzero = true
  int trt_context_memory_sharing_enable{0};  // enable context memory sharing between subgraphs. Default 0 = false, nonzero = true
  int trt_layer_norm_fp32_fallback{0};  // force Pow + Reduce ops in layer norm to FP32. Default 0 = false, nonzero = true
  int trt_timing_cache_enable{0};  // enable TensorRT timing cache. Default 0 = false, nonzero = true
  const char* trt_timing_cache_path{nullptr};  // specify timing cache path, if none is provided the trt_engine_cache_path is used
  int trt_force_timing_cache{0};  // force the TensorRT cache to be used even if device profile does not match. Default 0 = false, nonzero = true
  int trt_detailed_build_log{0};  // Enable detailed build step logging on TensorRT EP with timing for each engine build. Default 0 = false, nonzero = true
  int trt_build_heuristics_enable{0};  // Build engine using heuristics to reduce build time. Default 0 = false, nonzero = true
  int trt_sparsity_enable{0};  // Control if sparsity can be used by TRT. Default 0 = false, 1 = true
  int trt_builder_optimization_level{3};  // Set the builder optimization level. WARNING: levels below 3 do not guarantee good engine performance, but greatly improve build time. Default 3, valid range [0-5]
  int trt_auxiliary_streams{-1};  // Set maximum number of auxiliary streams per inference stream. Setting this value to 0 will lead to optimal memory usage. Default -1 = heuristics
  const char* trt_tactic_sources{nullptr};  // specify the tactics to be used by adding (+) or removing (-) tactics from the default
                                            // tactic sources (default = all available tactics) e.g. "-CUDNN,+CUBLAS" available keys: "CUBLAS"|"CUBLAS_LT"|"CUDNN"|"EDGE_MASK_CONVOLUTIONS"
  const char* trt_extra_plugin_lib_paths{nullptr};  // specify extra TensorRT plugin library paths
  const char* trt_profile_min_shapes{nullptr};  // Specify the minimum input shapes of the optimization profile(s) to build the engine with
  const char* trt_profile_max_shapes{nullptr};  // Specify the maximum input shapes of the optimization profile(s) to build the engine with
  const char* trt_profile_opt_shapes{nullptr};  // Specify the optimal input shapes of the optimization profile(s) to build the engine with
  int trt_cuda_graph_enable{0};  // Enable CUDA graph in ORT TRT

  /*
   * Please note that there are rules for using the following context model related provider options:
   *
   * 1. In the case of dumping the context model and loading the context model,
   *    for security reasons, TRT EP doesn't allow the "ep_cache_context" node attribute of the EP context node to be
   *    an absolute path or a relative path that is outside of the context model directory.
   *    This means the engine cache needs to be in the same directory as the context model, or in one of its sub-directories.
   *
   * 2. In the case of dumping the context model, the engine cache path will be changed to a path relative to the context model directory.
   *    For example:
   *    If "trt_dump_ep_context_model" is enabled and "trt_engine_cache_enable" is enabled,
   *    and "trt_ep_context_file_path" is "./context_model_dir",
   *    - if "trt_engine_cache_path" is "" -> the engine cache will be saved to "./context_model_dir"
   *    - if "trt_engine_cache_path" is "engine_dir" -> the engine cache will be saved to "./context_model_dir/engine_dir"
   *    (see the configuration sketch after this struct)
   *
   * 3. In the case of building weight-stripped engines, the same security reasons as listed in 1. apply to the
   *    "onnx_model_filename" node attribute of the EP context node, which contains the filename of the ONNX model with the
   *    weights needed for the refit process. Users can specify a folder path relative to the current working
   *    directory by means of the "trt_onnx_model_folder_path" option.
   */
  int trt_dump_ep_context_model{0};  // Dump EP context node model
  const char* trt_ep_context_file_path{nullptr};  // Specify the file name to dump the EP context node model to. Can be a path, a file name, or a file name with a path.
  int trt_ep_context_embed_mode{0};  // Specify EP context embed mode. Default 0 = context is engine cache path, 1 = context is engine binary data
  int trt_weight_stripped_engine_enable{0};  // Enable weight-stripped engine build. Default 0 = false,
                                             // nonzero = true
  const char* trt_onnx_model_folder_path{nullptr};  // Folder path relative to the current working directory for
                                                    // the ONNX model containing the weights (applicable only when
                                                    // the "trt_weight_stripped_engine_enable" option is enabled)
  const void* trt_onnx_bytestream{nullptr};  // The byte stream of the original ONNX model containing the weights
                                             // (applicable only when the "trt_weight_stripped_engine_enable"
                                             // option is enabled)
                                             // can be updated using: UpdateTensorRTProviderOptionsWithValue
  size_t trt_onnx_bytestream_size{0};  // size of the byte stream provided as "trt_onnx_bytestream"
                                       // can be updated using: UpdateTensorRTProviderOptionsWithValue

  const char* trt_engine_cache_prefix{nullptr};  // specify engine cache prefix
  int trt_engine_hw_compatible{0};  // Enable hardware compatibility. Default 0 = false, nonzero = true
};
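
// ---------------------------------------------------------------------------
// Illustrative usage sketch (not part of the original header): a minimal
// end-to-end flow that obtains the options via CreateTensorRTProviderOptions,
// configures a few string-keyed options, and appends the provider to a
// session. It assumes the ONNX Runtime C API from onnxruntime_c_api.h, a model
// file named "model.onnx", and that the string keys mirror the field names
// above; treat the keys and values as examples rather than a reference.
// ---------------------------------------------------------------------------
#include <cstdio>
#include <cstdlib>

#include "onnxruntime_c_api.h"

static const OrtApi* g_ort = OrtGetApiBase()->GetApi(ORT_API_VERSION);

// Abort with the error message if an ORT call returns a non-null status.
static void CheckStatus(OrtStatus* status) {
  if (status != nullptr) {
    std::fprintf(stderr, "ORT error: %s\n", g_ort->GetErrorMessage(status));
    g_ort->ReleaseStatus(status);
    std::exit(EXIT_FAILURE);
  }
}

int main() {
  // The options instance can only be obtained via CreateTensorRTProviderOptions.
  OrtTensorRTProviderOptionsV2* trt_options = nullptr;
  CheckStatus(g_ort->CreateTensorRTProviderOptions(&trt_options));

  // String-keyed updates; the key names are assumed to match the fields above.
  const char* keys[] = {"device_id", "trt_fp16_enable", "trt_engine_cache_enable", "trt_engine_cache_path"};
  const char* values[] = {"0", "1", "1", "./trt_engines"};
  CheckStatus(g_ort->UpdateTensorRTProviderOptions(trt_options, keys, values, 4));

  OrtEnv* env = nullptr;
  CheckStatus(g_ort->CreateEnv(ORT_LOGGING_LEVEL_WARNING, "trt_example", &env));

  OrtSessionOptions* session_options = nullptr;
  CheckStatus(g_ort->CreateSessionOptions(&session_options));
  CheckStatus(g_ort->SessionOptionsAppendExecutionProvider_TensorRT_V2(session_options, trt_options));

  OrtSession* session = nullptr;
  CheckStatus(g_ort->CreateSession(env, ORT_TSTR("model.onnx"), session_options, &session));

  // ... create input tensors and call g_ort->Run(...) here ...

  g_ort->ReleaseSession(session);
  g_ort->ReleaseSessionOptions(session_options);
  g_ort->ReleaseTensorRTProviderOptions(trt_options);
  g_ort->ReleaseEnv(env);
  return 0;
}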
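
// ---------------------------------------------------------------------------
// Illustrative sketch for the EP context model rules documented in the comment
// block above (not part of the original header). Assumes the includes and the
// `trt_options` instance from the previous sketch, and that the string keys
// mirror the field names; with these values the engine cache is expected to
// land under "./context_model_dir/engine_dir", per rule 2 above. The helper
// name below is hypothetical.
// ---------------------------------------------------------------------------
static void ConfigureEpContextDump(const OrtApi* api, OrtTensorRTProviderOptionsV2* trt_options) {
  const char* keys[] = {
      "trt_engine_cache_enable",     // engine caching enabled, as in the example in the comment above
      "trt_engine_cache_path",       // relative path, resolved against the context model directory when dumping
      "trt_dump_ep_context_model",   // dump the EP context node model
      "trt_ep_context_file_path",    // directory (or file name) the context model is written to
      "trt_ep_context_embed_mode"};  // 0 = context holds the engine cache path, 1 = context embeds engine binary data
  const char* values[] = {"1", "engine_dir", "1", "./context_model_dir", "0"};
  OrtStatus* status = api->UpdateTensorRTProviderOptions(trt_options, keys, values, 5);
  if (status != nullptr) {
    std::fprintf(stderr, "ORT error: %s\n", api->GetErrorMessage(status));
    api->ReleaseStatus(status);
  }
}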
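
// ---------------------------------------------------------------------------
// Illustrative sketch for the fields whose comments above say "can be updated
// using: UpdateTensorRTProviderOptionsWithValue" (not part of the original
// header). The key name "user_compute_stream" is assumed to mirror the field
// name, and `stream` would typically be a CUDA stream created by the
// application (e.g. a cudaStream_t); the helper name is hypothetical.
// trt_onnx_bytestream and trt_onnx_bytestream_size can be updated through the
// same entry point.
// ---------------------------------------------------------------------------
static void UseExternalComputeStream(const OrtApi* api, OrtTensorRTProviderOptionsV2* trt_options, void* stream) {
  // Pointer-valued options go through UpdateTensorRTProviderOptionsWithValue rather than the string-keyed update.
  OrtStatus* status = api->UpdateTensorRTProviderOptionsWithValue(trt_options, "user_compute_stream", stream);
  if (status != nullptr) {
    std::fprintf(stderr, "ORT error: %s\n", api->GetErrorMessage(status));
    api->ReleaseStatus(status);
  }
}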