Skip to content

Commit

Permalink
feat(//cpp/api): Adding max batch size setting
Browse files Browse the repository at this point in the history
Signed-off-by: Naren Dasan <naren@narendasan.com>
Signed-off-by: Naren Dasan <narens@nvidia.com>
  • Loading branch information
narendasan committed Apr 23, 2020
1 parent fc70267 commit 1b25542
Show file tree
Hide file tree
Showing 4 changed files with 34 additions and 16 deletions.
35 changes: 23 additions & 12 deletions core/conversion/conversionctx/ConversionCtx.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -9,17 +9,24 @@ namespace core {
namespace conversion {

std::ostream& operator<<(std::ostream& os, const BuilderSettings& s) {
os << "Settings requested for TensorRT engine:" \
<< "\n Operating Precision: " << s.op_precision \
<< "\n Make Refittable Engine: " << s.refit \
<< "\n Debuggable Engine: " << s.debug \
<< "\n Strict Type: " << s.strict_type \
<< "\n Allow GPU Fallback (if running on DLA): " << s.allow_gpu_fallback \
<< "\n Min Timing Iterations: " << s.num_min_timing_iters \
<< "\n Avg Timing Iterations: " << s.num_avg_timing_iters \
<< "\n Max Workspace Size: " << s.workspace_size \
<< "\n Device Type: " << s.device \
<< "\n Engine Capability: " << s.capability \
os << "Settings requested for TensorRT engine:" \
<< "\n Operating Precision: " << s.op_precision \
<< "\n Make Refittable Engine: " << s.refit \
<< "\n Debuggable Engine: " << s.debug \
<< "\n Strict Type: " << s.strict_types \
<< "\n Allow GPU Fallback (if running on DLA): " << s.allow_gpu_fallback \
<< "\n Min Timing Iterations: " << s.num_min_timing_iters \
<< "\n Avg Timing Iterations: " << s.num_avg_timing_iters \
<< "\n Max Workspace Size: " << s.workspace_size;

if (s.max_batch_size != 0) {
os << "\n Max Batch Size: " << s.max_batch_size;
} else {
os << "\n Max Batch Size: Not set";
}

os << "\n Device Type: " << s.device \
<< "\n Engine Capability: " << s.capability \
<< "\n Calibrator Created: " << (s.calibrator != nullptr);
return os;
}
Expand Down Expand Up @@ -62,14 +69,18 @@ ConversionCtx::ConversionCtx(BuilderSettings build_settings)
cfg->setFlag(nvinfer1::BuilderFlag::kDEBUG);
}

if (settings.strict_type) {
if (settings.strict_types) {
cfg->setFlag(nvinfer1::BuilderFlag::kSTRICT_TYPES);
}

if (settings.allow_gpu_fallback) {
cfg->setFlag(nvinfer1::BuilderFlag::kGPU_FALLBACK);
}

if (settings.max_batch_size != 0) {
builder->setMaxBatchSize(settings.max_batch_size);
}

cfg->setMinTimingIterations(settings.num_min_timing_iters);
cfg->setAvgTimingIterations(settings.num_avg_timing_iters);
cfg->setMaxWorkspaceSize(settings.workspace_size);
Expand Down
3 changes: 2 additions & 1 deletion core/conversion/conversionctx/ConversionCtx.h
Original file line number Diff line number Diff line change
Expand Up @@ -20,14 +20,15 @@ struct BuilderSettings {
nvinfer1::DataType op_precision = nvinfer1::DataType::kFLOAT;
bool refit = false;
bool debug = false;
bool strict_type = false;
bool strict_types = false;
bool allow_gpu_fallback = true;
nvinfer1::DeviceType device = nvinfer1::DeviceType::kGPU;
nvinfer1::EngineCapability capability = nvinfer1::EngineCapability::kDEFAULT;
nvinfer1::IInt8Calibrator* calibrator = nullptr;
uint64_t num_min_timing_iters = 2;
uint64_t num_avg_timing_iters = 1;
uint64_t workspace_size = 0;
uint64_t max_batch_size = 0;

BuilderSettings() = default;
BuilderSettings(const BuilderSettings& other) = default;
Expand Down
9 changes: 7 additions & 2 deletions cpp/api/include/trtorch/trtorch.h
Original file line number Diff line number Diff line change
Expand Up @@ -175,7 +175,7 @@ struct TRTORCH_API ExtraInfo {
/**
* Restrict operating type to only set default operation precision (op_precision)
*/
bool strict_type = false;
bool strict_types = false;

/**
* (Only used when targeting DLA (device))
Expand Down Expand Up @@ -205,7 +205,12 @@ struct TRTORCH_API ExtraInfo {
/**
* Maximum size of workspace given to TensorRT
*/
uint64_t workspace_size = 1 << 20;
uint64_t workspace_size = 0;

/**
* Maximum batch size (must be =< 1 to be set, 0 means not set)
*/
uint64_t max_batch_size = 0;

/**
* Calibration dataloaders for each input for post training quantizatiom
Expand Down
3 changes: 2 additions & 1 deletion cpp/api/src/extra_info.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -91,8 +91,9 @@ core::ExtraInfo to_internal_extra_info(ExtraInfo external) {

internal.convert_info.engine_settings.refit = external.refit;
internal.convert_info.engine_settings.debug = external.debug;
internal.convert_info.engine_settings.strict_type = external.strict_type;
internal.convert_info.engine_settings.strict_types = external.strict_types;
internal.convert_info.engine_settings.allow_gpu_fallback = external.allow_gpu_fallback;
internal.convert_info.engine_settings.max_batch_size = external.max_batch_size;

switch(external.device) {
case ExtraInfo::DeviceType::kDLA:
Expand Down

0 comments on commit 1b25542

Please sign in to comment.