Skip to content

Commit

Permalink
Improve performance of converted layer_norm ops
Browse files Browse the repository at this point in the history
  • Loading branch information
mfeliz-cruise committed Sep 5, 2023
1 parent 2155021 commit 9f68439
Showing 1 changed file with 4 additions and 4 deletions.
8 changes: 4 additions & 4 deletions core/conversion/converters/impl/layer_norm.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -90,16 +90,16 @@ auto layer_norm_registrations TORCHTRT_UNUSED = RegisterNodeConversionPatterns()

auto normalized = div_out;

-//gamma
-if (args[2].IValue()->isTensor()){
+// gamma
+if (args[2].IValue()->isTensor()) {
auto gamma = args[2].ITensorOrFreeze(ctx);
auto gamma_prod = add_elementwise(
ctx, nvinfer1::ElementWiseOperation::kPROD, normalized, gamma, (util::node_info(n) + "_gamma").c_str());
normalized = gamma_prod->getOutput(0);
}

-//beta
-if (args[3].IValue()->isTensor()){
+// beta
+if (args[3].IValue()->isTensor()) {
auto beta = args[3].ITensorOrFreeze(ctx);
auto beta_sum = add_elementwise(
ctx, nvinfer1::ElementWiseOperation::kSUM, normalized, beta, (util::node_info(n) + "_beta").c_str());
Expand Down

0 comments on commit 9f68439

Please sign in to comment.