@@ -302,45 +302,105 @@ auto select_registrations TORCHTRT_UNUSED =
     .pattern(
         {"aten::slice.Tensor(Tensor(a) self, int dim=0, int? start=None, int? end=None, int step=1) -> Tensor(a)",
          [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
-           auto in = args[0].ITensorOrFreeze(ctx);
-           auto axis = args[1].unwrapToInt();
-           auto maxDim = static_cast<int64_t>(in->getDimensions().d[axis]);
-           auto startIdx = 0;
-           auto startIdxIVal = args[2].IValue();
-           if (!startIdxIVal->isNone()) {
-             startIdx = startIdxIVal->toInt();
-           }
-           // Handle case when given tensor index is negative
-           auto start = (startIdx < 0) ? (maxDim + startIdx) : startIdx;
-           // Bound the end index to input tensor dimensions at specified axis
-           auto endIdx = maxDim;
-           auto endIdxIVal = args[3].IValue();
-           if (!endIdxIVal->isNone()) {
-             endIdx = std::min(endIdxIVal->toInt(), maxDim);
-           }
-           auto end = (endIdx < 0) ? (maxDim + endIdx) : endIdx;
-           auto step = args[4].unwrapToInt();
-
-           LOG_DEBUG("Start idx: " << start);
-           LOG_DEBUG("End idx: " << end);
-
-           // indices to be accessed need to be an at::Tensor
-           at::Tensor indices = torch::arange(start, end, step).to(torch::kI32);
-           auto weights = Weights(ctx, indices);
-
-           // IConstantLayer to convert indices from Weights to ITensor
-           auto const_layer = ctx->net->addConstant(weights.shape, weights.data);
-           TORCHTRT_CHECK(const_layer, "Unable to create constant layer from node: " << *n);
-           auto const_out = const_layer->getOutput(0);
-
-           // IGatherLayer takes in input tensor, the indices, and the axis of input tensor to take indices from
-           auto gather_layer = ctx->net->addGather(*in, *const_out, axis);
-           TORCHTRT_CHECK(gather_layer, "Unable to create gather layer from node: " << *n);
-           auto gather_out = gather_layer->getOutput(0);
-
-           auto out = ctx->AssociateValueAndTensor(n->outputs()[0], gather_out);
-
-           LOG_DEBUG("Slice layer output shape: " << out->getDimensions());
+           auto in = args[0].ITensorOrFreeze(ctx);
+           auto axis = args[1].unwrapToInt();
+           auto maxDim = static_cast<int64_t>(in->getDimensions().d[axis]);
+           bool dynamic_shape = is_dynamic_shape(in);
+           auto input_dim = in->getDimensions();
+           // add Shape Tensor
+           auto ishape_layer = ctx->net->addShape(*in);
+           auto ishape_tensor = ishape_layer->getOutput(0); // input shape
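+           // For dynamic input shapes, getDimensions() reports -1 for any
+           // dimension not known at build time, so the shape tensor above is the
+           // only reliable source for those extents at runtime.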
+
+           auto startIdx = 0;
+           auto startIdxIVal = args[2].IValue();
+           if (!startIdxIVal->isNone()) {
+             startIdx = startIdxIVal->toInt();
+           }
+           // Handle case when given tensor index is negative
+           if (maxDim > 0) { // only for static shape
+             startIdx = (startIdx < 0) ? (maxDim + startIdx) : startIdx;
+           }
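+           // When the dimension is dynamic (maxDim == -1), a negative start cannot
+           // be normalized here; it is carried through and resolved at runtime below.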
+
+           // Bound the end index to input tensor dimensions at specified axis
+           auto endIdx = maxDim; // -1 for dynamic shape
+           auto endIdxIVal = args[3].IValue();
+           if (!endIdxIVal->isNone()) {
+             endIdx = maxDim == -1 ? endIdxIVal->toInt() : std::min(endIdxIVal->toInt(), maxDim);
+           }
+           if (maxDim > 0) {
+             endIdx = (endIdx < 0) ? (maxDim + endIdx) : endIdx;
+           }
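+           // Likewise, a dynamic dimension leaves endIdx unclamped; negative or
+           // out-of-range values are fixed up against the runtime shape in the
+           // dynamic path below.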
+           auto step = args[4].unwrapToInt();
+
+           auto nbdims = in->getDimensions().nbDims;
+           nvinfer1::Dims start_, size_, stride_;
+           start_.nbDims = nbdims;
+           size_.nbDims = nbdims;
+           stride_.nbDims = nbdims;
+           for (int i = 0; i < nbdims; i++) {
+             if (i == axis) {
+               start_.d[i] = startIdx;
+               size_.d[i] = (endIdx - startIdx - 1) / step + 1;
+               stride_.d[i] = step;
+             } else {
+               start_.d[i] = 0;
+               size_.d[i] = input_dim.d[i]; // for static
+               stride_.d[i] = 1;
+             }
+           }
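+           // Note: along `axis` above, (endIdx - startIdx - 1) / step + 1 is the
+           // integer ceiling of (endIdx - startIdx) / step, i.e. the number of
+           // elements a Python-style slice [start:end:step] yields.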
+           auto slice_layer = ctx->net->addSlice(*in, start_, size_, stride_);
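+           // These build-time Dims are only meaningful for static shapes; the
+           // dynamic branch below overrides them with runtime tensors via setInput().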
+
+           if (dynamic_shape) { // dynamic shape
+             LOG_DEBUG("Using dynamic version of slice");
+             // start tensor
+             at::Tensor start_tensor = torch::zeros({nbdims}).to(torch::kI32);
+             start_tensor[axis] = startIdx;
+             auto start_itensor = toITensor(ctx, n, &start_tensor);
+
+             // step tensor
+             at::Tensor stride_tensor = torch::ones({nbdims}).to(torch::kI32);
+             stride_tensor[axis] = step;
+             auto stride_itensor = toITensor(ctx, n, &stride_tensor);
+
+             // end tensor
+             at::Tensor end_tensor = torch::zeros({nbdims}).to(torch::kI32);
+             for (int i = 0; i < nbdims; i++) {
+               if (i == axis) {
+                 end_tensor[i] = endIdxIVal->isNone() ? -1 : endIdx - 1;
+               } else {
+                 end_tensor[i] = input_dim.d[i] == -1 ? -1 : input_dim.d[i] - 1;
+               }
+             }
+             auto end_itensor = toITensor(ctx, n, &end_tensor);
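+             // end_tensor holds *inclusive* end indices, with -1 as a sentinel for
+             // "extent unknown until runtime"; both are resolved against the runtime
+             // shape tensor by update_start_and_end below.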
+
+             // one itensor
+             at::Tensor one_tensor = torch::ones({nbdims}).to(torch::kI32);
+             auto one_itensor = toITensor(ctx, n, &one_tensor);
+
+             // update start and end
+             nvinfer1::ITensor* out_start;
+             nvinfer1::ITensor* out_end;
+             update_start_and_end(
+                 ctx, n, ishape_tensor, start_itensor, end_itensor, &out_start, &out_end);
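+             // update_start_and_end (presumably added elsewhere in this change) maps
+             // negative and sentinel (-1) indices to concrete values using
+             // ishape_tensor, the input's runtime shape.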
+
+             // calculate size
+             auto sub_layer = ctx->net->addElementWise(*out_end, *out_start, nvinfer1::ElementWiseOperation::kSUB);
+             auto sub_itensor = sub_layer->getOutput(0);
+             auto div_layer = ctx->net->addElementWise(*sub_itensor, *stride_itensor, nvinfer1::ElementWiseOperation::kDIV);
+             auto div_itensor = div_layer->getOutput(0);
+             auto add_layer = ctx->net->addElementWise(*div_itensor, *one_itensor, nvinfer1::ElementWiseOperation::kSUM);
+             auto size_itensor = add_layer->getOutput(0);
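+             // size = (end - start) / stride + 1, computed elementwise at runtime;
+             // the +1 is needed because out_end holds inclusive indices.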
+
+             // update slice layer
+             slice_layer->setInput(1, *out_start); // start
+             slice_layer->setInput(2, *size_itensor); // size, must be set if input is dynamic
+           }
+           auto slice_out = slice_layer->getOutput(0);
+           auto out = ctx->AssociateValueAndTensor(n->outputs()[0], slice_out);
+           LOG_DEBUG("Slice layer output shape: " << out->getDimensions());
 
             return true;
           }})