[tensorrt] NFC: Fix broken translation test

christopherbate · christopherbate · commit f968d8efc21d · 2025-08-02T17:21:12.000Z
GitOrigin-RevId: cce60f66cb978ba012c074aca0d652710262457a
diff --git a/mlir-tensorrt/integrations/python/setup_utils.py b/mlir-tensorrt/integrations/python/setup_utils.py
@@ -127,6 +127,7 @@ def run_cmake_build(python_package_name: str, python_wheel_staging_dir: Path):
         cmake_options.append(
             f'-DMLIR_TRT_ENABLE_CUBLAS={os.environ["MLIR_TRT_ENABLE_CUBLAS"]}'
         )
+
     # Override TensorRT version if specified
     cmake_options.append(f"-DMLIR_TRT_DOWNLOAD_TENSORRT_VERSION={TENSORRT_VERSION}")
 
diff --git a/mlir-tensorrt/tensorrt/test/Target/TensorRT/host-tensor.mlir b/mlir-tensorrt/tensorrt/test/Target/TensorRT/host-tensor.mlir
@@ -0,0 +1,26 @@
+// RUN: %pick-one-gpu tensorrt-opt -split-input-file -pass-pipeline="builtin.module(translate-tensorrt-to-engine)" \
+// RUN:  -mlir-elide-elementsattrs-if-larger=32 -tensorrt-builder-opt-level=0 %s | FileCheck %s
+
+// CHECK-LABEL: func.func @trt_host_input
+//  CHECK-SAME: tensorrt.engine
+func.func @trt_host_input(
+        %arg0: tensor<?x4xf32> {tensorrt.dimension_names = {}, tensorrt.shape_profile = #tensorrt.shape_profile<min = [2, 4], opt = [4, 4], max = [6, 4]>}, 
+        %arg1: tensor<i32> {tensorrt.host_tensor, tensorrt.value_bounds = #tensorrt.shape_profile<min = [1], opt = [2], max = [3]>}) 
+        -> tensor<?x?xf32> {
+  %cst_i32 = tensorrt.constant dense<1> : tensor<i32>
+  %0 = tensorrt.element_wise <kSUM>(%arg0, %arg0 : tensor<?x4xf32>, tensor<?x4xf32>) -> tensor<?x4xf32>
+  %1 = tensorrt.shape %0 : tensor<?x4xf32> -> tensor<2xi32>
+  %2 = tensorrt.slice %1[0][1][1] : tensor<2xi32> to tensor<1xi32>
+  %3 = tensorrt.shuffle {first_transpose = array<i64: 0>, reshape = array<i64>, second_transpose = array<i64>, zero_is_placeholder = false} ins(%2 : tensor<1xi32>) -> tensor<i32>
+  %4 = tensorrt.element_wise <kPROD>(%3, %cst_i32 : tensor<i32>, tensor<i32>) -> tensor<i32>
+  %5 = tensorrt.slice %1[1][1][1] : tensor<2xi32> to tensor<1xi32>
+  %6 = tensorrt.shuffle {first_transpose = array<i64: 0>, reshape = array<i64>, second_transpose = array<i64>, zero_is_placeholder = false} ins(%5 : tensor<1xi32>) -> tensor<i32>
+  %7 = tensorrt.element_wise <kPROD>(%4, %6 : tensor<i32>, tensor<i32>) -> tensor<i32>
+  %8 = tensorrt.element_wise <kPROD>(%arg1, %cst_i32 : tensor<i32>, tensor<i32>) -> tensor<i32>
+  %9 = tensorrt.element_wise <kFLOOR_DIV>(%7, %8 : tensor<i32>, tensor<i32>) -> tensor<i32>
+  %10 = tensorrt.shuffle {first_transpose = array<i64>, reshape = array<i64: 1>, second_transpose = array<i64: 0>, zero_is_placeholder = false} ins(%9 : tensor<i32>) -> tensor<?xi32>
+  %11 = tensorrt.shuffle {first_transpose = array<i64>, reshape = array<i64: 1>, second_transpose = array<i64: 0>, zero_is_placeholder = false} ins(%arg1 : tensor<i32>) -> tensor<?xi32>
+  %12 = tensorrt.concatenation {axis = 0 : i32} ins(%10, %11 : tensor<?xi32>, tensor<?xi32>) -> tensor<2xi32>
+  %13 = tensorrt.shuffle {first_transpose = array<i64: 0, 1>, second_transpose = array<i64: 0, 1>, zero_is_placeholder = false} ins(%0, %12 : tensor<?x4xf32>, tensor<2xi32>) -> tensor<?x?xf32>
+  return %13 : tensor<?x?xf32>
+}
diff --git a/mlir-tensorrt/tensorrt/test/Target/TensorRT/translate-to-tensorrt.mlir b/mlir-tensorrt/tensorrt/test/Target/TensorRT/translate-to-tensorrt.mlir
@@ -65,27 +65,3 @@ func.func @trt_dim_names(
   %0 = tensorrt.identity %arg0 : tensor<?x?xf32> to tensor<?x?xf32>
   return %0 : tensor<?x?xf32>
 }
-
-// CHECK-LABEL: @trt_host_input
-//  CHECK-SAME: tensorrt.engine
-func.func @trt_host_input(%arg0: tensor<?x4xf32> {tensorrt.dimension_names = {}, tensorrt.shape_profile = #tensorrt.shape_profile<min = [2, 4], opt = [4, 4], max = [6, 4]>}, %arg1: tensor<i32> {plan.memory_space = #plan.memory_space<host>, tensorrt.value_bounds = #tensorrt.shape_profile<min = [1], opt = [2], max = [3]>}) -> tensor<?x?xf32> {
-    %0 = tensorrt.element_wise <kSUM>(%arg0, %arg0 : tensor<?x4xf32>, tensor<?x4xf32>) -> tensor<?x4xf32>
-    %1 = tensorrt.shape %0 : tensor<?x4xf32> -> tensor<2xi32>
-    %2 = tensorrt.slice %1[0][1][1] : tensor<2xi32> to tensor<1xi32>
-    %3 = tensorrt.collapse_rank %2 : tensor<1xi32> to tensor<i32>
-    %cst_i32 = tensorrt.constant dense<1> : tensor<i32>
-    %4 = tensorrt.element_wise <kPROD>(%3, %cst_i32 : tensor<i32>, tensor<i32>) -> tensor<i32>
-    %5 = tensorrt.slice %1[1][1][1] : tensor<2xi32> to tensor<1xi32>
-    %6 = tensorrt.collapse_rank %5 : tensor<1xi32> to tensor<i32>
-    %7 = tensorrt.element_wise <kPROD>(%4, %6 : tensor<i32>, tensor<i32>) -> tensor<i32>
-    %cst_i32_0 = tensorrt.constant dense<1> : tensor<i32>
-    %8 = tensorrt.element_wise <kPROD>(%arg1, %cst_i32_0 : tensor<i32>, tensor<i32>) -> tensor<i32>
-    %9 = tensorrt.element_wise <kFLOOR_DIV>(%7, %8 : tensor<i32>, tensor<i32>) -> tensor<i32>
-    %cst_i32_1 = tensorrt.constant dense<1> : tensor<1xi32>
-    %10 = tensorrt.reshape %9 shape(%cst_i32_1: tensor<1xi32>) : tensor<i32> to tensor<?xi32>
-    %cst_i32_2 = tensorrt.constant dense<1> : tensor<1xi32>
-    %11 = tensorrt.reshape %arg1 shape(%cst_i32_2: tensor<1xi32>) : tensor<i32> to tensor<?xi32>
-    %12 = tensorrt.concatenation {axis = 0 : i32} ins(%10, %11 : tensor<?xi32>, tensor<?xi32>) -> tensor<2xi32>
-    %13 = tensorrt.reshape %0 shape(%12: tensor<2xi32>) : tensor<?x4xf32> to tensor<?x?xf32>
-    return %13 : tensor<?x?xf32>
-}

Original file line number	Diff line number	Diff line change
`@@ -127,6 +127,7 @@ def run_cmake_build(python_package_name: str, python_wheel_staging_dir: Path):`
`127`	`127`	`cmake_options.append(`
`128`	`128`	`f'-DMLIR_TRT_ENABLE_CUBLAS={os.environ["MLIR_TRT_ENABLE_CUBLAS"]}'`
`129`	`129`	`)`
	`130`	`+`
`130`	`131`	`# Override TensorRT version if specified`
`131`	`132`	`cmake_options.append(f"-DMLIR_TRT_DOWNLOAD_TENSORRT_VERSION={TENSORRT_VERSION}")`
`132`	`133`