From b8add61eefe7a609e0d21561b17284301ca15f9f Mon Sep 17 00:00:00 2001
From: Yao Wang <kevinthesunwy@gmail.com>
Date: Wed, 2 Dec 2020 23:59:39 +0000
Subject: [PATCH 1/7] Fix GPU dynamic Topk

---
 include/tvm/topi/nn.h            |  2 +-
 include/tvm/topi/transform.h     | 70 ++++++++++++++++++++++++++++----
 python/tvm/topi/cuda/sort.py     | 28 +++++++++++--
 src/relay/op/tensor/transform.cc | 19 ++++++---
 tests/python/relay/test_any.py   |  8 +---
 5 files changed, 102 insertions(+), 25 deletions(-)
diff --git a/include/tvm/topi/nn.h b/include/tvm/topi/nn.h
index f958048f13c3..71944071a7ce 100644
--- a/include/tvm/topi/nn.h
+++ b/include/tvm/topi/nn.h
@@ -614,7 +614,7 @@ inline tvm::te::Tensor batch_to_space_nd(const tvm::te::Tensor& data,
   out = reshape(out, r_p_shape);
 
   // Crop the start and end of dimensions of out
-  Array<Integer> begin_idx, end_idx, strides;
+  Array<PrimExpr> begin_idx, end_idx, strides;
   for (size_t i = 0; i < r_p_shape.size(); ++i) {
     strides.push_back(Integer(1));
     if (i > 0 && i <= num_block_dims) {
diff --git a/include/tvm/topi/transform.h b/include/tvm/topi/transform.h
index c866dfb7f86b..4e7f90189c56 100644
--- a/include/tvm/topi/transform.h
+++ b/include/tvm/topi/transform.h
@@ -598,17 +598,69 @@ inline te::Tensor dynamic_strided_slice(const te::Tensor& x, const te::Tensor& b
  *
  * \return A Tensor whose op member is the split operation
  */
-inline Tensor strided_slice(const Tensor& x, const Array<Integer>& begin, const Array<Integer>& end,
-                            const Array<Integer>& strides, std::string slice_mode = "end",
-                            std::string name = "T_strided_slice", std::string tag = kInjective) {
+inline Tensor strided_slice(const Tensor& x, const Array<PrimExpr>& begin,
+		            const Array<PrimExpr>& end, const Array<PrimExpr>& strides,
+			    std::string slice_mode = "end", std::string name = "T_strided_slice",
+			    std::string tag = kInjective) {
   size_t src_tensor_dim = static_cast<size_t>(x->shape.size());
+  // Quick path for dynamic shape strided slice.
+  // This is for ease of use to dynamice strided slice in topi.
+  bool is_dyn = false;
+  for (size_t i = 0; i < src_tensor_dim; ++i) {
+    if (!IsConstInt(x->shape[i])) {
+      is_dyn = true;
+      break;
+    }
+  }
+  if (!is_dyn) {
+    for (size_t i = 0; i < begin.size(); ++i) {
+      if (begin[i].defined() && !IsConstInt(begin[i])) {
+        is_dyn = true;
+	break;
+      }
+    }
+  }
+  if (!is_dyn) {
+    for (size_t i = 0; i < end.size(); ++i) {
+      if (end[i].defined() && !IsConstInt(end[i])) {
+        is_dyn = true;
+        break;
+      }
+    }
+  }
+  if (!is_dyn) {
+    for (size_t i = 0; i < strides.size(); ++i) {
+      if (strides[i].defined() && !IsConstInt(strides[i])) {
+        is_dyn = true;
+        break;
+      }
+    }
+  }
+
+  Array<PrimExpr> out_shape;
+  if (is_dyn) {
+    for (size_t i = 0; i < src_tensor_dim; ++i) {
+      out_shape.push_back(indexdiv(end[i] - begin[i], strides[i]));
+    }
+    return te::compute(
+        out_shape,
+        [&](const Array<tvm::tir::Var>& indices) {
+          Array<PrimExpr> real_indices;
+          for (size_t i = 0; i < src_tensor_dim; ++i) {
+            real_indices.push_back(indices[i] * strides[i] + begin[i]);
+          }
+          return x(real_indices);
+        },
+        name, tag);
+  }
+
   // Setup the ranges.
   // NOTE: this code duplicates the shape inference logic relay.op
   // Consider to refactor in the future.
   std::vector<int64_t> stride_vec(src_tensor_dim, 1);
   for (size_t i = 0; i < strides.size(); ++i) {
     ICHECK(strides[i].defined());
-    stride_vec[i] = strides[i]->value;
+    stride_vec[i] = GetConstInt(strides[i]);
   }
 
   const int64_t max_range = std::numeric_limits<int64_t>::max();
@@ -619,7 +671,7 @@ inline Tensor strided_slice(const Tensor& x, const Array<Integer>& begin, const
       // value=None
       begin_vec.push_back(stride_vec[i] > 0 ? 0 : max_range);
     } else {
-      begin_vec.push_back(begin[i]->value);
+      begin_vec.push_back(GetConstInt(begin[i]));
     }
   }
   for (size_t i = begin_vec.size(); i < src_tensor_dim; ++i) {
@@ -633,20 +685,20 @@ inline Tensor strided_slice(const Tensor& x, const Array<Integer>& begin, const
     if (!end[i].defined()) {
       end_vec.push_back(stride_vec[i] < 0 ? 0 : max_range);
     } else if (slice_mode == "size") {
-      if (end[i]->value < 0) {
+      int64_t end_val = GetConstInt(end[i]);
+      if (end_val < 0) {
         end_vec.push_back(stride_vec[i] < 0 ? 0 : max_range);
       } else {
-        end_vec.push_back(begin_vec[i] + end[i]->value);
+        end_vec.push_back(begin_vec[i] + end_val);
       }
     } else {
-      end_vec.push_back(end[i]->value);
+      end_vec.push_back(GetConstInt(end[i]));
     }
   }
   for (size_t i = end_vec.size(); i < src_tensor_dim; ++i) {
     end_vec.push_back(stride_vec[i] < 0 ? 0 : max_range);
   }
   // Compute
-  Array<PrimExpr> out_shape;
   Array<PrimExpr> begin_expr;
   Array<PrimExpr> strides_expr;
 
diff --git a/python/tvm/topi/cuda/sort.py b/python/tvm/topi/cuda/sort.py
index 465299a5bc8f..ec65b656eb87 100644
--- a/python/tvm/topi/cuda/sort.py
+++ b/python/tvm/topi/cuda/sort.py
@@ -455,6 +455,7 @@ def topk(data, k=1, axis=-1, ret_type="both", is_ascend=False, dtype="int64"):
     out : tvm.te.Tensor or List[tvm.te.Tensor]
         The computed result.
     """
+    return topk_thrust(data, k=1, axis=-1, ret_type="both", is_ascend=False, dtype="int64")
     assert ret_type in ["both", "values", "indices"]
     ndim = len(data.shape)
     axis = axis + ndim if axis < 0 else axis
@@ -561,10 +562,31 @@ def topk_thrust(data, k=1, axis=-1, ret_type="both", is_ascend=False, dtype="int
         tag="topk_gpu",
     )
 
-    if k > 0:
+    is_dyn = not isinstance(k, int)
+    for dim in data.shape:
+        if not isinstance(dim, tvm.tir.IntImm):
+            is_dyn = True
+            break
+
+    if not is_dyn:
+        if k > 0:
+            beg = [0] * ndim
+            end = data.shape[:axis] + [k] + data.shape[axis:]
+            out = [strided_slice(o, beg, end) for o in out]
+    else:
         beg = [0] * ndim
-        end = data.shape[:-1] + [k]
-        out = [strided_slice(o, beg, end) for o in out]
+        end = []
+        for i in range(len(data.shape)):
+            if i == axis:
+                if isinstance(k, int):
+                    end.append(data.shape[i] if k <= 0 else k)
+                else:
+                    end.append(tvm.te.size_var("dim"))
+            else:
+                end.append(data.shape[i])
+
+        strides = [1] * ndim
+        out = [strided_slice(o, beg, end, strides) for o in out]
 
     if axis != ndim - 1:
         axes = swap(list(range(ndim)), axis)
diff --git a/src/relay/op/tensor/transform.cc b/src/relay/op/tensor/transform.cc
index d1f2f267c580..62e143197d9e 100644
--- a/src/relay/op/tensor/transform.cc
+++ b/src/relay/op/tensor/transform.cc
@@ -2312,6 +2312,7 @@ Array<te::Tensor> StridedSliceCompute(const Attrs& attrs, const Array<te::Tensor
   const StridedSliceAttrs* param = attrs.as<StridedSliceAttrs>();
   ICHECK(param != nullptr);
   Array<Integer> begin, end, strides;
+  Array<PrimExpr> begin_expr, end_expr, strides_expr;
   begin = param->begin.value();
   end = param->end.value();
   strides = param->strides.value();
@@ -2324,8 +2325,6 @@ Array<te::Tensor> StridedSliceCompute(const Attrs& attrs, const Array<te::Tensor
     for (size_t i = 0; i < src_tensor_dim; ++i) {
       out_shape.push_back(tvm::tir::Var("dim"));
     }
-    Array<PrimExpr> begin_expr;
-    Array<PrimExpr> strides_expr;
     for (size_t i = 0; i < src_tensor_dim; ++i) {
       int64_t begin_i = begin[i]->value;
       if (begin_i < 0) {
@@ -2346,8 +2345,19 @@ Array<te::Tensor> StridedSliceCompute(const Attrs& attrs, const Array<te::Tensor
           return input(real_indices);
         },
         std::string{"T_strided_slice_dynamic"}, std::string{topi::kInjective})};
+  } else {
+    for (size_t i = 0; i < begin.size(); ++i) {
+      begin_expr.push_back(begin[i]);
+    }
+    for (size_t i = 0; i < end.size(); ++i) {
+      end_expr.push_back(end[i]);
+    }
+    for (size_t i = 0; i < strides.size(); ++i) {
+      strides_expr.push_back(strides[i]);
+    }
   }
-  return Array<te::Tensor>{topi::strided_slice(inputs[0], begin, end, strides, param->slice_mode)};
+  return Array<te::Tensor>{
+      topi::strided_slice(inputs[0], begin_expr, end_expr, strides_expr, param->slice_mode)};
 }
 
 // Positional relay function to create StridedSlice operator used by frontend FFI.
@@ -2663,8 +2673,7 @@ Array<te::Tensor> SliceLikeCompute(const Attrs& attrs, const Array<te::Tensor>&
           << topi::GetConstInt(src_shape[axis]);
     }
   }
-  return Array<te::Tensor>{topi::strided_slice(inputs[0], GetIntArray(begin_idx),
-                                               GetIntArray(end_idx), GetIntArray(strides), "end")};
+  return Array<te::Tensor>{topi::strided_slice(inputs[0], begin_idx, end_idx, strides, "end")};
 }
 
 TVM_REGISTER_GLOBAL("relay.op._make.slice_like").set_body_typed(MakeSliceLike);
diff --git a/tests/python/relay/test_any.py b/tests/python/relay/test_any.py
index 546973704fea..8aa7536f632e 100644
--- a/tests/python/relay/test_any.py
+++ b/tests/python/relay/test_any.py
@@ -815,13 +815,7 @@ def verify_any_topk(data_shape, kval, np_dshape, dtype, const_k=False):
     else:
         ref_out = sorted[0:kval]
 
-    for kind in ["debug", "vm"]:
-        ex = relay.create_executor(kind, mod=mod, ctx=tvm.cpu(), target="llvm")
-        result = ex.evaluate()(*in_vals)
-        tvm.testing.assert_allclose(result.asnumpy(), ref_out)
-
-    # TODO(@zhiics) Fix topk cuda schedule for dynamic inputs
-    # check_result(in_vals, mod, ref_out)
+    check_result(in_vals, mod, ref_out)
 
 
 def test_any_topk():

From 4a5f4a81562c687bb86981189481816d881c67ba Mon Sep 17 00:00:00 2001
From: Yao Wang <kevinthesunwy@gmail.com>
Date: Thu, 3 Dec 2020 00:04:59 +0000
Subject: [PATCH 2/7] Fix style

---
 include/tvm/topi/transform.h | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/include/tvm/topi/transform.h b/include/tvm/topi/transform.h
index 4e7f90189c56..d89370719150 100644
--- a/include/tvm/topi/transform.h
+++ b/include/tvm/topi/transform.h
@@ -599,9 +599,9 @@ inline te::Tensor dynamic_strided_slice(const te::Tensor& x, const te::Tensor& b
  * \return A Tensor whose op member is the split operation
  */
 inline Tensor strided_slice(const Tensor& x, const Array<PrimExpr>& begin,
-		            const Array<PrimExpr>& end, const Array<PrimExpr>& strides,
-			    std::string slice_mode = "end", std::string name = "T_strided_slice",
-			    std::string tag = kInjective) {
+                            const Array<PrimExpr>& end, const Array<PrimExpr>& strides,
+                            std::string slice_mode = "end", std::string name = "T_strided_slice",
+                            std::string tag = kInjective) {
   size_t src_tensor_dim = static_cast<size_t>(x->shape.size());
   // Quick path for dynamic shape strided slice.
   // This is for ease of use to dynamice strided slice in topi.
@@ -616,7 +616,7 @@ inline Tensor strided_slice(const Tensor& x, const Array<PrimExpr>& begin,
     for (size_t i = 0; i < begin.size(); ++i) {
       if (begin[i].defined() && !IsConstInt(begin[i])) {
         is_dyn = true;
-	break;
+        break;
       }
     }
   }

From 7855e49a71d7b5005cc87a69deece15fe420cbb1 Mon Sep 17 00:00:00 2001
From: Yao Wang <kevinthesunwy@gmail.com>
Date: Thu, 3 Dec 2020 00:23:07 +0000
Subject: [PATCH 3/7] Minor fix

---
 python/tvm/topi/cuda/sort.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/python/tvm/topi/cuda/sort.py b/python/tvm/topi/cuda/sort.py
index ec65b656eb87..7b348a775285 100644
--- a/python/tvm/topi/cuda/sort.py
+++ b/python/tvm/topi/cuda/sort.py
@@ -455,7 +455,6 @@ def topk(data, k=1, axis=-1, ret_type="both", is_ascend=False, dtype="int64"):
     out : tvm.te.Tensor or List[tvm.te.Tensor]
         The computed result.
     """
-    return topk_thrust(data, k=1, axis=-1, ret_type="both", is_ascend=False, dtype="int64")
     assert ret_type in ["both", "values", "indices"]
     ndim = len(data.shape)
     axis = axis + ndim if axis < 0 else axis

From d30b7a6e3cb51020c179fa98b7e61f3a135036d3 Mon Sep 17 00:00:00 2001
From: Yao Wang <kevinthesunwy@gmail.com>
Date: Thu, 3 Dec 2020 00:53:03 +0000
Subject: [PATCH 4/7] Simplify dynamic checking

---
 include/tvm/topi/detail/constant_utils.h | 15 ++++++++++
 include/tvm/topi/transform.h             | 37 ++++--------------------
 2 files changed, 20 insertions(+), 32 deletions(-)

diff --git a/include/tvm/topi/detail/constant_utils.h b/include/tvm/topi/detail/constant_utils.h
index 412c79330ca9..a0c3c19f832e 100644
--- a/include/tvm/topi/detail/constant_utils.h
+++ b/include/tvm/topi/detail/constant_utils.h
@@ -47,6 +47,21 @@ using namespace tvm::te;
  */
 inline bool IsConstInt(PrimExpr expr) { return expr->IsInstance<tvm::tir::IntImmNode>(); }
 
+/*!
+ * \brief Test whether the given Array has every element as constant integer
+ *
+ * \param array the array to query
+ *
+ * \return true if every element in array is constant int or uint, false otherwise.
+ */
+inline bool IsConstIntArray(Array<PrimExpr> array) { 
+   bool is_const_int = true;
+  for (auto const& elem : array) {
+    is_const_int &= elem->IsInstance<tvm::tir::IntImmNode>();
+  }
+  return is_const_int;
+}
+
 /*!
  * \brief Get the value of the given constant integer expression. An error
  * is logged if the given expression is not a constant integer.
diff --git a/include/tvm/topi/transform.h b/include/tvm/topi/transform.h
index d89370719150..265ba0f315b5 100644
--- a/include/tvm/topi/transform.h
+++ b/include/tvm/topi/transform.h
@@ -605,40 +605,13 @@ inline Tensor strided_slice(const Tensor& x, const Array<PrimExpr>& begin,
   size_t src_tensor_dim = static_cast<size_t>(x->shape.size());
   // Quick path for dynamic shape strided slice.
   // This is for ease of use to dynamice strided slice in topi.
-  bool is_dyn = false;
-  for (size_t i = 0; i < src_tensor_dim; ++i) {
-    if (!IsConstInt(x->shape[i])) {
-      is_dyn = true;
-      break;
-    }
-  }
-  if (!is_dyn) {
-    for (size_t i = 0; i < begin.size(); ++i) {
-      if (begin[i].defined() && !IsConstInt(begin[i])) {
-        is_dyn = true;
-        break;
-      }
-    }
-  }
-  if (!is_dyn) {
-    for (size_t i = 0; i < end.size(); ++i) {
-      if (end[i].defined() && !IsConstInt(end[i])) {
-        is_dyn = true;
-        break;
-      }
-    }
-  }
-  if (!is_dyn) {
-    for (size_t i = 0; i < strides.size(); ++i) {
-      if (strides[i].defined() && !IsConstInt(strides[i])) {
-        is_dyn = true;
-        break;
-      }
-    }
-  }
+  bool is_static = IsConstIntArray(x->shape);
+  is_static &= IsConstIntArray(begin);
+  is_static &= IsConstIntArray(end);
+  is_static &= IsConstIntArray(strides);
 
   Array<PrimExpr> out_shape;
-  if (is_dyn) {
+  if (!is_static) {
     for (size_t i = 0; i < src_tensor_dim; ++i) {
       out_shape.push_back(indexdiv(end[i] - begin[i], strides[i]));
     }

From ce76572afda8d7a7331d92eee3c1c01bcff689bb Mon Sep 17 00:00:00 2001
From: Yao Wang <kevinthesunwy@gmail.com>
Date: Thu, 3 Dec 2020 00:59:38 +0000
Subject: [PATCH 5/7] Fix lint

---
 include/tvm/topi/detail/constant_utils.h | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/include/tvm/topi/detail/constant_utils.h b/include/tvm/topi/detail/constant_utils.h
index a0c3c19f832e..49ce21b5732e 100644
--- a/include/tvm/topi/detail/constant_utils.h
+++ b/include/tvm/topi/detail/constant_utils.h
@@ -54,8 +54,8 @@ inline bool IsConstInt(PrimExpr expr) { return expr->IsInstance<tvm::tir::IntImm
  *
  * \return true if every element in array is constant int or uint, false otherwise.
  */
-inline bool IsConstIntArray(Array<PrimExpr> array) { 
-   bool is_const_int = true;
+inline bool IsConstIntArray(Array<PrimExpr> array) {
+  bool is_const_int = true;
   for (auto const& elem : array) {
     is_const_int &= elem->IsInstance<tvm::tir::IntImmNode>();
   }

From 96cdac0fde37506375c596aac7fd21259786c184 Mon Sep 17 00:00:00 2001
From: Yao Wang <kevinthesunwy@gmail.com>
Date: Thu, 3 Dec 2020 02:26:54 +0000
Subject: [PATCH 6/7] More improvements

---
 python/tvm/topi/cuda/sort.py                  | 24 ++-----------------
 .../relay/dyn/test_dynamic_op_level6.py       |  6 +++--
 2 files changed, 6 insertions(+), 24 deletions(-)

diff --git a/python/tvm/topi/cuda/sort.py b/python/tvm/topi/cuda/sort.py
index 7b348a775285..ca5c0d5a2687 100644
--- a/python/tvm/topi/cuda/sort.py
+++ b/python/tvm/topi/cuda/sort.py
@@ -561,29 +561,9 @@ def topk_thrust(data, k=1, axis=-1, ret_type="both", is_ascend=False, dtype="int
         tag="topk_gpu",
     )
 
-    is_dyn = not isinstance(k, int)
-    for dim in data.shape:
-        if not isinstance(dim, tvm.tir.IntImm):
-            is_dyn = True
-            break
-
-    if not is_dyn:
-        if k > 0:
-            beg = [0] * ndim
-            end = data.shape[:axis] + [k] + data.shape[axis:]
-            out = [strided_slice(o, beg, end) for o in out]
-    else:
+    if not isinstance(k, int) or k > 0:
         beg = [0] * ndim
-        end = []
-        for i in range(len(data.shape)):
-            if i == axis:
-                if isinstance(k, int):
-                    end.append(data.shape[i] if k <= 0 else k)
-                else:
-                    end.append(tvm.te.size_var("dim"))
-            else:
-                end.append(data.shape[i])
-
+        end = data.shape[:-1] + [k if isinstance(k, int) else tvm.te.size_var("dim")]
         strides = [1] * ndim
         out = [strided_slice(o, beg, end, strides) for o in out]
 
diff --git a/tests/python/relay/dyn/test_dynamic_op_level6.py b/tests/python/relay/dyn/test_dynamic_op_level6.py
index aeed8db7c1b6..4b2e4822d6ae 100644
--- a/tests/python/relay/dyn/test_dynamic_op_level6.py
+++ b/tests/python/relay/dyn/test_dynamic_op_level6.py
@@ -22,8 +22,8 @@
 from tvm import relay
 import tvm.testing
 
-# TODO(mbrookhart): Enable when we can get it working
-# @tvm.testing.uses_gpu
+
+@tvm.testing.uses_gpu
 def test_dynamic_topk():
     def verify_topk(k, axis, ret_type, is_ascend, dtype):
         shape = (20, 100)
@@ -53,6 +53,8 @@ def verify_topk(k, axis, ret_type, is_ascend, dtype):
         np_indices = np_indices.astype(dtype)
 
         for target, ctx in tvm.testing.enabled_targets():
+            if "nvptx" in target:
+                continue
             for kind in ["vm", "debug"]:
                 mod = tvm.ir.IRModule.from_expr(func)
                 intrp = relay.create_executor(kind, mod=mod, ctx=ctx, target=target)

From 164a664d6fb41403119ff737bd94f1b6be5d271a Mon Sep 17 00:00:00 2001
From: Yao Wang <kevinthesunwy@gmail.com>
Date: Thu, 3 Dec 2020 21:49:38 +0000
Subject: [PATCH 7/7] Disable test any topk

---
 python/tvm/topi/cuda/sort.py                     | 13 +++++++------
 tests/python/relay/dyn/test_dynamic_op_level6.py |  2 --
 tests/python/relay/test_any.py                   |  2 ++
 3 files changed, 9 insertions(+), 8 deletions(-)

diff --git a/python/tvm/topi/cuda/sort.py b/python/tvm/topi/cuda/sort.py
index ca5c0d5a2687..ac14f5aae779 100644
--- a/python/tvm/topi/cuda/sort.py
+++ b/python/tvm/topi/cuda/sort.py
@@ -479,27 +479,28 @@ def topk(data, k=1, axis=-1, ret_type="both", is_ascend=False, dtype="int64"):
             name="topk_gpu",
             tag="topk_gpu",
         )
-    if k < 1:
+    if isinstance(k, int) and k < 1:
         if ret_type == "indices":
             return output[1]
         return output
     beg = [0] * ndim
     end = []
+    strides = [1] * ndim
     for i in range(ndim):
         if i == axis:
-            end.append(k)
+            end.append(k if isinstance(k, int) else tvm.te.size_var("dim"))
         else:
             end.append(data.shape[i])
     if ret_type == "both":
         values_out, indices_out = output
-        values_out = strided_slice(values_out, beg, end)
-        indices_out = strided_slice(indices_out, beg, end)
+        values_out = strided_slice(values_out, beg, end, strides)
+        indices_out = strided_slice(indices_out, beg, end, strides)
         output = [values_out, indices_out]
     elif ret_type == "values":
-        output = [strided_slice(output, beg, end)]
+        output = [strided_slice(output, beg, end, strides)]
     else:  # ret_type == "indices"
         indices_out = output[1]
-        output = [strided_slice(indices_out, beg, end)]
+        output = [strided_slice(indices_out, beg, end, strides)]
     return output
 
 
diff --git a/tests/python/relay/dyn/test_dynamic_op_level6.py b/tests/python/relay/dyn/test_dynamic_op_level6.py
index 4b2e4822d6ae..52abbe2a15b6 100644
--- a/tests/python/relay/dyn/test_dynamic_op_level6.py
+++ b/tests/python/relay/dyn/test_dynamic_op_level6.py
@@ -53,8 +53,6 @@ def verify_topk(k, axis, ret_type, is_ascend, dtype):
         np_indices = np_indices.astype(dtype)
 
         for target, ctx in tvm.testing.enabled_targets():
-            if "nvptx" in target:
-                continue
             for kind in ["vm", "debug"]:
                 mod = tvm.ir.IRModule.from_expr(func)
                 intrp = relay.create_executor(kind, mod=mod, ctx=ctx, target=target)
diff --git a/tests/python/relay/test_any.py b/tests/python/relay/test_any.py
index 8aa7536f632e..e2a6c54ec0cc 100644
--- a/tests/python/relay/test_any.py
+++ b/tests/python/relay/test_any.py
@@ -818,6 +818,8 @@ def verify_any_topk(data_shape, kval, np_dshape, dtype, const_k=False):
     check_result(in_vals, mod, ref_out)
 
 
+# TODO(kevinthesun): enable this test when Thrust is available in ci.
+# @tvm.testing.uses_gpu
 def test_any_topk():
     verify_any_topk(any_dims(1), 5, (10,), "float32")
     verify_any_topk(any_dims(2), 2, (6, 3), "int32")