NVIDIA
diff --git a/‎cpp/tensorrt_llm/kernels/IndexerTopK.h‎
Lines changed: 5 additions & 5 deletions b/‎cpp/tensorrt_llm/kernels/IndexerTopK.h‎
Lines changed: 5 additions & 5 deletions
@@ -24,12 +24,12 @@
 
 namespace tensorrt_llm::kernels
 {
-void invokeIndexerTopKDecode(float const* logits, int const* seqLens, int* outIndices, float* auxLogits,
-    int* auxIndices, int const splitWorkThreshold, int const numRows, int const numColumns, int const stride0,
-    int const stride1, int const next_n, int const index_topk = 2048, cudaStream_t const stream = 0);
+void invokeIndexerTopKDecode(float const* logits, int const* seqLens, int* indices, float* outLogitsAux,
+    int* outIndicesAux, int const splitWorkThreshold, int const numRows, int const numColumns, int const stride0,
+    int const stride1, int const next_n, int const topK = 2048, cudaStream_t const stream = 0);
 
-void invokeIndexerTopKPrefill(float const* logits, int const* rowStarts, int const* rowEnds, int* outIndices,
-    int const numRows, int const numColumns, int const stride0, int const stride1, int const index_topk = 2048,
+void invokeIndexerTopKPrefill(float const* logits, int const* rowStarts, int const* rowEnds, int* indices,
+    int const numRows, int const numColumns, int const stride0, int const stride1, int const topK = 2048,
     cudaStream_t const stream = 0);
 
 } // namespace tensorrt_llm::kernels