add length check to unwrap arguments

Signed-off-by: Jinjie Liu <jjliu@baai.ac.cn>
2026-05-02 03:52:11 +08:00 · 2026-02-12 15:31:50 +08:00
parent 599957e156
commit a727526794
4 changed files with 16 additions and 15 deletions
--- a/examples/attention/attnbwd.cc
+++ b/examples/attention/attnbwd.cc
@@ -1,10 +1,9 @@
-#include "ATen/core/ATen_fwd.h"
-#include "ATen/ops/empty.h"
-#include "c10/core/Device.h"
-#include "torch/headeronly/core/DeviceType.h"
-#include "tvm/ffi/container/tensor.h"
 #include <ATen/DLConvertor.h>
+#include <ATen/core/ATen_fwd.h>
 #include <ATen/dlpack.h>
+#include <ATen/ops/empty.h>
+#include <torch/headeronly/core/DeviceType.h>
+#include <tvm/ffi/container/tensor.h>
 #include <tvm/ffi/extra/cuda/cubin_launcher.h>
 #include <tvm/ffi/function.h>
 #include <tvm/ffi/tvm_ffi.h>
--- a/examples/attention/attnbwdpre.cc
+++ b/examples/attention/attnbwdpre.cc
@@ -1,9 +1,9 @@
-#include "ATen/core/ATen_fwd.h"
-#include "ATen/ops/empty.h"
-#include "torch/headeronly/core/DeviceType.h"
-#include "tvm/ffi/container/tensor.h"
 #include <ATen/DLConvertor.h>
+#include <ATen/core/ATen_fwd.h>
 #include <ATen/dlpack.h>
+#include <ATen/ops/empty.h>
+#include <torch/headeronly/core/DeviceType.h>
+#include <tvm/ffi/container/tensor.h>
 #include <tvm/ffi/extra/cuda/cubin_launcher.h>
 #include <tvm/ffi/function.h>
 #include <tvm/ffi/tvm_ffi.h>
@@ -28,8 +28,9 @@ tvm::ffi::Tensor AttnBwdPreprocess(tvm::ffi::Tensor o, tvm::ffi::Tensor do_,
      tvm::ffi::Tensor::FromDLPack(at::toDLPack(deltaTorch));
  tvm::ffi::Tuple<int32_t, int32_t, int32_t> grid(kNCtx / kPreBlock,
                                                  kBatch * kNHead, 1);
-  tvm::ffi::Array<tvm::ffi::Any> args = {o, do_, delta, kBatch, kNHead, kNCtx};
+  tvm::ffi::Array<tvm::ffi::Any> args = {o, do_, delta, kBatch, kNHead};
  tvm::ffi::Map<tvm::ffi::String, tvm::ffi::Any> kwargs = {
+      {"N_CTX", kNCtx},
      {"BLOCK_M", kPreBlock},
      {"HEAD_DIM", kHeadDim},
  };
--- a/examples/attention/attnfwd.cc
+++ b/examples/attention/attnfwd.cc
@@ -1,8 +1,8 @@
-#include "ATen/core/ATen_fwd.h"
-#include "ATen/ops/empty.h"
-#include "tvm/ffi/container/tensor.h"
 #include <ATen/DLConvertor.h>
+#include <ATen/core/ATen_fwd.h>
 #include <ATen/dlpack.h>
+#include <ATen/ops/empty.h>
+#include <tvm/ffi/container/tensor.h>
 #include <tvm/ffi/extra/cuda/cubin_launcher.h>
 #include <tvm/ffi/function.h>
 #include <tvm/ffi/tvm_ffi.h>
--- a/python/triton_tvm_ffi/templates/gendef.cc.j2
+++ b/python/triton_tvm_ffi/templates/gendef.cc.j2
@@ -28,11 +28,12 @@ triton_tvm_ffi::FillMeta<{% for type in fn.signature %}__varname{{ loop.index0 }
 CUfunction __function = triton_tvm_ffi::GetKernel<__fnname_{{ fn.fnname }}, __cubin_{{ fn.fnname }}, {{ fn.shmem }}>(__device); \
 tvm::ffi::Tuple<int32_t, int32_t, int32_t> __gridDim = triton_tvm_ffi::MakeGridDim(__grid, __meta); \
 void *dummy = nullptr; \
+const size_t __args_len = __args.size(); \
 {% for ctype in fn.ctypes %}
 {% if ctype == "CUdeviceptr" %}
-void *__arg{{ loop.index0 }} = __args[{{ loop.index0 }}].cast<tvm::ffi::TensorView>().data_ptr(); \
+void *__arg{{ loop.index0 }} = {{ loop.index0 }} < __args_len ? __args[{{ loop.index0 }}].cast<tvm::ffi::TensorView>().data_ptr() : __kwargs[__varname{{ loop.index0 }}].cast<tvm::ffi::TensorView>().data_ptr(); \
 {% elif ctype != none %}
-{{ ctype }} __arg{{ loop.index0 }} = __args[{{ loop.index0 }}].cast<{{ ctype }}>(); \
+{{ ctype }} __arg{{ loop.index0 }} = {{ loop.index0 }} < __args_len ? __args[{{ loop.index0 }}].cast<{{ ctype }}>() : __kwargs[__varname{{ loop.index0 }}].cast<{{ ctype }}>(); \
 {% endif %}
 {% endfor %}
 void *__params[] = { {% for ctype in fn.ctypes %}{% if ctype != none %}&__arg{{ loop.index0 }}, {% endif %}{% endfor %}&dummy, &dummy }; \