File tree Expand file tree Collapse file tree
xllm/core/layers/npu_torch Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -17,7 +17,6 @@ limitations under the License.
1717
1818#include < tuple>
1919
20- #include " torch_npu/csrc/aten/CustomFunctions.h"
2120#include " xllm/core/kernels/ops_api.h"
2221
2322namespace xllm {
@@ -440,8 +439,7 @@ torch::Tensor Qwen3GatedDeltaNetBaseImpl::forward(
440439 initial_state_tensor.fill_ (0.0 );
441440 chunk_gated_delta_params.initial_state = initial_state_tensor;
442441 chunk_gated_delta_params.output_final_state = true ;
443- chunk_gated_delta_params.cu_seqlens =
444- attn_metadata.q_cu_seq_lens .to (torch::kInt32 );
442+ chunk_gated_delta_params.cu_seqlens = attn_metadata.q_cu_seq_lens ;
445443 chunk_gated_delta_params.head_first = false ;
446444 chunk_gated_delta_params.use_qk_l2norm_in_kernel = true ;
447445 std::tie (core_attn_out, last_recurrent_state) =
You can’t perform that action at this time.
0 commit comments