We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent ea1d0cb · commit 9dd28f3 · Copy full SHA for 9dd28f3
include/flashinfer/attention/decode.cuh
@@ -442,7 +442,7 @@ __global__ void BatchDecodeWithPagedKVCacheKernel(const __grid_constant__ Params
442
if constexpr (POS_ENCODING_MODE == PosEncodingMode::kRoPELlama) {
443
const IdType* q_rope_offset = nullptr;
444
if constexpr (has_decode_maybe_q_rope_offset_v<Params>) {
445
- q_rope_offset = params.maybe_q_rope_offset;
+ q_rope_offset = params.decode_maybe_q_rope_offset;
446
}
447
int32_t q_rope_offset_val = q_rope_offset == nullptr ? (kv_len - 1) : q_rope_offset[batch_idx];
448
const float rope_rcp_scale = params.rope_rcp_scale;
0 commit comments