sglang_v0.5.2/flashinfer_0.3.1/csrc/single_decode_kernel_inst.j...

14 lines
335 B
Django/Jinja

#include <flashinfer/attention/decode.cuh>
#include "single_decode_config.inc"
using namespace flashinfer;
namespace flashinfer {

// Explicit instantiation of SingleDecodeWithKVCacheDispatched for exactly one
// configuration. The first three template arguments and the element type of
// `tmp` are substituted by the code generator from the head_dim_qk,
// pos_encoding_mode, variant_name and dtype_o template variables; the fourth
// template argument is always `Params`.
//
// NOTE(review): `Params` is not declared in this file; presumably it is
// provided by "single_decode_config.inc" -- confirm against the generator.
//
// Instantiated signature:
//   params  - Params object, passed by value.
//   tmp     - pointer to the rendered output dtype (its role is not visible
//             from this file; presumably a scratch buffer -- TODO confirm).
//   stream  - cudaStream_t handle forwarded to the dispatched function.
//   returns - cudaError_t.
template cudaError_t SingleDecodeWithKVCacheDispatched<
    {{ head_dim_qk }}, {{ pos_encoding_mode }}, {{ variant_name }}, Params>(
    Params params, {{ dtype_o }}* tmp, cudaStream_t stream);

// No semicolon after the closing brace: a namespace definition is not
// terminated by one, and the extra token is flagged by -Wextra-semi.
}  // namespace flashinfer