Index _ | A | B | C | E | F | G | M | P | R | S | T _ __init__() (flashinfer.cascade.BatchDecodeWithSharedPrefixPagedKVCacheWrapper method) (flashinfer.cascade.BatchPrefillWithSharedPrefixPagedKVCacheWrapper method) (flashinfer.cascade.MultiLevelCascadeAttentionWrapper method) (flashinfer.decode.BatchDecodeMlaWithPagedKVCacheWrapper method) (flashinfer.decode.BatchDecodeWithPagedKVCacheWrapper method) (flashinfer.decode.CUDAGraphBatchDecodeWithPagedKVCacheWrapper method) (flashinfer.gemm.SegmentGEMMWrapper method) (flashinfer.prefill.BatchPrefillWithPagedKVCacheWrapper method) (flashinfer.prefill.BatchPrefillWithRaggedKVCacheWrapper method) (flashinfer.sparse.BlockSparseAttentionWrapper method) A append_paged_kv_cache() (in module flashinfer.page) apply_llama31_rope() (in module flashinfer.rope) apply_llama31_rope_inplace() (in module flashinfer.rope) apply_llama31_rope_pos_ids() (in module flashinfer.rope) apply_llama31_rope_pos_ids_inplace() (in module flashinfer.rope) apply_rope() (in module flashinfer.rope) apply_rope_inplace() (in module flashinfer.rope) apply_rope_pos_ids() (in module flashinfer.rope) apply_rope_pos_ids_inplace() (in module flashinfer.rope) apply_rope_with_cos_sin_cache() (in module flashinfer.rope) apply_rope_with_cos_sin_cache_inplace() (in module flashinfer.rope) B BatchDecodeMlaWithPagedKVCacheWrapper (class in flashinfer.decode) BatchDecodeWithPagedKVCacheWrapper (class in flashinfer.decode) BatchDecodeWithSharedPrefixPagedKVCacheWrapper (class in flashinfer.cascade) BatchPrefillWithPagedKVCacheWrapper (class in flashinfer.prefill) BatchPrefillWithRaggedKVCacheWrapper (class in flashinfer.prefill) BatchPrefillWithSharedPrefixPagedKVCacheWrapper (class in flashinfer.cascade) begin_forward() (flashinfer.cascade.BatchDecodeWithSharedPrefixPagedKVCacheWrapper method) (flashinfer.cascade.BatchPrefillWithSharedPrefixPagedKVCacheWrapper method) BlockSparseAttentionWrapper (class in flashinfer.sparse) bmm_fp8() (in module flashinfer.gemm) C chain_speculative_sampling() (in module flashinfer.sampling) CUDAGraphBatchDecodeWithPagedKVCacheWrapper (class in flashinfer.decode) E end_forward() (flashinfer.cascade.BatchDecodeWithSharedPrefixPagedKVCacheWrapper method) (flashinfer.cascade.BatchPrefillWithSharedPrefixPagedKVCacheWrapper method) F forward() (flashinfer.cascade.BatchDecodeWithSharedPrefixPagedKVCacheWrapper method) (flashinfer.cascade.BatchPrefillWithSharedPrefixPagedKVCacheWrapper method) fused_add_rmsnorm() (in module flashinfer.norm) G gelu_and_mul() (in module flashinfer.activation) gelu_tanh_and_mul() (in module flashinfer.activation) gemma_fused_add_rmsnorm() (in module flashinfer.norm) gemma_rmsnorm() (in module flashinfer.norm) get_batch_indices_positions() (in module flashinfer.page) M merge_state() (in module flashinfer.cascade) merge_state_in_place() (in module flashinfer.cascade) merge_states() (in module flashinfer.cascade) min_p_sampling_from_probs() (in module flashinfer.sampling) MultiLevelCascadeAttentionWrapper (class in flashinfer.cascade) P packbits() (in module flashinfer.quantization) plan() (flashinfer.cascade.MultiLevelCascadeAttentionWrapper method) (flashinfer.decode.BatchDecodeMlaWithPagedKVCacheWrapper method) (flashinfer.decode.BatchDecodeWithPagedKVCacheWrapper method) (flashinfer.prefill.BatchPrefillWithPagedKVCacheWrapper method) (flashinfer.prefill.BatchPrefillWithRaggedKVCacheWrapper method) (flashinfer.sparse.BlockSparseAttentionWrapper method) R reset_workspace_buffer() (flashinfer.cascade.BatchDecodeWithSharedPrefixPagedKVCacheWrapper method) (flashinfer.cascade.BatchPrefillWithSharedPrefixPagedKVCacheWrapper method) (flashinfer.cascade.MultiLevelCascadeAttentionWrapper method) (flashinfer.decode.BatchDecodeMlaWithPagedKVCacheWrapper method) (flashinfer.decode.BatchDecodeWithPagedKVCacheWrapper method) (flashinfer.gemm.SegmentGEMMWrapper method) (flashinfer.prefill.BatchPrefillWithPagedKVCacheWrapper method) (flashinfer.prefill.BatchPrefillWithRaggedKVCacheWrapper method) (flashinfer.sparse.BlockSparseAttentionWrapper method) rmsnorm() (in module flashinfer.norm) run() (flashinfer.cascade.MultiLevelCascadeAttentionWrapper method) (flashinfer.decode.BatchDecodeMlaWithPagedKVCacheWrapper method) (flashinfer.decode.BatchDecodeWithPagedKVCacheWrapper method) (flashinfer.gemm.SegmentGEMMWrapper method) (flashinfer.prefill.BatchPrefillWithPagedKVCacheWrapper method) (flashinfer.prefill.BatchPrefillWithRaggedKVCacheWrapper method) (flashinfer.sparse.BlockSparseAttentionWrapper method) S sampling_from_probs() (in module flashinfer.sampling) segment_packbits() (in module flashinfer.quantization) SegmentGEMMWrapper (class in flashinfer.gemm) silu_and_mul() (in module flashinfer.activation) single_decode_with_kv_cache() (in module flashinfer.decode) single_prefill_with_kv_cache() (in module flashinfer.prefill) single_prefill_with_kv_cache_return_lse() (in module flashinfer.prefill) T top_k_mask_logits() (in module flashinfer.sampling) top_k_renorm_probs() (in module flashinfer.sampling) top_k_sampling_from_probs() (in module flashinfer.sampling) top_k_top_p_sampling_from_logits() (in module flashinfer.sampling) top_k_top_p_sampling_from_probs() (in module flashinfer.sampling) top_p_renorm_probs() (in module flashinfer.sampling) top_p_sampling_from_probs() (in module flashinfer.sampling)