Index

_ | A | B | C | E | F | G | L | M | P | R | S | T | V

_

__init__() (flashinfer.cascade.BatchDecodeWithSharedPrefixPagedKVCacheWrapper method)

A

B

C

chain_speculative_sampling() (in module flashinfer.sampling)

CUDAGraphBatchDecodeWithPagedKVCacheWrapper (class in flashinfer.decode)

E

end_forward() (flashinfer.cascade.BatchDecodeWithSharedPrefixPagedKVCacheWrapper method)
end_forward() (flashinfer.cascade.BatchPrefillWithSharedPrefixPagedKVCacheWrapper method)

F

forward() (flashinfer.cascade.BatchDecodeWithSharedPrefixPagedKVCacheWrapper method)
forward() (flashinfer.cascade.BatchPrefillWithSharedPrefixPagedKVCacheWrapper method)

fused_add_rmsnorm() (in module flashinfer.norm)

G

L

LogitsPipe (class in flashinfer.logits_processor)

LogitsProcessor (class in flashinfer.logits_processor)

M

P

R

reset_workspace_buffer() (flashinfer.cascade.BatchDecodeWithSharedPrefixPagedKVCacheWrapper method)

S

T

V

VariableBlockSparseAttentionWrapper (class in flashinfer.sparse)