Skip to content
LMCache
Toggle navigation menu
⌘
K
LMCache
/
Index
Index
A
ALIGN_BYTES (TensorMemoryAllocator attribute)
allocate() (BufferAllocator method)
allocate() (GPUMemoryAllocator method)
allocate() (MemoryAllocatorInterface method)
allocate() (StorageManager method)
allocate() (TensorMemoryAllocator method)
B
BaseEvictor (class in lmcache.experimental.storage_backend.evictor.base_evictor)
BINARY (MemoryFormat attribute)
BINARY_BUFFER (MemoryFormat attribute)
blend() (BlendExecutor method)
blend() (CacheBlendImpl method)
BlendExecutor (class in lmcache.blend.interfaces)
BlendOutput (class in lmcache.blend.interfaces)
BlendRetriever (class in lmcache.blend.interfaces)
BlendRetrieverResult (class in lmcache.blend.interfaces)
BlendRetrieverTask (class in lmcache.blend.interfaces)
broadcast_seq_group_list() (in module lmcache.integration.vllm.vllm_adapter)
BufferAllocator (class in lmcache.experimental.memory_management)
build_partial_prefill_input() (in module lmcache.integration.vllm.vllm_adapter)
byte_array (MemoryObj property)
C
CacheBlendImpl (class in lmcache.blend.executor)
CHUNK_PREFILL (RetrieveStatus attribute)
CHUNK_PREFILL (StoreStatus attribute)
close() (LMCacheEngine method)
close() (StorageBackendInterface method)
close() (StorageManager method)
contains() (StorageBackendInterface method)
contains() (StorageManager method)
D
DECODE (StoreStatus attribute)
E
exists_in_put_tasks() (StorageBackendInterface method)
F
free() (BufferAllocator method)
free() (GPUMemoryAllocator method)
free() (MemoryAllocatorInterface method)
free() (TensorMemoryAllocator method)
from_gpu() (GPUConnectorInterface method)
from_gpu() (VLLMNestedTupleGPUConnector method)
from_gpu() (VLLMPagedMemGPUConnector method)
from_gpu() (VLLMPagedMemGPUConnectorV2 method)
G
get() (StorageManager method)
get_blocking() (StorageBackendInterface method)
get_dtype() (MemoryObj method)
get_memory_format() (MemoryObj method)
get_physical_size() (MemoryObj method)
get_ref_count() (BufferAllocator method)
get_ref_count() (GPUMemoryAllocator method)
get_ref_count() (MemoryAllocatorInterface method)
get_ref_count() (TensorMemoryAllocator method)
get_shape() (GPUConnectorInterface method)
get_shape() (MemoryObj method)
get_shape() (VLLMNestedTupleGPUConnector method)
get_shape() (VLLMPagedMemGPUConnector method)
get_shape() (VLLMPagedMemGPUConnectorV2 method)
get_size() (MemoryObj method)
GPUConnectorInterface (class in lmcache.experimental.gpu_connector)
GPUMemoryAllocator (class in lmcache.experimental.memory_management)
I
ILLEGAL (PutStatus attribute)
invalidate() (MemoryObj method)
is_valid() (MemoryObj method)
K
k (BlendOutput attribute)
k (BlendRetrieverResult attribute)
KV_BLOB (MemoryFormat attribute)
L
LEGAL (PutStatus attribute)
lmcache_retrieve_kv() (in module lmcache.integration.vllm.vllm_adapter)
lmcache_should_retrieve() (in module lmcache.integration.vllm.vllm_adapter)
lmcache_should_store() (in module lmcache.integration.vllm.vllm_adapter)
lmcache_store_kv() (in module lmcache.integration.vllm.vllm_adapter)
LMCacheEngine (class in lmcache.experimental.cache_engine)
local_indices (BlendOutput attribute)
lookup() (LMCacheEngine method)
LRUEvictor (class in lmcache.experimental.storage_backend.evictor.lru_evictor)
M
memcheck() (BufferAllocator method)
memcheck() (GPUMemoryAllocator method)
memcheck() (TensorMemoryAllocator method)
MemoryAllocatorInterface (class in lmcache.experimental.memory_management)
MemoryFormat (class in lmcache.experimental.memory_management)
MemoryObj (class in lmcache.experimental.memory_management)
metadata (MemoryObj property)
N
new_request() (BlendRetriever method)
NONE (RetrieveStatus attribute)
NONE (StoreStatus attribute)
O
original_positions (BlendRetrieverResult attribute)
P
positions (BlendOutput attribute)
prefetch() (LMCacheEngine method)
prefetch() (StorageManager method)
prefetch_callback() (StorageManager method)
PREFILL (RetrieveStatus attribute)
PREFILL (StoreStatus attribute)
put() (StorageManager method)
PutStatus (class in lmcache.experimental.storage_backend.evictor.base_evictor)
Q
q (BlendOutput attribute)
query_start_loc (BlendOutput attribute)
R
ref_count_down() (BufferAllocator method)
ref_count_down() (GPUMemoryAllocator method)
ref_count_down() (MemoryAllocatorInterface method)
ref_count_down() (TensorMemoryAllocator method)
ref_count_up() (BufferAllocator method)
ref_count_up() (GPUMemoryAllocator method)
ref_count_up() (MemoryAllocatorInterface method)
ref_count_up() (TensorMemoryAllocator method)
result() (BlendRetrieverTask method)
retrieve() (LMCacheEngine method)
RetrieveStatus (class in lmcache.integration.vllm.vllm_adapter)
S
set_positional_encoder() (CacheBlendImpl method)
set_reverse_positional_encoder() (CacheBlendImpl method)
StorageBackendInterface (class in lmcache.experimental.storage_backend.abstract_backend)
StorageManager (class in lmcache.experimental.storage_backend.storage_manager)
store() (LMCacheEngine method)
StoreStatus (class in lmcache.integration.vllm.vllm_adapter)
submit_prefetch_task() (StorageBackendInterface method)
submit_put_task() (StorageBackendInterface method)
SUFFIX_PREFILL (StoreStatus attribute)
T
tensor (MemoryObj property)
TensorMemoryAllocator (class in lmcache.experimental.memory_management)
to_gpu() (GPUConnectorInterface method)
to_gpu() (VLLMNestedTupleGPUConnector method)
to_gpu() (VLLMPagedMemGPUConnector method)
to_gpu() (VLLMPagedMemGPUConnectorV2 method)
token_dim() (MemoryFormat method)
U
UNDEFINED (MemoryFormat attribute)
update_on_hit() (BaseEvictor method)
update_on_hit() (LRUEvictor method)
update_on_put() (BaseEvictor method)
update_on_put() (LRUEvictor method)
V
v (BlendOutput attribute)
v (BlendRetrieverResult attribute)
valid_mask (BlendRetrieverResult attribute)
VLLMNestedTupleGPUConnector (class in lmcache.experimental.gpu_connector)
VLLMPagedMemGPUConnector (class in lmcache.experimental.gpu_connector)
VLLMPagedMemGPUConnectorV2 (class in lmcache.experimental.gpu_connector)