sgl-project · ishandhanani · Feb 4, 2026 · doujiang24 · Feb 4, 2026 · ishandhanani
@@ -56,16 +56,24 @@ class KVCacheEvent(
     """Base class for all KV cache-related events"""
 
 
+# Storage-tier values for the `medium` field of KV cache events (compatible with vLLM)
+MEDIUM_GPU = "GPU"
+MEDIUM_CPU_TIER1 = "CPU_TIER1"
+MEDIUM_CPU_TIER2 = "CPU_TIER2"
+
+
 class BlockStored(KVCacheEvent):
     block_hashes: list[int]
     parent_block_hash: Optional[int]
     token_ids: list[int]
     block_size: int
     lora_id: Optional[int]
+    medium: Optional[str] = None  # storage tier tag, e.g. MEDIUM_GPU; None if the emitter does not set it
 
 
 class BlockRemoved(KVCacheEvent):
     block_hashes: list[int]
+    medium: Optional[str] = None  # storage tier tag, e.g. MEDIUM_GPU; None if the emitter does not set it
 
 
 class AllBlocksCleared(KVCacheEvent):

@@ -35,6 +35,7 @@
 logger = logging.getLogger(__name__)
 
 from sglang.srt.disaggregation.kv_events import (
+    MEDIUM_GPU,
     AllBlocksCleared,
     BlockRemoved,
     BlockStored,
@@ -822,6 +823,7 @@ def _record_store_event(self, node: TreeNode):
                         token_ids=page_tokens,
                         block_size=len(page_tokens),
                         lora_id=None,
+                        medium=MEDIUM_GPU,
                     )
                 )
 
@@ -843,7 +845,9 @@ def _record_remove_event(self, node: TreeNode):
 
                 block_hash = hash_str_to_int64(node.hash_value[page_index])
 
-                self.kv_event_queue.append(BlockRemoved(block_hashes=[block_hash]))
+                self.kv_event_queue.append(
+                    BlockRemoved(block_hashes=[block_hash], medium=MEDIUM_GPU)
+                )
 
                 page_index += 1