fix: add initialize_cache method to NPU worker

2026-04-18 22:32:53 +00:00 · 2026-02-10 19:42:32 +08:00
parent 7120cd803b
commit 101435817a
1 changed files with 6 additions and 0 deletions
--- a/vllm_npu/worker/worker_v1.py
+++ b/vllm_npu/worker/worker_v1.py
@@ -184,6 +184,12 @@ class NPUWorker(WorkerBase):
    def get_kv_cache_spec(self) -> KVCacheSpec:
        return self.model_runner.get_kv_cache_spec()

+    def initialize_cache(self, num_gpu_blocks: int,
+                         num_cpu_blocks: int) -> None:
+        """Record GPU and CPU KV cache block counts in cache_config."""
+        self.cache_config.num_gpu_blocks = num_gpu_blocks
+        self.cache_config.num_cpu_blocks = num_cpu_blocks
+
    def initialize_from_config(self, kv_cache_config: KVCacheConfig) -> None:
        """Allocate KV caches on NPU."""
        self.model_runner.initialize_kv_cache(kv_cache_config)