We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 596f40e commit 4d9077c — Copy full SHA for 4d9077c
1 file changed
fastdeploy/cache_manager/ops.py
@@ -77,6 +77,9 @@ def swap_cache_per_layer(*args, **kwargs): # 单层 KV cache 换入算子(同
77
def swap_cache_per_layer_async(*args, **kwargs): # Single-layer KV cache swap-in operator (async). Stub: accepts any arguments and always raises RuntimeError (reported as unimplemented for Metax).
78
raise RuntimeError("Metax swap_cache_per_layer_async UNIMPLEMENTED")
79
80
+ def swap_cache_layout(*args, **kwargs): # Stub: accepts any arguments and always raises RuntimeError (reported as unimplemented for Metax).
81
+ raise RuntimeError("Metax swap_cache_layout UNIMPLEMENTED")
82
+
83
elif current_platform.is_xpu():
84
from fastdeploy.model_executor.ops.xpu import (
85
cuda_host_alloc,
0 commit comments