From 6fd9dc5155cf55c076d8033cd8ba35d0d98dad6c Mon Sep 17 00:00:00 2001
From: Socratesa <lihaode@zju.edu.cn>
Date: Tue, 23 Jun 2026 21:23:19 +0800
Subject: [PATCH] Fix MLA cache shape init without layerid

Signed-off-by: Socratesa <lihaode@zju.edu.cn>
---
 .../layers/attention/mla_attention_backend.py             | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/fastdeploy/model_executor/layers/attention/mla_attention_backend.py b/fastdeploy/model_executor/layers/attention/mla_attention_backend.py
index 855c34c8343..83932f7a908 100644
--- a/fastdeploy/model_executor/layers/attention/mla_attention_backend.py
+++ b/fastdeploy/model_executor/layers/attention/mla_attention_backend.py
@@ -620,9 +620,13 @@ def get_kv_cache_shape(
         """
         Calculate kv cache shape for MLA
         """
-        layer_id = self.layer_id
+        layer_id = getattr(self, "layer_id", None)
         value_cache_shape = []
-        if self.window_attn_skip_freq is not None and self.window_attn_skip_freq[layer_id] == 1:
+        if (
+            layer_id is not None
+            and self.window_attn_skip_freq is not None
+            and self.window_attn_skip_freq[layer_id] == 1
+        ):
             fp8_key_cahe_dim = self.kv_lora_rank + 4 * (self.kv_lora_rank // 128) + 2 * self.qk_rope_head_dim
             key_cache_shape = [max_num_blocks, 1, self.block_size, fp8_key_cahe_dim]
         else: