Merge branch 'main' into fix/export-directory

chunnienc · web-flow · commit 311c5367da2f · 2025-05-29T09:51:54.000-07:00
diff --git a/ai_edge_torch/generative/layers/model_config.py b/ai_edge_torch/generative/layers/model_config.py
@@ -268,6 +268,12 @@ class ModelConfig:
   # export.
   use_mask_cache: bool = True
 
+  # An interleaved sequence of the attention types used in the model.
+  # E.g. [AttentionType.LOCAL_SLIDING, AttentionType.LOCAL_SLIDING,
+  # AttentionType.GLOBAL] means that the model has an attention pattern of 2
+  # local attentions followed by a global attention in a repeated pattern.
+  attention_patterns: Optional[Sequence[AttentionType]] = None
+
   @property
   def kv_cache_max(self) -> int:
     if self.kv_cache_max_len > 0:
@@ -286,3 +292,19 @@ def block_config(self, idx: int) -> TransformerBlockConfig:
   @property
   def causal_mask_value(self) -> float:
     return self.block_config(0).attn_config.causal_mask_value
+
+  def check_if_global_attention_layer(self, layer_idx: int) -> bool:
+    """Returns True if the layer at `layer_idx` uses global attention.
+
+    With no attention_patterns set, every layer is treated as global.
+    Asserts 0 <= layer_idx < num_layers when attention_patterns is set.
+    """
+    if self.attention_patterns is None:
+      return True
+    # Every fragment of the message needs the f prefix to be interpolated.
+    assert 0 <= layer_idx < self.num_layers, (
+        f"Layer index {layer_idx} is out of range for num_layers:"
+        f" {self.num_layers}"
+    )
+    attn_type = self.block_config(layer_idx).attn_config.attn_type
+    return attn_type == AttentionType.GLOBAL
diff --git a/ai_edge_torch/generative/utilities/test_utils.py b/ai_edge_torch/generative/utilities/test_utils.py
@@ -0,0 +1,29 @@
+# Copyright 2025 The AI Edge Torch Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Test utils for generative layers."""
+from typing import Sequence
+from ai_edge_torch.generative.layers import kv_cache as kv_utils
+import torch
+
+
+def initialize_kv_cache_all_zeros(
+    kv_shape: Sequence[int],
+    layout: kv_utils.KVLayout = kv_utils.KV_LAYOUT_DEFAULT,
+) -> kv_utils.KVCacheEntry:
+  """Builds a KVCacheEntry whose k/v caches are float32 zeros of kv_shape."""
+  # Two separate allocations, so the k and v tensors do not share storage.
+  keys = torch.zeros(kv_shape, dtype=torch.float32)
+  values = torch.zeros(kv_shape, dtype=torch.float32)
+  return kv_utils.KVCacheEntry(k_cache=keys, v_cache=values, kv_layout=layout)