1 parent e22c472 commit af49b41
tests/layers/vllm/test_attention.py
@@ -30,9 +30,7 @@
 # Number of attention heads (Key/Value) - for Grouped-Query Attention
 NUM_KV_HEADS = 4
 # Dimension of each attention head
-HEAD_DIM = 64
-# Padded head dimension
-PADDED_HEAD_DIM = 64
+HEAD_DIM = 128
 # Total number of blocks in the KV cache
 NUM_BLOCKS = 32
 # Number of tokens per block
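The constants changed above configure a Grouped-Query Attention test: several query heads share each of the `NUM_KV_HEADS` key/value heads, and the KV cache is laid out in fixed-size blocks. A minimal sketch of how these values relate, using NumPy; note that `NUM_Q_HEADS` and `BLOCK_SIZE` are illustrative assumptions not shown in this hunk:

```python
import numpy as np

# Values from the diff above.
NUM_KV_HEADS = 4
HEAD_DIM = 128
NUM_BLOCKS = 32

# Assumed for illustration (not part of this hunk): query-head count must be
# a multiple of NUM_KV_HEADS, and each cache block holds BLOCK_SIZE tokens.
NUM_Q_HEADS = 8
BLOCK_SIZE = 16

# In GQA, each KV head serves a group of query heads.
group_size = NUM_Q_HEADS // NUM_KV_HEADS  # 2 query heads per KV head

# A paged KV cache: one slab each for K and V (leading dim of 2),
# split into NUM_BLOCKS blocks of BLOCK_SIZE tokens.
kv_cache = np.zeros((2, NUM_BLOCKS, BLOCK_SIZE, NUM_KV_HEADS, HEAD_DIM))

# To attend, KV heads are logically repeated to match the query-head count.
seq_len = 10
k = np.zeros((NUM_KV_HEADS, seq_len, HEAD_DIM))   # (kv_heads, seq, head_dim)
k_expanded = np.repeat(k, group_size, axis=0)     # (q_heads, seq, head_dim)
```

With `HEAD_DIM` raised from 64 to 128 (and the separate padded dimension dropped), the head dimension no longer needs padding, which is consistent with the removal of `PADDED_HEAD_DIM`.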