ソースを参照

Update utils_llama.py

Allen 1 年前
コミット
57d1f6d04f
1 ファイル変更、1 行追加、1 行削除
  1. 1 1
      research/long-context-llama/H2O/utils_llama.py

+ 1 - 1
research/long-context-llama/H2O/utils_llama.py

@@ -209,7 +209,7 @@ class H2OLlamaAttention(nn.Module):
 
         # Update KV Cache based on Heavy-Hitter Oracle
         if past_key_value is not None:
-            past_key_value.update_slimming(attn_weights, self.num_key_value_groups, self.layer_idx, cache_kwargs)
+            past_key_value.update_slimming(attn_weights, self.num_key_value_groups, self.layer_idx)
 
         attn_weights = nn.functional.dropout(attn_weights, p=self.attention_dropout, training=self.training)
         attn_output = torch.matmul(attn_weights, value_states)