浏览代码

Update cache_utils.py

Allen 1 年之前
父节点
当前提交
d0eeba3119
共有 1 个文件被更改，包括 3 次插入和 1 次删除
  1. 3 1
      research/long-context-llama/H2O/cache_utils.py

+ 3 - 1
research/long-context-llama/H2O/cache_utils.py

@@ -523,8 +523,10 @@ class HHCache(Cache):
             self.key_cache[layer_idx] = self.key_cache[layer_idx][mask].view(bsz, num_heads, -1, head_dim)
             self.value_cache[layer_idx] = self.value_cache[layer_idx][mask].view(bsz, num_heads, -1, head_dim)
             self.accumulated_attention_scores[layer_idx] = self.accumulated_attention_scores[layer_idx][mask].view(bsz, num_heads, -1)
+        
+        if layer_idx == 0:
+            import pdb; pdb.set_trace()
 
-        pdb.set_trace()
 
     def reorder_cache(self, beam_idx: torch.LongTensor):
         """Reorders the cache for beam search, given the selected beam indices."""