|
@@ -556,6 +556,7 @@ class HHCache(Cache):
|
|
if past_key_values is not None:
|
|
if past_key_values is not None:
|
|
for layer_idx in range(len(past_key_values)):
|
|
for layer_idx in range(len(past_key_values)):
|
|
key_states, value_states, accumulated_attention_scores = past_key_values[layer_idx]
|
|
key_states, value_states, accumulated_attention_scores = past_key_values[layer_idx]
|
|
|
|
+ import pdb; pdb.set_trace()
|
|
cache.update(key_states, value_states, layer_idx, accumulated_attention_scores=accumulated_attention_scores)
|
|
cache.update(key_states, value_states, layer_idx, accumulated_attention_scores=accumulated_attention_scores)
|
|
return cache
|
|
return cache
|
|
|
|
|