normalcomputing
/

extended-mind-llama-2-7b

Text Generation

Model card Files and versions Community

phoebeklett committed on May 30

Commit

c3edc15

•

1 Parent(s): 1df9b46

Upload 2 files

Files changed (1) hide show

modeling.py +2 -1

modeling.py CHANGED Viewed

@@ -654,7 +654,7 @@ class ExtendedLlamaAttention(nn.Module):
         if not output_attentions:
             attn_weights = None
-        if not output_retrieved_memory_idx:
             reshaped_idx = None
         return attn_output, attn_weights, past_key_value, reshaped_idx
@@ -1568,6 +1568,7 @@ class ExtendedLlamaForCausalLM(LlamaPreTrainedModel):
                 "attention_mask": attention_mask,
                 "use_external_mind": kwargs.get("use_external_mind"), # EM: Add config here
                 "topk": kwargs.get("topk"),
             }
         )
         return model_inputs

         if not output_attentions:
             attn_weights = None
+        if not output_retrieved_memory_idx or (long_range_past_key_value is None and faiss_indexes is None):
             reshaped_idx = None
         return attn_output, attn_weights, past_key_value, reshaped_idx
                 "attention_mask": attention_mask,
                 "use_external_mind": kwargs.get("use_external_mind"), # EM: Add config here
                 "topk": kwargs.get("topk"),
+                "output_retrieved_memory_idx": kwargs.get("output_retrieved_memory_idx"),
             }
         )
         return model_inputs