Transformers
English
Japanese
Spanish
recursive_transformer
Drjkedwards's picture
Create save_model.py
240d348 verified
# Run this once on your machine to generate the weight files
import torch
from modeling_recursive_transformer import RecursiveTransformerConfig, RecursiveTransformerModel
# Build a model from a default-constructed configuration.
config = RecursiveTransformerConfig()
model = RecursiveTransformerModel(config)

# Register the example memory blocks, in the order listed.
for memory_text in (
    "Paris is the capital of France",
    "The Eiffel Tower is in Paris",
):
    model.add_memory(memory_text)

# Save into the current working directory.
# NOTE(review): the message below names the files this script is expected to
# produce; presumably save_pretrained writes both -- confirm against the
# model class.
model.save_pretrained("./")
print("✅ pytorch_model.bin and memory_state.json created!")