"""One-off script that generates the saved model artifacts.

Run this once on your machine. It instantiates a ``RecursiveTransformerModel``
from a default ``RecursiveTransformerConfig``, registers two example memory
strings, and saves the model into the current working directory.
"""

# NOTE: torch is not referenced directly in this script; the import is kept
# as in the original (presumably the model module requires it — confirm).
import torch

from modeling_recursive_transformer import (
    RecursiveTransformerConfig,
    RecursiveTransformerModel,
)

# Build the model from the default configuration (no overrides are passed).
config = RecursiveTransformerConfig()
model = RecursiveTransformerModel(config)

# Add a couple of example memory blocks.
model.add_memory("Paris is the capital of France")
model.add_memory("The Eiffel Tower is in Paris")

# Save everything into the current working directory ("./").
model.save_pretrained("./")

# The file names in this message are taken on trust from the original script;
# the names actually written are decided by save_pretrained, which is defined
# in modeling_recursive_transformer and not visible here.
print("✅ pytorch_model.bin and memory_state.json created!")