# MiniMax01Text-Dev / create.py
# Uploaded by Goekdeniz-Guelmez ("Upload 7 files", commit 789179e, verified), 1.09 kB
import sys
import os
from safetensors.torch import save_file
import json
# Build a freshly initialised MiniMaxText01 model from a local config file and
# write its weights next to that config as ``model.safetensors``.

# Directory holding the custom modeling/configuration modules and the config
# file; the generated weights are written here as well.
# NOTE(review): this is a machine-specific absolute path -- adjust it before
# running the script anywhere else.
model_dir = "/Users/gokdenizgulmez/Desktop/mlx-lm/mlx_lm/MiniMiniMax01Text"

# The custom modules are imported by bare module name, so their directory has
# to be on the import path *before* the two imports below execute.
sys.path.append(model_dir)

# Custom model and configuration classes (resolved through ``model_dir``).
from modeling_minimax_text_01 import MiniMaxText01ForCausalLM
from configuration_minimax_text_01 import MiniMaxText01Config

# Load the raw configuration values. The file name was previously misspelled
# as "onfig.json"; the encoding is given explicitly so the read does not
# depend on the locale default.
config_path = os.path.join(model_dir, "config.json")
with open(config_path, "r", encoding="utf-8") as f:
    config_dict = json.load(f)

# Every key of the JSON document is forwarded as a keyword argument.
config = MiniMaxText01Config(**config_dict)

# Instantiate the model from the configuration alone; no checkpoint is loaded
# by this script.
small_model = MiniMaxText01ForCausalLM(config)

# Report the total number of parameter elements as a quick size check.
param_count = sum(p.numel() for p in small_model.parameters())
print(f"Model has {param_count:,} parameters")

# Serialise the state dict in safetensors format.
# NOTE(review): ``save_file`` refuses tensors that share memory; if this model
# ties any weights, ``safetensors.torch.save_model`` may be needed -- confirm.
model_state_dict = small_model.state_dict()
save_file(model_state_dict, os.path.join(model_dir, "model.safetensors"))
print("Model saved in safetensors format")