Spaces:

Tonic
/

SmolFactory

Running

App Files Files Community

SmolFactory / cloud_deploy.py

Tonic

Fix model recovery and deployment scripts - add safetensors support and Windows compatibility

22bb04c verified 3 months ago

raw

history blame

3.26 kB

	#!/usr/bin/env python3
	"""
	Cloud Model Deployment Script
	Run this directly on your cloud instance to deploy your trained model
	"""

	import os
	import sys
	import logging
	import subprocess
	from pathlib import Path

	# Setup logging
	logging.basicConfig(
	level=logging.INFO,
	format='%(asctime)s - %(levelname)s - %(message)s'
	)
	logger = logging.getLogger(__name__)

	def main():
	"""Main deployment function"""

	# Configuration - CHANGE THESE VALUES
	MODEL_PATH = "/output-checkpoint"
	REPO_NAME = "Tonic/smollm3-finetuned" # Change to your HF username and desired repo name
	HF_TOKEN = os.getenv('HF_TOKEN')
	PRIVATE = False # Set to True for private repository

	# Validate configuration
	if not HF_TOKEN:
	logger.error("❌ HF_TOKEN environment variable not set")
	logger.info("Please set your Hugging Face token:")
	logger.info("export HF_TOKEN=your_token_here")
	return 1

	if not Path(MODEL_PATH).exists():
	logger.error(f"❌ Model path not found: {MODEL_PATH}")
	return 1

	# Check for required files
	required_files = ['config.json', 'model.safetensors.index.json', 'tokenizer.json']
	for file in required_files:
	if not (Path(MODEL_PATH) / file).exists():
	logger.error(f"❌ Required file not found: {file}")
	return 1

	logger.info("✅ Model files validated")

	# Install dependencies if needed
	try:
	import torchao
	logger.info("✅ torchao available")
	except ImportError:
	logger.info("📦 Installing torchao...")
	os.system("pip install torchao")

	try:
	import huggingface_hub
	logger.info("✅ huggingface_hub available")
	except ImportError:
	logger.info("📦 Installing huggingface_hub...")
	os.system("pip install huggingface_hub")

	# Run the recovery script
	logger.info("🚀 Starting model deployment...")

	cmd = [
	sys.executable, "recover_model.py",
	MODEL_PATH,
	REPO_NAME,
	"--hf-token", HF_TOKEN,
	"--quant-types", "int8_weight_only", "int4_weight_only",
	"--author-name", "Tonic",
	"--model-description", "A fine-tuned SmolLM3 model for improved text generation and conversation capabilities"
	]

	if PRIVATE:
	cmd.append("--private")

	logger.info(f"Running: {' '.join(cmd)}")

	# Run the command using subprocess for better argument handling
	try:
	result = subprocess.run(cmd, check=True, capture_output=True, text=True)
	logger.info("✅ Model deployment completed successfully!")
	logger.info(f"🌐 View your model at: https://huggingface.co/{REPO_NAME}")
	logger.info("📊 Quantized models available at:")
	logger.info(f" - https://huggingface.co/{REPO_NAME}/int8 (GPU optimized)")
	logger.info(f" - https://huggingface.co/{REPO_NAME}/int4 (CPU optimized)")
	return 0
	except subprocess.CalledProcessError as e:
	logger.error(f"❌ Model deployment failed!")
	logger.error(f"Error: {e}")
	logger.error(f"stdout: {e.stdout}")
	logger.error(f"stderr: {e.stderr}")
	return 1

	if __name__ == "__main__":
	exit(main())