Spaces:

lemms
/

openllm

Sleeping

App Files Files Community

openllm / install_dependencies.py

lemms

Add manual dependency installation script to fix sentencepiece import issues

5d375ac verified 19 days ago

raw

history blame contribute delete

3.84 kB

	#!/usr/bin/env python3
	"""
	Manual dependency installation script for Hugging Face Spaces.

	This script installs missing dependencies that might not be properly
	installed through requirements.txt. Run this in the Space terminal.

	Author: Louis Chua Bean Chong
	License: GPL-3.0
	"""

	import subprocess
	import sys
	import os

	def run_command(command, description):
	"""
	Run a shell command and handle errors.

	Args:
	command: Command to run
	description: Description of what the command does
	"""
	print(f"\n🔧 {description}")
	print(f"Running: {command}")

	try:
	result = subprocess.run(command, shell=True, capture_output=True, text=True)
	if result.returncode == 0:
	print(f"✅ Success: {description}")
	if result.stdout.strip():
	print(f"Output: {result.stdout.strip()}")
	else:
	print(f"❌ Failed: {description}")
	print(f"Error: {result.stderr.strip()}")
	return False
	except Exception as e:
	print(f"❌ Exception: {e}")
	return False

	return True

	def main():
	"""Install all required dependencies manually."""
	print("🚀 Manual Dependency Installation for OpenLLM Training")
	print("=" * 60)

	# Check Python version
	print(f"🐍 Python version: {sys.version}")
	print(f"📁 Working directory: {os.getcwd()}")

	# Core dependencies that might be missing
	dependencies = [
	("sentencepiece>=0.1.99", "SentencePiece tokenization library (CRITICAL for OpenLLM)"),
	("transformers>=4.30.0", "Hugging Face Transformers library"),
	("datasets>=2.12.0", "Hugging Face Datasets library"),
	("tokenizers>=0.13.0", "Fast tokenization library"),
	("huggingface_hub>=0.34.0", "Hugging Face Hub integration"),
	("accelerate>=0.20.0", "Distributed training acceleration"),
	("torch>=2.0.0", "PyTorch deep learning framework"),
	("gradio==4.44.1", "Gradio UI framework (fixed version)"),
	("numpy>=1.24.0", "Numerical computing library"),
	("pandas>=2.0.0", "Data manipulation library"),
	("tqdm>=4.65.0", "Progress bars"),
	("requests>=2.31.0", "HTTP library"),
	]

	print(f"\n📦 Installing {len(dependencies)} dependencies...")

	success_count = 0
	for package, description in dependencies:
	command = f"pip install {package}"
	if run_command(command, description):
	success_count += 1

	print(f"\n" + "=" * 60)
	print(f"🎯 Installation Summary:")
	print(f"✅ Successful: {success_count}/{len(dependencies)}")
	print(f"❌ Failed: {len(dependencies) - success_count}/{len(dependencies)}")

	if success_count == len(dependencies):
	print("\n🎉 All dependencies installed successfully!")
	print("💡 You can now try the training again.")
	else:
	print("\n⚠️ Some dependencies failed to install.")
	print("💡 Check the error messages above and try again.")

	# Test critical imports
	print(f"\n🧪 Testing critical imports...")
	test_imports = [
	("sentencepiece", "SentencePiece (CRITICAL)"),
	("transformers", "Transformers"),
	("datasets", "Datasets"),
	("torch", "PyTorch"),
	("gradio", "Gradio"),
	]

	for module, name in test_imports:
	try:
	__import__(module)
	print(f"✅ {name} - Import successful")
	except ImportError as e:
	print(f"❌ {name} - Import failed: {e}")

	print(f"\n🔧 Manual installation complete!")
	print("💡 If imports still fail, try restarting the Space.")

	if __name__ == "__main__":
	main()