"""Download model files from Hugging Face Hub or create dummy models""" | |
import json | |
from pathlib import Path | |
import onnx | |
from onnx import TensorProto, helper | |


def create_dummy_onnx_model(output_path: Path, num_symbols: int = 130):
    """Create a minimal dummy ONNX model for testing."""
    # Define input tensors
    input_ids = helper.make_tensor_value_info("input", TensorProto.INT64, [1, None])
    input_lengths = helper.make_tensor_value_info(
        "input_lengths", TensorProto.INT64, [1]
    )
    scales = helper.make_tensor_value_info("scales", TensorProto.FLOAT, [3])

    # Define output tensor
    output = helper.make_tensor_value_info("output", TensorProto.FLOAT, [1, 1, None])

    # Create a simple identity-like operation.
    # This is just a placeholder - a real model would have complex operations.
    identity_node = helper.make_node(
        "Identity", inputs=["input"], outputs=["identity_out"], name="identity"
    )

    # Create a constant output shape
    shape_const = helper.make_tensor(
        "shape_const",
        TensorProto.INT64,
        dims=[3],
        vals=[1, 1, 22050],  # 1 second at 22050 Hz
    )

    # Create a constant fill node
    const_fill = helper.make_node(
        "ConstantOfShape", inputs=["shape_const"], outputs=["output"], name="const_fill"
    )

    # Create the graph
    graph = helper.make_graph(
        [identity_node, const_fill],
        "dummy_tts_model",
        [input_ids, input_lengths, scales],
        [output],
        [shape_const],
    )

    # Create the model
    model = helper.make_model(graph)

    # Save the model
    onnx.save(model, str(output_path))
    print(f"Created dummy model: {output_path}")


def create_dummy_config(output_path: Path, language: str = "en"):
    """Create a dummy model configuration."""
    config = {
        "audio": {"sample_rate": 22050},
        "espeak": {"voice": "en-us" if language == "en" else "ja"},
        "language": {"code": language},
        "inference": {"noise_scale": 0.667, "length_scale": 1, "noise_w": 0.8},
        "phoneme_type": "espeak" if language == "en" else "openjtalk",
        "phoneme_map": {},
        "phoneme_id_map": {
            "_": [0],
            "^": [1],
            "$": [2],
            " ": [3],
            "a": [4],
            "b": [5],
            "c": [6],
            "d": [7],
            "e": [8],
        },
        "num_symbols": 10,
        "num_speakers": 1,
        "speaker_id_map": {},
    }
    with open(output_path, "w", encoding="utf-8") as f:
        json.dump(config, f, indent=2)
    print(f"Created config: {output_path}")


def download_models():
    """Set up models: use existing models if available, otherwise create dummy models."""
    models_dir = Path("models")
    models_dir.mkdir(exist_ok=True)

    # Model configurations
    models = [
        ("ja_JP-test-medium.onnx", "ja", "Japanese medium quality model"),
        ("test_voice.onnx", "en", "English test model"),
    ]

    print("Setting up models for demo...")

    for filename, lang, description in models:
        onnx_path = models_dir / filename
        json_path = models_dir / f"{filename}.json"

        # Check whether an actual model already exists
        if onnx_path.exists():
            # Verify it is a valid ONNX model (structural check only, no full check)
            try:
                with open(onnx_path, "rb") as f:
                    onnx.checker.check_model(f.read(), full_check=False)
                print(
                    f"✓ Found existing {description}: {onnx_path} "
                    f"({onnx_path.stat().st_size / 1024 / 1024:.1f} MB)"
                )
            except Exception as e:
                print(f"✗ Invalid ONNX model {onnx_path}, creating dummy model: {e}")
                create_dummy_onnx_model(onnx_path)
        else:
            # Create a dummy model as a fallback
            print(f"Creating dummy {description}...")
            create_dummy_onnx_model(onnx_path)

        # Always ensure the config exists
        if not json_path.exists():
            print(f"Creating config for {filename}...")
            create_dummy_config(json_path, language=lang)
        else:
            print(f"✓ Found existing config: {json_path}")

    print("Model setup complete!")


if __name__ == "__main__":
    download_models()
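

# Expected result of running this script (exact console output depends on which
# files already exist): a models/ directory holding, for each entry in the models
# list above, an .onnx file plus a matching .onnx.json config, e.g.:
#
#     models/ja_JP-test-medium.onnx
#     models/ja_JP-test-medium.onnx.json
#     models/test_voice.onnx
#     models/test_voice.onnx.json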