faster-whisper-webui-v2

Running

App Files Files Community

faster-whisper-webui-v2 / src /config.py

aadnk

Add more configuration options to config.json5

1acaa19 over 1 year ago

raw

history blame

No virus

7.54 kB

	import urllib

	import os
	from typing import List
	from urllib.parse import urlparse
	import json5
	import torch

	from tqdm import tqdm

	from src.conversion.hf_converter import convert_hf_whisper

	class ModelConfig:
	    """Describes one configured model and resolves it to a local path or Whisper model name."""

	    def __init__(self, name: str, url: str, path: str = None, type: str = "whisper"):
	        """
	        Initialize a model configuration.

	        name: Name of the model
	        url: URL to download the model from
	        path: Path to the model file. If not set, the model will be downloaded from the URL.
	        type: Type of model. Can be whisper or huggingface.
	        """
	        self.name = name
	        self.url = url
	        self.path = path
	        self.type = type

	    def download_url(self, root_dir: str):
	        """
	        Resolve this model and remember the result in self.path.

	        root_dir: Directory used for downloaded or converted files. When None,
	                  ~/.cache/whisper is used.

	        Returns self.path unchanged if it is already set. Otherwise the result depends
	        on the model type ("huggingface"/"hf" or "whisper"/"w", case-insensitive, with a
	        type of None treated as "whisper"):
	          - huggingface: path of the converted "<name>.pt" file inside root_dir.
	          - whisper: the URL itself when it is a key of whisper._MODELS, the path part
	            of a file:// URL, the downloaded file for http(s) URLs, or the URL as-is
	            (treated as a local file).

	        Raises ValueError for an unknown model type, and RuntimeError when the download
	        target exists but is not a regular file.
	        """
	        # See if path is already set
	        if self.path is not None:
	            return self.path

	        if root_dir is None:
	            root_dir = os.path.join(os.path.expanduser("~"), ".cache", "whisper")

	        model_type = self.type.lower() if self.type is not None else "whisper"

	        # Resolve into a local first: self.path is only assigned once resolution has
	        # succeeded, so a failed conversion/download is retried on the next call
	        # instead of the raw URL being returned as if it were a resolved path.
	        if model_type in ["huggingface", "hf"]:
	            resolved = self._resolve_huggingface(root_dir)
	        elif model_type in ["whisper", "w"]:
	            resolved = self._resolve_whisper(root_dir)
	        else:
	            raise ValueError(f"Unknown model type {model_type}")

	        self.path = resolved
	        return self.path

	    def _resolve_huggingface(self, root_dir: str):
	        """Return the path of the Whisper-format file in root_dir, converting the model if the file is missing."""
	        destination_target = os.path.join(root_dir, self.name + ".pt")

	        # Convert from HuggingFace format to Whisper format
	        if os.path.exists(destination_target):
	            print(f"File {destination_target} already exists, skipping conversion")
	        else:
	            print("Saving HuggingFace model in Whisper format to " + destination_target)
	            convert_hf_whisper(self.url, destination_target)

	        return destination_target

	    def _resolve_whisper(self, root_dir: str):
	        """Return a Whisper model name or a local file path for self.url, downloading http(s) URLs into root_dir."""
	        # Imported here so that the other code paths do not require the whisper package
	        import whisper

	        # See if URL is just a known model name
	        if self.url in whisper._MODELS:
	            # No need to download anything - Whisper will handle it
	            return self.url

	        if self.url.startswith("file://"):
	            # Get file path
	            return urlparse(self.url).path

	        # See if it is an URL
	        if self.url.startswith(("http://", "https://")):
	            # Extension taken from the URL's path component only, so that a query
	            # string or fragment does not end up in the local file name
	            extension = os.path.splitext(urlparse(self.url).path)[-1]
	            download_target = os.path.join(root_dir, self.name + extension)

	            if os.path.exists(download_target) and not os.path.isfile(download_target):
	                raise RuntimeError(f"{download_target} exists and is not a regular file")

	            if not os.path.isfile(download_target):
	                self._download_file(self.url, download_target)
	            else:
	                print(f"File {download_target} already exists, skipping download")

	            return download_target

	        # Must be a local file
	        return self.url

	    def _download_file(self, url: str, destination: str):
	        """
	        Download url to destination while showing a tqdm progress bar.

	        The data is written to "<destination>.part" and moved into place only after
	        the transfer has finished, so an interrupted download never leaves a truncated
	        file at destination (which would later be mistaken for a finished download).
	        """
	        # "import urllib" alone does not load the request submodule
	        import urllib.request

	        directory = os.path.dirname(destination)
	        if directory:
	            os.makedirs(directory, exist_ok=True)

	        partial_target = destination + ".part"

	        try:
	            with urllib.request.urlopen(url) as source, open(partial_target, "wb") as output:
	                # The header may be missing (e.g. chunked responses); tqdm accepts total=None
	                content_length = source.info().get("Content-Length")
	                has_length = content_length is not None and content_length.strip().isdigit()

	                with tqdm(
	                    total=int(content_length) if has_length else None,
	                    ncols=80,
	                    unit="iB",
	                    unit_scale=True,
	                    unit_divisor=1024,
	                ) as loop:
	                    while True:
	                        buffer = source.read(8192)
	                        if not buffer:
	                            break

	                        output.write(buffer)
	                        loop.update(len(buffer))

	            os.replace(partial_target, destination)
	        finally:
	            # Only still present when the download did not complete
	            if os.path.exists(partial_target):
	                os.remove(partial_target)

	class ApplicationConfig:
	    """Holds the WebUI settings and default transcription options, usually loaded from a JSON5 file."""

	    def __init__(self, models: List["ModelConfig"] = None, input_audio_max_duration: int = 600,
	                 share: bool = False, server_name: str = None, server_port: int = 7860, delete_uploaded_files: bool = True,
	                 default_model_name: str = "medium", default_vad: str = "silero-vad",
	                 vad_parallel_devices: str = "", vad_cpu_cores: int = 1, vad_process_timeout: int = 1800,
	                 auto_parallel: bool = False, output_dir: str = None,
	                 model_dir: str = None, device: str = None,
	                 verbose: bool = True, task: str = "transcribe", language: str = None,
	                 vad_merge_window: float = 5, vad_max_merge_size: float = 30,
	                 vad_padding: float = 1, vad_prompt_window: float = 3,
	                 temperature: float = 0, best_of: int = 5, beam_size: int = 5,
	                 patience: float = None, length_penalty: float = None,
	                 suppress_tokens: str = "-1", initial_prompt: str = None,
	                 condition_on_previous_text: bool = True, fp16: bool = True,
	                 temperature_increment_on_fallback: float = 0.2, compression_ratio_threshold: float = 2.4,
	                 logprob_threshold: float = -1.0, no_speech_threshold: float = 0.6):
	        """
	        Store every argument as an attribute of the same name.

	        models: List of available models. A fresh empty list is used when omitted.
	        device: Device name. When None, "cuda" is used if torch reports CUDA as
	                available, otherwise "cpu".

	        The attribute names must stay identical to the parameter names, because
	        update() rebuilds a configuration from self.__dict__.
	        """
	        # A new list per instance - a literal [] default would be shared by all instances
	        if models is None:
	            models = []

	        if device is None:
	            device = "cuda" if torch.cuda.is_available() else "cpu"

	        self.models = models

	        # WebUI settings
	        self.input_audio_max_duration = input_audio_max_duration
	        self.share = share
	        self.server_name = server_name
	        self.server_port = server_port
	        self.delete_uploaded_files = delete_uploaded_files

	        self.default_model_name = default_model_name
	        self.default_vad = default_vad
	        self.vad_parallel_devices = vad_parallel_devices
	        self.vad_cpu_cores = vad_cpu_cores
	        self.vad_process_timeout = vad_process_timeout
	        self.auto_parallel = auto_parallel
	        self.output_dir = output_dir

	        self.model_dir = model_dir
	        self.device = device
	        self.verbose = verbose
	        self.task = task
	        self.language = language
	        self.vad_merge_window = vad_merge_window
	        self.vad_max_merge_size = vad_max_merge_size
	        self.vad_padding = vad_padding
	        self.vad_prompt_window = vad_prompt_window
	        self.temperature = temperature
	        self.best_of = best_of
	        self.beam_size = beam_size
	        self.patience = patience
	        self.length_penalty = length_penalty
	        self.suppress_tokens = suppress_tokens
	        self.initial_prompt = initial_prompt
	        self.condition_on_previous_text = condition_on_previous_text
	        self.fp16 = fp16
	        self.temperature_increment_on_fallback = temperature_increment_on_fallback
	        self.compression_ratio_threshold = compression_ratio_threshold
	        self.logprob_threshold = logprob_threshold
	        self.no_speech_threshold = no_speech_threshold

	    def get_model_names(self):
	        """Return the name of every configured model, in configuration order."""
	        return [model.name for model in self.models]

	    def update(self, **new_values):
	        """
	        Return a new ApplicationConfig with the given attributes overridden.

	        This instance is not modified. The copy is built from self.__dict__, so it
	        refers to the same models list object as this instance. Keys are set with
	        setattr and are not checked against the known settings.
	        """
	        result = ApplicationConfig(**self.__dict__)

	        for key, value in new_values.items():
	            setattr(result, key, value)
	        return result

	    @staticmethod
	    def create_default(**kwargs):
	        """
	        Load the configuration file and apply kwargs on top of it.

	        The file path is read from the WHISPER_WEBUI_CONFIG environment variable and
	        falls back to "config.json5".
	        """
	        app_config = ApplicationConfig.parse_file(os.environ.get("WHISPER_WEBUI_CONFIG", "config.json5"))

	        # Update with kwargs
	        if kwargs:
	            app_config = app_config.update(**kwargs)
	        return app_config

	    @staticmethod
	    def parse_file(config_path: str):
	        """
	        Build an ApplicationConfig from a JSON5 file.

	        The "models" entry (default: empty list) is turned into ModelConfig objects;
	        every other top-level key is passed to the constructor as a keyword argument.
	        """
	        import json5

	        # Read as UTF-8 explicitly rather than relying on the platform's default encoding
	        with open(config_path, "r", encoding="utf-8") as f:
	            # Load using json5
	            data = json5.load(f)

	        data_models = data.pop("models", [])
	        models = [ModelConfig(**x) for x in data_models]

	        return ApplicationConfig(models, **data)