suisuyy commited on
Commit
a1dd53c
1 Parent(s): fbe6007

add status

Browse files
Files changed (4) hide show
  1. README.md +293 -0
  2. __pycache__/app.cpython-310.pyc +0 -0
  3. app.py +79 -7
  4. requirements.txt +4 -1
README.md CHANGED
@@ -10,3 +10,296 @@ pinned: false
10
  ---
11
 
12
  Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  ---
11
 
12
  Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
13
+
14
+
15
+ # All requirements used during development (full `pip freeze` output)
16
+ ```
17
+
18
+ absl-py==2.0.0
19
+ aiofiles==22.1.0
20
+ aiohttp==3.9.1
21
+ aiosignal==1.3.1
22
+ aiosqlite==0.19.0
23
+ altair==5.3.0
24
+ annotated-types==0.6.0
25
+ anyascii==0.3.2
26
+ anyio==4.2.0
27
+ argon2-cffi==23.1.0
28
+ argon2-cffi-bindings==21.2.0
29
+ arrow==1.3.0
30
+ asttokens==2.4.1
31
+ async-timeout==4.0.3
32
+ attrs==23.2.0
33
+ audioread==3.0.1
34
+ Babel==2.14.0
35
+ backoff==2.2.1
36
+ bangla==0.0.2
37
+ beautifulsoup4==4.12.2
38
+ bleach==6.1.0
39
+ blessed==1.20.0
40
+ blinker==1.7.0
41
+ blis==0.7.11
42
+ bnnumerizer==0.0.2
43
+ bnunicodenormalizer==0.1.6
44
+ boto3==1.34.17
45
+ botocore==1.34.17
46
+ Brotli==1.1.0
47
+ cachetools==5.3.2
48
+ catalogue==2.0.10
49
+ certifi==2023.11.17
50
+ cffi==1.16.0
51
+ charset-normalizer==3.3.2
52
+ click==8.1.7
53
+ cloudpathlib==0.16.0
54
+ colorama==0.4.6
55
+ comm==0.2.1
56
+ confection==0.1.4
57
+ contourpy==1.2.0
58
+ coqpit==0.0.17
59
+ cutlet==0.3.0
60
+ cycler==0.12.1
61
+ cymem==2.0.8
62
+ Cython==3.0.8
63
+ dateparser==1.1.8
64
+ debugpy==1.8.0
65
+ decorator==4.4.2
66
+ deepspeed==0.12.6
67
+ defusedxml==0.7.1
68
+ docopt==0.6.2
69
+ einops==0.7.0
70
+ emoji==2.8.0
71
+ encodec==0.1.1
72
+ entrypoints==0.4
73
+ exceptiongroup==1.2.0
74
+ executing==2.0.1
75
+ fastapi==0.109.0
76
+ fastjsonschema==2.19.1
77
+ ffmpy==0.3.2
78
+ filelock==3.13.1
79
+ Flask==3.0.0
80
+ fonttools==4.47.2
81
+ fqdn==1.5.1
82
+ frozenlist==1.4.1
83
+ fsspec==2023.12.2
84
+ fugashi==1.3.0
85
+ g2pkk==0.1.2
86
+ google-auth==2.26.2
87
+ google-auth-oauthlib==1.2.0
88
+ gpustat==1.1.1
89
+ gradio==4.8.0
90
+ gradio_client==0.10.0
91
+ grpcio==1.60.0
92
+ gruut==2.2.3
93
+ gruut-ipa==0.13.0
94
+ gruut-lang-de==2.0.0
95
+ gruut-lang-en==2.0.0
96
+ gruut-lang-es==2.0.0
97
+ gruut-lang-fr==2.0.2
98
+ h11==0.14.0
99
+ hangul-romanize==0.1.0
100
+ hjson==3.1.0
101
+ httpcore==1.0.2
102
+ httpx==0.26.0
103
+ huggingface-hub==0.20.2
104
+ idna==3.6
105
+ imageio==2.34.0
106
+ imageio-ffmpeg==0.4.9
107
+ importlib_resources==6.4.0
108
+ inflect==7.0.0
109
+ ipykernel==6.26.0
110
+ ipython==8.17.2
111
+ ipython-genutils==0.2.0
112
+ ipywidgets==8.1.1
113
+ isoduration==20.11.0
114
+ itsdangerous==2.1.2
115
+ jaconv==0.3.4
116
+ jamo==0.4.1
117
+ jedi==0.19.1
118
+ jieba==0.42.1
119
+ Jinja2==3.1.3
120
+ jmespath==1.0.1
121
+ joblib==1.3.2
122
+ json5==0.9.14
123
+ jsonlines==1.2.0
124
+ jsonpointer==2.4
125
+ jsonschema==4.20.0
126
+ jsonschema-specifications==2023.12.1
127
+ jupyter-events==0.9.0
128
+ jupyter-ydoc==0.2.5
129
+ jupyter_client==7.4.9
130
+ jupyter_core==5.7.1
131
+ jupyter_server==2.12.4
132
+ jupyter_server_fileid==0.9.1
133
+ jupyter_server_terminals==0.5.1
134
+ jupyter_server_ydoc==0.6.1
135
+ jupyterlab==3.6.1
136
+ jupyterlab-widgets==3.0.9
137
+ jupyterlab_pygments==0.3.0
138
+ jupyterlab_server==2.25.2
139
+ kiwisolver==1.4.5
140
+ langcodes==3.3.0
141
+ lazy_loader==0.3
142
+ librosa==0.10.0
143
+ lightning==2.1.2
144
+ lightning-cloud==0.5.57
145
+ lightning-utilities==0.10.0
146
+ lightning_sdk==0.0.13a0
147
+ linkify-it-py==2.0.3
148
+ llvmlite==0.41.1
149
+ loguru==0.7.2
150
+ Markdown==3.5.2
151
+ markdown-it-py==2.2.0
152
+ MarkupSafe==2.1.3
153
+ matplotlib==3.8.2
154
+ matplotlib-inline==0.1.6
155
+ mdit-py-plugins==0.3.3
156
+ mdurl==0.1.2
157
+ mistune==3.0.2
158
+ mojimoji==0.0.13
159
+ moviepy==1.0.3
160
+ mpmath==1.3.0
161
+ msgpack==1.0.7
162
+ multidict==6.0.4
163
+ murmurhash==1.0.10
164
+ mutagen==1.47.0
165
+ nbclassic==1.0.0
166
+ nbclient==0.9.0
167
+ nbconvert==7.14.1
168
+ nbformat==5.9.2
169
+ nest-asyncio==1.5.8
170
+ networkx==2.8.8
171
+ ninja==1.11.1.1
172
+ nltk==3.8.1
173
+ notebook==6.5.6
174
+ notebook_shim==0.2.3
175
+ num2words==0.5.13
176
+ numba==0.58.1
177
+ numpy==1.22.0
178
+ nvidia-ml-py==12.535.133
179
+ oauthlib==3.2.2
180
+ orjson==3.10.0
181
+ overrides==7.4.0
182
+ packaging==23.2
183
+ pandas==1.5.3
184
+ pandocfilters==1.5.0
185
+ parso==0.8.3
186
+ pexpect==4.9.0
187
+ pillow==10.2.0
188
+ platformdirs==4.1.0
189
+ pooch==1.8.0
190
+ preshed==3.0.9
191
+ proglog==0.1.10
192
+ prometheus-client==0.19.0
193
+ prompt-toolkit==3.0.43
194
+ protobuf==4.23.4
195
+ psutil==5.9.7
196
+ ptyprocess==0.7.0
197
+ pure-eval==0.2.2
198
+ py-cpuinfo==9.0.0
199
+ pyasn1==0.5.1
200
+ pyasn1-modules==0.3.0
201
+ PyAudio==0.2.14
202
+ pycparser==2.21
203
+ pycryptodomex==3.20.0
204
+ pydantic==2.5.3
205
+ pydantic_core==2.14.6
206
+ pydub==0.25.1
207
+ Pygments==2.17.2
208
+ PyJWT==2.8.0
209
+ pynndescent==0.5.11
210
+ pynvml==11.5.0
211
+ pyparsing==3.1.1
212
+ pypinyin==0.50.0
213
+ pysbd==0.3.4
214
+ python-crfsuite==0.9.10
215
+ python-dateutil==2.8.2
216
+ python-dotenv==1.0.0
217
+ python-json-logger==2.0.7
218
+ python-multipart==0.0.6
219
+ pytorch-lightning==2.1.2
220
+ pyttsx3==2.90
221
+ pytz==2023.3.post1
222
+ PyYAML==6.0.1
223
+ pyzmq==24.0.1
224
+ referencing==0.32.1
225
+ regex==2023.12.25
226
+ requests==2.31.0
227
+ requests-oauthlib==1.3.1
228
+ rfc3339-validator==0.1.4
229
+ rfc3986-validator==0.1.1
230
+ rich==13.7.0
231
+ rpds-py==0.17.1
232
+ rsa==4.9
233
+ s3transfer==0.10.0
234
+ safetensors==0.4.1
235
+ scikit-learn==1.3.2
236
+ scipy==1.11.4
237
+ semantic-version==2.10.0
238
+ Send2Trash==1.8.2
239
+ shellingham==1.5.4
240
+ six==1.16.0
241
+ smart-open==6.4.0
242
+ sniffio==1.3.0
243
+ soundfile==0.12.1
244
+ soupsieve==2.5
245
+ soxr==0.3.7
246
+ spaces==0.25.0
247
+ spacy==3.7.2
248
+ spacy-legacy==3.0.12
249
+ spacy-loggers==1.0.5
250
+ srsly==2.4.8
251
+ stack-data==0.6.3
252
+ stanza==1.6.1
253
+ starlette==0.35.1
254
+ stream2sentence==0.2.2
255
+ SudachiDict-core==20230927
256
+ SudachiPy==0.6.8
257
+ sympy==1.12
258
+ tensorboard==2.15.1
259
+ tensorboard-data-server==0.7.2
260
+ terminado==0.18.0
261
+ thinc==8.2.2
262
+ threadpoolctl==3.2.0
263
+ tinycss2==1.2.1
264
+ tokenizers==0.15.0
265
+ tomli==2.0.1
266
+ tomlkit==0.12.0
267
+ toolz==0.12.1
268
+ torch==2.1.1+cu118
269
+ torchaudio==2.1.1+cu118
270
+ torchmetrics==1.2.0
271
+ torchvision==0.16.1+cu121
272
+ tornado==6.4
273
+ tqdm==4.66.1
274
+ trainer==0.0.36
275
+ traitlets==5.14.1
276
+ transformers @ git+https://github.com/huggingface/transformers@81642d2b51de9d5e5aee1768abdc744d90f7f52d
277
+ triton==2.1.0
278
+ TTS==0.21.3
279
+ typer==0.9.0
280
+ types-python-dateutil==2.8.19.20240106
281
+ typing_extensions==4.9.0
282
+ tzdata==2023.4
283
+ tzlocal==5.2
284
+ uc-micro-py==1.0.3
285
+ umap-learn==0.5.5
286
+ Unidecode==1.3.8
287
+ unidic-lite==1.0.8
288
+ uri-template==1.3.0
289
+ urllib3==2.0.7
290
+ uvicorn==0.25.0
291
+ wasabi==1.1.2
292
+ wcwidth==0.2.13
293
+ weasel==0.3.4
294
+ webcolors==1.13
295
+ webencodings==0.5.1
296
+ websocket-client==1.7.0
297
+ websockets==11.0.3
298
+ Werkzeug==3.0.1
299
+ widgetsnbextension==4.0.9
300
+ xtts-api-server==0.8.3
301
+ y-py==0.6.2
302
+ yarl==1.9.4
303
+ ypy-websocket==0.8.4
304
+ yt-dlp==2024.3.10
305
+ ```
__pycache__/app.cpython-310.pyc CHANGED
Binary files a/__pycache__/app.cpython-310.pyc and b/__pycache__/app.cpython-310.pyc differ
 
app.py CHANGED
@@ -1,16 +1,18 @@
1
  import torch
2
  import time
3
-
 
4
  import gradio as gr
5
  import spaces
6
  from transformers import pipeline
7
  from transformers.pipelines.audio_utils import ffmpeg_read
8
 
9
  DEFAULT_MODEL_NAME = "distil-whisper/distil-large-v3"
10
-
11
  BATCH_SIZE = 8
12
 
13
  device = 0 if torch.cuda.is_available() else "cpu"
 
 
14
 
15
  def load_pipeline(model_name):
16
  return pipeline(
@@ -32,6 +34,11 @@ def transcribe(inputs, task, model_name):
32
  pipe = load_pipeline(model_name)
33
 
34
  start_time = time.time() # Record the start time
 
 
 
 
 
35
  text = pipe(inputs, batch_size=BATCH_SIZE, generate_kwargs={"task": task}, return_timestamps=True)["text"]
36
  end_time = time.time() # Record the end time
37
 
@@ -40,12 +47,65 @@ def transcribe(inputs, task, model_name):
40
  # Create the transcription time output with additional information
41
  transcription_time_output = (
42
  f"Transcription Time: {transcription_time:.2f} seconds\n"
 
43
  f"Model Used: {model_name}\n"
44
  f"Device Used: {'GPU' if torch.cuda.is_available() else 'CPU'}"
45
  )
46
 
47
  return text, transcription_time_output
48
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
49
  demo = gr.Blocks()
50
 
51
  mf_transcribe = gr.Interface(
@@ -57,7 +117,7 @@ mf_transcribe = gr.Interface(
57
  label="Model Name",
58
  value=DEFAULT_MODEL_NAME,
59
  placeholder="Enter the model name",
60
- info="Some available models: distil-whisper/distil-large-v3 distil-whisper/distil-medium.en Systran/faster-distil-whisper-large-v3 Systran/faster-whisper-large-v3 Systran/faster-whisper-medium openai/whisper-tiny , openai/whisper-base, openai/whisper-medium, openai/whisper-large-v3"
61
  ),
62
  ],
63
  outputs=[gr.TextArea(label="Transcription"), gr.TextArea(label="Transcription Info")],
@@ -79,7 +139,7 @@ file_transcribe = gr.Interface(
79
  label="Model Name",
80
  value=DEFAULT_MODEL_NAME,
81
  placeholder="Enter the model name",
82
- info="Some available models: openai/whisper-tiny, openai/whisper-base, openai/whisper-medium, openai/whisper-large-v2"
83
  ),
84
  ],
85
  outputs=[gr.TextArea(label="Transcription"), gr.TextArea(label="Transcription Info")],
@@ -91,8 +151,20 @@ file_transcribe = gr.Interface(
91
  ),
92
  allow_flagging="never",
93
  )
94
-
95
  with demo:
96
  gr.TabbedInterface([mf_transcribe, file_transcribe], ["Microphone", "Audio file"])
97
-
98
- demo.launch(share=True)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  import torch
2
  import time
3
+ import moviepy.editor as mp
4
+ import psutil
5
  import gradio as gr
6
  import spaces
7
  from transformers import pipeline
8
  from transformers.pipelines.audio_utils import ffmpeg_read
9
 
10
  DEFAULT_MODEL_NAME = "distil-whisper/distil-large-v3"
 
11
  BATCH_SIZE = 8
12
 
13
  device = 0 if torch.cuda.is_available() else "cpu"
14
+ if device == "cpu":
15
+ DEFAULT_MODEL_NAME = "openai/whisper-tiny"
16
 
17
  def load_pipeline(model_name):
18
  return pipeline(
 
34
  pipe = load_pipeline(model_name)
35
 
36
  start_time = time.time() # Record the start time
37
+
38
+ # Load the audio file and calculate its duration
39
+ audio = mp.AudioFileClip(inputs)
40
+ audio_duration = audio.duration
41
+
42
  text = pipe(inputs, batch_size=BATCH_SIZE, generate_kwargs={"task": task}, return_timestamps=True)["text"]
43
  end_time = time.time() # Record the end time
44
 
 
47
  # Create the transcription time output with additional information
48
  transcription_time_output = (
49
  f"Transcription Time: {transcription_time:.2f} seconds\n"
50
+ f"Audio Duration: {audio_duration:.2f} seconds\n"
51
  f"Model Used: {model_name}\n"
52
  f"Device Used: {'GPU' if torch.cuda.is_available() else 'CPU'}"
53
  )
54
 
55
  return text, transcription_time_output
56
 
57
def update_gpu_status():
    """Return a one-line status string per visible NVIDIA GPU.

    Returns a plain message when CUDA is unavailable, and an error string
    (never None) if querying gpustat fails, so the UI textbox always gets text.
    """
    if not torch.cuda.is_available():
        return "No Nvidia Device"
    try:
        # Imported lazily so the app still starts on machines without gpustat.
        from gpustat import GPUStatCollection

        gpu_stats = GPUStatCollection.new_query()
        lines = []
        for gpu in gpu_stats:
            memory_utilization = (gpu.memory_used / gpu.memory_total) * 100
            lines.append(
                f"GPU {gpu.index}: {gpu.name}, "
                f"Utilization: {gpu.utilization}%, "
                f"Memory Used: {gpu.memory_used}MB, "
                f"Memory Total: {gpu.memory_total}MB, "
                f"Memory Utilization: {memory_utilization:.2f}%"
            )
        # Report every GPU, not just the last one iterated over.
        return "\n".join(lines)
    except Exception as e:
        # Surface the failure to the caller instead of silently returning None.
        return f"Error getting GPU stats: {e}"
78
+ # def update_gpu_status():
79
+ # if torch.cuda.is_available():
80
+ # gpu_info = torch.cuda.get_device_name(0)
81
+ # gpu_memory = torch.cuda.mem_get_info(0)
82
+ # total_memory = gpu_memory[1] / (1024 * 1024)
83
+ # used_memory = (gpu_memory[1] - gpu_memory[0]) / (1024 * 1024)
84
+
85
+ # gpu_status = f"GPU: {gpu_info}\nTotal Memory: {total_memory:.2f} MB\nUsed Memory: {used_memory:.2f} MB"
86
+ # else:
87
+ # gpu_status = "No GPU available"
88
+ # return gpu_status
89
+
90
def update_cpu_status():
    """Return a one-line CPU-usage summary stamped with the current clock time."""
    from datetime import datetime

    # Timestamp lets the UI show that the reading is fresh.
    stamp = datetime.now().strftime("%H:%M:%S")
    usage = psutil.cpu_percent()
    return f"CPU Usage: {usage}% {stamp}"
100
+
101
def update_status():
    """Sample both monitors and return (gpu_status, cpu_status) for the UI."""
    return update_gpu_status(), update_cpu_status()
105
+
106
def refresh_status():
    """Button callback: re-sample and return the same payload as update_status()."""
    status = update_status()
    return status
108
+
109
  demo = gr.Blocks()
110
 
111
  mf_transcribe = gr.Interface(
 
117
  label="Model Name",
118
  value=DEFAULT_MODEL_NAME,
119
  placeholder="Enter the model name",
120
+ info="Some available models: distil-whisper/distil-large-v3 distil-whisper/distil-medium.en Systran/faster-distil-whisper-large-v3 Systran/faster-whisper-large-v3 Systran/faster-whisper-medium openai/whisper-tiny, openai/whisper-base, openai/whisper-medium, openai/whisper-large-v3",
121
  ),
122
  ],
123
  outputs=[gr.TextArea(label="Transcription"), gr.TextArea(label="Transcription Info")],
 
139
  label="Model Name",
140
  value=DEFAULT_MODEL_NAME,
141
  placeholder="Enter the model name",
142
+ info="Some available models: openai/whisper-tiny, openai/whisper-base, openai/whisper-medium, openai/whisper-large-v2",
143
  ),
144
  ],
145
  outputs=[gr.TextArea(label="Transcription"), gr.TextArea(label="Transcription Info")],
 
151
  ),
152
  allow_flagging="never",
153
  )
 
with demo:
    # Two transcription tabs defined above.
    gr.TabbedInterface([mf_transcribe, file_transcribe], ["Microphone", "Audio file"])

    # Manual refresh control for the status readouts.
    with gr.Row():
        refresh_button = gr.Button("Refresh Status")

    gpu_status_output = gr.Textbox(label="GPU Status", interactive=False)
    cpu_status_output = gr.Textbox(label="CPU Status", interactive=False)

    # Button press re-samples both status strings.
    refresh_button.click(refresh_status, None, [gpu_status_output, cpu_status_output])

    # Auto-populate on page load and re-poll every 2 seconds, bypassing the queue.
    demo.load(update_status, inputs=None, outputs=[gpu_status_output, cpu_status_output], every=2, queue=False)

# Launch the Gradio app with a public share link.
demo.launch(share=True)
requirements.txt CHANGED
@@ -1,4 +1,7 @@
1
  git+https://github.com/huggingface/transformers
2
  torch
3
  yt-dlp
4
- gradio==4.8.0
 
 
 
 
1
  git+https://github.com/huggingface/transformers
2
  torch
3
  yt-dlp
4
+ gradio==4.8.0
5
+ gpustat
6
+ moviepy
7
+ freeze