Spaces:

tudeplom
/

api-stt

Sleeping

App Files Community

tudeplom committed on Mar 28

Commit

ceda7cb

verified ·

1 Parent(s): d102cd2

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -76

app.py CHANGED Viewed

@@ -1,12 +1,10 @@
 import os
 import wave
 import json
 import uuid
-import numpy as np
-from flask import Flask, request, jsonify
-from flask_cors import CORS
 from vosk import Model, KaldiRecognizer
-from flasgger import Swagger
 # Thư mục chứa model
 MODEL_PATH = "model/vosk-model"
@@ -19,78 +17,29 @@ if not os.path.exists(MODEL_PATH):
 print("\u2705 Đang tải model Vosk...")
 model = Model(MODEL_PATH)
-# Khởi tạo Flask app
-app = Flask(__name__)
-CORS(app)
-Swagger(app)
-@app.route("/")
-def home():
-    """API Home
-    ---
-    responses:
-      200:
-        description: API đang chạy
-    """
-    return "\u2705 Vosk STT API đang chạy!"
-@app.route("/stt", methods=["POST"])
-def stt():
-    """Chuyển đổi giọng nói thành văn bản (Speech-to-Text)
-    ---
-    consumes:
-      - multipart/form-data
-    parameters:
-      - in: formData
-        name: audio
-        type: file
-        required: true
-        description: File âm thanh WAV mono PCM
-    responses:
-      200:
-        description: Kết quả chuyển đổi văn bản
-        schema:
-          type: object
-          properties:
-            text:
-              type: string
-              example: "Xin chào thế giới"
-      400:
-        description: Lỗi nếu file âm thanh không hợp lệ hoặc không tìm thấy
-    """
-    if "audio" not in request.files:
-        return jsonify({"error": "Không tìm thấy file audio!"}), 400
-    audio_file = request.files["audio"]
-    file_path = f"/tmp/{uuid.uuid4()}.wav"  # Lưu vào thư mục tạm để tránh lỗi quyền hạn
-    audio_file.save(file_path)
-    try:
-        # Mở file âm thanh
-        wf = wave.open(file_path, "rb")
-        # Kiểm tra file có đúng định dạng WAV mono không
-        if wf.getnchannels() != 1 or wf.getsampwidth() != 2 or wf.getcomptype() != "NONE":
-            return jsonify({"error": "File audio phải là WAV mono PCM!"}), 400
-        rec = KaldiRecognizer(model, wf.getframerate())
-        result_text = ""
-        while True:
-            data = wf.readframes(4000)
-            if len(data) == 0:
-                break
-            if rec.AcceptWaveform(data):
-                result_text += json.loads(rec.Result())["text"] + " "
-        return jsonify({"text": result_text.strip()})
-    except Exception as e:
-        return jsonify({"error": str(e)}), 500
     finally:
-        wf.close()
-        os.remove(file_path)  # Xóa file tạm
-if __name__ == "__main__":
-    app.run(host="0.0.0.0", port=7860, debug=True)

 import os
 import wave
 import json
+import asyncio
+import websockets
 import uuid
 from vosk import Model, KaldiRecognizer
 # Thư mục chứa model
 MODEL_PATH = "model/vosk-model"
 print("\u2705 Đang tải model Vosk...")
 model = Model(MODEL_PATH)
+async def recognize_audio(websocket, path):
+    print("🔵 Kết nối WebSocket mới...")
+    rec = KaldiRecognizer(model, 16000)
+    result_text = ""
+    try:
+        async for message in websocket:
+            if isinstance(message, bytes):  # Kiểm tra nếu dữ liệu là bytes
+                if rec.AcceptWaveform(message):
+                    result = json.loads(rec.Result())
+                    text = result.get("text", "")
+                    result_text += text + " "
+                    await websocket.send(json.dumps({"text": text}))
+            else:
+                await websocket.send(json.dumps({"error": "Dữ liệu không hợp lệ"}))
+    except websockets.exceptions.ConnectionClosed:
+        print("🔴 Kết nối WebSocket đã đóng")
     finally:
+        print(f"✅ Văn bản cuối cùng: {result_text.strip()}")
+# Chạy server WebSocket
+start_server = websockets.serve(recognize_audio, "0.0.0.0", 7860)
+print("🚀 WebSocket STT server đang chạy trên ws://0.0.0.0:7860")
+asyncio.get_event_loop().run_until_complete(start_server)
+asyncio.get_event_loop().run_forever()