Spaces:

SamSak09
/

flood-diffusion-api

Running

App Files Files Community

SamSak09 committed 17 days ago

Commit

6894e36

verified ·

1 Parent(s): 0f93e54

Upload 3 files

Browse files

Files changed (3) hide show

Dockerfile +17 -0
app2.py +69 -0
requirements.txt +27 -0

Dockerfile ADDED Viewed

	@@ -0,0 +1,17 @@

+# Use an official Python runtime as a parent image
+FROM python:3.10-slim
+# Hugging Face Spaces documents that Docker containers run as UID 1000;
+# create a matching user so the process has a writable home directory
+# (app2.py downloads the model at startup, which needs a writable cache)
+RUN useradd -m -u 1000 user
+USER user
+ENV HOME=/home/user \
+    PATH=/home/user/.local/bin:$PATH
+# Set the working directory inside the user's home
+WORKDIR $HOME/app
+# Copy only the dependency list first so the install layer below stays
+# cached until requirements.txt itself changes
+COPY --chown=user requirements.txt requirements.txt
+# Install dependencies
+RUN pip install --no-cache-dir -r requirements.txt
+# Copy the rest of the application into the container
+COPY --chown=user . .
+# Hugging Face requires applications to run on port 7860
+EXPOSE 7860
+# Run app2.py when the container launches
+CMD ["python", "app2.py"]

app2.py ADDED Viewed

	@@ -0,0 +1,69 @@

+from flask import Flask, request, jsonify
+from flask_sock import Sock
+from transformers import AutoModel
+import torch
+import time
+import json
+from flask_cors import CORS
+app = Flask(__name__)
+CORS(app)
+sock = Sock(app) # Initialize WebSocket support
+print("[SYSTEM] Booting up Network Server...")
+print("[SYSTEM] Loading FloodDiffusionTiny model from Hugging Face...")
+# 1. Load the model
+model = AutoModel.from_pretrained(
+    "ShandaAI/FloodDiffusionTiny",
+    trust_remote_code=True
+)
+# 2. M1 Architecture Override
+device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+model = model.to(device)
+print(f"[SYSTEM] Model loaded successfully onto device: {device}")
+# --- THE NEW WEBSOCKET PIPELINE ---
+@sock.route('/api/generate_stream')
+def stream_motion(ws):
+    print("\n[NETWORK] 🟢 WebSocket Connection Opened! Client connected.")
+    # Keep the connection open forever
+    while True:
+        try:
+            # 1. Wait for the live prompt from the client's text box
+            raw_data = ws.receive()
+            if raw_data is None:
+                continue
+            data = json.loads(raw_data)
+            text_prompt = data.get('prompt', '')
+            print(f"[NETWORK] Live Prompt Received: '{text_prompt}'")
+            start_time = time.time()
+            # 2. Server Processing (Inference)
+            motion_joints = model(text_prompt, length=15, output_joints=True)
+            processing_time = (time.time() - start_time) * 1000
+            # 3. Format Network Payload
+            payload = {
+                "status": "success",
+                "latency_ms": round(processing_time, 2),
+                "tensor_shape": list(motion_joints.shape),
+                "data": motion_joints.tolist()
+            }
+            # 4. Push data back through the pipe instantly!
+            ws.send(json.dumps(payload))
+            print(f"[NETWORK] ⚡ Streamed 30 frames to client in {processing_time:.2f}ms")
+        except Exception as e:
+            print(f"[NETWORK] 🔴 WebSocket Error or Disconnect: {e}")
+            break
+if __name__ == '__main__':
+    # --- CHANGE THE PORT TO 7860 ---
+    app.run(host='0.0.0.0', port=7860, debug=False)

requirements.txt ADDED Viewed

	@@ -0,0 +1,27 @@

+torch
+lightning
+torch_ema
+transformers
+torchmetrics
+omegaconf
+diffusers
+tensorboard
+wandb
+# render
+flask
+trimesh
+pyrender
+moviepy
+matplotlib
+Pillow
+imageio[ffmpeg]
+# api server (app2.py imports flask_sock and flask_cors)
+flask-sock
+flask-cors
+# wan
+ftfy
+einops
+# For flash attention
+# conda install -c nvidia cuda-toolkit
+# export CUDA_HOME=$CONDA_PREFIX && echo "CUDA_HOME set to: $CUDA_HOME"
+# pip install flash-attn --no-build-isolation