aquif-ai
/

aquif-Dream-6B-Exp

video-generation

audio-synthesis

unified-architecture

Model card Files Files and versions

aquiffoo committed 24 days ago

Commit

e3d25cc

·

verified ·

1 Parent(s): ce99d13

Upload architecture_metadata.json

Files changed (1) hide show

architecture_metadata.json +52 -0

architecture_metadata.json ADDED Viewed

	@@ -0,0 +1,52 @@

+{
+  "model_name": "aquif-Dream-6B",
+  "model_type": "aquif_dream",
+  "organization": "aquif-ai",
+  "total_parameters": 5920000000,
+  "components": {
+    "video_generation": {
+      "model": "Wan2.2-TI2V-5B",
+      "path": "video-gen",
+      "parameters": 5000000000,
+      "role": "Primary video synthesis engine",
+      "capabilities": [
+        "text-to-video",
+        "image-to-video"
+      ]
+    },
+    "video_understanding": {
+      "model": "SmolVLM2-500M-Video-Instruct",
+      "path": "captioner",
+      "parameters": 500000000,
+      "role": "Caption generation and video understanding",
+      "capabilities": [
+        "video-captioning",
+        "visual-reasoning"
+      ]
+    },
+    "audio_synthesis": {
+      "model": "Suno Bark Small",
+      "path": "audio-gen",
+      "parameters": 420000000,
+      "role": "Text-to-speech with emotion control",
+      "capabilities": [
+        "text-to-speech",
+        "emotional-expressiveness"
+      ]
+    }
+  },
+  "unified_embedding_dim": 768,
+  "adapter_architecture": "ModalityBridge (2-3 layer MLPs)",
+  "synchronization": "Cross-attention based temporal alignment",
+  "video_specs": {
+    "resolution": "512x512",
+    "fps": 24,
+    "max_duration": 10,
+    "format": "latent-space"
+  },
+  "audio_specs": {
+    "sample_rate": 24000,
+    "channels": 1,
+    "codec": "PCM"
+  }
+}