aquiffoo committed on
Commit
e3d25cc
·
verified ·
1 Parent(s): ce99d13

Upload architecture_metadata.json

Browse files
Files changed (1) hide show
  1. architecture_metadata.json +52 -0
architecture_metadata.json ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name": "aquif-Dream-6B",
3
+ "model_type": "aquif_dream",
4
+ "organization": "aquif-ai",
5
+ "total_parameters": 5920000000,
6
+ "components": {
7
+ "video_generation": {
8
+ "model": "Wan2.2-TI2V-5B",
9
+ "path": "video-gen",
10
+ "parameters": 5000000000,
11
+ "role": "Primary video synthesis engine",
12
+ "capabilities": [
13
+ "text-to-video",
14
+ "image-to-video"
15
+ ]
16
+ },
17
+ "video_understanding": {
18
+ "model": "SmolVLM2-500M-Video-Instruct",
19
+ "path": "captioner",
20
+ "parameters": 500000000,
21
+ "role": "Caption generation and video understanding",
22
+ "capabilities": [
23
+ "video-captioning",
24
+ "visual-reasoning"
25
+ ]
26
+ },
27
+ "audio_synthesis": {
28
+ "model": "Suno Bark Small",
29
+ "path": "audio-gen",
30
+ "parameters": 420000000,
31
+ "role": "Text-to-speech with emotion control",
32
+ "capabilities": [
33
+ "text-to-speech",
34
+ "emotional-expressiveness"
35
+ ]
36
+ }
37
+ },
38
+ "unified_embedding_dim": 768,
39
+ "adapter_architecture": "ModalityBridge (2-3 layer MLPs)",
40
+ "synchronization": "Cross-attention based temporal alignment",
41
+ "video_specs": {
42
+ "resolution": "512x512",
43
+ "fps": 24,
44
+ "max_duration": 10,
45
+ "format": "latent-space"
46
+ },
47
+ "audio_specs": {
48
+ "sample_rate": 24000,
49
+ "channels": 1,
50
+ "codec": "PCM"
51
+ }
52
+ }