Push model using huggingface_hub.

Files changed (3) hide show

README.md ADDED Viewed

+---
+license: mit
+tags:
+- denseav
+- pytorch_model_hub_mixin
+- model_hub_mixin
+---
+This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
+- Library: https://github.com/mhamilton723/DenseAV
+- Docs: [More Information Needed]

config.json ADDED Viewed

+{
+  "adaptive_clipping": true,
+  "audio_aligner_type": "audio_sa_3_3_pool_2",
+  "audio_lora": false,
+  "audio_lora_rank": 8,
+  "audio_model_type": "hubert",
+  "audio_pool_width": 1,
+  "cal_balance_weight": 0.1,
+  "cal_init": 1.0,
+  "channel_dropout": 0.0,
+  "code_dim": 384,
+  "disentangle_weight": 0.0,
+  "finetune_audio_model": true,
+  "finetune_image_model": false,
+  "gather_tensors": true,
+  "gradient_clipping": 10.0,
+  "head_agg": "max_elementwise",
+  "image_aligner_type": "image_linear",
+  "image_lora": true,
+  "image_lora_rank": 8,
+  "image_model_token_type": "token",
+  "image_model_type": "dino8",
+  "image_pool_width": 2,
+  "learn_audio_cls": true,
+  "loss_leak": 0.0,
+  "loss_margin": 0.0,
+  "loss_type": "nce",
+  "lr": 5e-05,
+  "lr_cycle_length": 50000,
+  "lr_schedule": null,
+  "lr_warmup": 1000,
+  "mask_silence": true,
+  "memory_buffer_size": 0,
+  "mixup_weight": 0.0,
+  "neg_audio": true,
+  "neg_audio_weight": 0.01,
+  "nonneg_pressure": 0.01,
+  "nonneg_sim": false,
+  "norm_vectors": false,
+  "optimizer": "adam",
+  "output_root": "/mnt/azureml/cr/j/5e46ccec7c6e408e8496ffdbf5769734/cap/data-capability/wd/INPUT_video_analysis_store_3_video_analysis_store_3",
+  "pretrain_lr": 5e-05,
+  "silence_l1": 0.01,
+  "silence_l2": 0.0,
+  "sim_agg_heads": 2,
+  "sim_agg_type": "misa",
+  "sim_use_cls": false,
+  "spatial_dropout": 0.0,
+  "specialization_weight": 0.05,
+  "tv_weight": 0.01,
+  "use_cached_embs": false
+}

model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c46217bb89ca8d6ab27b7c40cdee909aff29e0be38c28a4cd2201d33b3c3b72b
+size 1365469596