Upload 5 files

Browse files

Files changed (5) hide show

adapter_config.json +48 -0
adapter_model.safetensors +3 -0
ema_shadow.pt +3 -0
optimizer.pt +3 -0
train_state.json +102 -0

adapter_config.json ADDED Viewed

	@@ -0,0 +1,48 @@

+{
+  "alora_invocation_tokens": null,
+  "alpha_pattern": {},
+  "arrow_config": null,
+  "auto_mapping": {
+    "base_model_class": "TextToLatentRFDiT",
+    "parent_library": "irodori_tts.model"
+  },
+  "base_model_name_or_path": null,
+  "bias": "none",
+  "corda_config": null,
+  "ensure_weight_tying": false,
+  "eva_config": null,
+  "exclude_modules": null,
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layer_replication": null,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "loftq_config": {},
+  "lora_alpha": 32.0,
+  "lora_bias": false,
+  "lora_dropout": 0.05,
+  "lora_ga_config": null,
+  "megatron_config": null,
+  "megatron_core": "megatron.core",
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "peft_version": "0.19.1",
+  "qalora_group_size": 16,
+  "r": 16,
+  "rank_pattern": {},
+  "revision": null,
+  "target_modules": [
+    "wk",
+    "wo",
+    "wv",
+    "wq"
+  ],
+  "target_parameters": null,
+  "task_type": null,
+  "trainable_token_indices": null,
+  "use_bdlora": null,
+  "use_dora": false,
+  "use_qalora": false,
+  "use_rslora": false
+}

adapter_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2fc10166d27b4a7b1defee3c77664ced749196d72062eaec88cfc583840b10f1
+size 6847184

ema_shadow.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4d5d9103dc03853300da50d10c2782cfe68b8350832935ef40230859f1c4c73f
+size 13719297

optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:93ca2ca9f6962dd73a72da87411292a803de2f6c32724e605b4422d0f40a7081
+size 13836619

train_state.json ADDED Viewed

	@@ -0,0 +1,102 @@

+{
+  "step": 3000,
+  "base_model_path": "E:\\Emoji-TTS\\checkpoints\\Aratako_Irodori-TTS-500M-v2\\model.safetensors",
+  "base_model_sha256": "e5add885303babe328eae2c426475e41bc2f2aca2bcb010a2ceb6b6ddd1b8d9c",
+  "base_model_config": {
+    "latent_dim": 32,
+    "latent_patch_size": 1,
+    "model_dim": 1280,
+    "num_layers": 12,
+    "num_heads": 20,
+    "mlp_ratio": 2.875,
+    "text_mlp_ratio": 2.6,
+    "speaker_mlp_ratio": 2.6,
+    "dropout": 0.0,
+    "text_vocab_size": 99574,
+    "text_tokenizer_repo": "llm-jp/llm-jp-3-150m",
+    "text_add_bos": true,
+    "text_dim": 512,
+    "text_layers": 10,
+    "text_heads": 8,
+    "speaker_dim": 768,
+    "speaker_layers": 8,
+    "speaker_heads": 12,
+    "speaker_patch_size": 1,
+    "timestep_embed_dim": 512,
+    "adaln_rank": 192,
+    "norm_eps": 1e-05
+  },
+  "lora_config": {
+    "r": 16,
+    "lora_alpha": 32.0,
+    "lora_dropout": 0.05,
+    "target_modules": [
+      "wq",
+      "wk",
+      "wv",
+      "wo"
+    ]
+  },
+  "train_config": {
+    "manifest_path": "E:\\Emoji-TTS\\data\\train_manifest.jsonl",
+    "output_dir": "E:\\Emoji-TTS\\lora\\my_lora",
+    "batch_size": 4,
+    "num_workers": 2,
+    "dataloader_persistent_workers": false,
+    "dataloader_prefetch_factor": 2,
+    "allow_tf32": false,
+    "compile_model": false,
+    "learning_rate": 0.0001,
+    "weight_decay": 0.01,
+    "optimizer": "adamw",
+    "adam_beta1": 0.9,
+    "adam_beta2": 0.999,
+    "adam_eps": 1e-08,
+    "muon_momentum": 0.95,
+    "muon_adjust_lr_fn": "match_rms_adamw",
+    "lr_scheduler": "none",
+    "warmup_steps": 0,
+    "caption_warmup": false,
+    "caption_warmup_steps": 0,
+    "stable_steps": 0,
+    "min_lr_scale": 0.1,
+    "max_steps": 3000,
+    "log_every": 10,
+    "save_every": 500,
+    "checkpoint_best_n": 0,
+    "valid_ratio": 0.1,
+    "valid_every": 100,
+    "progress": true,
+    "progress_all_ranks": false,
+    "precision": "bf16",
+    "grad_clip_norm": 1.0,
+    "gradient_accumulation_steps": 1,
+    "max_text_len": 256,
+    "max_caption_len": null,
+    "text_condition_dropout": 0.1,
+    "caption_condition_dropout": 0.1,
+    "speaker_condition_dropout": 0.1,
+    "max_latent_steps": 750,
+    "fixed_target_latent_steps": null,
+    "fixed_target_full_mask": false,
+    "timestep_logit_mean": 0.0,
+    "timestep_logit_std": 1.0,
+    "timestep_stratified": false,
+    "timestep_min": 0.001,
+    "timestep_max": 0.999,
+    "wandb_enabled": false,
+    "wandb_project": null,
+    "wandb_entity": null,
+    "wandb_run_name": null,
+    "wandb_mode": "online",
+    "ddp_find_unused_parameters": false,
+    "lora_enabled": false,
+    "lora_r": 16,
+    "lora_alpha": 32,
+    "lora_dropout": 0.0,
+    "lora_bias": "none",
+    "lora_target_modules": "diffusion_attn",
+    "seed": 0
+  },
+  "ema_decay": 0.9999
+}