mazesmazes committed on
Commit
ee337a7
·
verified ·
1 Parent(s): 4623ffa

Training in progress, step 14000

Browse files
Files changed (3) hide show
  1. config.json +1 -4
  2. model.safetensors +1 -1
  3. training_args.bin +2 -2
config.json CHANGED
@@ -64,11 +64,9 @@
64
  "type": "audio"
65
  }
66
  },
67
- "decoder_model_name": "HuggingFaceTB/SmolLM3-3B",
68
  "downsample_rate": 16,
69
  "dtype": "bfloat16",
70
  "encoder_dim": 1280,
71
- "encoder_model_name": "openai/whisper-large-v3-turbo",
72
  "inference_diversity_penalty": 0.0,
73
  "inference_warmup_tokens": 10,
74
  "label_smoothing": 0.0,
@@ -83,13 +81,12 @@
83
  "projector_dropout": 0.0,
84
  "projector_hidden_dim": null,
85
  "projector_init_std": 0.02,
86
- "projector_input_noise": 0.02,
87
  "projector_num_layers": 2,
88
  "projector_pool_stride": 2,
89
  "projector_type": "mlp",
90
  "router_aux_loss_coef": 0.01,
91
  "system_prompt": "/no_think /system_override",
92
- "temperature": 0.1,
93
  "text_config": {
94
  "_name_or_path": "HuggingFaceTB/SmolLM3-3B",
95
  "architectures": [
 
64
  "type": "audio"
65
  }
66
  },
 
67
  "downsample_rate": 16,
68
  "dtype": "bfloat16",
69
  "encoder_dim": 1280,
 
70
  "inference_diversity_penalty": 0.0,
71
  "inference_warmup_tokens": 10,
72
  "label_smoothing": 0.0,
 
81
  "projector_dropout": 0.0,
82
  "projector_hidden_dim": null,
83
  "projector_init_std": 0.02,
84
+ "projector_input_noise": 0.0,
85
  "projector_num_layers": 2,
86
  "projector_pool_stride": 2,
87
  "projector_type": "mlp",
88
  "router_aux_loss_coef": 0.01,
89
  "system_prompt": "/no_think /system_override",
 
90
  "text_config": {
91
  "_name_or_path": "HuggingFaceTB/SmolLM3-3B",
92
  "architectures": [
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1530d120be6020e944be23373fcca73ec2a4dcac75f473117ad95a68332322fc
3
  size 23462224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25d44f082c613a5981137d73a0fa57706f3dd2d2fed56ad80f553b27b4f11471
3
  size 23462224
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a614500a8c2b6ea97976e7dbd2e49f64b5adef85d1fffcffceebe71b6fd4ce58
3
- size 5905
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:316f75ee83a5b4c47f214306644d6417f18aaad67f6f41d0e1950ffdaafdc9f9
3
+ size 5969