jshrdt committed on
Commit
3e85595
·
verified ·
1 Parent(s): 82fcf78

Upload ft_config.json

Browse files
Files changed (1) hide show
  1. ft_config.json +52 -0
ft_config.json ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "modelname": "openai/whisper-large-v2",
3
+ "gen_args": {"num_beams": 3},
4
+ "fallback": [7,5,1],
5
+ "corpora": {
6
+ "train": {
7
+ "thchs": {
8
+ "languages": "cmn",
9
+ "limit": [
10
+ 1000
11
+ ]
12
+ }
13
+ },
14
+ "dev": {
15
+ "thchs": {
16
+ "languages": "cmn",
17
+ "limit": [
18
+ 500
19
+ ]
20
+ }
21
+ }
22
+ },
23
+ "hyperparams": {
24
+ "output_dir": "../models/lowhipa-large-thchs30",
25
+ "overwrite_output_dir": "True",
26
+ "peft": "True",
27
+ "per_device_train_batch_size": 16,
28
+ "gradient_accumulation_steps": 1,
29
+ "learning_rate": 0.001,
30
+ "warmup_ratio": 0.1,
31
+ "max_steps": 630,
32
+ "gradient_checkpointing": "True",
33
+ "fp16": "True",
34
+ "eval_strategy": "steps",
35
+ "per_device_eval_batch_size": 8,
36
+ "predict_with_generate": "True",
37
+ "generation_max_length": 448,
38
+ "save_steps": 126,
39
+ "eval_steps": 126,
40
+ "logging_steps": 63,
41
+ "logging_first_step": "True",
42
+ "report_to": [
43
+ "tensorboard"
44
+ ],
45
+ "load_best_model_at_end": "False",
46
+ "metric_for_best_model": "pfer",
47
+ "greater_is_better": "False",
48
+ "hub_private_repo": "True",
49
+ "push_to_hub": "False",
50
+ "torch_empty_cache_steps": 4
51
+ }
52
+ }