hf-test committed on
Commit
fb46903
1 Parent(s): 753fa5f

add language model

Browse files
alphabet.json ADDED
@@ -0,0 +1 @@
 
1
+ {"labels": [" ", "a", "b", "c", "d", "e", "f", "g", "h", "i", "j", "k", "l", "m", "n", "o", "p", "q", "r", "s", "t", "u", "v", "w", "x", "y", "z", "\u00e4", "\u00e5", "\u00e9", "\u00f4", "\u00f6", "\u00fc", "\u2047", "", "<s>", "</s>"], "is_bpe": false}
eval.py ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ from datasets import load_dataset, load_metric, Audio, Dataset
3
+ from transformers import pipeline, AutoFeatureExtractor
4
+ import re
5
+ import argparse
6
+ import unicodedata
7
+ from typing import Dict
8
+
9
+
10
def log_results(result: Dataset, args: argparse.Namespace):
    """Compute WER/CER for ``result``, print them and write them to disk.

    NOTE: the metric computation is the shared scoring path (originally
    marked "DO NOT CHANGE") and is intentionally left as it was. Only the
    handling of the optional per-example logs and the file encoding differ.

    Args:
        result: dataset exposing a "target" and a "prediction" column of
            strings.
        args: parsed command-line arguments; ``dataset``, ``config``,
            ``split`` and ``log_outputs`` are read by attribute.

    Side effects:
        Prints the metrics and writes ``{dataset_id}_eval_results.txt``.
        When ``args.log_outputs`` is truthy, also writes
        ``log_{dataset_id}_predictions.txt`` and
        ``log_{dataset_id}_targets.txt``.
    """

    log_outputs = args.log_outputs
    dataset_id = "_".join(args.dataset.split("/") + [args.config, args.split])

    # load metric
    wer = load_metric("wer")
    cer = load_metric("cer")

    # compute metrics
    wer_result = wer.compute(references=result["target"], predictions=result["prediction"])
    cer_result = cer.compute(references=result["target"], predictions=result["prediction"])

    # print & log results
    result_str = (
        f"WER: {wer_result}\n"
        f"CER: {cer_result}"
    )
    print(result_str)

    # Explicit UTF-8 so the output does not depend on the platform default
    # encoding (transcripts may contain non-ASCII characters).
    with open(f"{dataset_id}_eval_results.txt", "w", encoding="utf-8") as f:
        f.write(result_str)

    # log all results in text file. Possibly interesting for analysis.
    # `--log_outputs` is a store_true flag, so it is True/False and never
    # None; test its truthiness so that omitting the flag really skips this.
    if log_outputs:
        pred_file = f"log_{dataset_id}_predictions.txt"
        target_file = f"log_{dataset_id}_targets.txt"

        with open(pred_file, "w", encoding="utf-8") as p, open(target_file, "w", encoding="utf-8") as t:

            # mapping function to write output: one index line followed by
            # one text line per example, in both files
            def write_to_file(batch, i):
                p.write(f"{i}" + "\n")
                p.write(batch["prediction"] + "\n")
                t.write(f"{i}" + "\n")
                t.write(batch["target"] + "\n")

            result.map(write_to_file, with_indices=True)
49
+
50
+
51
def normalize_text(text: str) -> str:
    """Normalize a reference transcript before it is scored.

    DO ADAPT FOR YOUR USE CASE.

    Steps, in order: NFKC-normalize, lowercase, strip the ignored
    punctuation characters, collapse every run of whitespace to one space.

    Args:
        text: raw reference sentence.

    Returns:
        The normalized sentence, without leading or trailing whitespace.
    """

    # IMPORTANT: this should correspond to the chars that were ignored during training.
    # Raw string: the backslash escapes are meant for the regex engine, not
    # for the Python string literal.
    chars_to_ignore_regex = r'[,?.!\-;:"“%‘”�—’…–]'

    # normalize non-standard (stylized) unicode characters first: some
    # stylized capitals have no lowercase mapping of their own and only turn
    # into ordinary (uppercase) letters after NFKC, so lowercasing must
    # happen afterwards to catch them.
    text = unicodedata.normalize('NFKC', text)
    text = text.lower()
    # remove punctuation
    text = re.sub(chars_to_ignore_regex, "", text)

    # Let's also make sure we split on all kinds of newlines, spaces, etc...
    text = " ".join(text.split())

    return text
66
+
67
+
68
def main(args):
    """Transcribe the requested dataset split with the model and score it.

    Reads ``dataset``, ``config``, ``split``, ``model_id``,
    ``chunk_length_s`` and ``stride_length_s`` from ``args`` and finally
    hands the predictions to ``log_results``.
    """
    # Fetch the evaluation split (use_auth_token=True is passed to the loader).
    eval_set = load_dataset(args.dataset, args.config, split=args.split, use_auth_token=True)

    # For a quick smoke test, restrict the run first,
    # e.g. with eval_set.select(range(10)).

    # Decode the audio at the sampling rate reported by the model's
    # feature extractor.
    extractor = AutoFeatureExtractor.from_pretrained(args.model_id)
    target_rate = extractor.sampling_rate
    eval_set = eval_set.cast_column("audio", Audio(sampling_rate=target_rate))

    # Speech-recognition pipeline used for inference.
    recognizer = pipeline("automatic-speech-recognition", model=args.model_id)

    def transcribe(example):
        """Attach the model transcription and the normalized reference."""
        output = recognizer(
            example["audio"]["array"],
            chunk_length_s=args.chunk_length_s,
            stride_length_s=args.stride_length_s,
        )
        example["prediction"] = output["text"]
        example["target"] = normalize_text(example["sentence"])
        return example

    # Run inference on every example, keeping only the columns added above.
    original_columns = eval_set.column_names
    scored = eval_set.map(transcribe, remove_columns=original_columns)

    # Compute and log the metrics (shared scoring function).
    log_results(scored, args)
99
+
100
+
101
if __name__ == "__main__":
    cli = argparse.ArgumentParser()

    # Mandatory string options: which model to evaluate and on which data.
    required_options = (
        ("--model_id", "Model identifier. Should be loadable with 🤗 Transformers"),
        ("--dataset", "Dataset name to evaluate the `model_id`. Should be loadable with 🤗 Datasets"),
        ("--config", "Config of the dataset. *E.g.* `'en'` for Common Voice"),
        ("--split", "Split of the dataset. *E.g.* `'test'`"),
    )
    for flag, description in required_options:
        cli.add_argument(flag, type=str, required=True, help=description)

    # Optional chunking parameters, forwarded to the recognition pipeline.
    chunking_options = (
        ("--chunk_length_s", "Chunk length in seconds. Defaults to None. For long audio files a good value would be 5.0 seconds."),
        ("--stride_length_s", "Stride of the audio chunks. Defaults to None. For long audio files a good value would be 1.0 seconds."),
    )
    for flag, description in chunking_options:
        cli.add_argument(flag, type=float, default=None, help=description)

    # Boolean switch for the per-example prediction/target logs.
    cli.add_argument("--log_outputs", action='store_true', help="If defined, write outputs to log file for analysis.")

    args = cli.parse_args()

    main(args)
language_model/5gram.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c803936922612f71cf0abdb37763c18d24624e36bfa4abac20187cc17b88541d
3
+ size 1981380707
language_model/attrs.json ADDED
@@ -0,0 +1 @@
 
1
+ {"alpha": 0.5, "beta": 1.5, "unk_score_offset": -10.0, "score_boundary": true}
language_model/unigrams.txt ADDED
The diff for this file is too large to render. See raw diff
preprocessor_config.json CHANGED
@@ -4,6 +4,7 @@
4
  "feature_size": 1,
5
  "padding_side": "right",
6
  "padding_value": 0,
 
7
  "return_attention_mask": true,
8
  "sampling_rate": 16000
9
  }
4
  "feature_size": 1,
5
  "padding_side": "right",
6
  "padding_value": 0,
7
+ "processor_class": "Wav2Vec2ProcessorWithLM",
8
  "return_attention_mask": true,
9
  "sampling_rate": 16000
10
  }
special_tokens_map.json CHANGED
@@ -1 +1 @@
1
- {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "special_tokens_map_file": null, "tokenizer_file": null, "name_or_path": "./", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
1
+ {"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "special_tokens_map_file": null, "tokenizer_file": null, "name_or_path": "hf-test/xls-r-300m-sv", "tokenizer_class": "Wav2Vec2CTCTokenizer", "processor_class": "Wav2Vec2ProcessorWithLM"}
wandb/run-20220127_121247-o8za41vn/files/config.yaml CHANGED
@@ -4832,6 +4832,16 @@ _wandb:
4832
  - 5
4833
  - 11
4834
  - 12
 
 
 
 
 
 
 
 
 
 
4835
  4: 3.8.12
4836
  5: 0.12.1
4837
  6: 4.16.0.dev0
4832
  - 5
4833
  - 11
4834
  - 12
4835
+ 2:
4836
+ - 1
4837
+ - 2
4838
+ - 3
4839
+ - 5
4840
+ - 11
4841
+ - 12
4842
+ 3:
4843
+ - 1
4844
+ - 7
4845
  4: 3.8.12
4846
  5: 0.12.1
4847
  6: 4.16.0.dev0
wandb/run-20220127_121247-o8za41vn/files/output.log CHANGED
@@ -14028,3 +14028,19 @@ Upload file runs/Jan27_12-08-15_brutasse/events.out.tfevents.1643285566.brutasse
14028
  Upload file runs/Jan27_12-08-15_brutasse/events.out.tfevents.1643285566.brutasse.15970.0: 73%|███████████████████████████████████████████████▉ | 32.0k/44.1k [00:00<?, ?B/s]
14029
  01/27/2022 20:35:38 - WARNING - huggingface_hub.repository - To https://huggingface.co/hf-test/xls-r-300m-sv-cv8
14030
  Upload file wandb/run-20220127_121247-o8za41vn/run-o8za41vn.wandb: 100%|███████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
14028
  Upload file runs/Jan27_12-08-15_brutasse/events.out.tfevents.1643285566.brutasse.15970.0: 73%|███████████████████████████████████████████████▉ | 32.0k/44.1k [00:00<?, ?B/s]
14029
  01/27/2022 20:35:38 - WARNING - huggingface_hub.repository - To https://huggingface.co/hf-test/xls-r-300m-sv-cv8
14030
  Upload file wandb/run-20220127_121247-o8za41vn/run-o8za41vn.wandb: 100%|███████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14031
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14032
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14033
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14034
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14035
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14036
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14037
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14038
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14039
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14040
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14041
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14042
+ 01/27/2022 20:36:03 - WARNING - huggingface_hub.repository - To https://huggingface.co/hf-test/xls-r-300m-sv-cv8
14043
+ 2b65b1d..753fa5f main -> main
14044
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████���███████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14045
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
14046
+ Dropping the following result as it does not have all the necessary fields:████████████████████████████████████████████████████████████████████████████████| 118M/118M [04:02<00:00, 47.9kB/s]
wandb/run-20220127_121247-o8za41vn/files/wandb-summary.json CHANGED
The diff for this file is too large to render. See raw diff
wandb/run-20220127_121247-o8za41vn/logs/debug-internal.log CHANGED
@@ -20965,3 +20965,134 @@
20965
  2022-01-27 20:35:39,608 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20966
  2022-01-27 20:35:40,609 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20967
  2022-01-27 20:35:41,610 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20965
  2022-01-27 20:35:39,608 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20966
  2022-01-27 20:35:40,609 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20967
  2022-01-27 20:35:41,610 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20968
+ 2022-01-27 20:35:43,610 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20969
+ 2022-01-27 20:35:47,251 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: stop_status
20970
+ 2022-01-27 20:35:47,251 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: stop_status
20971
+ 2022-01-27 20:35:47,611 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20972
+ 2022-01-27 20:35:49,612 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20973
+ 2022-01-27 20:35:51,613 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20974
+ 2022-01-27 20:35:53,614 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20975
+ 2022-01-27 20:35:55,614 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20976
+ 2022-01-27 20:35:57,615 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20977
+ 2022-01-27 20:35:59,616 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20978
+ 2022-01-27 20:36:01,616 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20979
+ 2022-01-27 20:36:02,341 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: stop_status
20980
+ 2022-01-27 20:36:02,341 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: stop_status
20981
+ 2022-01-27 20:36:03,617 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20982
+ 2022-01-27 20:36:04,618 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20983
+ 2022-01-27 20:36:05,619 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20984
+ 2022-01-27 20:36:07,620 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
20985
+ 2022-01-27 20:36:07,710 DEBUG SenderThread:16113 [sender.py:send():182] send: stats
20986
+ 2022-01-27 20:36:09,482 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
20987
+ 2022-01-27 20:36:09,482 DEBUG SenderThread:16113 [sender.py:send():182] send: telemetry
20988
+ 2022-01-27 20:36:09,482 DEBUG SenderThread:16113 [sender.py:send():182] send: exit
20989
+ 2022-01-27 20:36:09,482 INFO SenderThread:16113 [sender.py:send_exit():291] handling exit code: 0
20990
+ 2022-01-27 20:36:09,483 INFO SenderThread:16113 [sender.py:send_exit():293] handling runtime: 30201
20991
+ 2022-01-27 20:36:09,500 INFO SenderThread:16113 [sender.py:_save_file():873] saving file wandb-summary.json with policy end
20992
+ 2022-01-27 20:36:09,500 INFO SenderThread:16113 [sender.py:send_exit():303] send defer
20993
+ 2022-01-27 20:36:09,500 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
20994
+ 2022-01-27 20:36:09,500 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: defer
20995
+ 2022-01-27 20:36:09,501 INFO HandlerThread:16113 [handler.py:handle_request_defer():143] handle defer: 0
20996
+ 2022-01-27 20:36:09,501 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: defer
20997
+ 2022-01-27 20:36:09,501 INFO SenderThread:16113 [sender.py:send_request_defer():312] handle sender defer: 0
20998
+ 2022-01-27 20:36:09,501 INFO SenderThread:16113 [sender.py:transition_state():316] send defer: 1
20999
+ 2022-01-27 20:36:09,501 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: defer
21000
+ 2022-01-27 20:36:09,501 INFO HandlerThread:16113 [handler.py:handle_request_defer():143] handle defer: 1
21001
+ 2022-01-27 20:36:09,531 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: defer
21002
+ 2022-01-27 20:36:09,532 INFO SenderThread:16113 [sender.py:send_request_defer():312] handle sender defer: 1
21003
+ 2022-01-27 20:36:09,532 INFO SenderThread:16113 [sender.py:transition_state():316] send defer: 2
21004
+ 2022-01-27 20:36:09,532 DEBUG SenderThread:16113 [sender.py:send():182] send: stats
21005
+ 2022-01-27 20:36:09,532 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: defer
21006
+ 2022-01-27 20:36:09,532 INFO HandlerThread:16113 [handler.py:handle_request_defer():143] handle defer: 2
21007
+ 2022-01-27 20:36:09,533 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: defer
21008
+ 2022-01-27 20:36:09,533 INFO SenderThread:16113 [sender.py:send_request_defer():312] handle sender defer: 2
21009
+ 2022-01-27 20:36:09,533 INFO SenderThread:16113 [sender.py:transition_state():316] send defer: 3
21010
+ 2022-01-27 20:36:09,533 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: defer
21011
+ 2022-01-27 20:36:09,533 INFO HandlerThread:16113 [handler.py:handle_request_defer():143] handle defer: 3
21012
+ 2022-01-27 20:36:09,552 DEBUG SenderThread:16113 [sender.py:send():182] send: summary
21013
+ 2022-01-27 20:36:09,581 INFO SenderThread:16113 [sender.py:_save_file():873] saving file wandb-summary.json with policy end
21014
+ 2022-01-27 20:36:09,581 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: defer
21015
+ 2022-01-27 20:36:09,581 INFO SenderThread:16113 [sender.py:send_request_defer():312] handle sender defer: 3
21016
+ 2022-01-27 20:36:09,581 INFO SenderThread:16113 [sender.py:transition_state():316] send defer: 4
21017
+ 2022-01-27 20:36:09,581 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: defer
21018
+ 2022-01-27 20:36:09,582 INFO HandlerThread:16113 [handler.py:handle_request_defer():143] handle defer: 4
21019
+ 2022-01-27 20:36:09,582 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: defer
21020
+ 2022-01-27 20:36:09,582 INFO SenderThread:16113 [sender.py:send_request_defer():312] handle sender defer: 4
21021
+ 2022-01-27 20:36:09,601 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
21022
+ 2022-01-27 20:36:09,622 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/wandb-summary.json
21023
+ 2022-01-27 20:36:09,622 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
21024
+ 2022-01-27 20:36:10,036 INFO SenderThread:16113 [sender.py:transition_state():316] send defer: 5
21025
+ 2022-01-27 20:36:10,036 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
21026
+ 2022-01-27 20:36:10,037 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: defer
21027
+ 2022-01-27 20:36:10,037 INFO HandlerThread:16113 [handler.py:handle_request_defer():143] handle defer: 5
21028
+ 2022-01-27 20:36:10,037 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: defer
21029
+ 2022-01-27 20:36:10,037 INFO SenderThread:16113 [sender.py:send_request_defer():312] handle sender defer: 5
21030
+ 2022-01-27 20:36:10,037 INFO SenderThread:16113 [dir_watcher.py:finish():283] shutting down directory watcher
21031
+ 2022-01-27 20:36:10,138 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
21032
+ 2022-01-27 20:36:10,622 INFO Thread-8 :16113 [dir_watcher.py:_on_file_modified():230] file/dir modified: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/config.yaml
21033
+ 2022-01-27 20:36:10,623 INFO SenderThread:16113 [dir_watcher.py:finish():313] scan: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files
21034
+ 2022-01-27 20:36:10,623 INFO SenderThread:16113 [dir_watcher.py:finish():327] scan save: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/config.yaml config.yaml
21035
+ 2022-01-27 20:36:10,623 INFO SenderThread:16113 [dir_watcher.py:finish():327] scan save: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/conda-environment.yaml conda-environment.yaml
21036
+ 2022-01-27 20:36:10,623 INFO SenderThread:16113 [dir_watcher.py:finish():327] scan save: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log output.log
21037
+ 2022-01-27 20:36:10,623 INFO SenderThread:16113 [dir_watcher.py:finish():327] scan save: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/wandb-metadata.json wandb-metadata.json
21038
+ 2022-01-27 20:36:10,623 INFO SenderThread:16113 [dir_watcher.py:finish():327] scan save: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/wandb-summary.json wandb-summary.json
21039
+ 2022-01-27 20:36:10,624 INFO SenderThread:16113 [dir_watcher.py:finish():327] scan save: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/requirements.txt requirements.txt
21040
+ 2022-01-27 20:36:10,624 INFO SenderThread:16113 [sender.py:transition_state():316] send defer: 6
21041
+ 2022-01-27 20:36:10,627 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
21042
+ 2022-01-27 20:36:10,630 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: defer
21043
+ 2022-01-27 20:36:10,630 INFO HandlerThread:16113 [handler.py:handle_request_defer():143] handle defer: 6
21044
+ 2022-01-27 20:36:10,631 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: defer
21045
+ 2022-01-27 20:36:10,631 INFO SenderThread:16113 [sender.py:send_request_defer():312] handle sender defer: 6
21046
+ 2022-01-27 20:36:10,631 INFO SenderThread:16113 [file_pusher.py:finish():177] shutting down file pusher
21047
+ 2022-01-27 20:36:10,728 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
21048
+ 2022-01-27 20:36:10,728 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
21049
+ 2022-01-27 20:36:10,829 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
21050
+ 2022-01-27 20:36:10,830 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
21051
+ 2022-01-27 20:36:10,931 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
21052
+ 2022-01-27 20:36:10,931 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
21053
+ 2022-01-27 20:36:11,018 INFO Thread-12 :16113 [upload_job.py:push():137] Uploaded file /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/config.yaml
21054
+ 2022-01-27 20:36:11,032 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
21055
+ 2022-01-27 20:36:11,032 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
21056
+ 2022-01-27 20:36:11,099 INFO Thread-16 :16113 [upload_job.py:push():137] Uploaded file /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/requirements.txt
21057
+ 2022-01-27 20:36:11,134 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
21058
+ 2022-01-27 20:36:11,134 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
21059
+ 2022-01-27 20:36:11,166 INFO Thread-15 :16113 [upload_job.py:push():137] Uploaded file /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/wandb-summary.json
21060
+ 2022-01-27 20:36:11,236 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
21061
+ 2022-01-27 20:36:11,236 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
21062
+ 2022-01-27 20:36:11,278 INFO Thread-13 :16113 [upload_job.py:push():137] Uploaded file /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/conda-environment.yaml
21063
+ 2022-01-27 20:36:11,289 INFO Thread-14 :16113 [upload_job.py:push():137] Uploaded file /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/files/output.log
21064
+ 2022-01-27 20:36:11,338 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
21065
+ 2022-01-27 20:36:11,338 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
21066
+ 2022-01-27 20:36:11,440 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
21067
+ 2022-01-27 20:36:11,440 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
21068
+ 2022-01-27 20:36:11,490 INFO Thread-7 :16113 [sender.py:transition_state():316] send defer: 7
21069
+ 2022-01-27 20:36:11,491 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: defer
21070
+ 2022-01-27 20:36:11,491 INFO HandlerThread:16113 [handler.py:handle_request_defer():143] handle defer: 7
21071
+ 2022-01-27 20:36:11,491 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: defer
21072
+ 2022-01-27 20:36:11,491 INFO SenderThread:16113 [sender.py:send_request_defer():312] handle sender defer: 7
21073
+ 2022-01-27 20:36:11,542 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
21074
+ 2022-01-27 20:36:12,157 INFO SenderThread:16113 [sender.py:transition_state():316] send defer: 8
21075
+ 2022-01-27 20:36:12,157 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
21076
+ 2022-01-27 20:36:12,158 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: defer
21077
+ 2022-01-27 20:36:12,158 INFO HandlerThread:16113 [handler.py:handle_request_defer():143] handle defer: 8
21078
+ 2022-01-27 20:36:12,158 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: defer
21079
+ 2022-01-27 20:36:12,158 INFO SenderThread:16113 [sender.py:send_request_defer():312] handle sender defer: 8
21080
+ 2022-01-27 20:36:12,158 INFO SenderThread:16113 [sender.py:transition_state():316] send defer: 9
21081
+ 2022-01-27 20:36:12,159 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: defer
21082
+ 2022-01-27 20:36:12,159 DEBUG SenderThread:16113 [sender.py:send():182] send: final
21083
+ 2022-01-27 20:36:12,159 INFO HandlerThread:16113 [handler.py:handle_request_defer():143] handle defer: 9
21084
+ 2022-01-27 20:36:12,159 DEBUG SenderThread:16113 [sender.py:send():182] send: footer
21085
+ 2022-01-27 20:36:12,160 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: defer
21086
+ 2022-01-27 20:36:12,160 INFO SenderThread:16113 [sender.py:send_request_defer():312] handle sender defer: 9
21087
+ 2022-01-27 20:36:12,259 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: poll_exit
21088
+ 2022-01-27 20:36:12,260 DEBUG SenderThread:16113 [sender.py:send_request():196] send_request: poll_exit
21089
+ 2022-01-27 20:36:12,260 INFO SenderThread:16113 [file_pusher.py:join():182] waiting for file pusher
21090
+ 2022-01-27 20:36:12,261 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: get_summary
21091
+ 2022-01-27 20:36:12,302 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: sampled_history
21092
+ 2022-01-27 20:36:12,304 DEBUG HandlerThread:16113 [handler.py:handle_request():126] handle_request: shutdown
21093
+ 2022-01-27 20:36:12,304 INFO HandlerThread:16113 [handler.py:finish():683] shutting down handler
21094
+ 2022-01-27 20:36:13,159 INFO WriterThread:16113 [datastore.py:close():281] close: /home/patrick/experiments/xls-r-300m-sv-cv8/wandb/run-20220127_121247-o8za41vn/run-o8za41vn.wandb
21095
+ 2022-01-27 20:36:13,260 INFO SenderThread:16113 [sender.py:finish():979] shutting down sender
21096
+ 2022-01-27 20:36:13,260 INFO SenderThread:16113 [file_pusher.py:finish():177] shutting down file pusher
21097
+ 2022-01-27 20:36:13,260 INFO SenderThread:16113 [file_pusher.py:join():182] waiting for file pusher
21098
+ 2022-01-27 20:36:13,288 INFO MainThread:16113 [internal.py:handle_exit():76] Internal process exited
wandb/run-20220127_121247-o8za41vn/logs/debug.log CHANGED
@@ -23,3 +23,115 @@ config: {}
23
  2022-01-27 12:12:53,089 INFO MainThread:15970 [wandb_init.py:init():565] run started, returning control to user process
24
  2022-01-27 12:12:53,091 INFO MainThread:15970 [wandb_run.py:_config_callback():843] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 34, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-300m', 'transformers_version': '4.16.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1024, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 24, 'intermediate_size': 4096, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'activation_dropout': 0.1, 
'feat_proj_dropout': 0.0, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 37, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.75, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.25, 'mask_feature_length': 64, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 768, 'proj_codevector_dim': 768, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1024, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 4, 'eval_accumulation_steps': 'None', 'learning_rate': 7.5e-05, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 50.0, 'max_steps': -1, 'lr_scheduler_type': 'linear', 'warmup_ratio': 0.0, 'warmup_steps': 2000, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './runs/Jan27_12-08-15_brutasse', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 100, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 500, 'save_total_limit': 3, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 
'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 500, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': './', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['tensorboard', 'wandb', 'codecarbon']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 8, 'eval_batch_size': 8}
25
  2022-01-27 12:12:53,094 INFO MainThread:15970 [wandb_watch.py:watch():43] Watching
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
23
  2022-01-27 12:12:53,089 INFO MainThread:15970 [wandb_init.py:init():565] run started, returning control to user process
24
  2022-01-27 12:12:53,091 INFO MainThread:15970 [wandb_run.py:_config_callback():843] config_cb None None {'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'chunk_size_feed_forward': 0, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'architectures': ['Wav2Vec2ForPreTraining'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 34, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/wav2vec2-xls-r-300m', 'transformers_version': '4.16.0.dev0', 'feat_extract_dropout': 0.0, 'model_type': 'wav2vec2', 'num_feat_extract_layers': 7, 'hidden_size': 1024, 'feat_extract_norm': 'layer', 'feat_extract_activation': 'gelu', 'conv_dim': [512, 512, 512, 512, 512, 512, 512], 'conv_stride': [5, 2, 2, 2, 2, 2, 2], 'conv_kernel': [10, 3, 3, 3, 3, 2, 2], 'conv_bias': True, 'num_conv_pos_embeddings': 128, 'num_conv_pos_embedding_groups': 16, 'num_hidden_layers': 24, 'intermediate_size': 4096, 'hidden_act': 'gelu', 'num_attention_heads': 16, 'hidden_dropout': 0.0, 'attention_dropout': 0.0, 'activation_dropout': 0.1, 
'feat_proj_dropout': 0.0, 'final_dropout': 0.0, 'layerdrop': 0.0, 'layer_norm_eps': 1e-05, 'initializer_range': 0.02, 'vocab_size': 37, 'do_stable_layer_norm': True, 'use_weighted_layer_sum': False, 'apply_spec_augment': True, 'mask_time_prob': 0.75, 'mask_time_length': 10, 'mask_time_min_masks': 2, 'mask_feature_prob': 0.25, 'mask_feature_length': 64, 'mask_feature_min_masks': 0, 'num_codevectors_per_group': 320, 'num_codevector_groups': 2, 'contrastive_logits_temperature': 0.1, 'feat_quantizer_dropout': 0.0, 'num_negatives': 100, 'codevector_dim': 768, 'proj_codevector_dim': 768, 'diversity_loss_weight': 0.1, 'ctc_loss_reduction': 'mean', 'ctc_zero_infinity': False, 'add_adapter': False, 'adapter_kernel_size': 3, 'adapter_stride': 2, 'num_adapter_layers': 3, 'output_hidden_size': 1024, 'classifier_proj_size': 256, 'tdnn_dim': [512, 512, 512, 512, 1500], 'tdnn_kernel': [5, 3, 3, 1, 1], 'tdnn_dilation': [1, 2, 3, 1, 1], 'xvector_output_dim': 512, 'output_dir': './', 'overwrite_output_dir': True, 'do_train': True, 'do_eval': True, 'do_predict': False, 'evaluation_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': 'None', 'per_gpu_eval_batch_size': 'None', 'gradient_accumulation_steps': 4, 'eval_accumulation_steps': 'None', 'learning_rate': 7.5e-05, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 50.0, 'max_steps': -1, 'lr_scheduler_type': 'linear', 'warmup_ratio': 0.0, 'warmup_steps': 2000, 'log_level': -1, 'log_level_replica': -1, 'log_on_each_node': True, 'logging_dir': './runs/Jan27_12-08-15_brutasse', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 100, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 500, 'save_total_limit': 3, 'save_on_each_node': False, 'no_cuda': False, 'seed': 42, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 
'half_precision_backend': 'amp', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': 'None', 'local_rank': -1, 'xpu_backend': 'None', 'tpu_num_cores': 'None', 'tpu_metrics_debug': False, 'debug': '[]', 'dataloader_drop_last': False, 'eval_steps': 500, 'dataloader_num_workers': 0, 'past_index': -1, 'run_name': './', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': 'None', 'load_best_model_at_end': False, 'metric_for_best_model': 'None', 'greater_is_better': 'None', 'ignore_data_skip': False, 'sharded_ddp': '[]', 'deepspeed': 'None', 'label_smoothing_factor': 0.0, 'optim': 'adamw_hf', 'adafactor': False, 'group_by_length': True, 'length_column_name': 'input_length', 'report_to': "['tensorboard', 'wandb', 'codecarbon']", 'ddp_find_unused_parameters': 'None', 'ddp_bucket_cap_mb': 'None', 'dataloader_pin_memory': True, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': 'None', 'hub_model_id': 'None', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'gradient_checkpointing': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': 'None', 'push_to_hub_organization': 'None', 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', '_n_gpu': 1, 'mp_parameters': '', 'train_batch_size': 8, 'eval_batch_size': 8}
25
  2022-01-27 12:12:53,094 INFO MainThread:15970 [wandb_watch.py:watch():43] Watching
26
+ 2022-01-27 20:36:06,837 INFO MainThread:15970 [wandb_run.py:_atexit_cleanup():1571] got exitcode: 0
27
+ 2022-01-27 20:36:06,838 INFO MainThread:15970 [wandb_run.py:_restore():1543] restore
28
+ 2022-01-27 20:36:09,501 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: file_counts {
29
+ wandb_count: 1
30
+ }
31
+ pusher_stats {
32
+ uploaded_bytes: 2244
33
+ total_bytes: 2244
34
+ }
35
+
36
+ 2022-01-27 20:36:10,037 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: file_counts {
37
+ wandb_count: 1
38
+ }
39
+ pusher_stats {
40
+ uploaded_bytes: 2244
41
+ total_bytes: 2244
42
+ }
43
+
44
+ 2022-01-27 20:36:10,627 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: file_counts {
45
+ wandb_count: 6
46
+ }
47
+ pusher_stats {
48
+ uploaded_bytes: 2244
49
+ total_bytes: 2750979
50
+ }
51
+
52
+ 2022-01-27 20:36:10,729 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: file_counts {
53
+ wandb_count: 6
54
+ }
55
+ pusher_stats {
56
+ uploaded_bytes: 2244
57
+ total_bytes: 2750979
58
+ }
59
+
60
+ 2022-01-27 20:36:10,830 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: file_counts {
61
+ wandb_count: 6
62
+ }
63
+ pusher_stats {
64
+ uploaded_bytes: 515593
65
+ total_bytes: 2750979
66
+ }
67
+
68
+ 2022-01-27 20:36:10,931 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: file_counts {
69
+ wandb_count: 6
70
+ }
71
+ pusher_stats {
72
+ uploaded_bytes: 1897531
73
+ total_bytes: 2750979
74
+ }
75
+
76
+ 2022-01-27 20:36:11,033 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: file_counts {
77
+ wandb_count: 6
78
+ }
79
+ pusher_stats {
80
+ uploaded_bytes: 2750979
81
+ total_bytes: 2750979
82
+ }
83
+
84
+ 2022-01-27 20:36:11,135 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: file_counts {
85
+ wandb_count: 6
86
+ }
87
+ pusher_stats {
88
+ uploaded_bytes: 2750979
89
+ total_bytes: 2750979
90
+ }
91
+
92
+ 2022-01-27 20:36:11,237 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: file_counts {
93
+ wandb_count: 6
94
+ }
95
+ pusher_stats {
96
+ uploaded_bytes: 2750979
97
+ total_bytes: 2750979
98
+ }
99
+
100
+ 2022-01-27 20:36:11,339 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: file_counts {
101
+ wandb_count: 6
102
+ }
103
+ pusher_stats {
104
+ uploaded_bytes: 2750979
105
+ total_bytes: 2750979
106
+ }
107
+
108
+ 2022-01-27 20:36:11,441 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: file_counts {
109
+ wandb_count: 6
110
+ }
111
+ pusher_stats {
112
+ uploaded_bytes: 2750979
113
+ total_bytes: 2750979
114
+ }
115
+
116
+ 2022-01-27 20:36:12,158 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: file_counts {
117
+ wandb_count: 6
118
+ }
119
+ pusher_stats {
120
+ uploaded_bytes: 2750979
121
+ total_bytes: 2750979
122
+ }
123
+
124
+ 2022-01-27 20:36:12,260 INFO MainThread:15970 [wandb_run.py:_wait_for_finish():1693] got exit ret: done: true
125
+ exit_result {
126
+ }
127
+ file_counts {
128
+ wandb_count: 6
129
+ }
130
+ pusher_stats {
131
+ uploaded_bytes: 2750979
132
+ total_bytes: 2750979
133
+ }
134
+
135
+ 2022-01-27 20:36:13,565 INFO MainThread:15970 [wandb_run.py:_show_summary():1848] rendering summary
136
+ 2022-01-27 20:36:13,566 INFO MainThread:15970 [wandb_run.py:_show_history():1886] rendering history
137
+ 2022-01-27 20:36:13,567 INFO MainThread:15970 [wandb_run.py:_show_files():1915] logging synced files
wandb/run-20220127_121247-o8za41vn/run-o8za41vn.wandb CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2ad3076251c2c4cd4f61ecf05112073f1f8cf21f6835657c4067761890ecc41
3
- size 123820895
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c2cd3e0df32b837b9614d7a7668306733e2fb1b905ddb0f5e3df297dea4ff84
3
+ size 124498930