diff --git "a/wandb/run-20220127_103723-scy0vyln/files/config.yaml" "b/wandb/run-20220127_103723-scy0vyln/files/config.yaml" deleted file mode 100644--- "a/wandb/run-20220127_103723-scy0vyln/files/config.yaml" +++ /dev/null @@ -1,5476 +0,0 @@ -wandb_version: 1 - -_n_gpu: - desc: null - value: 1 -_name_or_path: - desc: null - value: KBLab/wav2vec2-large-voxrex -_wandb: - desc: null - value: - cli_version: 0.12.9 - framework: huggingface - huggingface_version: 4.16.0.dev0 - is_jupyter_run: false - is_kaggle_kernel: false - m: - - 1: train/global_step - 6: - - 3 - - 1: gradients/lm_head\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/lm_head\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/lm_head\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/lm_head\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/lm_head\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/lm_head\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.23\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.22\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.21\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.20\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.19\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.18\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.17\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.16\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.15\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.14\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.13\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.12\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.11\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.10\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.9\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.8\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.7\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.6\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.5\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.4\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.3\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.2\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.1\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.feed_forward\.output_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.feed_forward\.output_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.feed_forward\.output_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.feed_forward\.output_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.feed_forward\.output_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.feed_forward\.output_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.feed_forward\.intermediate_dense\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.feed_forward\.intermediate_dense\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.feed_forward\.intermediate_dense\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.feed_forward\.intermediate_dense\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.feed_forward\.intermediate_dense\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.feed_forward\.intermediate_dense\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.final_layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.final_layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.final_layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.final_layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.final_layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.final_layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.out_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.out_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.out_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.out_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.out_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.out_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.v_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.v_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.v_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.v_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.v_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.v_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.k_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.k_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.k_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.k_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.k_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.k_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.q_proj\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.q_proj\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.q_proj\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.q_proj\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.q_proj\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.attention\.q_proj\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.layers\.0\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.pos_conv_embed\.conv\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.pos_conv_embed\.conv\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.pos_conv_embed\.conv\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.pos_conv_embed\.conv\.weight_v._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.pos_conv_embed\.conv\.weight_v.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.pos_conv_embed\.conv\.weight_v.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.pos_conv_embed\.conv\.weight_g._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.pos_conv_embed\.conv\.weight_g.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.encoder\.pos_conv_embed\.conv\.weight_g.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.masked_spec_embed._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.masked_spec_embed.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.masked_spec_embed.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.feature_projection\.projection\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.feature_projection\.projection\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.feature_projection\.projection\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.feature_projection\.projection\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.feature_projection\.projection\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.feature_projection\.projection\.bias.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.feature_projection\.layer_norm\.weight._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.feature_projection\.layer_norm\.weight.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.feature_projection\.layer_norm\.weight.bins - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.feature_projection\.layer_norm\.bias._type - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.feature_projection\.layer_norm\.bias.values - 5: 1 - 6: - - 1 - - 1: gradients/wav2vec2\.feature_projection\.layer_norm\.bias.bins - 5: 1 - 6: - - 1 - - 1: train/loss - 5: 1 - 6: - - 1 - - 1: train/learning_rate - 5: 1 - 6: - - 1 - - 1: train/epoch - 5: 1 - 6: - - 1 - - 1: eval/loss - 5: 1 - 6: - - 1 - - 1: eval/wer - 5: 1 - 6: - - 1 - - 1: eval/runtime - 5: 1 - 6: - - 1 - - 1: eval/samples_per_second - 5: 1 - 6: - - 1 - - 1: eval/steps_per_second - 5: 1 - 6: - - 1 - - 1: train/train_runtime - 5: 1 - 6: - - 1 - - 1: train/train_samples_per_second - 5: 1 - 6: - - 1 - - 1: train/train_steps_per_second - 5: 1 - 6: - - 1 - - 1: train/total_flos - 5: 1 - 6: - - 1 - - 1: train/train_loss - 5: 1 - 6: - - 1 - python_version: 3.8.8 - start_time: 1643279843 - t: - 1: - - 1 - - 5 - - 11 - 3: - - 13 - 4: 3.8.8 - 5: 0.12.9 - 6: 4.16.0.dev0 - 8: - - 5 -activation_dropout: - desc: null - value: 0.1 -adafactor: - desc: null - value: false -adam_beta1: - desc: null - value: 0.9 -adam_beta2: - desc: null - value: 0.999 -adam_epsilon: - desc: null - value: 1.0e-08 -adapter_kernel_size: - desc: null - value: 3 -adapter_stride: - desc: null - value: 2 -add_adapter: - desc: null - value: false -add_cross_attention: - desc: null - value: false -apply_spec_augment: - desc: null - value: true -architectures: - desc: null - value: - - Wav2Vec2ForPreTraining -attention_dropout: - desc: null - value: 0.0 -bad_words_ids: - desc: null - value: null -bf16: - desc: null - value: false -bf16_full_eval: - desc: null - value: false -bos_token_id: - desc: null - value: 1 -chunk_size_feed_forward: - desc: null - value: 0 -classifier_proj_size: - desc: null - value: 256 -codevector_dim: - desc: null - value: 768 -contrastive_logits_temperature: - desc: null - value: 0.1 -conv_bias: - desc: null - value: true -conv_dim: - desc: null - value: - - 512 - - 512 - - 512 - - 512 - - 512 - - 512 - - 512 -conv_kernel: - desc: null - value: - - 10 - - 3 - - 3 - - 3 - - 3 - - 2 - - 2 -conv_stride: - desc: null - value: - - 5 - - 2 - - 2 - - 2 - - 2 - - 2 - - 2 -cross_attention_hidden_size: - desc: null - value: null -ctc_loss_reduction: - desc: null - value: mean -ctc_zero_infinity: - desc: null - value: false -dataloader_drop_last: - desc: null - value: false -dataloader_num_workers: - desc: null - value: 0 -dataloader_pin_memory: - desc: null - value: true -ddp_bucket_cap_mb: - desc: null - value: None -ddp_find_unused_parameters: - desc: null - value: None -debug: - desc: null - value: '[]' -decoder_start_token_id: - desc: null - value: null -deepspeed: - desc: null - value: None -disable_tqdm: - desc: null - value: false -diversity_loss_weight: - desc: null - value: 0.1 -diversity_penalty: - desc: null - value: 0.0 -do_eval: - desc: null - value: true -do_predict: - desc: null - value: false -do_sample: - desc: null - value: false -do_stable_layer_norm: - desc: null - value: true -do_train: - desc: null - value: true -early_stopping: - desc: null - value: false -encoder_no_repeat_ngram_size: - desc: null - value: 0 -eos_token_id: - desc: null - value: 2 -eval_accumulation_steps: - desc: null - value: None -eval_batch_size: - desc: null - value: 8 -eval_steps: - desc: null - value: 500 -evaluation_strategy: - desc: null - value: steps -feat_extract_activation: - desc: null - value: gelu -feat_extract_dropout: - desc: null - value: 0.0 -feat_extract_norm: - desc: null - value: layer -feat_proj_dropout: - desc: null - value: 0.0 -feat_quantizer_dropout: - desc: null - value: 0.0 -final_dropout: - desc: null - value: 0.0 -finetuning_task: - desc: null - value: null -forced_bos_token_id: - desc: null - value: null -forced_eos_token_id: - desc: null - value: null -fp16: - desc: null - value: true -fp16_backend: - desc: null - value: auto -fp16_full_eval: - desc: null - value: false -fp16_opt_level: - desc: null - value: O1 -gradient_accumulation_steps: - desc: null - value: 4 -gradient_checkpointing: - desc: null - value: true -greater_is_better: - desc: null - value: None -group_by_length: - desc: null - value: true -half_precision_backend: - desc: null - value: amp -hidden_act: - desc: null - value: gelu -hidden_dropout: - desc: null - value: 0.0 -hidden_size: - desc: null - value: 1024 -hub_model_id: - desc: null - value: None -hub_strategy: - desc: null - value: every_save -hub_token: - desc: null - value: -id2label: - desc: null - value: - '0': LABEL_0 - '1': LABEL_1 -ignore_data_skip: - desc: null - value: false -initializer_range: - desc: null - value: 0.02 -intermediate_size: - desc: null - value: 4096 -is_decoder: - desc: null - value: false -is_encoder_decoder: - desc: null - value: false -label2id: - desc: null - value: - LABEL_0: 0 - LABEL_1: 1 -label_names: - desc: null - value: None -label_smoothing_factor: - desc: null - value: 0.0 -layer_norm_eps: - desc: null - value: 1.0e-05 -layerdrop: - desc: null - value: 0.0 -learning_rate: - desc: null - value: 7.5e-05 -length_column_name: - desc: null - value: input_length -length_penalty: - desc: null - value: 1.0 -load_best_model_at_end: - desc: null - value: false -local_rank: - desc: null - value: -1 -log_level: - desc: null - value: -1 -log_level_replica: - desc: null - value: -1 -log_on_each_node: - desc: null - value: true -logging_dir: - desc: null - value: ./runs/Jan27_10-34-00_job-38746614-58de-4025-b727-ddb5a9d90aee -logging_first_step: - desc: null - value: false -logging_nan_inf_filter: - desc: null - value: true -logging_steps: - desc: null - value: 100 -logging_strategy: - desc: null - value: steps -lr_scheduler_type: - desc: null - value: linear -mask_channel_length: - desc: null - value: 10 -mask_channel_min_space: - desc: null - value: 1 -mask_channel_other: - desc: null - value: 0.0 -mask_channel_prob: - desc: null - value: 0.0 -mask_channel_selection: - desc: null - value: static -mask_feature_length: - desc: null - value: 64 -mask_feature_min_masks: - desc: null - value: 0 -mask_feature_prob: - desc: null - value: 0.25 -mask_time_length: - desc: null - value: 10 -mask_time_min_masks: - desc: null - value: 2 -mask_time_min_space: - desc: null - value: 1 -mask_time_other: - desc: null - value: 0.0 -mask_time_prob: - desc: null - value: 0.75 -mask_time_selection: - desc: null - value: static -max_grad_norm: - desc: null - value: 1.0 -max_length: - desc: null - value: 20 -max_steps: - desc: null - value: -1 -metric_for_best_model: - desc: null - value: None -min_length: - desc: null - value: 0 -model_type: - desc: null - value: wav2vec2 -mp_parameters: - desc: null - value: '' -no_cuda: - desc: null - value: false -no_repeat_ngram_size: - desc: null - value: 0 -num_adapter_layers: - desc: null - value: 3 -num_attention_heads: - desc: null - value: 16 -num_beam_groups: - desc: null - value: 1 -num_beams: - desc: null - value: 1 -num_codevector_groups: - desc: null - value: 2 -num_codevectors_per_group: - desc: null - value: 320 -num_conv_pos_embedding_groups: - desc: null - value: 16 -num_conv_pos_embeddings: - desc: null - value: 128 -num_feat_extract_layers: - desc: null - value: 7 -num_hidden_layers: - desc: null - value: 24 -num_negatives: - desc: null - value: 100 -num_return_sequences: - desc: null - value: 1 -num_train_epochs: - desc: null - value: 50.0 -optim: - desc: null - value: adamw_hf -output_attentions: - desc: null - value: false -output_dir: - desc: null - value: ./ -output_hidden_size: - desc: null - value: 1024 -output_hidden_states: - desc: null - value: false -output_scores: - desc: null - value: false -overwrite_output_dir: - desc: null - value: true -pad_token_id: - desc: null - value: 34 -past_index: - desc: null - value: -1 -per_device_eval_batch_size: - desc: null - value: 8 -per_device_train_batch_size: - desc: null - value: 8 -per_gpu_eval_batch_size: - desc: null - value: None -per_gpu_train_batch_size: - desc: null - value: None -prediction_loss_only: - desc: null - value: false -prefix: - desc: null - value: null -problem_type: - desc: null - value: null -proj_codevector_dim: - desc: null - value: 768 -pruned_heads: - desc: null - value: {} -push_to_hub: - desc: null - value: true -push_to_hub_model_id: - desc: null - value: None -push_to_hub_organization: - desc: null - value: None -push_to_hub_token: - desc: null - value: -remove_invalid_values: - desc: null - value: false -remove_unused_columns: - desc: null - value: true -repetition_penalty: - desc: null - value: 1.0 -report_to: - desc: null - value: '[''wandb'']' -resume_from_checkpoint: - desc: null - value: None -return_dict: - desc: null - value: true -return_dict_in_generate: - desc: null - value: false -run_name: - desc: null - value: '2022-01-27T10:34:01.114533' -save_on_each_node: - desc: null - value: false -save_steps: - desc: null - value: 500 -save_strategy: - desc: null - value: steps -save_total_limit: - desc: null - value: 3 -seed: - desc: null - value: 42 -sep_token_id: - desc: null - value: null -sharded_ddp: - desc: null - value: '[]' -skip_memory_metrics: - desc: null - value: true -task_specific_params: - desc: null - value: null -tdnn_dilation: - desc: null - value: - - 1 - - 2 - - 3 - - 1 - - 1 -tdnn_dim: - desc: null - value: - - 512 - - 512 - - 512 - - 512 - - 1500 -tdnn_kernel: - desc: null - value: - - 5 - - 3 - - 3 - - 1 - - 1 -temperature: - desc: null - value: 1.0 -tf32: - desc: null - value: None -tie_encoder_decoder: - desc: null - value: false -tie_word_embeddings: - desc: null - value: true -tokenizer_class: - desc: null - value: null -top_k: - desc: null - value: 50 -top_p: - desc: null - value: 1.0 -torch_dtype: - desc: null - value: null -torchscript: - desc: null - value: false -tpu_metrics_debug: - desc: null - value: false -tpu_num_cores: - desc: null - value: None -train_batch_size: - desc: null - value: 8 -transformers_version: - desc: null - value: 4.16.0.dev0 -use_bfloat16: - desc: null - value: false -use_legacy_prediction_loop: - desc: null - value: false -use_weighted_layer_sum: - desc: null - value: false -vocab_size: - desc: null - value: 37 -warmup_ratio: - desc: null - value: 0.0 -warmup_steps: - desc: null - value: 2000 -weight_decay: - desc: null - value: 0.0 -xpu_backend: - desc: null - value: None -xvector_output_dim: - desc: null - value: 512