{"train/decoder_grad_norm": 0.3170955181121826, "train/decoder_param_norm": 10.98730754852295, "train/encoder_grad_norm": 7.285628817044199e-05, "train/encoder_param_norm": 21.97297477722168, "train/grad_norm": 0.3170955181121826, "layer_grad_norm/": {"decoder": {"model": {"decoder": {"embed_positions": {"embedding": 0.16519849002361298}, "embed_tokens": {"embedding": 0.2683090269565582}, "layernorm_embedding": {"bias": 0.00845938641577959, "scale": 0.00517110014334321}, "layers": {"FlaxBartDecoderLayers": {"encoder_attn": {"k_proj": {"bias": 3.6778113649167665e-13, "kernel": 1.197263317133379e-12}, "out_proj": {"bias": 0.01301304530352354, "kernel": 6.306260183919221e-05}, "q_proj": {"bias": 9.55028374091671e-13, "kernel": 1.1253619564000061e-12}, "v_proj": {"bias": 0.0014304526848718524, "kernel": 5.171417342353379e-06}}, "encoder_attn_layer_norm": {"bias": 0.012739405035972595, "scale": 0.007039573043584824}, "fc1": {"bias": 0.0002723249781411141, "kernel": 0.0004740327422041446}, "fc2": {"bias": 0.013017209246754646, "kernel": 0.00048240856267511845}, "final_layer_norm": {"bias": 0.013769222423434258, "scale": 0.007471546996384859}, "self_attn": {"k_proj": {"bias": 1.7592640677577265e-09, "kernel": 4.8097604121721815e-06}, "out_proj": {"bias": 0.01252918504178524, "kernel": 0.001151563017629087}, "q_proj": {"bias": 1.753854803610011e-06, "kernel": 4.778269158123294e-06}, "v_proj": {"bias": 0.0009930545929819345, "kernel": 0.0011230409145355225}}, "self_attn_layer_norm": {"bias": 0.012738531455397606, "scale": 0.00703705009073019}}}}}}, "encoder": {"adapter": {"layers": {"0": {"conv": {"bias": 3.205414316198585e-07, "kernel": 1.4481754533335334e-06}}, "1": {"conv": {"bias": 4.1292250898550265e-06, "kernel": 1.6521905763511313e-06}}, "2": {"conv": {"bias": 7.260794518515468e-05, "kernel": 3.06191236632003e-06}}}}, "encoder": {"layer_norm": {"bias": 5.523256163542101e-08, "scale": 4.672925157933605e-08}, "layers": {"FlaxWav2Vec2EncoderLayers": {"attention": {"k_proj": {"bias": 2.0252214720506683e-15, "kernel": 2.2661324206030287e-10}, "out_proj": {"bias": 1.2527184480859432e-06, "kernel": 2.1728278909449728e-07}, "q_proj": {"bias": 1.0131199351670617e-10, "kernel": 2.5732815878143356e-10}, "v_proj": {"bias": 9.004332213180533e-08, "kernel": 2.0428340974376624e-07}}, "feed_forward": {"intermediate_dense": {"bias": 5.7502425931943435e-08, "kernel": 1.7381272243710555e-07}, "output_dense": {"bias": 1.2294220823605428e-06, "kernel": 1.8091645870299544e-07}}, "final_layer_norm": {"bias": 4.410487530748242e-09, "scale": 3.4101199641867197e-09}, "layer_norm": {"bias": 6.48679510106831e-09, "scale": 4.099019346170962e-09}}}, "pos_conv_embed": {"conv": {"bias": 4.5359942646427953e-07, "weight_g": 8.91475782083262e-09, "weight_v": 1.0556363605473962e-07}}}, "feature_extractor": {"conv_layers": {"0": {"conv": {"kernel": 0.0}, "layer_norm": {"bias": 0.0, "scale": 0.0}}, "1": {"conv": {"kernel": 0.0}, "layer_norm": {"bias": 0.0, "scale": 0.0}}, "2": {"conv": {"kernel": 0.0}, "layer_norm": {"bias": 0.0, "scale": 0.0}}}}, "feature_projection": {"layer_norm": {"bias": 8.599896261785034e-08, "scale": 1.2218480449632807e-08}, "projection": {"bias": 8.408756002609152e-07, "kernel": 7.672040283068782e-07}}, "masked_spec_embed": 0.0}}, "layer_param_norm/": {"decoder": {"model": {"decoder": {"embed_positions": {"embedding": 0.7995837926864624}, "embed_tokens": {"embedding": 2.508500337600708}, "layernorm_embedding": {"bias": 0.0043898290023207664, "scale": 4.000094890594482}, "layers": {"FlaxBartDecoderLayers": {"encoder_attn": {"k_proj": {"bias": 2.6323088153645813e-09, "kernel": 0.43237069249153137}, "out_proj": {"bias": 0.00618136627599597, "kernel": 0.4670513868331909}, "q_proj": {"bias": 3.326803366121567e-08, "kernel": 0.4763868451118469}, "v_proj": {"bias": 0.006634118035435677, "kernel": 0.46297508478164673}}, "encoder_attn_layer_norm": {"bias": 0.006301939021795988, "scale": 5.656976222991943}, "fc1": {"bias": 0.0031436358112841845, "kernel": 0.23027531802654266}, "fc2": {"bias": 0.006195463240146637, "kernel": 0.22851817309856415}, "final_layer_norm": {"bias": 0.00606531323865056, "scale": 5.657156944274902}, "self_attn": {"k_proj": {"bias": 1.3420313734968659e-05, "kernel": 0.44890034198760986}, "out_proj": {"bias": 0.006184814497828484, "kernel": 0.4596027135848999}, "q_proj": {"bias": 0.005368082784116268, "kernel": 0.4389948546886444}, "v_proj": {"bias": 0.005956699140369892, "kernel": 0.47396498918533325}}, "self_attn_layer_norm": {"bias": 0.006302110850811005, "scale": 5.656976222991943}}}}}}, "encoder": {"adapter": {"layers": {"0": {"conv": {"bias": 0.0037685695569962263, "kernel": 0.7979614734649658}}, "1": {"conv": {"bias": 0.004708290100097656, "kernel": 0.7824040055274963}}, "2": {"conv": {"bias": 0.004585933405905962, "kernel": 0.7934508323669434}}}}, "encoder": {"layer_norm": {"bias": 0.001405583810992539, "scale": 4.000487327575684}, "layers": {"FlaxWav2Vec2EncoderLayers": {"attention": {"k_proj": {"bias": 1.1651571374393654e-10, "kernel": 0.6511669158935547}, "out_proj": {"bias": 0.004394491668790579, "kernel": 0.6515659689903259}, "q_proj": {"bias": 9.028558451973367e-06, "kernel": 0.636457085609436}, "v_proj": {"bias": 0.0028231709729880095, "kernel": 0.6421379446983337}}, "feed_forward": {"intermediate_dense": {"bias": 0.0022689849138259888, "kernel": 0.7063419818878174}, "output_dense": {"bias": 0.004643301945179701, "kernel": 0.7153213620185852}}, "final_layer_norm": {"bias": 0.0003230707661714405, "scale": 7.999977111816406}, "layer_norm": {"bias": 0.0006301795365288854, "scale": 8.000048637390137}}}, "pos_conv_embed": {"conv": {"bias": 0.0019321668660268188, "weight_g": 2.2777063846588135, "weight_v": 2.2775826454162598}}}, "feature_extractor": {"conv_layers": {"0": {"conv": {"kernel": 7.867799758911133}, "layer_norm": {"bias": 0.0, "scale": 5.656854152679443}}, "1": {"conv": {"kernel": 8.025212287902832}, "layer_norm": {"bias": 0.0, "scale": 5.656854152679443}}, "2": {"conv": {"kernel": 7.975250720977783}, "layer_norm": {"bias": 0.0, "scale": 5.656854152679443}}}}, "feature_projection": {"layer_norm": {"bias": 0.0016006563091650605, "scale": 5.656808376312256}, "projection": {"bias": 0.0019031842239201069, "kernel": 0.430086225271225}}, "masked_spec_embed": 2.404470205307007}}, "train/learning_rate": 8.99998121894896e-06, "train/loss": 6.895620822906494, "train/param_norm": 24.566898345947266, "_timestamp": 1651947860, "_runtime": 219, "_step": 15, "eval/loss": 6.897119522094727, "eval/wer": 1.0, "eval/step_0k": {"_type": "table-file", "path": "media/table/eval/step_0k_15_a7d6e656cdc47be11a4d.table.json", "sha256": "a7d6e656cdc47be11a4d75d3c011d99f659e767be494426c80c0c0731f31d13d", "size": 16130, "artifact_path": "wandb-client-artifact://19f4znzaesiaov03izen1ahl0w7qlmc8cj5t002wl7xspuucj5elm5l18o3220zua1am9pknj3unkkmct9closy16r18nq0qbu0tcbd6h8k1nu94mptc1jcspvzozzvs:latest/eval/step_0k.table.json", "_latest_artifact_path": "wandb-client-artifact://19f4znzaesiaov03izen1ahl0w7qlmc8cj5t002wl7xspuucj5elm5l18o3220zua1am9pknj3unkkmct9closy16r18nq0qbu0tcbd6h8k1nu94mptc1jcspvzozzvs:latest/eval/step_0k.table.json", "ncols": 4, "nrows": 50}, "eval/step_0k_incorrect": {"_type": "table-file", "path": "media/table/eval/step_0k_incorrect_15_623faa4883d23d9d4194.table.json", "sha256": "623faa4883d23d9d41947dcde31f197a909862eb4d078966446c26699859d3be", "size": 20629, "artifact_path": "wandb-client-artifact://17fe55artcmnr37cm8759c1k6bsv73gf8abz6v04cd7o4x8736tep7fwespmhloma88uxxcks4u4wt28hxxjlc5l2zj52tehiu7w7w8rs4pxgqs6ilyeydcyplzzaovz:latest/eval/step_0k_incorrect.table.json", "_latest_artifact_path": "wandb-client-artifact://17fe55artcmnr37cm8759c1k6bsv73gf8abz6v04cd7o4x8736tep7fwespmhloma88uxxcks4u4wt28hxxjlc5l2zj52tehiu7w7w8rs4pxgqs6ilyeydcyplzzaovz:latest/eval/step_0k_incorrect.table.json", "ncols": 4, "nrows": 64}, "validation[:90%]/loss": 6.898902893066406, "validation[:90%]/wer": 1.0, "validation[:90%]/step_0k": {"_type": "table-file", "path": "media/table/validation[:90%]/step_0k_15_b59f86c33aa51dff79ab.table.json", "sha256": "b59f86c33aa51dff79ab7525d68bf93d944418cd9934b0bab1b26d58eb2047a0", "size": 15524, "artifact_path": "wandb-client-artifact://u0z0z66hn744k4v3xsj9dxa8isd41pixt3bc8hjl4zc1ddo4crr5xfnq5nlicikke60g4yvsznfk6wvaps314asysxc8a2f1dgr90a6ofrejii2g20qvu5ajyo3ljcic:latest/validation[:90%]/step_0k.table.json", "_latest_artifact_path": "wandb-client-artifact://u0z0z66hn744k4v3xsj9dxa8isd41pixt3bc8hjl4zc1ddo4crr5xfnq5nlicikke60g4yvsznfk6wvaps314asysxc8a2f1dgr90a6ofrejii2g20qvu5ajyo3ljcic:latest/validation[:90%]/step_0k.table.json", "ncols": 4, "nrows": 48}, "validation[:90%]/step_0k_incorrect": {"_type": "table-file", "path": "media/table/validation[:90%]/step_0k_incorrect_15_b59f86c33aa51dff79ab.table.json", "sha256": "b59f86c33aa51dff79ab7525d68bf93d944418cd9934b0bab1b26d58eb2047a0", "size": 15524, "artifact_path": "wandb-client-artifact://b9fe5eri5xnu2j65g1ecj9c30mdsis2s4cct3iwf0adthwpcpsoa6yc5im5x4axjtrysakbqgazlsj9cvkgc2wsbo10fyhbpl5foda0utlzyfvqnhumq8wk9eyaxiyid:latest/validation[:90%]/step_0k_incorrect.table.json", "_latest_artifact_path": "wandb-client-artifact://b9fe5eri5xnu2j65g1ecj9c30mdsis2s4cct3iwf0adthwpcpsoa6yc5im5x4axjtrysakbqgazlsj9cvkgc2wsbo10fyhbpl5foda0utlzyfvqnhumq8wk9eyaxiyid:latest/validation[:90%]/step_0k_incorrect.table.json", "ncols": 4, "nrows": 48}, "validation[:95%]/loss": 6.897119522094727, "validation[:95%]/wer": 1.0, "validation[:95%]/step_0k": {"_type": "table-file", "path": "media/table/validation[:95%]/step_0k_15_a7d6e656cdc47be11a4d.table.json", "sha256": "a7d6e656cdc47be11a4d75d3c011d99f659e767be494426c80c0c0731f31d13d", "size": 16130, "artifact_path": "wandb-client-artifact://7527uwgru9gzrm8xtuylf3ivix7kg530r7v8uxqxe7ol19balonvqhvf2lytdvkoa7wsobwxdw1sn0o7ke08yvboe9pon62ec24wimo0wyy4sm3o4uhygnna3enz25km:latest/validation[:95%]/step_0k.table.json", "_latest_artifact_path": "wandb-client-artifact://7527uwgru9gzrm8xtuylf3ivix7kg530r7v8uxqxe7ol19balonvqhvf2lytdvkoa7wsobwxdw1sn0o7ke08yvboe9pon62ec24wimo0wyy4sm3o4uhygnna3enz25km:latest/validation[:95%]/step_0k.table.json", "ncols": 4, "nrows": 50}, "validation[:95%]/step_0k_incorrect": {"_type": "table-file", "path": "media/table/validation[:95%]/step_0k_incorrect_15_623faa4883d23d9d4194.table.json", "sha256": "623faa4883d23d9d41947dcde31f197a909862eb4d078966446c26699859d3be", "size": 20629, "artifact_path": "wandb-client-artifact://y3oqnalspy00o6lj7ippqlg8wlj1tgnmbt6853o012ws8qc326oism2qizcsf20th8oank2w4s5ber52ovt1iuh4grfh0qq3xx4azrpsk57fgjccrgrm2j497ir58n3b:latest/validation[:95%]/step_0k_incorrect.table.json", "_latest_artifact_path": "wandb-client-artifact://y3oqnalspy00o6lj7ippqlg8wlj1tgnmbt6853o012ws8qc326oism2qizcsf20th8oank2w4s5ber52ovt1iuh4grfh0qq3xx4azrpsk57fgjccrgrm2j497ir58n3b:latest/validation[:95%]/step_0k_incorrect.table.json", "ncols": 4, "nrows": 64}, "_wandb": {"runtime": 221}}