diff --git "a/octo_connector_rl_45/9999/default/_METADATA" "b/octo_connector_rl_45/9999/default/_METADATA" new file mode 100644--- /dev/null +++ "b/octo_connector_rl_45/9999/default/_METADATA" @@ -0,0 +1 @@ +{"tree_metadata": {"('heads_action', 'diffusion_model', 'cond_encoder', 'Dense_0', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "cond_encoder", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'cond_encoder', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "cond_encoder", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'cond_encoder', 'Dense_1', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "cond_encoder", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'cond_encoder', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "cond_encoder", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'Dense_0', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'Dense_1', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_0', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_0", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_0', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_0", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_1', 'Dense_0', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_1", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_1', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_1", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_1', 'Dense_1', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_1", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_1', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_1", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_1', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_1", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_1', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_1", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_2', 'Dense_0', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_2", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_2', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_2", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_2', 'Dense_1', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_2", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_2', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_2", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_2', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_2", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'reverse_network', 'MLPResNetBlock_2', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "reverse_network", "key_type": 2}, {"key": "MLPResNetBlock_2", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('heads_action', 'diffusion_model', 'time_preprocess', 'kernel')": {"key_metadata": [{"key": "heads_action", "key_type": 2}, {"key": "diffusion_model", "key_type": 2}, {"key": "time_preprocess", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoder_norm', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoder_norm", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoder_norm', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoder_norm", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'LayerNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'LayerNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'MlpBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'MlpBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'MlpBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'MlpBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'MultiHeadDotProductAttention_0', 'key', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'MultiHeadDotProductAttention_0', 'key', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'MultiHeadDotProductAttention_0', 'out', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'MultiHeadDotProductAttention_0', 'out', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'MultiHeadDotProductAttention_0', 'query', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'MultiHeadDotProductAttention_0', 'query', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'MultiHeadDotProductAttention_0', 'value', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_0', 'MultiHeadDotProductAttention_0', 'value', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_0", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'LayerNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'LayerNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'MlpBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'MlpBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'MlpBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'MlpBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'MultiHeadDotProductAttention_0', 'key', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'MultiHeadDotProductAttention_0', 'key', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'MultiHeadDotProductAttention_0', 'out', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'MultiHeadDotProductAttention_0', 'out', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'MultiHeadDotProductAttention_0', 'query', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'MultiHeadDotProductAttention_0', 'query', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'MultiHeadDotProductAttention_0', 'value', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_1', 'MultiHeadDotProductAttention_0', 'value', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_1", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'LayerNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'LayerNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'MlpBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'MlpBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'MlpBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'MlpBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'MultiHeadDotProductAttention_0', 'key', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'MultiHeadDotProductAttention_0', 'key', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'MultiHeadDotProductAttention_0', 'out', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'MultiHeadDotProductAttention_0', 'out', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'MultiHeadDotProductAttention_0', 'query', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'MultiHeadDotProductAttention_0', 'query', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'MultiHeadDotProductAttention_0', 'value', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_10', 'MultiHeadDotProductAttention_0', 'value', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_10", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'LayerNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'LayerNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'MlpBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'MlpBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'MlpBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'MlpBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'MultiHeadDotProductAttention_0', 'key', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'MultiHeadDotProductAttention_0', 'key', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'MultiHeadDotProductAttention_0', 'out', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'MultiHeadDotProductAttention_0', 'out', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'MultiHeadDotProductAttention_0', 'query', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'MultiHeadDotProductAttention_0', 'query', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'MultiHeadDotProductAttention_0', 'value', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_11', 'MultiHeadDotProductAttention_0', 'value', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_11", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'LayerNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'LayerNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'MlpBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'MlpBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'MlpBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'MlpBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'MultiHeadDotProductAttention_0', 'key', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'MultiHeadDotProductAttention_0', 'key', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'MultiHeadDotProductAttention_0', 'out', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'MultiHeadDotProductAttention_0', 'out', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'MultiHeadDotProductAttention_0', 'query', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'MultiHeadDotProductAttention_0', 'query', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'MultiHeadDotProductAttention_0', 'value', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_2', 'MultiHeadDotProductAttention_0', 'value', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_2", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'LayerNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'LayerNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'MlpBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'MlpBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'MlpBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'MlpBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'MultiHeadDotProductAttention_0', 'key', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'MultiHeadDotProductAttention_0', 'key', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'MultiHeadDotProductAttention_0', 'out', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'MultiHeadDotProductAttention_0', 'out', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'MultiHeadDotProductAttention_0', 'query', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'MultiHeadDotProductAttention_0', 'query', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'MultiHeadDotProductAttention_0', 'value', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_3', 'MultiHeadDotProductAttention_0', 'value', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_3", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'LayerNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'LayerNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'MlpBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'MlpBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'MlpBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'MlpBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'MultiHeadDotProductAttention_0', 'key', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'MultiHeadDotProductAttention_0', 'key', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'MultiHeadDotProductAttention_0', 'out', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'MultiHeadDotProductAttention_0', 'out', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'MultiHeadDotProductAttention_0', 'query', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'MultiHeadDotProductAttention_0', 'query', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'MultiHeadDotProductAttention_0', 'value', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_4', 'MultiHeadDotProductAttention_0', 'value', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_4", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'LayerNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'LayerNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'MlpBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'MlpBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'MlpBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'MlpBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'MultiHeadDotProductAttention_0', 'key', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'MultiHeadDotProductAttention_0', 'key', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'MultiHeadDotProductAttention_0', 'out', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'MultiHeadDotProductAttention_0', 'out', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'MultiHeadDotProductAttention_0', 'query', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'MultiHeadDotProductAttention_0', 'query', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'MultiHeadDotProductAttention_0', 'value', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_5', 'MultiHeadDotProductAttention_0', 'value', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_5", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'LayerNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'LayerNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'MlpBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'MlpBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'MlpBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'MlpBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'MultiHeadDotProductAttention_0', 'key', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'MultiHeadDotProductAttention_0', 'key', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'MultiHeadDotProductAttention_0', 'out', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'MultiHeadDotProductAttention_0', 'out', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'MultiHeadDotProductAttention_0', 'query', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'MultiHeadDotProductAttention_0', 'query', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'MultiHeadDotProductAttention_0', 'value', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_6', 'MultiHeadDotProductAttention_0', 'value', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_6", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'LayerNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'LayerNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'MlpBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'MlpBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'MlpBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'MlpBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'MultiHeadDotProductAttention_0', 'key', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'MultiHeadDotProductAttention_0', 'key', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'MultiHeadDotProductAttention_0', 'out', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'MultiHeadDotProductAttention_0', 'out', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'MultiHeadDotProductAttention_0', 'query', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'MultiHeadDotProductAttention_0', 'query', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'MultiHeadDotProductAttention_0', 'value', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_7', 'MultiHeadDotProductAttention_0', 'value', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_7", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'LayerNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'LayerNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'MlpBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'MlpBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'MlpBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'MlpBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'MultiHeadDotProductAttention_0', 'key', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'MultiHeadDotProductAttention_0', 'key', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'MultiHeadDotProductAttention_0', 'out', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'MultiHeadDotProductAttention_0', 'out', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'MultiHeadDotProductAttention_0', 'query', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'MultiHeadDotProductAttention_0', 'query', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'MultiHeadDotProductAttention_0', 'value', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_8', 'MultiHeadDotProductAttention_0', 'value', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_8", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'LayerNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'LayerNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'LayerNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'LayerNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'MlpBlock_0', 'Dense_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'MlpBlock_0', 'Dense_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'MlpBlock_0', 'Dense_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'MlpBlock_0', 'Dense_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'MultiHeadDotProductAttention_0', 'key', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'MultiHeadDotProductAttention_0', 'key', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'MultiHeadDotProductAttention_0', 'out', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'MultiHeadDotProductAttention_0', 'out', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'MultiHeadDotProductAttention_0', 'query', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'MultiHeadDotProductAttention_0', 'query', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'MultiHeadDotProductAttention_0', 'value', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'BlockTransformer_0', 'Transformer_0', 'encoderblock_9', 'MultiHeadDotProductAttention_0', 'value', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "BlockTransformer_0", "key_type": 2}, {"key": "Transformer_0", "key_type": 2}, {"key": "encoderblock_9", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'obs_primary_pos_embedding')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "obs_primary_pos_embedding", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'obs_primary_projection', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "obs_primary_projection", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'obs_primary_projection', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "obs_primary_projection", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'GroupNorm_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "GroupNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'GroupNorm_0', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "GroupNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'GroupNorm_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "GroupNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'GroupNorm_1', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "GroupNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'GroupNorm_2', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "GroupNorm_2", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'GroupNorm_2', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "GroupNorm_2", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'GroupNorm_3', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "GroupNorm_3", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'GroupNorm_3', 'scale')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "GroupNorm_3", "key_type": 2}, {"key": "scale", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'StdConv_0', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "StdConv_0", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'StdConv_0', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "StdConv_0", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'StdConv_1', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "StdConv_1", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'StdConv_1', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "StdConv_1", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'StdConv_2', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "StdConv_2", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'StdConv_2', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "StdConv_2", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'StdConv_3', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "StdConv_3", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'StdConv_3', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "StdConv_3", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'embedding', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "embedding", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'observation_tokenizers_primary', 'SmallStem16_0', 'embedding', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "observation_tokenizers_primary", "key_type": 2}, {"key": "SmallStem16_0", "key_type": 2}, {"key": "embedding", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'readout_action_pos_embedding')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "readout_action_pos_embedding", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_language_pos_embedding')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_language_pos_embedding", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_language_projection', 'bias')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_language_projection", "key_type": 2}, {"key": "bias", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_language_projection', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_language_projection", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '0', 'layer', '0', 'SelfAttention', 'k', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '0', 'layer', '0', 'SelfAttention', 'o', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '0', 'layer', '0', 'SelfAttention', 'q', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '0', 'layer', '0', 'SelfAttention', 'relative_attention_bias', 'embedding')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "relative_attention_bias", "key_type": 2}, {"key": "embedding", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '0', 'layer', '0', 'SelfAttention', 'v', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '0', 'layer', '0', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '0', 'layer', '1', 'DenseReluDense', 'wi', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wi", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '0', 'layer', '1', 'DenseReluDense', 'wo', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wo", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '0', 'layer', '1', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '1', 'layer', '0', 'SelfAttention', 'k', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '1', 'layer', '0', 'SelfAttention', 'o', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '1', 'layer', '0', 'SelfAttention', 'q', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '1', 'layer', '0', 'SelfAttention', 'v', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '1', 'layer', '0', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '1', 'layer', '1', 'DenseReluDense', 'wi', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wi", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '1', 'layer', '1', 'DenseReluDense', 'wo', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wo", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '1', 'layer', '1', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '10', 'layer', '0', 'SelfAttention', 'k', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "10", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '10', 'layer', '0', 'SelfAttention', 'o', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "10", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '10', 'layer', '0', 'SelfAttention', 'q', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "10", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '10', 'layer', '0', 'SelfAttention', 'v', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "10", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '10', 'layer', '0', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "10", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '10', 'layer', '1', 'DenseReluDense', 'wi', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "10", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wi", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '10', 'layer', '1', 'DenseReluDense', 'wo', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "10", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wo", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '10', 'layer', '1', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "10", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '11', 'layer', '0', 'SelfAttention', 'k', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "11", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '11', 'layer', '0', 'SelfAttention', 'o', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "11", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '11', 'layer', '0', 'SelfAttention', 'q', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "11", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '11', 'layer', '0', 'SelfAttention', 'v', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "11", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '11', 'layer', '0', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "11", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '11', 'layer', '1', 'DenseReluDense', 'wi', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "11", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wi", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '11', 'layer', '1', 'DenseReluDense', 'wo', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "11", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wo", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '11', 'layer', '1', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "11", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '2', 'layer', '0', 'SelfAttention', 'k', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '2', 'layer', '0', 'SelfAttention', 'o', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '2', 'layer', '0', 'SelfAttention', 'q', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '2', 'layer', '0', 'SelfAttention', 'v', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '2', 'layer', '0', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '2', 'layer', '1', 'DenseReluDense', 'wi', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wi", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '2', 'layer', '1', 'DenseReluDense', 'wo', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wo", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '2', 'layer', '1', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "2", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '3', 'layer', '0', 'SelfAttention', 'k', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '3', 'layer', '0', 'SelfAttention', 'o', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '3', 'layer', '0', 'SelfAttention', 'q', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '3', 'layer', '0', 'SelfAttention', 'v', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '3', 'layer', '0', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '3', 'layer', '1', 'DenseReluDense', 'wi', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wi", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '3', 'layer', '1', 'DenseReluDense', 'wo', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wo", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '3', 'layer', '1', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "3", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '4', 'layer', '0', 'SelfAttention', 'k', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "4", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '4', 'layer', '0', 'SelfAttention', 'o', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "4", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '4', 'layer', '0', 'SelfAttention', 'q', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "4", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '4', 'layer', '0', 'SelfAttention', 'v', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "4", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '4', 'layer', '0', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "4", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '4', 'layer', '1', 'DenseReluDense', 'wi', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "4", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wi", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '4', 'layer', '1', 'DenseReluDense', 'wo', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "4", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wo", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '4', 'layer', '1', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "4", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '5', 'layer', '0', 'SelfAttention', 'k', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "5", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '5', 'layer', '0', 'SelfAttention', 'o', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "5", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '5', 'layer', '0', 'SelfAttention', 'q', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "5", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '5', 'layer', '0', 'SelfAttention', 'v', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "5", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '5', 'layer', '0', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "5", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '5', 'layer', '1', 'DenseReluDense', 'wi', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "5", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wi", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '5', 'layer', '1', 'DenseReluDense', 'wo', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "5", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wo", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '5', 'layer', '1', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "5", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '6', 'layer', '0', 'SelfAttention', 'k', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "6", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '6', 'layer', '0', 'SelfAttention', 'o', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "6", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '6', 'layer', '0', 'SelfAttention', 'q', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "6", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '6', 'layer', '0', 'SelfAttention', 'v', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "6", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '6', 'layer', '0', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "6", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '6', 'layer', '1', 'DenseReluDense', 'wi', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "6", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wi", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '6', 'layer', '1', 'DenseReluDense', 'wo', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "6", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wo", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '6', 'layer', '1', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "6", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '7', 'layer', '0', 'SelfAttention', 'k', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "7", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '7', 'layer', '0', 'SelfAttention', 'o', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "7", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '7', 'layer', '0', 'SelfAttention', 'q', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "7", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '7', 'layer', '0', 'SelfAttention', 'v', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "7", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '7', 'layer', '0', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "7", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '7', 'layer', '1', 'DenseReluDense', 'wi', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "7", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wi", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '7', 'layer', '1', 'DenseReluDense', 'wo', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "7", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wo", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '7', 'layer', '1', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "7", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '8', 'layer', '0', 'SelfAttention', 'k', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "8", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '8', 'layer', '0', 'SelfAttention', 'o', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "8", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '8', 'layer', '0', 'SelfAttention', 'q', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "8", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '8', 'layer', '0', 'SelfAttention', 'v', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "8", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '8', 'layer', '0', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "8", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '8', 'layer', '1', 'DenseReluDense', 'wi', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "8", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wi", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '8', 'layer', '1', 'DenseReluDense', 'wo', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "8", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wo", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '8', 'layer', '1', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "8", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '9', 'layer', '0', 'SelfAttention', 'k', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "9", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "k", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '9', 'layer', '0', 'SelfAttention', 'o', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "9", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "o", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '9', 'layer', '0', 'SelfAttention', 'q', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "9", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "q", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '9', 'layer', '0', 'SelfAttention', 'v', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "9", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "SelfAttention", "key_type": 2}, {"key": "v", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '9', 'layer', '0', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "9", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "0", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '9', 'layer', '1', 'DenseReluDense', 'wi', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "9", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wi", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '9', 'layer', '1', 'DenseReluDense', 'wo', 'kernel')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "9", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "DenseReluDense", "key_type": 2}, {"key": "wo", "key_type": 2}, {"key": "kernel", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'block', '9', 'layer', '1', 'layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "block", "key_type": 2}, {"key": "9", "key_type": 2}, {"key": "layer", "key_type": 2}, {"key": "1", "key_type": 2}, {"key": "layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'encoder', 'final_layer_norm', 'weight')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "encoder", "key_type": 2}, {"key": "final_layer_norm", "key_type": 2}, {"key": "weight", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}, "('octo_transformer', 'task_tokenizers_language', 'hf_model', 'shared', 'embedding')": {"key_metadata": [{"key": "octo_transformer", "key_type": 2}, {"key": "task_tokenizers_language", "key_type": 2}, {"key": "hf_model", "key_type": 2}, {"key": "shared", "key_type": 2}, {"key": "embedding", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": true}}}} \ No newline at end of file