siriuz42 commited on
Commit
b99e9f6
·
verified ·
1 Parent(s): 57996ba

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ ocdbt.process_0/d/391be1dabf9d22a13dbd77a36b10b698 filter=lfs diff=lfs merge=lfs -text
37
+ ocdbt.process_0/d/f933434baa602db9432904cb5cfd5012 filter=lfs diff=lfs merge=lfs -text
_CHECKPOINT_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"item_handlers": "orbax.checkpoint._src.handlers.standard_checkpoint_handler.StandardCheckpointHandler", "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1756834444111574238, "commit_timestamp_nsecs": 1756834447611022662, "custom_metadata": {}}
_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"tree_metadata": {"('output_projection_point', 'hidden_layer', 'kernel', 'value')": {"key_metadata": [{"key": "output_projection_point", "key_type": 2}, {"key": "hidden_layer", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [320, 1280]}}, "('output_projection_point', 'output_layer', 'kernel', 'value')": {"key_metadata": [{"key": "output_projection_point", "key_type": 2}, {"key": "output_layer", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [320, 1280]}}, "('output_projection_point', 'residual_layer', 'kernel', 'value')": {"key_metadata": [{"key": "output_projection_point", "key_type": 2}, {"key": "residual_layer", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [320, 1280]}}, "('output_projection_quantiles', 'hidden_layer', 'kernel', 'value')": {"key_metadata": [{"key": "output_projection_quantiles", "key_type": 2}, {"key": "hidden_layer", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [320, 1280]}}, "('output_projection_quantiles', 'output_layer', 'kernel', 'value')": {"key_metadata": [{"key": "output_projection_quantiles", "key_type": 2}, {"key": "output_layer", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [320, 10240]}}, "('output_projection_quantiles', 'residual_layer', 'kernel', 'value')": {"key_metadata": [{"key": "output_projection_quantiles", "key_type": 2}, {"key": "residual_layer", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [320, 10240]}}, "('stacked_xf', 'attn', 'key', 'kernel', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 1280, 16, 80]}}, "('stacked_xf', 'attn', 'key_ln', 'scale', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "key_ln", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 80]}}, "('stacked_xf', 'attn', 'out', 'kernel', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 16, 80, 1280]}}, "('stacked_xf', 'attn', 'per_dim_scale', 'per_dim_scale', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "per_dim_scale", "key_type": 2}, {"key": "per_dim_scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 80]}}, "('stacked_xf', 'attn', 'query', 'kernel', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 1280, 16, 80]}}, "('stacked_xf', 'attn', 'query_ln', 'scale', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "query_ln", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 80]}}, "('stacked_xf', 'attn', 'value', 'kernel', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 1280, 16, 80]}}, "('stacked_xf', 'ff0', 'kernel', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "ff0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 1280, 1280]}}, "('stacked_xf', 'ff1', 'kernel', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "ff1", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 1280, 1280]}}, "('stacked_xf', 'post_attn_ln', 'scale', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "post_attn_ln", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 1280]}}, "('stacked_xf', 'post_ff_ln', 'scale', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "post_ff_ln", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 1280]}}, "('stacked_xf', 'pre_attn_ln', 'scale', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "pre_attn_ln", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 1280]}}, "('stacked_xf', 'pre_ff_ln', 'scale', 'value')": {"key_metadata": [{"key": "stacked_xf", "key_type": 2}, {"key": "pre_ff_ln", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [5, 1280]}}, "('tokenizer', 'hidden_layer', 'bias', 'value')": {"key_metadata": [{"key": "tokenizer", "key_type": 2}, {"key": "hidden_layer", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [320]}}, "('tokenizer', 'hidden_layer', 'kernel', 'value')": {"key_metadata": [{"key": "tokenizer", "key_type": 2}, {"key": "hidden_layer", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [16, 1280]}}, "('tokenizer', 'output_layer', 'bias', 'value')": {"key_metadata": [{"key": "tokenizer", "key_type": 2}, {"key": "output_layer", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [320]}}, "('tokenizer', 'output_layer', 'kernel', 'value')": {"key_metadata": [{"key": "tokenizer", "key_type": 2}, {"key": "output_layer", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [320, 1280]}}, "('tokenizer', 'residual_layer', 'bias', 'value')": {"key_metadata": [{"key": "tokenizer", "key_type": 2}, {"key": "residual_layer", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [320]}}, "('tokenizer', 'residual_layer', 'kernel', 'value')": {"key_metadata": [{"key": "tokenizer", "key_type": 2}, {"key": "residual_layer", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false, "write_shape": [16, 1280]}}}, "use_zarr3": false, "store_array_data_equal_to_fill_value": true, "custom_metadata": null}
_sharding ADDED
@@ -0,0 +1 @@
 
 
1
+ {"b3V0cHV0X3Byb2plY3Rpb25fcG9pbnQuaGlkZGVuX2xheWVyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","b3V0cHV0X3Byb2plY3Rpb25fcG9pbnQub3V0cHV0X2xheWVyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","b3V0cHV0X3Byb2plY3Rpb25fcG9pbnQucmVzaWR1YWxfbGF5ZXIua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","b3V0cHV0X3Byb2plY3Rpb25fcXVhbnRpbGVzLm91dHB1dF9sYXllci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","b3V0cHV0X3Byb2plY3Rpb25fcXVhbnRpbGVzLmhpZGRlbl9sYXllci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","b3V0cHV0X3Byb2plY3Rpb25fcXVhbnRpbGVzLnJlc2lkdWFsX2xheWVyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5hdHRuLm91dC5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5hdHRuLmtleS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5hdHRuLmtleV9sbi5zY2FsZS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5hdHRuLnBlcl9kaW1fc2NhbGUucGVyX2RpbV9zY2FsZS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5hdHRuLnF1ZXJ5Lmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5hdHRuLnF1ZXJ5X2xuLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5hdHRuLnZhbHVlLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5mZjAua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5mZjEua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5wb3N0X2F0dG5fbG4uc2NhbGUudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5wb3N0X2ZmX2xuLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5wcmVfYXR0bl9sbi5zY2FsZS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","c3RhY2tlZF94Zi5wcmVfZmZfbG4uc2NhbGUudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","dG9rZW5pemVyLm91dHB1dF9sYXllci5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","dG9rZW5pemVyLm91dHB1dF9sYXllci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","dG9rZW5pemVyLmhpZGRlbl9sYXllci5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","dG9rZW5pemVyLmhpZGRlbl9sYXllci5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","dG9rZW5pemVyLnJlc2lkdWFsX2xheWVyLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}","dG9rZW5pemVyLnJlc2lkdWFsX2xheWVyLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [1, 4, 1], \"axis_names\": [\"replica\", \"data\", \"mdl\"], \"partition_spec\": [null, null], \"device_mesh\": {\"mesh\": [[[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 3}], [{\"id\": 2}]]]}}"}
array_metadatas/process_0 ADDED
@@ -0,0 +1 @@
 
 
1
+ {"array_metadatas": [{"array_metadata": {"param_name": "output_projection_point.hidden_layer.kernel.value", "write_shape": [320, 1280], "chunk_shape": [320, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "output_projection_point.output_layer.kernel.value", "write_shape": [320, 1280], "chunk_shape": [320, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "output_projection_point.residual_layer.kernel.value", "write_shape": [320, 1280], "chunk_shape": [320, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "output_projection_quantiles.hidden_layer.kernel.value", "write_shape": [320, 1280], "chunk_shape": [320, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "output_projection_quantiles.output_layer.kernel.value", "write_shape": [320, 10240], "chunk_shape": [320, 10240], "ext_metadata": null}}, {"array_metadata": {"param_name": "output_projection_quantiles.residual_layer.kernel.value", "write_shape": [320, 10240], "chunk_shape": [320, 10240], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.attn.key.kernel.value", "write_shape": [5, 1280, 16, 80], "chunk_shape": [5, 1280, 16, 80], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.attn.key_ln.scale.value", "write_shape": [5, 80], "chunk_shape": [5, 80], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.attn.out.kernel.value", "write_shape": [5, 16, 80, 1280], "chunk_shape": [5, 16, 80, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.attn.per_dim_scale.per_dim_scale.value", "write_shape": [5, 80], "chunk_shape": [5, 80], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.attn.query.kernel.value", "write_shape": [5, 1280, 16, 80], "chunk_shape": [5, 1280, 16, 80], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.attn.query_ln.scale.value", "write_shape": [5, 80], "chunk_shape": [5, 80], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.attn.value.kernel.value", "write_shape": [5, 1280, 16, 80], "chunk_shape": [5, 1280, 16, 80], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.ff0.kernel.value", "write_shape": [5, 1280, 1280], "chunk_shape": [5, 1280, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.ff1.kernel.value", "write_shape": [5, 1280, 1280], "chunk_shape": [5, 1280, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.post_attn_ln.scale.value", "write_shape": [5, 1280], "chunk_shape": [5, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.post_ff_ln.scale.value", "write_shape": [5, 1280], "chunk_shape": [5, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.pre_attn_ln.scale.value", "write_shape": [5, 1280], "chunk_shape": [5, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "stacked_xf.pre_ff_ln.scale.value", "write_shape": [5, 1280], "chunk_shape": [5, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "tokenizer.hidden_layer.bias.value", "write_shape": [320], "chunk_shape": [320], "ext_metadata": null}}, {"array_metadata": {"param_name": "tokenizer.hidden_layer.kernel.value", "write_shape": [16, 1280], "chunk_shape": [16, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "tokenizer.output_layer.bias.value", "write_shape": [320], "chunk_shape": [320], "ext_metadata": null}}, {"array_metadata": {"param_name": "tokenizer.output_layer.kernel.value", "write_shape": [320, 1280], "chunk_shape": [320, 1280], "ext_metadata": null}}, {"array_metadata": {"param_name": "tokenizer.residual_layer.bias.value", "write_shape": [320], "chunk_shape": [320], "ext_metadata": null}}, {"array_metadata": {"param_name": "tokenizer.residual_layer.kernel.value", "write_shape": [16, 1280], "chunk_shape": [16, 1280], "ext_metadata": null}}]}
d/99d9838f4ea666b0baf271caec0acb55 ADDED
Binary file (1.64 kB). View file
 
descriptor/descriptor.pbtxt ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ uuid: "1268afaf-1c19-4568-8171-17e9c4ca2504"
2
+ build_data {
3
+ timestamp {
4
+ seconds: 1756506922
5
+ }
6
+ user: "yichenzhou"
7
+ hostname: "jaii33.prod.google.com"
8
+ path: "/google/src/cloud/buildrabbit-username/buildrabbit-client/google3"
9
+ target: "//learning/multipod/pax/foundation_ts:colab_utils"
10
+ invocation_id: "85202664-c4db-4178-9852-4d838c3fc656"
11
+ changelist: 801048062
12
+ baseline_cl: 801048062
13
+ workspace_id: "yichenzhou/3652"
14
+ citc_snapshot: 1422
15
+ client_status: BUILD_CLIENT_STATUS_UNSPECIFIED
16
+ verifiable: NON_VERIFIABLE
17
+ }
descriptor/uuid-1268afaf-1c19-4568-8171-17e9c4ca2504 ADDED
@@ -0,0 +1 @@
 
 
1
+ uuid: "1268afaf-1c19-4568-8171-17e9c4ca2504"
manifest.ocdbt ADDED
Binary file (117 Bytes). View file
 
ocdbt.process_0/d/391be1dabf9d22a13dbd77a36b10b698 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d0d0c4a6a6a7de9f740d9742fc55e7da88bcaa1358db77b8e2f2e0fa8513e43
3
+ size 128737280
ocdbt.process_0/d/82e3580474fe958b6aca1f086b1801bb ADDED
Binary file (1.62 kB). View file
 
ocdbt.process_0/d/f0a794078cf86d67e5026770a0cb3aaa ADDED
Binary file (590 Bytes). View file
 
ocdbt.process_0/d/f933434baa602db9432904cb5cfd5012 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6785fb6360727a848ef3934b4b1c891d3dcfb8117ad073d4a3661c8fe2769fa4
3
+ size 729174016
ocdbt.process_0/manifest.ocdbt ADDED
Binary file (266 Bytes). View file