diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..81919cba361a24d921f6d7ff2adada227186a951 --- /dev/null +++ b/config.json @@ -0,0 +1,31 @@ +{ + "_name_or_path": "./", + "architectures": [ + "T5ForConditionalGeneration" + ], + "d_ff": 16, + "d_kv": 6, + "d_model": 8, + "decoder_start_token_id": 0, + "dense_act_fn": "silu", + "dropout_rate": 0.0, + "eos_token_id": 1, + "feed_forward_proj": "gated-silu", + "initializer_factor": 1.0, + "is_encoder_decoder": true, + "is_gated_act": true, + "layer_norm_epsilon": 1e-06, + "model_type": "t5", + "num_decoder_layers": 3, + "num_heads": 4, + "num_layers": 3, + "output_past": true, + "pad_token_id": 0, + "relative_attention_max_distance": 128, + "relative_attention_num_buckets": 64, + "tie_word_embeddings": false, + "torch_dtype": "float32", + "transformers_version": "4.26.0", + "use_cache": true, + "vocab_size": 256 +} diff --git a/t5x/README.md b/t5x/README.md new file mode 100644 index 0000000000000000000000000000000000000000..3c7c6a10d0d6f251612d9fbc86faab06d66fd918 --- /dev/null +++ b/t5x/README.md @@ -0,0 +1,3 @@ +--- +license: cc-by-nc-sa-4.0 +--- diff --git a/t5x/checkpoint_0/checkpoint b/t5x/checkpoint_0/checkpoint new file mode 100644 index 0000000000000000000000000000000000000000..1d8f53ed2e8a5b5cfe18229ade865f0dfd95445a Binary files /dev/null and b/t5x/checkpoint_0/checkpoint differ diff --git a/t5x/checkpoint_0/state.param_states.decoder.decoder.pre_cross_attention_layer_norm.scale.v/.zarray b/t5x/checkpoint_0/state.param_states.decoder.decoder.pre_cross_attention_layer_norm.scale.v/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..94cd03e354db3f7611f0b444f71a3086c0e3a23a --- /dev/null +++ b/t5x/checkpoint_0/state.param_states.decoder.decoder.pre_cross_attention_layer_norm.scale.v/.zarray @@ -0,0 +1 @@ +{"chunks":[8,3],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"