EleutherAI
/

pythia-2.8b-modularaddition-first-ft

Text Generation

text-generation-inference

Inference Endpoints

Model card Files Files and versions Community

atmallen committed on Mar 22

Commit

06caae1

•

1 Parent(s): de4dd30

Training in progress, step 1

Files changed (2) hide show

config.json +2 -1
training_args.bin +2 -2

config.json CHANGED Viewed

@@ -3,6 +3,7 @@
   "architectures": [
     "GPTNeoXForCausalLM"
   ],
   "attention_dropout": 0.0,
   "bos_token_id": 0,
   "classifier_dropout": 0.1,
@@ -22,7 +23,7 @@
   "rotary_pct": 0.25,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.36.2",
   "use_cache": true,
   "use_parallel_residual": true,
   "vocab_size": 50304

   "architectures": [
     "GPTNeoXForCausalLM"
   ],
+  "attention_bias": true,
   "attention_dropout": 0.0,
   "bos_token_id": 0,
   "classifier_dropout": 0.1,
   "rotary_pct": 0.25,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
+  "transformers_version": "4.37.2",
   "use_cache": true,
   "use_parallel_residual": true,
   "vocab_size": 50304

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e8e455a3f95cbf8a506ee68a17228e55c17a09445cf18696e067ad3b359d6ebf
-size 4984

 version https://git-lfs.github.com/spec/v1
+oid sha256:71f535faf39eb8a143c9cbe9b66145745379ad5a03cc27575312af91d543de99
+size 4920