bh8648
/

codeparrot

Text Generation

text-generation-inference

Inference Endpoints

Model card | Files and versions | Community

bh8648 committed on Aug 17, 2023

Commit

e97302d

•

1 Parent(s): b830c84

Upload model

Files changed (2) hide show

config.json +4 -5
pytorch_model.bin +2 -2

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "gpt2-xl",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"
@@ -12,12 +12,11 @@
   "layer_norm_epsilon": 1e-05,
   "model_type": "gpt2",
   "n_ctx": 1024,
-  "n_embd": 1600,
-  "n_head": 25,
   "n_inner": null,
-  "n_layer": 48,
   "n_positions": 1024,
-  "output_past": true,
   "reorder_and_upcast_attn": false,
   "resid_pdrop": 0.1,
   "scale_attn_by_inverse_layer_idx": false,

 {
+  "_name_or_path": "gpt2",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"
   "layer_norm_epsilon": 1e-05,
   "model_type": "gpt2",
   "n_ctx": 1024,
+  "n_embd": 768,
+  "n_head": 12,
   "n_inner": null,
+  "n_layer": 12,
   "n_positions": 1024,
   "reorder_and_upcast_attn": false,
   "resid_pdrop": 0.1,
   "scale_attn_by_inverse_layer_idx": false,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7c1745afaf59b94d60ca4a5a95bf4ef63aa53db0c92183a6101659495d8c00ff
-size 6118698809

 version https://git-lfs.github.com/spec/v1
+oid sha256:cedd9284d78a99471924ed75c89982c1433e64c14106c4165840e027ce4a1307
+size 444078941