bh8648
/

codeparrot

Text Generation

text-generation-inference

Inference Endpoints

Model card Files and versions Community

bh8648 committed on Aug 17, 2023

Commit

fe26199

•

1 Parent(s): 173dc6c

Upload model

Files changed (2) hide show

config.json +5 -4
pytorch_model.bin +2 -2

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "gpt2",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"
@@ -12,11 +12,12 @@
   "layer_norm_epsilon": 1e-05,
   "model_type": "gpt2",
   "n_ctx": 1024,
-  "n_embd": 768,
-  "n_head": 12,
   "n_inner": null,
-  "n_layer": 12,
   "n_positions": 1024,
   "reorder_and_upcast_attn": false,
   "resid_pdrop": 0.1,
   "scale_attn_by_inverse_layer_idx": false,

 {
+  "_name_or_path": "gpt2-xl",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"
   "layer_norm_epsilon": 1e-05,
   "model_type": "gpt2",
   "n_ctx": 1024,
+  "n_embd": 1600,
+  "n_head": 25,
   "n_inner": null,
+  "n_layer": 48,
   "n_positions": 1024,
+  "output_past": true,
   "reorder_and_upcast_attn": false,
   "resid_pdrop": 0.1,
   "scale_attn_by_inverse_layer_idx": false,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cedd9284d78a99471924ed75c89982c1433e64c14106c4165840e027ce4a1307
-size 444078941

 version https://git-lfs.github.com/spec/v1
+oid sha256:7c1745afaf59b94d60ca4a5a95bf4ef63aa53db0c92183a6101659495d8c00ff
+size 6118698809