Rich-J
/

key11

Text Generation

text-generation-inference

Inference Endpoints

Model card | Files and versions | Community

Rich-J committed on Jan 24

Commit

a4a7d00

•

1 Parent(s): b93bea1

Upload model

Files changed (2) hide show

config.json +9 -2
model.safetensors +2 -2

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "syncdoth/pretraining-sn9-2",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"
@@ -11,10 +11,11 @@
   "initializer_range": 0.02,
   "layer_norm_epsilon": 1e-05,
   "model_type": "gpt2",
   "n_embd": 768,
   "n_head": 12,
   "n_inner": null,
-  "n_layer": 11,
   "n_positions": 1024,
   "reorder_and_upcast_attn": false,
   "resid_pdrop": 0.0,
@@ -25,6 +26,12 @@
   "summary_proj_to_labels": true,
   "summary_type": "cls_index",
   "summary_use_proj": true,
   "torch_dtype": "float32",
   "transformers_version": "4.34.1",
   "use_cache": true,

 {
+  "_name_or_path": "/root/pretraining/local-models/training/2024-01-24_07-40-33",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"
   "initializer_range": 0.02,
   "layer_norm_epsilon": 1e-05,
   "model_type": "gpt2",
+  "n_ctx": 1024,
   "n_embd": 768,
   "n_head": 12,
   "n_inner": null,
+  "n_layer": 20,
   "n_positions": 1024,
   "reorder_and_upcast_attn": false,
   "resid_pdrop": 0.0,
   "summary_proj_to_labels": true,
   "summary_type": "cls_index",
   "summary_use_proj": true,
+  "task_specific_params": {
+    "text-generation": {
+      "do_sample": true,
+      "max_length": 50
+    }
+  },
   "torch_dtype": "float32",
   "transformers_version": "4.34.1",
   "use_cache": true,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fc47c819387b16e69b9d562d3130f62e8203838348cf92ced5128009f229ee8c
-size 469421488

 version https://git-lfs.github.com/spec/v1
+oid sha256:01a1592c24c4e291e280c07a4a6e6c7410d707bdccb1575817c78ebb27a0a0b2
+size 724595976