Striker-7
/

finetune

Generated from Trainer

text generation

Model card Files and versions Community

Striker-7 committed on Jul 30, 2024

Commit

e3fc864

·

verified ·

1 Parent(s): 004d861

Update config.json

Files changed (1) hide show

config.json +133 -3

config.json CHANGED Viewed

@@ -1,9 +1,139 @@
 {
-  "model_type": "EleutherAI/gpt-neo-2.7B",
   "task_specific_params": {
     "text-generation": {
       "do_sample": true,
-      "max_length": 200
     }
-  }
 }

+Hugging Face's logo
+Hugging Face
+Search models, datasets, users...
+Models
+Datasets
+Spaces
+Posts
+Docs
+Pricing
+EleutherAI
+/
+gpt-neo-2.7B
+like
+400
+Text Generation
+Transformers
+PyTorch
+JAX
+Rust
+Safetensors
+EleutherAI/pile
+English
+gpt_neo
+text generation
+causal-lm
+Inference Endpoints
+License:
+mit
+Model card
+Files and versions
+Community
+15
+gpt-neo-2.7B
+/
+config.json
+valhalla's picture
+valhalla
+add flax model
+0b8087b
+about 3 years ago
+raw
+Copy download link
+history
+blame
+contribute
+delete
+No virus
+1.46 kB
 {
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPTNeoForCausalLM"
+  ],
+  "attention_dropout": 0,
+  "attention_layers": [
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local"
+  ],
+  "attention_types": [
+    [
+      [
+        "global",
+        "local"
+      ],
+      16
+    ]
+  ],
+  "bos_token_id": 50256,
+  "embed_dropout": 0,
+  "eos_token_id": 50256,
+  "gradient_checkpointing": false,
+  "hidden_size": 2560,
+  "initializer_range": 0.02,
+  "intermediate_size": null,
+  "layer_norm_epsilon": 1e-05,
+  "max_position_embeddings": 2048,
+  "model_type": "gpt_neo",
+  "num_heads": 20,
+  "num_layers": 32,
+  "resid_dropout": 0,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
   "task_specific_params": {
     "text-generation": {
       "do_sample": true,
+      "max_length": 50,
+      "temperature": 0.9
     }
+  },
+  "tokenizer_class": "GPT2Tokenizer",
+  "transformers_version": "4.9.0.dev0",
+  "use_cache": true,
+  "vocab_size": 50257,
+  "window_size": 256
 }