pellto committed on
Commit
30a7125
•
1 Parent(s): fa27690

upload files about models

Browse files
Files changed (6) hide show
  1. README.md +4 -0
  2. config.json +40 -0
  3. merges.txt +0 -0
  4. pytorch_model.bin +3 -0
  5. tokenizer.json +0 -0
  6. vocab.json +0 -0
README.md ADDED
@@ -0,0 +1,4 @@
 
 
 
 
1
+ 해당 모델은 [해당 사이트](https://huggingface.co/gpt2-medium)에서 가져온 모델입니다.
2
+
3
+
4
+ 해당 모델은 [Teachable NLP](https://ainize.ai/teachable-nlp) 서비스에서 사용됩니다.
config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_function": "gelu_new",
3
+ "architectures": [
4
+ "GPT2Model"
5
+ ],
6
+ "attn_pdrop": 0.1,
7
+ "bos_token_id": 50256,
8
+ "embd_pdrop": 0.1,
9
+ "eos_token_id": 50256,
10
+ "initializer_range": 0.02,
11
+ "layer_norm_epsilon": 1e-05,
12
+ "model_type": "gpt2",
13
+ "n_ctx": 1024,
14
+ "n_embd": 1024,
15
+ "n_head": 16,
16
+ "n_inner": null,
17
+ "n_layer": 24,
18
+ "n_positions": 1024,
19
+ "n_special": 0,
20
+ "predict_special_tokens": true,
21
+ "reorder_and_upcast_attn": false,
22
+ "resid_pdrop": 0.1,
23
+ "scale_attn_by_inverse_layer_idx": false,
24
+ "scale_attn_weights": true,
25
+ "summary_activation": null,
26
+ "summary_first_dropout": 0.1,
27
+ "summary_proj_to_labels": true,
28
+ "summary_type": "cls_index",
29
+ "summary_use_proj": true,
30
+ "task_specific_params": {
31
+ "text-generation": {
32
+ "do_sample": true,
33
+ "max_length": 50
34
+ }
35
+ },
36
+ "torch_dtype": "float32",
37
+ "transformers_version": "4.12.3",
38
+ "use_cache": true,
39
+ "vocab_size": 50257
40
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09fa59f5990d6767ee006f73f642a90e76b7112e62e39f0523f2db31cbcbadab
3
+ size 1444568793
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
vocab.json ADDED
The diff for this file is too large to render. See raw diff