RollingMuffin committed on
Commit
33a1aed
1 Parent(s): 0d8a7a6

Commit from colab

Browse files
Files changed (4) hide show
  1. config.json +14 -6
  2. pytorch_model.bin +2 -2
  3. tokenizer_config.json +1 -1
  4. training_args.bin +1 -1
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "sberbank-ai/rugpt3small_based_on_gpt2",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
@@ -8,16 +8,24 @@
8
  "bos_token_id": 50256,
9
  "embd_pdrop": 0.1,
10
  "eos_token_id": 50256,
11
- "gradient_checkpointing": false,
 
 
12
  "initializer_range": 0.02,
 
 
 
13
  "layer_norm_epsilon": 1e-05,
14
  "model_type": "gpt2",
15
  "n_ctx": 2048,
16
- "n_embd": 768,
17
- "n_head": 12,
18
  "n_inner": null,
19
- "n_layer": 12,
20
  "n_positions": 2048,
 
 
 
21
  "reorder_and_upcast_attn": false,
22
  "resid_pdrop": 0.1,
23
  "scale_attn_by_inverse_layer_idx": false,
@@ -30,5 +38,5 @@
30
  "torch_dtype": "float32",
31
  "transformers_version": "4.16.2",
32
  "use_cache": true,
33
- "vocab_size": 50264
34
  }
 
1
  {
2
+ "_name_or_path": "sberbank-ai/rugpt3medium_based_on_gpt2",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
8
  "bos_token_id": 50256,
9
  "embd_pdrop": 0.1,
10
  "eos_token_id": 50256,
11
+ "id2label": {
12
+ "0": "LABEL_0"
13
+ },
14
  "initializer_range": 0.02,
15
+ "label2id": {
16
+ "LABEL_0": 0
17
+ },
18
  "layer_norm_epsilon": 1e-05,
19
  "model_type": "gpt2",
20
  "n_ctx": 2048,
21
+ "n_embd": 1024,
22
+ "n_head": 16,
23
  "n_inner": null,
24
+ "n_layer": 24,
25
  "n_positions": 2048,
26
+ "n_special": 0,
27
+ "output_past": true,
28
+ "predict_special_tokens": true,
29
  "reorder_and_upcast_attn": false,
30
  "resid_pdrop": 0.1,
31
  "scale_attn_by_inverse_layer_idx": false,
 
38
  "torch_dtype": "float32",
39
  "transformers_version": "4.16.2",
40
  "use_cache": true,
41
+ "vocab_size": 50257
42
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c1f0d84ef1079701c83ff564124ad358c399a79e64e48787e14b67d35658b4d
3
- size 551319785
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46c362b75386c0250fcf748cac4880eb9692074c69f0b525494873e359415a50
3
+ size 1524273113
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"unk_token": {"content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "bos_token": {"content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "eos_token": {"content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "add_prefix_space": false, "special_tokens_map_file": null, "name_or_path": "sberbank-ai/rugpt3small_based_on_gpt2", "errors": "replace", "tokenizer_class": "GPT2Tokenizer"}
 
1
+ {"unk_token": {"content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "bos_token": {"content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "eos_token": {"content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "add_prefix_space": false, "special_tokens_map_file": null, "name_or_path": "sberbank-ai/rugpt3medium_based_on_gpt2", "errors": "replace", "tokenizer_class": "GPT2Tokenizer"}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:338449769623e92b438a7ed6bbc03986348358994b5a1d22545e14e260da2926
3
  size 2991
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a54fb90143bbc04b2dfdbe8cbdcd9ef94eb712cb8d27a668ac2e7ce60b197db
3
  size 2991