usmiva committed on
Commit
2ec7af4
1 Parent(s): b9c2048

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +35 -1
README.md CHANGED
@@ -87,8 +87,10 @@ set_seed(42)
87
  ```python
88
  gpt_web_bg("По професия той е ")
89
 
 
90
  ```
91
  [{'generated_text': 'По професия той е строителен работник, който е �'}]
 
92
 
93
 
94
 
@@ -103,7 +105,39 @@ gpt_web_bg("По професия той е ")
103
 
104
  <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
105
 
106
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
107
 
108
  #### Preprocessing [optional]
109
 
 
87
  ```python
88
  gpt_web_bg("По професия той е ")
89
 
90
+ ```
91
  ```
92
  [{'generated_text': 'По професия той е строителен работник, който е �'}]
93
+ ```
94
 
95
 
96
 
 
105
 
106
  <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
107
 
108
+ ```
109
+ {
110
+ "activation_function": "gelu_new",
111
+ "architectures": [
112
+ "GPT2LMHeadModel"
113
+ ],
114
+ "attn_pdrop": 0.1,
115
+ "bos_token_id": 50256,
116
+ "embd_pdrop": 0.1,
117
+ "eos_token_id": 50256,
118
+ "initializer_range": 0.02,
119
+ "layer_norm_epsilon": 1e-05,
120
+ "model_type": "gpt2",
121
+ "n_embd": 768,
122
+ "n_head": 12,
123
+ "n_inner": null,
124
+ "n_layer": 12,
125
+ "n_positions": 1024,
126
+ "reorder_and_upcast_attn": false,
127
+ "resid_pdrop": 0.1,
128
+ "scale_attn_by_inverse_layer_idx": false,
129
+ "scale_attn_weights": true,
130
+ "summary_activation": null,
131
+ "summary_first_dropout": 0.1,
132
+ "summary_proj_to_labels": true,
133
+ "summary_type": "cls_index",
134
+ "summary_use_proj": true,
135
+ "torch_dtype": "float32",
136
+ "transformers_version": "4.22.0.dev0",
137
+ "use_cache": true,
138
+ "vocab_size": 50257
139
+ }
140
+ ```
141
 
142
  #### Preprocessing [optional]
143