ojasaar committed on
Commit
ce09134
1 Parent(s): d332c5d

model + tokenizer

Browse files
Files changed (6) hide show
  1. README.md +18 -0
  2. config.json +38 -0
  3. merges.txt +0 -0
  4. pytorch_model_quantized.bin +3 -0
  5. tokenizer.json +0 -0
  6. vocab.json +0 -0
README.md ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - en
4
+ ---
5
+ # PyTorch int8 quantized version of gpt2-large
6
+
7
+ ## Usage
8
+
9
+ Download the `pytorch_model_quantized.bin` file locally.
10
+ Load it with the snippet below:
11
+
12
+ The rest of the usage follows the [original gpt2-large instructions](https://huggingface.co/gpt2-large).
13
+
14
+ ```python
15
+ import torch
16
+
17
+ model = torch.load("path/to/pytorch_model_quantized.bin")
18
+ ```
config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_num_labels": 1,
3
+ "activation_function": "gelu_new",
4
+ "architectures": [
5
+ "GPT2LMHeadModel"
6
+ ],
7
+ "attn_pdrop": 0.1,
8
+ "bos_token_id": 50256,
9
+ "embd_pdrop": 0.1,
10
+ "eos_token_id": 50256,
11
+ "id2label": {
12
+ "0": "LABEL_0"
13
+ },
14
+ "initializer_range": 0.02,
15
+ "label2id": {
16
+ "LABEL_0": 0
17
+ },
18
+ "layer_norm_epsilon": 1e-05,
19
+ "model_type": "gpt2",
20
+ "n_ctx": 1024,
21
+ "n_embd": 1280,
22
+ "n_head": 20,
23
+ "n_layer": 36,
24
+ "n_positions": 1024,
25
+ "resid_pdrop": 0.1,
26
+ "summary_activation": null,
27
+ "summary_first_dropout": 0.1,
28
+ "summary_proj_to_labels": true,
29
+ "summary_type": "cls_index",
30
+ "summary_use_proj": true,
31
+ "task_specific_params": {
32
+ "text-generation": {
33
+ "do_sample": true,
34
+ "max_length": 50
35
+ }
36
+ },
37
+ "vocab_size": 50257
38
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model_quantized.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdd8898ce0b7fb7f54042968f2fdb53eaa4d4ba3c78f81ce09d0f609fd7c9b94
3
+ size 1075062658
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
vocab.json ADDED
The diff for this file is too large to render. See raw diff