adithya8 committed on
Commit
ccbfbaf
1 Parent(s): 964e4f7

updated model

Browse files
README.md DELETED
@@ -1,3 +0,0 @@
1
- ---
2
- license: cc
3
- ---
 
 
 
 
config.json CHANGED
@@ -1,14 +1,19 @@
1
  {
2
- "_name_or_path": "/chronos_data/nisoni/analysing_hart_user_states/GPT2_TWT_PT_3June2024/outputs/gpt2_twt_pt_60bs",
3
  "activation_function": "gelu_new",
 
4
  "architectures": [
5
- "GPT2hlcLMHeadModel"
6
  ],
7
  "attn_pdrop": 0.1,
8
  "bos_token_id": 50256,
9
  "embd_pdrop": 0.1,
10
  "eos_token_id": 50256,
 
 
 
11
  "initializer_range": 0.02,
 
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
@@ -17,24 +22,16 @@
17
  "n_inner": null,
18
  "n_layer": 12,
19
  "n_positions": 1024,
20
- "pad_token_id": 50256,
21
- "reorder_and_upcast_attn": false,
22
  "resid_pdrop": 0.1,
23
- "scale_attn_by_inverse_layer_idx": false,
24
- "scale_attn_weights": true,
25
  "summary_activation": null,
26
  "summary_first_dropout": 0.1,
27
  "summary_proj_to_labels": true,
28
  "summary_type": "cls_index",
29
  "summary_use_proj": true,
30
- "task_specific_params": {
31
- "text-generation": {
32
- "do_sample": true,
33
- "max_length": 50
34
- }
35
- },
36
  "torch_dtype": "float32",
37
  "transformers_version": "4.33.1",
38
  "use_cache": true,
 
 
39
  "vocab_size": 50258
40
  }
 
1
  {
2
+ "_name_or_path": "/chronos_data/nisoni/HaRT_Twt_model",
3
  "activation_function": "gelu_new",
4
+ "add_history": true,
5
  "architectures": [
6
+ "HaRTPreTrainedModel"
7
  ],
8
  "attn_pdrop": 0.1,
9
  "bos_token_id": 50256,
10
  "embd_pdrop": 0.1,
11
  "eos_token_id": 50256,
12
+ "extract_layer": 11,
13
+ "freeze_model": false,
14
+ "gradient_checkpointing": false,
15
  "initializer_range": 0.02,
16
+ "layer_ins": 2,
17
  "layer_norm_epsilon": 1e-05,
18
  "model_type": "gpt2",
19
  "n_ctx": 1024,
 
22
  "n_inner": null,
23
  "n_layer": 12,
24
  "n_positions": 1024,
 
 
25
  "resid_pdrop": 0.1,
 
 
26
  "summary_activation": null,
27
  "summary_first_dropout": 0.1,
28
  "summary_proj_to_labels": true,
29
  "summary_type": "cls_index",
30
  "summary_use_proj": true,
 
 
 
 
 
 
31
  "torch_dtype": "float32",
32
  "transformers_version": "4.33.1",
33
  "use_cache": true,
34
+ "use_hart_no_hist": false,
35
+ "use_qh05_wts": false,
36
  "vocab_size": 50258
37
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9018b546d98352c967aded0bc1e6626025839b8846c1a5184228eb6d101b29f2
3
- size 652200033
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:593a35def4af82c3fa0546f068234c483766cc10005bb2acc3c8ef9f27c72b6f
3
+ size 782895249
special_tokens_map.json CHANGED
@@ -1,7 +1,6 @@
1
  {
2
  "bos_token": "<|endoftext|>",
3
  "eos_token": "<|endoftext|>",
4
- "pad_token": "<|endoftext|>",
5
  "sep_token": "<|insep|>",
6
  "unk_token": "<|endoftext|>"
7
  }
 
1
  {
2
  "bos_token": "<|endoftext|>",
3
  "eos_token": "<|endoftext|>",
 
4
  "sep_token": "<|insep|>",
5
  "unk_token": "<|endoftext|>"
6
  }
tokenizer_config.json CHANGED
@@ -1,9 +1,33 @@
1
  {
 
2
  "add_prefix_space": false,
3
- "bos_token": "<|endoftext|>",
 
 
 
 
 
 
 
4
  "clean_up_tokenization_spaces": true,
5
- "eos_token": "<|endoftext|>",
 
 
 
 
 
 
 
 
6
  "model_max_length": 1024,
 
7
  "tokenizer_class": "GPT2Tokenizer",
8
- "unk_token": "<|endoftext|>"
 
 
 
 
 
 
 
9
  }
 
1
  {
2
+ "add_bos_token": false,
3
  "add_prefix_space": false,
4
+ "bos_token": {
5
+ "__type": "AddedToken",
6
+ "content": "<|endoftext|>",
7
+ "lstrip": false,
8
+ "normalized": true,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
  "clean_up_tokenization_spaces": true,
13
+ "eos_token": {
14
+ "__type": "AddedToken",
15
+ "content": "<|endoftext|>",
16
+ "lstrip": false,
17
+ "normalized": true,
18
+ "rstrip": false,
19
+ "single_word": false
20
+ },
21
+ "errors": "replace",
22
  "model_max_length": 1024,
23
+ "pad_token": null,
24
  "tokenizer_class": "GPT2Tokenizer",
25
+ "unk_token": {
26
+ "__type": "AddedToken",
27
+ "content": "<|endoftext|>",
28
+ "lstrip": false,
29
+ "normalized": true,
30
+ "rstrip": false,
31
+ "single_word": false
32
+ }
33
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3480cd5758a54474a91ba1c798474a3993bf335537e6779a563a251720d2655b
3
  size 4091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3822f8ccdb8783bf065a662eda9058a38704d232a74bd8a1eb90eccb80eb2003
3
  size 4091