beplay committed on
Commit
3e7df00
1 Parent(s): c480d54

Training in progress, epoch 0

Browse files
adapter_config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "facebook/opt-125m",
5
+ "bias": "none",
6
+ "fan_in_fan_out": false,
7
+ "inference_mode": true,
8
+ "init_lora_weights": true,
9
+ "layer_replication": null,
10
+ "layers_pattern": null,
11
+ "layers_to_transform": null,
12
+ "loftq_config": {},
13
+ "lora_alpha": 128,
14
+ "lora_dropout": 0.05,
15
+ "megatron_config": null,
16
+ "megatron_core": "megatron.core",
17
+ "modules_to_save": null,
18
+ "peft_type": "LORA",
19
+ "r": 256,
20
+ "rank_pattern": {},
21
+ "revision": null,
22
+ "target_modules": [
23
+ "q_proj",
24
+ "fc2",
25
+ "k_proj",
26
+ "out_proj",
27
+ "v_proj",
28
+ "fc1"
29
+ ],
30
+ "task_type": "CAUSAL_LM",
31
+ "use_dora": false,
32
+ "use_rslora": false
33
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4954052ddd512b5809e7052691755651aaf943eb599a2f1cc54b15aaef38b4c1
3
+ size 478730240
added_tokens.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "<|im_end|>": 50266,
3
+ "<|im_start|>": 50265
4
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
runs/Sep13_09-49-40_sifs-dgx/events.out.tfevents.1726213790.sifs-dgx.33.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c8d452405d2681c8ef548b4d4d385e1bdcf4661ac089f48e827fc2c87cf0ffc
3
+ size 5898
runs/Sep13_12-36-10_sifs-dgx/events.out.tfevents.1726223774.sifs-dgx.33.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:351114d2ca8cd274297223ce01d66d452850f34dea954e137b31ea78d1afe32f
3
+ size 5917
runs/Sep13_12-46-15_sifs-dgx/events.out.tfevents.1726224378.sifs-dgx.33.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:853592b299c1177ef4abcfdf768ef1e51b6b6e02c45bad2c006ae67a893454ce
3
+ size 5917
runs/Sep13_12-47-38_sifs-dgx/events.out.tfevents.1726224462.sifs-dgx.33.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55417a5b114a1e19e37bacba6f07a7d05b5720361bd30de1947c61ff4e32ec8d
3
+ size 5917
runs/Sep13_12-54-40_sifs-dgx/events.out.tfevents.1726224883.sifs-dgx.33.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77025fb4229eff04ae6a59d2dd0299e37e291a4d0acf35d509e7bdece209bea4
3
+ size 7780
special_tokens_map.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ {
4
+ "content": "<|im_start|>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ },
10
+ {
11
+ "content": "<|im_end|>",
12
+ "lstrip": false,
13
+ "normalized": false,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ }
17
+ ],
18
+ "bos_token": "<|im_start|>",
19
+ "eos_token": "<|im_end|>",
20
+ "pad_token": "<|im_end|>",
21
+ "unk_token": {
22
+ "content": "</s>",
23
+ "lstrip": false,
24
+ "normalized": true,
25
+ "rstrip": false,
26
+ "single_word": false
27
+ }
28
+ }
test_dataset.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_prefix_space": false,
4
+ "added_tokens_decoder": {
5
+ "1": {
6
+ "content": "<pad>",
7
+ "lstrip": false,
8
+ "normalized": true,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "2": {
14
+ "content": "</s>",
15
+ "lstrip": false,
16
+ "normalized": true,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "50265": {
22
+ "content": "<|im_start|>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ },
29
+ "50266": {
30
+ "content": "<|im_end|>",
31
+ "lstrip": false,
32
+ "normalized": false,
33
+ "rstrip": false,
34
+ "single_word": false,
35
+ "special": true
36
+ }
37
+ },
38
+ "additional_special_tokens": [
39
+ "<|im_start|>",
40
+ "<|im_end|>"
41
+ ],
42
+ "bos_token": "<|im_start|>",
43
+ "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
44
+ "clean_up_tokenization_spaces": true,
45
+ "eos_token": "<|im_end|>",
46
+ "errors": "replace",
47
+ "model_max_length": 1000000000000000019884624838656,
48
+ "pad_token": "<|im_end|>",
49
+ "tokenizer_class": "GPT2Tokenizer",
50
+ "unk_token": "</s>"
51
+ }
train_dataset.json ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4df05743fd778f8813b5d8b536e839b57fd6527ef38b4a272d0a27ff6d67ce62
3
+ size 5560
vocab.json ADDED
The diff for this file is too large to render. See raw diff