cavendishlabs committed on
Commit
ff161d7
·
verified ·
1 Parent(s): 5cfc851

Training in progress, step 44

Browse files
adapter_config.json CHANGED
@@ -3,6 +3,8 @@
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "Qwen/Qwen2-0.5B",
5
  "bias": "none",
 
 
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
8
  "init_lora_weights": true,
@@ -11,6 +13,7 @@
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
  "lora_alpha": 16,
 
14
  "lora_dropout": 0.05,
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
@@ -20,8 +23,8 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "q_proj",
24
- "v_proj"
25
  ],
26
  "task_type": "CAUSAL_LM",
27
  "use_dora": false,
 
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "Qwen/Qwen2-0.5B",
5
  "bias": "none",
6
+ "eva_config": null,
7
+ "exclude_modules": null,
8
  "fan_in_fan_out": false,
9
  "inference_mode": true,
10
  "init_lora_weights": true,
 
13
  "layers_to_transform": null,
14
  "loftq_config": {},
15
  "lora_alpha": 16,
16
+ "lora_bias": false,
17
  "lora_dropout": 0.05,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
+ "v_proj",
27
+ "q_proj"
28
  ],
29
  "task_type": "CAUSAL_LM",
30
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a620e25934e469a8b270a2f9922f02e86689b5183d54ffb886e6f878af58466
3
  size 8663400
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a0da76a15c3e0a0dcf3f88ee33d69448ccc91e71e1d8de2c0bb4f4dcc88b369
3
  size 8663400
tokenizer_config.json CHANGED
@@ -35,6 +35,7 @@
35
  "clean_up_tokenization_spaces": false,
36
  "eos_token": "<|endoftext|>",
37
  "errors": "replace",
 
38
  "model_max_length": 32768,
39
  "pad_token": "<|endoftext|>",
40
  "split_special_tokens": false,
 
35
  "clean_up_tokenization_spaces": false,
36
  "eos_token": "<|endoftext|>",
37
  "errors": "replace",
38
+ "extra_special_tokens": {},
39
  "model_max_length": 32768,
40
  "pad_token": "<|endoftext|>",
41
  "split_special_tokens": false,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7aa817f51616ea5d83274cea099ed8dd46559c4750e8d66315b5ce19c85397f1
3
- size 5688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28344a9081919b6de86592f6eb5ee9bd3de7032c10be475bebcacf3dac1ce216
3
+ size 5752