nielsbantilan committed on
Commit
2252f27
1 Parent(s): 78a4041

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -1,14 +1,3 @@
1
  ---
2
- language:
3
- - en
4
- license: apache-2.0
5
- tags:
6
- - pytorch
7
- - causal-lm
8
- - redpajama
9
- - fine-tuning
10
- - wikipedia
11
-
12
  ---
13
-
14
- # RedPajama-INCITE-Base-3B-v1 fine-tuned on wikipedia
 
1
  ---
2
+ library_name: peft
 
 
 
 
 
 
 
 
 
3
  ---
 
 
adapter_config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "base_model_name_or_path": "togethercomputer/RedPajama-INCITE-7B-Chat",
3
+ "bias": "none",
4
+ "fan_in_fan_out": false,
5
+ "inference_mode": true,
6
+ "init_lora_weights": true,
7
+ "layers_pattern": null,
8
+ "layers_to_transform": null,
9
+ "lora_alpha": 16,
10
+ "lora_dropout": 0.05,
11
+ "modules_to_save": null,
12
+ "peft_type": "LORA",
13
+ "r": 8,
14
+ "revision": null,
15
+ "target_modules": [
16
+ "query_key_value"
17
+ ],
18
+ "task_type": "CAUSAL_LM"
19
+ }
adapter_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406
3
+ size 443
checkpoint-50/adapter_model/README.md ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ ---
checkpoint-50/adapter_model/adapter_config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "base_model_name_or_path": "togethercomputer/RedPajama-INCITE-7B-Chat",
3
+ "bias": "none",
4
+ "fan_in_fan_out": false,
5
+ "inference_mode": true,
6
+ "init_lora_weights": true,
7
+ "layers_pattern": null,
8
+ "layers_to_transform": null,
9
+ "lora_alpha": 16,
10
+ "lora_dropout": 0.05,
11
+ "modules_to_save": null,
12
+ "peft_type": "LORA",
13
+ "r": 8,
14
+ "revision": null,
15
+ "target_modules": [
16
+ "query_key_value"
17
+ ],
18
+ "task_type": "CAUSAL_LM"
19
+ }
checkpoint-50/adapter_model/adapter_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406
3
+ size 443
checkpoint-50/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afa9f042c9c4093bbdb30a28b4efe74911eae71f7643db6d3a5670ac1c078c89
3
+ size 8482757
checkpoint-50/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f2208daec5a8ad6d59f722f32cc9f3cf64f1a581a8ccb4f989f92ff5c247dd6
3
+ size 21687
checkpoint-50/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bd37d6d5be7d186e90b1471dde3a7e3798dacddb468d4a83351f7fcaf36fec5
3
+ size 21687
checkpoint-50/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3027312469f9c6fbed5d28a57844e1edd56af1c7761d3a67f783e921e55e133
3
+ size 21687
checkpoint-50/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1ab6e962803634eedfc7404ea6dcc78c6484774ded3801821ffb9a273a05be5
3
+ size 21687
checkpoint-50/rng_state_4.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e4b5a4e0d43915af261d0756dc377b6cab9110b165c415734817dcf1d6f64b6
3
+ size 21687
checkpoint-50/rng_state_5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4654cb0101527e78199161270991c20893a1244ca1236166725f2dd84c64fcc9
3
+ size 21687
checkpoint-50/rng_state_6.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff39c29de1d03aa674c23fecdbf8243369122193600ed49de91a90174f40844a
3
+ size 21687
checkpoint-50/rng_state_7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48e736ffaab1a27035ef05150913a0726356fc6cfa9e5074043d02eaa91824f8
3
+ size 21687
checkpoint-50/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfa3bcfad6548e955614aa66924075e0bfa36d4a9baf6cf6190c3fd577b6da91
3
+ size 557
checkpoint-50/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4267400369983b1274b53d4bee44860f806fbc7d36c9b08d8df3dcaf0049b87d
3
+ size 627
checkpoint-50/trainer_state.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 0.015455950540958269,
5
+ "global_step": 50,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.01,
12
+ "learning_rate": 6.91341716182545e-05,
13
+ "loss": 2.4205,
14
+ "step": 20
15
+ },
16
+ {
17
+ "epoch": 0.01,
18
+ "learning_rate": 1.0332332985438248e-05,
19
+ "loss": 1.2875,
20
+ "step": 40
21
+ }
22
+ ],
23
+ "max_steps": 50,
24
+ "num_train_epochs": 1,
25
+ "total_flos": 6696347264614400.0,
26
+ "trial_name": null,
27
+ "trial_params": null
28
+ }
checkpoint-50/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:390f5383386edfc387592f60849b35e1b737eade925308dba6e13c354bc3f549
3
+ size 3963