nealchandra committed on Jul 30, 2023

Commit

17763bd

•

1 Parent(s): d6e7c3c

Upload folder using huggingface_hub

Files changed (19) hide show

README.md ADDED Viewed

+---
+library_name: peft
+---
+## Training procedure
+The following `bitsandbytes` quantization config was used during training:
+- load_in_8bit: False
+- load_in_4bit: True
+- llm_int8_threshold: 6.0
+- llm_int8_skip_modules: None
+- llm_int8_enable_fp32_cpu_offload: False
+- llm_int8_has_fp16_weight: False
+- bnb_4bit_quant_type: nf4
+- bnb_4bit_use_double_quant: True
+- bnb_4bit_compute_dtype: bfloat16
+### Framework versions
+- PEFT 0.4.0.dev0

adapter_config.json ADDED Viewed

+{
+  "base_model_name_or_path": "/models/meta-llama--Llama-2-7b-hf",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 16,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 16,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "k_proj",
+    "v_proj",
+    "o_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

adapter_model.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:5b8c852a367764f99dbb7294c1fc6c34b970cf042147e307d81d0f2d70f93dff
+size 67201357

checkpoint-5500/README.md ADDED Viewed

+---
+library_name: peft
+---
+## Training procedure
+The following `bitsandbytes` quantization config was used during training:
+- load_in_8bit: False
+- load_in_4bit: True
+- llm_int8_threshold: 6.0
+- llm_int8_skip_modules: None
+- llm_int8_enable_fp32_cpu_offload: False
+- llm_int8_has_fp16_weight: False
+- bnb_4bit_quant_type: nf4
+- bnb_4bit_use_double_quant: True
+- bnb_4bit_compute_dtype: bfloat16
+### Framework versions
+- PEFT 0.4.0.dev0

checkpoint-5500/adapter_config.json ADDED Viewed

+{
+  "base_model_name_or_path": "/models/meta-llama--Llama-2-7b-hf",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 16,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 16,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "k_proj",
+    "v_proj",
+    "o_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-5500/adapter_model.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:2501d577aa3c13e6872404d1481ef5ccb30fe8d6703a1af7bd27211102db505a
+size 67201357

checkpoint-5500/optimizer.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:1a7e81bcd9f627990655611bed92a7b57e46859f663d2868f50988fdc1ab53f2
+size 134369669

checkpoint-5500/rng_state.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:9876379ec43070a3a6a1e012404169dfa1dca5d431f07c93b953dd0393eda2e8
+size 14575

checkpoint-5500/scheduler.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:7310504c6dd483294102fd78d4a4a719dd62d0ce6001a85adca5ec1f74a5a007
+size 627

checkpoint-5500/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-5500/training_args.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8a2b74f33e2400f69010addfd67de997497948e45eb5ba3212e8a370f414074b
+size 4091

checkpoint-6000/README.md ADDED Viewed

+---
+library_name: peft
+---
+## Training procedure
+The following `bitsandbytes` quantization config was used during training:
+- load_in_8bit: False
+- load_in_4bit: True
+- llm_int8_threshold: 6.0
+- llm_int8_skip_modules: None
+- llm_int8_enable_fp32_cpu_offload: False
+- llm_int8_has_fp16_weight: False
+- bnb_4bit_quant_type: nf4
+- bnb_4bit_use_double_quant: True
+- bnb_4bit_compute_dtype: bfloat16
+### Framework versions
+- PEFT 0.4.0.dev0

checkpoint-6000/adapter_config.json ADDED Viewed

+{
+  "base_model_name_or_path": "/models/meta-llama--Llama-2-7b-hf",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "lora_alpha": 16,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 16,
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "k_proj",
+    "v_proj",
+    "o_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-6000/adapter_model.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:70dab0cf48e114f703aa36ff4717f9dbd09d37e8df37adc1420a9237b2b7b840
+size 67201357

checkpoint-6000/optimizer.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3943be26870cbb1d156afe3c1d5e92ad2020a3ac04fb648175c5ad7870a27c3b
+size 134369669

checkpoint-6000/rng_state.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:0733e7faa251c5aeb870b25a736f65ff3885a13e5ae22b7439a685ceeab2f1c7
+size 14575

checkpoint-6000/scheduler.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a7a323739148b73b653af5d001bd55dbb43af0a7e1bbbb51eb25ab1c00661365
+size 627

checkpoint-6000/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-6000/training_args.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8a2b74f33e2400f69010addfd67de997497948e45eb5ba3212e8a370f414074b
+size 4091