Training in progress, step 10
Browse files- 26_10_23_config_test_3.csv +1 -1
- 26_10_23_results_real_3.csv +2 -1
- README.md +13 -0
- adapter_model.bin +1 -1
- adapter_model.safetensors +1 -1
- proc_dataset.csv +0 -0
- training_args.bin +1 -1
26_10_23_config_test_3.csv
CHANGED
@@ -3,6 +3,6 @@ run_number,comment,peformed_already,num_train_epochs,max_tokens,temperature,stop
|
|
3 |
2,lemmatization set True,True,2,100,0.8,False,False,False,True
|
4 |
3,stemming set True,True,2,100,0.8,False,False,True,False
|
5 |
4,classification_of_valuems set True,True,2,100,0.8,False,True,False,False
|
6 |
-
5,lemmatization set True stemming set True classification_of_valuems set True,
|
7 |
6,lemmatization set True classification_of_valuems set True,False,2,100,0.8,False,True,False,True
|
8 |
7,lemmatization set True stemming set True classification_of_valuems set True,False,2,100,0.8,False,True,True,True
|
|
|
3 |
2,lemmatization set True,True,2,100,0.8,False,False,False,True
|
4 |
3,stemming set True,True,2,100,0.8,False,False,True,False
|
5 |
4,classification_of_valuems set True,True,2,100,0.8,False,True,False,False
|
6 |
+
5,lemmatization set True stemming set True classification_of_valuems set True,True,2,100,0.8,False,True,True,True
|
7 |
6,lemmatization set True classification_of_valuems set True,False,2,100,0.8,False,True,False,True
|
8 |
7,lemmatization set True stemming set True classification_of_valuems set True,False,2,100,0.8,False,True,True,True
|
26_10_23_results_real_3.csv
CHANGED
@@ -3,4 +3,5 @@ run_number,items_per_minute,changed_settings,total_time_taken,rouge_scores_unnes
|
|
3 |
2,1536.0607907581125,lemmatization set True,17.186819791793823,0,0.214089850397903,0.318702425435426,0.2423715028093075,0.2529693313991745,0.3585456885960055,0.2769754910708834,0.2936855415126434,0.3948906866601206,0.3139260215675037,0.0750408604918147,0.0993313642783126,0.0806385046330855,0.0998362391572985,0.1241065730842655,0.1044138796128328,0.1271034884820783,0.1499837386497416,0.1290391381032435,0.5,0.5,0.5
|
4 |
3,1518.4399626994298,stemming set True,17.38626527786255,0,0.1178075851397331,0.1964903653343984,0.137917383716792,0.1453055143811142,0.2315236059515145,0.1668826618900411,0.1755426478710371,0.2662609300754107,0.1952669585988578,0.0248398335210917,0.0377277461104543,0.0282191244695968,0.0398256113302351,0.0555684230999425,0.0432994464743569,0.056346867998003,0.0743205476107291,0.0594836650305486,0.25,0.25,0.25
|
5 |
4,1525.602524101584,classification_of_valuems set True,17.304638385772705,0,0.3449559795118336,0.3423341666457499,0.3223067218438548,0.3962323417858379,0.3934280156800367,0.3705820791169619,0.4480554100301472,0.4472379094634592,0.4191781582462838,0.1924640322240557,0.1864412220397102,0.1791588870738077,0.2322731554369229,0.2249807377601852,0.2130668974234288,0.275524472174082,0.267281230315844,0.2520826707151871,0.25,0.25,0.25
|
6 |
-
5,
|
|
|
|
3 |
2,1536.0607907581125,lemmatization set True,17.186819791793823,0,0.214089850397903,0.318702425435426,0.2423715028093075,0.2529693313991745,0.3585456885960055,0.2769754910708834,0.2936855415126434,0.3948906866601206,0.3139260215675037,0.0750408604918147,0.0993313642783126,0.0806385046330855,0.0998362391572985,0.1241065730842655,0.1044138796128328,0.1271034884820783,0.1499837386497416,0.1290391381032435,0.5,0.5,0.5
|
4 |
3,1518.4399626994298,stemming set True,17.38626527786255,0,0.1178075851397331,0.1964903653343984,0.137917383716792,0.1453055143811142,0.2315236059515145,0.1668826618900411,0.1755426478710371,0.2662609300754107,0.1952669585988578,0.0248398335210917,0.0377277461104543,0.0282191244695968,0.0398256113302351,0.0555684230999425,0.0432994464743569,0.056346867998003,0.0743205476107291,0.0594836650305486,0.25,0.25,0.25
|
5 |
4,1525.602524101584,classification_of_valuems set True,17.304638385772705,0,0.3449559795118336,0.3423341666457499,0.3223067218438548,0.3962323417858379,0.3934280156800367,0.3705820791169619,0.4480554100301472,0.4472379094634592,0.4191781582462838,0.1924640322240557,0.1864412220397102,0.1791588870738077,0.2322731554369229,0.2249807377601852,0.2130668974234288,0.275524472174082,0.267281230315844,0.2520826707151871,0.25,0.25,0.25
|
6 |
+
5,1526.1514943613795,lemmatization set True stemming set True classification_of_valuems set True,17.29841375350952,0,0.2740090800292036,0.3255265414032295,0.2775650458916542,0.3242606066397121,0.382074138505741,0.3267769081728278,0.3772870132781871,0.4458722947774239,0.3791647882107381,0.1589738558026723,0.1948121530040918,0.163589425650448,0.197346401556911,0.2400173323974756,0.2012985648757239,0.2417203208425002,0.291225773302693,0.2448890209857868,0.5,0.5,0.5
|
7 |
+
6,0.0,0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
|
README.md
CHANGED
@@ -832,6 +832,18 @@ The following `bitsandbytes` quantization config was used during training:
|
|
832 |
- bnb_4bit_use_double_quant: True
|
833 |
- bnb_4bit_compute_dtype: bfloat16
|
834 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
835 |
The following `bitsandbytes` quantization config was used during training:
|
836 |
- quant_method: bitsandbytes
|
837 |
- load_in_8bit: False
|
@@ -914,5 +926,6 @@ The following `bitsandbytes` quantization config was used during training:
|
|
914 |
- PEFT 0.5.0
|
915 |
- PEFT 0.5.0
|
916 |
- PEFT 0.5.0
|
|
|
917 |
|
918 |
- PEFT 0.5.0
|
|
|
832 |
- bnb_4bit_use_double_quant: True
|
833 |
- bnb_4bit_compute_dtype: bfloat16
|
834 |
|
835 |
+
The following `bitsandbytes` quantization config was used during training:
|
836 |
+
- quant_method: bitsandbytes
|
837 |
+
- load_in_8bit: False
|
838 |
+
- load_in_4bit: True
|
839 |
+
- llm_int8_threshold: 6.0
|
840 |
+
- llm_int8_skip_modules: None
|
841 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
842 |
+
- llm_int8_has_fp16_weight: False
|
843 |
+
- bnb_4bit_quant_type: nf4
|
844 |
+
- bnb_4bit_use_double_quant: True
|
845 |
+
- bnb_4bit_compute_dtype: bfloat16
|
846 |
+
|
847 |
The following `bitsandbytes` quantization config was used during training:
|
848 |
- quant_method: bitsandbytes
|
849 |
- load_in_8bit: False
|
|
|
926 |
- PEFT 0.5.0
|
927 |
- PEFT 0.5.0
|
928 |
- PEFT 0.5.0
|
929 |
+
- PEFT 0.5.0
|
930 |
|
931 |
- PEFT 0.5.0
|
adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 100733709
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7292753dcf5912ec2758e47b4f2dccab7520d96d9d76a7c7094f1735d567b353
|
3 |
size 100733709
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 100690288
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7c0ddf681cf1992628abc7cace21abdd86412e9b2f4906f1fbec5340f41caf4
|
3 |
size 100690288
|
proc_dataset.csv
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4283
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c9f083b19d53a4b3010039d85e9ef9eb625a60a5654cac57880128a4c424a91
|
3 |
size 4283
|