Training in progress, step 10

Browse files

Files changed (7) hide show

26_10_23_config_test_3.csv +1 -1
26_10_23_results_real_3.csv +2 -1
README.md +13 -0
adapter_model.bin +1 -1
adapter_model.safetensors +1 -1
proc_dataset.csv +0 -0
training_args.bin +1 -1

26_10_23_config_test_3.csv CHANGED Viewed

@@ -3,6 +3,6 @@ run_number,comment,peformed_already,num_train_epochs,max_tokens,temperature,stop
 2,lemmatization set True,True,2,100,0.8,False,False,False,True
 3,stemming set True,True,2,100,0.8,False,False,True,False
 4,classification_of_valuems set True,True,2,100,0.8,False,True,False,False
-5,lemmatization set True    stemming set True    classification_of_valuems set True,False,2,100,0.8,False,True,True,True
 6,lemmatization set True    classification_of_valuems set True,False,2,100,0.8,False,True,False,True
 7,lemmatization set True    stemming set True    classification_of_valuems set True,False,2,100,0.8,False,True,True,True

 2,lemmatization set True,True,2,100,0.8,False,False,False,True
 3,stemming set True,True,2,100,0.8,False,False,True,False
 4,classification_of_valuems set True,True,2,100,0.8,False,True,False,False
+5,lemmatization set True    stemming set True    classification_of_valuems set True,True,2,100,0.8,False,True,True,True
 6,lemmatization set True    classification_of_valuems set True,False,2,100,0.8,False,True,False,True
 7,lemmatization set True    stemming set True    classification_of_valuems set True,False,2,100,0.8,False,True,True,True

26_10_23_results_real_3.csv CHANGED Viewed

@@ -3,4 +3,5 @@ run_number,items_per_minute,changed_settings,total_time_taken,rouge_scores_unnes
 2,1536.0607907581125,lemmatization set True,17.186819791793823,0,0.214089850397903,0.318702425435426,0.2423715028093075,0.2529693313991745,0.3585456885960055,0.2769754910708834,0.2936855415126434,0.3948906866601206,0.3139260215675037,0.0750408604918147,0.0993313642783126,0.0806385046330855,0.0998362391572985,0.1241065730842655,0.1044138796128328,0.1271034884820783,0.1499837386497416,0.1290391381032435,0.5,0.5,0.5
 3,1518.4399626994298,stemming set True,17.38626527786255,0,0.1178075851397331,0.1964903653343984,0.137917383716792,0.1453055143811142,0.2315236059515145,0.1668826618900411,0.1755426478710371,0.2662609300754107,0.1952669585988578,0.0248398335210917,0.0377277461104543,0.0282191244695968,0.0398256113302351,0.0555684230999425,0.0432994464743569,0.056346867998003,0.0743205476107291,0.0594836650305486,0.25,0.25,0.25
 4,1525.602524101584,classification_of_valuems set True,17.304638385772705,0,0.3449559795118336,0.3423341666457499,0.3223067218438548,0.3962323417858379,0.3934280156800367,0.3705820791169619,0.4480554100301472,0.4472379094634592,0.4191781582462838,0.1924640322240557,0.1864412220397102,0.1791588870738077,0.2322731554369229,0.2249807377601852,0.2130668974234288,0.275524472174082,0.267281230315844,0.2520826707151871,0.25,0.25,0.25
-5,0.0,0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0

 2,1536.0607907581125,lemmatization set True,17.186819791793823,0,0.214089850397903,0.318702425435426,0.2423715028093075,0.2529693313991745,0.3585456885960055,0.2769754910708834,0.2936855415126434,0.3948906866601206,0.3139260215675037,0.0750408604918147,0.0993313642783126,0.0806385046330855,0.0998362391572985,0.1241065730842655,0.1044138796128328,0.1271034884820783,0.1499837386497416,0.1290391381032435,0.5,0.5,0.5
 3,1518.4399626994298,stemming set True,17.38626527786255,0,0.1178075851397331,0.1964903653343984,0.137917383716792,0.1453055143811142,0.2315236059515145,0.1668826618900411,0.1755426478710371,0.2662609300754107,0.1952669585988578,0.0248398335210917,0.0377277461104543,0.0282191244695968,0.0398256113302351,0.0555684230999425,0.0432994464743569,0.056346867998003,0.0743205476107291,0.0594836650305486,0.25,0.25,0.25
 4,1525.602524101584,classification_of_valuems set True,17.304638385772705,0,0.3449559795118336,0.3423341666457499,0.3223067218438548,0.3962323417858379,0.3934280156800367,0.3705820791169619,0.4480554100301472,0.4472379094634592,0.4191781582462838,0.1924640322240557,0.1864412220397102,0.1791588870738077,0.2322731554369229,0.2249807377601852,0.2130668974234288,0.275524472174082,0.267281230315844,0.2520826707151871,0.25,0.25,0.25
+5,1526.1514943613795,lemmatization set True    stemming set True    classification_of_valuems set True,17.29841375350952,0,0.2740090800292036,0.3255265414032295,0.2775650458916542,0.3242606066397121,0.382074138505741,0.3267769081728278,0.3772870132781871,0.4458722947774239,0.3791647882107381,0.1589738558026723,0.1948121530040918,0.163589425650448,0.197346401556911,0.2400173323974756,0.2012985648757239,0.2417203208425002,0.291225773302693,0.2448890209857868,0.5,0.5,0.5
+6,0.0,0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0

README.md CHANGED Viewed

@@ -832,6 +832,18 @@ The following `bitsandbytes` quantization config was used during training:
 - bnb_4bit_use_double_quant: True
 - bnb_4bit_compute_dtype: bfloat16
 The following `bitsandbytes` quantization config was used during training:
 - quant_method: bitsandbytes
 - load_in_8bit: False
@@ -914,5 +926,6 @@ The following `bitsandbytes` quantization config was used during training:
 - PEFT 0.5.0
 - PEFT 0.5.0
 - PEFT 0.5.0
 - PEFT 0.5.0

 - bnb_4bit_use_double_quant: True
 - bnb_4bit_compute_dtype: bfloat16
+The following `bitsandbytes` quantization config was used during training:
+- quant_method: bitsandbytes
+- load_in_8bit: False
+- load_in_4bit: True
+- llm_int8_threshold: 6.0
+- llm_int8_skip_modules: None
+- llm_int8_enable_fp32_cpu_offload: False
+- llm_int8_has_fp16_weight: False
+- bnb_4bit_quant_type: nf4
+- bnb_4bit_use_double_quant: True
+- bnb_4bit_compute_dtype: bfloat16
 The following `bitsandbytes` quantization config was used during training:
 - quant_method: bitsandbytes
 - load_in_8bit: False
 - PEFT 0.5.0
 - PEFT 0.5.0
 - PEFT 0.5.0
+- PEFT 0.5.0
 - PEFT 0.5.0

adapter_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3f344bfe4e1e78d1bc1b1eecd338cfe910bef2472c0b5f501dc7c8c0a10e235a
 size 100733709

 version https://git-lfs.github.com/spec/v1
+oid sha256:7292753dcf5912ec2758e47b4f2dccab7520d96d9d76a7c7094f1735d567b353
 size 100733709

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8435a3c8ea4c47af962e3a4e3149f7f9999232c4a6c060495e93dc50e42f81f9
 size 100690288

 version https://git-lfs.github.com/spec/v1
+oid sha256:c7c0ddf681cf1992628abc7cace21abdd86412e9b2f4906f1fbec5340f41caf4
 size 100690288

proc_dataset.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9c9a7b8a52ad3c9d13c87375ac4a8a52268e28d39ed12e1b0ba1d8b28fb101fc
 size 4283

 version https://git-lfs.github.com/spec/v1
+oid sha256:1c9f083b19d53a4b3010039d85e9ef9eb625a60a5654cac57880128a4c424a91
 size 4283