deuswoof commited on
Commit
b4ee6ad
·
1 Parent(s): 1bdfb19

Training in progress, step 10

Browse files
26_10_23_config_test_3.csv CHANGED
@@ -3,6 +3,6 @@ run_number,comment,peformed_already,num_train_epochs,max_tokens,temperature,stop
3
  2,lemmatization set True,True,2,100,0.8,False,False,False,True
4
  3,stemming set True,True,2,100,0.8,False,False,True,False
5
  4,classification_of_valuems set True,True,2,100,0.8,False,True,False,False
6
- 5,lemmatization set True stemming set True classification_of_valuems set True,False,2,100,0.8,False,True,True,True
7
  6,lemmatization set True classification_of_valuems set True,False,2,100,0.8,False,True,False,True
8
  7,lemmatization set True stemming set True classification_of_valuems set True,False,2,100,0.8,False,True,True,True
 
3
  2,lemmatization set True,True,2,100,0.8,False,False,False,True
4
  3,stemming set True,True,2,100,0.8,False,False,True,False
5
  4,classification_of_valuems set True,True,2,100,0.8,False,True,False,False
6
+ 5,lemmatization set True stemming set True classification_of_valuems set True,True,2,100,0.8,False,True,True,True
7
  6,lemmatization set True classification_of_valuems set True,False,2,100,0.8,False,True,False,True
8
  7,lemmatization set True stemming set True classification_of_valuems set True,False,2,100,0.8,False,True,True,True
26_10_23_results_real_3.csv CHANGED
@@ -3,4 +3,5 @@ run_number,items_per_minute,changed_settings,total_time_taken,rouge_scores_unnes
3
  2,1536.0607907581125,lemmatization set True,17.186819791793823,0,0.214089850397903,0.318702425435426,0.2423715028093075,0.2529693313991745,0.3585456885960055,0.2769754910708834,0.2936855415126434,0.3948906866601206,0.3139260215675037,0.0750408604918147,0.0993313642783126,0.0806385046330855,0.0998362391572985,0.1241065730842655,0.1044138796128328,0.1271034884820783,0.1499837386497416,0.1290391381032435,0.5,0.5,0.5
4
  3,1518.4399626994298,stemming set True,17.38626527786255,0,0.1178075851397331,0.1964903653343984,0.137917383716792,0.1453055143811142,0.2315236059515145,0.1668826618900411,0.1755426478710371,0.2662609300754107,0.1952669585988578,0.0248398335210917,0.0377277461104543,0.0282191244695968,0.0398256113302351,0.0555684230999425,0.0432994464743569,0.056346867998003,0.0743205476107291,0.0594836650305486,0.25,0.25,0.25
5
  4,1525.602524101584,classification_of_valuems set True,17.304638385772705,0,0.3449559795118336,0.3423341666457499,0.3223067218438548,0.3962323417858379,0.3934280156800367,0.3705820791169619,0.4480554100301472,0.4472379094634592,0.4191781582462838,0.1924640322240557,0.1864412220397102,0.1791588870738077,0.2322731554369229,0.2249807377601852,0.2130668974234288,0.275524472174082,0.267281230315844,0.2520826707151871,0.25,0.25,0.25
6
- 5,0.0,0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
 
 
3
  2,1536.0607907581125,lemmatization set True,17.186819791793823,0,0.214089850397903,0.318702425435426,0.2423715028093075,0.2529693313991745,0.3585456885960055,0.2769754910708834,0.2936855415126434,0.3948906866601206,0.3139260215675037,0.0750408604918147,0.0993313642783126,0.0806385046330855,0.0998362391572985,0.1241065730842655,0.1044138796128328,0.1271034884820783,0.1499837386497416,0.1290391381032435,0.5,0.5,0.5
4
  3,1518.4399626994298,stemming set True,17.38626527786255,0,0.1178075851397331,0.1964903653343984,0.137917383716792,0.1453055143811142,0.2315236059515145,0.1668826618900411,0.1755426478710371,0.2662609300754107,0.1952669585988578,0.0248398335210917,0.0377277461104543,0.0282191244695968,0.0398256113302351,0.0555684230999425,0.0432994464743569,0.056346867998003,0.0743205476107291,0.0594836650305486,0.25,0.25,0.25
5
  4,1525.602524101584,classification_of_valuems set True,17.304638385772705,0,0.3449559795118336,0.3423341666457499,0.3223067218438548,0.3962323417858379,0.3934280156800367,0.3705820791169619,0.4480554100301472,0.4472379094634592,0.4191781582462838,0.1924640322240557,0.1864412220397102,0.1791588870738077,0.2322731554369229,0.2249807377601852,0.2130668974234288,0.275524472174082,0.267281230315844,0.2520826707151871,0.25,0.25,0.25
6
+ 5,1526.1514943613795,lemmatization set True stemming set True classification_of_valuems set True,17.29841375350952,0,0.2740090800292036,0.3255265414032295,0.2775650458916542,0.3242606066397121,0.382074138505741,0.3267769081728278,0.3772870132781871,0.4458722947774239,0.3791647882107381,0.1589738558026723,0.1948121530040918,0.163589425650448,0.197346401556911,0.2400173323974756,0.2012985648757239,0.2417203208425002,0.291225773302693,0.2448890209857868,0.5,0.5,0.5
7
+ 6,0.0,0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
README.md CHANGED
@@ -832,6 +832,18 @@ The following `bitsandbytes` quantization config was used during training:
832
  - bnb_4bit_use_double_quant: True
833
  - bnb_4bit_compute_dtype: bfloat16
834
 
 
 
 
 
 
 
 
 
 
 
 
 
835
  The following `bitsandbytes` quantization config was used during training:
836
  - quant_method: bitsandbytes
837
  - load_in_8bit: False
@@ -914,5 +926,6 @@ The following `bitsandbytes` quantization config was used during training:
914
  - PEFT 0.5.0
915
  - PEFT 0.5.0
916
  - PEFT 0.5.0
 
917
 
918
  - PEFT 0.5.0
 
832
  - bnb_4bit_use_double_quant: True
833
  - bnb_4bit_compute_dtype: bfloat16
834
 
835
+ The following `bitsandbytes` quantization config was used during training:
836
+ - quant_method: bitsandbytes
837
+ - load_in_8bit: False
838
+ - load_in_4bit: True
839
+ - llm_int8_threshold: 6.0
840
+ - llm_int8_skip_modules: None
841
+ - llm_int8_enable_fp32_cpu_offload: False
842
+ - llm_int8_has_fp16_weight: False
843
+ - bnb_4bit_quant_type: nf4
844
+ - bnb_4bit_use_double_quant: True
845
+ - bnb_4bit_compute_dtype: bfloat16
846
+
847
  The following `bitsandbytes` quantization config was used during training:
848
  - quant_method: bitsandbytes
849
  - load_in_8bit: False
 
926
  - PEFT 0.5.0
927
  - PEFT 0.5.0
928
  - PEFT 0.5.0
929
+ - PEFT 0.5.0
930
 
931
  - PEFT 0.5.0
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f344bfe4e1e78d1bc1b1eecd338cfe910bef2472c0b5f501dc7c8c0a10e235a
3
  size 100733709
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7292753dcf5912ec2758e47b4f2dccab7520d96d9d76a7c7094f1735d567b353
3
  size 100733709
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8435a3c8ea4c47af962e3a4e3149f7f9999232c4a6c060495e93dc50e42f81f9
3
  size 100690288
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7c0ddf681cf1992628abc7cace21abdd86412e9b2f4906f1fbec5340f41caf4
3
  size 100690288
proc_dataset.csv CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c9a7b8a52ad3c9d13c87375ac4a8a52268e28d39ed12e1b0ba1d8b28fb101fc
3
  size 4283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c9f083b19d53a4b3010039d85e9ef9eb625a60a5654cac57880128a4c424a91
3
  size 4283