bogdancazan
/

t5-base-newsela-biendata-with-domain-adaptation

Text2Text Generation

text-generation-inference

Inference Endpoints

Model card | Files and versions | Community

bogdancazan committed on Jun 25, 2023

Commit

1a4efb3

•

1 Parent(s): 1445bdd

Update README.md

Files changed (1) hide show

README.md +11 -11

README.md CHANGED Viewed

@@ -1,5 +1,5 @@
 training_args = TrainingArguments(
-    output_dir='t5-base-newsela-biendata-with-domain-adaptation',
     num_train_epochs=20,
     warmup_steps=250,
     per_device_train_batch_size=BATCH_SIZE,
@@ -10,13 +10,13 @@ training_args = TrainingArguments(
 )
 Step	Training Loss
-500	31.865400
-1000	37.290400
-1500	18.697100
-2000	4.517400
-2500	2.976500
-3000	2.558100
-3500	2.305200
-4000	2.187100
-4500	2.125000
-TrainOutput(global_step=4640, training_loss=11.326794861102925, metrics={'train_runtime': 5055.1704, 'train_samples_per_second': 58.688, 'train_steps_per_second': 0.918, 'total_flos': 0.0, 'train_loss': 11.326794861102925, 'epoch': 20.0})

 training_args = TrainingArguments(
+    output_dir='t5-base-wikilarge-newsela-with-domain-adaptation',
     num_train_epochs=20,
     warmup_steps=250,
     per_device_train_batch_size=BATCH_SIZE,
 )
 Step	Training Loss
+500	4.184500
+1000	2.470900
+1500	2.128900
+2000	1.951600
+2500	1.834400
+3000	1.755800
+3500	1.701800
+4000	1.656300
+4500	1.628800
+TrainOutput(global_step=4640, training_loss=2.1286644540984057, metrics={'train_runtime': 4090.6694, 'train_samples_per_second': 72.526, 'train_steps_per_second': 1.134, 'total_flos': 0.0, 'train_loss': 2.1286644540984057, 'epoch': 20.0})