bogdancazan committed on
Commit
1b7276f
1 Parent(s): 2810bdc

Create README.md

Browse files
Files changed (1) hide show
  1. README.md +18 -0
README.md ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ training_args = TrainingArguments(
2
+ output_dir='t5-small-newsela-biendata-with-domain-adaptation',
3
+ num_train_epochs=20,
4
+ warmup_steps=250,
5
+ per_device_train_batch_size=BATCH_SIZE,
6
+ weight_decay=0.01,
7
+ learning_rate=2e-4,
8
+ fp16=True,
9
+ optim="adafactor",
10
+ )
11
+
12
+
13
+ Step Training Loss
14
+ 500 35.466600
15
+ 1000 25.795400
16
+ 1500 10.923200
17
+ 2000 4.515500
18
+ TrainOutput(global_step=2320, training_loss=16.92537920721646, metrics={'train_runtime': 628.0033, 'train_samples_per_second': 472.418, 'train_steps_per_second': 3.694, 'total_flos': 0.0, 'train_loss': 16.92537920721646, 'epoch': 20.0})