Update README.md
Browse files
README.md
CHANGED
|
@@ -9,6 +9,26 @@ metrics:
|
|
| 9 |
pipeline_tag: summarization
|
| 10 |
---
|
| 11 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 12 |
# Training Results
|
| 13 |
|
| 14 |
| Epoch | Training Loss | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Bleu | Gen Len |
|
|
|
|
| 9 |
pipeline_tag: summarization
|
| 10 |
---
|
| 11 |
|
| 12 |
+
# Hyperparameters
|
| 13 |
+
learning_rate=2e-5
|
| 14 |
+
per_device_train_batch_size=14
|
| 15 |
+
per_device_eval_batch_size=14
|
| 16 |
+
weight_decay=0.01
|
| 17 |
+
save_total_limit=3
|
| 18 |
+
num_train_epochs=3
|
| 19 |
+
predict_with_generate=True
|
| 20 |
+
fp16=True
|
| 21 |
+
|
| 22 |
+
# Training Output
|
| 23 |
+
global_step=3003,
|
| 24 |
+
training_loss=1.8524150695953217,
|
| 25 |
+
metrics={'train_runtime': 2319.7329,
|
| 26 |
+
'train_samples_per_second': 18.122,
|
| 27 |
+
'train_steps_per_second': 1.295,
|
| 28 |
+
'total_flos': 9.110291036818637e+16,
|
| 29 |
+
'train_loss': 1.8524150695953217,
|
| 30 |
+
'epoch': 3.0}
|
| 31 |
+
|
| 32 |
# Training Results
|
| 33 |
|
| 34 |
| Epoch | Training Loss | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Bleu | Gen Len |
|