Update README.md
Browse files
README.md
CHANGED
|
@@ -6,6 +6,25 @@ metrics:
|
|
| 6 |
- rouge
|
| 7 |
pipeline_tag: summarization
|
| 8 |
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 9 |
|
| 10 |
# Training Results
|
| 11 |
|
|
|
|
| 6 |
- rouge
|
| 7 |
pipeline_tag: summarization
|
| 8 |
---
|
| 9 |
+
# Hyperparameters
|
| 10 |
+
learning_rate=2e-5
|
| 11 |
+
per_device_train_batch_size=14
|
| 12 |
+
per_device_eval_batch_size=14
|
| 13 |
+
weight_decay=0.01
|
| 14 |
+
save_total_limit=3
|
| 15 |
+
num_train_epochs=3
|
| 16 |
+
predict_with_generate=True
|
| 17 |
+
fp16=True
|
| 18 |
+
|
| 19 |
+
# Training Output
|
| 20 |
+
global_step=4248,
|
| 21 |
+
training_loss=2.930363613782405,
|
| 22 |
+
metrics={'train_runtime': 11857.8062,
|
| 23 |
+
'train_samples_per_second': 5.014,
|
| 24 |
+
'train_steps_per_second': 0.358,
|
| 25 |
+
'total_flos': 1.3114345819786445e+17,
|
| 26 |
+
'train_loss': 2.930363613782405,
|
| 27 |
+
'epoch': 3.0}
|
| 28 |
|
| 29 |
# Training Results
|
| 30 |
|