Update README.md
Browse files
README.md
CHANGED
|
@@ -74,7 +74,8 @@ The following hyperparameters were used during training:
|
|
| 74 |
- seed: 42
|
| 75 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
| 76 |
- lr_scheduler_type: linear
|
| 77 |
-
-
|
|
|
|
| 78 |
- num_epochs: 3
|
| 79 |
- eval_steps: 500
|
| 80 |
- save_steps: 500
|
|
|
|
| 74 |
- seed: 42
|
| 75 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
| 76 |
- lr_scheduler_type: linear
|
| 77 |
+
- weight_decay: 0.1
|
| 78 |
+
- warmup_ratio: 0.06
|
| 79 |
- num_epochs: 3
|
| 80 |
- eval_steps: 500
|
| 81 |
- save_steps: 500
|