End of training
Browse files- all_results.json +6 -6
- eval_results.json +3 -3
- train_results.json +3 -3
- trainer_state.json +3 -3
all_results.json
CHANGED
|
@@ -1,11 +1,11 @@
|
|
| 1 |
{
|
| 2 |
"epoch": 0.04,
|
| 3 |
"eval_loss": 0.07713703066110611,
|
| 4 |
-
"eval_runtime":
|
| 5 |
-
"eval_samples_per_second":
|
| 6 |
-
"eval_steps_per_second":
|
| 7 |
"train_loss": 0.0033295607640092873,
|
| 8 |
-
"train_runtime":
|
| 9 |
-
"train_samples_per_second":
|
| 10 |
-
"train_steps_per_second":
|
| 11 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"epoch": 0.04,
|
| 3 |
"eval_loss": 0.07713703066110611,
|
| 4 |
+
"eval_runtime": 761.1334,
|
| 5 |
+
"eval_samples_per_second": 50.911,
|
| 6 |
+
"eval_steps_per_second": 6.364,
|
| 7 |
"train_loss": 0.0033295607640092873,
|
| 8 |
+
"train_runtime": 303.4327,
|
| 9 |
+
"train_samples_per_second": 386.099,
|
| 10 |
+
"train_steps_per_second": 48.264
|
| 11 |
}
|
eval_results.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"epoch": 0.04,
|
| 3 |
"eval_loss": 0.07713703066110611,
|
| 4 |
-
"eval_runtime":
|
| 5 |
-
"eval_samples_per_second":
|
| 6 |
-
"eval_steps_per_second":
|
| 7 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"epoch": 0.04,
|
| 3 |
"eval_loss": 0.07713703066110611,
|
| 4 |
+
"eval_runtime": 761.1334,
|
| 5 |
+
"eval_samples_per_second": 50.911,
|
| 6 |
+
"eval_steps_per_second": 6.364
|
| 7 |
}
|
train_results.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"epoch": 0.04,
|
| 3 |
"train_loss": 0.0033295607640092873,
|
| 4 |
-
"train_runtime":
|
| 5 |
-
"train_samples_per_second":
|
| 6 |
-
"train_steps_per_second":
|
| 7 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"epoch": 0.04,
|
| 3 |
"train_loss": 0.0033295607640092873,
|
| 4 |
+
"train_runtime": 303.4327,
|
| 5 |
+
"train_samples_per_second": 386.099,
|
| 6 |
+
"train_steps_per_second": 48.264
|
| 7 |
}
|
trainer_state.json
CHANGED
|
@@ -208,9 +208,9 @@
|
|
| 208 |
"step": 14645,
|
| 209 |
"total_flos": 7.904602466056929e+18,
|
| 210 |
"train_loss": 0.0033295607640092873,
|
| 211 |
-
"train_runtime":
|
| 212 |
-
"train_samples_per_second":
|
| 213 |
-
"train_steps_per_second":
|
| 214 |
}
|
| 215 |
],
|
| 216 |
"max_steps": 14645,
|
|
|
|
| 208 |
"step": 14645,
|
| 209 |
"total_flos": 7.904602466056929e+18,
|
| 210 |
"train_loss": 0.0033295607640092873,
|
| 211 |
+
"train_runtime": 303.4327,
|
| 212 |
+
"train_samples_per_second": 386.099,
|
| 213 |
+
"train_steps_per_second": 48.264
|
| 214 |
}
|
| 215 |
],
|
| 216 |
"max_steps": 14645,
|