Training in progress, step 4000, checkpoint
Browse files
last-checkpoint/trainer_state.json
CHANGED
@@ -81,9 +81,9 @@
|
|
81 |
{
|
82 |
"epoch": 0.08,
|
83 |
"eval_loss": 0.09235642850399017,
|
84 |
-
"eval_runtime":
|
85 |
-
"eval_samples_per_second":
|
86 |
-
"eval_steps_per_second": 2.
|
87 |
"step": 500
|
88 |
},
|
89 |
{
|
@@ -159,9 +159,9 @@
|
|
159 |
{
|
160 |
"epoch": 0.16,
|
161 |
"eval_loss": 0.08949962258338928,
|
162 |
-
"eval_runtime":
|
163 |
-
"eval_samples_per_second":
|
164 |
-
"eval_steps_per_second": 2.
|
165 |
"step": 1000
|
166 |
},
|
167 |
{
|
@@ -237,9 +237,9 @@
|
|
237 |
{
|
238 |
"epoch": 0.24,
|
239 |
"eval_loss": 0.08808805048465729,
|
240 |
-
"eval_runtime":
|
241 |
-
"eval_samples_per_second":
|
242 |
-
"eval_steps_per_second": 2.
|
243 |
"step": 1500
|
244 |
},
|
245 |
{
|
@@ -315,9 +315,9 @@
|
|
315 |
{
|
316 |
"epoch": 0.32,
|
317 |
"eval_loss": 0.08704760670661926,
|
318 |
-
"eval_runtime":
|
319 |
-
"eval_samples_per_second":
|
320 |
-
"eval_steps_per_second": 2.
|
321 |
"step": 2000
|
322 |
},
|
323 |
{
|
@@ -393,9 +393,9 @@
|
|
393 |
{
|
394 |
"epoch": 0.4,
|
395 |
"eval_loss": 0.08615937829017639,
|
396 |
-
"eval_runtime":
|
397 |
-
"eval_samples_per_second":
|
398 |
-
"eval_steps_per_second": 2.
|
399 |
"step": 2500
|
400 |
},
|
401 |
{
|
@@ -471,9 +471,9 @@
|
|
471 |
{
|
472 |
"epoch": 0.48,
|
473 |
"eval_loss": 0.08551913499832153,
|
474 |
-
"eval_runtime":
|
475 |
-
"eval_samples_per_second":
|
476 |
-
"eval_steps_per_second": 2.
|
477 |
"step": 3000
|
478 |
},
|
479 |
{
|
@@ -549,9 +549,9 @@
|
|
549 |
{
|
550 |
"epoch": 0.56,
|
551 |
"eval_loss": 0.08540560305118561,
|
552 |
-
"eval_runtime":
|
553 |
-
"eval_samples_per_second":
|
554 |
-
"eval_steps_per_second": 2.
|
555 |
"step": 3500
|
556 |
},
|
557 |
{
|
@@ -627,9 +627,9 @@
|
|
627 |
{
|
628 |
"epoch": 0.64,
|
629 |
"eval_loss": 0.08466340601444244,
|
630 |
-
"eval_runtime":
|
631 |
-
"eval_samples_per_second":
|
632 |
-
"eval_steps_per_second": 2.
|
633 |
"step": 4000
|
634 |
}
|
635 |
],
|
|
|
81 |
{
|
82 |
"epoch": 0.08,
|
83 |
"eval_loss": 0.09235642850399017,
|
84 |
+
"eval_runtime": 116.7651,
|
85 |
+
"eval_samples_per_second": 17.128,
|
86 |
+
"eval_steps_per_second": 2.141,
|
87 |
"step": 500
|
88 |
},
|
89 |
{
|
|
|
159 |
{
|
160 |
"epoch": 0.16,
|
161 |
"eval_loss": 0.08949962258338928,
|
162 |
+
"eval_runtime": 116.7407,
|
163 |
+
"eval_samples_per_second": 17.132,
|
164 |
+
"eval_steps_per_second": 2.141,
|
165 |
"step": 1000
|
166 |
},
|
167 |
{
|
|
|
237 |
{
|
238 |
"epoch": 0.24,
|
239 |
"eval_loss": 0.08808805048465729,
|
240 |
+
"eval_runtime": 116.8722,
|
241 |
+
"eval_samples_per_second": 17.113,
|
242 |
+
"eval_steps_per_second": 2.139,
|
243 |
"step": 1500
|
244 |
},
|
245 |
{
|
|
|
315 |
{
|
316 |
"epoch": 0.32,
|
317 |
"eval_loss": 0.08704760670661926,
|
318 |
+
"eval_runtime": 116.8362,
|
319 |
+
"eval_samples_per_second": 17.118,
|
320 |
+
"eval_steps_per_second": 2.14,
|
321 |
"step": 2000
|
322 |
},
|
323 |
{
|
|
|
393 |
{
|
394 |
"epoch": 0.4,
|
395 |
"eval_loss": 0.08615937829017639,
|
396 |
+
"eval_runtime": 116.9591,
|
397 |
+
"eval_samples_per_second": 17.1,
|
398 |
+
"eval_steps_per_second": 2.137,
|
399 |
"step": 2500
|
400 |
},
|
401 |
{
|
|
|
471 |
{
|
472 |
"epoch": 0.48,
|
473 |
"eval_loss": 0.08551913499832153,
|
474 |
+
"eval_runtime": 116.545,
|
475 |
+
"eval_samples_per_second": 17.161,
|
476 |
+
"eval_steps_per_second": 2.145,
|
477 |
"step": 3000
|
478 |
},
|
479 |
{
|
|
|
549 |
{
|
550 |
"epoch": 0.56,
|
551 |
"eval_loss": 0.08540560305118561,
|
552 |
+
"eval_runtime": 116.9131,
|
553 |
+
"eval_samples_per_second": 17.107,
|
554 |
+
"eval_steps_per_second": 2.138,
|
555 |
"step": 3500
|
556 |
},
|
557 |
{
|
|
|
627 |
{
|
628 |
"epoch": 0.64,
|
629 |
"eval_loss": 0.08466340601444244,
|
630 |
+
"eval_runtime": 116.6411,
|
631 |
+
"eval_samples_per_second": 17.147,
|
632 |
+
"eval_steps_per_second": 2.143,
|
633 |
"step": 4000
|
634 |
}
|
635 |
],
|