rakhman-llm commited on
Commit
559b875
·
verified ·
1 Parent(s): 9c0ef16

Training in progress, step 4000, checkpoint

Browse files
Files changed (1) hide show
  1. last-checkpoint/trainer_state.json +24 -24
last-checkpoint/trainer_state.json CHANGED
@@ -81,9 +81,9 @@
81
  {
82
  "epoch": 0.08,
83
  "eval_loss": 0.09235642850399017,
84
- "eval_runtime": 109.274,
85
- "eval_samples_per_second": 18.303,
86
- "eval_steps_per_second": 2.288,
87
  "step": 500
88
  },
89
  {
@@ -159,9 +159,9 @@
159
  {
160
  "epoch": 0.16,
161
  "eval_loss": 0.08949962258338928,
162
- "eval_runtime": 109.2536,
163
- "eval_samples_per_second": 18.306,
164
- "eval_steps_per_second": 2.288,
165
  "step": 1000
166
  },
167
  {
@@ -237,9 +237,9 @@
237
  {
238
  "epoch": 0.24,
239
  "eval_loss": 0.08808805048465729,
240
- "eval_runtime": 109.2355,
241
- "eval_samples_per_second": 18.309,
242
- "eval_steps_per_second": 2.289,
243
  "step": 1500
244
  },
245
  {
@@ -315,9 +315,9 @@
315
  {
316
  "epoch": 0.32,
317
  "eval_loss": 0.08704760670661926,
318
- "eval_runtime": 109.4348,
319
- "eval_samples_per_second": 18.276,
320
- "eval_steps_per_second": 2.284,
321
  "step": 2000
322
  },
323
  {
@@ -393,9 +393,9 @@
393
  {
394
  "epoch": 0.4,
395
  "eval_loss": 0.08615937829017639,
396
- "eval_runtime": 109.2621,
397
- "eval_samples_per_second": 18.305,
398
- "eval_steps_per_second": 2.288,
399
  "step": 2500
400
  },
401
  {
@@ -471,9 +471,9 @@
471
  {
472
  "epoch": 0.48,
473
  "eval_loss": 0.08551913499832153,
474
- "eval_runtime": 109.2626,
475
- "eval_samples_per_second": 18.305,
476
- "eval_steps_per_second": 2.288,
477
  "step": 3000
478
  },
479
  {
@@ -549,9 +549,9 @@
549
  {
550
  "epoch": 0.56,
551
  "eval_loss": 0.08540560305118561,
552
- "eval_runtime": 109.3641,
553
- "eval_samples_per_second": 18.288,
554
- "eval_steps_per_second": 2.286,
555
  "step": 3500
556
  },
557
  {
@@ -627,9 +627,9 @@
627
  {
628
  "epoch": 0.64,
629
  "eval_loss": 0.08466340601444244,
630
- "eval_runtime": 109.2066,
631
- "eval_samples_per_second": 18.314,
632
- "eval_steps_per_second": 2.289,
633
  "step": 4000
634
  }
635
  ],
 
81
  {
82
  "epoch": 0.08,
83
  "eval_loss": 0.09235642850399017,
84
+ "eval_runtime": 116.7651,
85
+ "eval_samples_per_second": 17.128,
86
+ "eval_steps_per_second": 2.141,
87
  "step": 500
88
  },
89
  {
 
159
  {
160
  "epoch": 0.16,
161
  "eval_loss": 0.08949962258338928,
162
+ "eval_runtime": 116.7407,
163
+ "eval_samples_per_second": 17.132,
164
+ "eval_steps_per_second": 2.141,
165
  "step": 1000
166
  },
167
  {
 
237
  {
238
  "epoch": 0.24,
239
  "eval_loss": 0.08808805048465729,
240
+ "eval_runtime": 116.8722,
241
+ "eval_samples_per_second": 17.113,
242
+ "eval_steps_per_second": 2.139,
243
  "step": 1500
244
  },
245
  {
 
315
  {
316
  "epoch": 0.32,
317
  "eval_loss": 0.08704760670661926,
318
+ "eval_runtime": 116.8362,
319
+ "eval_samples_per_second": 17.118,
320
+ "eval_steps_per_second": 2.14,
321
  "step": 2000
322
  },
323
  {
 
393
  {
394
  "epoch": 0.4,
395
  "eval_loss": 0.08615937829017639,
396
+ "eval_runtime": 116.9591,
397
+ "eval_samples_per_second": 17.1,
398
+ "eval_steps_per_second": 2.137,
399
  "step": 2500
400
  },
401
  {
 
471
  {
472
  "epoch": 0.48,
473
  "eval_loss": 0.08551913499832153,
474
+ "eval_runtime": 116.545,
475
+ "eval_samples_per_second": 17.161,
476
+ "eval_steps_per_second": 2.145,
477
  "step": 3000
478
  },
479
  {
 
549
  {
550
  "epoch": 0.56,
551
  "eval_loss": 0.08540560305118561,
552
+ "eval_runtime": 116.9131,
553
+ "eval_samples_per_second": 17.107,
554
+ "eval_steps_per_second": 2.138,
555
  "step": 3500
556
  },
557
  {
 
627
  {
628
  "epoch": 0.64,
629
  "eval_loss": 0.08466340601444244,
630
+ "eval_runtime": 116.6411,
631
+ "eval_samples_per_second": 17.147,
632
+ "eval_steps_per_second": 2.143,
633
  "step": 4000
634
  }
635
  ],