emdemor committed on
Commit
24cd73a
·
verified ·
1 Parent(s): 33735b5

Training in progress, step 1450

Browse files
Files changed (3) hide show
  1. adapter_model.safetensors +1 -1
  2. metrics.json +1 -0
  3. state.json +18 -3
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:079525c8ed387cce1ea9e0669805467b05b018b02e24d14699f2e7957dacfe7f
3
  size 35668592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e4611d599d8161322f3e6b8d6251a0a636fca8d840e06365ce4111550431816
3
  size 35668592
metrics.json CHANGED
@@ -26,3 +26,4 @@
26
  {"Step":1300,"eval_loss":1.8769853115,"eval_runtime":29.4816,"eval_samples_per_second":3.392,"eval_steps_per_second":0.441,"epoch":1.0212097408}
27
  {"Step":1350,"eval_loss":1.8668268919,"eval_runtime":29.5392,"eval_samples_per_second":3.385,"eval_steps_per_second":0.44,"epoch":1.0604870385}
28
  {"Step":1400,"eval_loss":1.8661786318,"eval_runtime":29.4511,"eval_samples_per_second":3.395,"eval_steps_per_second":0.441,"epoch":1.0997643362}
 
 
26
  {"Step":1300,"eval_loss":1.8769853115,"eval_runtime":29.4816,"eval_samples_per_second":3.392,"eval_steps_per_second":0.441,"epoch":1.0212097408}
27
  {"Step":1350,"eval_loss":1.8668268919,"eval_runtime":29.5392,"eval_samples_per_second":3.385,"eval_steps_per_second":0.44,"epoch":1.0604870385}
28
  {"Step":1400,"eval_loss":1.8661786318,"eval_runtime":29.4511,"eval_samples_per_second":3.395,"eval_steps_per_second":0.441,"epoch":1.0997643362}
29
+ {"Step":1450,"eval_loss":1.8573988676,"eval_runtime":29.4384,"eval_samples_per_second":3.397,"eval_steps_per_second":0.442,"epoch":1.1390416339}
state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.0997643362136684,
5
  "eval_steps": 50,
6
- "global_step": 1400,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -412,6 +412,21 @@
412
  "eval_samples_per_second": 3.385,
413
  "eval_steps_per_second": 0.44,
414
  "step": 1350
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
415
  }
416
  ],
417
  "logging_steps": 50,
@@ -431,7 +446,7 @@
431
  "attributes": {}
432
  }
433
  },
434
- "total_flos": 1.698206414174208e+16,
435
  "train_batch_size": 8,
436
  "trial_name": null,
437
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.139041633935585,
5
  "eval_steps": 50,
6
+ "global_step": 1450,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
412
  "eval_samples_per_second": 3.385,
413
  "eval_steps_per_second": 0.44,
414
  "step": 1350
415
+ },
416
+ {
417
+ "epoch": 1.0997643362136684,
418
+ "grad_norm": 0.1711549311876297,
419
+ "learning_rate": 0.00035190573174279896,
420
+ "loss": 1.8477,
421
+ "step": 1400
422
+ },
423
+ {
424
+ "epoch": 1.0997643362136684,
425
+ "eval_loss": 1.8661786317825317,
426
+ "eval_runtime": 29.4511,
427
+ "eval_samples_per_second": 3.395,
428
+ "eval_steps_per_second": 0.441,
429
+ "step": 1400
430
  }
431
  ],
432
  "logging_steps": 50,
 
446
  "attributes": {}
447
  }
448
  },
449
+ "total_flos": 1.763832907462656e+16,
450
  "train_batch_size": 8,
451
  "trial_name": null,
452
  "trial_params": null