File size: 1,683 Bytes
b557d4a
 
 
0486018
 
b557d4a
 
 
 
 
 
0486018
 
b557d4a
 
 
0486018
 
 
b557d4a
 
 
0486018
 
 
b557d4a
 
 
0486018
 
 
b557d4a
 
 
0486018
 
 
b557d4a
 
 
0486018
 
 
b557d4a
 
 
0486018
 
 
b557d4a
 
 
0486018
 
 
b557d4a
 
 
0486018
 
 
b557d4a
 
 
0486018
 
 
b557d4a
 
 
0486018
 
 
b557d4a
 
 
0486018
b557d4a
0486018
b557d4a
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 0.03031705623698218,
  "global_step": 262,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.0,
      "learning_rate": 1.9997685720897943e-05,
      "loss": 2.316,
      "step": 1
    },
    {
      "epoch": 0.0,
      "learning_rate": 1.993982874334645e-05,
      "loss": 3.0145,
      "step": 26
    },
    {
      "epoch": 0.01,
      "learning_rate": 1.9881971765794957e-05,
      "loss": 2.9775,
      "step": 52
    },
    {
      "epoch": 0.01,
      "learning_rate": 1.9821800509141405e-05,
      "loss": 2.9141,
      "step": 78
    },
    {
      "epoch": 0.01,
      "learning_rate": 1.976162925248785e-05,
      "loss": 2.8213,
      "step": 104
    },
    {
      "epoch": 0.02,
      "learning_rate": 1.9701457995834298e-05,
      "loss": 2.8003,
      "step": 130
    },
    {
      "epoch": 0.02,
      "learning_rate": 1.9641286739180746e-05,
      "loss": 2.8823,
      "step": 156
    },
    {
      "epoch": 0.02,
      "learning_rate": 1.9581115482527195e-05,
      "loss": 2.8253,
      "step": 182
    },
    {
      "epoch": 0.02,
      "learning_rate": 1.9520944225873643e-05,
      "loss": 2.7823,
      "step": 208
    },
    {
      "epoch": 0.03,
      "learning_rate": 1.946077296922009e-05,
      "loss": 2.7374,
      "step": 234
    },
    {
      "epoch": 0.03,
      "learning_rate": 1.9402915991668595e-05,
      "loss": 2.8325,
      "step": 260
    }
  ],
  "max_steps": 8642,
  "num_train_epochs": 1,
  "total_flos": 487908402266112.0,
  "trial_name": null,
  "trial_params": null
}