delta8tyome
/

llm-jp-3-13b-20241123-0

Transformers

Safetensors

Japanese

unsloth

Model card Files Files and versions Community

delta8tyome committed on Nov 23, 2024

Commit

eeef15e

verified ·

1 Parent(s): 2ef9423

Delete trainer_state.json

Browse files

Files changed (1) hide show

trainer_state.json +0 -180

trainer_state.json DELETED Viewed

@@ -1,180 +0,0 @@
-{
-  "best_metric": null,
-  "best_model_checkpoint": null,
-  "epoch": 0.9988439306358381,
-  "eval_steps": 500,
-  "global_step": 216,
-  "is_hyper_param_search": false,
-  "is_local_process_zero": true,
-  "is_world_process_zero": true,
-  "log_history": [
-    {
-      "epoch": 0.046242774566473986,
-      "grad_norm": 0.29475411772727966,
-      "learning_rate": 0.0002,
-      "loss": 2.2125,
-      "step": 10
-    },
-    {
-      "epoch": 0.09248554913294797,
-      "grad_norm": 0.3760108947753906,
-      "learning_rate": 0.00019029126213592236,
-      "loss": 1.9606,
-      "step": 20
-    },
-    {
-      "epoch": 0.13872832369942195,
-      "grad_norm": 0.31119468808174133,
-      "learning_rate": 0.00018058252427184467,
-      "loss": 1.8787,
-      "step": 30
-    },
-    {
-      "epoch": 0.18497109826589594,
-      "grad_norm": 0.32787275314331055,
-      "learning_rate": 0.000170873786407767,
-      "loss": 1.8978,
-      "step": 40
-    },
-    {
-      "epoch": 0.23121387283236994,
-      "grad_norm": 0.7112058401107788,
-      "learning_rate": 0.0001611650485436893,
-      "loss": 1.7504,
-      "step": 50
-    },
-    {
-      "epoch": 0.2774566473988439,
-      "grad_norm": 0.2233152985572815,
-      "learning_rate": 0.00015145631067961166,
-      "loss": 2.0392,
-      "step": 60
-    },
-    {
-      "epoch": 0.3236994219653179,
-      "grad_norm": 0.22356455028057098,
-      "learning_rate": 0.000141747572815534,
-      "loss": 1.8432,
-      "step": 70
-    },
-    {
-      "epoch": 0.3699421965317919,
-      "grad_norm": 0.30998003482818604,
-      "learning_rate": 0.00013203883495145632,
-      "loss": 1.8597,
-      "step": 80
-    },
-    {
-      "epoch": 0.4161849710982659,
-      "grad_norm": 0.3756067156791687,
-      "learning_rate": 0.00012233009708737864,
-      "loss": 1.7925,
-      "step": 90
-    },
-    {
-      "epoch": 0.4624277456647399,
-      "grad_norm": 0.8105658292770386,
-      "learning_rate": 0.00011262135922330097,
-      "loss": 1.7537,
-      "step": 100
-    },
-    {
-      "epoch": 0.5086705202312138,
-      "grad_norm": 0.19787977635860443,
-      "learning_rate": 0.0001029126213592233,
-      "loss": 1.9549,
-      "step": 110
-    },
-    {
-      "epoch": 0.5549132947976878,
-      "grad_norm": 0.2306784689426422,
-      "learning_rate": 9.320388349514564e-05,
-      "loss": 1.8755,
-      "step": 120
-    },
-    {
-      "epoch": 0.6011560693641619,
-      "grad_norm": 0.24941173195838928,
-      "learning_rate": 8.349514563106797e-05,
-      "loss": 1.8362,
-      "step": 130
-    },
-    {
-      "epoch": 0.6473988439306358,
-      "grad_norm": 0.3020782768726349,
-      "learning_rate": 7.37864077669903e-05,
-      "loss": 1.7704,
-      "step": 140
-    },
-    {
-      "epoch": 0.6936416184971098,
-      "grad_norm": 0.48686742782592773,
-      "learning_rate": 6.407766990291263e-05,
-      "loss": 1.672,
-      "step": 150
-    },
-    {
-      "epoch": 0.7398843930635838,
-      "grad_norm": 0.22017759084701538,
-      "learning_rate": 5.436893203883495e-05,
-      "loss": 1.9731,
-      "step": 160
-    },
-    {
-      "epoch": 0.7861271676300579,
-      "grad_norm": 0.22683261334896088,
-      "learning_rate": 4.466019417475728e-05,
-      "loss": 1.8569,
-      "step": 170
-    },
-    {
-      "epoch": 0.8323699421965318,
-      "grad_norm": 0.2718450129032135,
-      "learning_rate": 3.4951456310679615e-05,
-      "loss": 1.8241,
-      "step": 180
-    },
-    {
-      "epoch": 0.8786127167630058,
-      "grad_norm": 0.36181768774986267,
-      "learning_rate": 2.5242718446601944e-05,
-      "loss": 1.7315,
-      "step": 190
-    },
-    {
-      "epoch": 0.9248554913294798,
-      "grad_norm": 0.6412150263786316,
-      "learning_rate": 1.5533980582524273e-05,
-      "loss": 1.7282,
-      "step": 200
-    },
-    {
-      "epoch": 0.9710982658959537,
-      "grad_norm": 0.26944366097450256,
-      "learning_rate": 5.825242718446602e-06,
-      "loss": 1.8982,
-      "step": 210
-    }
-  ],
-  "logging_steps": 10,
-  "max_steps": 216,
-  "num_input_tokens_seen": 0,
-  "num_train_epochs": 1,
-  "save_steps": 100,
-  "stateful_callbacks": {
-    "TrainerControl": {
-      "args": {
-        "should_epoch_stop": false,
-        "should_evaluate": false,
-        "should_log": false,
-        "should_save": true,
-        "should_training_stop": true
-      },
-      "attributes": {}
-    }
-  },
-  "total_flos": 2.79883718602752e+16,
-  "train_batch_size": 2,
-  "trial_name": null,
-  "trial_params": null
-}