FinancialSupport committed on
Commit
8d7dd3d
·
verified ·
1 Parent(s): bb004a8

Training in progress, step 5

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: training_output
5
  tags:
6
  - generated_from_trainer
7
- - trl
8
  - sft
 
9
  licence: license
10
  ---
11
 
@@ -27,7 +27,7 @@ print(output["generated_text"])
27
 
28
  ## Training procedure
29
 
30
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/g-puca1-deloitte/llmv3/runs/t2exxzwk)
31
 
32
 
33
  This model was trained with SFT.
@@ -37,7 +37,7 @@ This model was trained with SFT.
37
  - TRL: 0.23.0
38
  - Transformers: 4.56.1
39
  - Pytorch: 2.8.0+cu128
40
- - Datasets: 4.1.0
41
  - Tokenizers: 0.22.0
42
 
43
  ## Citations
 
4
  model_name: training_output
5
  tags:
6
  - generated_from_trainer
 
7
  - sft
8
+ - trl
9
  licence: license
10
  ---
11
 
 
27
 
28
  ## Training procedure
29
 
30
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/g-puca1-deloitte/llmv3/runs/l3n3g0uy)
31
 
32
 
33
  This model was trained with SFT.
 
37
  - TRL: 0.23.0
38
  - Transformers: 4.56.1
39
  - Pytorch: 2.8.0+cu128
40
+ - Datasets: 4.1.1
41
  - Tokenizers: 0.22.0
42
 
43
  ## Citations
adapter_config.json CHANGED
@@ -26,9 +26,9 @@
26
  "revision": null,
27
  "target_modules": [
28
  "k_proj",
 
29
  "v_proj",
30
- "q_proj",
31
- "o_proj"
32
  ],
33
  "target_parameters": [
34
  "0.mlp.experts.gate_up_proj",
 
26
  "revision": null,
27
  "target_modules": [
28
  "k_proj",
29
+ "o_proj",
30
  "v_proj",
31
+ "q_proj"
 
32
  ],
33
  "target_parameters": [
34
  "0.mlp.experts.gate_up_proj",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d147581ca30f55ea738784409f3a2fceba21f913603ef5a7a2074f9418caae5b
3
  size 200875760
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e6d575864214be51d3fcdaa26b66c3ea53a453c8a6e34a5eedaa7f7a36253a0
3
  size 200875760
modelopt_state_train.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08b72d12efee4760a7976fc1b1999766aa9b7e4c0424db574290a3244c7bf2b6
3
  size 994683
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:459575f004991383da01238b5d6d3b8af0771254055c9b7c1a501308b596415c
3
  size 994683
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:19c9f8c1573117bfcc34b1aa9927ed4b7998d0a4953f7850283bc10589236efb
3
  size 6289
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4167536525b2f6bb1c4de50374830bd61091f3a55828e96d4206a103aecc0bfc
3
  size 6289