trungtienluong committed on
Commit
475182d
·
verified ·
1 Parent(s): fafd766

trungtienluong/test_4

Browse files
README.md CHANGED
@@ -42,7 +42,7 @@ The following hyperparameters were used during training:
42
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
43
  - lr_scheduler_type: cosine
44
  - lr_scheduler_warmup_ratio: 0.05
45
- - num_epochs: 7
46
  - mixed_precision_training: Native AMP
47
 
48
  ### Training results
 
42
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
43
  - lr_scheduler_type: cosine
44
  - lr_scheduler_warmup_ratio: 0.05
45
+ - num_epochs: 10
46
  - mixed_precision_training: Native AMP
47
 
48
  ### Training results
adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
 
23
  "o_proj",
24
- "q_proj",
25
  "k_proj",
26
  "gate_proj",
27
- "v_proj",
28
- "down_proj",
29
- "up_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "v_proj",
24
+ "up_proj",
25
  "o_proj",
26
+ "down_proj",
27
  "k_proj",
28
  "gate_proj",
29
+ "q_proj"
 
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4b1331bffb184cc7eb85d081a7b414a6f126d00d74ba63c290abd0f09d77e55
3
  size 159967880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e686aec745766170201296dac402cc6dad9c1070a164599fbcd980416997031e
3
  size 159967880
runs/May16_04-21-12_902ee609b897/events.out.tfevents.1715833281.902ee609b897.3205.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78c8db4f72010892e4211ceeb8fa7e1af74e81da118c83054051b6379f01d523
3
+ size 16059
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76ae282d19828978a486033e8c0be252981b35c060ad225a07935993e4919daa
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e39e9f1f73757c32bc747d16b460a587a3f35762e3b54b1918213bf7c9648e1
3
  size 5112