CristianMascia committed on
Commit
cc18489
·
verified ·
1 Parent(s): a6352a1

phi-3-mini-QLoRA

Browse files
README.md CHANGED
@@ -34,8 +34,8 @@ This model was trained with SFT.
34
  ### Framework versions
35
 
36
  - TRL: 0.12.0
37
- - Transformers: 4.46.1
38
- - Pytorch: 2.5.1
39
  - Datasets: 3.1.0
40
  - Tokenizers: 0.20.1
41
 
 
34
  ### Framework versions
35
 
36
  - TRL: 0.12.0
37
+ - Transformers: 4.47.0.dev0
38
+ - Pytorch: 2.6.0.dev20241031+cu121
39
  - Datasets: 3.1.0
40
  - Tokenizers: 0.20.1
41
 
adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
 
 
23
  "k_proj",
24
  "up_proj",
25
- "v_proj",
26
- "q_proj",
27
  "o_proj",
28
- "down_proj",
29
- "gate_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "v_proj",
24
+ "gate_proj",
25
+ "down_proj",
26
  "k_proj",
27
  "up_proj",
 
 
28
  "o_proj",
29
+ "q_proj"
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5980492d7515b3f8b2ddf23effe065ef0603b929e70232a3d80cf5e2937d208e
3
  size 35668592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4857948b5f9544edc16884106ac75ce7aa14f2a31298d848b202fbad9cc3532e
3
  size 35668592
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:366522af54da8b366709580193d5609018d277afe49ff393876a86bef2b0f5ab
3
- size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95e5ccd9bcf2d869ee3a4da1ed7db4ba7240997c954cc6fb579e5e5201536efd
3
+ size 5560