shawhin committed on
Commit
a68c9c9
·
verified ·
1 Parent(s): 7989ea9

shawhin/gemma-3-1b-tool-use

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: gemma-3-1b-tool-use
5
  tags:
6
  - generated_from_trainer
7
- - trl
8
  - sft
 
9
  licence: license
10
  ---
11
 
@@ -35,8 +35,8 @@ This model was trained with SFT.
35
  ### Framework versions
36
 
37
  - TRL: 0.19.1
38
- - Transformers: 4.53.1
39
- - Pytorch: 2.7.1
40
  - Datasets: 4.0.0
41
  - Tokenizers: 0.21.2
42
 
 
4
  model_name: gemma-3-1b-tool-use
5
  tags:
6
  - generated_from_trainer
 
7
  - sft
8
+ - trl
9
  licence: license
10
  ---
11
 
 
35
  ### Framework versions
36
 
37
  - TRL: 0.19.1
38
+ - Transformers: 4.53.2
39
+ - Pytorch: 2.6.0+cu124
40
  - Datasets: 4.0.0
41
  - Tokenizers: 0.21.2
42
 
adapter_config.json CHANGED
@@ -13,9 +13,9 @@
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
- "lora_alpha": 16,
17
  "lora_bias": false,
18
- "lora_dropout": 0.1,
19
  "megatron_config": null,
20
  "megatron_core": "megatron.core",
21
  "modules_to_save": null,
@@ -25,8 +25,8 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "v_proj",
29
  "k_proj",
 
30
  "q_proj"
31
  ],
32
  "task_type": "CAUSAL_LM",
 
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
+ "lora_alpha": 64,
17
  "lora_bias": false,
18
+ "lora_dropout": 0.05,
19
  "megatron_config": null,
20
  "megatron_core": "megatron.core",
21
  "modules_to_save": null,
 
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
 
28
  "k_proj",
29
+ "v_proj",
30
  "q_proj"
31
  ],
32
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a2968fd76eeee8a9be1f2bc2c148a16aa5007b941be960e2f0242e45bff90f9d
3
  size 4173784
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3794b465e918005e8ba83fcbc43465970d616db894677c38a3fbaf0f2f8b2992
3
  size 4173784
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<image_soft_token>": 262144
3
+ }
runs/Jul17_22-16-29_5b17db383321/events.out.tfevents.1752790594.5b17db383321.3458.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b042cf66fec3396bd189c9f3643c14a5ce653284a294cabf4a925ea78dfcfd9
3
+ size 6887
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1299c11d7cf632ef3b4e11937501358ada021bbdf7c47638d13c0ee982f2e79c
3
+ size 4689074
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e29d3046e90c852986bd42bf21587b8291e74dd9f7cd0e7331787ef7877f385d
3
- size 6161
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac139ed071484ebdc698444cba2a6854f61bb7577241b0f7fb29facaa3244dc2
3
+ size 5752