Upload Qwen3ForCausalLM
Browse files
- config.json +14 -7
- generation_config.json +1 -1
- pytorch_model-00001-of-00007.bin +2 -2
- pytorch_model-00002-of-00007.bin +2 -2
- pytorch_model-00003-of-00007.bin +2 -2
- pytorch_model-00004-of-00007.bin +2 -2
- pytorch_model-00005-of-00007.bin +2 -2
- pytorch_model-00006-of-00007.bin +2 -2
- pytorch_model-00007-of-00007.bin +2 -2
config.json
CHANGED
|
@@ -18,7 +18,7 @@
|
|
| 18 |
"num_hidden_layers": 64,
|
| 19 |
"num_key_value_heads": 8,
|
| 20 |
"quantization_config": {
|
| 21 |
-
"
|
| 22 |
"modules_to_not_convert": null,
|
| 23 |
"quant_method": "torchao",
|
| 24 |
"quant_type": {
|
|
@@ -28,11 +28,18 @@
|
|
| 28 |
"_data": "float8_e4m3fn",
|
| 29 |
"_type": "torch.dtype"
|
| 30 |
},
|
| 31 |
-
"granularity":
|
| 32 |
-
|
| 33 |
-
|
| 34 |
-
|
| 35 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 36 |
"mm_config": {
|
| 37 |
"_data": {
|
| 38 |
"emulate": false,
|
|
@@ -61,7 +68,7 @@
|
|
| 61 |
"sliding_window": null,
|
| 62 |
"tie_word_embeddings": false,
|
| 63 |
"torch_dtype": "bfloat16",
|
| 64 |
-
"transformers_version": "4.52.
|
| 65 |
"use_cache": true,
|
| 66 |
"use_sliding_window": false,
|
| 67 |
"vocab_size": 151936
|
|
|
|
| 18 |
"num_hidden_layers": 64,
|
| 19 |
"num_key_value_heads": 8,
|
| 20 |
"quantization_config": {
|
| 21 |
+
"include_input_output_embeddings": false,
|
| 22 |
"modules_to_not_convert": null,
|
| 23 |
"quant_method": "torchao",
|
| 24 |
"quant_type": {
|
|
|
|
| 28 |
"_data": "float8_e4m3fn",
|
| 29 |
"_type": "torch.dtype"
|
| 30 |
},
|
| 31 |
+
"granularity": [
|
| 32 |
+
{
|
| 33 |
+
"_data": {},
|
| 34 |
+
"_type": "PerRow",
|
| 35 |
+
"_version": 1
|
| 36 |
+
},
|
| 37 |
+
{
|
| 38 |
+
"_data": {},
|
| 39 |
+
"_type": "PerRow",
|
| 40 |
+
"_version": 1
|
| 41 |
+
}
|
| 42 |
+
],
|
| 43 |
"mm_config": {
|
| 44 |
"_data": {
|
| 45 |
"emulate": false,
|
|
|
|
| 68 |
"sliding_window": null,
|
| 69 |
"tie_word_embeddings": false,
|
| 70 |
"torch_dtype": "bfloat16",
|
| 71 |
+
"transformers_version": "4.52.3",
|
| 72 |
"use_cache": true,
|
| 73 |
"use_sliding_window": false,
|
| 74 |
"vocab_size": 151936
|
generation_config.json
CHANGED
|
@@ -9,5 +9,5 @@
|
|
| 9 |
"temperature": 0.6,
|
| 10 |
"top_k": 20,
|
| 11 |
"top_p": 0.95,
|
| 12 |
-
"transformers_version": "4.52.
|
| 13 |
}
|
|
|
|
| 9 |
"temperature": 0.6,
|
| 10 |
"top_k": 20,
|
| 11 |
"top_p": 0.95,
|
| 12 |
+
"transformers_version": "4.52.3"
|
| 13 |
}
|
pytorch_model-00001-of-00007.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eed0a42c41196d852a0ad630145156d1f25ebbd5503f308233b211b81604c03e
|
| 3 |
+
size 4971155870
|
pytorch_model-00002-of-00007.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e647e9ddf448a623b78897e10808f3a1c971453ab1a719eae153fb628e5e51c
|
| 3 |
+
size 4973482027
|
pytorch_model-00003-of-00007.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:787b871f002495b07948640c6c2268c57dda22c12e8084194d751522c99e53b5
|
| 3 |
+
size 4879043437
|
pytorch_model-00004-of-00007.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:34d6f19c4295c04255fcdebccd83b9a7768584d33db6426350dce44c9d2bebc4
|
| 3 |
+
size 4879043437
|
pytorch_model-00005-of-00007.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e584b23cec40945a33df1465d9df128b01f08780ce06d75793c787ad2199bf94
|
| 3 |
+
size 4879043437
|
pytorch_model-00006-of-00007.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f728859761efca7d6e8ea7a0385ced26e22b2c3e3cd18f4aa4206e363e49a9ab
|
| 3 |
+
size 4879043437
|
pytorch_model-00007-of-00007.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:403de3a4d63a3fbc964476f7cdee8aa8349242eac732621b199330d1b41e0ecd
|
| 3 |
+
size 4876727583
|