LGAI-EXAONE
/

EXAONE-Deep-2.4B-AWQ

Text Generation

4-bit precision

Model card Files and versions Community

LG-AI-EXAONE committed 10 days ago

Commit

169cd5b

·

1 Parent(s): 76c60f1

Fix quantized weights

Files changed (2) hide show

config.json +3 -4
model.safetensors +2 -2

config.json CHANGED Viewed

@@ -27,8 +27,7 @@
     "bits": 4,
     "group_size": 128,
     "modules_to_not_convert": [
-      "lm_head",
-      "gate"
+      "lm_head"
     ],
     "quant_method": "awq",
     "version": "gemm",
@@ -43,8 +42,8 @@
   },
   "rope_theta": 1000000,
   "tie_word_embeddings": true,
-  "torch_dtype": "bfloat16",
-  "transformers_version": "4.48.3",
+  "torch_dtype": "float16",
+  "transformers_version": "4.43.1",
   "use_cache": false,
   "vocab_size": 102400
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a68cb9c85c1d871b1b384938fe178b270c7498bff79ebcf64962c24e0cb6944b
-size 1638048680
+oid sha256:736fa24988823b07e43792d1eb010b6ee3d1aefaddb2dbeaac6a3be9d7c9817a
+size 1638048576