EleutherAI/SmolLM2-1.7B-magpie-ultra-v0.1-attribution

Files changed (6) hide show

README.md CHANGED Viewed

@@ -27,7 +27,7 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/eleutherai/huggingface/runs/vofyo7hl)
 This model was trained with SFT.
@@ -35,7 +35,7 @@ This model was trained with SFT.
 ### Framework versions
 - TRL: 0.18.1
-- Transformers: 4.51.3
 - Pytorch: 2.5.1
 - Datasets: 3.6.0
 - Tokenizers: 0.21.1

 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/eleutherai/huggingface/runs/2e1kywoy)
 This model was trained with SFT.
 ### Framework versions
 - TRL: 0.18.1
+- Transformers: 4.52.4
 - Pytorch: 2.5.1
 - Datasets: 3.6.0
 - Tokenizers: 0.21.1

config.json CHANGED Viewed

@@ -24,7 +24,7 @@
   "rope_theta": 130000,
   "tie_word_embeddings": true,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.51.3",
   "use_cache": true,
   "vocab_size": 49152
 }

   "rope_theta": 130000,
   "tie_word_embeddings": true,
   "torch_dtype": "bfloat16",
+  "transformers_version": "4.52.4",
   "use_cache": true,
   "vocab_size": 49152
 }

generation_config.json CHANGED Viewed

@@ -3,5 +3,5 @@
   "bos_token_id": 1,
   "eos_token_id": 2,
   "pad_token_id": 2,
-  "transformers_version": "4.51.3"
 }

   "bos_token_id": 1,
   "eos_token_id": 2,
   "pad_token_id": 2,
+  "transformers_version": "4.52.4"
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bf9ed62f32bc7a474274025af822815ff912a25aa872f03b39bfa1ec7b8d2843
 size 3422777952

 version https://git-lfs.github.com/spec/v1
+oid sha256:dc3265f1eccc7f0a63088133dde35097dc97defc4153c5515541f94198a5254d
 size 3422777952

tokenizer_config.json CHANGED Viewed

@@ -143,10 +143,10 @@
     "<|im_end|>"
   ],
   "bos_token": "<|im_start|>",
-  "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|im_end|>",
   "extra_special_tokens": {},
   "model_max_length": 8192,
   "pad_token": "<|im_end|>",
   "tokenizer_class": "GPT2Tokenizer",

     "<|im_end|>"
   ],
   "bos_token": "<|im_start|>",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|im_end|>",
   "extra_special_tokens": {},
+  "max_length": 8192,
   "model_max_length": 8192,
   "pad_token": "<|im_end|>",
   "tokenizer_class": "GPT2Tokenizer",

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1580a1d6e6e9330ed239f0141f3c6a9b2003ba9dbe5012527caf9d9ef19fce48
-size 5688

 version https://git-lfs.github.com/spec/v1
+oid sha256:bc7ca4fc7c17fe67dad7f930c033aab41d667039fb6b330646c2f2d703a964a8
+size 5624