langrbide-deepseek / config.json
ayushayush591's picture
Upload model
bc50e85 verified
{
  "_name_or_path": "./python_scripts/checkpoints/deepseek/epoch=1-step=3125",
  "alignments": "linear",
  "architectures": [
    "LangBridgeModel"
  ],
  "dim_enc": 2048,
  "dim_lm": 4096,
  "enc": "DKYoon/mt5-xl-lm-adapt",
  "freeze_encoder": true,
  "freeze_language_model": true,
  "lm": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B",
  "torch_dtype": "float32",
  "transformers_version": "4.49.0"
}