File size: 402 Bytes
bc50e85
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
{
  "_name_or_path": "./python_scripts/checkpoints/deepseek/epoch=1-step=3125",
  "alignments": "linear",
  "architectures": [
    "LangBridgeModel"
  ],
  "dim_enc": 2048,
  "dim_lm": 4096,
  "enc": "DKYoon/mt5-xl-lm-adapt",
  "freeze_encoder": true,
  "freeze_language_model": true,
  "lm": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B",
  "torch_dtype": "float32",
  "transformers_version": "4.49.0"
}