{
    "architectures": [
        "Lake1ForAnyToAny"
    ],
    "vocab_size": 20064,
    "hidden_size": 1024,
    "num_hidden_layers": 16,
    "num_attention_heads": 64,
    "embd_pdrop": 0.1,
    "use_moe": true,
    "num_experts": 24,
    "expert_hidden_size": 496,
    "dropout": 0.1,
    "model_type": "lake",
    "torch_dtype": "float16"
}