# Model configuration for Duino/Darija-LM.
# Each key appears exactly once: YAML mapping keys must be unique, and
# strict loaders reject duplicates.
_name_or_path: Duino/Darija-LM
architectures:
  - GPTLanguageModel
# NOTE(review): the values below look like GPT-style hyperparameters
# (context length, dropout rate, embedding width, attention heads, layers);
# confirm their exact meaning against the GPTLanguageModel implementation.
block_size: 256
dropout: 0.2
# NOTE(review): model_type is "gpt2" while the architecture is a custom
# GPTLanguageModel class — confirm the loader maps this as intended.
model_type: gpt2
n_embd: 384
n_head: 6
n_layer: 6
tokenizer_class: SentencePieceTokenizer
vocab_size: 32000