{"n_layer": 12, "n_head": 12, "n_embd": 768, "block_size": 1024, "bias": false, "dropout": 0.0, "n_codes_total": 8, "n_codes_given": 1, "input_vocab_size": 1056, "output_vocab_size": 1056} |
{"n_layer": 12, "n_head": 12, "n_embd": 768, "block_size": 1024, "bias": false, "dropout": 0.0, "n_codes_total": 8, "n_codes_given": 1, "input_vocab_size": 1056, "output_vocab_size": 1056} |