| { | |
| "name": "Crystal-Beeper-Harmony-v5", | |
| "context": 512, | |
| "dim": 512, | |
| "n_layers": 6, | |
| "n_heads": 8, | |
| "mlp_ratio": 4.0, | |
| "dropout": 0.0, | |
| "resid_dropout": 0.0, | |
| "grad_checkpoint": false, | |
| "compile_model": false, | |
| "use_ascii": true, | |
| "vocab_size": 8192, | |
| "regions_per_block": 64, | |
| "capoera": { | |
| "enable": true, | |
| "topic_bins": 512, | |
| "mood_bins": 7 | |
| }, | |
| "context_mask_style": "right", | |
| "_alive_entries": [ | |
| { | |
| "name": "TinyStories", | |
| "path": "roneneldan/TinyStories", | |
| "split": "train[30%:50%]", | |
| "weight": 0.1, | |
| "dialect": [ | |
| 0.6000000238418579, | |
| 0.10000000149011612, | |
| 0.05000000074505806, | |
| 0.05000000074505806, | |
| 0.20000000298023224 | |
| ], | |
| "class_id": 0, | |
| "p": 0.03125000000000001 | |
| }, | |
| { | |
| "name": "WikipediaEN", | |
| "path": "wikimedia/wikipedia", | |
| "config": "20231101.en", | |
| "split": "train[5%:15%]", | |
| "weight": 0.5, | |
| "dialect": [ | |
| 0.11999999731779099, | |
| 0.5799999833106995, | |
| 0.10000000149011612, | |
| 0.10000000149011612, | |
| 0.10000000149011612 | |
| ], | |
| "class_id": 1, | |
| "p": 0.15625 | |
| }, | |
| { | |
| "name": "AGNews", | |
| "path": "ag_news", | |
| "split": "train[:]", | |
| "weight": 0.1, | |
| "dialect": [ | |
| 0.20000000298023224, | |
| 0.5, | |
| 0.10000000149011612, | |
| 0.10000000149011612, | |
| 0.10000000149011612 | |
| ], | |
| "class_id": 2, | |
| "p": 0.03125000000000001 | |
| }, | |
| { | |
| "name": "GSM8K", | |
| "path": "openai/gsm8k", | |
| "config": "main", | |
| "split": "train[40%:60%]", | |
| "weight": 0.6, | |
| "dialect": [ | |
| 0.10000000149011612, | |
| 0.15000000596046448, | |
| 0.5, | |
| 0.15000000596046448, | |
| 0.10000000149011612 | |
| ], | |
| "class_id": 3, | |
| "p": 0.1875 | |
| }, | |
| { | |
| "name": "AI2-ARC-Easy", | |
| "path": "allenai/ai2_arc", | |
| "config": "ARC-Easy", | |
| "split": "train[30%:60%]", | |
| "weight": 0.6, | |
| "dialect": [ | |
| 0.05000000074505806, | |
| 0.15000000596046448, | |
| 0.4000000059604645, | |
| 0.25, | |
| 0.15000000596046448 | |
| ], | |
| "class_id": 4, | |
| "p": 0.1875 | |
| }, | |
| { | |
| "name": "HH-RLHF", | |
| "path": "Anthropic/hh-rlhf", | |
| "split": "train[5%:10%]", | |
| "weight": 0.5, | |
| "dialect": [ | |
| 0.10000000149011612, | |
| 0.25, | |
| 0.20000000298023224, | |
| 0.25, | |
| 0.20000000298023224 | |
| ], | |
| "class_id": 5, | |
| "p": 0.15625 | |
| }, | |
| { | |
| "name": "SVAMP", | |
| "path": "ChilleD/SVAMP", | |
| "split": "train", | |
| "weight": 0.25, | |
| "dialect": [ | |
| 0.10000000149011612, | |
| 0.15000000596046448, | |
| 0.550000011920929, | |
| 0.15000000596046448, | |
| 0.05000000074505806 | |
| ], | |
| "class_id": 6, | |
| "p": 0.078125 | |
| }, | |
| { | |
| "name": "MATH-500", | |
| "path": "HuggingFaceH4/MATH-500", | |
| "split": "test", | |
| "weight": 0.25, | |
| "dialect": [ | |
| 0.05000000074505806, | |
| 0.15000000596046448, | |
| 0.6000000238418579, | |
| 0.15000000596046448, | |
| 0.05000000074505806 | |
| ], | |
| "class_id": 7, | |
| "p": 0.078125 | |
| }, | |
| { | |
| "name": "SEP", | |
| "path": "AiresPucrs/stanford-encyclopedia-philosophy", | |
| "split": "train", | |
| "weight": 0.3, | |
| "dialect": [ | |
| 0.05000000074505806, | |
| 0.44999998807907104, | |
| 0.18000000715255737, | |
| 0.2199999988079071, | |
| 0.10000000149011612 | |
| ], | |
| "class_id": 8, | |
| "p": 0.09375 | |
| } | |
| ] | |
| } |