Spaces:
Runtime error
Runtime error
| tune_config: | |
| mode: "max" | |
| metric: "reward/mean" | |
| search_alg: "random" | |
| scheduler: "fifo" | |
| num_samples: 32 | |
| # Search space: each `strategy` below names a Ray Tune sampling function, see https://docs.ray.io/en/latest/tune/api_docs/search_space.html#tune-sample-docs | |
| optimizer.kwargs.lr: | |
| strategy: "loguniform" | |
| values: [0.000001, 0.001] | |
| method.init_kl_coef: | |
| strategy: "loguniform" | |
| values: [0.0001, 0.2] | |
| model.num_layers_unfrozen: | |
| strategy: "choice" | |
| values: [-1, 2, 6] | |
| method.num_rollouts: | |
| strategy: "choice" | |
| values: [32, 128, 512] | |
| method.target: | |
| strategy: "choice" | |
| values: [null, 1] | |
| # Effectively disable checkpointing (very large interval, no best-model saves) to save storage space | |
| train.checkpoint_interval: | |
| strategy: "choice" | |
| values: [10000000] | |
| train.save_best: | |
| strategy: "choice" | |
| values: [false] | |