Upload 46 files
Browse files- Pretrain/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-easydense-v0_ddpm_lora_/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-easydense-v0_ddpm_lora_/ddpm_lora/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-easydense-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-easydense-v0_ddpm_lora_/ddpm_lora_bc/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-easydense-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle +3 -0
- Pretrain/Pretrain_OfflineMetadrive-easymean-v0_ddpm_lora_/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-easymean-v0_ddpm_lora_/ddpm_lora/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-easymean-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-easymean-v0_ddpm_lora_/ddpm_lora_bc/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-easymean-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle +3 -0
- Pretrain/Pretrain_OfflineMetadrive-easysparse-v0_ddpm_lora_/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-easysparse-v0_ddpm_lora_/ddpm_lora/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-easysparse-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-easysparse-v0_ddpm_lora_/ddpm_lora_bc/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-easysparse-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle +3 -0
- Pretrain/Pretrain_OfflineMetadrive-harddense-v0_ddpm_lora_/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-harddense-v0_ddpm_lora_/ddpm_lora/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-harddense-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-harddense-v0_ddpm_lora_/ddpm_lora_bc/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-harddense-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle +3 -0
- Pretrain/Pretrain_OfflineMetadrive-hardmean-v0_ddpm_lora_/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-hardmean-v0_ddpm_lora_/ddpm_lora/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-hardmean-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-hardmean-v0_ddpm_lora_/ddpm_lora_bc/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-hardmean-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle +3 -0
- Pretrain/Pretrain_OfflineMetadrive-hardsparse-v0_ddpm_lora_/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-hardsparse-v0_ddpm_lora_/ddpm_lora/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-hardsparse-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-hardsparse-v0_ddpm_lora_/ddpm_lora_bc/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-hardsparse-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle +3 -0
- Pretrain/Pretrain_OfflineMetadrive-mediumdense-v0_ddpm_lora_/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-mediumdense-v0_ddpm_lora_/ddpm_lora/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-mediumdense-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-mediumdense-v0_ddpm_lora_/ddpm_lora_bc/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-mediumdense-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle +3 -0
- Pretrain/Pretrain_OfflineMetadrive-mediummean-v0_ddpm_lora_/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-mediummean-v0_ddpm_lora_/ddpm_lora/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-mediummean-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-mediummean-v0_ddpm_lora_/ddpm_lora_bc/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-mediummean-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle +3 -0
- Pretrain/Pretrain_OfflineMetadrive-mediumsparse-v0_ddpm_lora_/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-mediumsparse-v0_ddpm_lora_/ddpm_lora/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-mediumsparse-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store +0 -0
- Pretrain/Pretrain_OfflineMetadrive-mediumsparse-v0_ddpm_lora_/ddpm_lora_bc/config.json +46 -0
- Pretrain/Pretrain_OfflineMetadrive-mediumsparse-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle +3 -0
Pretrain/.DS_Store
ADDED
Binary file (8.2 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-easydense-v0_ddpm_lora_/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-easydense-v0_ddpm_lora_/ddpm_lora/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easydense-v0",
|
38 |
+
"group": "OfflineMetadrive-easydense-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-easydense-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-easydense-v0_ddpm_lora_/ddpm_lora_bc/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easydense-v0",
|
38 |
+
"group": "OfflineMetadrive-easydense-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-easydense-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e179812da65cdd24842b0aab259577d27dd3b5d6e0562457d60b8468989db5d
|
3 |
+
size 27263099
|
Pretrain/Pretrain_OfflineMetadrive-easymean-v0_ddpm_lora_/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-easymean-v0_ddpm_lora_/ddpm_lora/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easymean-v0",
|
38 |
+
"group": "OfflineMetadrive-easymean-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-easymean-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-easymean-v0_ddpm_lora_/ddpm_lora_bc/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easymean-v0",
|
38 |
+
"group": "OfflineMetadrive-easymean-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-easymean-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f2d995745df3a6a80ad4b5a1bfb33a3c6eec4ea43e6a825252d8559f6c95687
|
3 |
+
size 27263099
|
Pretrain/Pretrain_OfflineMetadrive-easysparse-v0_ddpm_lora_/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-easysparse-v0_ddpm_lora_/ddpm_lora/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easysparse-v0",
|
38 |
+
"group": "OfflineMetadrive-easysparse-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-easysparse-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-easysparse-v0_ddpm_lora_/ddpm_lora_bc/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easysparse-v0",
|
38 |
+
"group": "OfflineMetadrive-easysparse-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-easysparse-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30fd438570f430cc3a79f44d6b87d588cdd90572db52993ecd30f1afc9da2a9e
|
3 |
+
size 27263099
|
Pretrain/Pretrain_OfflineMetadrive-harddense-v0_ddpm_lora_/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-harddense-v0_ddpm_lora_/ddpm_lora/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easydense-v0",
|
38 |
+
"group": "OfflineMetadrive-easydense-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-harddense-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-harddense-v0_ddpm_lora_/ddpm_lora_bc/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easydense-v0",
|
38 |
+
"group": "OfflineMetadrive-easydense-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-harddense-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8a80d92836f73803a3962e5971016f1b8a2c9c47585b63b68c835b2df288281
|
3 |
+
size 27263099
|
Pretrain/Pretrain_OfflineMetadrive-hardmean-v0_ddpm_lora_/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-hardmean-v0_ddpm_lora_/ddpm_lora/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easymean-v0",
|
38 |
+
"group": "OfflineMetadrive-easymean-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-hardmean-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-hardmean-v0_ddpm_lora_/ddpm_lora_bc/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easymean-v0",
|
38 |
+
"group": "OfflineMetadrive-easymean-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-hardmean-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41bd524d41e4f02ec7fd425648f27397b8942c005c5251c08030fa4bb0b13fbf
|
3 |
+
size 27263099
|
Pretrain/Pretrain_OfflineMetadrive-hardsparse-v0_ddpm_lora_/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-hardsparse-v0_ddpm_lora_/ddpm_lora/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easysparse-v0",
|
38 |
+
"group": "OfflineMetadrive-easysparse-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-hardsparse-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-hardsparse-v0_ddpm_lora_/ddpm_lora_bc/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easysparse-v0",
|
38 |
+
"group": "OfflineMetadrive-easysparse-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-hardsparse-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef007d606bb177f40c82e82668e29a7a15138a8618a595711ac8b15268667319
|
3 |
+
size 27263099
|
Pretrain/Pretrain_OfflineMetadrive-mediumdense-v0_ddpm_lora_/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-mediumdense-v0_ddpm_lora_/ddpm_lora/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easydense-v0",
|
38 |
+
"group": "OfflineMetadrive-easydense-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-mediumdense-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-mediumdense-v0_ddpm_lora_/ddpm_lora_bc/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easydense-v0",
|
38 |
+
"group": "OfflineMetadrive-easydense-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-mediumdense-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c130c94c938812667a2bbb1f75615d1726bf3e734fd3c5dd9d2308064255051b
|
3 |
+
size 27263099
|
Pretrain/Pretrain_OfflineMetadrive-mediummean-v0_ddpm_lora_/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-mediummean-v0_ddpm_lora_/ddpm_lora/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easymean-v0",
|
38 |
+
"group": "OfflineMetadrive-easymean-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-mediummean-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-mediummean-v0_ddpm_lora_/ddpm_lora_bc/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easymean-v0",
|
38 |
+
"group": "OfflineMetadrive-easymean-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-mediummean-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29397dfc8de909f7e38731e891e0d7c32a98bcebfff3562d648dccc7e876e47c
|
3 |
+
size 27263099
|
Pretrain/Pretrain_OfflineMetadrive-mediumsparse-v0_ddpm_lora_/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-mediumsparse-v0_ddpm_lora_/ddpm_lora/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easysparse-v0",
|
38 |
+
"group": "OfflineMetadrive-easysparse-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-mediumsparse-v0_ddpm_lora_/ddpm_lora_bc/.DS_Store
ADDED
Binary file (6.15 kB). View file
|
|
Pretrain/Pretrain_OfflineMetadrive-mediumsparse-v0_ddpm_lora_/ddpm_lora_bc/config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"project": "PSEC",
|
3 |
+
"experiment_name": "ddpm_lora",
|
4 |
+
"timestamp": "Pretrain",
|
5 |
+
"max_steps": 1,
|
6 |
+
"batch_size": 2048,
|
7 |
+
"eval_episodes": 10,
|
8 |
+
"log_interval": 1000,
|
9 |
+
"save_steps": 250000,
|
10 |
+
"eval_interval": 250000,
|
11 |
+
"save_video": false,
|
12 |
+
"filter_threshold": null,
|
13 |
+
"take_top": null,
|
14 |
+
"online_max_steps": 0,
|
15 |
+
"unsquash_actions": false,
|
16 |
+
"normalize_returns": true,
|
17 |
+
"ratio": 1.0,
|
18 |
+
"training_time_inference_params": {
|
19 |
+
"N": 64,
|
20 |
+
"clip_sampler": true,
|
21 |
+
"M": 1
|
22 |
+
},
|
23 |
+
"rl_config": {
|
24 |
+
"model_cls": "Pretrain",
|
25 |
+
"actor_lr": 0.0003,
|
26 |
+
"T": 5,
|
27 |
+
"N": 64,
|
28 |
+
"M": 0,
|
29 |
+
"actor_dropout_rate": 0.1,
|
30 |
+
"actor_num_blocks": 3,
|
31 |
+
"decay_steps": 3000000,
|
32 |
+
"actor_layer_norm": true,
|
33 |
+
"actor_tau": 0.001,
|
34 |
+
"beta_schedule": "vp"
|
35 |
+
},
|
36 |
+
"seed": 42,
|
37 |
+
"env_name": "OfflineMetadrive-easysparse-v0",
|
38 |
+
"group": "OfflineMetadrive-easysparse-v0_ddpm_lora_",
|
39 |
+
"inference_variants": [
|
40 |
+
{
|
41 |
+
"N": 1,
|
42 |
+
"clip_sampler": true,
|
43 |
+
"M": 0
|
44 |
+
}
|
45 |
+
]
|
46 |
+
}
|
Pretrain/Pretrain_OfflineMetadrive-mediumsparse-v0_ddpm_lora_/ddpm_lora_bc/model1000000.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:695435838fcd3fda56abfada00747373ab4764f672005384c1583e54d6c71b04
|
3 |
+
size 27263099
|