YoungMeng committed on
Commit
274ccf8
·
1 Parent(s): abde19c

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: MsPacmanNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 1333.00 +/- 436.03
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: MsPacmanNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 1789.00 +/- 1081.22
20
  name: mean_reward
21
  verified: false
22
  ---
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 2937734951
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2562555806
58
  - - storage
59
  - null
60
  - - study_name
dqn-MsPacmanNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8dbd64280be93a4bb564d38b8dcf18b307838113af4f716140bdad54c75e834f
3
- size 27244694
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c34ebb525f8e6ecf4e107161f0755d7e2923e6b89558470b415e322f671168e7
3
+ size 27244712
dqn-MsPacmanNoFrameskip-v4/_stable_baselines3_version CHANGED
@@ -1 +1 @@
1
- 2.2.1
 
1
+ 2.3.0a1
dqn-MsPacmanNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-MsPacmanNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8dbf5fe837d1c5da0da4c3eb21656ed0539279bdfc86b144f96e02d6ce0aeac
3
  size 13518524
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de3f27ab655e0fb820633c4952f3c37fd2ae74e283eae5018b68b446ea757ac1
3
  size 13518524
dqn-MsPacmanNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c2a5dbd81b3dcfc075579859c3bacc5c2627f3dd6e8fef7e349a2a4b21a89bf4
3
  size 13517658
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f3068160a72a4c8fd059ffe07c06e33ebb095907d3f4b4c34b6b1234a487a94
3
  size 13517658
dqn-MsPacmanNoFrameskip-v4/system_info.txt CHANGED
@@ -1,7 +1,7 @@
1
- - OS: Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023
2
  - Python: 3.10.12
3
- - Stable-Baselines3: 2.2.1
4
- - PyTorch: 2.1.0+cu118
5
  - GPU Enabled: True
6
  - Numpy: 1.23.5
7
  - Cloudpickle: 2.2.1
 
1
+ - OS: Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023
2
  - Python: 3.10.12
3
+ - Stable-Baselines3: 2.3.0a1
4
+ - PyTorch: 2.1.0+cu121
5
  - GPU Enabled: True
6
  - Numpy: 1.23.5
7
  - Cloudpickle: 2.2.1
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c5391eef6c823244cde4258af36a7f6bb41e8d030cbd9407fc967eae248d3a7
3
- size 241492
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ee98119a228905463f3ae45488bc0c551546366543044c1cca520156cfb1a3b
3
+ size 236004
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 1333.0, "std_reward": 436.02866878222585, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-12-01T20:27:11.362833"}
 
1
+ {"mean_reward": 1789.0, "std_reward": 1081.2164445660267, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-01-24T21:29:15.806736"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a13cc0875ad386b1e18801f8ab7295ee08ab6133f2774be06e8e97596d84787d
3
- size 42245
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:169be6b52357f2d62319f53a4eae07efc32a8f3ada5e933d2d5005c9fae8fbf8
3
+ size 42902