hari13 committed on
Commit
832ffee
·
verified ·
1 Parent(s): abe998a

Upload PPO LunarLander-v2 trained agent

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. ppo-lunarLander-v2.zip +1 -1
  3. replay.mp4 +2 -2
  4. results.json +1 -1
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 265.94 +/- 15.17
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 255.32 +/- 18.77
20
  name: mean_reward
21
  verified: false
22
  ---
ppo-lunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16f416eb428a38b9542cee9d5688855f17151a52bd9280df8bda2bdc5a2245d4
3
  size 147427
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff35674f7a8ebb8634af3772567846f4d23257f6c16654fc44a0a52b50c6fe6a
3
  size 147427
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd0e6637f1bcbfeca002819cf99dd7aeed995596a5a8588946992d2b39e9f08b
3
- size 183189
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ee3755b2e823c78b1cdb7f4349b0e62d5c2aca0d8dc67da234cb8937a8c975f
3
+ size 176470
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 265.940711, "std_reward": 15.167428894863287, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-12-10T10:38:33.980939"}
 
1
+ {"mean_reward": 255.3163676, "std_reward": 18.77390371898252, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2025-12-10T10:40:04.259201"}