eshwarprasadS committed on
Commit
4f7343b
1 Parent(s): 1397bca

Push PPO Agent for CarRacing

Browse files
PPO_CNN_CarRacing.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e51ab19d992f17125a36d8c45143133c0b0bb15ce3bed5267c241d609b514923
3
- size 26440029
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fceb96ad2348605562e9a6e2be935783eaaef2d2b716fdbafe8af2022c2ab42
3
+ size 26440026
PPO_CNN_CarRacing/data CHANGED
The diff for this file is too large to render. See raw diff
 
PPO_CNN_CarRacing/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba1cdbac8879378365a0a915d45adeed0a433fb27f77dd5956a1e3b22db9a2e0
3
  size 17415600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a95c585ac26abaec4fcd2227494a4df09587994f253df0a17df83ec4694ec1ca
3
  size 17415600
PPO_CNN_CarRacing/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb6972b26a22736a468ccb958524792e3ee90cca9c7f33e7620a05a5096d58d3
3
  size 8709950
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:411c758f1bf97b33eac989b3320db1d7c5f83863698de63ba482a49b287f1a41
3
  size 8709950
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: CarRacing-v0
17
  metrics:
18
  - type: mean_reward
19
- value: -47.12 +/- 60.20
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: CarRacing-v0
17
  metrics:
18
  - type: mean_reward
19
+ value: -50.30 +/- 10.65
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
The diff for this file is too large to render. See raw diff
 
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd747dddc730eb6c18625f86f2823c8652e1656ab8dbda7cbb645faf80e1fc66
3
- size 950657
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:610d43e4d9420856bc591eceb3ca54d58628291178a8fbb7ddbafb122c8eedb9
3
+ size 2052170
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": -47.12344413101673, "std_reward": 60.19849429944899, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-02-07T00:31:22.905846"}
 
1
+ {"mean_reward": -50.30261606797576, "std_reward": 10.654653135571326, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-02-07T01:15:17.688737"}