Push PPO Agent for CarRacing

Files changed (8) hide show

PPO_CNN_CarRacing.zip CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e51ab19d992f17125a36d8c45143133c0b0bb15ce3bed5267c241d609b514923
-size 26440029

 version https://git-lfs.github.com/spec/v1
+oid sha256:5fceb96ad2348605562e9a6e2be935783eaaef2d2b716fdbafe8af2022c2ab42
+size 26440026

PPO_CNN_CarRacing/data CHANGED Viewed

The diff for this file is too large to render. See raw diff

PPO_CNN_CarRacing/policy.optimizer.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ba1cdbac8879378365a0a915d45adeed0a433fb27f77dd5956a1e3b22db9a2e0
 size 17415600

 version https://git-lfs.github.com/spec/v1
+oid sha256:a95c585ac26abaec4fcd2227494a4df09587994f253df0a17df83ec4694ec1ca
 size 17415600

PPO_CNN_CarRacing/policy.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fb6972b26a22736a468ccb958524792e3ee90cca9c7f33e7620a05a5096d58d3
 size 8709950

 version https://git-lfs.github.com/spec/v1
+oid sha256:411c758f1bf97b33eac989b3320db1d7c5f83863698de63ba482a49b287f1a41
 size 8709950

README.md CHANGED Viewed

@@ -16,7 +16,7 @@ model-index:
       type: CarRacing-v0
     metrics:
     - type: mean_reward
-      value: -47.12 +/- 60.20
       name: mean_reward
       verified: false
 ---

       type: CarRacing-v0
     metrics:
     - type: mean_reward
+      value: -50.30 +/- 10.65
       name: mean_reward
       verified: false
 ---

config.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

replay.mp4 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cd747dddc730eb6c18625f86f2823c8652e1656ab8dbda7cbb645faf80e1fc66
-size 950657

 version https://git-lfs.github.com/spec/v1
+oid sha256:610d43e4d9420856bc591eceb3ca54d58628291178a8fbb7ddbafb122c8eedb9
+size 2052170

results.json CHANGED Viewed

	@@ -1 +1 @@
1	- {"mean_reward": -47.12344413101673, "std_reward": 60.19849429944899, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-02-07T00:31:22.905846"}


1	+ {"mean_reward": -50.30261606797576, "std_reward": 10.654653135571326, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-02-07T01:15:17.688737"}