carolinacon committed on
Commit
03ad5f9
·
verified ·
1 Parent(s): 9a83a26

Push agent to the Hub

Browse files
README.md CHANGED
@@ -17,7 +17,7 @@ model-index:
17
  type: LunarLander-v2
18
  metrics:
19
  - type: mean_reward
20
- value: -135.92 +/- 143.99
21
  name: mean_reward
22
  verified: false
23
  ---
@@ -40,7 +40,7 @@ model-index:
40
  'total_timesteps': 1000000
41
  'learning_rate': 0.00025
42
  'num_envs': 16
43
- 'num_steps': 1024
44
  'anneal_lr': True
45
  'gae': True
46
  'gamma': 0.999
@@ -55,7 +55,7 @@ model-index:
55
  'max_grad_norm': 0.5
56
  'target_kl': None
57
  'repo_id': 'carolinacon/ppo-CartPole-v1'
58
- 'batch_size': 16384
59
- 'minibatch_size': 4096}
60
  ```
61
 
 
17
  type: LunarLander-v2
18
  metrics:
19
  - type: mean_reward
20
+ value: 69.12 +/- 53.92
21
  name: mean_reward
22
  verified: false
23
  ---
 
40
  'total_timesteps': 1000000
41
  'learning_rate': 0.00025
42
  'num_envs': 16
43
+ 'num_steps': 128
44
  'anneal_lr': True
45
  'gae': True
46
  'gamma': 0.999
 
55
  'max_grad_norm': 0.5
56
  'target_kl': None
57
  'repo_id': 'carolinacon/ppo-CartPole-v1'
58
+ 'batch_size': 2048
59
+ 'minibatch_size': 512}
60
  ```
61
 
logs/events.out.tfevents.1751467965.7c6da54d0a13.29308.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:022318db724e802017a4bac09c602728e87670816727967ca08ea20203e22dee
3
+ size 675015
model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9b5d60c2b204c19ced8eaa71795e391e7ff2736bc887adeb91682a71febf8596
3
  size 43419
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f772cc5ced3de9dfe8e865d82900eb59076fba760c4e7eaba1438cd4d77ec3d
3
  size 43419
results.json CHANGED
@@ -1 +1 @@
1
- {"env_id": "LunarLander-v2", "mean_reward": -135.9165392596514, "std_reward": 143.99480221788966, "n_evaluation_episodes": 10, "eval_datetime": "2025-07-02T14:51:52.768663"}
 
1
+ {"env_id": "LunarLander-v2", "mean_reward": 69.12400944629034, "std_reward": 53.91812989195952, "n_evaluation_episodes": 10, "eval_datetime": "2025-07-02T15:09:55.598385"}