turbo-maikol committed on
Commit
106c13e
·
verified ·
1 Parent(s): bbafeb0

Upload folder using huggingface_hub

Browse files
.summary/0/events.out.tfevents.1756487512.Pac ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ce2a1118f92d8787511b29bc3293bc3923c6f3be26b19fd9a64573a83ddebbc
3
+ size 40
.summary/0/events.out.tfevents.1756487556.Pac ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01cc3a02253c72350b7c23d9c28f8b72293f5c943d39054cd349ba00b4c19fdb
3
+ size 40
.summary/0/events.out.tfevents.1756487755.Pac ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e323a977f06005638c5a746ccc1adb91ff2756c339d7d9434aaa2786ec31607
3
+ size 119794
.summary/0/events.out.tfevents.1756489979.Pac ADDED
File without changes
.summary/0/events.out.tfevents.1756490729.Pac ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4711b8e85b5053f2d3ec95793131588ea0b6081ca0070afd89df574edc2a37ce
3
+ size 1465481
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
- value: 4.06 +/- 0.29
19
  name: mean_reward
20
  verified: false
21
  ---
 
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
+ value: 4.08 +/- 0.63
19
  name: mean_reward
20
  verified: false
21
  ---
config.json CHANGED
@@ -16,8 +16,8 @@
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
  "num_workers": 10,
19
- "num_envs_per_worker": 4,
20
- "batch_size": 1024,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
23
  "rollout": 64,
@@ -33,7 +33,7 @@
33
  "kl_loss_coeff": 0.0,
34
  "exploration_loss": "symmetric_kl",
35
  "gae_lambda": 0.95,
36
- "ppo_clip_ratio": 0.1,
37
  "ppo_clip_value": 0.2,
38
  "with_vtrace": false,
39
  "vtrace_rho": 1.0,
@@ -43,7 +43,7 @@
43
  "adam_beta1": 0.9,
44
  "adam_beta2": 0.999,
45
  "max_grad_norm": 4.0,
46
- "learning_rate": 0.0001,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
49
  "lr_adaptive_min": 1e-06,
@@ -65,7 +65,7 @@
65
  "summaries_use_frameskip": true,
66
  "heartbeat_interval": 20,
67
  "heartbeat_reporting_interval": 600,
68
- "train_for_env_steps": 20000000,
69
  "train_for_seconds": 10000000000,
70
  "save_every_sec": 120,
71
  "keep_checkpoints": 2,
 
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
  "num_workers": 10,
19
+ "num_envs_per_worker": 8,
20
+ "batch_size": 16384,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
23
  "rollout": 64,
 
33
  "kl_loss_coeff": 0.0,
34
  "exploration_loss": "symmetric_kl",
35
  "gae_lambda": 0.95,
36
+ "ppo_clip_ratio": 0.2,
37
  "ppo_clip_value": 0.2,
38
  "with_vtrace": false,
39
  "vtrace_rho": 1.0,
 
43
  "adam_beta1": 0.9,
44
  "adam_beta2": 0.999,
45
  "max_grad_norm": 4.0,
46
+ "learning_rate": 0.0002,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
49
  "lr_adaptive_min": 1e-06,
 
65
  "summaries_use_frameskip": true,
66
  "heartbeat_interval": 20,
67
  "heartbeat_reporting_interval": 600,
68
+ "train_for_env_steps": 30000000,
69
  "train_for_seconds": 10000000000,
70
  "save_every_sec": 120,
71
  "keep_checkpoints": 2,
git.diff ADDED
The diff for this file is too large to render. See raw diff
 
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d68220307c311d960a42551365fa1cf0216627cfc8ff7b2308e884c156a3ce8
3
- size 6191141
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:326b2aa7398ea99309b188513a36416adb9ad337a3a44b1bee2642f7bab21038
3
+ size 5657570
sf_log.txt CHANGED
The diff for this file is too large to render. See raw diff