benstaf commited on
Commit
2153a72
·
verified ·
1 Parent(s): 1af2ab6

Upload 15 files

Browse files
agent_cppo_100_epochs_20k_steps.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7017d10df45958f1a09ee8e009d8c99346be867ff312b03876ed1b8cfb289b1
3
+ size 5730119
agent_cppo_20_epochs_20k_steps.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c9771b11a99c389877c35317ef7d542208a35264c47051ce460791e207ec985
3
+ size 5730102
agent_cppo_deepseek_100_epochs_20k_steps.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8dc3e1cc247a16c258d6940644008f3a491f0dd962145d37659a66c55b99d44
3
+ size 6418400
agent_cppo_deepseek_100_epochs_20k_steps_01.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:672fa6bfc0e656f724833fac2046f04f5598fd9a87a1ea457bcaf9b1a2edcda0
3
+ size 6418349
agent_cppo_deepseek_100_epochs_20k_steps_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0995acb84653b5ffbfaab13fed295ff1efa8443df66f6dfe80e0ac82280fe53d
3
+ size 6418519
agent_cppo_llama_20_epochs_20k_steps.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9f0fb6fe944f01a6f5e38c6fe6a1e92369b92252e29ed16101766e92b9d8087
3
+ size 6418332
agent_deepseek_20_epochs_20k_steps.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98d4c116d6e17ade1ed6710488446c3d10fe01fbd7350974bbf146641868b693
3
+ size 6418298
agent_ppo_100_epochs_20k_steps.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f138a91c36e0b88b27d58bf41549de24717aec48e7107641f3dfa1838b51177b
3
+ size 5730102
agent_ppo_20_epochs_20k_steps.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:238632dc96b40aa21a3993e1cac90578b7f84ea8e6811aebcfc4cbf3ac37443e
3
+ size 5730085
agent_ppo_deepseek_100_epochs_20k_steps.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae05dd713d1c0e8a880daad0a3be49db0314c50211805272f8a61dd84794ef84
3
+ size 6074319
agent_ppo_deepseek_100_epochs_20k_steps_01.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0969fc0b9d4c49aa816b2ec88dd321ffa619d765df27d79ef8975797747b8d5b
3
+ size 6074370
agent_ppo_deepseek_100_epochs_20k_steps_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f54f756654dc9a23c9c6fe6836a0be5ac03cc1fecf8952f020e58f63291fb8c
3
+ size 6074540
agent_ppo_deepseek_20_epochs_20k_steps.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e799bdf91c48654b4e7a0f3c090abff69b45a5ec88f592511c1dd34bc446d41
3
+ size 6074302
agent_ppo_llama_100_epochs_20k_steps.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06a1dbc0e65a7868c9c98db19c53311fc23ffc954faab3b913df4f4c05aa7cd9
3
+ size 6074268
agent_ppo_llama_20_epochs_20k_steps.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67c515df96ed32e57a37566d86c3547c63987d9e758ebe2984749a6f771cedfe
3
+ size 6074251